Function: qmcplusplus::DiracMatrix<double, double>::invert_transpose(qmcplusplus::Matrix<double, std ... | Module: libqmcwfs.so | Source: DiracMatrix.h:28-120 [...] | Coverage: 0.37% |
---|
Function: qmcplusplus::DiracMatrix<double, double>::invert_transpose(qmcplusplus::Matrix<double, std ... | Module: libqmcwfs.so | Source: DiracMatrix.h:28-120 [...] | Coverage: 0.37% |
---|
/usr/include/c++/13.1.1/bits/alloc_traits.h: 276 - 360 |
-------------------------------------------------------------------------------- |
276: ::new((void*)__p) _Tp(std::forward<_Args>(__args)...); |
[...] |
360: { __a.deallocate(__p, __n); } |
/home/kcamus/qaas_runs/169-390-4082/intel/miniqmc/build/miniqmc/src/Platforms/CPU/SIMD/Mallocator.hpp: 45 - 68 |
-------------------------------------------------------------------------------- |
45: T* allocate(std::size_t n) |
46: { |
47: if (n == 0) |
48: throw std::runtime_error("Mallocator::allocate does not accept size 0 allocations."); |
49: void* pt(nullptr); |
50: std::size_t asize = n * sizeof(T); |
51: std::size_t amod = asize % ALIGN; |
52: if (amod != 0) |
53: asize += ALIGN - amod; |
[...] |
61: pt = aligned_alloc(ALIGN, asize); |
[...] |
68: if (pt == nullptr) |
/home/kcamus/qaas_runs/169-390-4082/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/DiracMatrix.h: 28 - 120 |
-------------------------------------------------------------------------------- |
28: T logdet(0); |
29: int sign_det = 1; |
30: for (size_t i = 0; i < n; i++) |
31: { |
32: sign_det *= (pivot[i] == i + 1) ? 1 : -1; |
33: sign_det *= (diag[i] > 0) ? 1 : -1; |
34: logdet += std::log(std::abs(diag[i])); |
35: } |
36: phase = (sign_det > 0) ? T(0) : M_PI; |
[...] |
75: m_pivot.resize(lda); |
76: Lwork = -1; |
[...] |
82: Lwork = static_cast<int>(lw); |
83: m_work.resize(Lwork); |
84: LU_diag.resize(lda); |
[...] |
93: inline void invert_transpose(const Matrix<T>& amat, Matrix<T>& invMat, real_type& LogDet, real_type& Phase) |
94: { |
95: BlasThreadingEnv knob(getNextLevelNumThreads()); |
96: const int n = invMat.rows(); |
97: const int lda = invMat.cols(); |
98: T_FP* invMat_ptr(nullptr); |
99: #if !defined(MIXED_PRECISION) |
100: simd::transpose(amat.data(), n, amat.cols(), invMat.data(), n, invMat.cols()); |
[...] |
107: if (Lwork < lda) |
108: reset(invMat_ptr, lda); |
109: int status; |
110: LAPACK::getrf(n, n, invMat_ptr, lda, m_pivot.data(), status); |
111: for (int i = 0; i < n; i++) |
112: LU_diag[i] = invMat_ptr[i * lda + i]; |
113: real_type_fp Phase_tmp; |
114: LogDet = computeLogDet(LU_diag.data(), n, m_pivot.data(), Phase_tmp); |
115: Phase = Phase_tmp; |
116: LAPACK::getri(n, invMat_ptr, lda, m_pivot.data(), m_work.data(), Lwork, status); |
117: #if defined(MIXED_PRECISION) |
118: invMat = psiM_fp; |
119: #endif |
120: } |
/home/kcamus/qaas_runs/169-390-4082/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/OhmmsMatrix.h: 78 - 78 |
-------------------------------------------------------------------------------- |
78: inline size_type cols() const { return D2; } |
/usr/include/c++/13.1.1/bits/std_abs.h: 72 - 72 |
-------------------------------------------------------------------------------- |
72: { return __builtin_fabs(__x); } |
/home/kcamus/qaas_runs/169-390-4082/intel/miniqmc/build/miniqmc/src/Platforms/CPU/BLAS.hpp: 790 - 828 |
-------------------------------------------------------------------------------- |
790: dgetrf(n, m, a, n0, piv, st); |
[...] |
827: dgetri(n, a, n0, piv, work, n1, status); |
828: } |
/usr/include/c++/13.1.1/bits/stl_uninitialized.h: 754 - 1099 |
-------------------------------------------------------------------------------- |
754: for (; __n > 0; --__n, (void) ++__cur) |
[...] |
1098: _ForwardIterator __cur = __result; |
1099: for (; __first != __last; ++__first, (void)++__cur) |
/usr/include/c++/13.1.1/bits/stl_vector.h: 386 - 1936 |
-------------------------------------------------------------------------------- |
386: if (__p) |
[...] |
990: { return size_type(this->_M_impl._M_finish - this->_M_impl._M_start); } |
[...] |
1012: if (__new_size > size()) |
1013: _M_default_append(__new_size - size()); |
1014: else if (__new_size < size()) |
1015: _M_erase_at_end(this->_M_impl._M_start + __new_size); |
[...] |
1258: { return _M_data_ptr(this->_M_impl._M_start); } |
[...] |
1895: if (max_size() - size() < __n) |
1896: __throw_length_error(__N(__s)); |
1897: |
1898: const size_type __len = size() + (std::max)(size(), __n); |
[...] |
1932: if (size_type __n = this->_M_impl._M_finish - __pos) |
1933: { |
1934: std::_Destroy(__pos, this->_M_impl._M_finish, |
1935: _M_get_Tp_allocator()); |
1936: this->_M_impl._M_finish = __pos; |
/usr/include/c++/13.1.1/bits/vector.tcc: 640 - 707 |
-------------------------------------------------------------------------------- |
640: size_type __navail = size_type(this->_M_impl._M_end_of_storage |
641: - this->_M_impl._M_finish); |
642: |
643: if (__size > max_size() || __navail > max_size() - __size) |
644: __builtin_unreachable(); |
645: |
646: if (__navail >= __n) |
647: { |
648: _GLIBCXX_ASAN_ANNOTATE_GROW(__n); |
649: this->_M_impl._M_finish = |
[...] |
668: std::__uninitialized_default_n_a(__new_start + __size, |
[...] |
704: this->_M_impl._M_end_of_storage - __old_start); |
705: this->_M_impl._M_start = __new_start; |
706: this->_M_impl._M_finish = __new_start + __size + __n; |
707: this->_M_impl._M_end_of_storage = __new_start + __len; |
/home/kcamus/qaas_runs/169-390-4082/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/OhmmsVector.h: 248 - 249 |
-------------------------------------------------------------------------------- |
248: inline pointer data() { return X; } |
249: inline const_pointer data() const { return X; } |
/home/kcamus/qaas_runs/169-390-4082/intel/miniqmc/build/miniqmc/src/Platforms/CPU/SIMD/inner_product.hpp: 209 - 211 |
-------------------------------------------------------------------------------- |
209: for (size_t i = 0; i < n; ++i) |
210: for (size_t j = 0; j < m; ++j) |
211: B[i * ldb + j] = A[j * lda + i]; |
/home/kcamus/qaas_runs/169-390-4082/intel/miniqmc/build/miniqmc/src/Utilities/Configuration.h: 57 - 57 |
-------------------------------------------------------------------------------- |
57: #pragma omp parallel |
0x53610 PUSH %RBP |
0x53611 MOV %RSP,%RBP |
0x53614 PUSH %R15 |
0x53616 MOV %RSI,%R15 |
0x53619 PUSH %R14 |
0x5361b MOV %RDX,%R14 |
0x5361e XOR %EDX,%EDX |
0x53620 PUSH %R13 |
0x53622 LEA -0x88(%RBP),%R13 |
0x53629 MOV %R13,%RSI |
0x5362c PUSH %R12 |
0x5362e MOV %RDI,%R12 |
0x53631 LEA -0x4e18(%RIP),%RDI |
0x53638 PUSH %RBX |
0x53639 SUB $0xe8,%RSP |
0x53640 MOV %R8,-0xf0(%RBP) |
0x53647 MOV %RCX,-0xe8(%RBP) |
0x5364e XOR %ECX,%ECX |
0x53650 MOV %FS:0x28,%RAX |
0x53659 MOV %RAX,-0x38(%RBP) |
0x5365d XOR %EAX,%EAX |
0x5365f MOVL $0x1,-0x88(%RBP) |
0x53669 CALL 84e0 <GOMP_parallel@plt> |
0x5366e MOV -0x88(%RBP),%ESI |
0x53674 LEA -0xa0(%RBP),%RDI |
0x5367b MOV %RDI,-0xe0(%RBP) |
0x53682 CALL 81d0 <_ZN11qmcplusplus16BlasThreadingEnvC1Ei@plt> |
0x53687 MOV (%R14),%R11 |
0x5368a MOV 0x8(%R14),%RBX |
0x5368e MOV 0x30(%R14),%RAX |
0x53692 MOV 0x8(%R15),%RSI |
0x53696 MOV %R11D,-0xa4(%RBP) |
0x5369d MOVSXD %R11D,%R11 |
0x536a0 MOV 0x30(%R15),%R8 |
0x536a4 MOV %EBX,-0xa8(%RBP) |
0x536aa MOV %RAX,-0xb8(%RBP) |
0x536b1 TEST %R11,%R11 |
0x536b4 JE 5381e |
0x536ba LEA (,%R11,8),%R10 |
0x536c2 LEA (,%RBX,8),%R14 |
0x536ca SAL $0x3,%RSI |
0x536ce XOR %R9D,%R9D |
0x536d1 LEA (%RAX,%R10,1),%RDI |
0x536d5 NOPL (%RAX) |
(578) 0x536d8 LEA -0x8(%R10),%RCX |
(578) 0x536dc MOV %RDI,%RDX |
(578) 0x536df MOV %R8,%R15 |
(578) 0x536e2 SHR $0x3,%RCX |
(578) 0x536e6 SUB %R10,%RDX |
(578) 0x536e9 INC %RCX |
(578) 0x536ec AND $0x7,%ECX |
(578) 0x536ef JE 5379a |
(578) 0x536f5 CMP $0x1,%RCX |
(578) 0x536f9 JE 53784 |
(578) 0x536ff CMP $0x2,%RCX |
(578) 0x53703 JE 53773 |
(578) 0x53705 CMP $0x3,%RCX |
(578) 0x53709 JE 53762 |
(578) 0x5370b CMP $0x4,%RCX |
(578) 0x5370f JE 53751 |
(578) 0x53711 CMP $0x5,%RCX |
(578) 0x53715 JE 53740 |
(578) 0x53717 CMP $0x6,%RCX |
(578) 0x5371b JE 5372f |
(578) 0x5371d VMOVSD (%R8),%XMM0 |
(578) 0x53722 LEA (%R8,%RSI,1),%R15 |
(578) 0x53726 ADD $0x8,%RDX |
(578) 0x5372a VMOVSD %XMM0,-0x8(%RDX) |
(578) 0x5372f VMOVSD (%R15),%XMM1 |
(578) 0x53734 ADD $0x8,%RDX |
(578) 0x53738 ADD %RSI,%R15 |
(578) 0x5373b VMOVSD %XMM1,-0x8(%RDX) |
(578) 0x53740 VMOVSD (%R15),%XMM2 |
(578) 0x53745 ADD $0x8,%RDX |
(578) 0x53749 ADD %RSI,%R15 |
(578) 0x5374c VMOVSD %XMM2,-0x8(%RDX) |
(578) 0x53751 VMOVSD (%R15),%XMM3 |
(578) 0x53756 ADD $0x8,%RDX |
(578) 0x5375a ADD %RSI,%R15 |
(578) 0x5375d VMOVSD %XMM3,-0x8(%RDX) |
(578) 0x53762 VMOVSD (%R15),%XMM4 |
(578) 0x53767 ADD $0x8,%RDX |
(578) 0x5376b ADD %RSI,%R15 |
(578) 0x5376e VMOVSD %XMM4,-0x8(%RDX) |
(578) 0x53773 VMOVSD (%R15),%XMM5 |
(578) 0x53778 ADD $0x8,%RDX |
(578) 0x5377c ADD %RSI,%R15 |
(578) 0x5377f VMOVSD %XMM5,-0x8(%RDX) |
(578) 0x53784 VMOVSD (%R15),%XMM6 |
(578) 0x53789 ADD $0x8,%RDX |
(578) 0x5378d ADD %RSI,%R15 |
(578) 0x53790 VMOVSD %XMM6,-0x8(%RDX) |
(578) 0x53795 CMP %RDX,%RDI |
(578) 0x53798 JE 5380b |
(577) 0x5379a VMOVSD (%R15),%XMM7 |
(577) 0x5379f ADD %RSI,%R15 |
(577) 0x537a2 ADD $0x40,%RDX |
(577) 0x537a6 VMOVSD (%R15),%XMM8 |
(577) 0x537ab ADD %RSI,%R15 |
(577) 0x537ae VMOVSD (%R15),%XMM9 |
(577) 0x537b3 ADD %RSI,%R15 |
(577) 0x537b6 VMOVSD %XMM7,-0x40(%RDX) |
(577) 0x537bb VMOVSD (%R15),%XMM10 |
(577) 0x537c0 ADD %RSI,%R15 |
(577) 0x537c3 VMOVSD %XMM8,-0x38(%RDX) |
(577) 0x537c8 VMOVSD (%R15),%XMM11 |
(577) 0x537cd ADD %RSI,%R15 |
(577) 0x537d0 VMOVSD %XMM9,-0x30(%RDX) |
(577) 0x537d5 VMOVSD (%R15),%XMM12 |
(577) 0x537da ADD %RSI,%R15 |
(577) 0x537dd VMOVSD %XMM10,-0x28(%RDX) |
(577) 0x537e2 VMOVSD (%R15),%XMM13 |
(577) 0x537e7 ADD %RSI,%R15 |
(577) 0x537ea VMOVSD %XMM11,-0x20(%RDX) |
(577) 0x537ef VMOVSD (%R15),%XMM14 |
(577) 0x537f4 VMOVSD %XMM12,-0x18(%RDX) |
(577) 0x537f9 ADD %RSI,%R15 |
(577) 0x537fc VMOVSD %XMM13,-0x10(%RDX) |
(577) 0x53801 VMOVSD %XMM14,-0x8(%RDX) |
(577) 0x53806 CMP %RDX,%RDI |
(577) 0x53809 JNE 5379a |
(578) 0x5380b INC %R9 |
(578) 0x5380e ADD $0x8,%R8 |
(578) 0x53812 ADD %R14,%RDI |
(578) 0x53815 CMP %R9,%R11 |
(578) 0x53818 JNE 536d8 |
0x5381e MOV 0x18(%R12),%RCX |
0x53823 MOV %RCX,%R8 |
0x53826 CMP 0x30(%R12),%EBX |
0x5382b JLE 538c7 |
0x53831 MOV 0x20(%R12),%RDI |
0x53836 MOVSXD %EBX,%R14 |
0x53839 MOV %RDI,%R15 |
0x5383c SUB %RCX,%R15 |
0x5383f MOV %R15,%RAX |
0x53842 SAR $0x2,%RAX |
0x53846 CMP %R14,%RAX |
0x53849 JB 53db7 |
0x5384f CMP %RAX,%R14 |
0x53852 JB 53da0 |
0x53858 MOV %EBX,-0x8c(%RBP) |
0x5385e SUB $0x8,%RSP |
0x53862 MOV -0xb8(%RBP),%RSI |
0x53869 LEA -0x90(%RBP),%RDX |
0x53870 MOV %EBX,-0x90(%RBP) |
0x53876 LEA -0x94(%RBP),%RBX |
0x5387d LEA -0x8c(%RBP),%RDI |
0x53884 MOV %R13,%R8 |
0x53887 MOVL $-0x1,0x30(%R12) |
0x53890 LEA 0x30(%R12),%R9 |
0x53895 PUSH %RBX |
0x53896 CALL 8250 <dgetri_@plt> |
0x5389b VCVTTSD2SI -0x88(%RBP),%R13D |
0x538a3 POP %RCX |
0x538a4 MOV %R12,%RDI |
0x538a7 POP %RSI |
0x538a8 MOV %R13D,0x30(%R12) |
0x538ad MOVSXD %R13D,%RSI |
0x538b0 CALL 2b160 <_ZNSt6vectorIdN11qmcplusplus10MallocatorIdLm64EEEE6resizeEm> |
0x538b5 LEA 0x78(%R12),%RDI |
0x538ba MOV %R14,%RSI |
0x538bd CALL 2b160 <_ZNSt6vectorIdN11qmcplusplus10MallocatorIdLm64EEEE6resizeEm> |
0x538c2 MOV 0x18(%R12),%R8 |
0x538c7 LEA -0xa4(%RBP),%RDI |
0x538ce MOV -0xb8(%RBP),%RDX |
0x538d5 LEA -0xac(%RBP),%R9 |
0x538dc LEA -0xa8(%RBP),%RCX |
0x538e3 MOV %RDI,%RSI |
0x538e6 MOV %R9,-0xf8(%RBP) |
0x538ed CALL 8430 <dgetrf_@plt> |
0x538f2 MOV -0xa8(%RBP),%R14D |
0x538f9 MOV -0xa4(%RBP),%R15D |
0x53900 MOV 0x78(%R12),%RBX |
0x53905 MOV %R14D,-0xd8(%RBP) |
0x5390c TEST %R15D,%R15D |
0x5390f JLE 53e1a |
0x53915 MOVSXD %R15D,%RSI |
0x53918 MOVSXD -0xd8(%RBP),%R10 |
0x5391f MOV -0xb8(%RBP),%RAX |
0x53926 MOV %RBX,%R13 |
0x53929 LEA -0x8(,%RSI,8),%R8 |
0x53931 LEA (%RBX,%RSI,8),%R11 |
0x53935 SHR $0x3,%R8 |
0x53939 LEA 0x8(,%R10,8),%RCX |
0x53941 INC %R8 |
0x53944 AND $0x7,%R8D |
0x53948 JE 539e1 |
0x5394e CMP $0x1,%R8 |
0x53952 JE 539cb |
0x53954 CMP $0x2,%R8 |
0x53958 JE 539ba |
0x5395a CMP $0x3,%R8 |
0x5395e JE 539a9 |
0x53960 CMP $0x4,%R8 |
0x53964 JE 53998 |
0x53966 CMP $0x5,%R8 |
0x5396a JE 53987 |
0x5396c CMP $0x6,%R8 |
0x53970 JNE 53dff |
0x53976 VMOVSD (%RAX),%XMM2 |
0x5397a ADD $0x8,%R13 |
0x5397e ADD %RCX,%RAX |
0x53981 VMOVSD %XMM2,-0x8(%R13) |
0x53987 VMOVSD (%RAX),%XMM3 |
0x5398b ADD $0x8,%R13 |
0x5398f ADD %RCX,%RAX |
0x53992 VMOVSD %XMM3,-0x8(%R13) |
0x53998 VMOVSD (%RAX),%XMM4 |
0x5399c ADD $0x8,%R13 |
0x539a0 ADD %RCX,%RAX |
0x539a3 VMOVSD %XMM4,-0x8(%R13) |
0x539a9 VMOVSD (%RAX),%XMM5 |
0x539ad ADD $0x8,%R13 |
0x539b1 ADD %RCX,%RAX |
0x539b4 VMOVSD %XMM5,-0x8(%R13) |
0x539ba VMOVSD (%RAX),%XMM6 |
0x539be ADD $0x8,%R13 |
0x539c2 ADD %RCX,%RAX |
0x539c5 VMOVSD %XMM6,-0x8(%R13) |
0x539cb VMOVSD (%RAX),%XMM7 |
0x539cf ADD $0x8,%R13 |
0x539d3 ADD %RCX,%RAX |
0x539d6 VMOVSD %XMM7,-0x8(%R13) |
0x539dc CMP %R13,%R11 |
0x539df JE 53a52 |
(575) 0x539e1 VMOVSD (%RAX),%XMM8 |
(575) 0x539e5 ADD %RCX,%RAX |
(575) 0x539e8 ADD $0x40,%R13 |
(575) 0x539ec VMOVSD %XMM8,-0x40(%R13) |
(575) 0x539f2 VMOVSD (%RAX),%XMM9 |
(575) 0x539f6 ADD %RCX,%RAX |
(575) 0x539f9 VMOVSD %XMM9,-0x38(%R13) |
(575) 0x539ff VMOVSD (%RAX),%XMM10 |
(575) 0x53a03 ADD %RCX,%RAX |
(575) 0x53a06 VMOVSD %XMM10,-0x30(%R13) |
(575) 0x53a0c VMOVSD (%RAX),%XMM11 |
(575) 0x53a10 ADD %RCX,%RAX |
(575) 0x53a13 VMOVSD %XMM11,-0x28(%R13) |
(575) 0x53a19 VMOVSD (%RAX),%XMM12 |
(575) 0x53a1d ADD %RCX,%RAX |
(575) 0x53a20 VMOVSD %XMM12,-0x20(%R13) |
(575) 0x53a26 VMOVSD (%RAX),%XMM13 |
(575) 0x53a2a ADD %RCX,%RAX |
(575) 0x53a2d VMOVSD %XMM13,-0x18(%R13) |
(575) 0x53a33 VMOVSD (%RAX),%XMM14 |
(575) 0x53a37 ADD %RCX,%RAX |
(575) 0x53a3a VMOVSD %XMM14,-0x10(%R13) |
(575) 0x53a40 VMOVSD (%RAX),%XMM15 |
(575) 0x53a44 ADD %RCX,%RAX |
(575) 0x53a47 VMOVSD %XMM15,-0x8(%R13) |
(575) 0x53a4d CMP %R13,%R11 |
(575) 0x53a50 JNE 539e1 |
0x53a52 MOV 0x18(%R12),%R9 |
0x53a57 MOV %RSI,-0xc0(%RBP) |
0x53a5e MOV %R9,-0xc8(%RBP) |
(574) 0x53a65 MOV -0xc0(%RBP),%RDI |
(574) 0x53a6c VXORPD %XMM7,%XMM7,%XMM7 |
(574) 0x53a70 MOV $0x1,%R14D |
(574) 0x53a76 XOR %R13D,%R13D |
(574) 0x53a79 AND $0x3,%EDI |
(574) 0x53a7c JE 53b90 |
(574) 0x53a82 CMP $0x1,%RDI |
(574) 0x53a86 JE 53b2c |
(574) 0x53a8c CMP $0x2,%RDI |
(574) 0x53a90 JE 53ad5 |
(574) 0x53a92 MOV -0xc8(%RBP),%RDX |
(574) 0x53a99 MOV $-0x1,%R10D |
(574) 0x53a9f MOV $0x1,%R13D |
(574) 0x53aa5 VMOVSD -0x8(%RBX,%R13,8),%XMM0 |
(574) 0x53aac CMPL $0x1,(%RDX) |
(574) 0x53aaf CMOVE %R14D,%R10D |
(574) 0x53ab3 MOV %R10D,%R14D |
(574) 0x53ab6 NEG %R14D |
(574) 0x53ab9 VCOMISD %XMM7,%XMM0 |
(574) 0x53abd VANDPD 0x12f9b(%RIP),%XMM0,%XMM0 |
(574) 0x53ac5 CMOVBE %R14D,%R10D |
(574) 0x53ac9 MOV %R10D,%R14D |
(574) 0x53acc CALL 8070 <log@plt> |
(574) 0x53ad1 VMOVSD %XMM0,%XMM0,%XMM7 |
(574) 0x53ad5 MOV -0xc8(%RBP),%RCX |
(574) 0x53adc MOV %R14D,%ESI |
(574) 0x53adf VXORPD %XMM2,%XMM2,%XMM2 |
(574) 0x53ae3 VMOVSD %XMM7,-0xd0(%RBP) |
(574) 0x53aeb NEG %ESI |
(574) 0x53aed MOVSXD (%RCX,%R13,4),%R11 |
(574) 0x53af1 INC %R13 |
(574) 0x53af4 VMOVSD -0x8(%RBX,%R13,8),%XMM1 |
(574) 0x53afb CMP %R11,%R13 |
(574) 0x53afe CMOVE %R14D,%ESI |
(574) 0x53b02 VANDPD 0x12f56(%RIP),%XMM1,%XMM0 |
(574) 0x53b0a MOV %ESI,%R8D |
(574) 0x53b0d NEG %R8D |
(574) 0x53b10 VCOMISD %XMM2,%XMM1 |
(574) 0x53b14 CMOVBE %R8D,%ESI |
(574) 0x53b18 MOV %ESI,%R14D |
(574) 0x53b1b CALL 8070 <log@plt> |
(574) 0x53b20 VMOVSD -0xd0(%RBP),%XMM3 |
(574) 0x53b28 VADDSD %XMM0,%XMM3,%XMM7 |
(574) 0x53b2c MOV -0xc8(%RBP),%RAX |
(574) 0x53b33 MOV %R14D,%EDI |
(574) 0x53b36 VXORPD %XMM5,%XMM5,%XMM5 |
(574) 0x53b3a VMOVSD %XMM7,-0xd0(%RBP) |
(574) 0x53b42 NEG %EDI |
(574) 0x53b44 MOVSXD (%RAX,%R13,4),%R9 |
(574) 0x53b48 INC %R13 |
(574) 0x53b4b VMOVSD -0x8(%RBX,%R13,8),%XMM4 |
(574) 0x53b52 CMP %R9,%R13 |
(574) 0x53b55 CMOVE %R14D,%EDI |
(574) 0x53b59 VANDPD 0x12eff(%RIP),%XMM4,%XMM0 |
(574) 0x53b61 MOV %EDI,%EDX |
(574) 0x53b63 NEG %EDX |
(574) 0x53b65 VCOMISD %XMM5,%XMM4 |
(574) 0x53b69 CMOVBE %EDX,%EDI |
(574) 0x53b6c MOV %EDI,%R14D |
(574) 0x53b6f CALL 8070 <log@plt> |
(574) 0x53b74 VMOVSD -0xd0(%RBP),%XMM6 |
(574) 0x53b7c MOV -0xc0(%RBP),%R10 |
(574) 0x53b83 VADDSD %XMM0,%XMM6,%XMM7 |
(574) 0x53b87 CMP %R10,%R13 |
(574) 0x53b8a JE 53cff |
(574) 0x53b90 MOV %R15D,-0x100(%RBP) |
(574) 0x53b97 MOV %R12,-0x108(%RBP) |
(574) 0x53b9e MOV %RBX,%R12 |
(574) 0x53ba1 MOV %R14D,%EBX |
(574) 0x53ba4 MOV %R13,%R14 |
(574) 0x53ba7 MOV -0xc8(%RBP),%R13 |
(572) 0x53bae MOVSXD (%R13,%R14,4),%R11 |
(572) 0x53bb3 LEA 0x1(%R14),%R15 |
(572) 0x53bb7 MOV %EBX,%ECX |
(572) 0x53bb9 VXORPD %XMM9,%XMM9,%XMM9 |
(572) 0x53bbe NEG %ECX |
(572) 0x53bc0 VMOVSD -0x8(%R12,%R15,8),%XMM8 |
(572) 0x53bc7 VMOVSD %XMM7,-0xd0(%RBP) |
(572) 0x53bcf CMP %R11,%R15 |
(572) 0x53bd2 CMOVE %EBX,%ECX |
(572) 0x53bd5 VANDPD 0x12e83(%RIP),%XMM8,%XMM0 |
(572) 0x53bdd MOV %ECX,%ESI |
(572) 0x53bdf MOV %ECX,%EBX |
(572) 0x53be1 NEG %ESI |
(572) 0x53be3 VCOMISD %XMM9,%XMM8 |
(572) 0x53be8 CMOVBE %ESI,%EBX |
(572) 0x53beb CALL 8070 <log@plt> |
(572) 0x53bf0 MOVSXD (%R13,%R15,4),%R8 |
(572) 0x53bf5 LEA 0x2(%R14),%R15 |
(572) 0x53bf9 VMOVSD -0xd0(%RBP),%XMM10 |
(572) 0x53c01 MOV %EBX,%EAX |
(572) 0x53c03 VMOVSD -0x8(%R12,%R15,8),%XMM12 |
(572) 0x53c0a VXORPD %XMM13,%XMM13,%XMM13 |
(572) 0x53c0f NEG %EAX |
(572) 0x53c11 CMP %R8,%R15 |
(572) 0x53c14 VADDSD %XMM0,%XMM10,%XMM11 |
(572) 0x53c18 CMOVE %EBX,%EAX |
(572) 0x53c1b VANDPD 0x12e3d(%RIP),%XMM12,%XMM0 |
(572) 0x53c23 MOV %EAX,%R9D |
(572) 0x53c26 MOV %EAX,%EBX |
(572) 0x53c28 VMOVSD %XMM11,-0xd0(%RBP) |
(572) 0x53c30 NEG %R9D |
(572) 0x53c33 VCOMISD %XMM13,%XMM12 |
(572) 0x53c38 CMOVBE %R9D,%EBX |
(572) 0x53c3c CALL 8070 <log@plt> |
(572) 0x53c41 MOVSXD (%R13,%R15,4),%RDI |
(572) 0x53c46 LEA 0x3(%R14),%R15 |
(572) 0x53c4a MOV %EBX,%R10D |
(572) 0x53c4d VMOVSD -0x8(%R12,%R15,8),%XMM15 |
(572) 0x53c54 VADDSD -0xd0(%RBP),%XMM0,%XMM14 |
(572) 0x53c5c VXORPD %XMM0,%XMM0,%XMM0 |
(572) 0x53c60 NEG %R10D |
(572) 0x53c63 CMP %RDI,%R15 |
(572) 0x53c66 CMOVE %EBX,%R10D |
(572) 0x53c6a VMOVSD %XMM14,-0xd0(%RBP) |
(572) 0x53c72 MOV %R10D,%EDX |
(572) 0x53c75 MOV %R10D,%EBX |
(572) 0x53c78 NEG %EDX |
(572) 0x53c7a VCOMISD %XMM0,%XMM15 |
(572) 0x53c7e VANDPD 0x12dda(%RIP),%XMM15,%XMM0 |
(572) 0x53c86 CMOVBE %EDX,%EBX |
(572) 0x53c89 ADD $0x4,%R14 |
(572) 0x53c8d CALL 8070 <log@plt> |
(572) 0x53c92 MOVSXD (%R13,%R15,4),%R11 |
(572) 0x53c97 VMOVSD -0x8(%R12,%R14,8),%XMM2 |
(572) 0x53c9e VXORPD %XMM3,%XMM3,%XMM3 |
(572) 0x53ca2 MOV %EBX,%ECX |
(572) 0x53ca4 VADDSD -0xd0(%RBP),%XMM0,%XMM1 |
(572) 0x53cac NEG %ECX |
(572) 0x53cae CMP %R11,%R14 |
(572) 0x53cb1 VANDPD 0x12da7(%RIP),%XMM2,%XMM0 |
(572) 0x53cb9 CMOVE %EBX,%ECX |
(572) 0x53cbc VMOVSD %XMM1,-0xd0(%RBP) |
(572) 0x53cc4 MOV %ECX,%ESI |
(572) 0x53cc6 MOV %ECX,%EBX |
(572) 0x53cc8 NEG %ESI |
(572) 0x53cca VCOMISD %XMM3,%XMM2 |
(572) 0x53cce CMOVBE %ESI,%EBX |
(572) 0x53cd1 CALL 8070 <log@plt> |
(572) 0x53cd6 MOV -0xc0(%RBP),%R8 |
(572) 0x53cdd VADDSD -0xd0(%RBP),%XMM0,%XMM7 |
(572) 0x53ce5 CMP %R8,%R14 |
(572) 0x53ce8 JNE 53bae |
(574) 0x53cee MOV -0x100(%RBP),%R15D |
(574) 0x53cf5 MOV -0x108(%RBP),%R12 |
(574) 0x53cfc MOV %EBX,%R14D |
(574) 0x53cff VMOVSD 0x13b31(%RIP),%XMM4 |
(574) 0x53d07 TEST %R14D,%R14D |
(574) 0x53d0a JLE 53d10 |
(574) 0x53d0c VXORPD %XMM4,%XMM4,%XMM4 |
(574) 0x53d10 MOV -0xe8(%RBP),%R14 |
(574) 0x53d17 MOV -0xf0(%RBP),%R13 |
(574) 0x53d1e SUB $0x8,%RSP |
(574) 0x53d22 MOV %R15D,-0x9c(%RBP) |
(574) 0x53d29 MOV -0xd8(%RBP),%EAX |
(574) 0x53d2f MOV (%R12),%R8 |
(574) 0x53d33 LEA -0x98(%RBP),%RDX |
(574) 0x53d3a LEA -0x9c(%RBP),%RDI |
(574) 0x53d41 VMOVSD %XMM7,(%R14) |
(574) 0x53d46 MOV -0xc8(%RBP),%RCX |
(574) 0x53d4d MOV -0xb8(%RBP),%RSI |
(574) 0x53d54 LEA 0x30(%R12),%R9 |
(574) 0x53d59 MOV %EAX,-0x98(%RBP) |
(574) 0x53d5f VMOVSD %XMM4,(%R13) |
(574) 0x53d65 PUSHQ -0xf8(%RBP) |
(574) 0x53d6b CALL 8250 <dgetri_@plt> |
(574) 0x53d70 POP %RAX |
(574) 0x53d71 MOV -0xe0(%RBP),%RDI |
(574) 0x53d78 POP %RDX |
(574) 0x53d79 CALL 8550 <_ZN11qmcplusplus16BlasThreadingEnvD1Ev@plt> |
(574) 0x53d7e MOV -0x38(%RBP),%RAX |
(574) 0x53d82 SUB %FS:0x28,%RAX |
(574) 0x53d8b JNE 54050 |
0x53d91 LEA -0x28(%RBP),%RSP |
0x53d95 POP %RBX |
0x53d96 POP %R12 |
0x53d98 POP %R13 |
0x53d9a POP %R14 |
0x53d9c POP %R15 |
0x53d9e POP %RBP |
0x53d9f RET |
0x53da0 LEA (%RCX,%R14,4),%RDX |
0x53da4 CMP %RDX,%RDI |
0x53da7 JE 53858 |
0x53dad MOV %RDX,0x20(%R12) |
0x53db2 JMP 53858 |
0x53db7 MOV 0x28(%R12),%R10 |
0x53dbc MOV %RCX,-0xc0(%RBP) |
0x53dc3 MOV %R14,%R9 |
0x53dc6 SUB %RAX,%R9 |
0x53dc9 MOV %R10,%RCX |
0x53dcc SUB %RDI,%RCX |
0x53dcf SAR $0x2,%RCX |
0x53dd3 CMP %R9,%RCX |
0x53dd6 JB 53e39 |
0x53dd8 LEA (,%R9,4),%R15 |
0x53de0 XOR %ESI,%ESI |
0x53de2 MOV %R15,%RDX |
0x53de5 CALL 80e0 <memset@plt> |
0x53dea MOV -0xc0(%RBP),%RCX |
0x53df1 LEA (%RAX,%R15,1),%RAX |
0x53df5 MOV %RAX,0x20(%R12) |
0x53dfa JMP 53858 |
0x53dff MOV -0xb8(%RBP),%RAX |
0x53e06 LEA 0x8(%RBX),%R13 |
0x53e0a VMOVSD (%RAX),%XMM1 |
0x53e0e ADD %RCX,%RAX |
0x53e11 VMOVSD %XMM1,(%RBX) |
0x53e15 JMP 53976 |
0x53e1a MOV 0x18(%R12),%RDI |
0x53e1f MOV %RDI,-0xc8(%RBP) |
0x53e26 JNE 54070 |
0x53e2c VXORPD %XMM7,%XMM7,%XMM7 |
0x53e30 VMOVSD %XMM7,%XMM7,%XMM4 |
0x53e34 JMP 53d10 |
0x53e39 MOV $0x1fffffffffffffff,%RSI |
0x53e43 SUB %RAX,%RSI |
0x53e46 CMP %R9,%RSI |
0x53e49 JB 54055 |
0x53e4f MOV %R8,-0x100(%RBP) |
0x53e56 LEA (%RAX,%RAX,1),%R8 |
0x53e5a CMP %R9,%RAX |
0x53e5d MOV %R8,%R11 |
0x53e60 MOV %RDI,-0xd0(%RBP) |
0x53e67 CMOVB %R14,%R11 |
0x53e6b MOV %R15,-0xd8(%RBP) |
0x53e72 MOV %R10,-0xf8(%RBP) |
0x53e79 LEA (,%R11,4),%RDI |
0x53e81 MOV %R9,-0xc8(%RBP) |
0x53e88 MOV %RDI,%R15 |
0x53e8b LEA 0x40(%RDI),%RSI |
0x53e8f MOV %RDI,-0xc0(%RBP) |
0x53e96 AND $0x3f,%R15D |
0x53e9a SUB %R15,%RSI |
0x53e9d TEST %R15,%R15 |
0x53ea0 CMOVE %RDI,%RSI |
0x53ea4 MOV $0x40,%EDI |
0x53ea9 CALL 8540 <aligned_alloc@plt> |
0x53eae MOV %RAX,%R15 |
0x53eb1 TEST %RAX,%RAX |
0x53eb4 JE a204 |
0x53eba MOV -0xd8(%RBP),%RAX |
0x53ec1 MOV -0xc8(%RBP),%RDX |
0x53ec8 XOR %ESI,%ESI |
0x53eca MOV -0xf8(%RBP),%R9 |
0x53ed1 MOV -0x100(%RBP),%R10 |
0x53ed8 SAL $0x2,%RDX |
0x53edc LEA (%R15,%RAX,1),%RDI |
0x53ee0 MOV %RAX,-0xc8(%RBP) |
0x53ee7 MOV %R9,-0xd8(%RBP) |
0x53eee MOV %R10,-0xf8(%RBP) |
0x53ef5 CALL 80e0 <memset@plt> |
0x53efa MOV -0xf8(%RBP),%R8 |
0x53f01 MOV -0xd0(%RBP),%RSI |
0x53f08 MOV %R15,%R9 |
0x53f0b MOV -0xd8(%RBP),%R11 |
0x53f12 CMP %R8,%RSI |
0x53f15 MOV %R8,%RAX |
0x53f18 JE 5400c |
0x53f1e MOV -0xc8(%RBP),%RCX |
0x53f25 LEA -0x4(%RCX),%RDI |
0x53f29 SHR $0x2,%RDI |
0x53f2d INC %RDI |
0x53f30 AND $0x7,%EDI |
0x53f33 JE 53fc6 |
0x53f39 CMP $0x1,%RDI |
0x53f3d JE 53fb3 |
0x53f3f CMP $0x2,%RDI |
0x53f43 JE 53fa4 |
0x53f45 CMP $0x3,%RDI |
0x53f49 JE 53f96 |
0x53f4b CMP $0x4,%RDI |
0x53f4f JE 53f88 |
0x53f51 CMP $0x5,%RDI |
0x53f55 JE 53f7a |
0x53f57 CMP $0x6,%RDI |
0x53f5b JE 53f6b |
0x53f5d MOV (%R8),%EDX |
0x53f60 LEA 0x4(%R8),%RAX |
0x53f64 LEA 0x4(%R15),%R9 |
0x53f68 MOV %EDX,(%R15) |
0x53f6b MOV (%RAX),%R10D |
0x53f6e ADD $0x4,%R9 |
0x53f72 ADD $0x4,%RAX |
0x53f76 MOV %R10D,-0x4(%R9) |
0x53f7a MOV (%RAX),%ECX |
0x53f7c ADD $0x4,%R9 |
0x53f80 ADD $0x4,%RAX |
0x53f84 MOV %ECX,-0x4(%R9) |
0x53f88 MOV (%RAX),%EDI |
0x53f8a ADD $0x4,%R9 |
0x53f8e ADD $0x4,%RAX |
0x53f92 MOV %EDI,-0x4(%R9) |
0x53f96 MOV (%RAX),%EDX |
0x53f98 ADD $0x4,%R9 |
0x53f9c ADD $0x4,%RAX |
0x53fa0 MOV %EDX,-0x4(%R9) |
0x53fa4 MOV (%RAX),%R10D |
0x53fa7 ADD $0x4,%R9 |
0x53fab ADD $0x4,%RAX |
0x53faf MOV %R10D,-0x4(%R9) |
0x53fb3 MOV (%RAX),%ECX |
0x53fb5 ADD $0x4,%RAX |
0x53fb9 ADD $0x4,%R9 |
0x53fbd MOV %ECX,-0x4(%R9) |
0x53fc1 CMP %RAX,%RSI |
0x53fc4 JE 5400c |
(576) 0x53fc6 MOV (%RAX),%EDI |
(576) 0x53fc8 ADD $0x20,%RAX |
(576) 0x53fcc ADD $0x20,%R9 |
(576) 0x53fd0 MOV %EDI,-0x20(%R9) |
(576) 0x53fd4 MOV -0x1c(%RAX),%EDX |
(576) 0x53fd7 MOV %EDX,-0x1c(%R9) |
(576) 0x53fdb MOV -0x18(%RAX),%R10D |
(576) 0x53fdf MOV %R10D,-0x18(%R9) |
(576) 0x53fe3 MOV -0x14(%RAX),%ECX |
(576) 0x53fe6 MOV %ECX,-0x14(%R9) |
(576) 0x53fea MOV -0x10(%RAX),%EDI |
(576) 0x53fed MOV %EDI,-0x10(%R9) |
(576) 0x53ff1 MOV -0xc(%RAX),%EDX |
(576) 0x53ff4 MOV %EDX,-0xc(%R9) |
(576) 0x53ff8 MOV -0x8(%RAX),%R10D |
(576) 0x53ffc MOV %R10D,-0x8(%R9) |
(576) 0x54000 MOV -0x4(%RAX),%ECX |
(576) 0x54003 MOV %ECX,-0x4(%R9) |
(576) 0x54007 CMP %RAX,%RSI |
(576) 0x5400a JNE 53fc6 |
0x5400c TEST %R8,%R8 |
0x5400f JE 54023 |
0x54011 MOV %R11,%RSI |
0x54014 MOV %R8,%RDI |
0x54017 SUB %R8,%RSI |
0x5401a SAR $0x2,%RSI |
0x5401e CALL 65b50 <_ZN11qmcplusplus10MallocatorIdLm64EE10deallocateEPdm.isra.0> |
0x54023 MOV -0xc0(%RBP),%RSI |
0x5402a LEA (%R15,%R14,4),%R8 |
0x5402e VMOVQ %R15,%XMM15 |
0x54033 MOV %R15,%RCX |
0x54036 VPINSRQ $0x1,%R8,%XMM15,%XMM0 |
0x5403c ADD %R15,%RSI |
0x5403f VMOVDQU %XMM0,0x18(%R12) |
0x54046 MOV %RSI,0x28(%R12) |
0x5404b JMP 53858 |
(573) 0x54050 CALL 80d0 <__stack_chk_fail@plt> |
(573) 0x54055 MOV -0x38(%RBP),%RAX |
(573) 0x54059 SUB %FS:0x28,%RAX |
(573) 0x54062 JNE 54050 |
(574) 0x54064 LEA 0x11f9c(%RIP),%RDI |
(574) 0x5406b CALL 8180 <_ZSt20__throw_length_errorPKc@plt> |
(574) 0x54070 MOVSXD %R15D,%RDX |
(574) 0x54073 MOV %RDX,-0xc0(%RBP) |
(574) 0x5407a JMP 53a65 |
0x5407f MOV %RAX,%RBX |
0x54082 VZEROUPPER |
0x54085 JMP a289 |
0x5408a NOPW (%RAX,%RAX,1) |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►100.00+ | miniqmcreference::DiracDetermi[...] | DelayedUpdate.h:79 | libqmcwfs.so |
○ | miniqmcreference::DiracDetermi[...] | DiracDeterminantRef.cpp:238 | libqmcwfs.so |
○ | qmcplusplus::WaveFunction::eva[...] | WaveFunction.cpp:178 | libqmcwfs.so |
○ | main._omp_fn.0 | miniqmc.cpp:390 | exec |
○ | GOMP_parallel | libgomp.h:985 | libgomp.so.1.0.0 |
Path / |
Source file and lines | DiracMatrix.h:28-120 |
Module | libqmcwfs.so |
nb instructions | 300 |
nb uops | 315 |
loop length | 1320 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 9 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 20 |
micro-operation queue | 78.75 cycles |
front end | 78.75 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | |
---|---|---|---|---|---|---|---|---|
uops | 40.50 | 40.50 | 39.50 | 39.17 | 62.00 | 40.50 | 40.50 | 39.33 |
cycles | 40.50 | 40.50 | 39.50 | 39.17 | 62.00 | 40.50 | 40.50 | 39.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 75.73 |
Stall cycles | 0.00 |
Front-end | 78.75 |
Dispatch | 62.00 |
Overall L1 | 78.75 |
all | 2% |
load | 0% |
store | 2% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 3% |
all | 5% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 33% |
all | 3% |
load | 0% |
store | 2% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 5% |
all | 11% |
load | 8% |
store | 10% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 13% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 16% |
all | 11% |
load | 11% |
store | 10% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSH %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RSI,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSH %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RDX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSH %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA -0x88(%RBP),%R13 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSH %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RDI,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
LEA -0x4e18(%RIP),%RDI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
SUB $0xe8,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %R8,-0xf0(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RCX,-0xe8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %FS:0x28,%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RAX,-0x38(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOVL $0x1,-0x88(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 2 | 1 |
CALL 84e0 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV -0x88(%RBP),%ESI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA -0xa0(%RBP),%RDI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,-0xe0(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CALL 81d0 <_ZN11qmcplusplus16BlasThreadingEnvC1Ei@plt> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV (%R14),%R11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x8(%R14),%RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x30(%R14),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x8(%R15),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %R11D,-0xa4(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOVSXD %R11D,%R11 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV 0x30(%R15),%R8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %EBX,-0xa8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RAX,-0xb8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
TEST %R11,%R11 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 5381e | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
LEA (,%R11,8),%R10 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (,%RBX,8),%R14 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
SAL $0x3,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
LEA (%RAX,%R10,1),%RDI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV 0x18(%R12),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RCX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CMP 0x30(%R12),%EBX | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
JLE 538c7 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV 0x20(%R12),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOVSXD %EBX,%R14 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RDI,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
SUB %RCX,%R15 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
SAR $0x2,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
CMP %R14,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JB 53db7 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMP %RAX,%R14 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JB 53da0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV %EBX,-0x8c(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV -0xb8(%RBP),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA -0x90(%RBP),%RDX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %EBX,-0x90(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA -0x94(%RBP),%RBX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA -0x8c(%RBP),%RDI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOVL $-0x1,0x30(%R12) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 2 | 1 |
LEA 0x30(%R12),%R9 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CALL 8250 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
VCVTTSD2SI -0x88(%RBP),%R13D | 2 | 1.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 6 | 1 |
POP %RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
POP %RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
MOV %R13D,0x30(%R12) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOVSXD %R13D,%RSI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CALL 2b160 <_ZNSt6vectorIdN11qmcplusplus10MallocatorIdLm64EEEE6resizeEm> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
LEA 0x78(%R12),%RDI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 2b160 <_ZNSt6vectorIdN11qmcplusplus10MallocatorIdLm64EEEE6resizeEm> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV 0x18(%R12),%R8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA -0xa4(%RBP),%RDI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xb8(%RBP),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA -0xac(%RBP),%R9 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA -0xa8(%RBP),%RCX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R9,-0xf8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CALL 8430 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV -0xa8(%RBP),%R14D | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0xa4(%RBP),%R15D | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x78(%R12),%RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %R14D,-0xd8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
TEST %R15D,%R15D | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JLE 53e1a | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOVSXD %R15D,%RSI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOVSXD -0xd8(%RBP),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0xb8(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RBX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
LEA -0x8(,%RSI,8),%R8 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%RBX,%RSI,8),%R11 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
SHR $0x3,%R8 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
LEA 0x8(,%R10,8),%RCX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
INC %R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
AND $0x7,%R8D | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 539e1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMP $0x1,%R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 539cb | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMP $0x2,%R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 539ba | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMP $0x3,%R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 539a9 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMP $0x4,%R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 53998 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMP $0x5,%R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 53987 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMP $0x6,%R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JNE 53dff | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
VMOVSD (%RAX),%XMM2 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD $0x8,%R13 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD %RCX,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVSD %XMM2,-0x8(%R13) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD (%RAX),%XMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD $0x8,%R13 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD %RCX,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVSD %XMM3,-0x8(%R13) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD (%RAX),%XMM4 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD $0x8,%R13 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD %RCX,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVSD %XMM4,-0x8(%R13) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD (%RAX),%XMM5 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD $0x8,%R13 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD %RCX,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVSD %XMM5,-0x8(%R13) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD (%RAX),%XMM6 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD $0x8,%R13 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD %RCX,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVSD %XMM6,-0x8(%R13) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD (%RAX),%XMM7 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD $0x8,%R13 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD %RCX,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVSD %XMM7,-0x8(%R13) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CMP %R13,%R11 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 53a52 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV 0x18(%R12),%R9 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RSI,-0xc0(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R9,-0xc8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
POP %RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %RBP | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
RET | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 | 0 | 1 |
LEA (%RCX,%R14,4),%RDX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %RDX,%RDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 53858 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV %RDX,0x20(%R12) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
JMP 53858 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
MOV 0x28(%R12),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RCX,-0xc0(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R14,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
SUB %RAX,%R9 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %R10,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
SUB %RDI,%RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SAR $0x2,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
CMP %R9,%RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JB 53e39 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
LEA (,%R9,4),%R15 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R15,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 80e0 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV -0xc0(%RBP),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%RAX,%R15,1),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x20(%R12) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
JMP 53858 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
MOV -0xb8(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA 0x8(%RBX),%R13 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD (%RAX),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD %RCX,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVSD %XMM1,(%RBX) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
JMP 53976 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
MOV 0x18(%R12),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RDI,-0xc8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
JNE 54070 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
VXORPD %XMM7,%XMM7,%XMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVSD %XMM7,%XMM7,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
JMP 53d10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
MOV $0x1fffffffffffffff,%RSI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SUB %RAX,%RSI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMP %R9,%RSI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JB 54055 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV %R8,-0x100(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA (%RAX,%RAX,1),%R8 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %R9,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %R8,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RDI,-0xd0(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CMOVB %R14,%R11 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
MOV %R15,-0xd8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R10,-0xf8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA (,%R11,4),%RDI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,-0xc8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RDI,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
LEA 0x40(%RDI),%RSI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,-0xc0(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
AND $0x3f,%R15D | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SUB %R15,%RSI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
TEST %R15,%R15 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMOVE %RDI,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
MOV $0x40,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CALL 8540 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
TEST %RAX,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE a204 <_ZN11qmcplusplus11DiracMatrixIddE16invert_transposeERKNS_6MatrixIdSaIdEEERS4_RdS8_.cold> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV -0xd8(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0xc8(%RBP),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV -0xf8(%RBP),%R9 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x100(%RBP),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
SAL $0x2,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
LEA (%R15,%RAX,1),%RDI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,-0xc8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R9,-0xd8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R10,-0xf8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CALL 80e0 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV -0xf8(%RBP),%R8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0xd0(%RBP),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %R15,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV -0xd8(%RBP),%R11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
CMP %R8,%RSI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %R8,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
JE 5400c | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV -0xc8(%RBP),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA -0x4(%RCX),%RDI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
SHR $0x2,%RDI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
INC %RDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
AND $0x7,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 53fc6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMP $0x1,%RDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 53fb3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMP $0x2,%RDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 53fa4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMP $0x3,%RDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 53f96 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMP $0x4,%RDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 53f88 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMP $0x5,%RDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 53f7a | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMP $0x6,%RDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 53f6b | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV (%R8),%EDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA 0x4(%R8),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x4(%R15),%R9 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %EDX,(%R15) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV (%RAX),%R10D | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD $0x4,%R9 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD $0x4,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %R10D,-0x4(%R9) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV (%RAX),%ECX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD $0x4,%R9 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD $0x4,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %ECX,-0x4(%R9) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV (%RAX),%EDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD $0x4,%R9 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD $0x4,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %EDI,-0x4(%R9) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV (%RAX),%EDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD $0x4,%R9 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD $0x4,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %EDX,-0x4(%R9) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV (%RAX),%R10D | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD $0x4,%R9 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD $0x4,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %R10D,-0x4(%R9) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV (%RAX),%ECX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD $0x4,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD $0x4,%R9 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %ECX,-0x4(%R9) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CMP %RAX,%RSI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 5400c | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
TEST %R8,%R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 54023 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV %R11,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R8,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
SUB %R8,%RSI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SAR $0x2,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
CALL 65b50 <_ZN11qmcplusplus10MallocatorIdLm64EE10deallocateEPdm.isra.0> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV -0xc0(%RBP),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%R15,%R14,4),%R8 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVQ %R15,%XMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
MOV %R15,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VPINSRQ $0x1,%R8,%XMM15,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 2 | 0 | 0 | 3 | 2 |
ADD %R15,%RSI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVDQU %XMM0,0x18(%R12) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 4 | 1 |
MOV %RSI,0x28(%R12) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
JMP 53858 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VZEROUPPER | 4 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JMP a289 <_ZN11qmcplusplus11DiracMatrixIddE16invert_transposeERKNS_6MatrixIdSaIdEEERS4_RdS8_.cold+0x85> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
Source file and lines | DiracMatrix.h:28-120 |
Module | libqmcwfs.so |
nb instructions | 300 |
nb uops | 315 |
loop length | 1320 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 9 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 20 |
micro-operation queue | 78.75 cycles |
front end | 78.75 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | |
---|---|---|---|---|---|---|---|---|
uops | 40.50 | 40.50 | 39.50 | 39.17 | 62.00 | 40.50 | 40.50 | 39.33 |
cycles | 40.50 | 40.50 | 39.50 | 39.17 | 62.00 | 40.50 | 40.50 | 39.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 75.73 |
Stall cycles | 0.00 |
Front-end | 78.75 |
Dispatch | 62.00 |
Overall L1 | 78.75 |
all | 2% |
load | 0% |
store | 2% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 3% |
all | 5% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 33% |
all | 3% |
load | 0% |
store | 2% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 5% |
all | 11% |
load | 8% |
store | 10% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 13% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 16% |
all | 11% |
load | 11% |
store | 10% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSH %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RSI,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSH %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RDX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSH %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA -0x88(%RBP),%R13 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSH %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RDI,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
LEA -0x4e18(%RIP),%RDI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
SUB $0xe8,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %R8,-0xf0(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RCX,-0xe8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %FS:0x28,%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RAX,-0x38(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOVL $0x1,-0x88(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 2 | 1 |
CALL 84e0 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV -0x88(%RBP),%ESI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA -0xa0(%RBP),%RDI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,-0xe0(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CALL 81d0 <_ZN11qmcplusplus16BlasThreadingEnvC1Ei@plt> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV (%R14),%R11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x8(%R14),%RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x30(%R14),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x8(%R15),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %R11D,-0xa4(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOVSXD %R11D,%R11 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV 0x30(%R15),%R8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %EBX,-0xa8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RAX,-0xb8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
TEST %R11,%R11 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 5381e | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
LEA (,%R11,8),%R10 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (,%RBX,8),%R14 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
SAL $0x3,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
LEA (%RAX,%R10,1),%RDI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV 0x18(%R12),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RCX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CMP 0x30(%R12),%EBX | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
JLE 538c7 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV 0x20(%R12),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOVSXD %EBX,%R14 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RDI,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
SUB %RCX,%R15 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
SAR $0x2,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
CMP %R14,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JB 53db7 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMP %RAX,%R14 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JB 53da0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV %EBX,-0x8c(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV -0xb8(%RBP),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA -0x90(%RBP),%RDX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %EBX,-0x90(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA -0x94(%RBP),%RBX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA -0x8c(%RBP),%RDI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOVL $-0x1,0x30(%R12) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 2 | 1 |
LEA 0x30(%R12),%R9 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CALL 8250 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
VCVTTSD2SI -0x88(%RBP),%R13D | 2 | 1.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 6 | 1 |
POP %RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
POP %RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
MOV %R13D,0x30(%R12) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOVSXD %R13D,%RSI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CALL 2b160 <_ZNSt6vectorIdN11qmcplusplus10MallocatorIdLm64EEEE6resizeEm> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
LEA 0x78(%R12),%RDI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 2b160 <_ZNSt6vectorIdN11qmcplusplus10MallocatorIdLm64EEEE6resizeEm> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV 0x18(%R12),%R8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA -0xa4(%RBP),%RDI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xb8(%RBP),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA -0xac(%RBP),%R9 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA -0xa8(%RBP),%RCX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R9,-0xf8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CALL 8430 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV -0xa8(%RBP),%R14D | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0xa4(%RBP),%R15D | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x78(%R12),%RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %R14D,-0xd8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
TEST %R15D,%R15D | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JLE 53e1a | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOVSXD %R15D,%RSI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOVSXD -0xd8(%RBP),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0xb8(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RBX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
LEA -0x8(,%RSI,8),%R8 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%RBX,%RSI,8),%R11 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
SHR $0x3,%R8 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
LEA 0x8(,%R10,8),%RCX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
INC %R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
AND $0x7,%R8D | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 539e1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMP $0x1,%R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 539cb | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMP $0x2,%R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 539ba | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMP $0x3,%R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 539a9 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMP $0x4,%R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 53998 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMP $0x5,%R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 53987 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMP $0x6,%R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JNE 53dff | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
VMOVSD (%RAX),%XMM2 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD $0x8,%R13 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD %RCX,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVSD %XMM2,-0x8(%R13) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD (%RAX),%XMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD $0x8,%R13 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD %RCX,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVSD %XMM3,-0x8(%R13) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD (%RAX),%XMM4 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD $0x8,%R13 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD %RCX,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVSD %XMM4,-0x8(%R13) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD (%RAX),%XMM5 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD $0x8,%R13 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD %RCX,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVSD %XMM5,-0x8(%R13) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD (%RAX),%XMM6 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD $0x8,%R13 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD %RCX,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVSD %XMM6,-0x8(%R13) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD (%RAX),%XMM7 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD $0x8,%R13 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD %RCX,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVSD %XMM7,-0x8(%R13) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CMP %R13,%R11 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 53a52 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV 0x18(%R12),%R9 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RSI,-0xc0(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R9,-0xc8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
POP %RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %RBP | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
RET | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 | 0 | 1 |
LEA (%RCX,%R14,4),%RDX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %RDX,%RDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 53858 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV %RDX,0x20(%R12) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
JMP 53858 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
MOV 0x28(%R12),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RCX,-0xc0(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R14,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
SUB %RAX,%R9 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %R10,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
SUB %RDI,%RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SAR $0x2,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
CMP %R9,%RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JB 53e39 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
LEA (,%R9,4),%R15 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R15,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 80e0 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV -0xc0(%RBP),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%RAX,%R15,1),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x20(%R12) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
JMP 53858 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
MOV -0xb8(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA 0x8(%RBX),%R13 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD (%RAX),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD %RCX,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVSD %XMM1,(%RBX) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
JMP 53976 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
MOV 0x18(%R12),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RDI,-0xc8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
JNE 54070 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
VXORPD %XMM7,%XMM7,%XMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVSD %XMM7,%XMM7,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
JMP 53d10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
MOV $0x1fffffffffffffff,%RSI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SUB %RAX,%RSI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMP %R9,%RSI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JB 54055 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV %R8,-0x100(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA (%RAX,%RAX,1),%R8 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %R9,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %R8,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RDI,-0xd0(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CMOVB %R14,%R11 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
MOV %R15,-0xd8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R10,-0xf8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA (,%R11,4),%RDI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,-0xc8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RDI,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
LEA 0x40(%RDI),%RSI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,-0xc0(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
AND $0x3f,%R15D | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SUB %R15,%RSI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
TEST %R15,%R15 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMOVE %RDI,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
MOV $0x40,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CALL 8540 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
TEST %RAX,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE a204 <_ZN11qmcplusplus11DiracMatrixIddE16invert_transposeERKNS_6MatrixIdSaIdEEERS4_RdS8_.cold> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV -0xd8(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0xc8(%RBP),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV -0xf8(%RBP),%R9 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x100(%RBP),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
SAL $0x2,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
LEA (%R15,%RAX,1),%RDI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,-0xc8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R9,-0xd8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R10,-0xf8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CALL 80e0 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV -0xf8(%RBP),%R8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0xd0(%RBP),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %R15,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV -0xd8(%RBP),%R11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
CMP %R8,%RSI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %R8,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
JE 5400c | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV -0xc8(%RBP),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA -0x4(%RCX),%RDI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
SHR $0x2,%RDI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
INC %RDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
AND $0x7,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 53fc6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMP $0x1,%RDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 53fb3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMP $0x2,%RDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 53fa4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMP $0x3,%RDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 53f96 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMP $0x4,%RDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 53f88 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMP $0x5,%RDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 53f7a | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMP $0x6,%RDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 53f6b | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV (%R8),%EDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA 0x4(%R8),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x4(%R15),%R9 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %EDX,(%R15) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV (%RAX),%R10D | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD $0x4,%R9 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD $0x4,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %R10D,-0x4(%R9) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV (%RAX),%ECX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD $0x4,%R9 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD $0x4,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %ECX,-0x4(%R9) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV (%RAX),%EDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD $0x4,%R9 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD $0x4,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %EDI,-0x4(%R9) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV (%RAX),%EDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD $0x4,%R9 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD $0x4,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %EDX,-0x4(%R9) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV (%RAX),%R10D | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD $0x4,%R9 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD $0x4,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %R10D,-0x4(%R9) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV (%RAX),%ECX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD $0x4,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD $0x4,%R9 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %ECX,-0x4(%R9) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CMP %RAX,%RSI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 5400c | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
TEST %R8,%R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 54023 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV %R11,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R8,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
SUB %R8,%RSI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SAR $0x2,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
CALL 65b50 <_ZN11qmcplusplus10MallocatorIdLm64EE10deallocateEPdm.isra.0> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV -0xc0(%RBP),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%R15,%R14,4),%R8 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVQ %R15,%XMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
MOV %R15,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VPINSRQ $0x1,%R8,%XMM15,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 2 | 0 | 0 | 3 | 2 |
ADD %R15,%RSI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVDQU %XMM0,0x18(%R12) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 4 | 1 |
MOV %RSI,0x28(%R12) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
JMP 53858 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VZEROUPPER | 4 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JMP a289 <_ZN11qmcplusplus11DiracMatrixIddE16invert_transposeERKNS_6MatrixIdSaIdEEERS4_RdS8_.cold+0x85> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼qmcplusplus::DiracMatrix | 0.37 | 0 |
▼Loop 574 - DiracMatrix.h:28-120 - libqmcwfs.so– | 0 | 0 |
○Loop 572 - DiracMatrix.h:30-34 - libqmcwfs.so | 0 | 0 |
○Loop 573 - stl_vector.h:1896-1896 - libqmcwfs.so | 0 | 0 |
○Loop 576 - alloc_traits.h:276-276 - libqmcwfs.so | 0 | 0 |
▼Loop 578 - inner_product.hpp:209-211 - libqmcwfs.so– | 0 | 0 |
○Loop 577 - inner_product.hpp:210-211 - libqmcwfs.so | 0.37 | 0 |
○Loop 575 - DiracMatrix.h:111-112 - libqmcwfs.so | 0 | 0 |