Function: miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::acceptMove(qmcp ... | Module: exec | Source: TwoBodyJastrowRef.h:259-353 [...] | Coverage: 1.05% |
---|
Function: miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::acceptMove(qmcp ... | Module: exec | Source: TwoBodyJastrowRef.h:259-353 [...] | Coverage: 1.05% |
---|
/home/kcamus/qaas_runs/169-451-1869/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/Jastrow/TwoBodyJastrowRef.h: 259 - 353 |
-------------------------------------------------------------------------------- |
259: const int jelmax = triangle ? iat : N; |
[...] |
265: const int igt = P.GroupID[iat] * NumGroups; |
266: for (int jg = 0; jg < NumGroups; ++jg) |
267: { |
268: const FuncType& f2(*F[igt + jg]); |
269: int iStart = P.first(jg); |
270: int iEnd = std::min(jelmax, P.last(jg)); |
271: f2.evaluateVGL(iat, iStart, iEnd, dist, u, du, d2u, DistCompressed.data(), DistIndice.data()); |
[...] |
308: { |
309: // get the old u, du, d2u |
310: const DistanceTableData* d_table = P.DistTables[0]; |
311: computeU3(P, iat, d_table->Distances[iat], old_u.data(), old_du.data(), old_d2u.data()); |
312: if (UpdateMode == ORB_PBYP_RATIO) |
[...] |
322: for (int jat = 0; jat < N; jat++) |
323: { |
324: const valT du = cur_u[jat] - old_u[jat]; |
325: const valT newl = cur_d2u[jat] + lapfac * cur_du[jat]; |
326: const valT dl = old_d2u[jat] + lapfac * old_du[jat] - newl; |
327: Uat[jat] += du; |
328: d2Uat[jat] += dl; |
329: cur_d2Uat -= newl; |
330: } |
331: posT cur_dUat; |
332: for (int idim = 0; idim < OHMMS_DIM; ++idim) |
[...] |
339: valT cur_g = cur_dUat[idim]; |
340: for (int jat = 0; jat < N; jat++) |
341: { |
342: const valT newg = cur_du_pt[jat] * new_dX[jat]; |
343: const valT dg = newg - old_du_pt[jat] * old_dX[jat]; |
344: save_g[jat] -= dg; |
345: cur_g += newg; |
346: } |
347: cur_dUat[idim] = cur_g; |
348: } |
349: LogValue += Uat[iat] - cur_Uat; |
350: Uat[iat] = cur_Uat; |
351: dUat(iat) = cur_dUat; |
352: d2Uat[iat] = cur_d2Uat; |
353: } |
/home/kcamus/qaas_runs/169-451-1869/intel/miniqmc/build/miniqmc/src/Particle/ParticleSet.h: 302 - 305 |
-------------------------------------------------------------------------------- |
302: inline int first(int igroup) const { return SubPtcl[igroup]; } |
303: |
304: /// return the last index of a group i |
305: inline int last(int igroup) const { return SubPtcl[igroup + 1]; } |
/home/kcamus/qaas_runs/169-451-1869/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/OhmmsMatrix.h: 214 - 214 |
-------------------------------------------------------------------------------- |
214: inline const Type_t* operator[](size_type i) const { return X.data() + i * D2; } |
/home/kcamus/qaas_runs/169-451-1869/intel/miniqmc/build/miniqmc/src/Numerics/PETE/OperatorTags.h: 183 - 183 |
-------------------------------------------------------------------------------- |
183: return (const_cast<T1&>(a) = b); |
/home/kcamus/qaas_runs/169-451-1869/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/OhmmsVector.h: 223 - 229 |
-------------------------------------------------------------------------------- |
223: return X[i]; |
[...] |
229: return X[i]; |
/home/kcamus/qaas_runs/169-451-1869/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/VectorSoAContainer.h: 216 - 243 |
-------------------------------------------------------------------------------- |
216: *(_base + M * i) = rhs[i]; |
[...] |
241: T* restrict data(size_t i) { return myData + i * nGhosts; } |
242: ///return the const pointer of the i-th components |
243: const T* restrict data(size_t i) const { return myData + i * nGhosts; } |
/usr/lib64/gcc/x86_64-pc-linux-gnu/13.1.1/../../../../include/c++/13.1.1/bits/stl_algobase.h: 930 - 1123 |
-------------------------------------------------------------------------------- |
930: for (; __first != __last; ++__first) |
931: *__first = __tmp; |
[...] |
1123: if (__n <= 0) |
/usr/lib64/gcc/x86_64-pc-linux-gnu/13.1.1/../../../../include/c++/13.1.1/bits/stl_vector.h: 1126 - 1263 |
-------------------------------------------------------------------------------- |
1126: return *(this->_M_impl._M_start + __n); |
[...] |
1145: return *(this->_M_impl._M_start + __n); |
[...] |
1258: { return _M_data_ptr(this->_M_impl._M_start); } |
1259: |
1260: _GLIBCXX_NODISCARD _GLIBCXX20_CONSTEXPR |
1261: const _Tp* |
1262: data() const _GLIBCXX_NOEXCEPT |
1263: { return _M_data_ptr(this->_M_impl._M_start); } |
0x41cb30 PUSH %RBP |
0x41cb31 MOV %RSP,%RBP |
0x41cb34 PUSH %R15 |
0x41cb36 PUSH %R14 |
0x41cb38 PUSH %R13 |
0x41cb3a PUSH %R12 |
0x41cb3c PUSH %RBX |
0x41cb3d SUB $0x88,%RSP |
0x41cb44 MOV %EDX,%R14D |
0x41cb47 MOV %RSI,%R15 |
0x41cb4a MOV 0xa10(%RSI),%RAX |
0x41cb51 MOV (%RAX),%RDX |
0x41cb54 MOVSXD %R14D,%RCX |
0x41cb57 MOV 0x18(%RDX),%RBX |
0x41cb5b MOV %RCX,%RAX |
0x41cb5e MOV %RCX,-0x88(%RBP) |
0x41cb65 IMUL %RCX,%RBX |
0x41cb69 SAL $0x3,%RBX |
0x41cb6d MOV %RDX,-0x78(%RBP) |
0x41cb71 ADD 0x40(%RDX),%RBX |
0x41cb75 MOV 0x90(%RDI),%R12 |
0x41cb7c MOV 0x188(%RDI),%RSI |
0x41cb83 MOV 0x1a0(%RDI),%R10 |
0x41cb8a MOV 0x1b8(%RDI),%R11 |
0x41cb91 TEST %R12D,%R12D |
0x41cb94 MOV %RDI,-0x40(%RBP) |
0x41cb98 MOV %R10,-0x50(%RBP) |
0x41cb9c MOV %R11,-0x48(%RBP) |
0x41cba0 JLE 41cbeb |
0x41cba2 MOV %R12D,%R13D |
0x41cba5 TEST %R13,%R13 |
0x41cba8 JE 41cbeb |
0x41cbaa SAL $0x3,%R13 |
0x41cbae MOV %RSI,%RDI |
0x41cbb1 MOV %RSI,-0x60(%RBP) |
0x41cbb5 XOR %ESI,%ESI |
0x41cbb7 MOV %R13,%RDX |
0x41cbba CALL 47ebf0 <_intel_fast_memset> |
0x41cbbf MOV -0x50(%RBP),%RDI |
0x41cbc3 XOR %ESI,%ESI |
0x41cbc5 MOV %R13,%RDX |
0x41cbc8 CALL 47ebf0 <_intel_fast_memset> |
0x41cbcd MOV -0x48(%RBP),%RDI |
0x41cbd1 XOR %ESI,%ESI |
0x41cbd3 MOV %R13,%RDX |
0x41cbd6 CALL 47ebf0 <_intel_fast_memset> |
0x41cbdb MOV -0x60(%RBP),%RSI |
0x41cbdf MOV -0x48(%RBP),%R11 |
0x41cbe3 MOV -0x50(%RBP),%R10 |
0x41cbe7 MOV -0x40(%RBP),%RDI |
0x41cbeb MOV %R14D,-0x70(%RBP) |
0x41cbef MOV 0xa0(%RDI),%RAX |
0x41cbf6 TEST %RAX,%RAX |
0x41cbf9 MOV %R15,-0x60(%RBP) |
0x41cbfd JE 41ccb0 |
0x41cc03 MOV 0x5c0(%R15),%RCX |
0x41cc0a MOV -0x88(%RBP),%RDX |
0x41cc11 IMUL (%RCX,%RDX,4),%EAX |
0x41cc15 CLTQ |
0x41cc17 SAL $0x3,%RAX |
0x41cc1b MOV %RAX,-0x58(%RBP) |
0x41cc1f XOR %EAX,%EAX |
0x41cc21 MOV %RBX,-0x68(%RBP) |
0x41cc25 MOV -0x70(%RBP),%EBX |
0x41cc28 MOV %RSI,%R14 |
0x41cc2b NOPL (%RAX,%RAX,1) |
(249) 0x41cc30 MOV 0x200(%RDI),%RCX |
(249) 0x41cc37 ADD -0x58(%RBP),%RCX |
(249) 0x41cc3b MOV (%RCX,%RAX,8),%RDI |
(249) 0x41cc3f MOV 0xa98(%R15),%RCX |
(249) 0x41cc46 LEA 0x1(%RAX),%R15 |
(249) 0x41cc4a MOV (%RCX,%RAX,4),%EDX |
(249) 0x41cc4d MOV 0x4(%RCX,%RAX,4),%ECX |
(249) 0x41cc51 CMP %R12D,%ECX |
(249) 0x41cc54 CMOVGE %R12D,%ECX |
(249) 0x41cc58 MOV %EBX,%ESI |
(249) 0x41cc5a MOV -0x68(%RBP),%R8 |
(249) 0x41cc5e MOV %R14,%R9 |
(249) 0x41cc61 MOV -0x40(%RBP),%RAX |
(249) 0x41cc65 PUSHQ 0x1e8(%RAX) |
(249) 0x41cc6b MOV -0x40(%RBP),%RAX |
(249) 0x41cc6f PUSHQ 0x1d0(%RAX) |
(249) 0x41cc75 PUSH %R11 |
(249) 0x41cc77 PUSH %R10 |
(249) 0x41cc79 CALL 41aa40 <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi> |
(249) 0x41cc7e MOV -0x48(%RBP),%R11 |
(249) 0x41cc82 MOV -0x50(%RBP),%R10 |
(249) 0x41cc86 MOV -0x40(%RBP),%RDI |
(249) 0x41cc8a ADD $0x20,%RSP |
(249) 0x41cc8e MOV 0xa0(%RDI),%R13 |
(249) 0x41cc95 MOV %R15,%RAX |
(249) 0x41cc98 CMP %R15,%R13 |
(249) 0x41cc9b MOV -0x60(%RBP),%R15 |
(249) 0x41cc9f JA 41cc30 |
0x41cca1 MOV %R13D,%R8D |
0x41cca4 CMPL $0,0xc(%RDI) |
0x41cca8 JNE 41cdd9 |
0x41ccae JMP 41ccc0 |
0x41ccb0 XOR %R13D,%R13D |
0x41ccb3 XOR %R8D,%R8D |
0x41ccb6 CMPL $0,0xc(%RDI) |
0x41ccba JNE 41cdd9 |
0x41ccc0 MOV -0x78(%RBP),%RAX |
0x41ccc4 MOV 0x68(%RAX),%R12 |
0x41ccc8 MOV 0x90(%RDI),%RBX |
0x41cccf MOV 0x140(%RDI),%RAX |
0x41ccd6 MOV 0x158(%RDI),%R14 |
0x41ccdd MOV 0x170(%RDI),%R10 |
0x41cce4 TEST %EBX,%EBX |
0x41cce6 MOV %RAX,-0x48(%RBP) |
0x41ccea MOV %R10,-0x50(%RBP) |
0x41ccee JLE 41cd3b |
0x41ccf0 MOV %EBX,%EDX |
0x41ccf2 TEST %RDX,%RDX |
0x41ccf5 JE 41cd3b |
0x41ccf7 SAL $0x3,%RDX |
0x41ccfb MOV %RAX,%RDI |
0x41ccfe XOR %ESI,%ESI |
0x41cd00 MOV %R8D,-0x58(%RBP) |
0x41cd04 MOV %R12,-0x68(%RBP) |
0x41cd08 MOV %RDX,%R12 |
0x41cd0b CALL 47ebf0 <_intel_fast_memset> |
0x41cd10 MOV %R14,%RDI |
0x41cd13 XOR %ESI,%ESI |
0x41cd15 MOV %R12,%RDX |
0x41cd18 CALL 47ebf0 <_intel_fast_memset> |
0x41cd1d MOV -0x50(%RBP),%RDI |
0x41cd21 XOR %ESI,%ESI |
0x41cd23 MOV %R12,%RDX |
0x41cd26 CALL 47ebf0 <_intel_fast_memset> |
0x41cd2b MOV -0x58(%RBP),%R8D |
0x41cd2f MOV -0x50(%RBP),%R10 |
0x41cd33 MOV -0x68(%RBP),%R12 |
0x41cd37 MOV -0x40(%RBP),%RDI |
0x41cd3b TEST %R13,%R13 |
0x41cd3e MOV -0x70(%RBP),%R13D |
0x41cd42 JE 41cdd9 |
0x41cd48 MOV 0x5c0(%R15),%RAX |
0x41cd4f MOV -0x88(%RBP),%RCX |
0x41cd56 IMUL (%RAX,%RCX,4),%R8D |
0x41cd5b MOVSXD %R8D,%RAX |
0x41cd5e SAL $0x3,%RAX |
0x41cd62 MOV %RAX,-0x58(%RBP) |
0x41cd66 XOR %EAX,%EAX |
0x41cd68 NOPL (%RAX,%RAX,1) |
(248) 0x41cd70 MOV 0x200(%RDI),%RCX |
(248) 0x41cd77 ADD -0x58(%RBP),%RCX |
(248) 0x41cd7b MOV (%RCX,%RAX,8),%RDI |
(248) 0x41cd7f MOV 0xa98(%R15),%RCX |
(248) 0x41cd86 LEA 0x1(%RAX),%R15 |
(248) 0x41cd8a MOV (%RCX,%RAX,4),%EDX |
(248) 0x41cd8d MOV 0x4(%RCX,%RAX,4),%ECX |
(248) 0x41cd91 CMP %EBX,%ECX |
(248) 0x41cd93 CMOVGE %EBX,%ECX |
(248) 0x41cd96 MOV %R13D,%ESI |
(248) 0x41cd99 MOV %R12,%R8 |
(248) 0x41cd9c MOV -0x48(%RBP),%R9 |
(248) 0x41cda0 MOV -0x40(%RBP),%RAX |
(248) 0x41cda4 PUSHQ 0x1e8(%RAX) |
(248) 0x41cdaa MOV -0x40(%RBP),%RAX |
(248) 0x41cdae PUSHQ 0x1d0(%RAX) |
(248) 0x41cdb4 PUSH %R10 |
(248) 0x41cdb6 PUSH %R14 |
(248) 0x41cdb8 CALL 41aa40 <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi> |
(248) 0x41cdbd MOV -0x50(%RBP),%R10 |
(248) 0x41cdc1 MOV -0x40(%RBP),%RDI |
(248) 0x41cdc5 ADD $0x20,%RSP |
(248) 0x41cdc9 MOV %R15,%RAX |
(248) 0x41cdcc CMP %R15,0xa0(%RDI) |
(248) 0x41cdd3 MOV -0x60(%RBP),%R15 |
(248) 0x41cdd7 JA 41cd70 |
0x41cdd9 MOV -0x78(%RBP),%RAX |
0x41cddd MOV 0x50(%RAX),%RDX |
0x41cde1 MOV 0x90(%RDI),%RBX |
0x41cde8 TEST %RBX,%RBX |
0x41cdeb MOV %RBX,-0x60(%RBP) |
0x41cdef JE 41d08c |
0x41cdf5 MOV %RDX,-0x80(%RBP) |
0x41cdf9 MOV 0x140(%RDI),%R10 |
0x41ce00 MOV 0x188(%RDI),%R9 |
0x41ce07 MOV 0x158(%RDI),%RCX |
0x41ce0e MOV 0xd8(%RDI),%R12 |
0x41ce15 MOV 0x128(%RDI),%RSI |
0x41ce1c LEA (%R10,%RBX,8),%RAX |
0x41ce20 ADD $-0x8,%RAX |
0x41ce24 CMP %R12,%RAX |
0x41ce27 SETAEB -0x70(%RBP) |
0x41ce2b LEA (%R12,%RBX,8),%R11 |
0x41ce2f ADD $-0x8,%R11 |
0x41ce33 CMP %R10,%R11 |
0x41ce36 SETAEB -0x35(%RBP) |
0x41ce3a CMP %RSI,%RAX |
0x41ce3d SETBB -0x58(%RBP) |
0x41ce41 LEA (%RSI,%RBX,8),%R14 |
0x41ce45 ADD $-0x8,%R14 |
0x41ce49 CMP %R10,%R14 |
0x41ce4c SETBB -0x34(%RBP) |
0x41ce50 LEA (%R9,%RBX,8),%RAX |
0x41ce54 ADD $-0x8,%RAX |
0x41ce58 CMP %R12,%RAX |
0x41ce5b SETB %R13B |
0x41ce5f CMP %R9,%R11 |
0x41ce62 SETBB -0x33(%RBP) |
0x41ce66 CMP %RSI,%RAX |
0x41ce69 SETBB -0x68(%RBP) |
0x41ce6d CMP %R9,%R14 |
0x41ce70 SETBB -0x37(%RBP) |
0x41ce74 LEA (%RCX,%RBX,8),%RAX |
0x41ce78 ADD $-0x8,%RAX |
0x41ce7c CMP %R12,%RAX |
0x41ce7f SETB %DL |
0x41ce82 CMP %RCX,%R11 |
0x41ce85 SETBB -0x36(%RBP) |
0x41ce89 CMP %RSI,%RAX |
0x41ce8c SETBB -0x50(%RBP) |
0x41ce90 CMP %RCX,%R14 |
0x41ce93 SETBB -0x98(%RBP) |
0x41ce9a MOV 0x170(%RDI),%R8 |
0x41cea1 LEA (%R8,%RBX,8),%RAX |
0x41cea5 ADD $-0x8,%RAX |
0x41cea9 CMP %R12,%RAX |
0x41ceac SETBB -0x48(%RBP) |
0x41ceb0 CMP %R8,%R11 |
0x41ceb3 SETBB -0x90(%RBP) |
0x41ceba CMP %RSI,%RAX |
0x41cebd SETBB -0x32(%RBP) |
0x41cec1 CMP %R8,%R14 |
0x41cec4 SETBB -0x30(%RBP) |
0x41cec8 MOV 0x1b8(%RDI),%R15 |
0x41cecf LEA (%R15,%RBX,8),%RAX |
0x41ced3 ADD $-0x8,%RAX |
0x41ced7 CMP %R12,%RAX |
0x41ceda SETBB -0x31(%RBP) |
0x41cede CMP %R15,%R11 |
0x41cee1 SETBB -0x2f(%RBP) |
0x41cee5 CMP %RSI,%RAX |
0x41cee8 SETBB -0x2e(%RBP) |
0x41ceec CMP %R15,%R14 |
0x41ceef MOV 0x1a0(%RDI),%RDI |
0x41cef6 LEA -0x8(%RDI,%RBX,8),%RAX |
0x41cefb SETBB -0x2d(%RBP) |
0x41ceff CMP %R12,%RAX |
0x41cf02 SETBB -0x2c(%RBP) |
0x41cf06 CMP %RDI,%R11 |
0x41cf09 SETBB -0x2b(%RBP) |
0x41cf0d CMP %RSI,%RAX |
0x41cf10 SETB %BL |
0x41cf13 CMP %RDI,%R14 |
0x41cf16 SETBB -0x2a(%RBP) |
0x41cf1a CMP %RSI,%R11 |
0x41cf1d SETBB -0x29(%RBP) |
0x41cf21 CMP %R12,%R14 |
0x41cf24 SETB %R11B |
0x41cf28 MOVZX -0x35(%RBP),%EAX |
0x41cf2c TEST %AL,-0x70(%RBP) |
0x41cf2f JNE 41d09d |
0x41cf35 MOVZX -0x34(%RBP),%EAX |
0x41cf39 OR %AL,-0x58(%RBP) |
0x41cf3c JE 41d09d |
0x41cf42 OR -0x33(%RBP),%R13B |
0x41cf46 JE 41d09d |
0x41cf4c MOVZX -0x37(%RBP),%EAX |
0x41cf50 OR %AL,-0x68(%RBP) |
0x41cf53 JE 41d09d |
0x41cf59 OR -0x36(%RBP),%DL |
0x41cf5c JE 41d09d |
0x41cf62 MOVZX -0x98(%RBP),%EDX |
0x41cf69 OR %DL,-0x50(%RBP) |
0x41cf6c JE 41d09d |
0x41cf72 MOVZX -0x90(%RBP),%EDX |
0x41cf79 OR %DL,-0x48(%RBP) |
0x41cf7c JE 41d09d |
0x41cf82 MOVZX -0x30(%RBP),%EDX |
0x41cf86 OR %DL,-0x32(%RBP) |
0x41cf89 JE 41d09d |
0x41cf8f MOVZX -0x2f(%RBP),%EDX |
0x41cf93 OR %DL,-0x31(%RBP) |
0x41cf96 JE 41d09d |
0x41cf9c MOVZX -0x2d(%RBP),%EDX |
0x41cfa0 OR %DL,-0x2e(%RBP) |
0x41cfa3 JE 41d09d |
0x41cfa9 MOVZX -0x2b(%RBP),%EDX |
0x41cfad OR %DL,-0x2c(%RBP) |
0x41cfb0 JE 41d09d |
0x41cfb6 OR -0x2a(%RBP),%BL |
0x41cfb9 JE 41d09d |
0x41cfbf OR %R11B,-0x29(%RBP) |
0x41cfc3 JE 41d09d |
0x41cfc9 MOV -0x60(%RBP),%RBX |
0x41cfcd VPBROADCASTQ %RBX,%ZMM1 |
0x41cfd3 MOV %RBX,%R11 |
0x41cfd6 AND $-0x8,%R11 |
0x41cfda JE 41d10a |
0x41cfe0 LEA -0x1(%R11),%RDX |
0x41cfe4 VXORPD %XMM0,%XMM0,%XMM0 |
0x41cfe8 XOR %EAX,%EAX |
0x41cfea VBROADCASTSD 0x73f74(%RIP),%ZMM2 |
0x41cff4 NOPW %CS:(%RAX,%RAX,1) |
(247) 0x41d000 VMOVUPD (%R10,%RAX,8),%ZMM3 |
(247) 0x41d007 VSUBPD (%R9,%RAX,8),%ZMM3,%ZMM3 |
(247) 0x41d00e VMOVUPD (%RCX,%RAX,8),%ZMM4 |
(247) 0x41d015 VFMADD213PD (%R8,%RAX,8),%ZMM2,%ZMM4 |
(247) 0x41d01c VMOVUPD (%R15,%RAX,8),%ZMM5 |
(247) 0x41d023 VADDPD (%R12,%RAX,8),%ZMM3,%ZMM3 |
(247) 0x41d02a VMOVUPD (%RDI,%RAX,8),%ZMM6 |
(247) 0x41d031 VMOVUPD %ZMM3,(%R12,%RAX,8) |
(247) 0x41d038 VSUBPD %ZMM4,%ZMM5,%ZMM3 |
(247) 0x41d03e VFMADD213PD (%RSI,%RAX,8),%ZMM2,%ZMM6 |
(247) 0x41d045 VADDPD %ZMM3,%ZMM6,%ZMM3 |
(247) 0x41d04b VMOVUPD %ZMM3,(%RSI,%RAX,8) |
(247) 0x41d052 VSUBPD %ZMM4,%ZMM0,%ZMM0 |
(247) 0x41d058 ADD $0x8,%RAX |
(247) 0x41d05c CMP %RDX,%RAX |
(247) 0x41d05f JLE 41d000 |
0x41d061 VEXTRACTF64X4 $0x1,%ZMM0,%YMM2 |
0x41d068 VADDPD %ZMM2,%ZMM0,%ZMM0 |
0x41d06e VEXTRACTF128 $0x1,%YMM0,%XMM2 |
0x41d074 VADDPD %XMM2,%XMM0,%XMM0 |
0x41d078 VPERMILPD $0x1,%XMM0,%XMM2 |
0x41d07e VADDSD %XMM2,%XMM0,%XMM13 |
0x41d082 CMP %R11,%RBX |
0x41d085 JE 41d0fd |
0x41d087 JMP 41d112 |
0x41d08c MOV 0x158(%RDI),%RCX |
0x41d093 VXORPD %XMM13,%XMM13,%XMM13 |
0x41d098 JMP 41d1e4 |
0x41d09d VXORPD %XMM13,%XMM13,%XMM13 |
0x41d0a2 XOR %EAX,%EAX |
0x41d0a4 VMOVSD 0x73ebc(%RIP),%XMM1 |
0x41d0ac MOV -0x60(%RBP),%RBX |
(246) 0x41d0b0 VMOVSD (%R10,%RAX,8),%XMM2 |
(246) 0x41d0b6 VSUBSD (%R9,%RAX,8),%XMM2,%XMM2 |
(246) 0x41d0bc VMOVSD (%RCX,%RAX,8),%XMM3 |
(246) 0x41d0c1 VFMADD213SD (%R8,%RAX,8),%XMM1,%XMM3 |
(246) 0x41d0c7 VMOVSD (%R15,%RAX,8),%XMM4 |
(246) 0x41d0cd VADDSD (%R12,%RAX,8),%XMM2,%XMM2 |
(246) 0x41d0d3 VMOVSD (%RDI,%RAX,8),%XMM5 |
(246) 0x41d0d8 VMOVSD %XMM2,(%R12,%RAX,8) |
(246) 0x41d0de VSUBSD %XMM3,%XMM4,%XMM2 |
(246) 0x41d0e2 VFMADD213SD (%RSI,%RAX,8),%XMM1,%XMM5 |
(246) 0x41d0e8 VADDSD %XMM2,%XMM5,%XMM2 |
(246) 0x41d0ec VMOVSD %XMM2,(%RSI,%RAX,8) |
(246) 0x41d0f1 VSUBSD %XMM3,%XMM13,%XMM13 |
(246) 0x41d0f5 INC %RAX |
(246) 0x41d0f8 CMP %RAX,%RBX |
(246) 0x41d0fb JNE 41d0b0 |
0x41d0fd MOV -0x40(%RBP),%RDI |
0x41d101 MOV -0x80(%RBP),%RDX |
0x41d105 JMP 41d1e4 |
0x41d10a VXORPD %XMM13,%XMM13,%XMM13 |
0x41d10f XOR %R11D,%R11D |
0x41d112 MOV -0x80(%RBP),%RDX |
0x41d116 VPBROADCASTQ %R11,%ZMM2 |
0x41d11c VPORQ 0x7281a(%RIP),%ZMM2,%ZMM2 |
0x41d126 VPCMPLTUQ %ZMM1,%ZMM2,%K1 |
0x41d12d VMOVUPD (%R10,%R11,8),%ZMM1{%K1}{z} |
0x41d134 VMOVUPD (%R9,%R11,8),%ZMM2{%K1}{z} |
0x41d13b VSUBPD %ZMM2,%ZMM1,%ZMM1 |
0x41d141 VMOVUPD (%RCX,%R11,8),%ZMM2{%K1}{z} |
0x41d148 VMOVUPD (%R8,%R11,8),%ZMM3{%K1}{z} |
0x41d14f VFMADD231PD 0x73e0f(%RIP){1to8},%ZMM2,%ZMM3 |
0x41d159 VBROADCASTSD 0x73e0d(%RIP),%ZMM2 |
0x41d163 VBLENDMPD %ZMM3,%ZMM2,%ZMM3{%K1} |
0x41d169 VMOVUPD (%R15,%R11,8),%ZMM4{%K1}{z} |
0x41d170 VMOVUPD (%RDI,%R11,8),%ZMM5{%K1}{z} |
0x41d177 VADDPD %ZMM5,%ZMM5,%ZMM2{%K1} |
0x41d17d VMOVUPD (%R12,%R11,8),%ZMM5{%K1}{z} |
0x41d184 VADDPD %ZMM5,%ZMM1,%ZMM1 |
0x41d18a VMOVUPD %ZMM1,(%R12,%R11,8){%K1} |
0x41d191 VSUBPD %ZMM3,%ZMM4,%ZMM1 |
0x41d197 VMOVUPD (%RSI,%R11,8),%ZMM4{%K1}{z} |
0x41d19e VADDPD %ZMM4,%ZMM2,%ZMM2 |
0x41d1a4 VADDPD %ZMM2,%ZMM1,%ZMM1 |
0x41d1aa VMOVUPD %ZMM1,(%RSI,%R11,8){%K1} |
0x41d1b1 VXORPD 0x70ec5(%RIP){1to8},%ZMM3,%ZMM1{%K1}{z} |
0x41d1bb VEXTRACTF64X4 $0x1,%ZMM1,%YMM2 |
0x41d1c2 VADDPD %ZMM2,%ZMM1,%ZMM1 |
0x41d1c8 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
0x41d1ce VADDPD %XMM2,%XMM1,%XMM1 |
0x41d1d2 VPERMILPD $0x1,%XMM1,%XMM2 |
0x41d1d8 VADDSD %XMM2,%XMM1,%XMM1 |
0x41d1dc VADDSD %XMM1,%XMM13,%XMM13 |
0x41d1e0 MOV -0x40(%RBP),%RDI |
0x41d1e4 VXORPD %XMM1,%XMM1,%XMM1 |
0x41d1e8 VMOVUPD %XMM1,-0xb0(%RBP) |
0x41d1f0 MOVQ $0,-0xa0(%RBP) |
0x41d1fb MOV -0x78(%RBP),%RAX |
0x41d1ff MOV 0x88(%RAX),%R8 |
0x41d206 MOV 0x98(%RAX),%R10 |
0x41d20d MOV -0x88(%RBP),%RAX |
0x41d214 LEA (%RAX,%RAX,4),%RAX |
0x41d218 MOV 0x8(%RDX,%RAX,8),%R9 |
0x41d21d MOV 0x18(%RDX,%RAX,8),%R11 |
0x41d222 MOV 0x1a0(%RDI),%RSI |
0x41d229 MOV 0xf0(%RDI),%RAX |
0x41d230 MOV 0x100(%RDI),%R13 |
0x41d237 MOV %RBX,%R12 |
0x41d23a AND $-0x8,%R12 |
0x41d23e LEA -0x1(%R12),%RDX |
0x41d243 VPBROADCASTQ %RBX,%ZMM12 |
0x41d249 MOV %RAX,-0x48(%RBP) |
0x41d24d LEA (,%RAX,8),%RDI |
0x41d255 MOV %R9,-0x68(%RBP) |
0x41d259 LEA (,%R9,8),%R9 |
0x41d261 MOV %R8,-0x58(%RBP) |
0x41d265 LEA (,%R8,8),%RAX |
0x41d26d MOV %RAX,-0x50(%RBP) |
0x41d271 XOR %R8D,%R8D |
0x41d274 VMOVDQU64 0x726c2(%RIP),%ZMM8 |
0x41d27e MOV %R10,-0x70(%RBP) |
0x41d282 MOV %R11,-0x98(%RBP) |
0x41d289 MOV %R13,-0x78(%RBP) |
0x41d28d MOV %R12,-0x90(%RBP) |
0x41d294 JMP 41d3ac |
0x41d299 NOPL (%RAX) |
(244) 0x41d2a0 MOV -0x58(%RBP),%RBX |
(244) 0x41d2a4 IMUL %R8,%RBX |
(244) 0x41d2a8 MOV -0x68(%RBP),%R14 |
(244) 0x41d2ac IMUL %R8,%R14 |
(244) 0x41d2b0 MOV -0x48(%RBP),%R15 |
(244) 0x41d2b4 IMUL %R8,%R15 |
(244) 0x41d2b8 XOR %EAX,%EAX |
(244) 0x41d2ba VPBROADCASTQ %RAX,%ZMM9 |
(244) 0x41d2c0 VPORQ %ZMM8,%ZMM9,%ZMM9 |
(244) 0x41d2c6 VPCMPLTUQ %ZMM12,%ZMM9,%K1 |
(244) 0x41d2cd ADD %RAX,%RBX |
(244) 0x41d2d0 MOV %R9,%R12 |
(244) 0x41d2d3 MOV %RDI,%R9 |
(244) 0x41d2d6 MOV -0x70(%RBP),%RDI |
(244) 0x41d2da VMOVUPD (%RDI,%RBX,8),%ZMM9{%K1}{z} |
(244) 0x41d2e1 VMOVAPD %ZMM9,%ZMM7{%K1} |
(244) 0x41d2e7 VMOVUPD (%RCX,%RAX,8),%ZMM9{%K1}{z} |
(244) 0x41d2ee VMOVAPD %ZMM9,%ZMM6{%K1} |
(244) 0x41d2f4 VMULPD %ZMM6,%ZMM7,%ZMM9 |
(244) 0x41d2fa ADD %RAX,%R14 |
(244) 0x41d2fd MOV -0x98(%RBP),%RDI |
(244) 0x41d304 VMOVUPD (%RDI,%R14,8),%ZMM10{%K1}{z} |
(244) 0x41d30b MOV %R9,%RDI |
(244) 0x41d30e MOV %R12,%R9 |
(244) 0x41d311 MOV -0x90(%RBP),%R12 |
(244) 0x41d318 VMOVUPD (%RSI,%RAX,8),%ZMM11{%K1}{z} |
(244) 0x41d31f VMOVAPD %ZMM10,%ZMM5{%K1} |
(244) 0x41d325 VMOVAPD %ZMM11,%ZMM4{%K1} |
(244) 0x41d32b VMOVAPD %ZMM4,%ZMM10 |
(244) 0x41d331 VFMSUB213PD %ZMM9,%ZMM5,%ZMM10 |
(244) 0x41d337 ADD %RAX,%R15 |
(244) 0x41d33a MOV -0x78(%RBP),%RAX |
(244) 0x41d33e VMOVUPD (%RAX,%R15,8),%ZMM11{%K1}{z} |
(244) 0x41d345 VMOVAPD %ZMM11,%ZMM3{%K1} |
(244) 0x41d34b VADDPD %ZMM10,%ZMM3,%ZMM10 |
(244) 0x41d351 VMOVUPD %ZMM10,(%RAX,%R15,8){%K1} |
(244) 0x41d358 VMOVAPD %ZMM9,%ZMM9{%K1}{z} |
(244) 0x41d35e VEXTRACTF64X4 $0x1,%ZMM9,%YMM10 |
(244) 0x41d365 VADDPD %ZMM10,%ZMM9,%ZMM9 |
(244) 0x41d36b VEXTRACTF128 $0x1,%YMM9,%XMM1 |
(244) 0x41d371 VADDPD %XMM1,%XMM9,%XMM1 |
(244) 0x41d375 VPERMILPD $0x1,%XMM1,%XMM0 |
(244) 0x41d37b VADDSD %XMM0,%XMM1,%XMM0 |
(244) 0x41d37f VADDSD %XMM0,%XMM2,%XMM2 |
(244) 0x41d383 VMOVSD %XMM2,-0xb0(%RBP,%R8,8) |
(244) 0x41d38d LEA 0x1(%R8),%RAX |
(244) 0x41d391 ADD %RDI,%R13 |
(244) 0x41d394 ADD %R9,%R11 |
(244) 0x41d397 ADD -0x50(%RBP),%R10 |
(244) 0x41d39b CMP $0x2,%R8 |
(244) 0x41d39f MOV %RAX,%R8 |
(244) 0x41d3a2 MOV -0x60(%RBP),%RBX |
(244) 0x41d3a6 JE 41d468 |
(244) 0x41d3ac VMOVSD -0xb0(%RBP,%R8,8),%XMM2 |
(244) 0x41d3b6 TEST %RBX,%RBX |
(244) 0x41d3b9 JE 41d383 |
(244) 0x41d3bb TEST %R12,%R12 |
(244) 0x41d3be JE 41d2a0 |
(244) 0x41d3c4 MOV -0x58(%RBP),%RBX |
(244) 0x41d3c8 IMUL %R8,%RBX |
(244) 0x41d3cc MOV -0x68(%RBP),%R14 |
(244) 0x41d3d0 IMUL %R8,%R14 |
(244) 0x41d3d4 MOV -0x48(%RBP),%R15 |
(244) 0x41d3d8 IMUL %R8,%R15 |
(244) 0x41d3dc VXORPD %XMM9,%XMM9,%XMM9 |
(244) 0x41d3e1 XOR %EAX,%EAX |
(244) 0x41d3e3 NOPW %CS:(%RAX,%RAX,1) |
(245) 0x41d3f0 VMOVUPD (%R10,%RAX,8),%ZMM0 |
(245) 0x41d3f7 VMOVUPD (%RCX,%RAX,8),%ZMM1 |
(245) 0x41d3fe VMOVUPD (%RSI,%RAX,8),%ZMM10 |
(245) 0x41d405 VMOVUPD (%R13,%RAX,8),%ZMM11 |
(245) 0x41d40d VFMSUB231PD %ZMM0,%ZMM1,%ZMM11 |
(245) 0x41d413 VFMSUB231PD (%R11,%RAX,8),%ZMM10,%ZMM11 |
(245) 0x41d41a VMOVUPD %ZMM11,(%R13,%RAX,8) |
(245) 0x41d422 VFMADD231PD %ZMM0,%ZMM1,%ZMM9 |
(245) 0x41d428 ADD $0x8,%RAX |
(245) 0x41d42c CMP %RDX,%RAX |
(245) 0x41d42f JLE 41d3f0 |
(244) 0x41d431 VEXTRACTF64X4 $0x1,%ZMM9,%YMM0 |
(244) 0x41d438 VADDPD %ZMM0,%ZMM9,%ZMM0 |
(244) 0x41d43e VEXTRACTF128 $0x1,%YMM0,%XMM1 |
(244) 0x41d444 VADDPD %XMM1,%XMM0,%XMM0 |
(244) 0x41d448 VPERMILPD $0x1,%XMM0,%XMM1 |
(244) 0x41d44e VADDSD %XMM1,%XMM0,%XMM0 |
(244) 0x41d452 VADDSD %XMM0,%XMM2,%XMM2 |
(244) 0x41d456 MOV %R12,%RAX |
(244) 0x41d459 CMP %R12,-0x60(%RBP) |
(244) 0x41d45d JNE 41d2ba |
(244) 0x41d463 JMP 41d383 |
0x41d468 MOV -0x40(%RBP),%RDX |
0x41d46c MOV 0xd8(%RDX),%RAX |
0x41d473 MOV -0x88(%RBP),%RCX |
0x41d47a VMOVSD (%RAX,%RCX,8),%XMM0 |
0x41d47f VMOVSD 0x138(%RDX),%XMM1 |
0x41d487 VSUBSD %XMM1,%XMM0,%XMM0 |
0x41d48b VADDSD 0x10(%RDX),%XMM0,%XMM0 |
0x41d490 VMOVSD %XMM0,0x10(%RDX) |
0x41d495 VMOVSD %XMM1,(%RAX,%RCX,8) |
0x41d49a VMOVSD -0xb0(%RBP),%XMM0 |
0x41d4a2 VMOVSD -0xa8(%RBP),%XMM1 |
0x41d4aa MOV -0x78(%RBP),%RDI |
0x41d4ae VMOVSD %XMM0,(%RDI,%RCX,8) |
0x41d4b3 MOV -0x48(%RBP),%RSI |
0x41d4b7 LEA (%RCX,%RSI,1),%RAX |
0x41d4bb VMOVSD %XMM1,(%RDI,%RAX,8) |
0x41d4c0 VMOVSD -0xa0(%RBP),%XMM0 |
0x41d4c8 LEA (%RCX,%RSI,2),%RAX |
0x41d4cc VMOVSD %XMM0,(%RDI,%RAX,8) |
0x41d4d1 MOV 0x128(%RDX),%RAX |
0x41d4d8 VMOVSD %XMM13,(%RAX,%RCX,8) |
0x41d4dd ADD $0x88,%RSP |
0x41d4e4 POP %RBX |
0x41d4e5 POP %R12 |
0x41d4e7 POP %R13 |
0x41d4e9 POP %R14 |
0x41d4eb POP %R15 |
0x41d4ed POP %RBP |
0x41d4ee VZEROUPPER |
0x41d4f1 RET |
0x41d4f2 NOPW %CS:(%RAX,%RAX,1) |
0x41d4fc NOPL (%RAX) |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►99.21+ | qmcplusplus::WaveFunction::acc[...] | NewTimer.h:249 | exec |
○ | main.extracted.104 | stl_vector.h:1126 | exec |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_fork_call | libiomp5.so | |
○ | __kmpc_fork_call | libiomp5.so | |
○ | main | miniqmc.cpp:404 | exec |
○ | __libc_init_first | libc.so.6 |
Path / |
Source file and lines | TwoBodyJastrowRef.h:259-353 |
Module | exec |
nb instructions | 361 |
nb uops | 400 |
loop length | 1664 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 4 |
used ymm registers | 3 |
used zmm registers | 8 |
nb stack references | 30 |
micro-operation queue | 100.00 cycles |
front end | 100.00 cycles |
| | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 |
---|---|---|---|---|---|---|---|---|
uops | 44.50 | 44.50 | 65.67 | 65.67 | 78.00 | 44.50 | 44.50 | 65.67 |
cycles | 44.50 | 44.50 | 65.67 | 65.67 | 78.00 | 44.50 | 44.50 | 65.67 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 98.12 |
Stall cycles | 0.00 |
Front-end | 100.00 |
Dispatch | 78.00 |
Overall L1 | 100.00 |
all | 5% |
load | 28% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 6% |
all | 64% |
load | 52% |
store | 33% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 66% |
fma | 100% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 86% |
all | 29% |
load | 46% |
store | 8% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 62% |
fma | 100% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 25% |
all | 15% |
load | 34% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 15% |
all | 50% |
load | 58% |
store | 33% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 60% |
fma | 100% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 36% |
all | 29% |
load | 52% |
store | 17% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 57% |
fma | 100% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 20% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSH %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
SUB $0x88,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %EDX,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RSI,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV 0xa10(%RSI),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOVSXD %R14D,%RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV 0x18(%RDX),%RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RCX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RCX,-0x88(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
IMUL %RCX,%RBX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
SAL $0x3,%RBX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
MOV %RDX,-0x78(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
ADD 0x40(%RDX),%RBX | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
MOV 0x90(%RDI),%R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x188(%RDI),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x1a0(%RDI),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x1b8(%RDI),%R11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
TEST %R12D,%R12D | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RDI,-0x40(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R10,-0x50(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R11,-0x48(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
JLE 41cbeb | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV %R12D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
TEST %R13,%R13 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 41cbeb | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
SAL $0x3,%R13 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
MOV %RSI,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RSI,-0x60(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 47ebf0 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV -0x50(%RBP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 47ebf0 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV -0x48(%RBP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 47ebf0 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV -0x60(%RBP),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x48(%RBP),%R11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x50(%RBP),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x40(%RBP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %R14D,-0x70(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0xa0(%RDI),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
TEST %RAX,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %R15,-0x60(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
JE 41ccb0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV 0x5c0(%R15),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x88(%RBP),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
IMUL (%RCX,%RDX,4),%EAX | 1 | 0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 1 |
CLTQ | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
SAL $0x3,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
MOV %RAX,-0x58(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RBX,-0x68(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV -0x70(%RBP),%EBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RSI,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CMPL $0,0xc(%RDI) | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
JNE 41cdd9 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
JMP 41ccc0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
XOR %R13D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CMPL $0,0xc(%RDI) | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
JNE 41cdd9 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV -0x78(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x68(%RAX),%R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x90(%RDI),%RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x140(%RDI),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x158(%RDI),%R14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x170(%RDI),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
TEST %EBX,%EBX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R10,-0x50(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
JLE 41cd3b | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV %EBX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
TEST %RDX,%RDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 41cd3b | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R8D,-0x58(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R12,-0x68(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RDX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 47ebf0 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R12,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 47ebf0 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV -0x50(%RBP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R12,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 47ebf0 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV -0x58(%RBP),%R8D | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x50(%RBP),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x68(%RBP),%R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x40(%RBP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
TEST %R13,%R13 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV -0x70(%RBP),%R13D | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
JE 41cdd9 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV 0x5c0(%R15),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x88(%RBP),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
IMUL (%RAX,%RCX,4),%R8D | 1 | 0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 1 |
MOVSXD %R8D,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SAL $0x3,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
MOV %RAX,-0x58(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV -0x78(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x50(%RAX),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x90(%RDI),%RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
TEST %RBX,%RBX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RBX,-0x60(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
JE 41d08c | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV %RDX,-0x80(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x140(%RDI),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x188(%RDI),%R9 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x158(%RDI),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0xd8(%RDI),%R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x128(%RDI),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%R10,%RBX,8),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $-0x8,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMP %R12,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETAEB -0x70(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
LEA (%R12,%RBX,8),%R11 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $-0x8,%R11 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMP %R10,%R11 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETAEB -0x35(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
CMP %RSI,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x58(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
LEA (%RSI,%RBX,8),%R14 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $-0x8,%R14 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMP %R10,%R14 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x34(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
LEA (%R9,%RBX,8),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $-0x8,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMP %R12,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETB %R13B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
CMP %R9,%R11 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x33(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
CMP %RSI,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x68(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
CMP %R9,%R14 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x37(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
LEA (%RCX,%RBX,8),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $-0x8,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMP %R12,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETB %DL | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
CMP %RCX,%R11 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x36(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
CMP %RSI,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x50(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
CMP %RCX,%R14 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x98(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
MOV 0x170(%RDI),%R8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%R8,%RBX,8),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $-0x8,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMP %R12,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x48(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
CMP %R8,%R11 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x90(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
CMP %RSI,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x32(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
CMP %R8,%R14 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x30(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
MOV 0x1b8(%RDI),%R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%R15,%RBX,8),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $-0x8,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMP %R12,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x31(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
CMP %R15,%R11 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x2f(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
CMP %RSI,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x2e(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
CMP %R15,%R14 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV 0x1a0(%RDI),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA -0x8(%RDI,%RBX,8),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
SETBB -0x2d(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
CMP %R12,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x2c(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
CMP %RDI,%R11 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x2b(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
CMP %RSI,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETB %BL | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
CMP %RDI,%R14 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x2a(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
CMP %RSI,%R11 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x29(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
CMP %R12,%R14 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETB %R11B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
MOVZX -0x35(%RBP),%EAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
TEST %AL,-0x70(%RBP) | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
JNE 41d09d | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOVZX -0x34(%RBP),%EAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
OR %AL,-0x58(%RBP) | 2 | 0.25 | 0.25 | 0.83 | 0.83 | 1 | 0.25 | 0.25 | 0.33 | 5 | 1 |
JE 41d09d | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
OR -0x33(%RBP),%R13B | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
JE 41d09d | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOVZX -0x37(%RBP),%EAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
OR %AL,-0x68(%RBP) | 2 | 0.25 | 0.25 | 0.83 | 0.83 | 1 | 0.25 | 0.25 | 0.33 | 5 | 1 |
JE 41d09d | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
OR -0x36(%RBP),%DL | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
JE 41d09d | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOVZX -0x98(%RBP),%EDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
OR %DL,-0x50(%RBP) | 2 | 0.25 | 0.25 | 0.83 | 0.83 | 1 | 0.25 | 0.25 | 0.33 | 5 | 1 |
JE 41d09d | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOVZX -0x90(%RBP),%EDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
OR %DL,-0x48(%RBP) | 2 | 0.25 | 0.25 | 0.83 | 0.83 | 1 | 0.25 | 0.25 | 0.33 | 5 | 1 |
JE 41d09d | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOVZX -0x30(%RBP),%EDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
OR %DL,-0x32(%RBP) | 2 | 0.25 | 0.25 | 0.83 | 0.83 | 1 | 0.25 | 0.25 | 0.33 | 5 | 1 |
JE 41d09d | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOVZX -0x2f(%RBP),%EDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
OR %DL,-0x31(%RBP) | 2 | 0.25 | 0.25 | 0.83 | 0.83 | 1 | 0.25 | 0.25 | 0.33 | 5 | 1 |
JE 41d09d | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOVZX -0x2d(%RBP),%EDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
OR %DL,-0x2e(%RBP) | 2 | 0.25 | 0.25 | 0.83 | 0.83 | 1 | 0.25 | 0.25 | 0.33 | 5 | 1 |
JE 41d09d | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOVZX -0x2b(%RBP),%EDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
OR %DL,-0x2c(%RBP) | 2 | 0.25 | 0.25 | 0.83 | 0.83 | 1 | 0.25 | 0.25 | 0.33 | 5 | 1 |
JE 41d09d | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
OR -0x2a(%RBP),%BL | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
JE 41d09d | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
OR %R11B,-0x29(%RBP) | 2 | 0.25 | 0.25 | 0.83 | 0.83 | 1 | 0.25 | 0.25 | 0.33 | 5 | 1 |
JE 41d09d | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV -0x60(%RBP),%RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VPBROADCASTQ %RBX,%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
MOV %RBX,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
AND $-0x8,%R11 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 41d10a | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
LEA -0x1(%R11),%RDX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD 0x73f74(%RIP),%ZMM2 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VEXTRACTF64X4 $0x1,%ZMM0,%YMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM2,%ZMM0,%ZMM0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VEXTRACTF128 $0x1,%YMM0,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %XMM2,%XMM0,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VPERMILPD $0x1,%XMM0,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VADDSD %XMM2,%XMM0,%XMM13 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CMP %R11,%RBX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 41d0fd | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
JMP 41d112 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
MOV 0x158(%RDI),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VXORPD %XMM13,%XMM13,%XMM13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
JMP 41d1e4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
VXORPD %XMM13,%XMM13,%XMM13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVSD 0x73ebc(%RIP),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x60(%RBP),%RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x40(%RBP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x80(%RBP),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
JMP 41d1e4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
VXORPD %XMM13,%XMM13,%XMM13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %R11D,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV -0x80(%RBP),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VPBROADCASTQ %R11,%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VPORQ 0x7281a(%RIP),%ZMM2,%ZMM2 | 1 | 0.50 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
VPCMPLTUQ %ZMM1,%ZMM2,%K1 | |||||||||||
VMOVUPD (%R10,%R11,8),%ZMM1{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD (%R9,%R11,8),%ZMM2{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VSUBPD %ZMM2,%ZMM1,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD (%RCX,%R11,8),%ZMM2{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD (%R8,%R11,8),%ZMM3{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VFMADD231PD 0x73e0f(%RIP){1to8},%ZMM2,%ZMM3 | 1 | 0.50 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD 0x73e0d(%RIP),%ZMM2 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VBLENDMPD %ZMM3,%ZMM2,%ZMM3{%K1} | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVUPD (%R15,%R11,8),%ZMM4{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD (%RDI,%R11,8),%ZMM5{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VADDPD %ZMM5,%ZMM5,%ZMM2{%K1} | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD (%R12,%R11,8),%ZMM5{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VADDPD %ZMM5,%ZMM1,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD %ZMM1,(%R12,%R11,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VSUBPD %ZMM3,%ZMM4,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD (%RSI,%R11,8),%ZMM4{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VADDPD %ZMM4,%ZMM2,%ZMM2 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VADDPD %ZMM2,%ZMM1,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD %ZMM1,(%RSI,%R11,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VXORPD 0x70ec5(%RIP){1to8},%ZMM3,%ZMM1{%K1}{z} | 1 | 0.50 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
VEXTRACTF64X4 $0x1,%ZMM1,%YMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM2,%ZMM1,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VEXTRACTF128 $0x1,%YMM1,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %XMM2,%XMM1,%XMM1 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VPERMILPD $0x1,%XMM1,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VADDSD %XMM2,%XMM1,%XMM1 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDSD %XMM1,%XMM13,%XMM13 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV -0x40(%RBP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVUPD %XMM1,-0xb0(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOVQ $0,-0xa0(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 2 | 1 |
MOV -0x78(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x88(%RAX),%R8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x98(%RAX),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x88(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%RAX,%RAX,4),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x8(%RDX,%RAX,8),%R9 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x18(%RDX,%RAX,8),%R11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x1a0(%RDI),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0xf0(%RDI),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x100(%RDI),%R13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RBX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
AND $-0x8,%R12 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
LEA -0x1(%R12),%RDX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ %RBX,%ZMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA (,%RAX,8),%RDI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,-0x68(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA (,%R9,8),%R9 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x58(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA (,%R8,8),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,-0x50(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVDQU64 0x726c2(%RIP),%ZMM8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
MOV %R10,-0x70(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R11,-0x98(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R13,-0x78(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R12,-0x90(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
JMP 41d3ac | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV -0x40(%RBP),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0xd8(%RDX),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x88(%RBP),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD (%RAX,%RCX,8),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x138(%RDX),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VSUBSD %XMM1,%XMM0,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDSD 0x10(%RDX),%XMM0,%XMM0 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM0,0x10(%RDX) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD %XMM1,(%RAX,%RCX,8) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD -0xb0(%RBP),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD -0xa8(%RBP),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x78(%RBP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD %XMM0,(%RDI,%RCX,8) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV -0x48(%RBP),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%RCX,%RSI,1),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD %XMM1,(%RDI,%RAX,8) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD -0xa0(%RBP),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%RCX,%RSI,2),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD %XMM0,(%RDI,%RAX,8) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x128(%RDX),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD %XMM13,(%RAX,%RCX,8) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
ADD $0x88,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %RBP | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
VZEROUPPER | 4 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 | 0 | 1 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
Source file and lines | TwoBodyJastrowRef.h:259-353 |
Module | exec |
nb instructions | 361 |
nb uops | 400 |
loop length | 1664 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 4 |
used ymm registers | 3 |
used zmm registers | 8 |
nb stack references | 30 |
micro-operation queue | 100.00 cycles |
front end | 100.00 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | |
---|---|---|---|---|---|---|---|---|
uops | 44.50 | 44.50 | 65.67 | 65.67 | 78.00 | 44.50 | 44.50 | 65.67 |
cycles | 44.50 | 44.50 | 65.67 | 65.67 | 78.00 | 44.50 | 44.50 | 65.67 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 98.12 |
Stall cycles | 0.00 |
Front-end | 100.00 |
Dispatch | 78.00 |
Overall L1 | 100.00 |
all | 5% |
load | 28% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 6% |
all | 64% |
load | 52% |
store | 33% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 66% |
fma | 100% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 86% |
all | 29% |
load | 46% |
store | 8% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 62% |
fma | 100% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 25% |
all | 15% |
load | 34% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 15% |
all | 50% |
load | 58% |
store | 33% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 60% |
fma | 100% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 36% |
all | 29% |
load | 52% |
store | 17% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 57% |
fma | 100% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 20% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSH %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
SUB $0x88,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %EDX,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RSI,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV 0xa10(%RSI),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOVSXD %R14D,%RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV 0x18(%RDX),%RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RCX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RCX,-0x88(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
IMUL %RCX,%RBX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
SAL $0x3,%RBX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
MOV %RDX,-0x78(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
ADD 0x40(%RDX),%RBX | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
MOV 0x90(%RDI),%R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x188(%RDI),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x1a0(%RDI),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x1b8(%RDI),%R11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
TEST %R12D,%R12D | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RDI,-0x40(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R10,-0x50(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R11,-0x48(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
JLE 41cbeb | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV %R12D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
TEST %R13,%R13 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 41cbeb | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
SAL $0x3,%R13 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
MOV %RSI,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RSI,-0x60(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 47ebf0 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV -0x50(%RBP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 47ebf0 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV -0x48(%RBP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 47ebf0 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV -0x60(%RBP),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x48(%RBP),%R11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x50(%RBP),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x40(%RBP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %R14D,-0x70(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0xa0(%RDI),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
TEST %RAX,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %R15,-0x60(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
JE 41ccb0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV 0x5c0(%R15),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x88(%RBP),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
IMUL (%RCX,%RDX,4),%EAX | 1 | 0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 1 |
CLTQ | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
SAL $0x3,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
MOV %RAX,-0x58(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RBX,-0x68(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV -0x70(%RBP),%EBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RSI,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CMPL $0,0xc(%RDI) | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
JNE 41cdd9 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
JMP 41ccc0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
XOR %R13D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CMPL $0,0xc(%RDI) | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
JNE 41cdd9 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV -0x78(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x68(%RAX),%R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x90(%RDI),%RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x140(%RDI),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x158(%RDI),%R14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x170(%RDI),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
TEST %EBX,%EBX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R10,-0x50(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
JLE 41cd3b | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV %EBX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
TEST %RDX,%RDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 41cd3b | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R8D,-0x58(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R12,-0x68(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RDX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 47ebf0 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R12,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 47ebf0 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV -0x50(%RBP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R12,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 47ebf0 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV -0x58(%RBP),%R8D | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x50(%RBP),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x68(%RBP),%R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x40(%RBP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
TEST %R13,%R13 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV -0x70(%RBP),%R13D | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
JE 41cdd9 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV 0x5c0(%R15),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x88(%RBP),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
IMUL (%RAX,%RCX,4),%R8D | 1 | 0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 1 |
MOVSXD %R8D,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SAL $0x3,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
MOV %RAX,-0x58(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV -0x78(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x50(%RAX),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x90(%RDI),%RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
TEST %RBX,%RBX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RBX,-0x60(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
JE 41d08c | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV %RDX,-0x80(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x140(%RDI),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x188(%RDI),%R9 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x158(%RDI),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0xd8(%RDI),%R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x128(%RDI),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%R10,%RBX,8),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $-0x8,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMP %R12,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETAEB -0x70(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
LEA (%R12,%RBX,8),%R11 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $-0x8,%R11 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMP %R10,%R11 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETAEB -0x35(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
CMP %RSI,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x58(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
LEA (%RSI,%RBX,8),%R14 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $-0x8,%R14 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMP %R10,%R14 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x34(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
LEA (%R9,%RBX,8),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $-0x8,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMP %R12,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETB %R13B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
CMP %R9,%R11 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x33(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
CMP %RSI,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x68(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
CMP %R9,%R14 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x37(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
LEA (%RCX,%RBX,8),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $-0x8,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMP %R12,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETB %DL | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
CMP %RCX,%R11 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x36(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
CMP %RSI,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x50(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
CMP %RCX,%R14 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x98(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
MOV 0x170(%RDI),%R8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%R8,%RBX,8),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $-0x8,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMP %R12,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x48(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
CMP %R8,%R11 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x90(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
CMP %RSI,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x32(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
CMP %R8,%R14 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x30(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
MOV 0x1b8(%RDI),%R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%R15,%RBX,8),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $-0x8,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMP %R12,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x31(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
CMP %R15,%R11 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x2f(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
CMP %RSI,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x2e(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
CMP %R15,%R14 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV 0x1a0(%RDI),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA -0x8(%RDI,%RBX,8),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
SETBB -0x2d(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
CMP %R12,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x2c(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
CMP %RDI,%R11 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x2b(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
CMP %RSI,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETB %BL | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
CMP %RDI,%R14 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x2a(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
CMP %RSI,%R11 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETBB -0x29(%RBP) | 2 | 0.50 | 0 | 0.33 | 0.33 | 1 | 0 | 0.50 | 0.33 | 1 | 1 |
CMP %R12,%R14 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETB %R11B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
MOVZX -0x35(%RBP),%EAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
TEST %AL,-0x70(%RBP) | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
JNE 41d09d | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOVZX -0x34(%RBP),%EAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
OR %AL,-0x58(%RBP) | 2 | 0.25 | 0.25 | 0.83 | 0.83 | 1 | 0.25 | 0.25 | 0.33 | 5 | 1 |
JE 41d09d | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
OR -0x33(%RBP),%R13B | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
JE 41d09d | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOVZX -0x37(%RBP),%EAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
OR %AL,-0x68(%RBP) | 2 | 0.25 | 0.25 | 0.83 | 0.83 | 1 | 0.25 | 0.25 | 0.33 | 5 | 1 |
JE 41d09d | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
OR -0x36(%RBP),%DL | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
JE 41d09d | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOVZX -0x98(%RBP),%EDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
OR %DL,-0x50(%RBP) | 2 | 0.25 | 0.25 | 0.83 | 0.83 | 1 | 0.25 | 0.25 | 0.33 | 5 | 1 |
JE 41d09d | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOVZX -0x90(%RBP),%EDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
OR %DL,-0x48(%RBP) | 2 | 0.25 | 0.25 | 0.83 | 0.83 | 1 | 0.25 | 0.25 | 0.33 | 5 | 1 |
JE 41d09d | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOVZX -0x30(%RBP),%EDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
OR %DL,-0x32(%RBP) | 2 | 0.25 | 0.25 | 0.83 | 0.83 | 1 | 0.25 | 0.25 | 0.33 | 5 | 1 |
JE 41d09d | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOVZX -0x2f(%RBP),%EDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
OR %DL,-0x31(%RBP) | 2 | 0.25 | 0.25 | 0.83 | 0.83 | 1 | 0.25 | 0.25 | 0.33 | 5 | 1 |
JE 41d09d | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOVZX -0x2d(%RBP),%EDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
OR %DL,-0x2e(%RBP) | 2 | 0.25 | 0.25 | 0.83 | 0.83 | 1 | 0.25 | 0.25 | 0.33 | 5 | 1 |
JE 41d09d | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOVZX -0x2b(%RBP),%EDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
OR %DL,-0x2c(%RBP) | 2 | 0.25 | 0.25 | 0.83 | 0.83 | 1 | 0.25 | 0.25 | 0.33 | 5 | 1 |
JE 41d09d | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
OR -0x2a(%RBP),%BL | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
JE 41d09d | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
OR %R11B,-0x29(%RBP) | 2 | 0.25 | 0.25 | 0.83 | 0.83 | 1 | 0.25 | 0.25 | 0.33 | 5 | 1 |
JE 41d09d | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV -0x60(%RBP),%RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VPBROADCASTQ %RBX,%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
MOV %RBX,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
AND $-0x8,%R11 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 41d10a | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
LEA -0x1(%R11),%RDX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD 0x73f74(%RIP),%ZMM2 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VEXTRACTF64X4 $0x1,%ZMM0,%YMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM2,%ZMM0,%ZMM0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VEXTRACTF128 $0x1,%YMM0,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %XMM2,%XMM0,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VPERMILPD $0x1,%XMM0,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VADDSD %XMM2,%XMM0,%XMM13 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CMP %R11,%RBX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 41d0fd | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
JMP 41d112 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
MOV 0x158(%RDI),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VXORPD %XMM13,%XMM13,%XMM13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
JMP 41d1e4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
VXORPD %XMM13,%XMM13,%XMM13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVSD 0x73ebc(%RIP),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x60(%RBP),%RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x40(%RBP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x80(%RBP),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
JMP 41d1e4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
VXORPD %XMM13,%XMM13,%XMM13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %R11D,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV -0x80(%RBP),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VPBROADCASTQ %R11,%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VPORQ 0x7281a(%RIP),%ZMM2,%ZMM2 | 1 | 0.50 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
VPCMPLTUQ %ZMM1,%ZMM2,%K1 | |||||||||||
VMOVUPD (%R10,%R11,8),%ZMM1{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD (%R9,%R11,8),%ZMM2{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VSUBPD %ZMM2,%ZMM1,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD (%RCX,%R11,8),%ZMM2{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD (%R8,%R11,8),%ZMM3{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VFMADD231PD 0x73e0f(%RIP){1to8},%ZMM2,%ZMM3 | 1 | 0.50 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD 0x73e0d(%RIP),%ZMM2 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VBLENDMPD %ZMM3,%ZMM2,%ZMM3{%K1} | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVUPD (%R15,%R11,8),%ZMM4{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD (%RDI,%R11,8),%ZMM5{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VADDPD %ZMM5,%ZMM5,%ZMM2{%K1} | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD (%R12,%R11,8),%ZMM5{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VADDPD %ZMM5,%ZMM1,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD %ZMM1,(%R12,%R11,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VSUBPD %ZMM3,%ZMM4,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD (%RSI,%R11,8),%ZMM4{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VADDPD %ZMM4,%ZMM2,%ZMM2 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VADDPD %ZMM2,%ZMM1,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD %ZMM1,(%RSI,%R11,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VXORPD 0x70ec5(%RIP){1to8},%ZMM3,%ZMM1{%K1}{z} | 1 | 0.50 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
VEXTRACTF64X4 $0x1,%ZMM1,%YMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM2,%ZMM1,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VEXTRACTF128 $0x1,%YMM1,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %XMM2,%XMM1,%XMM1 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VPERMILPD $0x1,%XMM1,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VADDSD %XMM2,%XMM1,%XMM1 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDSD %XMM1,%XMM13,%XMM13 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV -0x40(%RBP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVUPD %XMM1,-0xb0(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOVQ $0,-0xa0(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 2 | 1 |
MOV -0x78(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x88(%RAX),%R8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x98(%RAX),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x88(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%RAX,%RAX,4),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x8(%RDX,%RAX,8),%R9 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x18(%RDX,%RAX,8),%R11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x1a0(%RDI),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0xf0(%RDI),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x100(%RDI),%R13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RBX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
AND $-0x8,%R12 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
LEA -0x1(%R12),%RDX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ %RBX,%ZMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA (,%RAX,8),%RDI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,-0x68(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA (,%R9,8),%R9 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x58(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA (,%R8,8),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,-0x50(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVDQU64 0x726c2(%RIP),%ZMM8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
MOV %R10,-0x70(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R11,-0x98(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R13,-0x78(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R12,-0x90(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
JMP 41d3ac | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV -0x40(%RBP),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0xd8(%RDX),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x88(%RBP),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD (%RAX,%RCX,8),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x138(%RDX),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VSUBSD %XMM1,%XMM0,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDSD 0x10(%RDX),%XMM0,%XMM0 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM0,0x10(%RDX) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD %XMM1,(%RAX,%RCX,8) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD -0xb0(%RBP),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD -0xa8(%RBP),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x78(%RBP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD %XMM0,(%RDI,%RCX,8) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV -0x48(%RBP),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%RCX,%RSI,1),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD %XMM1,(%RDI,%RAX,8) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD -0xa0(%RBP),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%RCX,%RSI,2),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD %XMM0,(%RDI,%RAX,8) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x128(%RDX),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD %XMM13,(%RAX,%RCX,8) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
ADD $0x88,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %RBP | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
VZEROUPPER | 4 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 | 0 | 1 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼miniqmcreference::TwoBodyJastrowRef | 1.05 | 0.63 |
○Loop 247 - TwoBodyJastrowRef.h:322-329 - exec | 0.37 | 0.22 |
○Loop 249 - TwoBodyJastrowRef.h:266-271 - exec | 0 | 0 |
○Loop 246 - TwoBodyJastrowRef.h:322-329 - exec | 0 | 0 |
○Loop 248 - TwoBodyJastrowRef.h:266-271 - exec | 0 | 0 |
▼Loop 244 - TwoBodyJastrowRef.h:322-347 - exec– | 0 | 0 |
○Loop 245 - TwoBodyJastrowRef.h:340-345 - exec | 0.65 | 0.39 |