Function: _ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLER ... | Module: exec | Source: TwoBodyJastrowRef.h:268-432 [...] | Coverage: 0.05% |
---|
Function: _ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLER ... | Module: exec | Source: TwoBodyJastrowRef.h:268-432 [...] | Coverage: 0.05% |
---|
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/VectorSoAContainer.h: 231 - 273 |
-------------------------------------------------------------------------------- |
231: inline const AoSElement_t operator[](size_t i) const { return AoSElement_t(myData + i, nGhosts); } |
[...] |
244: *(_base + M * i) = rhs[i]; |
[...] |
263: inline Accessor operator()(size_t i) { return Accessor(myData + i, nGhosts); } |
[...] |
273: inline const T* restrict data(size_t i) const { return myData + i * nGhosts; } |
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/Particle/ParticleSet.h: 313 - 316 |
-------------------------------------------------------------------------------- |
313: inline int first(int igroup) const { return (*group_offsets_)[igroup]; } |
314: |
315: ///return the last index of a group i |
316: inline int last(int igroup) const { return (*group_offsets_)[igroup + 1]; } |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/stl_numeric.h: 140 - 141 |
-------------------------------------------------------------------------------- |
140: for (; __first != __last; ++__first) |
141: __init = _GLIBCXX_MOVE_IF_20(__init) + *__first; |
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/OhmmsVector.h: 223 - 249 |
-------------------------------------------------------------------------------- |
223: return X[i]; |
[...] |
229: return X[i]; |
[...] |
249: inline const_pointer data() const { return X; } |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/shared_ptr_base.h: 1296 - 1296 |
-------------------------------------------------------------------------------- |
1296: { return _M_ptr; } |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/stl_vector.h: 1064 - 1169 |
-------------------------------------------------------------------------------- |
1064: return *(this->_M_impl._M_start + __n); |
[...] |
1169: { return _M_data_ptr(this->_M_impl._M_start); } |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/stl_algobase.h: 923 - 1115 |
-------------------------------------------------------------------------------- |
923: for (; __first != __last; ++__first) |
924: *__first = __tmp; |
[...] |
1115: if (__n <= 0) |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/stl_iterator.h: 1028 - 1182 |
-------------------------------------------------------------------------------- |
1028: : _M_current(__i) { } |
[...] |
1182: { return __lhs.base() != __rhs.base(); } |
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/Jastrow/TwoBodyJastrowRef.h: 268 - 432 |
-------------------------------------------------------------------------------- |
268: const int igt = P.GroupID[iat] * NumGroups; |
269: for (int jg = 0; jg < NumGroups; ++jg) |
270: { |
271: const FuncType& f2(*F[igt + jg]); |
272: int iStart = P.first(jg); |
273: int iEnd = std::min(jelmax, P.last(jg)); |
274: f2.evaluateVGL(iat, iStart, iEnd, dist, u, du, d2u, DistCompressed.data(), DistIndice.data()); |
[...] |
360: const auto& d_table = P.getDistTableAA(myTableID); |
361: for (int ig = 0; ig < NumGroups; ++ig) |
362: { |
363: const int igt = ig * NumGroups; |
364: for (int iat = P.first(ig), last = P.last(ig); iat < last; ++iat) |
365: { |
366: computeU3(P, iat, d_table.getDistRow(iat).data(), cur_u.data(), cur_du.data(), cur_d2u.data(), true); |
367: Uat[iat] = std::accumulate(cur_u.begin(), cur_u.begin() + iat, valT()); |
[...] |
375: for (int jat = 0; jat < iat; ++jat) |
376: lap += d2u[jat] + lapfac * du[jat]; |
377: for (int idim = 0; idim < OHMMS_DIM; ++idim) |
378: { |
379: const valT* restrict dX = displ.data(idim); |
380: valT s = valT(); |
381: for (int jat = 0; jat < iat; ++jat) |
382: s += du[jat] * dX[jat]; |
383: grad[idim] = s; |
384: } |
385: dUat(iat) = grad; |
386: d2Uat[iat] = -lap; |
387: // add the contribution from the upper triangle |
388: for (int jat = 0; jat < iat; jat++) |
389: { |
390: Uat[jat] += u[jat]; |
391: d2Uat[jat] -= d2u[jat] + lapfac * du[jat]; |
[...] |
397: for (int jat = 0; jat < iat; jat++) |
398: save_g[jat] -= du[jat] * dX[jat]; |
[...] |
419: { |
420: if (fromscratch) |
421: recompute(P); |
422: LogValue = valT(0); |
423: for (int iat = 0; iat < N; ++iat) |
424: { |
425: LogValue += Uat[iat]; |
426: G[iat] += dUat[iat]; |
427: L[iat] += d2Uat[iat]; |
428: } |
429: |
430: constexpr valT mhalf(-0.5); |
431: LogValue = mhalf * LogValue; |
432: } |
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/Numerics/PETE/OperatorTags.h: 94 - 94 |
-------------------------------------------------------------------------------- |
94: (const_cast<T1&>(a) += b); |
0x426520 PUSH %RBP |
0x426521 MOV %RSP,%RBP |
0x426524 PUSH %R15 |
0x426526 PUSH %R14 |
0x426528 PUSH %R13 |
0x42652a PUSH %R12 |
0x42652c PUSH %RBX |
0x42652d SUB $0x78,%RSP |
0x426531 MOV %RCX,-0x98(%RBP) |
0x426538 MOV %RDX,-0x90(%RBP) |
0x42653f MOV %RSI,-0x60(%RBP) |
0x426543 MOV %RDI,%RBX |
0x426546 TEST %R8B,%R8B |
0x426549 JE 426ed9 |
0x42654f MOV 0x248(%RBX),%ESI |
0x426555 MOV -0x60(%RBP),%RDI |
0x426559 CALL 462da0 <_ZNK11qmcplusplus11ParticleSet14getDistTableAAEi> |
0x42655e MOV %RAX,-0x88(%RBP) |
0x426565 MOV 0xa0(%RBX),%R10 |
0x42656c TEST %R10,%R10 |
0x42656f JE 426ed9 |
0x426575 XOR %ECX,%ECX |
0x426577 MOVSD 0xefbc9(%RIP),%XMM6 |
0x42657f MOVAPD 0xf1219(%RIP),%XMM7 |
0x426587 MOV %R10,%R12 |
0x42658a MOV %RBX,-0x70(%RBP) |
0x42658e JMP 4265a9 |
(350) 0x426590 MOV %R12,%RAX |
(350) 0x426593 MOV -0xa0(%RBP),%RCX |
(350) 0x42659a INC %RCX |
(350) 0x42659d MOV %RAX,%R12 |
(350) 0x4265a0 CMP %RCX,%RAX |
(350) 0x4265a3 JBE 426ed9 |
(350) 0x4265a9 MOV -0x60(%RBP),%RAX |
(350) 0x4265ad MOV 0x268(%RAX),%RAX |
(350) 0x4265b4 MOV 0x18(%RAX),%RAX |
(350) 0x4265b8 MOVSXD (%RAX,%RCX,4),%RSI |
(350) 0x4265bc MOV 0x4(%RAX,%RCX,4),%EAX |
(350) 0x4265c0 CMP %EAX,%ESI |
(350) 0x4265c2 MOV %RCX,-0xa0(%RBP) |
(350) 0x4265c9 JGE 426590 |
(351) 0x4265cb MOV %EAX,-0x7c(%RBP) |
(351) 0x4265ce MOV 0x140(%RBX),%R9 |
(351) 0x4265d5 MOV 0x158(%RBX),%R13 |
(351) 0x4265dc MOV 0x170(%RBX),%RDI |
(351) 0x4265e3 JMP 4265fb |
0x4265e5 NOPW %CS:(%RAX,%RAX,1) |
(351) 0x4265f0 INC %RSI |
(351) 0x4265f3 MOV %R10,%RAX |
(351) 0x4265f6 CMP %ESI,-0x7c(%RBP) |
(351) 0x4265f9 JE 426593 |
(351) 0x4265fb MOV %RDI,-0x38(%RBP) |
(351) 0x4265ff MOV -0x88(%RBP),%RAX |
(351) 0x426606 MOV 0x48(%RAX),%RAX |
(351) 0x42660a LEA (%RSI,%RSI,4),%RCX |
(351) 0x42660e MOV %RCX,-0x48(%RBP) |
(351) 0x426612 MOV 0x18(%RAX,%RCX,8),%R8 |
(351) 0x426617 TEST %RSI,%RSI |
(351) 0x42661a MOV %RSI,-0x68(%RBP) |
(351) 0x42661e MOV %R9,-0x50(%RBP) |
(351) 0x426622 JLE 426684 |
(351) 0x426624 MOV %ESI,%EDX |
(351) 0x426626 SAL $0x3,%RDX |
(351) 0x42662a MOV %R9,%RDI |
(351) 0x42662d XOR %ESI,%ESI |
(351) 0x42662f MOV %RBX,%R14 |
(351) 0x426632 MOV %R12,%RBX |
(351) 0x426635 MOV %RDX,%R12 |
(351) 0x426638 MOV %R10,-0x40(%RBP) |
(351) 0x42663c MOV %R8,%R15 |
(351) 0x42663f CALL 5074e0 <_intel_fast_memset> |
(351) 0x426644 MOV %R13,%RDI |
(351) 0x426647 XOR %ESI,%ESI |
(351) 0x426649 MOV %R12,%RDX |
(351) 0x42664c CALL 5074e0 <_intel_fast_memset> |
(351) 0x426651 MOV -0x38(%RBP),%RDI |
(351) 0x426655 XOR %ESI,%ESI |
(351) 0x426657 MOV %R12,%RDX |
(351) 0x42665a MOV %RBX,%R12 |
(351) 0x42665d MOV %R14,%RBX |
(351) 0x426660 CALL 5074e0 <_intel_fast_memset> |
(351) 0x426665 MOV %R15,%R8 |
(351) 0x426668 MOV -0x50(%RBP),%R9 |
(351) 0x42666c MOV -0x40(%RBP),%R10 |
(351) 0x426670 MOV -0x68(%RBP),%RSI |
(351) 0x426674 MOVAPD 0xf1124(%RIP),%XMM7 |
(351) 0x42667c MOVSD 0xefac4(%RIP),%XMM6 |
(351) 0x426684 TEST %R12,%R12 |
(351) 0x426687 JE 426750 |
(351) 0x42668d MOV -0x60(%RBP),%RAX |
(351) 0x426691 MOV 0x18(%RAX),%RAX |
(351) 0x426695 IMUL (%RAX,%RSI,4),%R12D |
(351) 0x42669a MOVSXD %R12D,%RAX |
(351) 0x42669d SAL $0x3,%RAX |
(351) 0x4266a1 MOV %RAX,-0x40(%RBP) |
(351) 0x4266a5 MOV $0x1,%R12D |
(351) 0x4266ab MOV %R13,%R15 |
(351) 0x4266ae MOV -0x38(%RBP),%R13 |
(351) 0x4266b2 NOPW %CS:(%RAX,%RAX,1) |
(353) 0x4266c0 MOV 0x200(%RBX),%RAX |
(353) 0x4266c7 ADD -0x40(%RBP),%RAX |
(353) 0x4266cb MOV -0x8(%RAX,%R12,8),%RDI |
(353) 0x4266d0 MOV -0x60(%RBP),%RAX |
(353) 0x4266d4 MOV 0x268(%RAX),%RAX |
(353) 0x4266db MOV 0x18(%RAX),%RAX |
(353) 0x4266df MOV -0x4(%RAX,%R12,4),%EDX |
(353) 0x4266e4 MOV (%RAX,%R12,4),%ECX |
(353) 0x4266e8 CMP %ESI,%ECX |
(353) 0x4266ea CMOVGE %ESI,%ECX |
(353) 0x4266ed MOV %R8,%R14 |
(353) 0x4266f0 PUSHQ 0x1e8(%RBX) |
(353) 0x4266f6 PUSHQ 0x1d0(%RBX) |
(353) 0x4266fc PUSH %R13 |
(353) 0x4266fe PUSH %R15 |
(353) 0x426700 CALL 423800 <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi> |
(353) 0x426705 MOV %R14,%R8 |
(353) 0x426708 MOV -0x50(%RBP),%R9 |
(353) 0x42670c MOV -0x68(%RBP),%RSI |
(353) 0x426710 ADD $0x20,%RSP |
(353) 0x426714 MOV %R12D,%EAX |
(353) 0x426717 MOV 0xa0(%RBX),%R10 |
(353) 0x42671e INC %R12 |
(353) 0x426721 CMP %RAX,%R10 |
(353) 0x426724 JA 4266c0 |
(351) 0x426726 MOV 0x140(%RBX),%R9 |
(351) 0x42672d MOV %R10,%R12 |
(351) 0x426730 MOVSD 0xefa10(%RIP),%XMM6 |
(351) 0x426738 MOVAPD 0xf1060(%RIP),%XMM7 |
(351) 0x426740 JMP 426753 |
0x426742 NOPW %CS:(%RAX,%RAX,1) |
(351) 0x426750 XOR %R12D,%R12D |
(351) 0x426753 LEA (,%RSI,8),%RAX |
(351) 0x42675b XORPD %XMM0,%XMM0 |
(351) 0x42675f XORPD %XMM1,%XMM1 |
(351) 0x426763 TEST %RAX,%RAX |
(351) 0x426766 JE 426804 |
(351) 0x42676c CMP $0x8,%RSI |
(351) 0x426770 JB 4267b8 |
(351) 0x426772 MOV %RSI,%RAX |
(351) 0x426775 SHR $0x3,%RAX |
(351) 0x426779 MOV %R9,%RCX |
(351) 0x42677c NOPL (%RAX) |
(352) 0x426780 MOVUPD (%RCX),%XMM2 |
(352) 0x426784 MOVUPD 0x10(%RCX),%XMM3 |
(352) 0x426789 MOVUPD 0x20(%RCX),%XMM4 |
(352) 0x42678e ADDPD %XMM2,%XMM4 |
(352) 0x426792 MOVUPD 0x30(%RCX),%XMM2 |
(352) 0x426797 ADDPD %XMM3,%XMM2 |
(352) 0x42679b ADDPD %XMM4,%XMM2 |
(352) 0x42679f MOVAPD %XMM2,%XMM3 |
(352) 0x4267a3 UNPCKHPD %XMM2,%XMM3 |
(352) 0x4267a7 ADDSD %XMM2,%XMM3 |
(352) 0x4267ab ADDSD %XMM3,%XMM1 |
(352) 0x4267af ADD $0x40,%RCX |
(352) 0x4267b3 DEC %RAX |
(352) 0x4267b6 JNE 426780 |
(351) 0x4267b8 MOV %ESI,%ECX |
(351) 0x4267ba AND $0x7,%ECX |
(351) 0x4267bd DEC %RCX |
(351) 0x4267c0 CMP $0x6,%RCX |
(351) 0x4267c4 JA 426804 |
0x4267c6 MOV %RSI,%RAX |
0x4267c9 AND $-0x8,%RAX |
0x4267cd JMP 0x517ce8(,%RCX,8) |
0x4267d4 ADDSD 0x30(%R9,%RAX,8),%XMM1 |
0x4267db ADDSD 0x28(%R9,%RAX,8),%XMM1 |
0x4267e2 ADDSD 0x20(%R9,%RAX,8),%XMM1 |
0x4267e9 ADDSD 0x18(%R9,%RAX,8),%XMM1 |
0x4267f0 ADDSD 0x10(%R9,%RAX,8),%XMM1 |
0x4267f7 ADDSD 0x8(%R9,%RAX,8),%XMM1 |
0x4267fe ADDSD (%R9,%RAX,8),%XMM1 |
(351) 0x426804 MOV 0xd8(%RBX),%RDX |
(351) 0x42680b MOVSD %XMM1,(%RDX,%RSI,8) |
(351) 0x426810 MOV 0x158(%RBX),%R13 |
(351) 0x426817 MOV 0x170(%RBX),%RDI |
(351) 0x42681e MOV -0x88(%RBP),%RAX |
(351) 0x426825 MOV 0x60(%RAX),%RAX |
(351) 0x426829 TEST %RSI,%RSI |
(351) 0x42682c JLE 4268bc |
(351) 0x426832 MOV %RSI,%RCX |
(351) 0x426835 AND $-0x2,%RCX |
(351) 0x426839 JE 426890 |
(351) 0x42683b LEA -0x1(%RCX),%R8 |
(351) 0x42683f XORPD %XMM1,%XMM1 |
(351) 0x426843 MOV %RDI,%R11 |
(351) 0x426846 XOR %EDI,%EDI |
(351) 0x426848 NOPL (%RAX,%RAX,1) |
(370) 0x426850 MOVUPD (%R13,%RDI,8),%XMM0 |
(370) 0x426857 ADDPD %XMM0,%XMM0 |
(370) 0x42685b MOVUPD (%R11,%RDI,8),%XMM2 |
(370) 0x426861 ADDPD %XMM2,%XMM1 |
(370) 0x426865 ADDPD %XMM0,%XMM1 |
(370) 0x426869 ADD $0x2,%RDI |
(370) 0x42686d CMP %R8,%RDI |
(370) 0x426870 JLE 426850 |
(351) 0x426872 MOVAPD %XMM1,%XMM0 |
(351) 0x426876 UNPCKHPD %XMM1,%XMM0 |
(351) 0x42687a ADDSD %XMM1,%XMM0 |
(351) 0x42687e CMP %RCX,%RSI |
(351) 0x426881 MOV %R11,%RDI |
(351) 0x426884 JNE 4268a0 |
(351) 0x426886 JMP 4268bc |
0x426888 NOPL (%RAX,%RAX,1) |
(351) 0x426890 XORPD %XMM0,%XMM0 |
(351) 0x426894 XOR %ECX,%ECX |
(351) 0x426896 NOPW %CS:(%RAX,%RAX,1) |
(369) 0x4268a0 MOVSD (%R13,%RCX,8),%XMM1 |
(369) 0x4268a7 ADDSD (%RDI,%RCX,8),%XMM0 |
(369) 0x4268ac ADDSD %XMM1,%XMM1 |
(369) 0x4268b0 ADDSD %XMM1,%XMM0 |
(369) 0x4268b4 INC %RCX |
(369) 0x4268b7 CMP %RCX,%RSI |
(369) 0x4268ba JNE 4268a0 |
(351) 0x4268bc MOV -0x48(%RBP),%RCX |
(351) 0x4268c0 MOV 0x8(%RAX,%RCX,8),%R14 |
(351) 0x4268c5 MOV 0x18(%RAX,%RCX,8),%RAX |
(351) 0x4268ca XORPD %XMM1,%XMM1 |
(351) 0x4268ce XORPD %XMM2,%XMM2 |
(351) 0x4268d2 TEST %RSI,%RSI |
(351) 0x4268d5 MOV %RDI,-0x38(%RBP) |
(351) 0x4268d9 JLE 426959 |
(351) 0x4268db MOV %RSI,%R8 |
(351) 0x4268de AND $-0x2,%R8 |
(351) 0x4268e2 JE 426930 |
(351) 0x4268e4 LEA -0x1(%R8),%RCX |
(351) 0x4268e8 XORPD %XMM3,%XMM3 |
(351) 0x4268ec XOR %EDI,%EDI |
(351) 0x4268ee XCHG %AX,%AX |
(368) 0x4268f0 MOVUPD (%RAX,%RDI,8),%XMM2 |
(368) 0x4268f5 MOVUPD (%R13,%RDI,8),%XMM4 |
(368) 0x4268fc MULPD %XMM2,%XMM4 |
(368) 0x426900 ADDPD %XMM4,%XMM3 |
(368) 0x426904 ADD $0x2,%RDI |
(368) 0x426908 CMP %RCX,%RDI |
(368) 0x42690b JLE 4268f0 |
(351) 0x42690d MOVAPD %XMM3,%XMM2 |
(351) 0x426911 UNPCKHPD %XMM3,%XMM2 |
(351) 0x426915 ADDSD %XMM3,%XMM2 |
(351) 0x426919 CMP %R8,%RSI |
(351) 0x42691c MOV -0x38(%RBP),%RDI |
(351) 0x426920 JNE 426940 |
(351) 0x426922 JMP 426959 |
0x426924 NOPW %CS:(%RAX,%RAX,1) |
(351) 0x426930 XOR %R8D,%R8D |
(351) 0x426933 NOPW %CS:(%RAX,%RAX,1) |
(367) 0x426940 MOVSD (%RAX,%R8,8),%XMM3 |
(367) 0x426946 MULSD (%R13,%R8,8),%XMM3 |
(367) 0x42694d ADDSD %XMM3,%XMM2 |
(367) 0x426951 INC %R8 |
(367) 0x426954 CMP %R8,%RSI |
(367) 0x426957 JNE 426940 |
(351) 0x426959 TEST %RSI,%RSI |
(351) 0x42695c JLE 4269e9 |
(351) 0x426962 MOV %RSI,%R11 |
(351) 0x426965 AND $-0x2,%R11 |
(351) 0x426969 JE 4269c0 |
(351) 0x42696b LEA -0x1(%R11),%RCX |
(351) 0x42696f LEA (%RAX,%R14,8),%RDI |
(351) 0x426973 XORPD %XMM3,%XMM3 |
(351) 0x426977 XOR %R8D,%R8D |
(351) 0x42697a NOPW (%RAX,%RAX,1) |
(366) 0x426980 MOVUPD (%RDI,%R8,8),%XMM1 |
(366) 0x426986 MOVUPD (%R13,%R8,8),%XMM4 |
(366) 0x42698d MULPD %XMM1,%XMM4 |
(366) 0x426991 ADDPD %XMM4,%XMM3 |
(366) 0x426995 ADD $0x2,%R8 |
(366) 0x426999 CMP %RCX,%R8 |
(366) 0x42699c JLE 426980 |
(351) 0x42699e MOVAPD %XMM3,%XMM1 |
(351) 0x4269a2 UNPCKHPD %XMM3,%XMM1 |
(351) 0x4269a6 ADDSD %XMM3,%XMM1 |
(351) 0x4269aa CMP %R11,%RSI |
(351) 0x4269ad MOV -0x38(%RBP),%RDI |
(351) 0x4269b1 JNE 4269c7 |
(351) 0x4269b3 JMP 4269e9 |
0x4269b5 NOPW %CS:(%RAX,%RAX,1) |
(351) 0x4269c0 XORPD %XMM1,%XMM1 |
(351) 0x4269c4 XOR %R11D,%R11D |
(351) 0x4269c7 LEA (%RAX,%R14,8),%RCX |
(351) 0x4269cb NOPL (%RAX,%RAX,1) |
(365) 0x4269d0 MOVSD (%RCX,%R11,8),%XMM3 |
(365) 0x4269d6 MULSD (%R13,%R11,8),%XMM3 |
(365) 0x4269dd ADDSD %XMM3,%XMM1 |
(365) 0x4269e1 INC %R11 |
(365) 0x4269e4 CMP %R11,%RSI |
(365) 0x4269e7 JNE 4269d0 |
(351) 0x4269e9 TEST %RSI,%RSI |
(351) 0x4269ec JLE 426a50 |
(351) 0x4269ee MOV %RSI,%R11 |
(351) 0x4269f1 AND $-0x2,%R11 |
(351) 0x4269f5 JE 426a60 |
(351) 0x4269f7 LEA -0x1(%R11),%RCX |
(351) 0x4269fb MOV %R14,%RDI |
(351) 0x4269fe SAL $0x4,%RDI |
(351) 0x426a02 ADD %RAX,%RDI |
(351) 0x426a05 XORPD %XMM4,%XMM4 |
(351) 0x426a09 XOR %R8D,%R8D |
(351) 0x426a0c NOPL (%RAX) |
(364) 0x426a10 MOVUPD (%RDI,%R8,8),%XMM3 |
(364) 0x426a16 MOVUPD (%R13,%R8,8),%XMM5 |
(364) 0x426a1d MULPD %XMM3,%XMM5 |
(364) 0x426a21 ADDPD %XMM5,%XMM4 |
(364) 0x426a25 ADD $0x2,%R8 |
(364) 0x426a29 CMP %RCX,%R8 |
(364) 0x426a2c JLE 426a10 |
(351) 0x426a2e MOVAPD %XMM4,%XMM3 |
(351) 0x426a32 UNPCKHPD %XMM4,%XMM3 |
(351) 0x426a36 ADDSD %XMM4,%XMM3 |
(351) 0x426a3a CMP %R11,%RSI |
(351) 0x426a3d MOV -0x38(%RBP),%RDI |
(351) 0x426a41 JNE 426a67 |
(351) 0x426a43 JMP 426a99 |
0x426a45 NOPW %CS:(%RAX,%RAX,1) |
(351) 0x426a50 XORPD %XMM3,%XMM3 |
(351) 0x426a54 JMP 426a99 |
0x426a56 NOPW %CS:(%RAX,%RAX,1) |
(351) 0x426a60 XORPD %XMM3,%XMM3 |
(351) 0x426a64 XOR %R11D,%R11D |
(351) 0x426a67 MOV %R14,%RCX |
(351) 0x426a6a SAL $0x4,%RCX |
(351) 0x426a6e ADD %RAX,%RCX |
(351) 0x426a71 NOPW %CS:(%RAX,%RAX,1) |
(363) 0x426a80 MOVSD (%RCX,%R11,8),%XMM4 |
(363) 0x426a86 MULSD (%R13,%R11,8),%XMM4 |
(363) 0x426a8d ADDSD %XMM4,%XMM3 |
(363) 0x426a91 INC %R11 |
(363) 0x426a94 CMP %R11,%RSI |
(363) 0x426a97 JNE 426a80 |
(351) 0x426a99 MOV %R14,-0x48(%RBP) |
(351) 0x426a9d MOV 0xf0(%RBX),%R8 |
(351) 0x426aa4 MOV 0x100(%RBX),%R14 |
(351) 0x426aab LEA (%RSI,%R8,1),%RCX |
(351) 0x426aaf MOVSD %XMM2,(%R14,%RSI,8) |
(351) 0x426ab5 MOVSD %XMM1,(%R14,%RCX,8) |
(351) 0x426abb MOV %R8,-0x58(%RBP) |
(351) 0x426abf LEA (%RSI,%R8,2),%RCX |
(351) 0x426ac3 MOVSD %XMM3,(%R14,%RCX,8) |
(351) 0x426ac9 XORPD 0xef5df(%RIP),%XMM0 |
(351) 0x426ad1 MOV 0x128(%RBX),%R8 |
(351) 0x426ad8 MOVLPD %XMM0,(%R8,%RSI,8) |
(351) 0x426ade TEST %RSI,%RSI |
(351) 0x426ae1 JLE 4265f0 |
(351) 0x426ae7 MOV %R12,-0x78(%RBP) |
(351) 0x426aeb MOV %R10,-0x40(%RBP) |
(351) 0x426aef LEA (%RDX,%RSI,8),%R11 |
(351) 0x426af3 ADD $-0x8,%R11 |
(351) 0x426af7 CMP %R8,%R11 |
(351) 0x426afa SETAEB -0x2e(%RBP) |
(351) 0x426afe LEA (%R8,%RSI,8),%RDI |
(351) 0x426b02 ADD $-0x8,%RDI |
(351) 0x426b06 CMP %RDX,%RDI |
(351) 0x426b09 SETAE %CL |
(351) 0x426b0c CMP %R9,%R11 |
(351) 0x426b0f SETB %R15B |
(351) 0x426b13 LEA (%R9,%RSI,8),%R10 |
(351) 0x426b17 ADD $-0x8,%R10 |
(351) 0x426b1b CMP %RDX,%R10 |
(351) 0x426b1e SETBB -0x2d(%RBP) |
(351) 0x426b22 CMP %R8,%R10 |
(351) 0x426b25 SETB %R12B |
(351) 0x426b29 MOV %R9,-0x50(%RBP) |
(351) 0x426b2d CMP %R9,%RDI |
(351) 0x426b30 SETBB -0x2c(%RBP) |
(351) 0x426b34 CMP %R13,%R11 |
(351) 0x426b37 SETB %R10B |
(351) 0x426b3b LEA -0x8(,%RSI,8),%RBX |
(351) 0x426b43 ADD %R13,%RBX |
(351) 0x426b46 CMP %RDX,%RBX |
(351) 0x426b49 SETBB -0x2b(%RBP) |
(351) 0x426b4d CMP -0x38(%RBP),%R11 |
(351) 0x426b51 SETB %R11B |
(351) 0x426b55 MOV -0x38(%RBP),%R9 |
(351) 0x426b59 LEA (%R9,%RSI,8),%R9 |
(351) 0x426b5d ADD $-0x8,%R9 |
(351) 0x426b61 CMP %RDX,%R9 |
(351) 0x426b64 SETBB -0x2a(%RBP) |
(351) 0x426b68 CMP %R8,%RBX |
(351) 0x426b6b SETB %BL |
(351) 0x426b6e CMP %R13,%RDI |
(351) 0x426b71 SETBB -0x29(%RBP) |
(351) 0x426b75 CMP %R8,%R9 |
(351) 0x426b78 SETB %R9B |
(351) 0x426b7c CMP -0x38(%RBP),%RDI |
(351) 0x426b80 MOV -0x38(%RBP),%RDI |
(351) 0x426b84 SETB %SIL |
(351) 0x426b88 TEST %CL,-0x2e(%RBP) |
(351) 0x426b8b JNE 426c50 |
(351) 0x426b91 OR -0x2d(%RBP),%R15B |
(351) 0x426b95 JE 426c50 |
(351) 0x426b9b OR -0x2c(%RBP),%R12B |
(351) 0x426b9f JE 426c50 |
(351) 0x426ba5 OR -0x2b(%RBP),%R10B |
(351) 0x426ba9 JE 426c50 |
(351) 0x426baf OR -0x2a(%RBP),%R11B |
(351) 0x426bb3 JE 426c50 |
(351) 0x426bb9 OR -0x29(%RBP),%BL |
(351) 0x426bbc JE 426c50 |
(351) 0x426bc2 OR %SIL,%R9B |
(351) 0x426bc5 JE 426c50 |
(351) 0x426bcb MOV -0x68(%RBP),%RSI |
(351) 0x426bcf MOV %RSI,%R11 |
(351) 0x426bd2 AND $-0x2,%R11 |
(351) 0x426bd6 JE 426ca6 |
(351) 0x426bdc LEA -0x1(%R11),%RCX |
(351) 0x426be0 MOV %R13,%R15 |
(351) 0x426be3 MOV %RDI,%R13 |
(351) 0x426be6 XOR %EDI,%EDI |
(351) 0x426be8 MOV -0x50(%RBP),%R9 |
(351) 0x426bec NOPL (%RAX) |
(362) 0x426bf0 MOVUPD (%RDX,%RDI,8),%XMM0 |
(362) 0x426bf5 MOVUPD (%R9,%RDI,8),%XMM1 |
(362) 0x426bfb ADDPD %XMM0,%XMM1 |
(362) 0x426bff MOVUPD %XMM1,(%RDX,%RDI,8) |
(362) 0x426c04 MOVUPD (%R15,%RDI,8),%XMM0 |
(362) 0x426c0a MULPD %XMM7,%XMM0 |
(362) 0x426c0e MOVUPD (%R13,%RDI,8),%XMM1 |
(362) 0x426c15 SUBPD %XMM1,%XMM0 |
(362) 0x426c19 MOVUPD (%R8,%RDI,8),%XMM1 |
(362) 0x426c1f ADDPD %XMM0,%XMM1 |
(362) 0x426c23 MOVUPD %XMM1,(%R8,%RDI,8) |
(362) 0x426c29 ADD $0x2,%RDI |
(362) 0x426c2d CMP %RCX,%RDI |
(362) 0x426c30 JLE 426bf0 |
(351) 0x426c32 CMP %R11,%RSI |
(351) 0x426c35 MOV -0x70(%RBP),%RBX |
(351) 0x426c39 MOV -0x40(%RBP),%R10 |
(351) 0x426c3d MOV -0x78(%RBP),%R12 |
(351) 0x426c41 MOV %R13,%RDI |
(351) 0x426c44 MOV %R15,%R13 |
(351) 0x426c47 JNE 426cc0 |
(351) 0x426c49 JMP 426cf7 |
0x426c4e XCHG %AX,%AX |
(351) 0x426c50 XOR %ECX,%ECX |
(351) 0x426c52 MOV -0x70(%RBP),%RBX |
(351) 0x426c56 MOV -0x68(%RBP),%RSI |
(351) 0x426c5a MOV -0x40(%RBP),%R10 |
(351) 0x426c5e MOV -0x50(%RBP),%R9 |
(351) 0x426c62 MOV -0x78(%RBP),%R12 |
(351) 0x426c66 NOPW %CS:(%RAX,%RAX,1) |
(354) 0x426c70 MOVSD (%RDX,%RCX,8),%XMM0 |
(354) 0x426c75 ADDSD (%R9,%RCX,8),%XMM0 |
(354) 0x426c7b MOVSD %XMM0,(%RDX,%RCX,8) |
(354) 0x426c80 MOVSD (%R13,%RCX,8),%XMM0 |
(354) 0x426c87 MULSD %XMM6,%XMM0 |
(354) 0x426c8b SUBSD (%RDI,%RCX,8),%XMM0 |
(354) 0x426c90 ADDSD (%R8,%RCX,8),%XMM0 |
(354) 0x426c96 MOVSD %XMM0,(%R8,%RCX,8) |
(354) 0x426c9c INC %RCX |
(354) 0x426c9f CMP %RCX,%RSI |
(354) 0x426ca2 JNE 426c70 |
(351) 0x426ca4 JMP 426cf7 |
(351) 0x426ca6 XOR %R11D,%R11D |
(351) 0x426ca9 MOV -0x70(%RBP),%RBX |
(351) 0x426cad MOV -0x40(%RBP),%R10 |
(351) 0x426cb1 MOV -0x50(%RBP),%R9 |
(351) 0x426cb5 MOV -0x78(%RBP),%R12 |
(351) 0x426cb9 NOPL (%RAX) |
(361) 0x426cc0 MOVSD (%RDX,%R11,8),%XMM0 |
(361) 0x426cc6 ADDSD (%R9,%R11,8),%XMM0 |
(361) 0x426ccc MOVSD %XMM0,(%RDX,%R11,8) |
(361) 0x426cd2 MOVSD (%R13,%R11,8),%XMM0 |
(361) 0x426cd9 MULSD %XMM6,%XMM0 |
(361) 0x426cdd SUBSD (%RDI,%R11,8),%XMM0 |
(361) 0x426ce3 ADDSD (%R8,%R11,8),%XMM0 |
(361) 0x426ce9 MOVSD %XMM0,(%R8,%R11,8) |
(361) 0x426cef INC %R11 |
(361) 0x426cf2 CMP %R11,%RSI |
(361) 0x426cf5 JNE 426cc0 |
(351) 0x426cf7 TEST %RSI,%RSI |
(351) 0x426cfa JLE 4265f0 |
(351) 0x426d00 MOV %RSI,%RDX |
(351) 0x426d03 AND $-0x2,%RDX |
(351) 0x426d07 JE 426d44 |
(351) 0x426d09 LEA -0x1(%RDX),%RCX |
(351) 0x426d0d XOR %EDI,%EDI |
(351) 0x426d0f NOP |
(360) 0x426d10 MOVUPD (%RAX,%RDI,8),%XMM0 |
(360) 0x426d15 MOVUPD (%R13,%RDI,8),%XMM1 |
(360) 0x426d1c MULPD %XMM0,%XMM1 |
(360) 0x426d20 MOVUPD (%R14,%RDI,8),%XMM0 |
(360) 0x426d26 SUBPD %XMM1,%XMM0 |
(360) 0x426d2a MOVUPD %XMM0,(%R14,%RDI,8) |
(360) 0x426d30 ADD $0x2,%RDI |
(360) 0x426d34 CMP %RCX,%RDI |
(360) 0x426d37 JLE 426d10 |
(351) 0x426d39 CMP %RDX,%RSI |
(351) 0x426d3c MOV -0x38(%RBP),%RDI |
(351) 0x426d40 JNE 426d50 |
(351) 0x426d42 JMP 426d74 |
(351) 0x426d44 XOR %EDX,%EDX |
(351) 0x426d46 NOPW %CS:(%RAX,%RAX,1) |
(355) 0x426d50 MOVSD (%RAX,%RDX,8),%XMM0 |
(355) 0x426d55 MULSD (%R13,%RDX,8),%XMM0 |
(355) 0x426d5c MOVSD (%R14,%RDX,8),%XMM1 |
(355) 0x426d62 SUBSD %XMM0,%XMM1 |
(355) 0x426d66 MOVSD %XMM1,(%R14,%RDX,8) |
(355) 0x426d6c INC %RDX |
(355) 0x426d6f CMP %RDX,%RSI |
(355) 0x426d72 JNE 426d50 |
(351) 0x426d74 TEST %RSI,%RSI |
(351) 0x426d77 JLE 4265f0 |
(351) 0x426d7d MOV %RSI,%RDX |
(351) 0x426d80 AND $-0x2,%RDX |
(351) 0x426d84 JE 426dd1 |
(351) 0x426d86 LEA -0x1(%RDX),%RCX |
(351) 0x426d8a MOV -0x58(%RBP),%RDI |
(351) 0x426d8e LEA (%R14,%RDI,8),%RDI |
(351) 0x426d92 MOV -0x48(%RBP),%R8 |
(351) 0x426d96 LEA (%RAX,%R8,8),%R8 |
(351) 0x426d9a XOR %R11D,%R11D |
(351) 0x426d9d NOPL (%RAX) |
(359) 0x426da0 MOVUPD (%R8,%R11,8),%XMM0 |
(359) 0x426da6 MOVUPD (%R13,%R11,8),%XMM1 |
(359) 0x426dad MULPD %XMM0,%XMM1 |
(359) 0x426db1 MOVUPD (%RDI,%R11,8),%XMM0 |
(359) 0x426db7 SUBPD %XMM1,%XMM0 |
(359) 0x426dbb MOVUPD %XMM0,(%RDI,%R11,8) |
(359) 0x426dc1 ADD $0x2,%R11 |
(359) 0x426dc5 CMP %RCX,%R11 |
(359) 0x426dc8 JLE 426da0 |
(351) 0x426dca CMP %RDX,%RSI |
(351) 0x426dcd JNE 426dd3 |
(351) 0x426dcf JMP 426e12 |
(351) 0x426dd1 XOR %EDX,%EDX |
(351) 0x426dd3 MOV -0x58(%RBP),%RCX |
(351) 0x426dd7 LEA (%R14,%RCX,8),%RCX |
(351) 0x426ddb MOV -0x48(%RBP),%RDI |
(351) 0x426ddf LEA (%RAX,%RDI,8),%RDI |
(351) 0x426de3 NOPW %CS:(%RAX,%RAX,1) |
(356) 0x426df0 MOVSD (%RDI,%RDX,8),%XMM0 |
(356) 0x426df5 MULSD (%R13,%RDX,8),%XMM0 |
(356) 0x426dfc MOVSD (%RCX,%RDX,8),%XMM1 |
(356) 0x426e01 SUBSD %XMM0,%XMM1 |
(356) 0x426e05 MOVSD %XMM1,(%RCX,%RDX,8) |
(356) 0x426e0a INC %RDX |
(356) 0x426e0d CMP %RDX,%RSI |
(356) 0x426e10 JNE 426df0 |
(351) 0x426e12 TEST %RSI,%RSI |
(351) 0x426e15 MOV -0x38(%RBP),%RDI |
(351) 0x426e19 JLE 4265f0 |
(351) 0x426e1f MOV %RSI,%RDX |
(351) 0x426e22 AND $-0x2,%RDX |
(351) 0x426e26 JE 426e89 |
(351) 0x426e28 LEA -0x1(%RDX),%RCX |
(351) 0x426e2c MOV -0x58(%RBP),%RDI |
(351) 0x426e30 SAL $0x4,%RDI |
(351) 0x426e34 ADD %R14,%RDI |
(351) 0x426e37 MOV -0x48(%RBP),%R8 |
(351) 0x426e3b SAL $0x4,%R8 |
(351) 0x426e3f ADD %RAX,%R8 |
(351) 0x426e42 XOR %R11D,%R11D |
(351) 0x426e45 NOPW %CS:(%RAX,%RAX,1) |
(358) 0x426e50 MOVUPD (%R8,%R11,8),%XMM0 |
(358) 0x426e56 MOVUPD (%R13,%R11,8),%XMM1 |
(358) 0x426e5d MULPD %XMM0,%XMM1 |
(358) 0x426e61 MOVUPD (%RDI,%R11,8),%XMM0 |
(358) 0x426e67 SUBPD %XMM1,%XMM0 |
(358) 0x426e6b MOVUPD %XMM0,(%RDI,%R11,8) |
(358) 0x426e71 ADD $0x2,%R11 |
(358) 0x426e75 CMP %RCX,%R11 |
(358) 0x426e78 JLE 426e50 |
(351) 0x426e7a CMP %RDX,%RSI |
(351) 0x426e7d MOV -0x38(%RBP),%RDI |
(351) 0x426e81 JE 4265f0 |
(351) 0x426e87 JMP 426e8b |
(351) 0x426e89 XOR %EDX,%EDX |
(351) 0x426e8b MOV -0x58(%RBP),%RCX |
(351) 0x426e8f SAL $0x4,%RCX |
(351) 0x426e93 ADD %RCX,%R14 |
(351) 0x426e96 MOV -0x48(%RBP),%RCX |
(351) 0x426e9a SAL $0x4,%RCX |
(351) 0x426e9e ADD %RCX,%RAX |
(351) 0x426ea1 NOPW %CS:(%RAX,%RAX,1) |
(357) 0x426eb0 MOVSD (%RAX,%RDX,8),%XMM0 |
(357) 0x426eb5 MULSD (%R13,%RDX,8),%XMM0 |
(357) 0x426ebc MOVSD (%R14,%RDX,8),%XMM1 |
(357) 0x426ec2 SUBSD %XMM0,%XMM1 |
(357) 0x426ec6 MOVSD %XMM1,(%R14,%RDX,8) |
(357) 0x426ecc INC %RDX |
(357) 0x426ecf CMP %RDX,%RSI |
(357) 0x426ed2 JNE 426eb0 |
(351) 0x426ed4 JMP 4265f0 |
0x426ed9 MOVQ $0,0x10(%RBX) |
0x426ee1 MOV 0x90(%RBX),%RAX |
0x426ee8 TEST %RAX,%RAX |
0x426eeb JE 426fa5 |
0x426ef1 MOV 0xd8(%RBX),%RCX |
0x426ef8 MOV 0xf0(%RBX),%RDX |
0x426eff MOV 0x100(%RBX),%RSI |
0x426f06 MOV -0x90(%RBP),%RDI |
0x426f0d MOV 0x18(%RDI),%RDI |
0x426f11 MOV 0x128(%RBX),%R8 |
0x426f18 MOV -0x98(%RBP),%R9 |
0x426f1f MOV 0x18(%R9),%R9 |
0x426f23 SAL $0x20,%RDX |
0x426f27 ADD $0x10,%RDI |
0x426f2b MOV %RDX,%R10 |
0x426f2e SAR $0x1c,%R10 |
0x426f32 ADD %RSI,%R10 |
0x426f35 SAR $0x1d,%RDX |
0x426f39 ADD %RSI,%RDX |
0x426f3c XOR %R11D,%R11D |
0x426f3f NOP |
(349) 0x426f40 MOVSD 0x10(%RBX),%XMM0 |
(349) 0x426f45 ADDSD (%RCX,%R11,8),%XMM0 |
(349) 0x426f4b MOVSD %XMM0,0x10(%RBX) |
(349) 0x426f50 MOVUPD -0x10(%RDI),%XMM0 |
(349) 0x426f55 MOVSD (%RSI,%R11,8),%XMM1 |
(349) 0x426f5b MOVHPD (%RDX,%R11,8),%XMM1 |
(349) 0x426f61 ADDPD %XMM0,%XMM1 |
(349) 0x426f65 MOVSD (%RDI),%XMM0 |
(349) 0x426f69 ADDSD (%R10,%R11,8),%XMM0 |
(349) 0x426f6f MOVUPD %XMM1,-0x10(%RDI) |
(349) 0x426f74 MOVSD %XMM0,(%RDI) |
(349) 0x426f78 MOVSD (%R9,%R11,8),%XMM0 |
(349) 0x426f7e ADDSD (%R8,%R11,8),%XMM0 |
(349) 0x426f84 MOVSD %XMM0,(%R9,%R11,8) |
(349) 0x426f8a INC %R11 |
(349) 0x426f8d ADD $0x18,%RDI |
(349) 0x426f91 CMP %R11,%RAX |
(349) 0x426f94 JNE 426f40 |
0x426f96 MOVSD 0x10(%RBX),%XMM0 |
0x426f9b MULSD 0xef195(%RIP),%XMM0 |
0x426fa3 JMP 426fad |
0x426fa5 MOVSD 0xf06e3(%RIP),%XMM0 |
0x426fad MOVSD %XMM0,0x10(%RBX) |
0x426fb2 ADD $0x78,%RSP |
0x426fb6 POP %RBX |
0x426fb7 POP %R12 |
0x426fb9 POP %R13 |
0x426fbb POP %R14 |
0x426fbd POP %R15 |
0x426fbf POP %RBP |
0x426fc0 RET |
0x426fc1 NOPW %CS:(%RAX,%RAX,1) |
0x426fcb NOPL (%RAX,%RAX,1) |
Path / |
Source file and lines | TwoBodyJastrowRef.h:268-432 |
Module | exec |
nb instructions | 81 |
nb uops | 72 |
loop length | 414 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 4 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 5 |
ADD-SUB / MUL ratio | 7.00 |
micro-operation queue | 12.00 cycles |
front end | 12.00 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 11.00 | 11.00 | 11.00 | 0.50 | 0.50 | 3.50 | 3.50 | 0.50 | 0.50 |
cycles | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 11.00 | 11.00 | 11.00 | 0.50 | 0.50 | 3.50 | 3.50 | 0.50 | 0.50 |
Cycles executing div or sqrt instructions | NA |
Front-end | 12.00 |
Dispatch | 11.00 |
Overall L1 | 12.00 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 0% |
all | 7% |
load | 8% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 2% |
load | 5% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 11% |
load | 11% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 13% |
load | 13% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 12% |
load | 12% |
store | 11% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 11% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB $0x78,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RCX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDX,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RSI,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %R8B,%R8B | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 426ed9 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x9b9> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV 0x248(%RBX),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x60(%RBP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CALL 462da0 <_ZNK11qmcplusplus11ParticleSet14getDistTableAAEi> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0xa0(%RBX),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
TEST %R10,%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 426ed9 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x9b9> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOVSD 0xefbc9(%RIP),%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVAPD 0xf1219(%RIP),%XMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOV %R10,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RBX,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
JMP 4265a9 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x89> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOV %RSI,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
AND $-0x8,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JMP 0x517ce8(,%RCX,8) | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
ADDSD 0x30(%R9,%RAX,8),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
ADDSD 0x28(%R9,%RAX,8),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
ADDSD 0x20(%R9,%RAX,8),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
ADDSD 0x18(%R9,%RAX,8),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
ADDSD 0x10(%R9,%RAX,8),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
ADDSD 0x8(%R9,%RAX,8),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
ADDSD (%R9,%RAX,8),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOVQ $0,0x10(%RBX) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x90(%RBX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
TEST %RAX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 426fa5 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xa85> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV 0xd8(%RBX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0xf0(%RBX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x100(%RBX),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x90(%RBP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x18(%RDI),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x128(%RBX),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x98(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x18(%R9),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SAL $0x20,%RDX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD $0x10,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDX,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAR $0x1c,%R10 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD %RSI,%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SAR $0x1d,%RDX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD %RSI,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
XOR %R11D,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOVSD 0x10(%RBX),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MULSD 0xef195(%RIP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
JMP 426fad <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xa8d> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
MOVSD 0xf06e3(%RIP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSD %XMM0,0x10(%RBX) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
ADD $0x78,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
Source file and lines | TwoBodyJastrowRef.h:268-432 |
Module | exec |
nb instructions | 81 |
nb uops | 72 |
loop length | 414 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 4 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 5 |
ADD-SUB / MUL ratio | 7.00 |
micro-operation queue | 12.00 cycles |
front end | 12.00 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 11.00 | 11.00 | 11.00 | 0.50 | 0.50 | 3.50 | 3.50 | 0.50 | 0.50 |
cycles | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 11.00 | 11.00 | 11.00 | 0.50 | 0.50 | 3.50 | 3.50 | 0.50 | 0.50 |
Cycles executing div or sqrt instructions | NA |
Front-end | 12.00 |
Dispatch | 11.00 |
Overall L1 | 12.00 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 0% |
all | 7% |
load | 8% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 2% |
load | 5% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 11% |
load | 11% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 13% |
load | 13% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 12% |
load | 12% |
store | 11% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 11% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB $0x78,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RCX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDX,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RSI,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %R8B,%R8B | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 426ed9 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x9b9> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV 0x248(%RBX),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x60(%RBP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CALL 462da0 <_ZNK11qmcplusplus11ParticleSet14getDistTableAAEi> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0xa0(%RBX),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
TEST %R10,%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 426ed9 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x9b9> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOVSD 0xefbc9(%RIP),%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVAPD 0xf1219(%RIP),%XMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOV %R10,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RBX,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
JMP 4265a9 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x89> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOV %RSI,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
AND $-0x8,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JMP 0x517ce8(,%RCX,8) | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
ADDSD 0x30(%R9,%RAX,8),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
ADDSD 0x28(%R9,%RAX,8),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
ADDSD 0x20(%R9,%RAX,8),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
ADDSD 0x18(%R9,%RAX,8),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
ADDSD 0x10(%R9,%RAX,8),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
ADDSD 0x8(%R9,%RAX,8),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
ADDSD (%R9,%RAX,8),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOVQ $0,0x10(%RBX) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x90(%RBX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
TEST %RAX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 426fa5 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xa85> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV 0xd8(%RBX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0xf0(%RBX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x100(%RBX),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x90(%RBP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x18(%RDI),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x128(%RBX),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x98(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x18(%R9),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SAL $0x20,%RDX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD $0x10,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDX,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAR $0x1c,%R10 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD %RSI,%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SAR $0x1d,%RDX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD %RSI,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
XOR %R11D,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOVSD 0x10(%RBX),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MULSD 0xef195(%RIP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
JMP 426fad <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xa8d> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
MOVSD 0xf06e3(%RIP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSD %XMM0,0x10(%RBX) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
ADD $0x78,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb– | 0.05 | 0.1 |
▼Loop 351 - TwoBodyJastrowRef.h:268-420 - exec– | 0 | 0 |
○Loop 364 - TwoBodyJastrowRef.h:381-382 - exec | 0.01 | 0.02 |
○Loop 366 - TwoBodyJastrowRef.h:381-382 - exec | 0.01 | 0.02 |
○Loop 370 - TwoBodyJastrowRef.h:375-376 - exec | 0.01 | 0.02 |
○Loop 368 - TwoBodyJastrowRef.h:381-382 - exec | 0.01 | 0.02 |
○Loop 365 - TwoBodyJastrowRef.h:381-382 - exec | 0 | 0 |
○Loop 359 - TwoBodyJastrowRef.h:397-398 - exec | 0 | 0.01 |
○Loop 354 - TwoBodyJastrowRef.h:388-391 - exec | 0 | 0 |
○Loop 355 - TwoBodyJastrowRef.h:397-398 - exec | 0 | 0 |
○Loop 367 - TwoBodyJastrowRef.h:381-382 - exec | 0 | 0 |
○Loop 358 - TwoBodyJastrowRef.h:397-398 - exec | 0 | 0 |
○Loop 357 - TwoBodyJastrowRef.h:397-398 - exec | 0 | 0 |
○Loop 360 - TwoBodyJastrowRef.h:397-398 - exec | 0 | 0.01 |
○Loop 352 - stl_numeric.h:140-141 - exec | 0 | 0 |
○Loop 369 - TwoBodyJastrowRef.h:375-376 - exec | 0 | 0 |
○Loop 350 - TwoBodyJastrowRef.h:361-364 - exec | 0 | 0 |
○Loop 363 - TwoBodyJastrowRef.h:381-382 - exec | 0 | 0 |
○Loop 353 - TwoBodyJastrowRef.h:269-274 - exec | 0 | 0 |
○Loop 361 - TwoBodyJastrowRef.h:388-391 - exec | 0 | 0 |
○Loop 362 - TwoBodyJastrowRef.h:388-420 - exec | 0 | 0.01 |
○Loop 356 - TwoBodyJastrowRef.h:397-398 - exec | 0 | 0 |
○Loop 349 - TwoBodyJastrowRef.h:423-427 - exec | 0 | 0 |