Function: miniqmcreference::DiracDeterminantRef<qmcplusplus::DelayedUpdate<double, double> >::evalua ... | Module: exec | Source: DiracDeterminantRef.cpp:231-273 [...] | Coverage: 0.08% |
---|
Function: miniqmcreference::DiracDeterminantRef<qmcplusplus::DelayedUpdate<double, double> >::evalua ... | Module: exec | Source: DiracDeterminantRef.cpp:231-273 [...] | Coverage: 0.08% |
---|
/scratch_na/users/xoserete/qaas_runs/171-284-5202/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/OhmmsMatrix.h: 217 - 217 |
-------------------------------------------------------------------------------- |
217: inline Type_t* operator[](size_type i) { return X.data() + i * D2; } |
/scratch_na/users/xoserete/qaas_runs/171-284-5202/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/SPOSet.h: 106 - 111 |
-------------------------------------------------------------------------------- |
106: for (int iat = first, i = 0; iat < last; ++iat, ++i) |
107: { |
108: ValueVector_t v(logdet[i], OrbitalSetSize); |
109: GradVector_t g(dlogdet[i], OrbitalSetSize); |
110: ValueVector_t l(d2logdet[i], OrbitalSetSize); |
111: evaluate(P, iat, v, g, l); |
/scratch_na/users/xoserete/qaas_runs/171-284-5202/intel/miniqmc/build/miniqmc/src/Numerics/PETE/OperatorTags.h: 63 - 94 |
-------------------------------------------------------------------------------- |
63: return (a * b); |
[...] |
94: (const_cast<T1&>(a) += b); |
/software/compilers/gcc/gcc-13.1.0-full+isl+binutils/include/c++/13.1.0/bits/new_allocator.h: 100 - 168 |
-------------------------------------------------------------------------------- |
100: ~__new_allocator() _GLIBCXX_USE_NOEXCEPT { } |
[...] |
168: _GLIBCXX_OPERATOR_DELETE(_GLIBCXX_SIZED_DEALLOC(__p, __n)); |
/software/compilers/gcc/gcc-13.1.0-full+isl+binutils/include/c++/13.1.0/bits/unique_ptr.h: 199 - 199 |
-------------------------------------------------------------------------------- |
199: pointer _M_ptr() const noexcept { return std::get<0>(_M_t); } |
/scratch_na/users/xoserete/qaas_runs/171-284-5202/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/OhmmsVector.h: 56 - 248 |
-------------------------------------------------------------------------------- |
56: explicit inline Vector(T* ref, size_t n) : nLocal(n), X(ref) {} |
[...] |
144: virtual ~Vector() { free(); } |
[...] |
210: if (nAllocated) |
[...] |
221: inline Type_t& operator[](size_t i) |
222: { |
223: return X[i]; |
[...] |
248: inline pointer data() { return X; } |
/scratch_na/users/xoserete/qaas_runs/171-284-5202/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/TinyVector.h: 62 - 62 |
-------------------------------------------------------------------------------- |
62: X[d] = T(0); |
/scratch_na/users/xoserete/qaas_runs/171-284-5202/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/TinyVectorOps.h: 129 - 131 |
-------------------------------------------------------------------------------- |
129: Type_t res = lhs[0] * rhs[0]; |
130: for (unsigned d = 1; d < D; ++d) |
131: res += lhs[d] * rhs[d]; |
/scratch_na/users/xoserete/qaas_runs/171-284-5202/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/DiracDeterminantRef.cpp: 231 - 273 |
-------------------------------------------------------------------------------- |
231: typename DiracDeterminantRef<DU_TYPE>::RealType DiracDeterminantRef<DU_TYPE>::evaluateLog( |
[...] |
238: if (NumPtcls == 1) |
239: { |
240: ValueType y = psiM(0, 0); |
241: GradType rv = y * dpsiM(0, 0); |
242: G[FirstIndex] += rv; |
243: L[FirstIndex] += y * d2psiM(0, 0) - dot(rv, rv); |
244: } |
245: else |
246: { |
247: for (int i = 0, iat = FirstIndex; i < NumPtcls; i++, iat++) |
248: { |
249: mGradType rv = simd::dot(psiM[i], dpsiM[i], NumOrbitals); |
250: mValueType lap = simd::dot(psiM[i], d2psiM[i], NumOrbitals); |
251: G[iat] += rv; |
252: L[iat] += lap - dot(rv, rv); |
253: } |
254: } |
255: return LogValue; |
256: } |
257: |
258: template<typename DU_TYPE> |
259: void DiracDeterminantRef<DU_TYPE>::recompute(ParticleSet& P) |
260: { |
261: SPOVGLTimer->start(); |
262: Phi->evaluate_notranspose(P, FirstIndex, LastIndex, psiM_temp, dpsiM, d2psiM); |
263: SPOVGLTimer->stop(); |
264: if (NumPtcls == 1) |
265: { |
266: //CurrentDet=psiM(0,0); |
267: ValueType det = psiM_temp(0, 0); |
268: psiM(0, 0) = RealType(1) / det; |
269: LogValue = evaluateLogAndPhase(det, PhaseValue); |
270: } |
271: else |
272: { |
273: invertPsiM(psiM_temp, psiM); |
/scratch_na/users/xoserete/qaas_runs/171-284-5202/intel/miniqmc/build/miniqmc/src/Platforms/CPU/SIMD/inner_product.hpp: 82 - 156 |
-------------------------------------------------------------------------------- |
82: for (int i = 0; i < n; i++) |
83: res += a[i] * b[i]; |
[...] |
155: for (int i = 0; i < n; i++) |
156: res += a[i] * b[i]; |
/scratch_na/users/xoserete/qaas_runs/171-284-5202/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/DeterminantHelper.h: 40 - 48 |
-------------------------------------------------------------------------------- |
40: if (psi < 0.0) |
41: { |
42: phase = M_PI; |
43: return std::log(-psi); |
44: } |
45: else |
46: { |
47: phase = 0.0; |
48: return std::log(psi); |
0x494760 LEA 0x8(%RSP),%R10 |
0x494765 AND $-0x20,%RSP |
0x494769 PUSHQ -0x8(%R10) |
0x49476d PUSH %RBP |
0x49476e MOV %RSP,%RBP |
0x494771 PUSH %R15 |
0x494773 MOV %RDI,%R15 |
0x494776 PUSH %R14 |
0x494778 PUSH %R13 |
0x49477a PUSH %R12 |
0x49477c PUSH %R10 |
0x49477e PUSH %RBX |
0x49477f SUB $0xe0,%RSP |
0x494786 MOV %RSI,-0xc8(%RBP) |
0x49478d MOV 0x468(%RDI),%RDI |
0x494794 MOV %RDX,-0xd0(%RBP) |
0x49479b MOV %RCX,-0x100(%RBP) |
0x4947a2 CALL 50f9a0 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE5startEv> |
0x4947a7 MOV 0x470(%R15),%R12 |
0x4947ae LEA 0x90(%R15),%RDI |
0x4947b5 MOV 0x47c(%R15),%R13D |
0x4947bc MOV %RDI,-0xd8(%RBP) |
0x4947c3 MOV 0x478(%R15),%R14D |
0x4947ca MOV (%R12),%RAX |
0x4947ce MOV 0x28(%RAX),%RBX |
0x4947d2 CMP $0x475470,%RBX |
0x4947d9 JNE 495301 |
0x4947df CMP %R14D,%R13D |
0x4947e2 JLE 494911 |
0x4947e8 SUB %R14D,%R13D |
0x4947eb XOR %EBX,%EBX |
0x4947ed NOPL (%RAX) |
(1001) 0x4947f0 MOV 0x98(%R15),%RCX |
(1001) 0x4947f7 MOV 0xc0(%R15),%R8 |
(1001) 0x4947fe MOVQ $0x58c7c8,-0xc0(%RBP) |
(1001) 0x494809 MOV 0x118(%R15),%R11 |
(1001) 0x494810 MOV 0x180(%R15),%RDX |
(1001) 0x494817 MOVQ $0x58bc98,-0x90(%RBP) |
(1001) 0x494822 IMUL %RBX,%RCX |
(1001) 0x494826 MOV 0x140(%R15),%RAX |
(1001) 0x49482d MOVSXD 0x8(%R12),%RSI |
(1001) 0x494832 MOVQ $0x58c7c8,-0x60(%RBP) |
(1001) 0x49483a IMUL %RBX,%R11 |
(1001) 0x49483e MOVQ $0,-0xb0(%RBP) |
(1001) 0x494849 MOV %RSI,-0xb8(%RBP) |
(1001) 0x494850 LEA (%R8,%RCX,8),%R9 |
(1001) 0x494854 MOV 0x158(%R15),%RCX |
(1001) 0x49485b MOV %RSI,-0x88(%RBP) |
(1001) 0x494862 LEA (%R11,%R11,2),%R10 |
(1001) 0x494866 MOV %R9,-0xa8(%RBP) |
(1001) 0x49486d MOV (%R12),%R11 |
(1001) 0x494871 LEA -0x60(%RBP),%R9 |
(1001) 0x494875 IMUL %RBX,%RCX |
(1001) 0x494879 LEA (%RAX,%R10,8),%RDI |
(1001) 0x49487d MOV %RSI,-0x58(%RBP) |
(1001) 0x494881 MOV -0xc8(%RBP),%RSI |
(1001) 0x494888 MOV %RDI,-0x78(%RBP) |
(1001) 0x49488c MOV %R12,%RDI |
(1001) 0x49488f MOVQ $0,-0x80(%RBP) |
(1001) 0x494897 LEA (%RDX,%RCX,8),%R8 |
(1001) 0x49489b MOVQ $0,-0x50(%RBP) |
(1001) 0x4948a3 LEA (%R14,%RBX,1),%EDX |
(1001) 0x4948a7 MOV %R8,-0x48(%RBP) |
(1001) 0x4948ab LEA -0xc0(%RBP),%RCX |
(1001) 0x4948b2 LEA -0x90(%RBP),%R8 |
(1001) 0x4948b9 CALLQ 0x18(%R11) |
(1001) 0x4948bd MOV -0x50(%RBP),%RSI |
(1001) 0x4948c1 MOVQ $0x58c7c8,-0x60(%RBP) |
(1001) 0x4948c9 TEST %RSI,%RSI |
(1001) 0x4948cc JNE 4951a0 |
(1001) 0x4948d2 MOV -0x80(%RBP),%R9 |
(1001) 0x4948d6 MOVQ $0x58bc98,-0x90(%RBP) |
(1001) 0x4948e1 TEST %R9,%R9 |
(1001) 0x4948e4 JNE 495180 |
(1001) 0x4948ea MOV -0xb0(%RBP),%R10 |
(1001) 0x4948f1 MOVQ $0x58c7c8,-0xc0(%RBP) |
(1001) 0x4948fc TEST %R10,%R10 |
(1001) 0x4948ff JNE 495158 |
(1001) 0x494905 INC %RBX |
(1001) 0x494908 CMP %R13,%RBX |
(1001) 0x49490b JNE 4947f0 |
0x494911 MOV 0x468(%R15),%RDI |
0x494918 CALL 50fbd0 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE4stopEv> |
0x49491d CMPL $0x1,0x484(%R15) |
0x494925 JE 49522a |
0x49492b MOV -0xd8(%RBP),%RSI |
0x494932 MOV %R15,%RDI |
0x494935 LEA 0xd0(%R15),%RDX |
0x49493c CALL 492b60 <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE10invertPsiMERKNS1_6MatrixIdSaIdEEERS7_> |
0x494941 MOV 0x484(%R15),%EDI |
0x494948 CMP $0x1,%EDI |
0x49494b JE 49534a |
0x494951 MOVSXD 0x478(%R15),%RAX |
0x494958 TEST %EDI,%EDI |
0x49495a JLE 495139 |
0x494960 MOV -0xd0(%RBP),%R12 |
0x494967 LEA (%RAX,%RAX,2),%R8 |
0x49496b MOV 0x480(%R15),%R14D |
0x494972 MOV %R15,-0x110(%RBP) |
0x494979 MOV 0x100(%R15),%RCX |
0x494980 MOV 0xd8(%R15),%RDX |
0x494987 MOVSXD %EDI,%RDI |
0x49498a MOV 0x18(%R12),%R13 |
0x49498f MOV 0x118(%R15),%RBX |
0x494996 MOV %RDI,-0xe8(%RBP) |
0x49499d XOR %EDI,%EDI |
0x49499f MOV 0x140(%R15),%R11 |
0x4949a6 VMOVDQA 0xf90f2(%RIP),%YMM8 |
0x4949ae MOV %RCX,-0xc8(%RBP) |
0x4949b5 MOV %R14D,%ECX |
0x4949b8 LEA (%R13,%R8,8),%R9 |
0x4949bd MOV -0x100(%RBP),%R8 |
0x4949c4 MOV %RDX,-0xf0(%RBP) |
0x4949cb SHR $0x2,%ECX |
0x4949ce MOV %R14D,%EDX |
0x4949d1 SAL $0x5,%RCX |
0x4949d5 LEA (%RBX,%RBX,2),%RSI |
0x4949d9 MOV %RBX,-0xf8(%RBP) |
0x4949e0 MOV 0x18(%R8),%R13 |
0x4949e4 AND $-0x4,%EDX |
0x4949e7 MOV %RCX,-0xd8(%RBP) |
0x4949ee LEA (,%RSI,8),%R10 |
0x4949f6 MOV %EDX,-0xdc(%RBP) |
0x4949fc LEA -0x1(%R14),%EBX |
0x494a00 VMOVDQA 0xf90b8(%RIP),%YMM7 |
0x494a08 MOV %R11,%R12 |
0x494a0b LEA (%R13,%RAX,8),%RAX |
0x494a10 VMOVDQA 0xf90c8(%RIP),%YMM6 |
0x494a18 VMOVDQA 0xf90e0(%RIP),%YMM5 |
0x494a20 MOV %R10,-0x108(%RBP) |
0x494a27 VMOVDQA 0xf88d1(%RIP),%YMM4 |
0x494a2f VMOVDQA 0xf88e9(%RIP),%YMM3 |
0x494a37 MOV %RAX,-0x100(%RBP) |
0x494a3e XOR %R10D,%R10D |
0x494a41 MOV %EBX,-0xe0(%RBP) |
0x494a47 XOR %EBX,%EBX |
0x494a49 NOPL (%RAX) |
(998) 0x494a50 MOV -0xc8(%RBP),%R15 |
(998) 0x494a57 LEA (%R15,%RBX,8),%RCX |
(998) 0x494a5b MOV %RCX,%RDX |
(998) 0x494a5e TEST %R14D,%R14D |
(998) 0x494a61 JLE 4951dc |
(998) 0x494a67 CMPL $0x2,-0xe0(%RBP) |
(998) 0x494a6e JBE 4951f9 |
(998) 0x494a74 MOV -0xd8(%RBP),%RSI |
(998) 0x494a7b VXORPD %XMM13,%XMM13,%XMM13 |
(998) 0x494a80 MOV %R12,%R15 |
(998) 0x494a83 VMOVAPD %YMM13,%YMM11 |
(998) 0x494a88 VMOVAPD %YMM13,%YMM0 |
(998) 0x494a8c LEA (%RCX,%RSI,1),%R8 |
(998) 0x494a90 SUB $0x20,%RSI |
(998) 0x494a94 SHR $0x5,%RSI |
(998) 0x494a98 INC %RSI |
(998) 0x494a9b AND $0x3,%ESI |
(998) 0x494a9e JE 494bcd |
(998) 0x494aa4 CMP $0x1,%RSI |
(998) 0x494aa8 JE 494b6b |
(998) 0x494aae CMP $0x2,%RSI |
(998) 0x494ab2 JE 494b11 |
(998) 0x494ab4 VMOVUPD (%R12),%YMM0 |
(998) 0x494aba VMOVUPD 0x20(%R12),%YMM12 |
(998) 0x494ac1 ADD $0x20,%RCX |
(998) 0x494ac5 LEA 0x60(%R12),%R15 |
(998) 0x494aca VMOVUPD 0x40(%R12),%YMM9 |
(998) 0x494ad1 VMOVUPD -0x20(%RCX),%YMM2 |
(998) 0x494ad6 VMOVAPD %YMM0,%YMM11 |
(998) 0x494ada VMOVAPD %YMM0,%YMM1 |
(998) 0x494ade VPERMT2PD %YMM12,%YMM4,%YMM0 |
(998) 0x494ae4 VPERMT2PD %YMM12,%YMM8,%YMM11 |
(998) 0x494aea VPERMT2PD %YMM12,%YMM6,%YMM1 |
(998) 0x494af0 VPERMT2PD %YMM9,%YMM3,%YMM0 |
(998) 0x494af6 VPERMT2PD %YMM9,%YMM7,%YMM11 |
(998) 0x494afc VFMADD132PD %YMM2,%YMM13,%YMM0 |
(998) 0x494b01 VPERMT2PD %YMM9,%YMM5,%YMM1 |
(998) 0x494b07 VFMADD132PD %YMM2,%YMM13,%YMM11 |
(998) 0x494b0c VFMADD231PD %YMM1,%YMM2,%YMM13 |
(998) 0x494b11 VMOVUPD (%R15),%YMM9 |
(998) 0x494b16 VMOVUPD 0x20(%R15),%YMM14 |
(998) 0x494b1c ADD $0x20,%RCX |
(998) 0x494b20 ADD $0x60,%R15 |
(998) 0x494b24 VMOVUPD -0x20(%R15),%YMM12 |
(998) 0x494b2a VMOVUPD -0x20(%RCX),%YMM15 |
(998) 0x494b2f VMOVAPD %YMM9,%YMM10 |
(998) 0x494b34 VMOVAPD %YMM9,%YMM2 |
(998) 0x494b38 VPERMT2PD %YMM14,%YMM4,%YMM9 |
(998) 0x494b3e VPERMT2PD %YMM14,%YMM8,%YMM10 |
(998) 0x494b44 VPERMT2PD %YMM14,%YMM6,%YMM2 |
(998) 0x494b4a VPERMT2PD %YMM12,%YMM3,%YMM9 |
(998) 0x494b50 VPERMT2PD %YMM12,%YMM7,%YMM10 |
(998) 0x494b56 VFMADD231PD %YMM9,%YMM15,%YMM0 |
(998) 0x494b5b VPERMT2PD %YMM12,%YMM5,%YMM2 |
(998) 0x494b61 VFMADD231PD %YMM10,%YMM15,%YMM11 |
(998) 0x494b66 VFMADD231PD %YMM2,%YMM15,%YMM13 |
(998) 0x494b6b VMOVUPD (%R15),%YMM1 |
(998) 0x494b70 VMOVUPD 0x20(%R15),%YMM9 |
(998) 0x494b76 ADD $0x20,%RCX |
(998) 0x494b7a ADD $0x60,%R15 |
(998) 0x494b7e VMOVUPD -0x20(%R15),%YMM14 |
(998) 0x494b84 VMOVUPD -0x20(%RCX),%YMM15 |
(998) 0x494b89 VMOVAPD %YMM1,%YMM12 |
(998) 0x494b8d VMOVAPD %YMM1,%YMM10 |
(998) 0x494b91 VPERMT2PD %YMM9,%YMM4,%YMM1 |
(998) 0x494b97 VPERMT2PD %YMM9,%YMM8,%YMM12 |
(998) 0x494b9d VPERMT2PD %YMM9,%YMM6,%YMM10 |
(998) 0x494ba3 VPERMT2PD %YMM14,%YMM3,%YMM1 |
(998) 0x494ba9 VPERMT2PD %YMM14,%YMM7,%YMM12 |
(998) 0x494baf VFMADD231PD %YMM1,%YMM15,%YMM0 |
(998) 0x494bb4 VPERMT2PD %YMM14,%YMM5,%YMM10 |
(998) 0x494bba VFMADD231PD %YMM12,%YMM15,%YMM11 |
(998) 0x494bbf VFMADD231PD %YMM10,%YMM15,%YMM13 |
(998) 0x494bc4 CMP %R8,%RCX |
(998) 0x494bc7 JE 494d4a |
(1000) 0x494bcd VMOVUPD (%R15),%YMM15 |
(1000) 0x494bd2 VMOVUPD 0x20(%R15),%YMM1 |
(1000) 0x494bd8 SUB $-0x80,%RCX |
(1000) 0x494bdc ADD $0x180,%R15 |
(1000) 0x494be3 VMOVUPD -0x140(%R15),%YMM14 |
(1000) 0x494bec VMOVUPD -0x80(%RCX),%YMM2 |
(1000) 0x494bf1 VMOVAPD %YMM15,%YMM9 |
(1000) 0x494bf6 VMOVAPD %YMM15,%YMM10 |
(1000) 0x494bfb VPERMT2PD %YMM1,%YMM4,%YMM15 |
(1000) 0x494c01 VPERMT2PD %YMM1,%YMM8,%YMM9 |
(1000) 0x494c07 VPERMT2PD %YMM1,%YMM6,%YMM10 |
(1000) 0x494c0d VPERMT2PD %YMM14,%YMM3,%YMM15 |
(1000) 0x494c13 VMOVUPD -0xe0(%R15),%YMM1 |
(1000) 0x494c1c VPERMT2PD %YMM14,%YMM7,%YMM9 |
(1000) 0x494c22 VFMADD231PD %YMM15,%YMM2,%YMM0 |
(1000) 0x494c27 VPERMT2PD %YMM14,%YMM5,%YMM10 |
(1000) 0x494c2d VMOVUPD -0x100(%R15),%YMM15 |
(1000) 0x494c36 VFMADD231PD %YMM9,%YMM2,%YMM11 |
(1000) 0x494c3b VFMADD132PD %YMM2,%YMM13,%YMM10 |
(1000) 0x494c40 VMOVUPD -0x120(%R15),%YMM2 |
(1000) 0x494c49 VMOVUPD -0x60(%RCX),%YMM9 |
(1000) 0x494c4e VMOVUPD -0x80(%R15),%YMM14 |
(1000) 0x494c54 VMOVAPD %YMM2,%YMM12 |
(1000) 0x494c58 VMOVAPD %YMM2,%YMM13 |
(1000) 0x494c5c VPERMT2PD %YMM15,%YMM4,%YMM2 |
(1000) 0x494c62 VPERMT2PD %YMM15,%YMM8,%YMM12 |
(1000) 0x494c68 VPERMT2PD %YMM15,%YMM6,%YMM13 |
(1000) 0x494c6e VPERMT2PD %YMM1,%YMM3,%YMM2 |
(1000) 0x494c74 VPERMT2PD %YMM1,%YMM7,%YMM12 |
(1000) 0x494c7a VFMADD132PD %YMM9,%YMM0,%YMM2 |
(1000) 0x494c7f VPERMT2PD %YMM1,%YMM5,%YMM13 |
(1000) 0x494c85 VMOVUPD -0xc0(%R15),%YMM1 |
(1000) 0x494c8e VFMADD132PD %YMM9,%YMM11,%YMM12 |
(1000) 0x494c93 VMOVAPD %YMM9,%YMM11 |
(1000) 0x494c98 VMOVUPD -0xa0(%R15),%YMM0 |
(1000) 0x494ca1 VMOVUPD -0x40(%RCX),%YMM9 |
(1000) 0x494ca6 VFMADD132PD %YMM13,%YMM10,%YMM11 |
(1000) 0x494cab VMOVAPD %YMM1,%YMM10 |
(1000) 0x494caf VMOVAPD %YMM1,%YMM15 |
(1000) 0x494cb3 VMOVUPD -0x20(%R15),%YMM13 |
(1000) 0x494cb9 VPERMT2PD %YMM0,%YMM8,%YMM10 |
(1000) 0x494cbf VPERMT2PD %YMM0,%YMM4,%YMM1 |
(1000) 0x494cc5 VPERMT2PD %YMM0,%YMM6,%YMM15 |
(1000) 0x494ccb VMOVUPD -0x60(%R15),%YMM0 |
(1000) 0x494cd1 VPERMT2PD %YMM14,%YMM7,%YMM10 |
(1000) 0x494cd7 VPERMT2PD %YMM14,%YMM3,%YMM1 |
(1000) 0x494cdd VPERMT2PD %YMM14,%YMM5,%YMM15 |
(1000) 0x494ce3 VMOVUPD -0x40(%R15),%YMM14 |
(1000) 0x494ce9 VFMADD132PD %YMM9,%YMM2,%YMM1 |
(1000) 0x494cee VMOVAPD %YMM10,%YMM2 |
(1000) 0x494cf2 VMOVUPD -0x20(%RCX),%YMM10 |
(1000) 0x494cf7 VFMADD132PD %YMM9,%YMM12,%YMM2 |
(1000) 0x494cfc VMOVAPD %YMM0,%YMM12 |
(1000) 0x494d00 VFMADD132PD %YMM15,%YMM11,%YMM9 |
(1000) 0x494d05 VMOVAPD %YMM0,%YMM11 |
(1000) 0x494d09 VPERMT2PD %YMM14,%YMM6,%YMM12 |
(1000) 0x494d0f VPERMT2PD %YMM14,%YMM8,%YMM11 |
(1000) 0x494d15 VPERMT2PD %YMM14,%YMM4,%YMM0 |
(1000) 0x494d1b VPERMT2PD %YMM13,%YMM5,%YMM12 |
(1000) 0x494d21 VPERMT2PD %YMM13,%YMM7,%YMM11 |
(1000) 0x494d27 VPERMT2PD %YMM13,%YMM3,%YMM0 |
(1000) 0x494d2d VMOVAPD %YMM10,%YMM13 |
(1000) 0x494d32 VFMADD132PD %YMM10,%YMM1,%YMM0 |
(1000) 0x494d37 VFMADD132PD %YMM10,%YMM2,%YMM11 |
(1000) 0x494d3c VFMADD132PD %YMM12,%YMM9,%YMM13 |
(1000) 0x494d41 CMP %R8,%RCX |
(1000) 0x494d44 JNE 494bcd |
(998) 0x494d4a VEXTRACTF64X2 $0x1,%YMM13,%XMM16 |
(998) 0x494d51 VEXTRACTF64X2 $0x1,%YMM11,%XMM17 |
(998) 0x494d58 MOV -0xdc(%RBP),%EAX |
(998) 0x494d5e VADDPD %XMM13,%XMM16,%XMM9 |
(998) 0x494d64 VADDPD %XMM11,%XMM17,%XMM1 |
(998) 0x494d6a VUNPCKHPD %XMM9,%XMM9,%XMM15 |
(998) 0x494d6f VUNPCKHPD %XMM1,%XMM1,%XMM2 |
(998) 0x494d73 VADDPD %XMM9,%XMM15,%XMM10 |
(998) 0x494d78 VEXTRACTF64X2 $0x1,%YMM0,%XMM15 |
(998) 0x494d7f VADDPD %XMM1,%XMM2,%XMM12 |
(998) 0x494d83 VADDPD %XMM0,%XMM15,%XMM14 |
(998) 0x494d87 VUNPCKHPD %XMM14,%XMM14,%XMM9 |
(998) 0x494d8c VADDPD %XMM14,%XMM9,%XMM1 |
(998) 0x494d91 VMOVSD %XMM1,%XMM1,%XMM14 |
(998) 0x494d95 VUNPCKLPD %XMM12,%XMM1,%XMM1 |
(998) 0x494d9a CMP %R14D,%EAX |
(998) 0x494d9d JE 4951b6 |
(998) 0x494da3 VADDPD %XMM15,%XMM0,%XMM15 |
(998) 0x494da8 VADDPD %XMM17,%XMM11,%XMM11 |
(998) 0x494dae MOV %EAX,%R13D |
(998) 0x494db1 VADDPD %XMM16,%XMM13,%XMM13 |
(998) 0x494db7 MOV %R14D,%ESI |
(998) 0x494dba SUB %R13D,%ESI |
(998) 0x494dbd CMP $0x1,%ESI |
(998) 0x494dc0 JE 494e41 |
(998) 0x494dc2 LEA (%RDI,%R13,1),%R15 |
(998) 0x494dc6 ADD %RBX,%R13 |
(998) 0x494dc9 LEA (%R15,%R15,2),%RCX |
(998) 0x494dcd MOV -0xc8(%RBP),%R15 |
(998) 0x494dd4 LEA (%R11,%RCX,8),%R8 |
(998) 0x494dd8 VMOVUPD (%R8),%XMM0 |
(998) 0x494ddd VMOVUPD 0x10(%R8),%XMM10 |
(998) 0x494de3 VMOVUPD 0x20(%R8),%XMM12 |
(998) 0x494de9 VMOVUPD (%R15,%R13,8),%XMM2 |
(998) 0x494def VPERMILPD $0x1,%XMM0,%XMM9 |
(998) 0x494df5 VUNPCKLPD %XMM0,%XMM10,%XMM14 |
(998) 0x494df9 VBLENDPD $0x2,%XMM10,%XMM0,%XMM0 |
(998) 0x494dff VUNPCKLPD %XMM12,%XMM9,%XMM1 |
(998) 0x494e04 VFMADD132PD %XMM2,%XMM15,%XMM0 |
(998) 0x494e09 VBLENDPD $0x2,%XMM12,%XMM14,%XMM12 |
(998) 0x494e0f VFMADD132PD %XMM2,%XMM11,%XMM1 |
(998) 0x494e14 VFMADD132PD %XMM12,%XMM13,%XMM2 |
(998) 0x494e19 VUNPCKHPD %XMM2,%XMM2,%XMM11 |
(998) 0x494e1d VUNPCKHPD %XMM1,%XMM1,%XMM13 |
(998) 0x494e21 VADDPD %XMM2,%XMM11,%XMM10 |
(998) 0x494e25 VUNPCKHPD %XMM0,%XMM0,%XMM2 |
(998) 0x494e29 VADDPD %XMM1,%XMM13,%XMM15 |
(998) 0x494e2d VADDPD %XMM0,%XMM2,%XMM9 |
(998) 0x494e31 VUNPCKLPD %XMM15,%XMM9,%XMM1 |
(998) 0x494e36 TEST $0x1,%SIL |
(998) 0x494e3a JE 494e65 |
(998) 0x494e3c AND $-0x2,%ESI |
(998) 0x494e3f ADD %ESI,%EAX |
(998) 0x494e41 CLTQ |
(998) 0x494e43 LEA (%RDI,%RAX,1),%R13 |
(998) 0x494e47 VMOVSD (%RDX,%RAX,8),%XMM12 |
(998) 0x494e4c VMOVDDUP (%RDX,%RAX,8),%XMM14 |
(998) 0x494e51 LEA (%R13,%R13,2),%RSI |
(998) 0x494e56 LEA (%R11,%RSI,8),%RCX |
(998) 0x494e5a VFMADD231PD (%RCX),%XMM14,%XMM1 |
(998) 0x494e5f VFMADD231SD 0x10(%RCX),%XMM12,%XMM10 |
(998) 0x494e65 MOV -0x110(%RBP),%RAX |
(998) 0x494e6c VUNPCKHPD %XMM1,%XMM1,%XMM12 |
(998) 0x494e70 VMOVSD %XMM1,%XMM1,%XMM14 |
(998) 0x494e74 MOV 0x158(%RAX),%R13 |
(998) 0x494e7b MOV 0x180(%RAX),%RCX |
(998) 0x494e82 IMUL %R10,%R13 |
(998) 0x494e86 CMPL $0x2,-0xe0(%RBP) |
(998) 0x494e8d LEA (,%R13,8),%R8 |
(998) 0x494e95 JBE 495218 |
(998) 0x494e9b MOV -0xd8(%RBP),%RSI |
(998) 0x494ea2 LEA (%RCX,%R8,1),%R15 |
(998) 0x494ea6 XOR %EAX,%EAX |
(998) 0x494ea8 VXORPD %XMM2,%XMM2,%XMM2 |
(998) 0x494eac SUB $0x20,%RSI |
(998) 0x494eb0 SHR $0x5,%RSI |
(998) 0x494eb4 INC %RSI |
(998) 0x494eb7 AND $0x7,%ESI |
(998) 0x494eba JE 494f7a |
(998) 0x494ec0 CMP $0x1,%RSI |
(998) 0x494ec4 JE 494f59 |
(998) 0x494eca CMP $0x2,%RSI |
(998) 0x494ece JE 494f46 |
(998) 0x494ed0 CMP $0x3,%RSI |
(998) 0x494ed4 JE 494f32 |
(998) 0x494ed6 CMP $0x4,%RSI |
(998) 0x494eda JE 494f1e |
(998) 0x494edc CMP $0x5,%RSI |
(998) 0x494ee0 JE 494f0a |
(998) 0x494ee2 CMP $0x6,%RSI |
(998) 0x494ee6 JE 494ef6 |
(998) 0x494ee8 VMOVUPD (%R15),%YMM0 |
(998) 0x494eed MOV $0x20,%EAX |
(998) 0x494ef2 VMULPD (%RDX),%YMM0,%YMM2 |
(998) 0x494ef6 VMOVUPD (%R15,%RAX,1),%YMM13 |
(998) 0x494efc VMULPD (%RDX,%RAX,1),%YMM13,%YMM15 |
(998) 0x494f01 ADD $0x20,%RAX |
(998) 0x494f05 VADDPD %YMM15,%YMM2,%YMM2 |
(998) 0x494f0a VMOVUPD (%R15,%RAX,1),%YMM9 |
(998) 0x494f10 VMULPD (%RDX,%RAX,1),%YMM9,%YMM11 |
(998) 0x494f15 ADD $0x20,%RAX |
(998) 0x494f19 VADDPD %YMM11,%YMM2,%YMM2 |
(998) 0x494f1e VMOVUPD (%R15,%RAX,1),%YMM0 |
(998) 0x494f24 VMULPD (%RDX,%RAX,1),%YMM0,%YMM13 |
(998) 0x494f29 ADD $0x20,%RAX |
(998) 0x494f2d VADDPD %YMM13,%YMM2,%YMM2 |
(998) 0x494f32 VMOVUPD (%R15,%RAX,1),%YMM15 |
(998) 0x494f38 VMULPD (%RDX,%RAX,1),%YMM15,%YMM9 |
(998) 0x494f3d ADD $0x20,%RAX |
(998) 0x494f41 VADDPD %YMM9,%YMM2,%YMM2 |
(998) 0x494f46 VMOVUPD (%R15,%RAX,1),%YMM11 |
(998) 0x494f4c VMULPD (%RDX,%RAX,1),%YMM11,%YMM0 |
(998) 0x494f51 ADD $0x20,%RAX |
(998) 0x494f55 VADDPD %YMM0,%YMM2,%YMM2 |
(998) 0x494f59 VMOVUPD (%R15,%RAX,1),%YMM13 |
(998) 0x494f5f VMULPD (%RDX,%RAX,1),%YMM13,%YMM15 |
(998) 0x494f64 ADD $0x20,%RAX |
(998) 0x494f68 VADDPD %YMM15,%YMM2,%YMM2 |
(998) 0x494f6d CMP %RAX,-0xd8(%RBP) |
(998) 0x494f74 JE 495033 |
(999) 0x494f7a VMOVUPD (%R15,%RAX,1),%YMM9 |
(999) 0x494f80 VMOVUPD 0x20(%R15,%RAX,1),%YMM0 |
(999) 0x494f87 VMULPD (%RDX,%RAX,1),%YMM9,%YMM11 |
(999) 0x494f8c VMOVUPD 0x40(%R15,%RAX,1),%YMM9 |
(999) 0x494f93 VMULPD 0x20(%RDX,%RAX,1),%YMM0,%YMM15 |
(999) 0x494f99 VMOVUPD 0x60(%R15,%RAX,1),%YMM0 |
(999) 0x494fa0 VADDPD %YMM11,%YMM2,%YMM13 |
(999) 0x494fa5 VMULPD 0x40(%RDX,%RAX,1),%YMM9,%YMM11 |
(999) 0x494fab VMOVUPD 0x80(%R15,%RAX,1),%YMM9 |
(999) 0x494fb5 VADDPD %YMM15,%YMM13,%YMM2 |
(999) 0x494fba VMULPD 0x60(%RDX,%RAX,1),%YMM0,%YMM15 |
(999) 0x494fc0 VMOVUPD 0xa0(%R15,%RAX,1),%YMM0 |
(999) 0x494fca VADDPD %YMM11,%YMM2,%YMM13 |
(999) 0x494fcf VMULPD 0x80(%RDX,%RAX,1),%YMM9,%YMM11 |
(999) 0x494fd8 VMOVUPD 0xc0(%R15,%RAX,1),%YMM9 |
(999) 0x494fe2 VADDPD %YMM15,%YMM13,%YMM2 |
(999) 0x494fe7 VMULPD 0xa0(%RDX,%RAX,1),%YMM0,%YMM15 |
(999) 0x494ff0 VMOVUPD 0xe0(%R15,%RAX,1),%YMM0 |
(999) 0x494ffa VADDPD %YMM11,%YMM2,%YMM13 |
(999) 0x494fff VMULPD 0xc0(%RDX,%RAX,1),%YMM9,%YMM11 |
(999) 0x495008 VADDPD %YMM15,%YMM13,%YMM2 |
(999) 0x49500d VMULPD 0xe0(%RDX,%RAX,1),%YMM0,%YMM15 |
(999) 0x495016 ADD $0x100,%RAX |
(999) 0x49501c VADDPD %YMM11,%YMM2,%YMM13 |
(999) 0x495021 VADDPD %YMM15,%YMM13,%YMM2 |
(999) 0x495026 CMP %RAX,-0xd8(%RBP) |
(999) 0x49502d JNE 494f7a |
(998) 0x495033 VEXTRACTF64X2 $0x1,%YMM2,%XMM9 |
(998) 0x49503a MOV -0xdc(%RBP),%EAX |
(998) 0x495040 VADDPD %XMM2,%XMM9,%XMM11 |
(998) 0x495044 VUNPCKHPD %XMM11,%XMM11,%XMM13 |
(998) 0x495049 VADDPD %XMM11,%XMM13,%XMM0 |
(998) 0x49504e CMP %R14D,%EAX |
(998) 0x495051 JE 4950b6 |
(998) 0x495053 VADDPD %XMM2,%XMM9,%XMM11 |
(998) 0x495057 MOV %EAX,%ESI |
(998) 0x495059 MOV %R14D,%R15D |
(998) 0x49505c SUB %ESI,%R15D |
(998) 0x49505f MOV %R15D,-0xd0(%RBP) |
(998) 0x495066 CMP $0x1,%R15D |
(998) 0x49506a JE 4950a6 |
(998) 0x49506c LEA (%R13,%RSI,1),%R15 |
(998) 0x495071 MOV -0xc8(%RBP),%R13 |
(998) 0x495078 ADD %RBX,%RSI |
(998) 0x49507b VMOVUPD (%RCX,%R15,8),%XMM2 |
(998) 0x495081 VFMADD231PD (%R13,%RSI,8),%XMM2,%XMM11 |
(998) 0x495088 VUNPCKHPD %XMM11,%XMM11,%XMM0 |
(998) 0x49508d VADDPD %XMM11,%XMM0,%XMM0 |
(998) 0x495092 TESTB $0x1,-0xd0(%RBP) |
(998) 0x495099 JE 4950b6 |
(998) 0x49509b MOV -0xd0(%RBP),%ESI |
(998) 0x4950a1 AND $-0x2,%ESI |
(998) 0x4950a4 ADD %ESI,%EAX |
(998) 0x4950a6 CLTQ |
(998) 0x4950a8 ADD %R8,%RCX |
(998) 0x4950ab VMOVSD (%RCX,%RAX,8),%XMM15 |
(998) 0x4950b0 VFMADD231SD (%RDX,%RAX,8),%XMM15,%XMM0 |
(998) 0x4950b6 VMULSD %XMM14,%XMM14,%XMM14 |
(998) 0x4950bb VMULSD %XMM12,%XMM12,%XMM12 |
(998) 0x4950c0 VMULSD %XMM10,%XMM10,%XMM2 |
(998) 0x4950c5 VADDPD (%R9),%XMM1,%XMM1 |
(998) 0x4950ca VADDSD 0x10(%R9),%XMM10,%XMM10 |
(998) 0x4950d0 ADD $0x18,%R9 |
(998) 0x4950d4 MOV -0x100(%RBP),%RDX |
(998) 0x4950db VADDSD %XMM12,%XMM14,%XMM14 |
(998) 0x4950e0 MOV -0x108(%RBP),%R8 |
(998) 0x4950e7 MOV -0xf8(%RBP),%RCX |
(998) 0x4950ee MOV -0xf0(%RBP),%RAX |
(998) 0x4950f5 VMOVUPD %XMM1,-0x18(%R9) |
(998) 0x4950fb ADD %R8,%R12 |
(998) 0x4950fe VMOVSD %XMM10,-0x8(%R9) |
(998) 0x495104 ADD %RCX,%RDI |
(998) 0x495107 ADD %RAX,%RBX |
(998) 0x49510a VADDSD (%RDX,%R10,8),%XMM0,%XMM9 |
(998) 0x495110 VSUBSD %XMM14,%XMM9,%XMM12 |
(998) 0x495115 VSUBSD %XMM2,%XMM12,%XMM11 |
(998) 0x495119 VMOVSD %XMM11,(%RDX,%R10,8) |
(998) 0x49511f INC %R10 |
(998) 0x495122 CMP %R10,-0xe8(%RBP) |
(998) 0x495129 JNE 494a50 |
0x49512f MOV -0x110(%RBP),%R15 |
0x495136 VZEROUPPER |
0x495139 VMOVSD 0x10(%R15),%XMM0 |
0x49513f LEA -0x30(%RBP),%RSP |
0x495143 POP %RBX |
0x495144 POP %RAX |
0x495145 POP %R12 |
0x495147 POP %R13 |
0x495149 POP %R14 |
0x49514b POP %R15 |
0x49514d POP %RBP |
0x49514e LEA -0x8(%RAX),%RSP |
0x495152 RET |
0x495153 NOPL (%RAX,%RAX,1) |
(1001) 0x495158 MOV -0xa8(%RBP),%RDI |
(1001) 0x49515f LEA (,%R10,8),%RSI |
(1001) 0x495167 INC %RBX |
(1001) 0x49516a CALL 404060 <_ZdlPvm@plt> |
(1001) 0x49516f CMP %R13,%RBX |
(1001) 0x495172 JNE 4947f0 |
0x495178 JMP 494911 |
0x49517d NOPL (%RAX) |
(1001) 0x495180 LEA (%R9,%R9,2),%RSI |
(1001) 0x495184 MOV -0x78(%RBP),%RDI |
(1001) 0x495188 SAL $0x3,%RSI |
(1001) 0x49518c CALL 404060 <_ZdlPvm@plt> |
(1001) 0x495191 JMP 4948ea |
0x495196 NOPW %CS:(%RAX,%RAX,1) |
(1001) 0x4951a0 MOV -0x48(%RBP),%RDI |
(1001) 0x4951a4 LEA (,%RSI,8),%RSI |
(1001) 0x4951ac CALL 404060 <_ZdlPvm@plt> |
(1001) 0x4951b1 JMP 4948d2 |
(998) 0x4951b6 MOV -0x110(%RBP),%R13 |
(998) 0x4951bd MOV 0x180(%R13),%RCX |
(998) 0x4951c4 MOV 0x158(%R13),%R13 |
(998) 0x4951cb IMUL %R10,%R13 |
(998) 0x4951cf LEA (,%R13,8),%R8 |
(998) 0x4951d7 JMP 494e9b |
(998) 0x4951dc VXORPD %XMM2,%XMM2,%XMM2 |
(998) 0x4951e0 VXORPD %XMM1,%XMM1,%XMM1 |
(998) 0x4951e4 VMOVSD %XMM2,%XMM2,%XMM12 |
(998) 0x4951e8 VMOVSD %XMM2,%XMM2,%XMM14 |
(998) 0x4951ec VMOVSD %XMM2,%XMM2,%XMM10 |
(998) 0x4951f0 VMOVSD %XMM2,%XMM2,%XMM0 |
(998) 0x4951f4 JMP 4950c5 |
(998) 0x4951f9 VXORPD %XMM1,%XMM1,%XMM1 |
(998) 0x4951fd XOR %R13D,%R13D |
(998) 0x495200 VXORPD %XMM10,%XMM10,%XMM10 |
(998) 0x495205 XOR %EAX,%EAX |
(998) 0x495207 VMOVAPD %XMM1,%XMM13 |
(998) 0x49520b VMOVAPD %XMM1,%XMM11 |
(998) 0x49520f VMOVAPD %XMM1,%XMM15 |
(998) 0x495213 JMP 494db7 |
(998) 0x495218 VXORPD %XMM11,%XMM11,%XMM11 |
(998) 0x49521d XOR %ESI,%ESI |
(998) 0x49521f VXORPD %XMM0,%XMM0,%XMM0 |
(998) 0x495223 XOR %EAX,%EAX |
(998) 0x495225 JMP 495059 |
0x49522a MOV 0xc0(%R15),%R11 |
0x495231 VMOVSD 0xf87f7(%RIP),%XMM8 |
0x495239 VXORPD %XMM6,%XMM6,%XMM6 |
0x49523d MOV 0x100(%R15),%R14 |
0x495244 VMOVSD (%R11),%XMM0 |
0x495249 VDIVSD %XMM0,%XMM8,%XMM7 |
0x49524d VCOMISD %XMM0,%XMM6 |
0x495251 VMOVSD %XMM7,(%R14) |
0x495256 JA 495330 |
0x49525c CALL 4041a0 <__log_finite@plt> |
0x495261 VXORPD %XMM5,%XMM5,%XMM5 |
0x495265 VUNPCKLPD %XMM5,%XMM0,%XMM4 |
0x495269 VMOVUPD %XMM4,0x10(%R15) |
0x49526f VMOVSD (%R14),%XMM13 |
0x495274 MOV 0x140(%R15),%R9 |
0x49527b MOV -0xd0(%RBP),%RDI |
0x495282 MOVSXD 0x478(%R15),%R12 |
0x495289 VMOVDDUP %XMM13,%XMM3 |
0x49528e MOV -0x100(%RBP),%RDX |
0x495295 MOV 0x180(%R15),%RSI |
0x49529c VMULPD (%R9),%XMM3,%XMM0 |
0x4952a1 MOV 0x18(%RDI),%R10 |
0x4952a5 LEA (%R12,%R12,2),%RBX |
0x4952a9 VMULSD 0x10(%R9),%XMM13,%XMM2 |
0x4952af MOV 0x18(%RDX),%R8 |
0x4952b3 LEA (%R10,%RBX,8),%R13 |
0x4952b7 LEA (%R8,%R12,8),%RCX |
0x4952bb VADDPD (%R13),%XMM0,%XMM1 |
0x4952c1 VUNPCKHPD %XMM0,%XMM0,%XMM15 |
0x4952c5 VMOVSD %XMM0,%XMM0,%XMM10 |
0x4952c9 VADDSD 0x10(%R13),%XMM2,%XMM9 |
0x4952cf VMULSD %XMM15,%XMM15,%XMM14 |
0x4952d4 VMOVUPD %XMM1,(%R13) |
0x4952da VMOVSD %XMM9,0x10(%R13) |
0x4952e0 VMOVSD (%RCX),%XMM12 |
0x4952e4 VFMADD132SD %XMM0,%XMM14,%XMM10 |
0x4952e9 VFMADD132SD (%RSI),%XMM12,%XMM13 |
0x4952ee VSUBSD %XMM10,%XMM13,%XMM11 |
0x4952f3 VFNMADD132SD %XMM2,%XMM11,%XMM2 |
0x4952f8 VMOVSD %XMM2,(%RCX) |
0x4952fc JMP 495139 |
0x495301 SUB $0x8,%RSP |
0x495305 LEA 0x150(%R15),%RDX |
0x49530c MOV -0xc8(%RBP),%RSI |
0x495313 MOV %RDI,%R8 |
0x495316 PUSH %RDX |
0x495317 LEA 0x110(%R15),%R9 |
0x49531e MOV %R14D,%EDX |
0x495321 MOV %R13D,%ECX |
0x495324 MOV %R12,%RDI |
0x495327 CALL %RBX |
0x495329 POP %RAX |
0x49532a POP %RDX |
0x49532b JMP 494911 |
0x495330 VXORPD 0xf6988(%RIP),%XMM0,%XMM0 |
0x495338 CALL 4041a0 <__log_finite@plt> |
0x49533d VMOVSD 0xf86f3(%RIP),%XMM5 |
0x495345 JMP 495265 |
0x49534a MOV 0x100(%R15),%R14 |
0x495351 JMP 49526f |
0x495356 MOV %RAX,%R15 |
0x495359 MOV -0x50(%RBP),%R12 |
0x49535d MOVQ $0x58c7c8,-0x60(%RBP) |
0x495365 TEST %R12,%R12 |
0x495368 JE 4953d2 |
0x49536a MOV -0x48(%RBP),%RDI |
0x49536e LEA (,%R12,8),%RSI |
0x495376 VZEROUPPER |
0x495379 CALL 404060 <_ZdlPvm@plt> |
(997) 0x49537e MOV -0x80(%RBP),%R13 |
(997) 0x495382 MOVQ $0x58bc98,-0x90(%RBP) |
(997) 0x49538d TEST %R13,%R13 |
(997) 0x495390 JE 49539f |
(997) 0x495392 IMUL $0x18,%R13,%RSI |
(997) 0x495396 MOV -0x78(%RBP),%RDI |
(997) 0x49539a CALL 404060 <_ZdlPvm@plt> |
(997) 0x49539f MOV -0xb0(%RBP),%R14 |
(997) 0x4953a6 MOVQ $0x58c7c8,-0xc0(%RBP) |
(997) 0x4953b1 TEST %R14,%R14 |
(997) 0x4953b4 JE 4953ca |
(997) 0x4953b6 MOV -0xa8(%RBP),%RDI |
(997) 0x4953bd LEA (,%R14,8),%RSI |
(997) 0x4953c5 CALL 404060 <_ZdlPvm@plt> |
(997) 0x4953ca MOV %R15,%RDI |
(997) 0x4953cd CALL 404230 <_Unwind_Resume@plt> |
(997) 0x4953d2 VZEROUPPER |
(997) 0x4953d5 JMP 49537e |
0x4953d7 NOPW (%RAX,%RAX,1) |
Path / |
Source file and lines | DiracDeterminantRef.cpp:231-273 |
Module | exec |
nb instructions | 175 |
nb uops | 185 |
loop length | 871 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 16 |
used ymm registers | 6 |
used zmm registers | 0 |
nb stack references | 16 |
ADD-SUB / MUL ratio | 1.00 |
micro-operation queue | 30.83 cycles |
front end | 30.83 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 7.80 | 7.70 | 21.00 | 21.00 | 18.00 | 7.90 | 7.80 | 18.00 | 18.00 | 18.00 | 7.80 | 21.00 |
cycles | 7.80 | 7.70 | 21.00 | 21.00 | 18.00 | 7.90 | 7.80 | 18.00 | 18.00 | 18.00 | 7.80 | 21.00 |
Cycles executing div or sqrt instructions | 4.00 |
FE+BE cycles | 29.83-29.87 |
Stall cycles | 0.00 |
Front-end | 30.83 |
Dispatch | 21.00 |
DIV/SQRT | 4.00 |
Overall L1 | 30.83 |
all | 28% |
load | 85% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 28% |
all | 24% |
load | 25% |
store | 40% |
mul | 33% |
add-sub | 33% |
fma | 0% |
div/sqrt | 0% |
other | 37% |
all | 26% |
load | 47% |
store | 10% |
mul | 33% |
add-sub | 33% |
fma | 0% |
div/sqrt | 0% |
other | 33% |
all | 19% |
load | 43% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 15% |
load | 15% |
store | 17% |
mul | 16% |
add-sub | 16% |
fma | 12% |
div/sqrt | 12% |
other | 17% |
all | 17% |
load | 25% |
store | 12% |
mul | 16% |
add-sub | 16% |
fma | 12% |
div/sqrt | 12% |
other | 15% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
LEA 0x8(%RSP),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
PUSHQ -0x8(%R10) | 2 | 0 | 0 | 0.33 | 0.33 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0.33 | 5-12 | 0.62 |
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RDI,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R10 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0xe0,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RSI,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x468(%RDI),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x100(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 50f9a0 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE5startEv> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x470(%R15),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x90(%R15),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x47c(%R15),%R13D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDI,-0xd8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x478(%R15),%R14D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R12),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x28(%RAX),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x475470,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 495301 <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0xba1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R14D,%R13D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 494911 <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0x1b1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SUB %R14D,%R13D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x468(%R15),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 50fbd0 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE4stopEv> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
CMPL $0x1,0x484(%R15) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 49522a <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0xaca> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xd8(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0xd0(%R15),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 492b60 <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE10invertPsiMERKNS1_6MatrixIdSaIdEEERS7_> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x484(%R15),%EDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x1,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JE 49534a <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0xbea> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVSXD 0x478(%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %EDI,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 495139 <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0x9d9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xd0(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RAX,%RAX,2),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x480(%R15),%R14D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x110(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x100(%R15),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xd8(%R15),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVSXD %EDI,%RDI | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
MOV 0x18(%R12),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x118(%R15),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDI,-0xe8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x140(%R15),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVDQA 0xf90f2(%RIP),%YMM8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV %RCX,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14D,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA (%R13,%R8,8),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x100(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SHR $0x2,%ECX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R14D,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SAL $0x5,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
LEA (%RBX,%RBX,2),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RBX,-0xf8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x18(%R8),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
AND $-0x4,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %RCX,-0xd8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (,%RSI,8),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %EDX,-0xdc(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA -0x1(%R14),%EBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
VMOVDQA 0xf90b8(%RIP),%YMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV %R11,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA (%R13,%RAX,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDQA 0xf90c8(%RIP),%YMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVDQA 0xf90e0(%RIP),%YMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV %R10,-0x108(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVDQA 0xf88d1(%RIP),%YMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVDQA 0xf88e9(%RIP),%YMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV %RAX,-0x100(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %R10D,%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %EBX,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x110(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
VMOVSD 0x10(%R15),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x30(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
LEA -0x8(%RAX),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 494911 <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0x1b1> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xc0(%R15),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0xf87f7(%RIP),%XMM8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VXORPD %XMM6,%XMM6,%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x100(%R15),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD (%R11),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VDIVSD %XMM0,%XMM8,%XMM7 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 13-15 | 4 |
VCOMISD %XMM0,%XMM6 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVSD %XMM7,(%R14) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JA 495330 <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0xbd0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CALL 4041a0 <__log_finite@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VXORPD %XMM5,%XMM5,%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUNPCKLPD %XMM5,%XMM0,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VMOVUPD %XMM4,0x10(%R15) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD (%R14),%XMM13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x140(%R15),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xd0(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVSXD 0x478(%R15),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVDDUP %XMM13,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV -0x100(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x180(%R15),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULPD (%R9),%XMM3,%XMM0 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
MOV 0x18(%RDI),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R12,%R12,2),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMULSD 0x10(%R9),%XMM13,%XMM2 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
MOV 0x18(%RDX),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R10,%RBX,8),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R8,%R12,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VADDPD (%R13),%XMM0,%XMM1 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VUNPCKHPD %XMM0,%XMM0,%XMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VMOVSD %XMM0,%XMM0,%XMM10 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VADDSD 0x10(%R13),%XMM2,%XMM9 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMULSD %XMM15,%XMM15,%XMM14 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVUPD %XMM1,(%R13) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD %XMM9,0x10(%R13) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD (%RCX),%XMM12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VFMADD132SD %XMM0,%XMM14,%XMM10 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD132SD (%RSI),%XMM12,%XMM13 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VSUBSD %XMM10,%XMM13,%XMM11 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VFNMADD132SD %XMM2,%XMM11,%XMM2 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM2,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 495139 <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0x9d9> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0x150(%R15),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0xc8(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDI,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %RDX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
LEA 0x110(%R15),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14D,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R13D,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL %RBX | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 2.14 |
POP %RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
JMP 494911 <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0x1b1> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
VXORPD 0xf6988(%RIP),%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
CALL 4041a0 <__log_finite@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0xf86f3(%RIP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 495265 <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0xb05> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV 0x100(%R15),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 49526f <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0xb0f> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x50(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0x58c7c8,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 4953d2 <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0xc72> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x48(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (,%R12,8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 404060 <_ZdlPvm@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | DiracDeterminantRef.cpp:231-273 |
Module | exec |
nb instructions | 175 |
nb uops | 185 |
loop length | 871 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 16 |
used ymm registers | 6 |
used zmm registers | 0 |
nb stack references | 16 |
ADD-SUB / MUL ratio | 1.00 |
micro-operation queue | 30.83 cycles |
front end | 30.83 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 7.80 | 7.70 | 21.00 | 21.00 | 18.00 | 7.90 | 7.80 | 18.00 | 18.00 | 18.00 | 7.80 | 21.00 |
cycles | 7.80 | 7.70 | 21.00 | 21.00 | 18.00 | 7.90 | 7.80 | 18.00 | 18.00 | 18.00 | 7.80 | 21.00 |
Cycles executing div or sqrt instructions | 4.00 |
FE+BE cycles | 29.83-29.87 |
Stall cycles | 0.00 |
Front-end | 30.83 |
Dispatch | 21.00 |
DIV/SQRT | 4.00 |
Overall L1 | 30.83 |
all | 28% |
load | 85% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 28% |
all | 24% |
load | 25% |
store | 40% |
mul | 33% |
add-sub | 33% |
fma | 0% |
div/sqrt | 0% |
other | 37% |
all | 26% |
load | 47% |
store | 10% |
mul | 33% |
add-sub | 33% |
fma | 0% |
div/sqrt | 0% |
other | 33% |
all | 19% |
load | 43% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 15% |
load | 15% |
store | 17% |
mul | 16% |
add-sub | 16% |
fma | 12% |
div/sqrt | 12% |
other | 17% |
all | 17% |
load | 25% |
store | 12% |
mul | 16% |
add-sub | 16% |
fma | 12% |
div/sqrt | 12% |
other | 15% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
LEA 0x8(%RSP),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
PUSHQ -0x8(%R10) | 2 | 0 | 0 | 0.33 | 0.33 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0.33 | 5-12 | 0.62 |
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RDI,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R10 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0xe0,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RSI,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x468(%RDI),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x100(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 50f9a0 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE5startEv> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x470(%R15),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x90(%R15),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x47c(%R15),%R13D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDI,-0xd8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x478(%R15),%R14D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R12),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x28(%RAX),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x475470,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 495301 <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0xba1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R14D,%R13D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 494911 <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0x1b1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SUB %R14D,%R13D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x468(%R15),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 50fbd0 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE4stopEv> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
CMPL $0x1,0x484(%R15) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 49522a <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0xaca> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xd8(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0xd0(%R15),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 492b60 <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE10invertPsiMERKNS1_6MatrixIdSaIdEEERS7_> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x484(%R15),%EDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x1,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JE 49534a <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0xbea> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVSXD 0x478(%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %EDI,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 495139 <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0x9d9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xd0(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RAX,%RAX,2),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x480(%R15),%R14D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x110(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x100(%R15),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xd8(%R15),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVSXD %EDI,%RDI | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
MOV 0x18(%R12),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x118(%R15),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDI,-0xe8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x140(%R15),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVDQA 0xf90f2(%RIP),%YMM8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV %RCX,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14D,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA (%R13,%R8,8),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x100(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SHR $0x2,%ECX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R14D,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SAL $0x5,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
LEA (%RBX,%RBX,2),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RBX,-0xf8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x18(%R8),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
AND $-0x4,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %RCX,-0xd8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (,%RSI,8),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %EDX,-0xdc(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA -0x1(%R14),%EBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
VMOVDQA 0xf90b8(%RIP),%YMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV %R11,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA (%R13,%RAX,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDQA 0xf90c8(%RIP),%YMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVDQA 0xf90e0(%RIP),%YMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV %R10,-0x108(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVDQA 0xf88d1(%RIP),%YMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVDQA 0xf88e9(%RIP),%YMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV %RAX,-0x100(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %R10D,%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %EBX,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x110(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
VMOVSD 0x10(%R15),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x30(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
LEA -0x8(%RAX),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 494911 <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0x1b1> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xc0(%R15),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0xf87f7(%RIP),%XMM8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VXORPD %XMM6,%XMM6,%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x100(%R15),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD (%R11),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VDIVSD %XMM0,%XMM8,%XMM7 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 13-15 | 4 |
VCOMISD %XMM0,%XMM6 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVSD %XMM7,(%R14) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JA 495330 <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0xbd0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CALL 4041a0 <__log_finite@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VXORPD %XMM5,%XMM5,%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUNPCKLPD %XMM5,%XMM0,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VMOVUPD %XMM4,0x10(%R15) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD (%R14),%XMM13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x140(%R15),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xd0(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVSXD 0x478(%R15),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVDDUP %XMM13,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV -0x100(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x180(%R15),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULPD (%R9),%XMM3,%XMM0 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
MOV 0x18(%RDI),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R12,%R12,2),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMULSD 0x10(%R9),%XMM13,%XMM2 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
MOV 0x18(%RDX),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R10,%RBX,8),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R8,%R12,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VADDPD (%R13),%XMM0,%XMM1 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VUNPCKHPD %XMM0,%XMM0,%XMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VMOVSD %XMM0,%XMM0,%XMM10 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VADDSD 0x10(%R13),%XMM2,%XMM9 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMULSD %XMM15,%XMM15,%XMM14 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVUPD %XMM1,(%R13) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD %XMM9,0x10(%R13) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD (%RCX),%XMM12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VFMADD132SD %XMM0,%XMM14,%XMM10 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD132SD (%RSI),%XMM12,%XMM13 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VSUBSD %XMM10,%XMM13,%XMM11 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VFNMADD132SD %XMM2,%XMM11,%XMM2 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM2,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 495139 <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0x9d9> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0x150(%R15),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0xc8(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDI,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %RDX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
LEA 0x110(%R15),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14D,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R13D,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL %RBX | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 2.14 |
POP %RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
JMP 494911 <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0x1b1> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
VXORPD 0xf6988(%RIP),%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
CALL 4041a0 <__log_finite@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0xf86f3(%RIP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 495265 <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0xb05> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV 0x100(%R15),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 49526f <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0xb0f> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x50(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0x58c7c8,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 4953d2 <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0xc72> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x48(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (,%R12,8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 404060 <_ZdlPvm@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼miniqmcreference::DiracDeterminantRef | 0.08 | 0.08 |
▼Loop 998 - DiracDeterminantRef.cpp:247-252 - exec– | 0 | 0 |
○Loop 1000 - inner_product.hpp:155-155 - exec | 0.06 | 0.05 |
○Loop 999 - inner_product.hpp:82-83 - exec | 0.02 | 0.02 |
○Loop 997 - new_allocator.h:100-168 - exec | 0 | 0 |
○Loop 1001 - SPOSet.h:106-111 - exec | 0 | 0 |