Function: miniqmcreference::DiracDeterminantRef<qmcplusplus::DelayedUpdate<double, double> >::evalua ... | Module: libqmcwfs.so | Source: DiracDeterminantRef.cpp:235-255 [...] | Coverage: 0.14% |
---|
Function: miniqmcreference::DiracDeterminantRef<qmcplusplus::DelayedUpdate<double, double> >::evalua ... | Module: libqmcwfs.so | Source: DiracDeterminantRef.cpp:235-255 [...] | Coverage: 0.14% |
---|
/home/kcamus/qaas_runs/170-254-9426/intel/miniqmc/build/miniqmc/src/Numerics/PETE/OperatorTags.h: 63 - 94 |
-------------------------------------------------------------------------------- |
63: return (a * b); |
[...] |
94: (const_cast<T1&>(a) += b); |
/home/kcamus/qaas_runs/170-254-9426/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/OhmmsMatrix.h: 217 - 217 |
-------------------------------------------------------------------------------- |
217: inline Type_t* operator[](size_type i) { return X.data() + i * D2; } |
/home/kcamus/qaas_runs/170-254-9426/intel/miniqmc/build/miniqmc/src/Platforms/CPU/SIMD/inner_product.hpp: 82 - 155 |
-------------------------------------------------------------------------------- |
82: for (int i = 0; i < n; i++) |
83: res += a[i] * b[i]; |
[...] |
155: for (int i = 0; i < n; i++) |
/home/kcamus/qaas_runs/170-254-9426/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/TinyVectorOps.h: 129 - 131 |
-------------------------------------------------------------------------------- |
129: Type_t res = lhs[0] * rhs[0]; |
130: for (unsigned d = 1; d < D; ++d) |
131: res += lhs[d] * rhs[d]; |
/home/kcamus/qaas_runs/170-254-9426/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/OhmmsVector.h: 223 - 223 |
-------------------------------------------------------------------------------- |
223: return X[i]; |
/home/kcamus/qaas_runs/170-254-9426/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/DiracDeterminantRef.cpp: 235 - 255 |
-------------------------------------------------------------------------------- |
235: { |
236: recompute(P); |
237: |
238: if (NumPtcls == 1) |
239: { |
240: ValueType y = psiM(0, 0); |
241: GradType rv = y * dpsiM(0, 0); |
242: G[FirstIndex] += rv; |
243: L[FirstIndex] += y * d2psiM(0, 0) - dot(rv, rv); |
244: } |
245: else |
246: { |
247: for (int i = 0, iat = FirstIndex; i < NumPtcls; i++, iat++) |
248: { |
249: mGradType rv = simd::dot(psiM[i], dpsiM[i], NumOrbitals); |
250: mValueType lap = simd::dot(psiM[i], d2psiM[i], NumOrbitals); |
251: G[iat] += rv; |
252: L[iat] += lap - dot(rv, rv); |
253: } |
254: } |
255: return LogValue; |
0x4bd00 PUSH %RBP |
0x4bd01 MOV %RSP,%RBP |
0x4bd04 PUSH %R15 |
0x4bd06 PUSH %R14 |
0x4bd08 PUSH %R13 |
0x4bd0a PUSH %R12 |
0x4bd0c PUSH %RBX |
0x4bd0d SUB $0x38,%RSP |
0x4bd11 MOV %RCX,%R12 |
0x4bd14 MOV %RDX,%R15 |
0x4bd17 MOV %RDI,%RBX |
0x4bd1a CALL 4ecb0 <@plt_start@+0x600> |
0x4bd1f MOV 0x484(%RBX),%R10D |
0x4bd26 CMP $0x1,%R10 |
0x4bd2a JNE 4bd9f |
0x4bd2c MOV 0x100(%RBX),%RAX |
0x4bd33 MOV 0x140(%RBX),%RCX |
0x4bd3a MOV 0x18(%R15),%RDX |
0x4bd3e VMOVDDUP (%RAX),%XMM0 |
0x4bd42 MOVSXD 0x478(%RBX),%RAX |
0x4bd49 VMULPD (%RCX),%XMM0,%XMM2 |
0x4bd4d VMULSD 0x10(%RCX),%XMM0,%XMM1 |
0x4bd52 LEA (%RAX,%RAX,2),%RSI |
0x4bd56 VADDPD (%RDX,%RSI,8),%XMM2,%XMM3 |
0x4bd5b VMULPD %XMM2,%XMM2,%XMM2 |
0x4bd5f VMOVUPD %XMM3,(%RDX,%RSI,8) |
0x4bd64 VADDSD 0x10(%RDX,%RSI,8),%XMM1,%XMM3 |
0x4bd6a VMOVSD %XMM3,0x10(%RDX,%RSI,8) |
0x4bd70 VPERMILPD $0x1,%XMM2,%XMM3 |
0x4bd76 MOV 0x180(%RBX),%RCX |
0x4bd7d VADDSD %XMM2,%XMM3,%XMM2 |
0x4bd81 MOV 0x18(%R12),%RDX |
0x4bd86 VFMADD231SD %XMM1,%XMM1,%XMM2 |
0x4bd8b VFMSUB231SD (%RCX),%XMM0,%XMM2 |
0x4bd90 VADDSD (%RDX,%RAX,8),%XMM2,%XMM0 |
0x4bd95 VMOVSD %XMM0,(%RDX,%RAX,8) |
0x4bd9a JMP 4c44d |
0x4bd9f TEST %R10D,%R10D |
0x4bda2 JLE 4c44d |
0x4bda8 MOV 0x118(%RBX),%RAX |
0x4bdaf VMOVAPD -0x439b7(%RIP),%YMM1 |
0x4bdb7 VMOVAPD -0x43a3f(%RIP),%YMM2 |
0x4bdbf VMOVAPD -0x43a27(%RIP),%YMM3 |
0x4bdc7 VMOVAPD -0x42c91(%RIP),%ZMM4 |
0x4bdd1 VMOVAPD -0x42c5b(%RIP),%ZMM5 |
0x4bddb VMOVAPD -0x42c25(%RIP),%ZMM6 |
0x4bde5 VMOVAPD -0x42bef(%RIP),%ZMM7 |
0x4bdef VMOVAPD -0x42bb9(%RIP),%ZMM8 |
0x4bdf9 VMOVAPD -0x42b83(%RIP),%ZMM9 |
0x4be03 MOV 0x480(%RBX),%R8D |
0x4be0a MOV 0x18(%R15),%R11 |
0x4be0e MOV 0x18(%R12),%R15 |
0x4be13 MOV 0xd8(%RBX),%RDI |
0x4be1a MOV 0x158(%RBX),%R14 |
0x4be21 MOV 0x100(%RBX),%RSI |
0x4be28 MOV 0x180(%RBX),%R9 |
0x4be2f MOVSXD 0x478(%RBX),%RCX |
0x4be36 MOV 0x140(%RBX),%RDX |
0x4be3d VXORPD %XMM0,%XMM0,%XMM0 |
0x4be41 MOV %R10,-0x30(%RBP) |
0x4be45 SAL $0x3,%RAX |
0x4be49 MOV %R8,%R13 |
0x4be4c SHR $0x5,%R13 |
0x4be50 MOV %R15,-0x48(%RBP) |
0x4be54 MOV %R8D,%R15D |
0x4be57 AND $-0x20,%R15D |
0x4be5b MOV %R8D,%R12D |
0x4be5e SAL $0x3,%RDI |
0x4be62 SAL $0x3,%R14 |
0x4be66 AND $-0x4,%R12D |
0x4be6a LEA (%RAX,%RAX,2),%RAX |
0x4be6e MOV %R15,-0x38(%RBP) |
0x4be72 SAL $0x8,%R13 |
0x4be76 LEA 0xc0(%R9),%R15 |
0x4be7d MOV %R14,-0x50(%RBP) |
0x4be81 MOV %RDI,-0x58(%RBP) |
0x4be85 XOR %R14D,%R14D |
0x4be88 MOV %RAX,-0x40(%RBP) |
0x4be8c LEA 0xc0(%RSI),%RAX |
0x4be93 JMP 4bf1c |
0x4be98 NOPL (%RAX,%RAX,1) |
(894) 0x4bea0 VXORPD %XMM10,%XMM10,%XMM10 |
(894) 0x4bea5 VXORPD %XMM12,%XMM12,%XMM12 |
(894) 0x4beaa VXORPD %XMM11,%XMM11,%XMM11 |
(894) 0x4beaf LEA (%RCX,%RCX,2),%RDI |
(894) 0x4beb3 ADD -0x40(%RBP),%RDX |
(894) 0x4beb7 INC %R14 |
(894) 0x4beba VADDPD (%R11,%RDI,8),%XMM11,%XMM13 |
(894) 0x4bec0 VMULPD %XMM11,%XMM11,%XMM11 |
(894) 0x4bec5 VMOVUPD %XMM13,(%R11,%RDI,8) |
(894) 0x4becb VADDSD 0x10(%R11,%RDI,8),%XMM10,%XMM13 |
(894) 0x4bed2 VMOVSD %XMM13,0x10(%R11,%RDI,8) |
(894) 0x4bed9 VPERMILPD $0x1,%XMM11,%XMM13 |
(894) 0x4bedf MOV -0x48(%RBP),%RDI |
(894) 0x4bee3 VADDSD %XMM11,%XMM13,%XMM11 |
(894) 0x4bee8 VFNMSUB231SD %XMM10,%XMM10,%XMM11 |
(894) 0x4beed VADDSD %XMM11,%XMM12,%XMM10 |
(894) 0x4bef2 VADDSD (%RDI,%RCX,8),%XMM10,%XMM10 |
(894) 0x4bef7 VMOVSD %XMM10,(%RDI,%RCX,8) |
(894) 0x4befc MOV -0x58(%RBP),%RDI |
(894) 0x4bf00 INC %RCX |
(894) 0x4bf03 ADD %RDI,%RAX |
(894) 0x4bf06 ADD %RDI,%RSI |
(894) 0x4bf09 MOV -0x50(%RBP),%RDI |
(894) 0x4bf0d ADD %RDI,%R15 |
(894) 0x4bf10 ADD %RDI,%R9 |
(894) 0x4bf13 CMP %R10,%R14 |
(894) 0x4bf16 JE 4c44d |
(894) 0x4bf1c TEST %R8D,%R8D |
(894) 0x4bf1f JLE 4bea0 |
(894) 0x4bf25 CMP $0x4,%R8D |
(894) 0x4bf29 JAE 4bf40 |
(894) 0x4bf2b VXORPD %XMM11,%XMM11,%XMM11 |
(894) 0x4bf30 XOR %EDI,%EDI |
(894) 0x4bf32 JMP 4c2e0 |
0x4bf37 NOPW (%RAX,%RAX,1) |
(894) 0x4bf40 CMP $0x20,%R8D |
(894) 0x4bf44 JAE 4bf57 |
(894) 0x4bf46 VXORPD %XMM11,%XMM11,%XMM11 |
(894) 0x4bf4b VXORPD %XMM10,%XMM10,%XMM10 |
(894) 0x4bf50 XOR %EDI,%EDI |
(894) 0x4bf52 JMP 4c1f4 |
(894) 0x4bf57 VXORPD %XMM11,%XMM11,%XMM11 |
(894) 0x4bf5c VXORPD %XMM12,%XMM12,%XMM12 |
(894) 0x4bf61 VXORPD %XMM13,%XMM13,%XMM13 |
(894) 0x4bf66 VXORPD %XMM14,%XMM14,%XMM14 |
(894) 0x4bf6b VXORPD %XMM15,%XMM15,%XMM15 |
(894) 0x4bf70 VXORPD %XMM16,%XMM16,%XMM16 |
(894) 0x4bf76 VXORPD %XMM17,%XMM17,%XMM17 |
(894) 0x4bf7c VXORPD %XMM18,%XMM18,%XMM18 |
(894) 0x4bf82 VXORPD %XMM10,%XMM10,%XMM10 |
(894) 0x4bf87 VXORPD %XMM19,%XMM19,%XMM19 |
(894) 0x4bf8d VXORPD %XMM20,%XMM20,%XMM20 |
(894) 0x4bf93 VXORPD %XMM21,%XMM21,%XMM21 |
(894) 0x4bf99 MOV %RDX,%RDI |
(894) 0x4bf9c XOR %R10D,%R10D |
(894) 0x4bf9f NOP |
(895) 0x4bfa0 VMOVUPD (%RDI),%ZMM23 |
(895) 0x4bfa6 VMOVUPD 0x40(%RDI),%ZMM22 |
(895) 0x4bfad VMOVUPD 0x80(%RDI),%ZMM27 |
(895) 0x4bfb4 VMOVUPD -0xc0(%RAX,%R10,1),%ZMM26 |
(895) 0x4bfbc VMOVUPD -0x80(%RAX,%R10,1),%ZMM28 |
(895) 0x4bfc4 VMOVAPD %ZMM23,%ZMM24 |
(895) 0x4bfca VPERMT2PD %ZMM22,%ZMM4,%ZMM24 |
(895) 0x4bfd0 VMOVAPD %ZMM23,%ZMM25 |
(895) 0x4bfd6 VPERMT2PD %ZMM22,%ZMM6,%ZMM25 |
(895) 0x4bfdc VPERMT2PD %ZMM23,%ZMM8,%ZMM22 |
(895) 0x4bfe2 VPERMT2PD %ZMM27,%ZMM5,%ZMM24 |
(895) 0x4bfe8 VPERMT2PD %ZMM27,%ZMM7,%ZMM25 |
(895) 0x4bfee VPERMT2PD %ZMM27,%ZMM9,%ZMM22 |
(895) 0x4bff4 VMOVUPD 0xc0(%RDI),%ZMM27 |
(895) 0x4bffb VFMADD231PD %ZMM24,%ZMM26,%ZMM11 |
(895) 0x4c001 VMOVUPD 0x100(%RDI),%ZMM24 |
(895) 0x4c008 VFMADD231PD %ZMM22,%ZMM26,%ZMM10 |
(895) 0x4c00e VFMADD231PD %ZMM25,%ZMM26,%ZMM15 |
(895) 0x4c014 VMOVUPD 0x140(%RDI),%ZMM26 |
(895) 0x4c01b VMOVAPD %ZMM27,%ZMM22 |
(895) 0x4c021 VMOVAPD %ZMM27,%ZMM23 |
(895) 0x4c027 VPERMT2PD %ZMM24,%ZMM4,%ZMM22 |
(895) 0x4c02d VPERMT2PD %ZMM24,%ZMM6,%ZMM23 |
(895) 0x4c033 VPERMT2PD %ZMM27,%ZMM8,%ZMM24 |
(895) 0x4c039 VMOVUPD 0x180(%RDI),%ZMM27 |
(895) 0x4c040 VPERMT2PD %ZMM26,%ZMM5,%ZMM22 |
(895) 0x4c046 VPERMT2PD %ZMM26,%ZMM9,%ZMM24 |
(895) 0x4c04c VPERMT2PD %ZMM26,%ZMM7,%ZMM23 |
(895) 0x4c052 VMOVUPD 0x200(%RDI),%ZMM26 |
(895) 0x4c059 VMOVAPD %ZMM27,%ZMM25 |
(895) 0x4c05f VFMADD231PD %ZMM22,%ZMM28,%ZMM12 |
(895) 0x4c065 VMOVUPD 0x1c0(%RDI),%ZMM22 |
(895) 0x4c06c VFMADD231PD %ZMM24,%ZMM28,%ZMM19 |
(895) 0x4c072 VMOVAPD %ZMM27,%ZMM24 |
(895) 0x4c078 VFMADD231PD %ZMM23,%ZMM28,%ZMM16 |
(895) 0x4c07e VPERMT2PD %ZMM22,%ZMM4,%ZMM24 |
(895) 0x4c084 VPERMT2PD %ZMM22,%ZMM6,%ZMM25 |
(895) 0x4c08a VPERMT2PD %ZMM27,%ZMM8,%ZMM22 |
(895) 0x4c090 VMOVUPD -0x40(%RAX,%R10,1),%ZMM27 |
(895) 0x4c098 VPERMT2PD %ZMM26,%ZMM5,%ZMM24 |
(895) 0x4c09e VPERMT2PD %ZMM26,%ZMM7,%ZMM25 |
(895) 0x4c0a4 VPERMT2PD %ZMM26,%ZMM9,%ZMM22 |
(895) 0x4c0aa VMOVUPD 0x240(%RDI),%ZMM26 |
(895) 0x4c0b1 VFMADD231PD %ZMM24,%ZMM27,%ZMM13 |
(895) 0x4c0b7 VMOVUPD 0x280(%RDI),%ZMM24 |
(895) 0x4c0be VFMADD231PD %ZMM22,%ZMM27,%ZMM20 |
(895) 0x4c0c4 VFMADD231PD %ZMM25,%ZMM27,%ZMM17 |
(895) 0x4c0ca VMOVUPD 0x2c0(%RDI),%ZMM27 |
(895) 0x4c0d1 ADD $0x300,%RDI |
(895) 0x4c0d8 VMOVAPD %ZMM26,%ZMM22 |
(895) 0x4c0de VMOVAPD %ZMM26,%ZMM23 |
(895) 0x4c0e4 VPERMT2PD %ZMM24,%ZMM4,%ZMM22 |
(895) 0x4c0ea VPERMT2PD %ZMM24,%ZMM6,%ZMM23 |
(895) 0x4c0f0 VPERMT2PD %ZMM26,%ZMM8,%ZMM24 |
(895) 0x4c0f6 VMOVUPD (%RAX,%R10,1),%ZMM26 |
(895) 0x4c0fd ADD $0x100,%R10 |
(895) 0x4c104 VPERMT2PD %ZMM27,%ZMM5,%ZMM22 |
(895) 0x4c10a VPERMT2PD %ZMM27,%ZMM7,%ZMM23 |
(895) 0x4c110 VPERMT2PD %ZMM27,%ZMM9,%ZMM24 |
(895) 0x4c116 VFMADD231PD %ZMM22,%ZMM26,%ZMM14 |
(895) 0x4c11c VFMADD231PD %ZMM23,%ZMM26,%ZMM18 |
(895) 0x4c122 VFMADD231PD %ZMM24,%ZMM26,%ZMM21 |
(895) 0x4c128 CMP %R10,%R13 |
(895) 0x4c12b JNE 4bfa0 |
(894) 0x4c131 VADDPD %ZMM15,%ZMM16,%ZMM15 |
(894) 0x4c137 VADDPD %ZMM17,%ZMM18,%ZMM16 |
(894) 0x4c13d VADDPD %ZMM11,%ZMM12,%ZMM11 |
(894) 0x4c143 VADDPD %ZMM13,%ZMM14,%ZMM13 |
(894) 0x4c149 VADDPD %ZMM10,%ZMM19,%ZMM10 |
(894) 0x4c14f VADDPD %ZMM20,%ZMM21,%ZMM19 |
(894) 0x4c155 MOV -0x38(%RBP),%RDI |
(894) 0x4c159 VADDPD %ZMM15,%ZMM16,%ZMM15 |
(894) 0x4c15f VADDPD %ZMM11,%ZMM13,%ZMM11 |
(894) 0x4c165 VADDPD %ZMM10,%ZMM19,%ZMM10 |
(894) 0x4c16b VEXTRACTF64X4 $0x1,%ZMM15,%YMM16 |
(894) 0x4c172 VEXTRACTF64X4 $0x1,%ZMM11,%YMM12 |
(894) 0x4c179 VEXTRACTF64X4 $0x1,%ZMM10,%YMM19 |
(894) 0x4c180 VADDPD %ZMM16,%ZMM15,%ZMM15 |
(894) 0x4c186 VADDPD %ZMM12,%ZMM11,%ZMM11 |
(894) 0x4c18c VADDPD %ZMM19,%ZMM10,%ZMM10 |
(894) 0x4c192 VEXTRACTF32X4 $0x1,%YMM15,%XMM16 |
(894) 0x4c199 VEXTRACTF128 $0x1,%YMM11,%XMM12 |
(894) 0x4c19f VEXTRACTF32X4 $0x1,%YMM10,%XMM19 |
(894) 0x4c1a6 VADDPD %XMM16,%XMM15,%XMM15 |
(894) 0x4c1ac VADDPD %XMM12,%XMM11,%XMM11 |
(894) 0x4c1b1 VADDPD %XMM19,%XMM10,%XMM10 |
(894) 0x4c1b7 VPERMILPD $0x1,%XMM15,%XMM16 |
(894) 0x4c1be VPERMILPD $0x1,%XMM11,%XMM12 |
(894) 0x4c1c4 VPERMILPD $0x1,%XMM10,%XMM19 |
(894) 0x4c1cb VADDSD %XMM16,%XMM15,%XMM15 |
(894) 0x4c1d1 VADDSD %XMM12,%XMM11,%XMM12 |
(894) 0x4c1d6 VADDSD %XMM19,%XMM10,%XMM10 |
(894) 0x4c1dc VUNPCKLPD %XMM15,%XMM12,%XMM11 |
(894) 0x4c1e1 CMP %R8,%RDI |
(894) 0x4c1e4 JE 4c2a0 |
(894) 0x4c1ea TEST $0x1c,%R8B |
(894) 0x4c1ee JE 4c2c3 |
(894) 0x4c1f4 LEA (%RDI,%RDI,2),%R10 |
(894) 0x4c1f8 VMOVQ %XMM11,%XMM12 |
(894) 0x4c1fd VUNPCKHPD %XMM0,%XMM11,%XMM11 |
(894) 0x4c201 VMOVQ %XMM10,%XMM10 |
(894) 0x4c206 LEA (%RDX,%R10,8),%R10 |
(894) 0x4c20a NOPW (%RAX,%RAX,1) |
(900) 0x4c210 VMOVUPD (%R10),%ZMM14 |
(900) 0x4c216 VMOVUPD 0x40(%R10),%YMM15 |
(900) 0x4c21c VMOVUPD (%RSI,%RDI,8),%YMM13 |
(900) 0x4c221 ADD $0x4,%RDI |
(900) 0x4c225 ADD $0x60,%R10 |
(900) 0x4c229 VMOVAPD %ZMM14,%ZMM16 |
(900) 0x4c22f VMOVAPD %ZMM14,%ZMM17 |
(900) 0x4c235 VPERMT2PD %ZMM15,%ZMM1,%ZMM16 |
(900) 0x4c23b VPERMT2PD %ZMM15,%ZMM2,%ZMM17 |
(900) 0x4c241 VPERMT2PD %ZMM15,%ZMM3,%ZMM14 |
(900) 0x4c247 VFMADD231PD %YMM16,%YMM13,%YMM12 |
(900) 0x4c24d VFMADD231PD %YMM17,%YMM13,%YMM11 |
(900) 0x4c253 VFMADD231PD %YMM14,%YMM13,%YMM10 |
(900) 0x4c258 CMP %RDI,%R12 |
(900) 0x4c25b JNE 4c210 |
(894) 0x4c25d VEXTRACTF128 $0x1,%YMM10,%XMM13 |
(894) 0x4c263 VADDPD %YMM13,%YMM10,%YMM10 |
(894) 0x4c268 VPERMILPD $0x1,%XMM10,%XMM13 |
(894) 0x4c26e VADDPD %YMM13,%YMM10,%YMM10 |
(894) 0x4c273 VEXTRACTF128 $0x1,%YMM11,%XMM13 |
(894) 0x4c279 VADDPD %XMM13,%XMM11,%XMM11 |
(894) 0x4c27e VEXTRACTF128 $0x1,%YMM12,%XMM13 |
(894) 0x4c284 VADDPD %XMM13,%XMM12,%XMM12 |
(894) 0x4c289 VUNPCKHPD %XMM11,%XMM12,%XMM13 |
(894) 0x4c28e VUNPCKLPD %XMM11,%XMM12,%XMM11 |
(894) 0x4c293 VADDPD %XMM13,%XMM11,%XMM11 |
(894) 0x4c298 CMP %R8,%R12 |
(894) 0x4c29b JNE 4c2b3 |
(894) 0x4c29d NOPL (%RAX) |
(894) 0x4c2a0 CMP $0x4,%R8D |
(894) 0x4c2a4 JAE 4c315 |
(894) 0x4c2a6 VXORPD %XMM12,%XMM12,%XMM12 |
(894) 0x4c2ab XOR %R10D,%R10D |
(894) 0x4c2ae JMP 4c430 |
(894) 0x4c2b3 VBROADCASTSD %XMM10,%YMM10 |
(894) 0x4c2b8 MOV %R12,%RDI |
(894) 0x4c2bb VBLENDPD $0xc,%YMM10,%YMM11,%YMM11 |
(894) 0x4c2c1 JMP 4c2e0 |
(894) 0x4c2c3 VUNPCKLPD %XMM15,%XMM12,%XMM11 |
(894) 0x4c2c8 VINSERTF128 $0x1,%XMM10,%YMM11,%YMM10 |
(894) 0x4c2ce VPERMILPD $0x2,%YMM10,%YMM11 |
(894) 0x4c2d4 NOPW %CS:(%RAX,%RAX,1) |
(894) 0x4c2e0 LEA (%RDI,%RDI,2),%R10 |
(894) 0x4c2e4 LEA (%RDX,%R10,8),%R10 |
(894) 0x4c2e8 NOPL (%RAX,%RAX,1) |
(899) 0x4c2f0 VPERMILPD $0x2,(%R10),%YMM10 |
(899) 0x4c2f6 ADD $0x18,%R10 |
(899) 0x4c2fa VFMADD231PD (%RSI,%RDI,8){1to4},%YMM10,%YMM11 |
(899) 0x4c301 INC %RDI |
(899) 0x4c304 CMP %RDI,%R8 |
(899) 0x4c307 JNE 4c2f0 |
(894) 0x4c309 VEXTRACTF128 $0x1,%YMM11,%XMM10 |
(894) 0x4c30f CMP $0x4,%R8D |
(894) 0x4c313 JB 4c2a6 |
(894) 0x4c315 CMP $0x20,%R8D |
(894) 0x4c319 JAE 4c327 |
(894) 0x4c31b VXORPD %XMM12,%XMM12,%XMM12 |
(894) 0x4c320 XOR %EDI,%EDI |
(894) 0x4c322 JMP 4c3dd |
(894) 0x4c327 MOV -0x38(%RBP),%R10 |
(894) 0x4c32b VXORPD %XMM12,%XMM12,%XMM12 |
(894) 0x4c330 VXORPD %XMM13,%XMM13,%XMM13 |
(894) 0x4c335 VXORPD %XMM14,%XMM14,%XMM14 |
(894) 0x4c33a VXORPD %XMM15,%XMM15,%XMM15 |
(894) 0x4c33f XOR %EDI,%EDI |
(894) 0x4c341 NOPW %CS:(%RAX,%RAX,1) |
(896) 0x4c350 VMOVUPD -0xc0(%R15,%RDI,1),%ZMM16 |
(896) 0x4c358 VMOVUPD -0x80(%R15,%RDI,1),%ZMM17 |
(896) 0x4c360 VMOVUPD -0x40(%R15,%RDI,1),%ZMM18 |
(896) 0x4c368 VMOVUPD (%R15,%RDI,1),%ZMM19 |
(896) 0x4c36f VFMADD231PD -0xc0(%RAX,%RDI,1),%ZMM16,%ZMM12 |
(896) 0x4c377 VFMADD231PD -0x80(%RAX,%RDI,1),%ZMM17,%ZMM13 |
(896) 0x4c37f VFMADD231PD -0x40(%RAX,%RDI,1),%ZMM18,%ZMM14 |
(896) 0x4c387 VFMADD231PD (%RAX,%RDI,1),%ZMM19,%ZMM15 |
(896) 0x4c38e ADD $0x100,%RDI |
(896) 0x4c395 CMP %RDI,%R13 |
(896) 0x4c398 JNE 4c350 |
(894) 0x4c39a VADDPD %ZMM12,%ZMM13,%ZMM12 |
(894) 0x4c3a0 VADDPD %ZMM14,%ZMM15,%ZMM14 |
(894) 0x4c3a6 VADDPD %ZMM12,%ZMM14,%ZMM12 |
(894) 0x4c3ac VEXTRACTF64X4 $0x1,%ZMM12,%YMM13 |
(894) 0x4c3b3 VADDPD %ZMM13,%ZMM12,%ZMM12 |
(894) 0x4c3b9 VEXTRACTF128 $0x1,%YMM12,%XMM13 |
(894) 0x4c3bf VADDPD %XMM13,%XMM12,%XMM12 |
(894) 0x4c3c4 VPERMILPD $0x1,%XMM12,%XMM13 |
(894) 0x4c3ca VADDSD %XMM13,%XMM12,%XMM12 |
(894) 0x4c3cf CMP %R8,%R10 |
(894) 0x4c3d2 JE 4c444 |
(894) 0x4c3d4 MOV %R10,%RDI |
(894) 0x4c3d7 TEST $0x1c,%R8B |
(894) 0x4c3db JE 4c430 |
(894) 0x4c3dd VMOVQ %XMM12,%XMM12 |
(894) 0x4c3e2 NOPW %CS:(%RAX,%RAX,1) |
(898) 0x4c3f0 VMOVUPD (%R9,%RDI,8),%YMM13 |
(898) 0x4c3f6 VFMADD231PD (%RSI,%RDI,8),%YMM13,%YMM12 |
(898) 0x4c3fc ADD $0x4,%RDI |
(898) 0x4c400 CMP %RDI,%R12 |
(898) 0x4c403 JNE 4c3f0 |
(894) 0x4c405 VEXTRACTF128 $0x1,%YMM12,%XMM13 |
(894) 0x4c40b MOV %R12,%R10 |
(894) 0x4c40e VADDPD %XMM13,%XMM12,%XMM12 |
(894) 0x4c413 VPERMILPD $0x1,%XMM12,%XMM13 |
(894) 0x4c419 VADDSD %XMM13,%XMM12,%XMM12 |
(894) 0x4c41e CMP %R8,%R12 |
(894) 0x4c421 JE 4c444 |
(894) 0x4c423 NOPW %CS:(%RAX,%RAX,1) |
(897) 0x4c430 VMOVSD (%R9,%R10,8),%XMM13 |
(897) 0x4c436 VFMADD231SD (%RSI,%R10,8),%XMM13,%XMM12 |
(897) 0x4c43c INC %R10 |
(897) 0x4c43f CMP %R10,%R8 |
(897) 0x4c442 JNE 4c430 |
(894) 0x4c444 MOV -0x30(%RBP),%R10 |
(894) 0x4c448 JMP 4beaf |
0x4c44d VMOVSD 0x10(%RBX),%XMM0 |
0x4c452 ADD $0x38,%RSP |
0x4c456 POP %RBX |
0x4c457 POP %R12 |
0x4c459 POP %R13 |
0x4c45b POP %R14 |
0x4c45d POP %R15 |
0x4c45f POP %RBP |
0x4c460 VZEROUPPER |
0x4c463 RET |
0x4c464 INT $0x3 |
0x4c465 INT $0x3 |
0x4c466 INT $0x3 |
0x4c467 INT $0x3 |
0x4c468 INT $0x3 |
0x4c469 INT $0x3 |
0x4c46a INT $0x3 |
0x4c46b INT $0x3 |
0x4c46c INT $0x3 |
0x4c46d INT $0x3 |
0x4c46e INT $0x3 |
0x4c46f INT $0x3 |
Path / |
Source file and lines | DiracDeterminantRef.cpp:235-255 |
Module | libqmcwfs.so |
nb instructions | 104 |
nb uops | 91 |
loop length | 460 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 4 |
used ymm registers | 3 |
used zmm registers | 6 |
nb stack references | 6 |
ADD-SUB / MUL ratio | 1.33 |
micro-operation queue | 15.17 cycles |
front end | 15.17 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 5.00 | 5.00 | 5.00 | 5.00 | 3.00 | 14.67 | 14.67 | 14.67 | 2.50 | 2.50 | 2.67 | 2.33 | 1.50 | 1.50 |
cycles | 5.00 | 5.00 | 5.00 | 5.00 | 3.00 | 16.67 | 16.67 | 16.67 | 2.50 | 2.50 | 2.67 | 2.33 | 1.50 | 1.50 |
Cycles executing div or sqrt instructions | NA |
Front-end | 15.17 |
Dispatch | 16.67 |
Overall L1 | 16.67 |
all | 5% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 60% |
load | 64% |
store | 33% |
mul | 66% |
add-sub | 25% |
fma | 0% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 100% |
all | 35% |
load | 50% |
store | 11% |
mul | 66% |
add-sub | 25% |
fma | 0% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 27% |
all | 11% |
load | 10% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 41% |
load | 51% |
store | 16% |
mul | 20% |
add-sub | 15% |
fma | 12% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 25% |
all | 28% |
load | 42% |
store | 13% |
mul | 20% |
add-sub | 15% |
fma | 12% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB $0x38,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4ecb0 <@plt_start@+0x600> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x484(%RBX),%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP $0x1,%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JNE 4bd9f <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0x9f> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV 0x100(%RBX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x140(%RBX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x18(%R15),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VMOVDDUP (%RAX),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSXD 0x478(%RBX),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VMULPD (%RCX),%XMM0,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMULSD 0x10(%RCX),%XMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
LEA (%RAX,%RAX,2),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
VADDPD (%RDX,%RSI,8),%XMM2,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VMULPD %XMM2,%XMM2,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVUPD %XMM3,(%RDX,%RSI,8) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VADDSD 0x10(%RDX,%RSI,8),%XMM1,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VMOVSD %XMM3,0x10(%RDX,%RSI,8) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
VPERMILPD $0x1,%XMM2,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOV 0x180(%RBX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VADDSD %XMM2,%XMM3,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
MOV 0x18(%R12),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VFMADD231SD %XMM1,%XMM1,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMSUB231SD (%RCX),%XMM0,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDSD (%RDX,%RAX,8),%XMM2,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VMOVSD %XMM0,(%RDX,%RAX,8) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
JMP 4c44d <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0x74d> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
TEST %R10D,%R10D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 4c44d <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0x74d> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV 0x118(%RBX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VMOVAPD -0x439b7(%RIP),%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVAPD -0x43a3f(%RIP),%YMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVAPD -0x43a27(%RIP),%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVAPD -0x42c91(%RIP),%ZMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVAPD -0x42c5b(%RIP),%ZMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVAPD -0x42c25(%RIP),%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVAPD -0x42bef(%RIP),%ZMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVAPD -0x42bb9(%RIP),%ZMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVAPD -0x42b83(%RIP),%ZMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0x480(%RBX),%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x18(%R15),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x18(%R12),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0xd8(%RBX),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x158(%RBX),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x100(%RBX),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x180(%RBX),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVSXD 0x478(%RBX),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV 0x140(%RBX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R10,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SAL $0x3,%RAX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R8,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SHR $0x5,%R13 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R8D,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
AND $-0x20,%R15D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R8D,%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAL $0x3,%RDI | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SAL $0x3,%R14 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
AND $-0x4,%R12D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA (%RAX,%RAX,2),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SAL $0x8,%R13 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LEA 0xc0(%R9),%R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R14,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDI,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
XOR %R14D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RAX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
LEA 0xc0(%RSI),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JMP 4bf1c <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0x21c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
VMOVSD 0x10(%RBX),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD $0x38,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 |
Source file and lines | DiracDeterminantRef.cpp:235-255 |
Module | libqmcwfs.so |
nb instructions | 104 |
nb uops | 91 |
loop length | 460 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 4 |
used ymm registers | 3 |
used zmm registers | 6 |
nb stack references | 6 |
ADD-SUB / MUL ratio | 1.33 |
micro-operation queue | 15.17 cycles |
front end | 15.17 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 5.00 | 5.00 | 5.00 | 5.00 | 3.00 | 14.67 | 14.67 | 14.67 | 2.50 | 2.50 | 2.67 | 2.33 | 1.50 | 1.50 |
cycles | 5.00 | 5.00 | 5.00 | 5.00 | 3.00 | 16.67 | 16.67 | 16.67 | 2.50 | 2.50 | 2.67 | 2.33 | 1.50 | 1.50 |
Cycles executing div or sqrt instructions | NA |
Front-end | 15.17 |
Dispatch | 16.67 |
Overall L1 | 16.67 |
all | 5% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 60% |
load | 64% |
store | 33% |
mul | 66% |
add-sub | 25% |
fma | 0% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 100% |
all | 35% |
load | 50% |
store | 11% |
mul | 66% |
add-sub | 25% |
fma | 0% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 27% |
all | 11% |
load | 10% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 41% |
load | 51% |
store | 16% |
mul | 20% |
add-sub | 15% |
fma | 12% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 25% |
all | 28% |
load | 42% |
store | 13% |
mul | 20% |
add-sub | 15% |
fma | 12% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB $0x38,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4ecb0 <@plt_start@+0x600> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x484(%RBX),%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP $0x1,%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JNE 4bd9f <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0x9f> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV 0x100(%RBX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x140(%RBX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x18(%R15),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VMOVDDUP (%RAX),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSXD 0x478(%RBX),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VMULPD (%RCX),%XMM0,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMULSD 0x10(%RCX),%XMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
LEA (%RAX,%RAX,2),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
VADDPD (%RDX,%RSI,8),%XMM2,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VMULPD %XMM2,%XMM2,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVUPD %XMM3,(%RDX,%RSI,8) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VADDSD 0x10(%RDX,%RSI,8),%XMM1,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VMOVSD %XMM3,0x10(%RDX,%RSI,8) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
VPERMILPD $0x1,%XMM2,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOV 0x180(%RBX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VADDSD %XMM2,%XMM3,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
MOV 0x18(%R12),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VFMADD231SD %XMM1,%XMM1,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMSUB231SD (%RCX),%XMM0,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDSD (%RDX,%RAX,8),%XMM2,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VMOVSD %XMM0,(%RDX,%RAX,8) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
JMP 4c44d <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0x74d> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
TEST %R10D,%R10D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 4c44d <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0x74d> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV 0x118(%RBX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VMOVAPD -0x439b7(%RIP),%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVAPD -0x43a3f(%RIP),%YMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVAPD -0x43a27(%RIP),%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVAPD -0x42c91(%RIP),%ZMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVAPD -0x42c5b(%RIP),%ZMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVAPD -0x42c25(%RIP),%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVAPD -0x42bef(%RIP),%ZMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVAPD -0x42bb9(%RIP),%ZMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVAPD -0x42b83(%RIP),%ZMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0x480(%RBX),%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x18(%R15),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x18(%R12),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0xd8(%RBX),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x158(%RBX),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x100(%RBX),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x180(%RBX),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVSXD 0x478(%RBX),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV 0x140(%RBX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R10,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SAL $0x3,%RAX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R8,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SHR $0x5,%R13 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R8D,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
AND $-0x20,%R15D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R8D,%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAL $0x3,%RDI | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SAL $0x3,%R14 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
AND $-0x4,%R12D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA (%RAX,%RAX,2),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SAL $0x8,%R13 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LEA 0xc0(%R9),%R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R14,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDI,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
XOR %R14D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RAX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
LEA 0xc0(%RSI),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JMP 4bf1c <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0x21c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
VMOVSD 0x10(%RBX),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD $0x38,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼miniqmcreference::DiracDeterminantRef | 0.14 | 0.06 |
▼Loop 894 - OhmmsMatrix.h:217-217 - libqmcwfs.so– | 0 | 0 |
○Loop 895 - inner_product.hpp:155-155 - libqmcwfs.so | 0.09 | 0.04 |
○Loop 896 - inner_product.hpp:82-83 - libqmcwfs.so | 0.05 | 0.02 |
○Loop 900 - inner_product.hpp:155-155 - libqmcwfs.so | 0 | 0 |
○Loop 899 - inner_product.hpp:155-155 - libqmcwfs.so | 0 | 0 |
○Loop 897 - inner_product.hpp:82-83 - libqmcwfs.so | 0 | 0 |
○Loop 898 - inner_product.hpp:82-83 - libqmcwfs.so | 0 | 0 |