Function: _ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLo ... | Module: libqmcwfs.so | Source: DiracDeterminantRef.cpp:235-255 [...] | Coverage: 0.06% |
---|
Function: _ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLo ... | Module: libqmcwfs.so | Source: DiracDeterminantRef.cpp:235-255 [...] | Coverage: 0.06% |
---|
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/OhmmsMatrix.h: 217 - 217 |
-------------------------------------------------------------------------------- |
217: inline Type_t* operator[](size_type i) { return X.data() + i * D2; } |
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/Platforms/CPU/SIMD/inner_product.hpp: 82 - 155 |
-------------------------------------------------------------------------------- |
82: for (int i = 0; i < n; i++) |
83: res += a[i] * b[i]; |
[...] |
155: for (int i = 0; i < n; i++) |
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/TinyVectorOps.h: 129 - 131 |
-------------------------------------------------------------------------------- |
129: Type_t res = lhs[0] * rhs[0]; |
130: for (unsigned d = 1; d < D; ++d) |
131: res += lhs[d] * rhs[d]; |
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/OhmmsVector.h: 223 - 223 |
-------------------------------------------------------------------------------- |
223: return X[i]; |
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/Numerics/PETE/OperatorTags.h: 63 - 94 |
-------------------------------------------------------------------------------- |
63: return (a * b); |
[...] |
94: (const_cast<T1&>(a) += b); |
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/DiracDeterminantRef.cpp: 235 - 255 |
-------------------------------------------------------------------------------- |
235: { |
236: recompute(P); |
237: |
238: if (NumPtcls == 1) |
239: { |
240: ValueType y = psiM(0, 0); |
241: GradType rv = y * dpsiM(0, 0); |
242: G[FirstIndex] += rv; |
243: L[FirstIndex] += y * d2psiM(0, 0) - dot(rv, rv); |
244: } |
245: else |
246: { |
247: for (int i = 0, iat = FirstIndex; i < NumPtcls; i++, iat++) |
248: { |
249: mGradType rv = simd::dot(psiM[i], dpsiM[i], NumOrbitals); |
250: mValueType lap = simd::dot(psiM[i], d2psiM[i], NumOrbitals); |
251: G[iat] += rv; |
252: L[iat] += lap - dot(rv, rv); |
253: } |
254: } |
255: return LogValue; |
0x4bff0 PUSH %RBP |
0x4bff1 MOV %RSP,%RBP |
0x4bff4 PUSH %R15 |
0x4bff6 PUSH %R14 |
0x4bff8 PUSH %R13 |
0x4bffa PUSH %R12 |
0x4bffc PUSH %RBX |
0x4bffd SUB $0x38,%RSP |
0x4c001 MOV %RCX,%R12 |
0x4c004 MOV %RDX,%R15 |
0x4c007 MOV %RDI,%RBX |
0x4c00a CALL 4efa0 <@plt_start@+0x600> |
0x4c00f MOV 0x484(%RBX),%R10D |
0x4c016 CMP $0x1,%R10 |
0x4c01a JNE 4c08f |
0x4c01c MOV 0x100(%RBX),%RAX |
0x4c023 MOV 0x140(%RBX),%RCX |
0x4c02a MOV 0x18(%R15),%RDX |
0x4c02e VMOVDDUP (%RAX),%XMM0 |
0x4c032 MOVSXD 0x478(%RBX),%RAX |
0x4c039 VMULPD (%RCX),%XMM0,%XMM2 |
0x4c03d VMULSD 0x10(%RCX),%XMM0,%XMM1 |
0x4c042 LEA (%RAX,%RAX,2),%RSI |
0x4c046 VADDPD (%RDX,%RSI,8),%XMM2,%XMM3 |
0x4c04b VMULPD %XMM2,%XMM2,%XMM2 |
0x4c04f VMOVUPD %XMM3,(%RDX,%RSI,8) |
0x4c054 VADDSD 0x10(%RDX,%RSI,8),%XMM1,%XMM3 |
0x4c05a VMOVSD %XMM3,0x10(%RDX,%RSI,8) |
0x4c060 VPERMILPD $0x1,%XMM2,%XMM3 |
0x4c066 MOV 0x180(%RBX),%RCX |
0x4c06d VADDSD %XMM2,%XMM3,%XMM2 |
0x4c071 MOV 0x18(%R12),%RDX |
0x4c076 VFMADD231SD %XMM1,%XMM1,%XMM2 |
0x4c07b VFMSUB231SD (%RCX),%XMM0,%XMM2 |
0x4c080 VADDSD (%RDX,%RAX,8),%XMM2,%XMM0 |
0x4c085 VMOVSD %XMM0,(%RDX,%RAX,8) |
0x4c08a JMP 4c73d |
0x4c08f TEST %R10D,%R10D |
0x4c092 JLE 4c73d |
0x4c098 MOV 0x118(%RBX),%RAX |
0x4c09f VMOVAPD -0x43ba7(%RIP),%YMM1 |
0x4c0a7 VMOVAPD -0x43c2f(%RIP),%YMM2 |
0x4c0af VMOVAPD -0x43c17(%RIP),%YMM3 |
0x4c0b7 VMOVAPD -0x42e81(%RIP),%ZMM4 |
0x4c0c1 VMOVAPD -0x42e4b(%RIP),%ZMM5 |
0x4c0cb VMOVAPD -0x42e15(%RIP),%ZMM6 |
0x4c0d5 VMOVAPD -0x42ddf(%RIP),%ZMM7 |
0x4c0df VMOVAPD -0x42da9(%RIP),%ZMM8 |
0x4c0e9 VMOVAPD -0x42d73(%RIP),%ZMM9 |
0x4c0f3 MOV 0x480(%RBX),%R8D |
0x4c0fa MOV 0x18(%R15),%R11 |
0x4c0fe MOV 0x18(%R12),%R15 |
0x4c103 MOV 0xd8(%RBX),%RDI |
0x4c10a MOV 0x158(%RBX),%R14 |
0x4c111 MOV 0x100(%RBX),%RSI |
0x4c118 MOV 0x180(%RBX),%R9 |
0x4c11f MOVSXD 0x478(%RBX),%RCX |
0x4c126 MOV 0x140(%RBX),%RDX |
0x4c12d VXORPD %XMM0,%XMM0,%XMM0 |
0x4c131 MOV %R10,-0x30(%RBP) |
0x4c135 SAL $0x3,%RAX |
0x4c139 MOV %R8,%R13 |
0x4c13c SHR $0x5,%R13 |
0x4c140 MOV %R15,-0x48(%RBP) |
0x4c144 MOV %R8D,%R15D |
0x4c147 AND $-0x20,%R15D |
0x4c14b MOV %R8D,%R12D |
0x4c14e SAL $0x3,%RDI |
0x4c152 SAL $0x3,%R14 |
0x4c156 AND $-0x4,%R12D |
0x4c15a LEA (%RAX,%RAX,2),%RAX |
0x4c15e MOV %R15,-0x38(%RBP) |
0x4c162 SAL $0x8,%R13 |
0x4c166 LEA 0xc0(%R9),%R15 |
0x4c16d MOV %R14,-0x50(%RBP) |
0x4c171 MOV %RDI,-0x58(%RBP) |
0x4c175 XOR %R14D,%R14D |
0x4c178 MOV %RAX,-0x40(%RBP) |
0x4c17c LEA 0xc0(%RSI),%RAX |
0x4c183 JMP 4c20c |
0x4c188 NOPL (%RAX,%RAX,1) |
(894) 0x4c190 VXORPD %XMM10,%XMM10,%XMM10 |
(894) 0x4c195 VXORPD %XMM12,%XMM12,%XMM12 |
(894) 0x4c19a VXORPD %XMM11,%XMM11,%XMM11 |
(894) 0x4c19f LEA (%RCX,%RCX,2),%RDI |
(894) 0x4c1a3 ADD -0x40(%RBP),%RDX |
(894) 0x4c1a7 INC %R14 |
(894) 0x4c1aa VADDPD (%R11,%RDI,8),%XMM11,%XMM13 |
(894) 0x4c1b0 VMULPD %XMM11,%XMM11,%XMM11 |
(894) 0x4c1b5 VMOVUPD %XMM13,(%R11,%RDI,8) |
(894) 0x4c1bb VADDSD 0x10(%R11,%RDI,8),%XMM10,%XMM13 |
(894) 0x4c1c2 VMOVSD %XMM13,0x10(%R11,%RDI,8) |
(894) 0x4c1c9 VPERMILPD $0x1,%XMM11,%XMM13 |
(894) 0x4c1cf MOV -0x48(%RBP),%RDI |
(894) 0x4c1d3 VADDSD %XMM11,%XMM13,%XMM11 |
(894) 0x4c1d8 VFNMSUB231SD %XMM10,%XMM10,%XMM11 |
(894) 0x4c1dd VADDSD %XMM11,%XMM12,%XMM10 |
(894) 0x4c1e2 VADDSD (%RDI,%RCX,8),%XMM10,%XMM10 |
(894) 0x4c1e7 VMOVSD %XMM10,(%RDI,%RCX,8) |
(894) 0x4c1ec MOV -0x58(%RBP),%RDI |
(894) 0x4c1f0 INC %RCX |
(894) 0x4c1f3 ADD %RDI,%RAX |
(894) 0x4c1f6 ADD %RDI,%RSI |
(894) 0x4c1f9 MOV -0x50(%RBP),%RDI |
(894) 0x4c1fd ADD %RDI,%R15 |
(894) 0x4c200 ADD %RDI,%R9 |
(894) 0x4c203 CMP %R10,%R14 |
(894) 0x4c206 JE 4c73d |
(894) 0x4c20c TEST %R8D,%R8D |
(894) 0x4c20f JLE 4c190 |
(894) 0x4c215 CMP $0x4,%R8D |
(894) 0x4c219 JAE 4c230 |
(894) 0x4c21b VXORPD %XMM11,%XMM11,%XMM11 |
(894) 0x4c220 XOR %EDI,%EDI |
(894) 0x4c222 JMP 4c5d0 |
0x4c227 NOPW (%RAX,%RAX,1) |
(894) 0x4c230 CMP $0x20,%R8D |
(894) 0x4c234 JAE 4c247 |
(894) 0x4c236 VXORPD %XMM11,%XMM11,%XMM11 |
(894) 0x4c23b VXORPD %XMM10,%XMM10,%XMM10 |
(894) 0x4c240 XOR %EDI,%EDI |
(894) 0x4c242 JMP 4c4e4 |
(894) 0x4c247 VXORPD %XMM11,%XMM11,%XMM11 |
(894) 0x4c24c VXORPD %XMM12,%XMM12,%XMM12 |
(894) 0x4c251 VXORPD %XMM13,%XMM13,%XMM13 |
(894) 0x4c256 VXORPD %XMM14,%XMM14,%XMM14 |
(894) 0x4c25b VXORPD %XMM15,%XMM15,%XMM15 |
(894) 0x4c260 VXORPD %XMM16,%XMM16,%XMM16 |
(894) 0x4c266 VXORPD %XMM17,%XMM17,%XMM17 |
(894) 0x4c26c VXORPD %XMM18,%XMM18,%XMM18 |
(894) 0x4c272 VXORPD %XMM10,%XMM10,%XMM10 |
(894) 0x4c277 VXORPD %XMM19,%XMM19,%XMM19 |
(894) 0x4c27d VXORPD %XMM20,%XMM20,%XMM20 |
(894) 0x4c283 VXORPD %XMM21,%XMM21,%XMM21 |
(894) 0x4c289 MOV %RDX,%RDI |
(894) 0x4c28c XOR %R10D,%R10D |
(894) 0x4c28f NOP |
(895) 0x4c290 VMOVUPD (%RDI),%ZMM23 |
(895) 0x4c296 VMOVUPD 0x40(%RDI),%ZMM22 |
(895) 0x4c29d VMOVUPD 0x80(%RDI),%ZMM27 |
(895) 0x4c2a4 VMOVUPD -0xc0(%RAX,%R10,1),%ZMM26 |
(895) 0x4c2ac VMOVUPD -0x80(%RAX,%R10,1),%ZMM28 |
(895) 0x4c2b4 VMOVAPD %ZMM23,%ZMM24 |
(895) 0x4c2ba VPERMT2PD %ZMM22,%ZMM4,%ZMM24 |
(895) 0x4c2c0 VMOVAPD %ZMM23,%ZMM25 |
(895) 0x4c2c6 VPERMT2PD %ZMM22,%ZMM6,%ZMM25 |
(895) 0x4c2cc VPERMT2PD %ZMM23,%ZMM8,%ZMM22 |
(895) 0x4c2d2 VPERMT2PD %ZMM27,%ZMM5,%ZMM24 |
(895) 0x4c2d8 VPERMT2PD %ZMM27,%ZMM7,%ZMM25 |
(895) 0x4c2de VPERMT2PD %ZMM27,%ZMM9,%ZMM22 |
(895) 0x4c2e4 VMOVUPD 0xc0(%RDI),%ZMM27 |
(895) 0x4c2eb VFMADD231PD %ZMM24,%ZMM26,%ZMM11 |
(895) 0x4c2f1 VMOVUPD 0x100(%RDI),%ZMM24 |
(895) 0x4c2f8 VFMADD231PD %ZMM22,%ZMM26,%ZMM10 |
(895) 0x4c2fe VFMADD231PD %ZMM25,%ZMM26,%ZMM15 |
(895) 0x4c304 VMOVUPD 0x140(%RDI),%ZMM26 |
(895) 0x4c30b VMOVAPD %ZMM27,%ZMM22 |
(895) 0x4c311 VMOVAPD %ZMM27,%ZMM23 |
(895) 0x4c317 VPERMT2PD %ZMM24,%ZMM4,%ZMM22 |
(895) 0x4c31d VPERMT2PD %ZMM24,%ZMM6,%ZMM23 |
(895) 0x4c323 VPERMT2PD %ZMM27,%ZMM8,%ZMM24 |
(895) 0x4c329 VMOVUPD 0x180(%RDI),%ZMM27 |
(895) 0x4c330 VPERMT2PD %ZMM26,%ZMM5,%ZMM22 |
(895) 0x4c336 VPERMT2PD %ZMM26,%ZMM9,%ZMM24 |
(895) 0x4c33c VPERMT2PD %ZMM26,%ZMM7,%ZMM23 |
(895) 0x4c342 VMOVUPD 0x200(%RDI),%ZMM26 |
(895) 0x4c349 VMOVAPD %ZMM27,%ZMM25 |
(895) 0x4c34f VFMADD231PD %ZMM22,%ZMM28,%ZMM12 |
(895) 0x4c355 VMOVUPD 0x1c0(%RDI),%ZMM22 |
(895) 0x4c35c VFMADD231PD %ZMM24,%ZMM28,%ZMM19 |
(895) 0x4c362 VMOVAPD %ZMM27,%ZMM24 |
(895) 0x4c368 VFMADD231PD %ZMM23,%ZMM28,%ZMM16 |
(895) 0x4c36e VPERMT2PD %ZMM22,%ZMM4,%ZMM24 |
(895) 0x4c374 VPERMT2PD %ZMM22,%ZMM6,%ZMM25 |
(895) 0x4c37a VPERMT2PD %ZMM27,%ZMM8,%ZMM22 |
(895) 0x4c380 VMOVUPD -0x40(%RAX,%R10,1),%ZMM27 |
(895) 0x4c388 VPERMT2PD %ZMM26,%ZMM5,%ZMM24 |
(895) 0x4c38e VPERMT2PD %ZMM26,%ZMM7,%ZMM25 |
(895) 0x4c394 VPERMT2PD %ZMM26,%ZMM9,%ZMM22 |
(895) 0x4c39a VMOVUPD 0x240(%RDI),%ZMM26 |
(895) 0x4c3a1 VFMADD231PD %ZMM24,%ZMM27,%ZMM13 |
(895) 0x4c3a7 VMOVUPD 0x280(%RDI),%ZMM24 |
(895) 0x4c3ae VFMADD231PD %ZMM22,%ZMM27,%ZMM20 |
(895) 0x4c3b4 VFMADD231PD %ZMM25,%ZMM27,%ZMM17 |
(895) 0x4c3ba VMOVUPD 0x2c0(%RDI),%ZMM27 |
(895) 0x4c3c1 ADD $0x300,%RDI |
(895) 0x4c3c8 VMOVAPD %ZMM26,%ZMM22 |
(895) 0x4c3ce VMOVAPD %ZMM26,%ZMM23 |
(895) 0x4c3d4 VPERMT2PD %ZMM24,%ZMM4,%ZMM22 |
(895) 0x4c3da VPERMT2PD %ZMM24,%ZMM6,%ZMM23 |
(895) 0x4c3e0 VPERMT2PD %ZMM26,%ZMM8,%ZMM24 |
(895) 0x4c3e6 VMOVUPD (%RAX,%R10,1),%ZMM26 |
(895) 0x4c3ed ADD $0x100,%R10 |
(895) 0x4c3f4 VPERMT2PD %ZMM27,%ZMM5,%ZMM22 |
(895) 0x4c3fa VPERMT2PD %ZMM27,%ZMM7,%ZMM23 |
(895) 0x4c400 VPERMT2PD %ZMM27,%ZMM9,%ZMM24 |
(895) 0x4c406 VFMADD231PD %ZMM22,%ZMM26,%ZMM14 |
(895) 0x4c40c VFMADD231PD %ZMM23,%ZMM26,%ZMM18 |
(895) 0x4c412 VFMADD231PD %ZMM24,%ZMM26,%ZMM21 |
(895) 0x4c418 CMP %R10,%R13 |
(895) 0x4c41b JNE 4c290 |
(894) 0x4c421 VADDPD %ZMM15,%ZMM16,%ZMM15 |
(894) 0x4c427 VADDPD %ZMM17,%ZMM18,%ZMM16 |
(894) 0x4c42d VADDPD %ZMM11,%ZMM12,%ZMM11 |
(894) 0x4c433 VADDPD %ZMM13,%ZMM14,%ZMM13 |
(894) 0x4c439 VADDPD %ZMM10,%ZMM19,%ZMM10 |
(894) 0x4c43f VADDPD %ZMM20,%ZMM21,%ZMM19 |
(894) 0x4c445 MOV -0x38(%RBP),%RDI |
(894) 0x4c449 VADDPD %ZMM15,%ZMM16,%ZMM15 |
(894) 0x4c44f VADDPD %ZMM11,%ZMM13,%ZMM11 |
(894) 0x4c455 VADDPD %ZMM10,%ZMM19,%ZMM10 |
(894) 0x4c45b VEXTRACTF64X4 $0x1,%ZMM15,%YMM16 |
(894) 0x4c462 VEXTRACTF64X4 $0x1,%ZMM11,%YMM12 |
(894) 0x4c469 VEXTRACTF64X4 $0x1,%ZMM10,%YMM19 |
(894) 0x4c470 VADDPD %ZMM16,%ZMM15,%ZMM15 |
(894) 0x4c476 VADDPD %ZMM12,%ZMM11,%ZMM11 |
(894) 0x4c47c VADDPD %ZMM19,%ZMM10,%ZMM10 |
(894) 0x4c482 VEXTRACTF32X4 $0x1,%YMM15,%XMM16 |
(894) 0x4c489 VEXTRACTF128 $0x1,%YMM11,%XMM12 |
(894) 0x4c48f VEXTRACTF32X4 $0x1,%YMM10,%XMM19 |
(894) 0x4c496 VADDPD %XMM16,%XMM15,%XMM15 |
(894) 0x4c49c VADDPD %XMM12,%XMM11,%XMM11 |
(894) 0x4c4a1 VADDPD %XMM19,%XMM10,%XMM10 |
(894) 0x4c4a7 VPERMILPD $0x1,%XMM15,%XMM16 |
(894) 0x4c4ae VPERMILPD $0x1,%XMM11,%XMM12 |
(894) 0x4c4b4 VPERMILPD $0x1,%XMM10,%XMM19 |
(894) 0x4c4bb VADDSD %XMM16,%XMM15,%XMM15 |
(894) 0x4c4c1 VADDSD %XMM12,%XMM11,%XMM12 |
(894) 0x4c4c6 VADDSD %XMM19,%XMM10,%XMM10 |
(894) 0x4c4cc VUNPCKLPD %XMM15,%XMM12,%XMM11 |
(894) 0x4c4d1 CMP %R8,%RDI |
(894) 0x4c4d4 JE 4c590 |
(894) 0x4c4da TEST $0x1c,%R8B |
(894) 0x4c4de JE 4c5b3 |
(894) 0x4c4e4 LEA (%RDI,%RDI,2),%R10 |
(894) 0x4c4e8 VMOVQ %XMM11,%XMM12 |
(894) 0x4c4ed VUNPCKHPD %XMM0,%XMM11,%XMM11 |
(894) 0x4c4f1 VMOVQ %XMM10,%XMM10 |
(894) 0x4c4f6 LEA (%RDX,%R10,8),%R10 |
(894) 0x4c4fa NOPW (%RAX,%RAX,1) |
(900) 0x4c500 VMOVUPD (%R10),%ZMM14 |
(900) 0x4c506 VMOVUPD 0x40(%R10),%YMM15 |
(900) 0x4c50c VMOVUPD (%RSI,%RDI,8),%YMM13 |
(900) 0x4c511 ADD $0x4,%RDI |
(900) 0x4c515 ADD $0x60,%R10 |
(900) 0x4c519 VMOVAPD %ZMM14,%ZMM16 |
(900) 0x4c51f VMOVAPD %ZMM14,%ZMM17 |
(900) 0x4c525 VPERMT2PD %ZMM15,%ZMM1,%ZMM16 |
(900) 0x4c52b VPERMT2PD %ZMM15,%ZMM2,%ZMM17 |
(900) 0x4c531 VPERMT2PD %ZMM15,%ZMM3,%ZMM14 |
(900) 0x4c537 VFMADD231PD %YMM16,%YMM13,%YMM12 |
(900) 0x4c53d VFMADD231PD %YMM17,%YMM13,%YMM11 |
(900) 0x4c543 VFMADD231PD %YMM14,%YMM13,%YMM10 |
(900) 0x4c548 CMP %RDI,%R12 |
(900) 0x4c54b JNE 4c500 |
(894) 0x4c54d VEXTRACTF128 $0x1,%YMM10,%XMM13 |
(894) 0x4c553 VADDPD %YMM13,%YMM10,%YMM10 |
(894) 0x4c558 VPERMILPD $0x1,%XMM10,%XMM13 |
(894) 0x4c55e VADDPD %YMM13,%YMM10,%YMM10 |
(894) 0x4c563 VEXTRACTF128 $0x1,%YMM11,%XMM13 |
(894) 0x4c569 VADDPD %XMM13,%XMM11,%XMM11 |
(894) 0x4c56e VEXTRACTF128 $0x1,%YMM12,%XMM13 |
(894) 0x4c574 VADDPD %XMM13,%XMM12,%XMM12 |
(894) 0x4c579 VUNPCKHPD %XMM11,%XMM12,%XMM13 |
(894) 0x4c57e VUNPCKLPD %XMM11,%XMM12,%XMM11 |
(894) 0x4c583 VADDPD %XMM13,%XMM11,%XMM11 |
(894) 0x4c588 CMP %R8,%R12 |
(894) 0x4c58b JNE 4c5a3 |
(894) 0x4c58d NOPL (%RAX) |
(894) 0x4c590 CMP $0x4,%R8D |
(894) 0x4c594 JAE 4c605 |
(894) 0x4c596 VXORPD %XMM12,%XMM12,%XMM12 |
(894) 0x4c59b XOR %R10D,%R10D |
(894) 0x4c59e JMP 4c720 |
(894) 0x4c5a3 VBROADCASTSD %XMM10,%YMM10 |
(894) 0x4c5a8 MOV %R12,%RDI |
(894) 0x4c5ab VBLENDPD $0xc,%YMM10,%YMM11,%YMM11 |
(894) 0x4c5b1 JMP 4c5d0 |
(894) 0x4c5b3 VUNPCKLPD %XMM15,%XMM12,%XMM11 |
(894) 0x4c5b8 VINSERTF128 $0x1,%XMM10,%YMM11,%YMM10 |
(894) 0x4c5be VPERMILPD $0x2,%YMM10,%YMM11 |
(894) 0x4c5c4 NOPW %CS:(%RAX,%RAX,1) |
(894) 0x4c5d0 LEA (%RDI,%RDI,2),%R10 |
(894) 0x4c5d4 LEA (%RDX,%R10,8),%R10 |
(894) 0x4c5d8 NOPL (%RAX,%RAX,1) |
(899) 0x4c5e0 VPERMILPD $0x2,(%R10),%YMM10 |
(899) 0x4c5e6 ADD $0x18,%R10 |
(899) 0x4c5ea VFMADD231PD (%RSI,%RDI,8){1to4},%YMM10,%YMM11 |
(899) 0x4c5f1 INC %RDI |
(899) 0x4c5f4 CMP %RDI,%R8 |
(899) 0x4c5f7 JNE 4c5e0 |
(894) 0x4c5f9 VEXTRACTF128 $0x1,%YMM11,%XMM10 |
(894) 0x4c5ff CMP $0x4,%R8D |
(894) 0x4c603 JB 4c596 |
(894) 0x4c605 CMP $0x20,%R8D |
(894) 0x4c609 JAE 4c617 |
(894) 0x4c60b VXORPD %XMM12,%XMM12,%XMM12 |
(894) 0x4c610 XOR %EDI,%EDI |
(894) 0x4c612 JMP 4c6cd |
(894) 0x4c617 MOV -0x38(%RBP),%R10 |
(894) 0x4c61b VXORPD %XMM12,%XMM12,%XMM12 |
(894) 0x4c620 VXORPD %XMM13,%XMM13,%XMM13 |
(894) 0x4c625 VXORPD %XMM14,%XMM14,%XMM14 |
(894) 0x4c62a VXORPD %XMM15,%XMM15,%XMM15 |
(894) 0x4c62f XOR %EDI,%EDI |
(894) 0x4c631 NOPW %CS:(%RAX,%RAX,1) |
(896) 0x4c640 VMOVUPD -0xc0(%R15,%RDI,1),%ZMM16 |
(896) 0x4c648 VMOVUPD -0x80(%R15,%RDI,1),%ZMM17 |
(896) 0x4c650 VMOVUPD -0x40(%R15,%RDI,1),%ZMM18 |
(896) 0x4c658 VMOVUPD (%R15,%RDI,1),%ZMM19 |
(896) 0x4c65f VFMADD231PD -0xc0(%RAX,%RDI,1),%ZMM16,%ZMM12 |
(896) 0x4c667 VFMADD231PD -0x80(%RAX,%RDI,1),%ZMM17,%ZMM13 |
(896) 0x4c66f VFMADD231PD -0x40(%RAX,%RDI,1),%ZMM18,%ZMM14 |
(896) 0x4c677 VFMADD231PD (%RAX,%RDI,1),%ZMM19,%ZMM15 |
(896) 0x4c67e ADD $0x100,%RDI |
(896) 0x4c685 CMP %RDI,%R13 |
(896) 0x4c688 JNE 4c640 |
(894) 0x4c68a VADDPD %ZMM12,%ZMM13,%ZMM12 |
(894) 0x4c690 VADDPD %ZMM14,%ZMM15,%ZMM14 |
(894) 0x4c696 VADDPD %ZMM12,%ZMM14,%ZMM12 |
(894) 0x4c69c VEXTRACTF64X4 $0x1,%ZMM12,%YMM13 |
(894) 0x4c6a3 VADDPD %ZMM13,%ZMM12,%ZMM12 |
(894) 0x4c6a9 VEXTRACTF128 $0x1,%YMM12,%XMM13 |
(894) 0x4c6af VADDPD %XMM13,%XMM12,%XMM12 |
(894) 0x4c6b4 VPERMILPD $0x1,%XMM12,%XMM13 |
(894) 0x4c6ba VADDSD %XMM13,%XMM12,%XMM12 |
(894) 0x4c6bf CMP %R8,%R10 |
(894) 0x4c6c2 JE 4c734 |
(894) 0x4c6c4 MOV %R10,%RDI |
(894) 0x4c6c7 TEST $0x1c,%R8B |
(894) 0x4c6cb JE 4c720 |
(894) 0x4c6cd VMOVQ %XMM12,%XMM12 |
(894) 0x4c6d2 NOPW %CS:(%RAX,%RAX,1) |
(898) 0x4c6e0 VMOVUPD (%R9,%RDI,8),%YMM13 |
(898) 0x4c6e6 VFMADD231PD (%RSI,%RDI,8),%YMM13,%YMM12 |
(898) 0x4c6ec ADD $0x4,%RDI |
(898) 0x4c6f0 CMP %RDI,%R12 |
(898) 0x4c6f3 JNE 4c6e0 |
(894) 0x4c6f5 VEXTRACTF128 $0x1,%YMM12,%XMM13 |
(894) 0x4c6fb MOV %R12,%R10 |
(894) 0x4c6fe VADDPD %XMM13,%XMM12,%XMM12 |
(894) 0x4c703 VPERMILPD $0x1,%XMM12,%XMM13 |
(894) 0x4c709 VADDSD %XMM13,%XMM12,%XMM12 |
(894) 0x4c70e CMP %R8,%R12 |
(894) 0x4c711 JE 4c734 |
(894) 0x4c713 NOPW %CS:(%RAX,%RAX,1) |
(897) 0x4c720 VMOVSD (%R9,%R10,8),%XMM13 |
(897) 0x4c726 VFMADD231SD (%RSI,%R10,8),%XMM13,%XMM12 |
(897) 0x4c72c INC %R10 |
(897) 0x4c72f CMP %R10,%R8 |
(897) 0x4c732 JNE 4c720 |
(894) 0x4c734 MOV -0x30(%RBP),%R10 |
(894) 0x4c738 JMP 4c19f |
0x4c73d VMOVSD 0x10(%RBX),%XMM0 |
0x4c742 ADD $0x38,%RSP |
0x4c746 POP %RBX |
0x4c747 POP %R12 |
0x4c749 POP %R13 |
0x4c74b POP %R14 |
0x4c74d POP %R15 |
0x4c74f POP %RBP |
0x4c750 VZEROUPPER |
0x4c753 RET |
0x4c754 INT $0x3 |
0x4c755 INT $0x3 |
0x4c756 INT $0x3 |
0x4c757 INT $0x3 |
0x4c758 INT $0x3 |
0x4c759 INT $0x3 |
0x4c75a INT $0x3 |
0x4c75b INT $0x3 |
0x4c75c INT $0x3 |
0x4c75d INT $0x3 |
0x4c75e INT $0x3 |
0x4c75f INT $0x3 |
Path / |
Source file and lines | DiracDeterminantRef.cpp:235-255 |
Module | libqmcwfs.so |
nb instructions | 104 |
nb uops | 91 |
loop length | 460 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 4 |
used ymm registers | 3 |
used zmm registers | 6 |
nb stack references | 6 |
ADD-SUB / MUL ratio | 1.33 |
micro-operation queue | 15.17 cycles |
front end | 15.17 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 5.00 | 5.00 | 5.00 | 5.00 | 3.00 | 14.67 | 14.67 | 14.67 | 2.50 | 2.50 | 2.67 | 2.33 | 1.50 | 1.50 |
cycles | 5.00 | 5.00 | 5.00 | 5.00 | 3.00 | 16.67 | 16.67 | 16.67 | 2.50 | 2.50 | 2.67 | 2.33 | 1.50 | 1.50 |
Cycles executing div or sqrt instructions | NA |
Front-end | 15.17 |
Dispatch | 16.67 |
Overall L1 | 16.67 |
all | 5% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 60% |
load | 64% |
store | 33% |
mul | 66% |
add-sub | 25% |
fma | 0% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 100% |
all | 35% |
load | 50% |
store | 11% |
mul | 66% |
add-sub | 25% |
fma | 0% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 27% |
all | 11% |
load | 10% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 41% |
load | 51% |
store | 16% |
mul | 20% |
add-sub | 15% |
fma | 12% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 25% |
all | 28% |
load | 42% |
store | 13% |
mul | 20% |
add-sub | 15% |
fma | 12% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB $0x38,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4efa0 <@plt_start@+0x600> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x484(%RBX),%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP $0x1,%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JNE 4c08f <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0x9f> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV 0x100(%RBX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x140(%RBX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x18(%R15),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VMOVDDUP (%RAX),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSXD 0x478(%RBX),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VMULPD (%RCX),%XMM0,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMULSD 0x10(%RCX),%XMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
LEA (%RAX,%RAX,2),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
VADDPD (%RDX,%RSI,8),%XMM2,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VMULPD %XMM2,%XMM2,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVUPD %XMM3,(%RDX,%RSI,8) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VADDSD 0x10(%RDX,%RSI,8),%XMM1,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VMOVSD %XMM3,0x10(%RDX,%RSI,8) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
VPERMILPD $0x1,%XMM2,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOV 0x180(%RBX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VADDSD %XMM2,%XMM3,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
MOV 0x18(%R12),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VFMADD231SD %XMM1,%XMM1,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMSUB231SD (%RCX),%XMM0,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDSD (%RDX,%RAX,8),%XMM2,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VMOVSD %XMM0,(%RDX,%RAX,8) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
JMP 4c73d <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0x74d> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
TEST %R10D,%R10D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 4c73d <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0x74d> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV 0x118(%RBX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VMOVAPD -0x43ba7(%RIP),%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVAPD -0x43c2f(%RIP),%YMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVAPD -0x43c17(%RIP),%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVAPD -0x42e81(%RIP),%ZMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVAPD -0x42e4b(%RIP),%ZMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVAPD -0x42e15(%RIP),%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVAPD -0x42ddf(%RIP),%ZMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVAPD -0x42da9(%RIP),%ZMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVAPD -0x42d73(%RIP),%ZMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0x480(%RBX),%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x18(%R15),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x18(%R12),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0xd8(%RBX),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x158(%RBX),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x100(%RBX),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x180(%RBX),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVSXD 0x478(%RBX),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV 0x140(%RBX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R10,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SAL $0x3,%RAX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R8,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SHR $0x5,%R13 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R8D,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
AND $-0x20,%R15D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R8D,%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAL $0x3,%RDI | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SAL $0x3,%R14 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
AND $-0x4,%R12D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA (%RAX,%RAX,2),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SAL $0x8,%R13 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LEA 0xc0(%R9),%R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R14,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDI,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
XOR %R14D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RAX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
LEA 0xc0(%RSI),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JMP 4c20c <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0x21c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
VMOVSD 0x10(%RBX),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD $0x38,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 |
Source file and lines | DiracDeterminantRef.cpp:235-255 |
Module | libqmcwfs.so |
nb instructions | 104 |
nb uops | 91 |
loop length | 460 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 4 |
used ymm registers | 3 |
used zmm registers | 6 |
nb stack references | 6 |
ADD-SUB / MUL ratio | 1.33 |
micro-operation queue | 15.17 cycles |
front end | 15.17 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 5.00 | 5.00 | 5.00 | 5.00 | 3.00 | 14.67 | 14.67 | 14.67 | 2.50 | 2.50 | 2.67 | 2.33 | 1.50 | 1.50 |
cycles | 5.00 | 5.00 | 5.00 | 5.00 | 3.00 | 16.67 | 16.67 | 16.67 | 2.50 | 2.50 | 2.67 | 2.33 | 1.50 | 1.50 |
Cycles executing div or sqrt instructions | NA |
Front-end | 15.17 |
Dispatch | 16.67 |
Overall L1 | 16.67 |
all | 5% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 60% |
load | 64% |
store | 33% |
mul | 66% |
add-sub | 25% |
fma | 0% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 100% |
all | 35% |
load | 50% |
store | 11% |
mul | 66% |
add-sub | 25% |
fma | 0% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 27% |
all | 11% |
load | 10% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 41% |
load | 51% |
store | 16% |
mul | 20% |
add-sub | 15% |
fma | 12% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 25% |
all | 28% |
load | 42% |
store | 13% |
mul | 20% |
add-sub | 15% |
fma | 12% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB $0x38,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4efa0 <@plt_start@+0x600> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x484(%RBX),%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP $0x1,%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JNE 4c08f <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0x9f> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV 0x100(%RBX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x140(%RBX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x18(%R15),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VMOVDDUP (%RAX),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSXD 0x478(%RBX),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VMULPD (%RCX),%XMM0,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMULSD 0x10(%RCX),%XMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
LEA (%RAX,%RAX,2),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
VADDPD (%RDX,%RSI,8),%XMM2,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VMULPD %XMM2,%XMM2,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVUPD %XMM3,(%RDX,%RSI,8) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VADDSD 0x10(%RDX,%RSI,8),%XMM1,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VMOVSD %XMM3,0x10(%RDX,%RSI,8) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
VPERMILPD $0x1,%XMM2,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOV 0x180(%RBX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VADDSD %XMM2,%XMM3,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
MOV 0x18(%R12),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VFMADD231SD %XMM1,%XMM1,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMSUB231SD (%RCX),%XMM0,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDSD (%RDX,%RAX,8),%XMM2,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VMOVSD %XMM0,(%RDX,%RAX,8) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
JMP 4c73d <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0x74d> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
TEST %R10D,%R10D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 4c73d <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0x74d> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV 0x118(%RBX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VMOVAPD -0x43ba7(%RIP),%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVAPD -0x43c2f(%RIP),%YMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVAPD -0x43c17(%RIP),%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVAPD -0x42e81(%RIP),%ZMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVAPD -0x42e4b(%RIP),%ZMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVAPD -0x42e15(%RIP),%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVAPD -0x42ddf(%RIP),%ZMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVAPD -0x42da9(%RIP),%ZMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVAPD -0x42d73(%RIP),%ZMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0x480(%RBX),%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x18(%R15),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x18(%R12),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0xd8(%RBX),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x158(%RBX),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x100(%RBX),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x180(%RBX),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVSXD 0x478(%RBX),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV 0x140(%RBX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R10,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SAL $0x3,%RAX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R8,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SHR $0x5,%R13 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R8D,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
AND $-0x20,%R15D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R8D,%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAL $0x3,%RDI | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SAL $0x3,%R14 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
AND $-0x4,%R12D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA (%RAX,%RAX,2),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SAL $0x8,%R13 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LEA 0xc0(%R9),%R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R14,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDI,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
XOR %R14D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RAX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
LEA 0xc0(%RSI),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JMP 4c20c <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE+0x21c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
VMOVSD 0x10(%RBX),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD $0x38,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE11evaluateLogERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEE– | 0.06 | 0.11 |
▼Loop 894 - OhmmsMatrix.h:217-217 - libqmcwfs.so– | 0 | 0 |
○Loop 895 - inner_product.hpp:155-155 - libqmcwfs.so | 0.04 | 0.08 |
○Loop 896 - inner_product.hpp:82-83 - libqmcwfs.so | 0.01 | 0.02 |
○Loop 900 - inner_product.hpp:155-155 - libqmcwfs.so | 0 | 0 |
○Loop 899 - inner_product.hpp:155-155 - libqmcwfs.so | 0 | 0 |
○Loop 897 - inner_product.hpp:82-83 - libqmcwfs.so | 0 | 0 |
○Loop 898 - inner_product.hpp:82-83 - libqmcwfs.so | 0 | 0 |