Function: miniqmcreference::OneBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::computeU3(qmcpl ... | Module: exec | Source: OneBodyJastrowRef.h:209-245 [...] | Coverage: 0.01% |
---|
Function: miniqmcreference::OneBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::computeU3(qmcpl ... | Module: exec | Source: OneBodyJastrowRef.h:209-245 [...] | Coverage: 0.01% |
---|
/home/kcamus/qaas_runs/169-451-1869/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/Jastrow/BsplineFunctor.h: 188 - 217 |
-------------------------------------------------------------------------------- |
188: if (r >= cutoff_radius) |
189: { |
190: dudr = d2udr2 = 0.0; |
191: return 0.0; |
192: } |
193: r *= DeltaRInv; |
194: real_type ipart, t; |
195: t = std::modf(r, &ipart); |
196: int i = (int)ipart; |
197: real_type tp[4]; |
198: tp[0] = t * t * t; |
199: tp[1] = t * t; |
200: tp[2] = t; |
201: tp[3] = 1.0; |
202: // clang-format off |
203: d2udr2 = DeltaRInv * DeltaRInv * |
204: (SplineCoefs[i+0]*(d2A[ 0]*tp[0] + d2A[ 1]*tp[1] + d2A[ 2]*tp[2] + d2A[ 3]*tp[3])+ |
205: SplineCoefs[i+1]*(d2A[ 4]*tp[0] + d2A[ 5]*tp[1] + d2A[ 6]*tp[2] + d2A[ 7]*tp[3])+ |
206: SplineCoefs[i+2]*(d2A[ 8]*tp[0] + d2A[ 9]*tp[1] + d2A[10]*tp[2] + d2A[11]*tp[3])+ |
207: SplineCoefs[i+3]*(d2A[12]*tp[0] + d2A[13]*tp[1] + d2A[14]*tp[2] + d2A[15]*tp[3])); |
208: dudr = DeltaRInv * |
209: (SplineCoefs[i+0]*(dA[ 0]*tp[0] + dA[ 1]*tp[1] + dA[ 2]*tp[2] + dA[ 3]*tp[3])+ |
210: SplineCoefs[i+1]*(dA[ 4]*tp[0] + dA[ 5]*tp[1] + dA[ 6]*tp[2] + dA[ 7]*tp[3])+ |
211: SplineCoefs[i+2]*(dA[ 8]*tp[0] + dA[ 9]*tp[1] + dA[10]*tp[2] + dA[11]*tp[3])+ |
212: SplineCoefs[i+3]*(dA[12]*tp[0] + dA[13]*tp[1] + dA[14]*tp[2] + dA[15]*tp[3])); |
213: return |
214: (SplineCoefs[i+0]*(A[ 0]*tp[0] + A[ 1]*tp[1] + A[ 2]*tp[2] + A[ 3]*tp[3])+ |
215: SplineCoefs[i+1]*(A[ 4]*tp[0] + A[ 5]*tp[1] + A[ 6]*tp[2] + A[ 7]*tp[3])+ |
216: SplineCoefs[i+2]*(A[ 8]*tp[0] + A[ 9]*tp[1] + A[10]*tp[2] + A[11]*tp[3])+ |
217: SplineCoefs[i+3]*(A[12]*tp[0] + A[13]*tp[1] + A[14]*tp[2] + A[15]*tp[3])); |
/home/kcamus/qaas_runs/169-451-1869/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/OhmmsVector.h: 229 - 229 |
-------------------------------------------------------------------------------- |
229: return X[i]; |
/usr/include/c++/13.1.1/bits/stl_vector.h: 1123 - 1258 |
-------------------------------------------------------------------------------- |
1123: operator[](size_type __n) _GLIBCXX_NOEXCEPT |
1124: { |
1125: __glibcxx_requires_subscript(__n); |
1126: return *(this->_M_impl._M_start + __n); |
[...] |
1258: { return _M_data_ptr(this->_M_impl._M_start); } |
/usr/include/c++/13.1.1/bits/stl_algobase.h: 930 - 1128 |
-------------------------------------------------------------------------------- |
930: for (; __first != __last; ++__first) |
931: *__first = __tmp; |
[...] |
1123: if (__n <= 0) |
1124: return __first; |
1125: |
1126: __glibcxx_requires_can_increment(__first, __n); |
1127: |
1128: std::__fill_a(__first, __first + __n, __value); |
/home/kcamus/qaas_runs/169-451-1869/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/Jastrow/OneBodyJastrowRef.h: 209 - 245 |
-------------------------------------------------------------------------------- |
209: inline void computeU3(ParticleSet& P, int iat, const valT* dist) |
210: { |
211: if (NumGroups > 0) |
[...] |
218: for (int jg = 0; jg < NumGroups; ++jg) |
219: { |
220: if (F[jg] == nullptr) |
221: continue; |
222: F[jg]->evaluateVGL(-1, |
[...] |
235: for (int c = 0; c < Nions; ++c) |
236: { |
237: int gid = Ions.GroupID[c]; |
238: if (F[gid] != nullptr) |
239: { |
240: U[c] = F[gid]->evaluate(dist[c], dU[c], d2U[c]); |
241: dU[c] /= dist[c]; |
242: } |
243: } |
244: } |
245: } |
0x41b270 LEA 0x8(%RSP),%R10 |
0x41b275 AND $-0x20,%RSP |
0x41b279 PUSHQ -0x8(%R10) |
0x41b27d PUSH %RBP |
0x41b27e MOV %RSP,%RBP |
0x41b281 PUSH %R15 |
0x41b283 PUSH %R14 |
0x41b285 PUSH %R13 |
0x41b287 PUSH %R12 |
0x41b289 MOV %RDI,%R12 |
0x41b28c PUSH %R10 |
0x41b28e MOV %RSI,%R10 |
0x41b291 PUSH %RBX |
0x41b292 SUB $0x60,%RSP |
0x41b296 MOV %FS:0x28,%RAX |
0x41b29f MOV %RAX,-0x38(%RBP) |
0x41b2a3 XOR %EAX,%EAX |
0x41b2a5 MOV 0x9c(%RDI),%EAX |
0x41b2ab MOVSXD 0x94(%RDI),%RBX |
0x41b2b2 TEST %EAX,%EAX |
0x41b2b4 JLE 41b398 |
0x41b2ba MOV 0xf8(%RDI),%R13 |
0x41b2c1 MOV 0x128(%RDI),%R14 |
0x41b2c8 MOV 0x110(%RDI),%R15 |
0x41b2cf TEST %EBX,%EBX |
0x41b2d1 JLE 41b306 |
0x41b2d3 SAL $0x3,%RBX |
0x41b2d7 MOV %RSI,-0x48(%RBP) |
0x41b2db MOV %R13,%RDI |
0x41b2de XOR %ESI,%ESI |
0x41b2e0 MOV %RBX,%RDX |
0x41b2e3 CALL 404150 <memset@plt> |
0x41b2e8 MOV %RBX,%RDX |
0x41b2eb XOR %ESI,%ESI |
0x41b2ed MOV %R15,%RDI |
0x41b2f0 CALL 404150 <memset@plt> |
0x41b2f5 MOV %RBX,%RDX |
0x41b2f8 XOR %ESI,%ESI |
0x41b2fa MOV %R14,%RDI |
0x41b2fd CALL 404150 <memset@plt> |
0x41b302 MOV -0x48(%RBP),%R10 |
0x41b306 MOV %R10,-0x48(%RBP) |
0x41b30a XOR %EBX,%EBX |
0x41b30c NOPL (%RAX) |
(204) 0x41b310 MOV 0x1c0(%R12),%R9 |
(204) 0x41b318 MOV (%R9,%RBX,8),%RDI |
(204) 0x41b31c TEST %RDI,%RDI |
(204) 0x41b31f JE 41b360 |
(204) 0x41b321 MOV 0xa0(%R12),%R11 |
(204) 0x41b329 MOV -0x48(%RBP),%R8 |
(204) 0x41b32d MOV %R13,%R9 |
(204) 0x41b330 MOV $-0x1,%ESI |
(204) 0x41b335 MOV 0xa98(%R11),%RAX |
(204) 0x41b33c MOV 0x4(%RAX,%RBX,4),%ECX |
(204) 0x41b340 MOV (%RAX,%RBX,4),%EDX |
(204) 0x41b343 PUSHQ 0x158(%R12) |
(204) 0x41b34b PUSHQ 0x140(%R12) |
(204) 0x41b353 PUSH %R14 |
(204) 0x41b355 PUSH %R15 |
(204) 0x41b357 CALL 4476c0 <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi> |
(204) 0x41b35c ADD $0x20,%RSP |
(204) 0x41b360 INC %RBX |
(204) 0x41b363 CMP %EBX,0x9c(%R12) |
(204) 0x41b36b JG 41b310 |
0x41b36d MOV -0x38(%RBP),%RAX |
0x41b371 SUB %FS:0x28,%RAX |
0x41b37a JNE 41b70b |
0x41b380 LEA -0x30(%RBP),%RSP |
0x41b384 POP %RBX |
0x41b385 POP %R8 |
0x41b387 POP %R12 |
0x41b389 POP %R13 |
0x41b38b POP %R14 |
0x41b38d POP %R15 |
0x41b38f POP %RBP |
0x41b390 LEA -0x8(%R8),%RSP |
0x41b394 RET |
0x41b395 NOPL (%RAX) |
0x41b398 TEST %EBX,%EBX |
0x41b39a JLE 41b36d |
0x41b39c MOV 0xa0(%RDI),%RDX |
0x41b3a3 MOV 0x1c0(%RDI),%RCX |
0x41b3aa LEA -0x40(%RBP),%RDI |
0x41b3ae XOR %R13D,%R13D |
0x41b3b1 MOV %RDI,-0x78(%RBP) |
0x41b3b5 MOV %R12,%R15 |
0x41b3b8 MOV 0x5c0(%RDX),%RSI |
0x41b3bf MOVSXD %EBX,%RDX |
0x41b3c2 JMP 41b406 |
0x41b3c4 NOPL (%RAX) |
(203) 0x41b3c8 MOVQ $0,(%R11) |
(203) 0x41b3cf VXORPD %XMM4,%XMM4,%XMM4 |
(203) 0x41b3d3 MOVQ $0,(%R12) |
(203) 0x41b3db MOV 0xf8(%R15),%RDI |
(203) 0x41b3e2 VMOVSD %XMM4,(%RDI,%R14,1) |
(203) 0x41b3e8 VMOVSD (%R12),%XMM0 |
(203) 0x41b3ee VDIVSD (%R10,%R13,8),%XMM0,%XMM5 |
(203) 0x41b3f4 VMOVSD %XMM5,(%R12) |
(203) 0x41b3fa INC %R13 |
(203) 0x41b3fd CMP %RDX,%R13 |
(203) 0x41b400 JE 41b36d |
(203) 0x41b406 MOVSXD (%RSI,%R13,4),%R9 |
(203) 0x41b40a MOV (%RCX,%R9,8),%RBX |
(203) 0x41b40e TEST %RBX,%RBX |
(203) 0x41b411 JE 41b3fa |
(203) 0x41b413 MOV 0x128(%R15),%R11 |
(203) 0x41b41a MOV 0x110(%R15),%R12 |
(203) 0x41b421 LEA (,%R13,8),%R14 |
(203) 0x41b429 VMOVSD (%R10,%R13,8),%XMM0 |
(203) 0x41b42f ADD %R14,%R11 |
(203) 0x41b432 ADD %R14,%R12 |
(203) 0x41b435 VCOMISD 0x8(%RBX),%XMM0 |
(203) 0x41b43a JAE 41b3c8 |
(203) 0x41b43c VMOVSD 0x238(%RBX),%XMM3 |
(203) 0x41b444 MOV -0x78(%RBP),%RDI |
(203) 0x41b448 MOV %R10,-0x70(%RBP) |
(203) 0x41b44c MOV %RCX,-0x68(%RBP) |
(203) 0x41b450 VMULSD %XMM3,%XMM0,%XMM0 |
(203) 0x41b454 MOV %RSI,-0x60(%RBP) |
(203) 0x41b458 MOV %RDX,-0x58(%RBP) |
(203) 0x41b45c VMOVSD %XMM3,-0x48(%RBP) |
(203) 0x41b461 MOV %R11,-0x50(%RBP) |
(203) 0x41b465 CALL 4042f0 <modf@plt> |
(203) 0x41b46a VMOVSD 0x120(%RBX),%XMM14 |
(203) 0x41b472 VMOVSD 0x118(%RBX),%XMM7 |
(203) 0x41b47a VMULSD %XMM0,%XMM0,%XMM5 |
(203) 0x41b47e VBROADCASTSD %XMM0,%YMM2 |
(203) 0x41b483 VMOVSD 0x178(%RBX),%XMM11 |
(203) 0x41b48b MOV 0x218(%RBX),%RSI |
(203) 0x41b492 VMOVHPD 0x140(%RBX),%XMM14,%XMM15 |
(203) 0x41b49a VMOVHPD 0x138(%RBX),%XMM7,%XMM10 |
(203) 0x41b4a2 VMOVSD 0x130(%RBX),%XMM14 |
(203) 0x41b4aa MOV -0x50(%RBP),%R8 |
(203) 0x41b4ae VMOVHPD 0x158(%RBX),%XMM11,%XMM12 |
(203) 0x41b4b6 VCVTTSD2SI -0x40(%RBP),%EAX |
(203) 0x41b4bb VINSERTF128 $0x1,%XMM10,%YMM12,%YMM13 |
(203) 0x41b4c1 VMOVSD 0x188(%RBX),%XMM10 |
(203) 0x41b4c9 VMULSD %XMM5,%XMM0,%XMM6 |
(203) 0x41b4cd VMOVSD 0x180(%RBX),%XMM0 |
(203) 0x41b4d5 VBROADCASTSD %XMM5,%YMM4 |
(203) 0x41b4da VMOVHPD 0x168(%RBX),%XMM10,%XMM11 |
(203) 0x41b4e2 CLTQ |
(203) 0x41b4e4 VMOVHPD 0x160(%RBX),%XMM0,%XMM3 |
(203) 0x41b4ec VMOVSD 0x190(%RBX),%XMM0 |
(203) 0x41b4f4 VPERMPD $0x4b,(%RSI,%RAX,8),%YMM8 |
(203) 0x41b4fb VINSERTF128 $0x1,%XMM15,%YMM3,%YMM1 |
(203) 0x41b501 VMOVHPD 0x150(%RBX),%XMM14,%XMM15 |
(203) 0x41b509 VMULPD %YMM4,%YMM1,%YMM5 |
(203) 0x41b50d VMOVHPD 0x170(%RBX),%XMM0,%XMM3 |
(203) 0x41b515 VBROADCASTSD %XMM6,%YMM9 |
(203) 0x41b51a VMOVSD 0x128(%RBX),%XMM6 |
(203) 0x41b522 VINSERTF128 $0x1,%XMM15,%YMM3,%YMM1 |
(203) 0x41b528 VMOVHPD 0x148(%RBX),%XMM6,%XMM7 |
(203) 0x41b530 VINSERTF128 $0x1,%XMM7,%YMM11,%YMM12 |
(203) 0x41b536 VMOVSD -0x48(%RBP),%XMM11 |
(203) 0x41b53b VFMADD132PD %YMM2,%YMM1,%YMM12 |
(203) 0x41b540 VFMADD132PD %YMM9,%YMM5,%YMM13 |
(203) 0x41b545 VADDPD %YMM13,%YMM12,%YMM13 |
(203) 0x41b54a VMULSD %XMM11,%XMM11,%XMM12 |
(203) 0x41b54f VMULPD %YMM8,%YMM13,%YMM8 |
(203) 0x41b554 VEXTRACTF64X2 $0x1,%YMM8,%XMM5 |
(203) 0x41b55b VADDPD %XMM8,%XMM5,%XMM6 |
(203) 0x41b560 VUNPCKHPD %XMM6,%XMM6,%XMM7 |
(203) 0x41b564 VADDPD %XMM6,%XMM7,%XMM10 |
(203) 0x41b568 VMULSD %XMM10,%XMM12,%XMM14 |
(203) 0x41b56d VMOVSD %XMM14,(%R8) |
(203) 0x41b572 VMOVSD 0xa0(%RBX),%XMM5 |
(203) 0x41b57a VMOVSD 0x100(%RBX),%XMM7 |
(203) 0x41b582 VMOVSD 0x98(%RBX),%XMM0 |
(203) 0x41b58a VMOVSD 0xf8(%RBX),%XMM3 |
(203) 0x41b592 VMOVHPD 0xc0(%RBX),%XMM5,%XMM6 |
(203) 0x41b59a VMOVHPD 0xe0(%RBX),%XMM7,%XMM10 |
(203) 0x41b5a2 VMOVSD 0xa8(%RBX),%XMM14 |
(203) 0x41b5aa VPERMPD $0x4b,(%RSI,%RAX,8),%YMM15 |
(203) 0x41b5b1 VINSERTF128 $0x1,%XMM6,%YMM10,%YMM11 |
(203) 0x41b5b7 VMOVHPD 0xd8(%RBX),%XMM3,%XMM13 |
(203) 0x41b5bf VMOVHPD 0xb8(%RBX),%XMM0,%XMM1 |
(203) 0x41b5c7 VMULPD %YMM4,%YMM11,%YMM12 |
(203) 0x41b5cb VINSERTF128 $0x1,%XMM1,%YMM13,%YMM8 |
(203) 0x41b5d1 VMOVHPD 0xc8(%RBX),%XMM14,%XMM1 |
(203) 0x41b5d9 VMOVSD 0x108(%RBX),%XMM0 |
(203) 0x41b5e1 VMOVSD 0xb0(%RBX),%XMM5 |
(203) 0x41b5e9 VMOVSD 0x110(%RBX),%XMM7 |
(203) 0x41b5f1 VMOVHPD 0xe8(%RBX),%XMM0,%XMM3 |
(203) 0x41b5f9 MOV -0x70(%RBP),%R10 |
(203) 0x41b5fd MOV -0x68(%RBP),%RCX |
(203) 0x41b601 VMOVHPD 0xd0(%RBX),%XMM5,%XMM6 |
(203) 0x41b609 VMOVHPD 0xf0(%RBX),%XMM7,%XMM10 |
(203) 0x41b611 VINSERTF128 $0x1,%XMM1,%YMM3,%YMM13 |
(203) 0x41b617 MOV -0x58(%RBP),%RDX |
(203) 0x41b61b VINSERTF128 $0x1,%XMM6,%YMM10,%YMM11 |
(203) 0x41b621 VFMADD132PD %YMM2,%YMM11,%YMM13 |
(203) 0x41b626 VFMADD132PD %YMM9,%YMM12,%YMM8 |
(203) 0x41b62b VADDPD %YMM8,%YMM13,%YMM8 |
(203) 0x41b630 VMULPD %YMM15,%YMM8,%YMM15 |
(203) 0x41b635 VEXTRACTF64X2 $0x1,%YMM15,%XMM12 |
(203) 0x41b63c VADDPD %XMM15,%XMM12,%XMM14 |
(203) 0x41b641 VUNPCKHPD %XMM14,%XMM14,%XMM1 |
(203) 0x41b646 VADDPD %XMM14,%XMM1,%XMM0 |
(203) 0x41b64b VMULSD 0x238(%RBX),%XMM0,%XMM3 |
(203) 0x41b653 VMOVSD %XMM3,(%R12) |
(203) 0x41b659 VMOVSD 0x20(%RBX),%XMM8 |
(203) 0x41b65e VMOVSD 0x80(%RBX),%XMM12 |
(203) 0x41b666 VMOVSD 0x18(%RBX),%XMM5 |
(203) 0x41b66b VMOVSD 0x78(%RBX),%XMM7 |
(203) 0x41b670 VMOVHPD 0x40(%RBX),%XMM8,%XMM15 |
(203) 0x41b675 VMOVHPD 0x60(%RBX),%XMM12,%XMM14 |
(203) 0x41b67a VMOVSD 0x28(%RBX),%XMM0 |
(203) 0x41b67f VMOVSD 0x88(%RBX),%XMM3 |
(203) 0x41b687 VINSERTF128 $0x1,%XMM15,%YMM14,%YMM1 |
(203) 0x41b68d VMOVHPD 0x38(%RBX),%XMM5,%XMM6 |
(203) 0x41b692 VMOVHPD 0x58(%RBX),%XMM7,%XMM10 |
(203) 0x41b697 VMOVSD 0x90(%RBX),%XMM8 |
(203) 0x41b69f VMULPD %YMM4,%YMM1,%YMM4 |
(203) 0x41b6a3 VINSERTF128 $0x1,%XMM6,%YMM10,%YMM11 |
(203) 0x41b6a9 VMOVSD 0x30(%RBX),%XMM10 |
(203) 0x41b6ae VMOVHPD 0x48(%RBX),%XMM0,%XMM5 |
(203) 0x41b6b3 VMOVHPD 0x68(%RBX),%XMM3,%XMM6 |
(203) 0x41b6b8 VMOVHPD 0x70(%RBX),%XMM8,%XMM15 |
(203) 0x41b6bd VPERMPD $0x4b,(%RSI,%RAX,8),%YMM13 |
(203) 0x41b6c4 MOV -0x60(%RBP),%RSI |
(203) 0x41b6c8 VINSERTF128 $0x1,%XMM5,%YMM6,%YMM7 |
(203) 0x41b6ce VFMADD132PD %YMM11,%YMM4,%YMM9 |
(203) 0x41b6d3 VMOVHPD 0x50(%RBX),%XMM10,%XMM11 |
(203) 0x41b6d8 VINSERTF128 $0x1,%XMM11,%YMM15,%YMM12 |
(203) 0x41b6de VFMADD231PD %YMM7,%YMM2,%YMM12 |
(203) 0x41b6e3 VADDPD %YMM9,%YMM12,%YMM2 |
(203) 0x41b6e8 VMULPD %YMM13,%YMM2,%YMM9 |
(203) 0x41b6ed VEXTRACTF64X2 $0x1,%YMM9,%XMM13 |
(203) 0x41b6f4 VADDPD %XMM9,%XMM13,%XMM14 |
(203) 0x41b6f9 VUNPCKHPD %XMM14,%XMM14,%XMM1 |
(203) 0x41b6fe VADDPD %XMM14,%XMM1,%XMM4 |
(203) 0x41b703 VZEROUPPER |
(203) 0x41b706 JMP 41b3db |
0x41b70b CALL 404140 <__stack_chk_fail@plt> |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►100.00+ | miniqmcreference::OneBodyJastr[...] | stl_vector.h:1123 | exec |
○ | qmcplusplus::WaveFunction::rat[...] | WaveFunction.cpp:207 | exec |
○ | main._omp_fn.1 | miniqmc.cpp:438 | exec |
○ | GOMP_parallel | libgomp.h:985 | libgomp.so.1.0.0 |
Path / |
Source file and lines | OneBodyJastrowRef.h:209-245 |
Module | exec |
nb instructions | 71 |
nb uops | 76 |
loop length | 256 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 6 |
micro-operation queue | 19.00 cycles |
front end | 19.00 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | |
---|---|---|---|---|---|---|---|---|
uops | 5.50 | 5.25 | 12.33 | 12.33 | 16.00 | 5.25 | 6.00 | 12.33 |
cycles | 5.50 | 5.25 | 12.33 | 12.33 | 16.00 | 5.25 | 6.00 | 12.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 18.11 |
Stall cycles | 0.00 |
Front-end | 19.00 |
Dispatch | 16.00 |
Overall L1 | 19.00 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 10% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 7% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|
LEA 0x8(%RSP),%R10 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
AND $-0x20,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
PUSHQ -0x8(%R10) | 2 | 0 | 0 | 0.83 | 0.83 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSH %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RDI,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSH %R10 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RSI,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSH %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
SUB $0x60,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %FS:0x28,%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RAX,-0x38(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV 0x9c(%RDI),%EAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOVSXD 0x94(%RDI),%RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
TEST %EAX,%EAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JLE 41b398 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE9computeU3ERNS1_11ParticleSetEiPKd.isra.0+0x128> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV 0xf8(%RDI),%R13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x128(%RDI),%R14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x110(%RDI),%R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
TEST %EBX,%EBX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JLE 41b306 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE9computeU3ERNS1_11ParticleSetEiPKd.isra.0+0x96> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
SAL $0x3,%RBX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
MOV %RSI,-0x48(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RBX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 404150 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV %RBX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R15,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 404150 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV %RBX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 404150 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV -0x48(%RBP),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %R10,-0x48(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
SUB %FS:0x28,%RAX | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
JNE 41b70b <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE9computeU3ERNS1_11ParticleSetEiPKd.isra.0+0x49b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
LEA -0x30(%RBP),%RSP | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
POP %RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %RBP | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
LEA -0x8(%R8),%RSP | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
RET | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 | 0 | 1 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
TEST %EBX,%EBX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JLE 41b36d <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE9computeU3ERNS1_11ParticleSetEiPKd.isra.0+0xfd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV 0xa0(%RDI),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x1c0(%RDI),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA -0x40(%RBP),%RDI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %R13D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RDI,-0x78(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R12,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV 0x5c0(%RDX),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOVSXD %EBX,%RDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JMP 41b406 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE9computeU3ERNS1_11ParticleSetEiPKd.isra.0+0x196> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 404140 <__stack_chk_fail@plt> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
Source file and lines | OneBodyJastrowRef.h:209-245 |
Module | exec |
nb instructions | 71 |
nb uops | 76 |
loop length | 256 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 6 |
micro-operation queue | 19.00 cycles |
front end | 19.00 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | |
---|---|---|---|---|---|---|---|---|
uops | 5.50 | 5.25 | 12.33 | 12.33 | 16.00 | 5.25 | 6.00 | 12.33 |
cycles | 5.50 | 5.25 | 12.33 | 12.33 | 16.00 | 5.25 | 6.00 | 12.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 18.11 |
Stall cycles | 0.00 |
Front-end | 19.00 |
Dispatch | 16.00 |
Overall L1 | 19.00 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 10% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 7% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|
LEA 0x8(%RSP),%R10 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
AND $-0x20,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
PUSHQ -0x8(%R10) | 2 | 0 | 0 | 0.83 | 0.83 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSH %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RDI,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSH %R10 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RSI,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSH %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
SUB $0x60,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %FS:0x28,%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RAX,-0x38(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV 0x9c(%RDI),%EAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOVSXD 0x94(%RDI),%RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
TEST %EAX,%EAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JLE 41b398 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE9computeU3ERNS1_11ParticleSetEiPKd.isra.0+0x128> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV 0xf8(%RDI),%R13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x128(%RDI),%R14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x110(%RDI),%R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
TEST %EBX,%EBX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JLE 41b306 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE9computeU3ERNS1_11ParticleSetEiPKd.isra.0+0x96> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
SAL $0x3,%RBX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
MOV %RSI,-0x48(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RBX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 404150 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV %RBX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R15,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 404150 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV %RBX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 404150 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV -0x48(%RBP),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %R10,-0x48(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
SUB %FS:0x28,%RAX | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
JNE 41b70b <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE9computeU3ERNS1_11ParticleSetEiPKd.isra.0+0x49b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
LEA -0x30(%RBP),%RSP | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
POP %RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %RBP | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
LEA -0x8(%R8),%RSP | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
RET | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 | 0 | 1 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
TEST %EBX,%EBX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JLE 41b36d <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE9computeU3ERNS1_11ParticleSetEiPKd.isra.0+0xfd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV 0xa0(%RDI),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x1c0(%RDI),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA -0x40(%RBP),%RDI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %R13D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RDI,-0x78(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R12,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV 0x5c0(%RDX),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOVSXD %EBX,%RDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JMP 41b406 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE9computeU3ERNS1_11ParticleSetEiPKd.isra.0+0x196> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 404140 <__stack_chk_fail@plt> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼miniqmcreference::OneBodyJastrowRef | 0.01 | 0 |
○Loop 204 - OneBodyJastrowRef.h:218-222 - exec | 0.01 | 0 |
○Loop 203 - BsplineFunctor.h:188-217 - exec | 0 | 0 |