Function: qmcplusplus::DistanceTableBA<double, 3u, 39>::evaluate(qmcplusplus::ParticleSet&) | Module: libqmcparticle.so | Source: DistanceTableBA.h:65-105 [...] | Coverage: 0.37% |
---|
Function: qmcplusplus::DistanceTableBA<double, 3u, 39>::evaluate(qmcplusplus::ParticleSet&) | Module: libqmcparticle.so | Source: DistanceTableBA.h:65-105 [...] | Coverage: 0.37% |
---|
/home/kcamus/qaas_runs/169-390-4082/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/VectorSoAContainer.h: 237 - 239 |
-------------------------------------------------------------------------------- |
237: T* data() { return myData; } |
238: ///return the base |
239: const T* data() const { return myData; } |
/home/kcamus/qaas_runs/169-390-4082/intel/miniqmc/build/miniqmc/src/Particle/DistanceTableBA.h: 65 - 105 |
-------------------------------------------------------------------------------- |
65: inline void evaluate(ParticleSet& P) |
[...] |
73: const size_t ntgt_local = Ntargets; |
74: const size_t ntgt_padded = getAlignedSize<T>(Ntargets); |
75: const size_t nsrc_padded = getAlignedSize<T>(Nsources); |
[...] |
83: const size_t num_teams = (nsrc_padded + ChunkSizePerTeam - 1) / ChunkSizePerTeam; |
84: |
85: PRAGMA_OFFLOAD("omp target teams distribute collapse(2) num_teams(Ntargets * num_teams) \ |
86: map(to: src_ptr[:D*Origin->RSoA.capacity()], tgt_ptr[:D*P.RSoA.capacity()]) \ |
87: map(from: dist_ptr[:Distances.size()], displ_ptr[:memoryPool.size()])") |
88: for (size_t iat = 0; iat < ntgt_local; ++iat) |
89: for (size_t team_id = 0; team_id < num_teams; ++team_id) |
90: { |
91: T pos[D]; |
92: for (int idim = 0; idim < D; idim++) |
93: pos[idim] = *(tgt_ptr + ntgt_padded * idim + iat); |
94: |
95: const size_t first = ChunkSizePerTeam * team_id; |
96: const size_t last = std::min(first + ChunkSizePerTeam, nsrc_padded); |
97: |
98: PRAGMA_OFFLOAD("omp parallel for") |
99: for (size_t jel = first; jel < last; ++jel) |
100: { |
101: DTD_BConds<T, D, SC>::computeDistancesOffload(pos, src_ptr, nsrc_padded, dist_ptr + nsrc_padded * iat, |
102: displ_ptr + nsrc_padded * D * iat, nsrc_padded, jel); |
103: } |
104: } |
105: } |
/usr/include/c++/13.1.1/bits/stl_vector.h: 1258 - 1258 |
-------------------------------------------------------------------------------- |
1258: { return _M_data_ptr(this->_M_impl._M_start); } |
/home/kcamus/qaas_runs/169-390-4082/intel/miniqmc/build/miniqmc/src/Particle/Lattice/ParticleBConds.h: 235 - 278 |
-------------------------------------------------------------------------------- |
235: const T* restrict py = R0 + r0_stride; |
236: const T* restrict pz = R0 + r0_stride * 2; |
[...] |
249: const T flip = iat < flip_ind ? one : minusone; |
250: const T displ_0 = (px[iat] - x0) * flip; |
251: const T displ_1 = (py[iat] - y0) * flip; |
252: const T displ_2 = (pz[iat] - z0) * flip; |
253: |
254: const T ar_0 = -std::floor(displ_0 * g00 + displ_1 * g10 + displ_2 * g20); |
255: const T ar_1 = -std::floor(displ_0 * g01 + displ_1 * g11 + displ_2 * g21); |
256: const T ar_2 = -std::floor(displ_0 * g02 + displ_1 * g12 + displ_2 * g22); |
257: |
258: const T delx = displ_0 + ar_0 * r00 + ar_1 * r10 + ar_2 * r20; |
259: const T dely = displ_1 + ar_0 * r01 + ar_1 * r11 + ar_2 * r21; |
260: const T delz = displ_2 + ar_0 * r02 + ar_1 * r12 + ar_2 * r22; |
261: |
262: T rmin = delx * delx + dely * dely + delz * delz; |
263: int ic = 0; |
264: #pragma unroll(7) |
265: for (int c = 1; c < 8; ++c) |
266: { |
267: const T x = delx + cellx[c]; |
268: const T y = dely + celly[c]; |
269: const T z = delz + cellz[c]; |
270: const T r2 = x * x + y * y + z * z; |
271: ic = (r2 < rmin) ? c : ic; |
272: rmin = (r2 < rmin) ? r2 : rmin; |
273: } |
274: |
275: temp_r[iat] = std::sqrt(rmin); |
276: dx[iat] = flip * (delx + cellx[ic]); |
277: dy[iat] = flip * (dely + celly[ic]); |
278: dz[iat] = flip * (delz + cellz[ic]); |
/home/kcamus/qaas_runs/169-390-4082/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/OhmmsVector.h: 248 - 248 |
-------------------------------------------------------------------------------- |
248: inline pointer data() { return X; } |
/usr/include/c++/13.1.1/bits/stl_algobase.h: 238 - 238 |
-------------------------------------------------------------------------------- |
238: if (__b < __a) |
/home/kcamus/qaas_runs/169-390-4082/intel/miniqmc/build/miniqmc/src/Platforms/CPU/SIMD/aligned_allocator.hpp: 46 - 46 |
-------------------------------------------------------------------------------- |
46: return ((n + ND - 1) / ND) * ND; |
0xa810 PUSH %RBP |
0xa811 MOV %RSI,%R8 |
0xa814 MOV %RDI,%R9 |
0xa817 MOV %RSP,%RBP |
0xa81a PUSH %R15 |
0xa81c PUSH %R14 |
0xa81e PUSH %R13 |
0xa820 PUSH %R12 |
0xa822 PUSH %RBX |
0xa823 SUB $0x78,%RSP |
0xa827 MOVSXD 0xc4(%RDI),%RSI |
0xa82e MOVSXD 0xc8(%RDI),%RDX |
0xa835 MOV 0x8(%R9),%RCX |
0xa839 MOV 0x40(%RDI),%R10 |
0xa83d ADD $0x7,%RSI |
0xa841 LEA 0x7(%RDX),%RAX |
0xa845 MOV 0xa8(%RDI),%RDI |
0xa84c MOV 0x610(%R8),%R14 |
0xa853 AND $-0x8,%RSI |
0xa857 MOV 0x610(%RCX),%R15 |
0xa85e AND $-0x8,%RAX |
0xa862 LEA 0x7f(%RSI),%RCX |
0xa866 SHR $0x7,%RCX |
0xa86a TEST %RDX,%RDX |
0xa86d JE ae14 |
0xa873 LEA (%RSI,%RSI,1),%EBX |
0xa876 SAL $0x3,%RAX |
0xa87a LEA (%RSI,%RSI,2),%R12 |
0xa87e MOV %RSI,-0xf0(%RBP) |
0xa885 MOVSXD %EBX,%R13 |
0xa888 LEA (%R14,%RAX,1),%RBX |
0xa88c LEA (,%R12,8),%R8 |
0xa894 MOV %RDI,%R12 |
0xa897 LEA (,%RSI,8),%R11 |
0xa89f ADD %RBX,%RAX |
0xa8a2 MOV %RCX,%RDI |
0xa8a5 MOV %RBX,-0xe0(%RBP) |
0xa8ac SAL $0x7,%RDI |
0xa8b0 MOV %R11,-0x100(%RBP) |
0xa8b7 VMOVSD 0x13e61(%RIP),%XMM10 |
0xa8bf MOVSXD %ESI,%R11 |
0xa8c2 MOV %R8,-0x108(%RBP) |
0xa8c9 XOR %R8D,%R8D |
0xa8cc MOV %RAX,-0xd8(%RBP) |
0xa8d3 XOR %EAX,%EAX |
0xa8d5 MOV %RDI,-0xe8(%RBP) |
0xa8dc MOV %RAX,%RDI |
0xa8df MOV %R14,-0xf8(%RBP) |
0xa8e6 MOV %R11,%R14 |
0xa8e9 MOV %R13,%R11 |
0xa8ec MOV %R8,%R13 |
(54) 0xa8ef TEST %RCX,%RCX |
(54) 0xa8f2 JE adf4 |
(54) 0xa8f8 MOV %RDX,-0x110(%RBP) |
(54) 0xa8ff XOR %EAX,%EAX |
(54) 0xa901 MOV %R10,%RBX |
(54) 0xa904 MOV %RCX,-0x118(%RBP) |
(54) 0xa90b NOPL (%RAX,%RAX,1) |
(55) 0xa910 MOV -0xf0(%RBP),%R8 |
(55) 0xa917 MOV %RAX,%RCX |
(55) 0xa91a SUB $-0x80,%RAX |
(55) 0xa91e MOV -0xf8(%RBP),%RDX |
(55) 0xa925 MOV -0xe0(%RBP),%R10 |
(55) 0xa92c MOV -0xd8(%RBP),%RSI |
(55) 0xa933 CMP %R8,%RAX |
(55) 0xa936 VMOVSD (%RDX,%RDI,8),%XMM9 |
(55) 0xa93b CMOVBE %RAX,%R8 |
(55) 0xa93f VMOVSD (%R10,%RDI,8),%XMM8 |
(55) 0xa945 VMOVSD (%RSI,%RDI,8),%XMM7 |
(55) 0xa94a CMP %R8,%RCX |
(55) 0xa94d JAE add3 |
(55) 0xa953 VMOVSD 0x208(%R9),%XMM5 |
(55) 0xa95c VMOVSD 0x190(%R9),%XMM0 |
(55) 0xa965 VMOVSD 0x1d0(%R9),%XMM1 |
(55) 0xa96e VMOVSD 0x210(%R9),%XMM2 |
(55) 0xa977 VMOVSD 0x198(%R9),%XMM3 |
(55) 0xa980 VMOVSD 0x1d8(%R9),%XMM4 |
(55) 0xa989 VMOVSD %XMM5,-0x30(%RBP) |
(55) 0xa98e VMOVSD %XMM0,-0x98(%RBP) |
(55) 0xa996 VMOVSD 0xf0(%R9),%XMM31 |
(55) 0xa99d VMOVSD 0xf8(%R9),%XMM30 |
(55) 0xa9a4 VMOVSD %XMM1,-0xa0(%RBP) |
(55) 0xa9ac VMOVSD 0x100(%R9),%XMM29 |
(55) 0xa9b3 VMOVSD 0x108(%R9),%XMM28 |
(55) 0xa9ba VMOVSD %XMM2,-0xa8(%RBP) |
(55) 0xa9c2 VMOVSD 0x110(%R9),%XMM27 |
(55) 0xa9c9 VMOVSD 0x118(%R9),%XMM26 |
(55) 0xa9d0 VMOVSD %XMM3,-0x90(%RBP) |
(55) 0xa9d8 VMOVSD 0x120(%R9),%XMM25 |
(55) 0xa9df VMOVSD 0x128(%R9),%XMM24 |
(55) 0xa9e6 VMOVSD %XMM4,-0x88(%RBP) |
(55) 0xa9ee VMOVSD 0x130(%R9),%XMM23 |
(55) 0xa9f5 VMOVSD 0x138(%R9),%XMM22 |
(55) 0xa9fc VMOVSD 0x140(%R9),%XMM21 |
(55) 0xaa03 VMOVSD 0x148(%R9),%XMM20 |
(55) 0xaa0a VMOVSD 0x150(%R9),%XMM19 |
(55) 0xaa11 VMOVSD 0x158(%R9),%XMM18 |
(55) 0xaa18 VMOVSD 0x160(%R9),%XMM17 |
(55) 0xaa1f VMOVSD 0x168(%R9),%XMM16 |
(55) 0xaa26 VMOVSD 0x170(%R9),%XMM15 |
(55) 0xaa2f VMOVSD 0x178(%R9),%XMM14 |
(55) 0xaa38 VMOVSD 0x188(%R9),%XMM13 |
(55) 0xaa41 VMOVSD 0x1c8(%R9),%XMM12 |
(55) 0xaa4a VMOVSD 0x218(%R9),%XMM6 |
(55) 0xaa53 VMOVSD 0x1a0(%R9),%XMM11 |
(55) 0xaa5c MOV %RAX,-0xc8(%RBP) |
(55) 0xaa63 VMOVSD 0x1e0(%R9),%XMM5 |
(55) 0xaa6c VMOVSD 0x220(%R9),%XMM0 |
(55) 0xaa75 MOV %RDI,-0xd0(%RBP) |
(55) 0xaa7c VMOVSD 0x1a8(%R9),%XMM1 |
(55) 0xaa85 VMOVSD 0x1e8(%R9),%XMM2 |
(55) 0xaa8e VMOVSD %XMM6,-0x80(%RBP) |
(55) 0xaa93 VMOVSD 0x228(%R9),%XMM3 |
(55) 0xaa9c VMOVSD 0x1b0(%R9),%XMM4 |
(55) 0xaaa5 VMOVSD %XMM11,-0x78(%RBP) |
(55) 0xaaaa VMOVSD 0x1f0(%R9),%XMM6 |
(55) 0xaab3 VMOVSD 0x230(%R9),%XMM11 |
(55) 0xaabc VMOVSD %XMM5,-0x70(%RBP) |
(55) 0xaac1 VMOVSD %XMM0,-0x68(%RBP) |
(55) 0xaac6 VMOVSD 0x1b8(%R9),%XMM5 |
(55) 0xaacf VMOVSD 0x1f8(%R9),%XMM0 |
(55) 0xaad8 VMOVSD %XMM1,-0x60(%RBP) |
(55) 0xaadd VMOVSD 0x238(%R9),%XMM1 |
(55) 0xaae6 VMOVSD %XMM2,-0x58(%RBP) |
(55) 0xaaeb VMOVSD %XMM3,-0x50(%RBP) |
(55) 0xaaf0 VMOVSD %XMM4,-0x48(%RBP) |
(55) 0xaaf5 VMOVSD %XMM6,-0x40(%RBP) |
(55) 0xaafa VMOVSD %XMM11,-0x38(%RBP) |
(55) 0xaaff VMOVSD %XMM5,-0xc0(%RBP) |
(55) 0xab07 VMOVSD %XMM0,-0xb8(%RBP) |
(55) 0xab0f VMOVSD %XMM1,-0xb0(%RBP) |
(55) 0xab17 NOPW (%RAX,%RAX,1) |
(56) 0xab20 MOVSXD %ECX,%RDX |
(56) 0xab23 VMOVSD %XMM10,%XMM10,%XMM5 |
(56) 0xab27 TEST %ECX,%ECX |
(56) 0xab29 JNS ab37 |
(56) 0xab2b MOV 0x13bde(%RIP),%RAX |
(56) 0xab32 VMOVQ %RAX,%XMM5 |
(56) 0xab37 LEA (%RDX,%R14,1),%RDI |
(56) 0xab3b VMOVSD (%R15,%RDX,8),%XMM2 |
(56) 0xab41 LEA (%R11,%RDX,1),%RSI |
(56) 0xab45 VMOVSD (%R15,%RDI,8),%XMM4 |
(56) 0xab4b VMOVSD (%R15,%RSI,8),%XMM11 |
(56) 0xab51 VSUBSD %XMM9,%XMM2,%XMM3 |
(56) 0xab56 VSUBSD %XMM8,%XMM4,%XMM6 |
(56) 0xab5b VSUBSD %XMM7,%XMM11,%XMM0 |
(56) 0xab5f VMULSD %XMM5,%XMM3,%XMM3 |
(56) 0xab63 VMULSD %XMM5,%XMM6,%XMM2 |
(56) 0xab67 VMULSD %XMM5,%XMM0,%XMM0 |
(56) 0xab6b VMULSD %XMM27,%XMM2,%XMM4 |
(56) 0xab71 VMULSD %XMM30,%XMM2,%XMM1 |
(56) 0xab77 VFMADD231SD %XMM28,%XMM3,%XMM4 |
(56) 0xab7d VFMADD231SD %XMM31,%XMM3,%XMM1 |
(56) 0xab83 VFMADD231SD %XMM26,%XMM0,%XMM4 |
(56) 0xab89 VFMADD231SD %XMM29,%XMM0,%XMM1 |
(56) 0xab8f VRNDSCALESD $0x9,%XMM4,%XMM4,%XMM6 |
(56) 0xab96 VMULSD %XMM24,%XMM2,%XMM4 |
(56) 0xab9c VRNDSCALESD $0x9,%XMM1,%XMM1,%XMM11 |
(56) 0xaba3 VXORPD 0x13bd5(%RIP),%XMM6,%XMM1 |
(56) 0xabab VMULSD %XMM21,%XMM1,%XMM6 |
(56) 0xabb1 VFMADD231SD %XMM25,%XMM3,%XMM4 |
(56) 0xabb7 VFNMADD231SD %XMM22,%XMM11,%XMM6 |
(56) 0xabbd VFMADD231SD %XMM23,%XMM0,%XMM4 |
(56) 0xabc3 VRNDSCALESD $0x9,%XMM4,%XMM4,%XMM4 |
(56) 0xabca VFNMADD231SD %XMM20,%XMM4,%XMM3 |
(56) 0xabd0 VFNMADD231SD %XMM17,%XMM4,%XMM2 |
(56) 0xabd6 VFNMADD231SD %XMM14,%XMM4,%XMM0 |
(56) 0xabdb VADDSD %XMM3,%XMM6,%XMM3 |
(56) 0xabdf VMULSD %XMM18,%XMM1,%XMM6 |
(56) 0xabe5 VMULSD %XMM15,%XMM1,%XMM1 |
(56) 0xabea VFNMADD231SD %XMM19,%XMM11,%XMM6 |
(56) 0xabf0 VFNMADD231SD %XMM16,%XMM11,%XMM1 |
(56) 0xabf6 VADDSD %XMM13,%XMM3,%XMM11 |
(56) 0xabfb VADDSD %XMM2,%XMM6,%XMM2 |
(56) 0xabff VADDSD %XMM0,%XMM1,%XMM0 |
(56) 0xac03 VADDSD %XMM12,%XMM2,%XMM6 |
(56) 0xac08 VMULSD %XMM2,%XMM2,%XMM4 |
(56) 0xac0c VADDSD -0x30(%RBP),%XMM0,%XMM1 |
(56) 0xac11 VMULSD %XMM6,%XMM6,%XMM6 |
(56) 0xac15 VFMADD231SD %XMM3,%XMM3,%XMM4 |
(56) 0xac1a VFMADD132SD %XMM11,%XMM6,%XMM11 |
(56) 0xac1f VADDSD -0xa8(%RBP),%XMM0,%XMM6 |
(56) 0xac27 VFMADD231SD %XMM0,%XMM0,%XMM4 |
(56) 0xac2c VFMADD132SD %XMM1,%XMM11,%XMM1 |
(56) 0xac31 VADDSD -0xa0(%RBP),%XMM2,%XMM11 |
(56) 0xac39 VMULSD %XMM11,%XMM11,%XMM11 |
(56) 0xac3e VCOMISD %XMM1,%XMM4 |
(56) 0xac42 VMINSD %XMM1,%XMM4,%XMM4 |
(56) 0xac46 VADDSD -0x98(%RBP),%XMM3,%XMM1 |
(56) 0xac4e VFMADD132SD %XMM1,%XMM11,%XMM1 |
(56) 0xac53 VADDSD -0x88(%RBP),%XMM2,%XMM11 |
(56) 0xac5b SETA %R10B |
(56) 0xac5f MOVZX %R10B,%EAX |
(56) 0xac63 MOV $0x2,%R10D |
(56) 0xac69 VMULSD %XMM11,%XMM11,%XMM11 |
(56) 0xac6e VFMADD231SD %XMM6,%XMM6,%XMM1 |
(56) 0xac73 VADDSD -0x80(%RBP),%XMM0,%XMM6 |
(56) 0xac78 VCOMISD %XMM1,%XMM4 |
(56) 0xac7c VMINSD %XMM4,%XMM1,%XMM1 |
(56) 0xac80 VADDSD -0x90(%RBP),%XMM3,%XMM4 |
(56) 0xac88 VFMADD132SD %XMM4,%XMM11,%XMM4 |
(56) 0xac8d VADDSD -0x70(%RBP),%XMM2,%XMM11 |
(56) 0xac92 CMOVA %R10,%RAX |
(56) 0xac96 MOV $0x3,%R10D |
(56) 0xac9c VMULSD %XMM11,%XMM11,%XMM11 |
(56) 0xaca1 VFMADD231SD %XMM6,%XMM6,%XMM4 |
(56) 0xaca6 VADDSD -0x68(%RBP),%XMM0,%XMM6 |
(56) 0xacab VCOMISD %XMM4,%XMM1 |
(56) 0xacaf VMINSD %XMM1,%XMM4,%XMM4 |
(56) 0xacb3 VADDSD -0x78(%RBP),%XMM3,%XMM1 |
(56) 0xacb8 VFMADD132SD %XMM1,%XMM11,%XMM1 |
(56) 0xacbd VADDSD -0x58(%RBP),%XMM2,%XMM11 |
(56) 0xacc2 CMOVA %R10,%RAX |
(56) 0xacc6 MOV $0x4,%R10D |
(56) 0xaccc VMULSD %XMM11,%XMM11,%XMM11 |
(56) 0xacd1 VFMADD231SD %XMM6,%XMM6,%XMM1 |
(56) 0xacd6 VADDSD -0x50(%RBP),%XMM0,%XMM6 |
(56) 0xacdb VCOMISD %XMM1,%XMM4 |
(56) 0xacdf VMINSD %XMM4,%XMM1,%XMM1 |
(56) 0xace3 VADDSD -0x60(%RBP),%XMM3,%XMM4 |
(56) 0xace8 VFMADD132SD %XMM4,%XMM11,%XMM4 |
(56) 0xaced VADDSD -0x40(%RBP),%XMM2,%XMM11 |
(56) 0xacf2 CMOVA %R10,%RAX |
(56) 0xacf6 MOV $0x5,%R10D |
(56) 0xacfc VMULSD %XMM11,%XMM11,%XMM11 |
(56) 0xad01 VFMADD231SD %XMM6,%XMM6,%XMM4 |
(56) 0xad06 VADDSD -0x38(%RBP),%XMM0,%XMM6 |
(56) 0xad0b VCOMISD %XMM4,%XMM1 |
(56) 0xad0f VMINSD %XMM1,%XMM4,%XMM4 |
(56) 0xad13 VADDSD -0x48(%RBP),%XMM3,%XMM1 |
(56) 0xad18 VFMADD132SD %XMM1,%XMM11,%XMM1 |
(56) 0xad1d VADDSD -0xb8(%RBP),%XMM2,%XMM11 |
(56) 0xad25 CMOVA %R10,%RAX |
(56) 0xad29 MOV $0x6,%R10D |
(56) 0xad2f VMULSD %XMM11,%XMM11,%XMM11 |
(56) 0xad34 VFMADD231SD %XMM6,%XMM6,%XMM1 |
(56) 0xad39 VADDSD -0xb0(%RBP),%XMM0,%XMM6 |
(56) 0xad41 VCOMISD %XMM1,%XMM4 |
(56) 0xad45 VMINSD %XMM4,%XMM1,%XMM1 |
(56) 0xad49 VADDSD -0xc0(%RBP),%XMM3,%XMM4 |
(56) 0xad51 VFMADD132SD %XMM4,%XMM11,%XMM4 |
(56) 0xad56 CMOVA %R10,%RAX |
(56) 0xad5a MOV $0x7,%R10D |
(56) 0xad60 VFMADD231SD %XMM6,%XMM6,%XMM4 |
(56) 0xad65 VCOMISD %XMM4,%XMM1 |
(56) 0xad69 VMINSD %XMM4,%XMM1,%XMM1 |
(56) 0xad6d CMOVA %R10,%RAX |
(56) 0xad71 VSQRTSD %XMM1,%XMM1,%XMM1 |
(56) 0xad75 LEA (%RBX,%RDX,8),%R10 |
(56) 0xad79 INC %RCX |
(56) 0xad7c LEA (%R9,%RAX,8),%RAX |
(56) 0xad80 VADDSD 0x180(%RAX),%XMM3,%XMM3 |
(56) 0xad88 VADDSD 0x1c0(%RAX),%XMM2,%XMM2 |
(56) 0xad90 VMOVSD %XMM1,(%R10,%R13,1) |
(56) 0xad96 VADDSD 0x200(%RAX),%XMM0,%XMM0 |
(56) 0xad9e VMULSD %XMM5,%XMM3,%XMM4 |
(56) 0xada2 VMULSD %XMM5,%XMM2,%XMM6 |
(56) 0xada6 VMULSD %XMM5,%XMM0,%XMM5 |
(56) 0xadaa VMOVSD %XMM4,(%R12,%RDX,8) |
(56) 0xadb0 VMOVSD %XMM6,(%R12,%RDI,8) |
(56) 0xadb6 VMOVSD %XMM5,(%R12,%RSI,8) |
(56) 0xadbc CMP %R8,%RCX |
(56) 0xadbf JNE ab20 |
(55) 0xadc5 MOV -0xc8(%RBP),%RAX |
(55) 0xadcc MOV -0xd0(%RBP),%RDI |
(55) 0xadd3 MOV -0xe8(%RBP),%RCX |
(55) 0xadda CMP %RCX,%RAX |
(55) 0xaddd JNE a910 |
(54) 0xade3 MOV -0x110(%RBP),%RDX |
(54) 0xadea MOV -0x118(%RBP),%RCX |
(54) 0xadf1 MOV %RBX,%R10 |
(54) 0xadf4 MOV -0x100(%RBP),%RBX |
(54) 0xadfb MOV -0x108(%RBP),%R8 |
(54) 0xae02 INC %RDI |
(54) 0xae05 ADD %RBX,%R13 |
(54) 0xae08 ADD %R8,%R12 |
(54) 0xae0b CMP %RDI,%RDX |
(54) 0xae0e JNE a8ef |
0xae14 ADD $0x78,%RSP |
0xae18 POP %RBX |
0xae19 POP %R12 |
0xae1b POP %R13 |
0xae1d POP %R14 |
0xae1f POP %R15 |
0xae21 POP %RBP |
0xae22 RET |
0xae23 NOP |
0xae24 NOPW %CS:(%RAX,%RAX,1) |
0xae2f NOP |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►100.00+ | qmcplusplus::ParticleSet::upda[...] | ParticleSet.cpp:250 | libqmcparticle.so |
○ | main._omp_fn.0 | miniqmc.cpp:390 | exec |
○ | GOMP_parallel | libgomp.h:985 | libgomp.so.1.0.0 |
Path / |
Source file and lines | DistanceTableBA.h:65-105 |
Module | libqmcparticle.so |
nb instructions | 62 |
nb uops | 62 |
loop length | 251 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 1 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 7 |
micro-operation queue | 15.50 cycles |
front end | 15.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | |
---|---|---|---|---|---|---|---|---|
uops | 5.25 | 5.25 | 9.33 | 9.33 | 13.00 | 5.25 | 5.25 | 9.33 |
cycles | 5.25 | 5.75 | 9.33 | 9.33 | 13.00 | 5.25 | 5.25 | 9.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 15.61 |
Stall cycles | 0.00 |
Front-end | 15.50 |
Dispatch | 13.00 |
Overall L1 | 15.50 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 0% |
all | 0% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 12% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RSI,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RDI,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSH %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
SUB $0x78,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOVSXD 0xc4(%RDI),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOVSXD 0xc8(%RDI),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x8(%R9),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x40(%RDI),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD $0x7,%RSI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
LEA 0x7(%RDX),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa8(%RDI),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x610(%R8),%R14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
AND $-0x8,%RSI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV 0x610(%RCX),%R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
AND $-0x8,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
LEA 0x7f(%RSI),%RCX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
SHR $0x7,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
TEST %RDX,%RDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE ae14 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
LEA (%RSI,%RSI,1),%EBX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
SAL $0x3,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
LEA (%RSI,%RSI,2),%R12 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0xf0(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOVSXD %EBX,%R13 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
LEA (%R14,%RAX,1),%RBX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (,%R12,8),%R8 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
LEA (,%RSI,8),%R11 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RBX,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RCX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RBX,-0xe0(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
SAL $0x7,%RDI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
MOV %R11,-0x100(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0x13e61(%RIP),%XMM10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOVSXD %ESI,%R11 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %R8,-0x108(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RAX,-0xd8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RDI,-0xe8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R14,-0xf8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R11,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R8,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
ADD $0x78,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %RBP | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
RET | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 | 0 | 1 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
Source file and lines | DistanceTableBA.h:65-105 |
Module | libqmcparticle.so |
nb instructions | 62 |
nb uops | 62 |
loop length | 251 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 1 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 7 |
micro-operation queue | 15.50 cycles |
front end | 15.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | |
---|---|---|---|---|---|---|---|---|
uops | 5.25 | 5.25 | 9.33 | 9.33 | 13.00 | 5.25 | 5.25 | 9.33 |
cycles | 5.25 | 5.75 | 9.33 | 9.33 | 13.00 | 5.25 | 5.25 | 9.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 15.61 |
Stall cycles | 0.00 |
Front-end | 15.50 |
Dispatch | 13.00 |
Overall L1 | 15.50 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 0% |
all | 0% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 12% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RSI,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RDI,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSH %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
SUB $0x78,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOVSXD 0xc4(%RDI),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOVSXD 0xc8(%RDI),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x8(%R9),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x40(%RDI),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD $0x7,%RSI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
LEA 0x7(%RDX),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa8(%RDI),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x610(%R8),%R14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
AND $-0x8,%RSI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV 0x610(%RCX),%R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
AND $-0x8,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
LEA 0x7f(%RSI),%RCX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
SHR $0x7,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
TEST %RDX,%RDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE ae14 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
LEA (%RSI,%RSI,1),%EBX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
SAL $0x3,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
LEA (%RSI,%RSI,2),%R12 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0xf0(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOVSXD %EBX,%R13 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
LEA (%R14,%RAX,1),%RBX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (,%R12,8),%R8 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
LEA (,%RSI,8),%R11 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RBX,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RCX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RBX,-0xe0(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
SAL $0x7,%RDI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
MOV %R11,-0x100(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0x13e61(%RIP),%XMM10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOVSXD %ESI,%R11 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %R8,-0x108(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RAX,-0xd8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RDI,-0xe8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R14,-0xf8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R11,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R8,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
ADD $0x78,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %RBP | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
RET | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 | 0 | 1 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼qmcplusplus::DistanceTableBA | 0.37 | 0 |
▼Loop 54 - DistanceTableBA.h:88-101 - libqmcparticle.so– | 0 | 0 |
▼Loop 55 - DistanceTableBA.h:89-101 - libqmcparticle.so– | 0 | 0 |
○Loop 56 - DistanceTableBA.h:99-101 - libqmcparticle.so | 0.37 | 0 |