Function: miniqmcreference::einspline_spo_ref<double>::evaluate(qmcplusplus::ParticleSet const&, int ... | Module: libqmcwfs.so | Source: einspline_spo_ref.hpp:172-189 [...] | Coverage: 25.92% |
---|
Function: miniqmcreference::einspline_spo_ref<double>::evaluate(qmcplusplus::ParticleSet const&, int ... | Module: libqmcwfs.so | Source: einspline_spo_ref.hpp:172-189 [...] | Coverage: 25.92% |
---|
/usr/lib/gcc/x86_64-linux-gnu/11/../../../../include/c++/11/bits/stl_algobase.h: 235 - 924 |
-------------------------------------------------------------------------------- |
235: if (__b < __a) |
[...] |
429: const ptrdiff_t _Num = __last - __first; |
430: if (_Num) |
431: __builtin_memmove(__result, __first, sizeof(_Tp) * _Num); |
[...] |
923: for (; __first != __last; ++__first) |
924: *__first = __tmp; |
/home/kcamus/qaas_runs/170-254-9426/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/einspline_spo_ref.hpp: 172 - 189 |
-------------------------------------------------------------------------------- |
172: ScopedTimer local_timer(timer); |
173: |
174: auto u = Lattice.toUnit_floor(P.activeR(iat)); |
175: for (int i = 0; i < nBlocks; ++i) |
176: MultiBsplineEvalRef::evaluate_v(einsplines[i], u[0], u[1], u[2], psi[i].data(), nSplinesPerBlock); |
177: } |
178: |
179: inline void evaluate(const ParticleSet& P, int iat, ValueVector_t& psi_v) |
180: { |
181: evaluate_v(P, iat); |
182: |
183: for (int i = 0; i < nBlocks; ++i) |
184: { |
185: // in real simulation, phase needs to be applied. Here just fake computation |
186: const int first = i * nBlocks; |
187: std::copy_n(psi[i].data(), std::min((i + 1) * nSplinesPerBlock, OrbitalSetSize) - first, psi_v.data() + first); |
188: } |
189: } |
/home/kcamus/qaas_runs/170-254-9426/intel/miniqmc/build/miniqmc/src/Numerics/Spline2/MultiBsplineEvalHelper.hpp: 53 - 63 |
-------------------------------------------------------------------------------- |
53: if (x < 0) |
[...] |
60: ind = static_cast<int>(x); |
61: dx = x - ind; |
62: // upper bound |
63: if (ind > nmax) |
/home/kcamus/qaas_runs/170-254-9426/intel/miniqmc/build/miniqmc/src/Numerics/Spline2/MultiBsplineData.hpp: 54 - 57 |
-------------------------------------------------------------------------------- |
54: a[0] = ((A00 * tx + A01) * tx + A02) * tx + A03; |
55: a[1] = ((A10 * tx + A11) * tx + A12) * tx + A13; |
56: a[2] = ((A20 * tx + A21) * tx + A22) * tx + A23; |
57: a[3] = ((A30 * tx + A31) * tx + A32) * tx + A33; |
/home/kcamus/qaas_runs/170-254-9426/intel/miniqmc/build/miniqmc/src/Particle/ParticleSet.h: 143 - 143 |
-------------------------------------------------------------------------------- |
143: return (active_ptcl_ == iat) ? active_pos_ : R[iat]; |
/usr/lib/gcc/x86_64-linux-gnu/11/../../../../include/c++/11/bits/stl_algo.h: 725 - 751 |
-------------------------------------------------------------------------------- |
725: { return std::copy(__first, __first + __n, __result); } |
[...] |
751: if (__n2 <= 0) |
/home/kcamus/qaas_runs/170-254-9426/intel/miniqmc/build/miniqmc/src/Numerics/Spline2/MultiBsplineRef.hpp: 42 - 71 |
-------------------------------------------------------------------------------- |
42: x -= spline_m->x_grid.start; |
43: y -= spline_m->y_grid.start; |
44: z -= spline_m->z_grid.start; |
45: T tx, ty, tz; |
46: int ix, iy, iz; |
47: spline2::getSplineBound(x * spline_m->x_grid.delta_inv, tx, ix, spline_m->x_grid.num - 1); |
48: spline2::getSplineBound(y * spline_m->y_grid.delta_inv, ty, iy, spline_m->y_grid.num - 1); |
49: spline2::getSplineBound(z * spline_m->z_grid.delta_inv, tz, iz, spline_m->z_grid.num - 1); |
[...] |
56: const intptr_t xs = spline_m->x_stride; |
57: const intptr_t ys = spline_m->y_stride; |
58: const intptr_t zs = spline_m->z_stride; |
59: |
60: constexpr T zero(0); |
61: std::fill(vals, vals + num_splines, zero); |
62: |
63: for (size_t i = 0; i < 4; i++) |
64: for (size_t j = 0; j < 4; j++) |
65: { |
66: const T pre00 = a[i] * b[j]; |
67: const T* restrict coefs = spline_m->coefs + (ix + i) * xs + (iy + j) * ys + iz * zs; |
68: for (size_t n = 0; n < num_splines; n++) |
69: vals[n] += pre00 * |
70: (c[0] * coefs[n] + c[1] * coefs[n + zs] + c[2] * coefs[n + 2 * zs] + |
71: c[3] * coefs[n + 3 * zs]); |
/usr/lib/gcc/x86_64-linux-gnu/11/../../../../include/c++/11/bits/stl_vector.h: 1046 - 1169 |
-------------------------------------------------------------------------------- |
1046: return *(this->_M_impl._M_start + __n); |
[...] |
1169: { return _M_data_ptr(this->_M_impl._M_start); } |
/home/kcamus/qaas_runs/170-254-9426/intel/miniqmc/build/miniqmc/src/Particle/Lattice/CrystalLattice.h: 170 - 170 |
-------------------------------------------------------------------------------- |
170: if (-std::numeric_limits<T1>::epsilon() < val_dot[i] && val_dot[i] < 0) |
/home/kcamus/qaas_runs/170-254-9426/intel/miniqmc/build/miniqmc/src/Utilities/NewTimer.h: 242 - 249 |
-------------------------------------------------------------------------------- |
242: ScopeGuard(TIMER& t) : timer(t) { timer.start(); } |
[...] |
249: ~ScopeGuard() { timer.stop(); } |
/home/kcamus/qaas_runs/170-254-9426/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/TinyVectorTensorOps.h: 150 - 151 |
-------------------------------------------------------------------------------- |
150: return TinyVector<Type_t, 3>(lhs[0] * rhs[0] + lhs[1] * rhs[3] + lhs[2] * rhs[6], |
151: lhs[0] * rhs[1] + lhs[1] * rhs[4] + lhs[2] * rhs[7], |
0x43b40 PUSH %RBP |
0x43b41 MOV %RSP,%RBP |
0x43b44 PUSH %R15 |
0x43b46 PUSH %R14 |
0x43b48 PUSH %R13 |
0x43b4a PUSH %R12 |
0x43b4c PUSH %RBX |
0x43b4d AND $-0x40,%RSP |
0x43b51 SUB $0x200,%RSP |
0x43b58 MOV %RDI,%RBX |
0x43b5b MOV 0x358(%RDI),%RDI |
0x43b62 MOV %RCX,0xa0(%RSP) |
0x43b6a MOV %EDX,%R12D |
0x43b6d MOV %RSI,%R13 |
0x43b70 MOV %RDI,0xa8(%RSP) |
0x43b78 CALL 4e900 <@plt_start@+0x250> |
0x43b7d MOVSXD %R12D,%RCX |
0x43b80 LEA 0x128(%R13),%RDX |
0x43b87 LEA (%RCX,%RCX,2),%RAX |
0x43b8b SAL $0x3,%RAX |
0x43b8f ADD 0x40(%R13),%RAX |
0x43b93 CMP %ECX,0x124(%R13) |
0x43b9a MOV %RBX,%R13 |
0x43b9d CMOVE %RDX,%RAX |
0x43ba1 CMPL $0,0x30(%RBX) |
0x43ba5 JLE 44792 |
0x43bab VMOVUPD 0x100(%R13),%XMM2 |
0x43bb4 VMOVUPD 0x8(%RAX),%XMM1 |
0x43bb9 VMOVSD (%RAX),%XMM0 |
0x43bbd VMOVSD -0x3b9ef(%RIP),%XMM18 |
0x43bc7 VMOVSD -0x3b951(%RIP),%XMM19 |
0x43bd1 VMOVAPD -0x3ba4b(%RIP),%XMM20 |
0x43bdb VMOVSD -0x3b9e5(%RIP),%XMM21 |
0x43be5 XOR %ESI,%ESI |
0x43be7 MOV %R13,0xb0(%RSP) |
0x43bef VMOVHPD 0x118(%R13),%XMM2,%XMM2 |
0x43bf8 VMULPD %XMM1,%XMM2,%XMM2 |
0x43bfc VPERMILPD $0x1,%XMM2,%XMM3 |
0x43c02 VFMADD231SD 0xe8(%R13),%XMM0,%XMM2 |
0x43c0b VADDSD %XMM3,%XMM2,%XMM2 |
0x43c0f VROUNDSD $0x9,%XMM2,%XMM2,%XMM3 |
0x43c15 VSUBSD %XMM3,%XMM2,%XMM5 |
0x43c19 VXORPD %XMM3,%XMM3,%XMM3 |
0x43c1d VCMPSD $0x1,%XMM3,%XMM2,%K1 |
0x43c24 VMOVAPD %XMM5,%XMM4 |
0x43c28 VMOVSD %XMM3,%XMM4,%XMM4{%K1} |
0x43c2e VCMPSD $0xe,-0x3ba29(%RIP),%XMM2,%K1 |
0x43c39 VMOVDDUP %XMM1,%XMM2 |
0x43c3d VPERMILPD $0x3,%XMM1,%XMM1 |
0x43c43 VBROADCASTF128 -0x3baac(%RIP),%YMM3 |
0x43c4c VMOVDQA %YMM3,0x100(%RSP) |
0x43c55 VMOVSD %XMM4,%XMM5,%XMM5{%K1} |
0x43c5b VMOVDDUP %XMM0,%XMM0 |
0x43c5f VMULPD 0xd8(%R13),%XMM0,%XMM0 |
0x43c68 VMOVDDUP -0x3b9f0(%RIP),%XMM4 |
0x43c70 VMOVAPD %XMM5,0xf0(%RSP) |
0x43c79 VFMADD231PD 0xf0(%R13),%XMM2,%XMM0 |
0x43c82 VBROADCASTSD -0x3b9fc(%RIP),%ZMM2 |
0x43c8c VMOVAPD %XMM4,0xc0(%RSP) |
0x43c95 VMOVAPD %ZMM2,0x180(%RSP) |
0x43c9d VFMADD132PD 0x108(%R13),%XMM0,%XMM1 |
0x43ca6 VXORPD %XMM0,%XMM0,%XMM0 |
0x43caa VCMPPD $0x1,%XMM0,%XMM1,%K1 |
0x43cb1 VCMPPD $0xe,-0x3baac(%RIP){1to0},%XMM1,%K0{%K1} |
0x43cbc VROUNDPD $0x9,%XMM1,%XMM0 |
0x43cc2 KNOTW %K0,%K1 |
0x43cc6 VSUBPD %XMM0,%XMM1,%XMM0{%K1}{z} |
0x43ccc VBROADCASTSD -0x3ba3e(%RIP),%ZMM1 |
0x43cd6 VMOVAPD %XMM0,0xe0(%RSP) |
0x43cdf VPERMILPD $0x1,%XMM0,%XMM0 |
0x43ce5 VMOVAPD %XMM0,0xd0(%RSP) |
0x43cee VMOVAPD %ZMM1,0x140(%RSP) |
0x43cf6 JMP 43d20 |
0x43cf8 NOPL (%RAX,%RAX,1) |
(821) 0x43d00 MOV 0xb0(%RSP),%R13 |
(821) 0x43d08 MOV 0xb8(%RSP),%RSI |
(821) 0x43d10 MOVSXD 0x30(%R13),%RAX |
(821) 0x43d14 INC %RSI |
(821) 0x43d17 CMP %RAX,%RSI |
(821) 0x43d1a JGE 44792 |
(821) 0x43d20 MOV 0x2f8(%R13),%RAX |
(821) 0x43d27 VMOVAPD 0xe0(%RSP),%XMM0 |
(821) 0x43d30 VXORPD %XMM6,%XMM6,%XMM6 |
(821) 0x43d34 MOV (%RAX,%RSI,8),%R14 |
(821) 0x43d38 VSUBSD 0x28(%R14),%XMM0,%XMM0 |
(821) 0x43d3e VMULSD 0x48(%R14),%XMM0,%XMM0 |
(821) 0x43d44 VUCOMISD %XMM6,%XMM0 |
(821) 0x43d48 JAE 43d60 |
(821) 0x43d4a XOR %EAX,%EAX |
(821) 0x43d4c MOV %RAX,0x8(%RSP) |
(821) 0x43d51 VXORPD %XMM0,%XMM0,%XMM0 |
(821) 0x43d55 JMP 43d95 |
0x43d57 NOPW (%RAX,%RAX,1) |
(821) 0x43d60 MOV 0x38(%R14),%EAX |
(821) 0x43d64 VROUNDSD $0xb,%XMM0,%XMM0,%XMM1 |
(821) 0x43d6a VCVTTSD2SI %XMM0,%EDX |
(821) 0x43d6e VSUBSD %XMM1,%XMM0,%XMM1 |
(821) 0x43d72 VMOVAPD %XMM21,%XMM0 |
(821) 0x43d78 CMP %EDX,%EAX |
(821) 0x43d7a LEA -0x1(%RAX),%ECX |
(821) 0x43d7d SETG %AL |
(821) 0x43d80 CMOVG %EDX,%ECX |
(821) 0x43d83 KMOVD %EAX,%K1 |
(821) 0x43d87 MOVSXD %ECX,%RAX |
(821) 0x43d8a VMOVSD %XMM1,%XMM0,%XMM0{%K1} |
(821) 0x43d90 MOV %RAX,0x8(%RSP) |
(821) 0x43d95 VMOVAPD 0xd0(%RSP),%XMM1 |
(821) 0x43d9e VSUBSD 0x50(%R14),%XMM1,%XMM1 |
(821) 0x43da4 VMULSD 0x70(%R14),%XMM1,%XMM1 |
(821) 0x43daa VUCOMISD %XMM6,%XMM1 |
(821) 0x43dae JAE 43dc0 |
(821) 0x43db0 XOR %EBX,%EBX |
(821) 0x43db2 JMP 43df0 |
0x43db4 NOPW %CS:(%RAX,%RAX,1) |
(821) 0x43dc0 MOV 0x60(%R14),%EAX |
(821) 0x43dc4 VROUNDSD $0xb,%XMM1,%XMM1,%XMM2 |
(821) 0x43dca VCVTTSD2SI %XMM1,%EDX |
(821) 0x43dce VMOVAPD %XMM21,%XMM6 |
(821) 0x43dd4 VSUBSD %XMM2,%XMM1,%XMM1 |
(821) 0x43dd8 CMP %EDX,%EAX |
(821) 0x43dda LEA -0x1(%RAX),%ECX |
(821) 0x43ddd SETG %AL |
(821) 0x43de0 CMOVG %EDX,%ECX |
(821) 0x43de3 KMOVD %EAX,%K1 |
(821) 0x43de7 MOVSXD %ECX,%RBX |
(821) 0x43dea VMOVSD %XMM1,%XMM6,%XMM6{%K1} |
(821) 0x43df0 VMOVAPD 0xf0(%RSP),%XMM1 |
(821) 0x43df9 VXORPD %XMM7,%XMM7,%XMM7 |
(821) 0x43dfd VSUBSD 0x78(%R14),%XMM1,%XMM1 |
(821) 0x43e03 VMULSD 0x98(%R14),%XMM1,%XMM1 |
(821) 0x43e0c VUCOMISD %XMM7,%XMM1 |
(821) 0x43e10 JAE 43e20 |
(821) 0x43e12 XOR %R8D,%R8D |
(821) 0x43e15 JMP 43e53 |
0x43e17 NOPW (%RAX,%RAX,1) |
(821) 0x43e20 MOV 0x88(%R14),%EAX |
(821) 0x43e27 VROUNDSD $0xb,%XMM1,%XMM1,%XMM2 |
(821) 0x43e2d VCVTTSD2SI %XMM1,%EDX |
(821) 0x43e31 VMOVAPD %XMM21,%XMM7 |
(821) 0x43e37 VSUBSD %XMM2,%XMM1,%XMM1 |
(821) 0x43e3b CMP %EDX,%EAX |
(821) 0x43e3d LEA -0x1(%RAX),%ECX |
(821) 0x43e40 SETG %AL |
(821) 0x43e43 CMOVG %EDX,%ECX |
(821) 0x43e46 KMOVD %EAX,%K1 |
(821) 0x43e4a MOVSXD %ECX,%R8 |
(821) 0x43e4d VMOVSD %XMM1,%XMM7,%XMM7{%K1} |
(821) 0x43e53 VMULSD %XMM18,%XMM0,%XMM2 |
(821) 0x43e59 VMOVDDUP %XMM0,%XMM4 |
(821) 0x43e5d VMULSD %XMM0,%XMM0,%XMM1 |
(821) 0x43e61 MOV 0x310(%R13),%RCX |
(821) 0x43e68 LEA (%RSI,%RSI,2),%RAX |
(821) 0x43e6c MOVSXD 0x40(%R13),%R15 |
(821) 0x43e70 MOV %RSI,0xb8(%RSP) |
(821) 0x43e78 VSUBSD %XMM2,%XMM19,%XMM3 |
(821) 0x43e7e VBLENDPD $0x2,0xc0(%RSP),%XMM3,%XMM3 |
(821) 0x43e89 VBROADCASTSD %XMM1,%YMM1 |
(821) 0x43e8e VMOVDDUP %XMM2,%XMM2 |
(821) 0x43e92 MOV (%RCX,%RAX,8),%R12 |
(821) 0x43e96 VMULPD %XMM4,%XMM3,%XMM3 |
(821) 0x43e9a VUNPCKLPD %XMM1,%XMM4,%XMM4 |
(821) 0x43e9e VMULSD %XMM1,%XMM2,%XMM1 |
(821) 0x43ea2 VMULSD %XMM6,%XMM6,%XMM2 |
(821) 0x43ea6 VPERMILPD $0x1,%XMM3,%XMM5 |
(821) 0x43eac VADDPD %XMM20,%XMM3,%XMM3 |
(821) 0x43eb2 VBROADCASTSD %XMM1,%YMM1 |
(821) 0x43eb7 VSUBSD %XMM5,%XMM19,%XMM5 |
(821) 0x43ebd VMULPD %XMM4,%XMM3,%XMM3 |
(821) 0x43ec1 VFMADD213SD %XMM19,%XMM0,%XMM5 |
(821) 0x43ec7 VMULSD %XMM0,%XMM5,%XMM0 |
(821) 0x43ecb VBROADCASTSD %XMM0,%YMM0 |
(821) 0x43ed0 VBLENDPD $0x4,%YMM0,%YMM3,%YMM0 |
(821) 0x43ed6 VADDPD 0x100(%RSP),%YMM0,%YMM0 |
(821) 0x43edf VBLENDPD $0x8,%YMM1,%YMM0,%YMM0 |
(821) 0x43ee5 VMULSD %XMM18,%XMM6,%XMM1 |
(821) 0x43eeb VMOVUPD %YMM0,0x120(%RSP) |
(821) 0x43ef4 VMULSD %XMM19,%XMM6,%XMM0 |
(821) 0x43efa VADDSD -0x3bc94(%RIP),%XMM0,%XMM23 |
(821) 0x43f04 MOV 0x10(%R14),%RAX |
(821) 0x43f08 MOV 0x18(%R14),%R13 |
(821) 0x43f0c MOV 0x20(%R14),%RCX |
(821) 0x43f10 VSUBSD %XMM1,%XMM19,%XMM22 |
(821) 0x43f16 VFMADD213SD -0x3bcd8(%RIP),%XMM6,%XMM22 |
(821) 0x43f20 VFMADD213SD -0x3bd62(%RIP),%XMM2,%XMM23 |
(821) 0x43f2a MOV %RAX,0x68(%RSP) |
(821) 0x43f2f TEST %R15D,%R15D |
(821) 0x43f32 JE 43fe5 |
(821) 0x43f38 LEA (,%R15,8),%RDX |
(821) 0x43f40 MOV %R12,%RDI |
(821) 0x43f43 XOR %ESI,%ESI |
(821) 0x43f45 VMOVSD %XMM22,0x38(%RSP) |
(821) 0x43f4d VMOVSD %XMM23,0x30(%RSP) |
(821) 0x43f55 VMOVAPD %XMM6,0x70(%RSP) |
(821) 0x43f5b VMOVAPD %XMM7,0x50(%RSP) |
(821) 0x43f61 VMOVSD %XMM1,0x28(%RSP) |
(821) 0x43f67 VMOVSD %XMM0,0x20(%RSP) |
(821) 0x43f6d VMOVSD %XMM2,0x18(%RSP) |
(821) 0x43f73 MOV %R8,0x10(%RSP) |
(821) 0x43f78 MOV %RCX,0x48(%RSP) |
(821) 0x43f7d VZEROUPPER |
(821) 0x43f80 CALL 4ecc0 <@plt_start@+0x610> |
(821) 0x43f85 VMOVSD 0x18(%RSP),%XMM2 |
(821) 0x43f8b VMOVSD 0x20(%RSP),%XMM0 |
(821) 0x43f91 VMOVSD 0x28(%RSP),%XMM1 |
(821) 0x43f97 VMOVAPD 0x50(%RSP),%XMM7 |
(821) 0x43f9d VMOVAPD 0x70(%RSP),%XMM6 |
(821) 0x43fa3 VMOVSD 0x30(%RSP),%XMM23 |
(821) 0x43fab VMOVSD 0x38(%RSP),%XMM22 |
(821) 0x43fb3 VMOVSD -0x3bdbd(%RIP),%XMM21 |
(821) 0x43fbd VMOVAPD -0x3be37(%RIP),%XMM20 |
(821) 0x43fc7 VMOVSD -0x3bd51(%RIP),%XMM19 |
(821) 0x43fd1 VMOVSD -0x3be03(%RIP),%XMM18 |
(821) 0x43fdb MOV 0x48(%RSP),%RCX |
(821) 0x43fe0 MOV 0x10(%RSP),%R8 |
(821) 0x43fe5 VMULSD %XMM18,%XMM7,%XMM3 |
(821) 0x43feb LEA 0x2(%RBX),%RAX |
(821) 0x43fef VSUBSD %XMM0,%XMM19,%XMM0 |
(821) 0x43ff5 LEA 0x1(%RBX),%R11 |
(821) 0x43ff9 VMOVDDUP %XMM7,%XMM5 |
(821) 0x43ffd LEA 0x18(,%R8,8),%RDX |
(821) 0x44005 MOV 0x8(%R14),%R9 |
(821) 0x44009 VFMADD213SD %XMM18,%XMM6,%XMM22 |
(821) 0x4400f VMULSD %XMM2,%XMM1,%XMM1 |
(821) 0x44013 VMULSD %XMM7,%XMM7,%XMM2 |
(821) 0x44017 VMOVAPD 0x140(%RSP),%ZMM8 |
(821) 0x4401f MOV %RAX,0x10(%RSP) |
(821) 0x44024 LEA 0x3(%RBX),%RAX |
(821) 0x44028 MOV %RAX,0x50(%RSP) |
(821) 0x4402d MOV %RBX,%RAX |
(821) 0x44030 MOV 0x8(%RSP),%RBX |
(821) 0x44035 IMUL %R13,%RAX |
(821) 0x44039 IMUL %RCX,%RDX |
(821) 0x4403d SAL $0x3,%R13 |
(821) 0x44041 VSUBSD %XMM3,%XMM19,%XMM4 |
(821) 0x44047 VBLENDPD $0x2,0xc0(%RSP),%XMM4,%XMM4 |
(821) 0x44052 IMUL 0x68(%RSP),%RBX |
(821) 0x44058 VFMADD213SD %XMM19,%XMM6,%XMM0 |
(821) 0x4405e VBROADCASTSD %XMM2,%YMM2 |
(821) 0x44063 VBROADCASTSD %XMM3,%YMM3 |
(821) 0x44068 SALQ $0x3,0x68(%RSP) |
(821) 0x4406e SAL $0x3,%RAX |
(821) 0x44072 ADD %R9,%RDX |
(821) 0x44075 VFMADD213SD %XMM18,%XMM6,%XMM0 |
(821) 0x4407b LEA (%RAX,%RBX,8),%RSI |
(821) 0x4407f LEA (,%R8,8),%RAX |
(821) 0x44087 VMULPD %XMM5,%XMM4,%XMM4 |
(821) 0x4408b VUNPCKLPD %XMM2,%XMM5,%XMM5 |
(821) 0x4408f LEA (%RDX,%RSI,1),%RDI |
(821) 0x44093 MOV %RAX,%R14 |
(821) 0x44096 IMUL %RCX,%R14 |
(821) 0x4409a MOV %RDI,0x38(%RSP) |
(821) 0x4409f LEA 0x10(,%R8,8),%RDI |
(821) 0x440a7 LEA 0x8(,%R8,8),%R8 |
(821) 0x440af VPERMILPD $0x1,%XMM4,%XMM6 |
(821) 0x440b5 VADDPD %XMM20,%XMM4,%XMM4 |
(821) 0x440bb VSUBSD %XMM6,%XMM19,%XMM6 |
(821) 0x440c1 IMUL %RCX,%RDI |
(821) 0x440c5 LEA (%R9,%R14,1),%RAX |
(821) 0x440c9 IMUL %RCX,%R8 |
(821) 0x440cd ADD %RSI,%RAX |
(821) 0x440d0 VMULPD %XMM5,%XMM4,%XMM4 |
(821) 0x440d4 MOV %RAX,0x70(%RSP) |
(821) 0x440d9 MOV %R11,%RAX |
(821) 0x440dc IMUL %R13,%RAX |
(821) 0x440e0 VFMADD213SD %XMM19,%XMM7,%XMM6 |
(821) 0x440e6 ADD %R9,%RDI |
(821) 0x440e9 ADD %R9,%R8 |
(821) 0x440ec LEA (%RDI,%RSI,1),%R10 |
(821) 0x440f0 LEA (%R8,%RSI,1),%RCX |
(821) 0x440f4 MOV %R10,0x30(%RSP) |
(821) 0x440f9 MOV 0x10(%RSP),%R10 |
(821) 0x440fe LEA (%RAX,%RBX,8),%R11 |
(821) 0x44102 ADD %R9,%RAX |
(821) 0x44105 VMULSD %XMM7,%XMM6,%XMM5 |
(821) 0x44109 LEA (%RDX,%R11,1),%RSI |
(821) 0x4410d MOV %RSI,0x8(%RSP) |
(821) 0x44112 LEA (%RDI,%R11,1),%RSI |
(821) 0x44116 ADD %R8,%R11 |
(821) 0x44119 MOV %RSI,0x28(%RSP) |
(821) 0x4411e LEA (%R14,%RBX,8),%RSI |
(821) 0x44122 VBROADCASTSD %XMM5,%YMM5 |
(821) 0x44127 IMUL %R13,%R10 |
(821) 0x4412b IMUL 0x50(%RSP),%R13 |
(821) 0x44131 MOV %RCX,0x50(%RSP) |
(821) 0x44136 ADD %RSI,%RAX |
(821) 0x44139 VBLENDPD $0x4,%YMM5,%YMM4,%YMM4 |
(821) 0x4413f VMOVAPD 0x180(%RSP),%ZMM5 |
(821) 0x44147 VBLENDPD $0x8,%YMM3,%YMM4,%YMM3 |
(821) 0x4414d VBLENDPD $0x7,0x100(%RSP),%YMM2,%YMM4 |
(821) 0x44158 LEA (%R10,%RBX,8),%R14 |
(821) 0x4415c MOV %R10,%RCX |
(821) 0x4415f ADD %R9,%RCX |
(821) 0x44162 ADD %RSI,%RCX |
(821) 0x44165 LEA (%R13,%RBX,8),%R10 |
(821) 0x4416a LEA (%RDX,%R14,1),%RBX |
(821) 0x4416e ADD %R9,%R13 |
(821) 0x44171 MOV %RBX,0x20(%RSP) |
(821) 0x44176 LEA (%RDI,%R14,1),%RBX |
(821) 0x4417a ADD %RSI,%R13 |
(821) 0x4417d MOV %R15,%RSI |
(821) 0x44180 AND $-0x8,%RSI |
(821) 0x44184 ADD %R8,%R14 |
(821) 0x44187 MOV %RBX,0x18(%RSP) |
(821) 0x4418c MOV 0x8(%RSP),%RBX |
(821) 0x44191 MOV %RSI,(%RSP) |
(821) 0x44195 MOV %R15,%RSI |
(821) 0x44198 AND $-0x4,%RSI |
(821) 0x4419c ADD %R10,%RDX |
(821) 0x4419f ADD %R10,%RDI |
(821) 0x441a2 ADD %R10,%R8 |
(821) 0x441a5 XOR %R10D,%R10D |
(821) 0x441a8 MOV %RSI,0x40(%RSP) |
(821) 0x441ad VADDPD %YMM4,%YMM3,%YMM2 |
(821) 0x441b1 VMULPD %YMM4,%YMM3,%YMM13 |
(821) 0x441b5 VPERMPD %ZMM2,%ZMM5,%ZMM4 |
(821) 0x441bb VPERMPD %ZMM13,%ZMM8,%ZMM8 |
(821) 0x441c1 VEXTRACTF128 $0x1,%YMM2,%XMM6 |
(821) 0x441c7 VBLENDPD $0x8,%YMM13,%YMM2,%YMM3 |
(821) 0x441cd VPERMPD $-0x1,%YMM13,%YMM11 |
(821) 0x441d3 VEXTRACTF128 $0x1,%YMM13,%XMM13 |
(821) 0x441d9 VBROADCASTSD %XMM2,%ZMM5 |
(821) 0x441df VPERMPD $0x55,%YMM2,%YMM9 |
(821) 0x441e5 VPERMPD $-0x56,%YMM2,%YMM10 |
(821) 0x441eb VPERMILPD $0x1,%XMM2,%XMM12 |
(821) 0x441f1 VBROADCASTSD %XMM6,%ZMM7 |
(821) 0x441f7 VPERMILPD $0x1,%XMM13,%XMM13 |
(821) 0x441fd JMP 44250 |
0x441ff NOP |
(822) 0x44200 MOV 0x68(%RSP),%RSI |
(822) 0x44205 INC %R10 |
(822) 0x44208 ADD %RSI,0x38(%RSP) |
(822) 0x4420d ADD %RSI,0x30(%RSP) |
(822) 0x44212 ADD %RSI,0x50(%RSP) |
(822) 0x44217 ADD %RSI,0x70(%RSP) |
(822) 0x4421c ADD %RSI,0x28(%RSP) |
(822) 0x44221 ADD %RSI,0x20(%RSP) |
(822) 0x44226 ADD %RSI,0x18(%RSP) |
(822) 0x4422b ADD %RSI,%RBX |
(822) 0x4422e ADD %RSI,%R11 |
(822) 0x44231 ADD %RSI,%RAX |
(822) 0x44234 ADD %RSI,%R14 |
(822) 0x44237 ADD %RSI,%RCX |
(822) 0x4423a ADD %RSI,%RDX |
(822) 0x4423d ADD %RSI,%RDI |
(822) 0x44240 ADD %RSI,%R8 |
(822) 0x44243 ADD %RSI,%R13 |
(822) 0x44246 CMP $0x4,%R10 |
(822) 0x4424a JE 43d00 |
(822) 0x44250 TEST %R15D,%R15D |
(822) 0x44253 JE 44200 |
(822) 0x44255 VMOVSD 0x120(%RSP,%R10,8),%XMM14 |
(822) 0x4425f MOV %RAX,0x48(%RSP) |
(822) 0x44264 MOV %R11,0x98(%RSP) |
(822) 0x4426c MOV %RCX,0x10(%RSP) |
(822) 0x44271 MOV %RBX,0x8(%RSP) |
(822) 0x44276 MOV %R14,0x90(%RSP) |
(822) 0x4427e VMULSD %XMM14,%XMM22,%XMM15 |
(822) 0x44284 CMP $0x4,%R15D |
(822) 0x44288 JAE 442b0 |
(822) 0x4428a MOV 0x38(%RSP),%R11 |
(822) 0x4428f MOV 0x30(%RSP),%R14 |
(822) 0x44294 MOV 0x70(%RSP),%RAX |
(822) 0x44299 MOV 0x50(%RSP),%RCX |
(822) 0x4429e XOR %R9D,%R9D |
(822) 0x442a1 JMP 44390 |
0x442a6 NOPW %CS:(%RAX,%RAX,1) |
(822) 0x442b0 CMP $0x8,%R15D |
(822) 0x442b4 JAE 442ce |
(822) 0x442b6 MOV 0x38(%RSP),%R11 |
(822) 0x442bb MOV 0x30(%RSP),%R14 |
(822) 0x442c0 MOV 0x70(%RSP),%RAX |
(822) 0x442c5 MOV 0x50(%RSP),%RCX |
(822) 0x442ca XOR %ESI,%ESI |
(822) 0x442cc JMP 44339 |
(822) 0x442ce MOV 0x38(%RSP),%R11 |
(822) 0x442d3 MOV 0x30(%RSP),%R14 |
(822) 0x442d8 MOV 0x70(%RSP),%RAX |
(822) 0x442dd MOV 0x50(%RSP),%RCX |
(822) 0x442e2 MOV (%RSP),%R9 |
(822) 0x442e6 VBROADCASTSD %XMM15,%ZMM16 |
(822) 0x442ec XOR %ESI,%ESI |
(822) 0x442ee XCHG %AX,%AX |
(823) 0x442f0 VMULPD (%RAX,%RSI,8),%ZMM5,%ZMM17 |
(823) 0x442f7 VFMADD231PD (%RCX,%RSI,8),%ZMM4,%ZMM17 |
(823) 0x442fe VFMADD231PD (%R14,%RSI,8),%ZMM7,%ZMM17 |
(823) 0x44305 VFMADD231PD (%R11,%RSI,8),%ZMM8,%ZMM17 |
(823) 0x4430c VFMADD213PD (%R12,%RSI,8),%ZMM16,%ZMM17 |
(823) 0x44313 VMOVUPD %ZMM17,(%R12,%RSI,8) |
(823) 0x4431a ADD $0x8,%RSI |
(823) 0x4431e CMP %RSI,%R9 |
(823) 0x44321 JNE 442f0 |
(822) 0x44323 CMP %R15,%R9 |
(822) 0x44326 JE 443e9 |
(822) 0x4432c MOV (%RSP),%R9 |
(822) 0x44330 MOV %R9,%RSI |
(822) 0x44333 TEST $0x4,%R15B |
(822) 0x44337 JE 44390 |
(822) 0x44339 MOV 0x40(%RSP),%R9 |
(822) 0x4433e VBROADCASTSD %XMM15,%YMM16 |
(822) 0x44344 NOPW %CS:(%RAX,%RAX,1) |
(834) 0x44350 VMULPD (%RAX,%RSI,8),%YMM5,%YMM17 |
(834) 0x44357 VFMADD231PD (%RCX,%RSI,8),%YMM9,%YMM17 |
(834) 0x4435e VFMADD231PD (%R14,%RSI,8),%YMM10,%YMM17 |
(834) 0x44365 VFMADD231PD (%R11,%RSI,8),%YMM11,%YMM17 |
(834) 0x4436c VFMADD213PD (%R12,%RSI,8),%YMM16,%YMM17 |
(834) 0x44373 VMOVUPD %YMM17,(%R12,%RSI,8) |
(834) 0x4437a ADD $0x4,%RSI |
(834) 0x4437e CMP %RSI,%R9 |
(834) 0x44381 JNE 44350 |
(822) 0x44383 MOV %R9,%RSI |
(822) 0x44386 CMP %R15,%R9 |
(822) 0x44389 JE 443e9 |
(822) 0x4438b NOPL (%RAX,%RAX,1) |
(833) 0x44390 VMOVSD (%R14,%R9,8),%XMM16 |
(833) 0x44397 VMOVSD (%RAX,%R9,8),%XMM17 |
(833) 0x4439e VMOVHPD (%R11,%R9,8),%XMM16,%XMM16 |
(833) 0x443a5 VMOVHPD (%RCX,%R9,8),%XMM17,%XMM17 |
(833) 0x443ac VINSERTF32X4 $0x1,%XMM16,%YMM17,%YMM16 |
(833) 0x443b3 VMULPD %YMM16,%YMM3,%YMM16 |
(833) 0x443b9 VEXTRACTF32X4 $0x1,%YMM16,%XMM17 |
(833) 0x443c0 VADDPD %XMM17,%XMM16,%XMM16 |
(833) 0x443c6 VPERMILPD $0x1,%XMM16,%XMM17 |
(833) 0x443cd VADDSD %XMM17,%XMM16,%XMM16 |
(833) 0x443d3 VFMADD213SD (%R12,%R9,8),%XMM15,%XMM16 |
(833) 0x443da VMOVSD %XMM16,(%R12,%R9,8) |
(833) 0x443e1 INC %R9 |
(833) 0x443e4 CMP %R9,%R15 |
(833) 0x443e7 JNE 44390 |
(822) 0x443e9 VMULSD %XMM14,%XMM23,%XMM15 |
(822) 0x443ef CMP $0x4,%R15D |
(822) 0x443f3 JAE 44420 |
(822) 0x443f5 MOV 0x48(%RSP),%RAX |
(822) 0x443fa MOV 0x98(%RSP),%R11 |
(822) 0x44402 MOV 0x10(%RSP),%RCX |
(822) 0x44407 MOV 0x8(%RSP),%RBX |
(822) 0x4440c MOV 0x28(%RSP),%R14 |
(822) 0x44411 XOR %R9D,%R9D |
(822) 0x44414 JMP 44500 |
0x44419 NOPL (%RAX) |
(822) 0x44420 MOV 0x48(%RSP),%RAX |
(822) 0x44425 MOV 0x98(%RSP),%R11 |
(822) 0x4442d MOV 0x10(%RSP),%RCX |
(822) 0x44432 MOV 0x8(%RSP),%RBX |
(822) 0x44437 CMP $0x8,%R15D |
(822) 0x4443b JAE 44446 |
(822) 0x4443d MOV 0x28(%RSP),%R14 |
(822) 0x44442 XOR %ESI,%ESI |
(822) 0x44444 JMP 444a9 |
(822) 0x44446 MOV 0x28(%RSP),%R14 |
(822) 0x4444b MOV (%RSP),%R9 |
(822) 0x4444f VBROADCASTSD %XMM15,%ZMM16 |
(822) 0x44455 XOR %ESI,%ESI |
(822) 0x44457 NOPW (%RAX,%RAX,1) |
(824) 0x44460 VMULPD (%RAX,%RSI,8),%ZMM5,%ZMM17 |
(824) 0x44467 VFMADD231PD (%R11,%RSI,8),%ZMM4,%ZMM17 |
(824) 0x4446e VFMADD231PD (%R14,%RSI,8),%ZMM7,%ZMM17 |
(824) 0x44475 VFMADD231PD (%RBX,%RSI,8),%ZMM8,%ZMM17 |
(824) 0x4447c VFMADD213PD (%R12,%RSI,8),%ZMM16,%ZMM17 |
(824) 0x44483 VMOVUPD %ZMM17,(%R12,%RSI,8) |
(824) 0x4448a ADD $0x8,%RSI |
(824) 0x4448e CMP %RSI,%R9 |
(824) 0x44491 JNE 44460 |
(822) 0x44493 CMP %R15,%R9 |
(822) 0x44496 JE 44532 |
(822) 0x4449c MOV (%RSP),%R9 |
(822) 0x444a0 MOV %R9,%RSI |
(822) 0x444a3 TEST $0x4,%R15B |
(822) 0x444a7 JE 44500 |
(822) 0x444a9 MOV 0x40(%RSP),%R9 |
(822) 0x444ae VBROADCASTSD %XMM15,%YMM16 |
(822) 0x444b4 NOPW %CS:(%RAX,%RAX,1) |
(832) 0x444c0 VMULPD (%RAX,%RSI,8),%YMM5,%YMM17 |
(832) 0x444c7 VFMADD231PD (%R11,%RSI,8),%YMM9,%YMM17 |
(832) 0x444ce VFMADD231PD (%R14,%RSI,8),%YMM10,%YMM17 |
(832) 0x444d5 VFMADD231PD (%RBX,%RSI,8),%YMM11,%YMM17 |
(832) 0x444dc VFMADD213PD (%R12,%RSI,8),%YMM16,%YMM17 |
(832) 0x444e3 VMOVUPD %YMM17,(%R12,%RSI,8) |
(832) 0x444ea ADD $0x4,%RSI |
(832) 0x444ee CMP %RSI,%R9 |
(832) 0x444f1 JNE 444c0 |
(822) 0x444f3 MOV %R9,%RSI |
(822) 0x444f6 CMP %R15,%R9 |
(822) 0x444f9 JE 44532 |
(822) 0x444fb NOPL (%RAX,%RAX,1) |
(831) 0x44500 VMULSD (%RAX,%R9,8),%XMM2,%XMM16 |
(831) 0x44507 VFMADD231SD (%R11,%R9,8),%XMM12,%XMM16 |
(831) 0x4450e VFMADD231SD (%R14,%R9,8),%XMM6,%XMM16 |
(831) 0x44515 VFMADD231SD (%RBX,%R9,8),%XMM13,%XMM16 |
(831) 0x4451c VFMADD213SD (%R12,%R9,8),%XMM15,%XMM16 |
(831) 0x44523 VMOVSD %XMM16,(%R12,%R9,8) |
(831) 0x4452a INC %R9 |
(831) 0x4452d CMP %R9,%R15 |
(831) 0x44530 JNE 44500 |
(822) 0x44532 VMULSD %XMM0,%XMM14,%XMM15 |
(822) 0x44536 MOV %R10,0x88(%RSP) |
(822) 0x4453e CMP $0x4,%R15D |
(822) 0x44542 JAE 44560 |
(822) 0x44544 MOV 0x90(%RSP),%R14 |
(822) 0x4454c MOV 0x20(%RSP),%R10 |
(822) 0x44551 MOV 0x18(%RSP),%RBX |
(822) 0x44556 XOR %R9D,%R9D |
(822) 0x44559 JMP 44640 |
0x4455e XCHG %AX,%AX |
(822) 0x44560 MOV 0x90(%RSP),%R14 |
(822) 0x44568 CMP $0x8,%R15D |
(822) 0x4456c JAE 4457c |
(822) 0x4456e MOV 0x20(%RSP),%R10 |
(822) 0x44573 MOV 0x18(%RSP),%RBX |
(822) 0x44578 XOR %ESI,%ESI |
(822) 0x4457a JMP 445e9 |
(822) 0x4457c MOV 0x20(%RSP),%R10 |
(822) 0x44581 MOV 0x18(%RSP),%RBX |
(822) 0x44586 MOV (%RSP),%R9 |
(822) 0x4458a VBROADCASTSD %XMM15,%ZMM16 |
(822) 0x44590 XOR %ESI,%ESI |
(822) 0x44592 NOPW %CS:(%RAX,%RAX,1) |
(825) 0x445a0 VMULPD (%RCX,%RSI,8),%ZMM5,%ZMM17 |
(825) 0x445a7 VFMADD231PD (%R14,%RSI,8),%ZMM4,%ZMM17 |
(825) 0x445ae VFMADD231PD (%RBX,%RSI,8),%ZMM7,%ZMM17 |
(825) 0x445b5 VFMADD231PD (%R10,%RSI,8),%ZMM8,%ZMM17 |
(825) 0x445bc VFMADD213PD (%R12,%RSI,8),%ZMM16,%ZMM17 |
(825) 0x445c3 VMOVUPD %ZMM17,(%R12,%RSI,8) |
(825) 0x445ca ADD $0x8,%RSI |
(825) 0x445ce CMP %RSI,%R9 |
(825) 0x445d1 JNE 445a0 |
(822) 0x445d3 CMP %R15,%R9 |
(822) 0x445d6 JE 44672 |
(822) 0x445dc MOV (%RSP),%R9 |
(822) 0x445e0 MOV %R9,%RSI |
(822) 0x445e3 TEST $0x4,%R15B |
(822) 0x445e7 JE 44640 |
(822) 0x445e9 MOV 0x40(%RSP),%R9 |
(822) 0x445ee VBROADCASTSD %XMM15,%YMM16 |
(822) 0x445f4 NOPW %CS:(%RAX,%RAX,1) |
(830) 0x44600 VMULPD (%RCX,%RSI,8),%YMM5,%YMM17 |
(830) 0x44607 VFMADD231PD (%R14,%RSI,8),%YMM9,%YMM17 |
(830) 0x4460e VFMADD231PD (%RBX,%RSI,8),%YMM10,%YMM17 |
(830) 0x44615 VFMADD231PD (%R10,%RSI,8),%YMM11,%YMM17 |
(830) 0x4461c VFMADD213PD (%R12,%RSI,8),%YMM16,%YMM17 |
(830) 0x44623 VMOVUPD %YMM17,(%R12,%RSI,8) |
(830) 0x4462a ADD $0x4,%RSI |
(830) 0x4462e CMP %RSI,%R9 |
(830) 0x44631 JNE 44600 |
(822) 0x44633 MOV %R9,%RSI |
(822) 0x44636 CMP %R15,%R9 |
(822) 0x44639 JE 44672 |
(822) 0x4463b NOPL (%RAX,%RAX,1) |
(829) 0x44640 VMULSD (%RCX,%R9,8),%XMM2,%XMM16 |
(829) 0x44647 VFMADD231SD (%R14,%R9,8),%XMM12,%XMM16 |
(829) 0x4464e VFMADD231SD (%RBX,%R9,8),%XMM6,%XMM16 |
(829) 0x44655 VFMADD231SD (%R10,%R9,8),%XMM13,%XMM16 |
(829) 0x4465c VFMADD213SD (%R12,%R9,8),%XMM15,%XMM16 |
(829) 0x44663 VMOVSD %XMM16,(%R12,%R9,8) |
(829) 0x4466a INC %R9 |
(829) 0x4466d CMP %R9,%R15 |
(829) 0x44670 JNE 44640 |
(822) 0x44672 MOV 0x8(%RSP),%RBX |
(822) 0x44677 VMULSD %XMM1,%XMM14,%XMM14 |
(822) 0x4467b CMP $0x4,%R15D |
(822) 0x4467f JAE 446a0 |
(822) 0x44681 MOV 0x88(%RSP),%R10 |
(822) 0x44689 XOR %R9D,%R9D |
(822) 0x4468c JMP 44760 |
0x44691 NOPW %CS:(%RAX,%RAX,1) |
(822) 0x446a0 MOV 0x88(%RSP),%R10 |
(822) 0x446a8 CMP $0x8,%R15D |
(822) 0x446ac JAE 446b2 |
(822) 0x446ae XOR %ESI,%ESI |
(822) 0x446b0 JMP 4470a |
(822) 0x446b2 MOV (%RSP),%R9 |
(822) 0x446b6 VBROADCASTSD %XMM14,%ZMM15 |
(822) 0x446bc XOR %ESI,%ESI |
(822) 0x446be XCHG %AX,%AX |
(826) 0x446c0 VMULPD (%R13,%RSI,8),%ZMM5,%ZMM16 |
(826) 0x446c8 VFMADD231PD (%R8,%RSI,8),%ZMM4,%ZMM16 |
(826) 0x446cf VFMADD231PD (%RDI,%RSI,8),%ZMM7,%ZMM16 |
(826) 0x446d6 VFMADD231PD (%RDX,%RSI,8),%ZMM8,%ZMM16 |
(826) 0x446dd VFMADD213PD (%R12,%RSI,8),%ZMM15,%ZMM16 |
(826) 0x446e4 VMOVUPD %ZMM16,(%R12,%RSI,8) |
(826) 0x446eb ADD $0x8,%RSI |
(826) 0x446ef CMP %RSI,%R9 |
(826) 0x446f2 JNE 446c0 |
(822) 0x446f4 CMP %R15,%R9 |
(822) 0x446f7 JE 44200 |
(822) 0x446fd MOV (%RSP),%R9 |
(822) 0x44701 MOV %R9,%RSI |
(822) 0x44704 TEST $0x4,%R15B |
(822) 0x44708 JE 44760 |
(822) 0x4470a MOV 0x40(%RSP),%R9 |
(822) 0x4470f VBROADCASTSD %XMM14,%YMM15 |
(822) 0x44714 NOPW %CS:(%RAX,%RAX,1) |
(828) 0x44720 VMULPD (%R13,%RSI,8),%YMM5,%YMM16 |
(828) 0x44728 VFMADD231PD (%R8,%RSI,8),%YMM9,%YMM16 |
(828) 0x4472f VFMADD231PD (%RDI,%RSI,8),%YMM10,%YMM16 |
(828) 0x44736 VFMADD231PD (%RDX,%RSI,8),%YMM11,%YMM16 |
(828) 0x4473d VFMADD213PD (%R12,%RSI,8),%YMM15,%YMM16 |
(828) 0x44744 VMOVUPD %YMM16,(%R12,%RSI,8) |
(828) 0x4474b ADD $0x4,%RSI |
(828) 0x4474f CMP %RSI,%R9 |
(828) 0x44752 JNE 44720 |
(822) 0x44754 MOV %R9,%RSI |
(822) 0x44757 CMP %R15,%R9 |
(822) 0x4475a JE 44200 |
(827) 0x44760 VMULSD (%R13,%R9,8),%XMM2,%XMM15 |
(827) 0x44767 VFMADD231SD (%R8,%R9,8),%XMM12,%XMM15 |
(827) 0x4476d VFMADD231SD (%RDI,%R9,8),%XMM6,%XMM15 |
(827) 0x44773 VFMADD231SD (%RDX,%R9,8),%XMM13,%XMM15 |
(827) 0x44779 VFMADD213SD (%R12,%R9,8),%XMM14,%XMM15 |
(827) 0x4477f VMOVSD %XMM15,(%R12,%R9,8) |
(827) 0x44785 INC %R9 |
(827) 0x44788 CMP %R9,%R15 |
(827) 0x4478b JNE 44760 |
(822) 0x4478d JMP 44200 |
0x44792 MOV 0xa8(%RSP),%RDI |
0x4479a VZEROUPPER |
0x4479d CALL 4e910 <@plt_start@+0x260> |
0x447a2 MOV 0x30(%R13),%EAX |
0x447a6 MOV 0xa0(%RSP),%R15 |
0x447ae TEST %EAX,%EAX |
0x447b0 JLE 44811 |
0x447b2 XOR %EBX,%EBX |
0x447b4 XOR %R14D,%R14D |
0x447b7 JMP 447cc |
0x447b9 NOPL (%RAX) |
(820) 0x447c0 MOVSXD %EAX,%RCX |
(820) 0x447c3 ADD $0x18,%RBX |
(820) 0x447c7 CMP %RCX,%R14 |
(820) 0x447ca JGE 44811 |
(820) 0x447cc MOV 0x40(%R13),%ECX |
(820) 0x447d0 MOV 0x8(%R13),%ESI |
(820) 0x447d4 MOV %R14D,%EDX |
(820) 0x447d7 INC %R14 |
(820) 0x447da IMUL %EAX,%EDX |
(820) 0x447dd IMUL %R14D,%ECX |
(820) 0x447e1 CMP %ECX,%ESI |
(820) 0x447e3 CMOVL %ESI,%ECX |
(820) 0x447e6 SUB %EDX,%ECX |
(820) 0x447e8 JLE 447c0 |
(820) 0x447ea MOV 0x310(%R13),%RAX |
(820) 0x447f1 MOVSXD %EDX,%RDI |
(820) 0x447f4 MOV %ECX,%EDX |
(820) 0x447f6 SAL $0x3,%RDX |
(820) 0x447fa SAL $0x3,%RDI |
(820) 0x447fe ADD 0x18(%R15),%RDI |
(820) 0x44802 MOV (%RAX,%RBX,1),%RSI |
(820) 0x44806 CALL 4ed20 <@plt_start@+0x670> |
(820) 0x4480b MOV 0x30(%R13),%EAX |
(820) 0x4480f JMP 447c0 |
0x44811 LEA -0x28(%RBP),%RSP |
0x44815 POP %RBX |
0x44816 POP %R12 |
0x44818 POP %R13 |
0x4481a POP %R14 |
0x4481c POP %R15 |
0x4481e POP %RBP |
0x4481f RET |
0x44820 MOV %RAX,%RDI |
0x44823 CALL 11780 <__clang_call_terminate> |
0x44828 INT $0x3 |
0x44829 INT $0x3 |
0x4482a INT $0x3 |
0x4482b INT $0x3 |
0x4482c INT $0x3 |
0x4482d INT $0x3 |
0x4482e INT $0x3 |
0x4482f INT $0x3 |
Path / |
Source file and lines | einspline_spo_ref.hpp:172-189 |
Module | libqmcwfs.so |
nb instructions | 111 |
nb uops | 100 |
loop length | 590 |
used x86 registers | 12 |
used mmx registers | 0 |
used xmm registers | 10 |
used ymm registers | 1 |
used zmm registers | 2 |
nb stack references | 11 |
ADD-SUB / MUL ratio | 1.50 |
micro-operation queue | 16.67 cycles |
front end | 16.67 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 4.50 | 4.00 | 3.75 | 3.75 | 4.00 | 12.67 | 12.67 | 12.67 | 6.25 | 6.42 | 6.17 | 6.17 | 4.50 | 4.50 |
cycles | 4.50 | 4.00 | 3.75 | 3.75 | 4.00 | 12.67 | 12.67 | 12.67 | 6.25 | 6.42 | 6.17 | 6.17 | 4.50 | 4.50 |
Cycles executing div or sqrt instructions | NA |
Front-end | 16.67 |
Dispatch | 12.67 |
Overall L1 | 16.67 |
all | 18% |
load | 0% |
store | 25% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 16% |
all | 57% |
load | 44% |
store | 100% |
mul | 100% |
add-sub | 33% |
fma | 66% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 52% |
all | 49% |
load | 38% |
store | 70% |
mul | 100% |
add-sub | 33% |
fma | 66% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 44% |
all | 14% |
load | 8% |
store | 21% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 9% |
all | 23% |
load | 18% |
store | 50% |
mul | 25% |
add-sub | 16% |
fma | 20% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 19% |
all | 21% |
load | 16% |
store | 38% |
mul | 25% |
add-sub | 16% |
fma | 20% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 16% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
AND $-0x40,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB $0x200,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x358(%RDI),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %EDX,%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CALL 4e900 <@plt_start@+0x250> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVSXD %R12D,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x128(%R13),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA (%RCX,%RCX,2),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SAL $0x3,%RAX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD 0x40(%R13),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
CMP %ECX,0x124(%R13) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV %RBX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMOVE %RDX,%RAX | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMPL $0,0x30(%RBX) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
JLE 44792 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0xc52> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
VMOVUPD 0x100(%R13),%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVUPD 0x8(%RAX),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVSD (%RAX),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVSD -0x3b9ef(%RIP),%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVSD -0x3b951(%RIP),%XMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVAPD -0x3ba4b(%RIP),%XMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVSD -0x3b9e5(%RIP),%XMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVHPD 0x118(%R13),%XMM2,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
VMULPD %XMM1,%XMM2,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPERMILPD $0x1,%XMM2,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
VFMADD231SD 0xe8(%R13),%XMM0,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDSD %XMM3,%XMM2,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VROUNDSD $0x9,%XMM2,%XMM2,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VSUBSD %XMM3,%XMM2,%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VXORPD %XMM3,%XMM3,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VCMPSD $0x1,%XMM3,%XMM2,%K1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVAPD %XMM5,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD %XMM3,%XMM4,%XMM4{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
VCMPSD $0xe,-0x3ba29(%RIP),%XMM2,%K1 | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVDDUP %XMM1,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
VPERMILPD $0x3,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
VBROADCASTF128 -0x3baac(%RIP),%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVDQA %YMM3,0x100(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VMOVSD %XMM4,%XMM5,%XMM5{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
VMOVDDUP %XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
VMULPD 0xd8(%R13),%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVDDUP -0x3b9f0(%RIP),%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVAPD %XMM5,0xf0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VFMADD231PD 0xf0(%R13),%XMM2,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD -0x3b9fc(%RIP),%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 5 | 1 |
VMOVAPD %XMM4,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VMOVAPD %ZMM2,0x180(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 1 | 1 | 5 | 2 |
VFMADD132PD 0x108(%R13),%XMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VCMPPD $0x1,%XMM0,%XMM1,%K1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VCMPPD $0xe,-0x3baac(%RIP){1to0},%XMM1,%K0{%K1} | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VROUNDPD $0x9,%XMM1,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
KNOTW %K0,%K1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VSUBPD %XMM0,%XMM1,%XMM0{%K1}{z} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VBROADCASTSD -0x3ba3e(%RIP),%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 5 | 1 |
VMOVAPD %XMM0,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VPERMILPD $0x1,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
VMOVAPD %XMM0,0xd0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VMOVAPD %ZMM1,0x140(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 1 | 1 | 5 | 2 |
JMP 43d20 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x1e0> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOV 0xa8(%RSP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4e910 <@plt_start@+0x260> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x30(%R13),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0xa0(%RSP),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
TEST %EAX,%EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 44811 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0xcd1> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %R14D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
JMP 447cc <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0xc8c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
LEA -0x28(%RBP),%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 11780 <__clang_call_terminate> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 |
Source file and lines | einspline_spo_ref.hpp:172-189 |
Module | libqmcwfs.so |
nb instructions | 111 |
nb uops | 100 |
loop length | 590 |
used x86 registers | 12 |
used mmx registers | 0 |
used xmm registers | 10 |
used ymm registers | 1 |
used zmm registers | 2 |
nb stack references | 11 |
ADD-SUB / MUL ratio | 1.50 |
micro-operation queue | 16.67 cycles |
front end | 16.67 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 4.50 | 4.00 | 3.75 | 3.75 | 4.00 | 12.67 | 12.67 | 12.67 | 6.25 | 6.42 | 6.17 | 6.17 | 4.50 | 4.50 |
cycles | 4.50 | 4.00 | 3.75 | 3.75 | 4.00 | 12.67 | 12.67 | 12.67 | 6.25 | 6.42 | 6.17 | 6.17 | 4.50 | 4.50 |
Cycles executing div or sqrt instructions | NA |
Front-end | 16.67 |
Dispatch | 12.67 |
Overall L1 | 16.67 |
all | 18% |
load | 0% |
store | 25% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 16% |
all | 57% |
load | 44% |
store | 100% |
mul | 100% |
add-sub | 33% |
fma | 66% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 52% |
all | 49% |
load | 38% |
store | 70% |
mul | 100% |
add-sub | 33% |
fma | 66% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 44% |
all | 14% |
load | 8% |
store | 21% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 9% |
all | 23% |
load | 18% |
store | 50% |
mul | 25% |
add-sub | 16% |
fma | 20% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 19% |
all | 21% |
load | 16% |
store | 38% |
mul | 25% |
add-sub | 16% |
fma | 20% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 16% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
AND $-0x40,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB $0x200,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x358(%RDI),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %EDX,%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CALL 4e900 <@plt_start@+0x250> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVSXD %R12D,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x128(%R13),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA (%RCX,%RCX,2),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SAL $0x3,%RAX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD 0x40(%R13),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
CMP %ECX,0x124(%R13) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV %RBX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMOVE %RDX,%RAX | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMPL $0,0x30(%RBX) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
JLE 44792 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0xc52> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
VMOVUPD 0x100(%R13),%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVUPD 0x8(%RAX),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVSD (%RAX),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVSD -0x3b9ef(%RIP),%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVSD -0x3b951(%RIP),%XMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVAPD -0x3ba4b(%RIP),%XMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVSD -0x3b9e5(%RIP),%XMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVHPD 0x118(%R13),%XMM2,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
VMULPD %XMM1,%XMM2,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPERMILPD $0x1,%XMM2,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
VFMADD231SD 0xe8(%R13),%XMM0,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDSD %XMM3,%XMM2,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VROUNDSD $0x9,%XMM2,%XMM2,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VSUBSD %XMM3,%XMM2,%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VXORPD %XMM3,%XMM3,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VCMPSD $0x1,%XMM3,%XMM2,%K1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVAPD %XMM5,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD %XMM3,%XMM4,%XMM4{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
VCMPSD $0xe,-0x3ba29(%RIP),%XMM2,%K1 | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVDDUP %XMM1,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
VPERMILPD $0x3,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
VBROADCASTF128 -0x3baac(%RIP),%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVDQA %YMM3,0x100(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VMOVSD %XMM4,%XMM5,%XMM5{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
VMOVDDUP %XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
VMULPD 0xd8(%R13),%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVDDUP -0x3b9f0(%RIP),%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVAPD %XMM5,0xf0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VFMADD231PD 0xf0(%R13),%XMM2,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD -0x3b9fc(%RIP),%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 5 | 1 |
VMOVAPD %XMM4,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VMOVAPD %ZMM2,0x180(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 1 | 1 | 5 | 2 |
VFMADD132PD 0x108(%R13),%XMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VCMPPD $0x1,%XMM0,%XMM1,%K1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VCMPPD $0xe,-0x3baac(%RIP){1to0},%XMM1,%K0{%K1} | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VROUNDPD $0x9,%XMM1,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
KNOTW %K0,%K1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VSUBPD %XMM0,%XMM1,%XMM0{%K1}{z} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VBROADCASTSD -0x3ba3e(%RIP),%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 5 | 1 |
VMOVAPD %XMM0,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VPERMILPD $0x1,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
VMOVAPD %XMM0,0xd0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VMOVAPD %ZMM1,0x140(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 1 | 1 | 5 | 2 |
JMP 43d20 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x1e0> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOV 0xa8(%RSP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4e910 <@plt_start@+0x260> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x30(%R13),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0xa0(%RSP),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
TEST %EAX,%EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 44811 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0xcd1> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %R14D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
JMP 447cc <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0xc8c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
LEA -0x28(%RBP),%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 11780 <__clang_call_terminate> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼miniqmcreference::einspline_spo_ref | 25.92 | 48.51 |
▼Loop 821 - MultiBsplineRef.hpp:42-71 - libqmcwfs.so– | 0.02 | 0.04 |
▼Loop 822 - MultiBsplineRef.hpp:63-71 - libqmcwfs.so– | 0 | 0.01 |
○Loop 823 - MultiBsplineRef.hpp:68-70 - libqmcwfs.so | 6.51 | 11.92 |
○Loop 826 - MultiBsplineRef.hpp:68-70 - libqmcwfs.so | 6.47 | 11.85 |
○Loop 824 - MultiBsplineRef.hpp:68-70 - libqmcwfs.so | 6.44 | 11.8 |
○Loop 825 - MultiBsplineRef.hpp:68-70 - libqmcwfs.so | 6.43 | 11.78 |
○Loop 834 - MultiBsplineRef.hpp:68-70 - libqmcwfs.so | 0 | 0 |
○Loop 829 - MultiBsplineRef.hpp:68-70 - libqmcwfs.so | 0 | 0 |
○Loop 832 - MultiBsplineRef.hpp:68-70 - libqmcwfs.so | 0 | 0 |
○Loop 831 - MultiBsplineRef.hpp:68-70 - libqmcwfs.so | 0 | 0 |
○Loop 830 - MultiBsplineRef.hpp:68-70 - libqmcwfs.so | 0 | 0 |
○Loop 833 - MultiBsplineRef.hpp:68-71 - libqmcwfs.so | 0 | 0 |
○Loop 828 - MultiBsplineRef.hpp:68-70 - libqmcwfs.so | 0 | 0 |
○Loop 827 - MultiBsplineRef.hpp:68-70 - libqmcwfs.so | 0 | 0 |
○Loop 820 - einspline_spo_ref.hpp:183-187 - libqmcwfs.so | 0 | 0.01 |