Function: _ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6 ... | Module: libqmcwfs.so | Source: einspline_spo_ref.hpp:172-189 [...] | Coverage: 28.96% |
---|
Function: _ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6 ... | Module: libqmcwfs.so | Source: einspline_spo_ref.hpp:172-189 [...] | Coverage: 28.96% |
---|
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/Utilities/NewTimer.h: 242 - 249 |
-------------------------------------------------------------------------------- |
242: ScopeGuard(TIMER& t) : timer(t) { timer.start(); } |
[...] |
249: ~ScopeGuard() { timer.stop(); } |
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/Particle/ParticleSet.h: 143 - 143 |
-------------------------------------------------------------------------------- |
143: return (active_ptcl_ == iat) ? active_pos_ : R[iat]; |
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/Numerics/Spline2/MultiBsplineEvalHelper.hpp: 53 - 63 |
-------------------------------------------------------------------------------- |
53: if (x < 0) |
[...] |
60: ind = static_cast<int>(x); |
61: dx = x - ind; |
62: // upper bound |
63: if (ind > nmax) |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/stl_vector.h: 1046 - 1169 |
-------------------------------------------------------------------------------- |
1046: return *(this->_M_impl._M_start + __n); |
[...] |
1169: { return _M_data_ptr(this->_M_impl._M_start); } |
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/Numerics/Spline2/MultiBsplineData.hpp: 54 - 57 |
-------------------------------------------------------------------------------- |
54: a[0] = ((A00 * tx + A01) * tx + A02) * tx + A03; |
55: a[1] = ((A10 * tx + A11) * tx + A12) * tx + A13; |
56: a[2] = ((A20 * tx + A21) * tx + A22) * tx + A23; |
57: a[3] = ((A30 * tx + A31) * tx + A32) * tx + A33; |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/stl_algobase.h: 235 - 924 |
-------------------------------------------------------------------------------- |
235: if (__b < __a) |
[...] |
429: const ptrdiff_t _Num = __last - __first; |
430: if (_Num) |
431: __builtin_memmove(__result, __first, sizeof(_Tp) * _Num); |
[...] |
923: for (; __first != __last; ++__first) |
924: *__first = __tmp; |
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/TinyVectorTensorOps.h: 150 - 151 |
-------------------------------------------------------------------------------- |
150: return TinyVector<Type_t, 3>(lhs[0] * rhs[0] + lhs[1] * rhs[3] + lhs[2] * rhs[6], |
151: lhs[0] * rhs[1] + lhs[1] * rhs[4] + lhs[2] * rhs[7], |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/stl_algo.h: 725 - 751 |
-------------------------------------------------------------------------------- |
725: { return std::copy(__first, __first + __n, __result); } |
[...] |
751: if (__n2 <= 0) |
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/einspline_spo_ref.hpp: 172 - 189 |
-------------------------------------------------------------------------------- |
172: ScopedTimer local_timer(timer); |
173: |
174: auto u = Lattice.toUnit_floor(P.activeR(iat)); |
175: for (int i = 0; i < nBlocks; ++i) |
176: MultiBsplineEvalRef::evaluate_v(einsplines[i], u[0], u[1], u[2], psi[i].data(), nSplinesPerBlock); |
177: } |
178: |
179: inline void evaluate(const ParticleSet& P, int iat, ValueVector_t& psi_v) |
180: { |
181: evaluate_v(P, iat); |
182: |
183: for (int i = 0; i < nBlocks; ++i) |
184: { |
185: // in real simulation, phase needs to be applied. Here just fake computation |
186: const int first = i * nBlocks; |
187: std::copy_n(psi[i].data(), std::min((i + 1) * nSplinesPerBlock, OrbitalSetSize) - first, psi_v.data() + first); |
188: } |
189: } |
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/Particle/Lattice/CrystalLattice.h: 170 - 170 |
-------------------------------------------------------------------------------- |
170: if (-std::numeric_limits<T1>::epsilon() < val_dot[i] && val_dot[i] < 0) |
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/Numerics/Spline2/MultiBsplineRef.hpp: 42 - 71 |
-------------------------------------------------------------------------------- |
42: x -= spline_m->x_grid.start; |
43: y -= spline_m->y_grid.start; |
44: z -= spline_m->z_grid.start; |
45: T tx, ty, tz; |
46: int ix, iy, iz; |
47: spline2::getSplineBound(x * spline_m->x_grid.delta_inv, tx, ix, spline_m->x_grid.num - 1); |
48: spline2::getSplineBound(y * spline_m->y_grid.delta_inv, ty, iy, spline_m->y_grid.num - 1); |
49: spline2::getSplineBound(z * spline_m->z_grid.delta_inv, tz, iz, spline_m->z_grid.num - 1); |
[...] |
56: const intptr_t xs = spline_m->x_stride; |
57: const intptr_t ys = spline_m->y_stride; |
58: const intptr_t zs = spline_m->z_stride; |
59: |
60: constexpr T zero(0); |
61: std::fill(vals, vals + num_splines, zero); |
62: |
63: for (size_t i = 0; i < 4; i++) |
64: for (size_t j = 0; j < 4; j++) |
65: { |
66: const T pre00 = a[i] * b[j]; |
67: const T* restrict coefs = spline_m->coefs + (ix + i) * xs + (iy + j) * ys + iz * zs; |
68: for (size_t n = 0; n < num_splines; n++) |
69: vals[n] += pre00 * |
70: (c[0] * coefs[n] + c[1] * coefs[n + zs] + c[2] * coefs[n + 2 * zs] + |
71: c[3] * coefs[n + 3 * zs]); |
0x43e30 PUSH %RBP |
0x43e31 MOV %RSP,%RBP |
0x43e34 PUSH %R15 |
0x43e36 PUSH %R14 |
0x43e38 PUSH %R13 |
0x43e3a PUSH %R12 |
0x43e3c PUSH %RBX |
0x43e3d AND $-0x40,%RSP |
0x43e41 SUB $0x200,%RSP |
0x43e48 MOV %RDI,%RBX |
0x43e4b MOV 0x358(%RDI),%RDI |
0x43e52 MOV %RCX,0xa0(%RSP) |
0x43e5a MOV %EDX,%R12D |
0x43e5d MOV %RSI,%R13 |
0x43e60 MOV %RDI,0xa8(%RSP) |
0x43e68 CALL 4ebf0 <@plt_start@+0x250> |
0x43e6d MOVSXD %R12D,%RCX |
0x43e70 LEA 0x128(%R13),%RDX |
0x43e77 LEA (%RCX,%RCX,2),%RAX |
0x43e7b SAL $0x3,%RAX |
0x43e7f ADD 0x40(%R13),%RAX |
0x43e83 CMP %ECX,0x124(%R13) |
0x43e8a MOV %RBX,%R13 |
0x43e8d CMOVE %RDX,%RAX |
0x43e91 CMPL $0,0x30(%RBX) |
0x43e95 JLE 44a82 |
0x43e9b VMOVUPD 0x100(%R13),%XMM2 |
0x43ea4 VMOVUPD 0x8(%RAX),%XMM1 |
0x43ea9 VMOVSD (%RAX),%XMM0 |
0x43ead VMOVSD -0x3bbdf(%RIP),%XMM18 |
0x43eb7 VMOVSD -0x3bb41(%RIP),%XMM19 |
0x43ec1 VMOVAPD -0x3bc3b(%RIP),%XMM20 |
0x43ecb VMOVSD -0x3bbd5(%RIP),%XMM21 |
0x43ed5 XOR %ESI,%ESI |
0x43ed7 MOV %R13,0xb0(%RSP) |
0x43edf VMOVHPD 0x118(%R13),%XMM2,%XMM2 |
0x43ee8 VMULPD %XMM1,%XMM2,%XMM2 |
0x43eec VPERMILPD $0x1,%XMM2,%XMM3 |
0x43ef2 VFMADD231SD 0xe8(%R13),%XMM0,%XMM2 |
0x43efb VADDSD %XMM3,%XMM2,%XMM2 |
0x43eff VROUNDSD $0x9,%XMM2,%XMM2,%XMM3 |
0x43f05 VSUBSD %XMM3,%XMM2,%XMM5 |
0x43f09 VXORPD %XMM3,%XMM3,%XMM3 |
0x43f0d VCMPSD $0x1,%XMM3,%XMM2,%K1 |
0x43f14 VMOVAPD %XMM5,%XMM4 |
0x43f18 VMOVSD %XMM3,%XMM4,%XMM4{%K1} |
0x43f1e VCMPSD $0xe,-0x3bc19(%RIP),%XMM2,%K1 |
0x43f29 VMOVDDUP %XMM1,%XMM2 |
0x43f2d VPERMILPD $0x3,%XMM1,%XMM1 |
0x43f33 VBROADCASTF128 -0x3bc9c(%RIP),%YMM3 |
0x43f3c VMOVDQA %YMM3,0x100(%RSP) |
0x43f45 VMOVSD %XMM4,%XMM5,%XMM5{%K1} |
0x43f4b VMOVDDUP %XMM0,%XMM0 |
0x43f4f VMULPD 0xd8(%R13),%XMM0,%XMM0 |
0x43f58 VMOVDDUP -0x3bbe0(%RIP),%XMM4 |
0x43f60 VMOVAPD %XMM5,0xf0(%RSP) |
0x43f69 VFMADD231PD 0xf0(%R13),%XMM2,%XMM0 |
0x43f72 VBROADCASTSD -0x3bbec(%RIP),%ZMM2 |
0x43f7c VMOVAPD %XMM4,0xc0(%RSP) |
0x43f85 VMOVAPD %ZMM2,0x180(%RSP) |
0x43f8d VFMADD132PD 0x108(%R13),%XMM0,%XMM1 |
0x43f96 VXORPD %XMM0,%XMM0,%XMM0 |
0x43f9a VCMPPD $0x1,%XMM0,%XMM1,%K1 |
0x43fa1 VCMPPD $0xe,-0x3bc9c(%RIP){1to0},%XMM1,%K0{%K1} |
0x43fac VROUNDPD $0x9,%XMM1,%XMM0 |
0x43fb2 KNOTW %K0,%K1 |
0x43fb6 VSUBPD %XMM0,%XMM1,%XMM0{%K1}{z} |
0x43fbc VBROADCASTSD -0x3bc2e(%RIP),%ZMM1 |
0x43fc6 VMOVAPD %XMM0,0xe0(%RSP) |
0x43fcf VPERMILPD $0x1,%XMM0,%XMM0 |
0x43fd5 VMOVAPD %XMM0,0xd0(%RSP) |
0x43fde VMOVAPD %ZMM1,0x140(%RSP) |
0x43fe6 JMP 44010 |
0x43fe8 NOPL (%RAX,%RAX,1) |
(821) 0x43ff0 MOV 0xb0(%RSP),%R13 |
(821) 0x43ff8 MOV 0xb8(%RSP),%RSI |
(821) 0x44000 MOVSXD 0x30(%R13),%RAX |
(821) 0x44004 INC %RSI |
(821) 0x44007 CMP %RAX,%RSI |
(821) 0x4400a JGE 44a82 |
(821) 0x44010 MOV 0x2f8(%R13),%RAX |
(821) 0x44017 VMOVAPD 0xe0(%RSP),%XMM0 |
(821) 0x44020 VXORPD %XMM6,%XMM6,%XMM6 |
(821) 0x44024 MOV (%RAX,%RSI,8),%R14 |
(821) 0x44028 VSUBSD 0x28(%R14),%XMM0,%XMM0 |
(821) 0x4402e VMULSD 0x48(%R14),%XMM0,%XMM0 |
(821) 0x44034 VUCOMISD %XMM6,%XMM0 |
(821) 0x44038 JAE 44050 |
(821) 0x4403a XOR %EAX,%EAX |
(821) 0x4403c MOV %RAX,0x8(%RSP) |
(821) 0x44041 VXORPD %XMM0,%XMM0,%XMM0 |
(821) 0x44045 JMP 44085 |
0x44047 NOPW (%RAX,%RAX,1) |
(821) 0x44050 MOV 0x38(%R14),%EAX |
(821) 0x44054 VROUNDSD $0xb,%XMM0,%XMM0,%XMM1 |
(821) 0x4405a VCVTTSD2SI %XMM0,%EDX |
(821) 0x4405e VSUBSD %XMM1,%XMM0,%XMM1 |
(821) 0x44062 VMOVAPD %XMM21,%XMM0 |
(821) 0x44068 CMP %EDX,%EAX |
(821) 0x4406a LEA -0x1(%RAX),%ECX |
(821) 0x4406d SETG %AL |
(821) 0x44070 CMOVG %EDX,%ECX |
(821) 0x44073 KMOVD %EAX,%K1 |
(821) 0x44077 MOVSXD %ECX,%RAX |
(821) 0x4407a VMOVSD %XMM1,%XMM0,%XMM0{%K1} |
(821) 0x44080 MOV %RAX,0x8(%RSP) |
(821) 0x44085 VMOVAPD 0xd0(%RSP),%XMM1 |
(821) 0x4408e VSUBSD 0x50(%R14),%XMM1,%XMM1 |
(821) 0x44094 VMULSD 0x70(%R14),%XMM1,%XMM1 |
(821) 0x4409a VUCOMISD %XMM6,%XMM1 |
(821) 0x4409e JAE 440b0 |
(821) 0x440a0 XOR %EBX,%EBX |
(821) 0x440a2 JMP 440e0 |
0x440a4 NOPW %CS:(%RAX,%RAX,1) |
(821) 0x440b0 MOV 0x60(%R14),%EAX |
(821) 0x440b4 VROUNDSD $0xb,%XMM1,%XMM1,%XMM2 |
(821) 0x440ba VCVTTSD2SI %XMM1,%EDX |
(821) 0x440be VMOVAPD %XMM21,%XMM6 |
(821) 0x440c4 VSUBSD %XMM2,%XMM1,%XMM1 |
(821) 0x440c8 CMP %EDX,%EAX |
(821) 0x440ca LEA -0x1(%RAX),%ECX |
(821) 0x440cd SETG %AL |
(821) 0x440d0 CMOVG %EDX,%ECX |
(821) 0x440d3 KMOVD %EAX,%K1 |
(821) 0x440d7 MOVSXD %ECX,%RBX |
(821) 0x440da VMOVSD %XMM1,%XMM6,%XMM6{%K1} |
(821) 0x440e0 VMOVAPD 0xf0(%RSP),%XMM1 |
(821) 0x440e9 VXORPD %XMM7,%XMM7,%XMM7 |
(821) 0x440ed VSUBSD 0x78(%R14),%XMM1,%XMM1 |
(821) 0x440f3 VMULSD 0x98(%R14),%XMM1,%XMM1 |
(821) 0x440fc VUCOMISD %XMM7,%XMM1 |
(821) 0x44100 JAE 44110 |
(821) 0x44102 XOR %R8D,%R8D |
(821) 0x44105 JMP 44143 |
0x44107 NOPW (%RAX,%RAX,1) |
(821) 0x44110 MOV 0x88(%R14),%EAX |
(821) 0x44117 VROUNDSD $0xb,%XMM1,%XMM1,%XMM2 |
(821) 0x4411d VCVTTSD2SI %XMM1,%EDX |
(821) 0x44121 VMOVAPD %XMM21,%XMM7 |
(821) 0x44127 VSUBSD %XMM2,%XMM1,%XMM1 |
(821) 0x4412b CMP %EDX,%EAX |
(821) 0x4412d LEA -0x1(%RAX),%ECX |
(821) 0x44130 SETG %AL |
(821) 0x44133 CMOVG %EDX,%ECX |
(821) 0x44136 KMOVD %EAX,%K1 |
(821) 0x4413a MOVSXD %ECX,%R8 |
(821) 0x4413d VMOVSD %XMM1,%XMM7,%XMM7{%K1} |
(821) 0x44143 VMULSD %XMM18,%XMM0,%XMM2 |
(821) 0x44149 VMOVDDUP %XMM0,%XMM4 |
(821) 0x4414d VMULSD %XMM0,%XMM0,%XMM1 |
(821) 0x44151 MOV 0x310(%R13),%RCX |
(821) 0x44158 LEA (%RSI,%RSI,2),%RAX |
(821) 0x4415c MOVSXD 0x40(%R13),%R15 |
(821) 0x44160 MOV %RSI,0xb8(%RSP) |
(821) 0x44168 VSUBSD %XMM2,%XMM19,%XMM3 |
(821) 0x4416e VBLENDPD $0x2,0xc0(%RSP),%XMM3,%XMM3 |
(821) 0x44179 VBROADCASTSD %XMM1,%YMM1 |
(821) 0x4417e VMOVDDUP %XMM2,%XMM2 |
(821) 0x44182 MOV (%RCX,%RAX,8),%R12 |
(821) 0x44186 VMULPD %XMM4,%XMM3,%XMM3 |
(821) 0x4418a VUNPCKLPD %XMM1,%XMM4,%XMM4 |
(821) 0x4418e VMULSD %XMM1,%XMM2,%XMM1 |
(821) 0x44192 VMULSD %XMM6,%XMM6,%XMM2 |
(821) 0x44196 VPERMILPD $0x1,%XMM3,%XMM5 |
(821) 0x4419c VADDPD %XMM20,%XMM3,%XMM3 |
(821) 0x441a2 VBROADCASTSD %XMM1,%YMM1 |
(821) 0x441a7 VSUBSD %XMM5,%XMM19,%XMM5 |
(821) 0x441ad VMULPD %XMM4,%XMM3,%XMM3 |
(821) 0x441b1 VFMADD213SD %XMM19,%XMM0,%XMM5 |
(821) 0x441b7 VMULSD %XMM0,%XMM5,%XMM0 |
(821) 0x441bb VBROADCASTSD %XMM0,%YMM0 |
(821) 0x441c0 VBLENDPD $0x4,%YMM0,%YMM3,%YMM0 |
(821) 0x441c6 VADDPD 0x100(%RSP),%YMM0,%YMM0 |
(821) 0x441cf VBLENDPD $0x8,%YMM1,%YMM0,%YMM0 |
(821) 0x441d5 VMULSD %XMM18,%XMM6,%XMM1 |
(821) 0x441db VMOVUPD %YMM0,0x120(%RSP) |
(821) 0x441e4 VMULSD %XMM19,%XMM6,%XMM0 |
(821) 0x441ea VADDSD -0x3be84(%RIP),%XMM0,%XMM23 |
(821) 0x441f4 MOV 0x10(%R14),%RAX |
(821) 0x441f8 MOV 0x18(%R14),%R13 |
(821) 0x441fc MOV 0x20(%R14),%RCX |
(821) 0x44200 VSUBSD %XMM1,%XMM19,%XMM22 |
(821) 0x44206 VFMADD213SD -0x3bec8(%RIP),%XMM6,%XMM22 |
(821) 0x44210 VFMADD213SD -0x3bf52(%RIP),%XMM2,%XMM23 |
(821) 0x4421a MOV %RAX,0x68(%RSP) |
(821) 0x4421f TEST %R15D,%R15D |
(821) 0x44222 JE 442d5 |
(821) 0x44228 LEA (,%R15,8),%RDX |
(821) 0x44230 MOV %R12,%RDI |
(821) 0x44233 XOR %ESI,%ESI |
(821) 0x44235 VMOVSD %XMM22,0x38(%RSP) |
(821) 0x4423d VMOVSD %XMM23,0x30(%RSP) |
(821) 0x44245 VMOVAPD %XMM6,0x70(%RSP) |
(821) 0x4424b VMOVAPD %XMM7,0x50(%RSP) |
(821) 0x44251 VMOVSD %XMM1,0x28(%RSP) |
(821) 0x44257 VMOVSD %XMM0,0x20(%RSP) |
(821) 0x4425d VMOVSD %XMM2,0x18(%RSP) |
(821) 0x44263 MOV %R8,0x10(%RSP) |
(821) 0x44268 MOV %RCX,0x48(%RSP) |
(821) 0x4426d VZEROUPPER |
(821) 0x44270 CALL 4efb0 <@plt_start@+0x610> |
(821) 0x44275 VMOVSD 0x18(%RSP),%XMM2 |
(821) 0x4427b VMOVSD 0x20(%RSP),%XMM0 |
(821) 0x44281 VMOVSD 0x28(%RSP),%XMM1 |
(821) 0x44287 VMOVAPD 0x50(%RSP),%XMM7 |
(821) 0x4428d VMOVAPD 0x70(%RSP),%XMM6 |
(821) 0x44293 VMOVSD 0x30(%RSP),%XMM23 |
(821) 0x4429b VMOVSD 0x38(%RSP),%XMM22 |
(821) 0x442a3 VMOVSD -0x3bfad(%RIP),%XMM21 |
(821) 0x442ad VMOVAPD -0x3c027(%RIP),%XMM20 |
(821) 0x442b7 VMOVSD -0x3bf41(%RIP),%XMM19 |
(821) 0x442c1 VMOVSD -0x3bff3(%RIP),%XMM18 |
(821) 0x442cb MOV 0x48(%RSP),%RCX |
(821) 0x442d0 MOV 0x10(%RSP),%R8 |
(821) 0x442d5 VMULSD %XMM18,%XMM7,%XMM3 |
(821) 0x442db LEA 0x2(%RBX),%RAX |
(821) 0x442df VSUBSD %XMM0,%XMM19,%XMM0 |
(821) 0x442e5 LEA 0x1(%RBX),%R11 |
(821) 0x442e9 VMOVDDUP %XMM7,%XMM5 |
(821) 0x442ed LEA 0x18(,%R8,8),%RDX |
(821) 0x442f5 MOV 0x8(%R14),%R9 |
(821) 0x442f9 VFMADD213SD %XMM18,%XMM6,%XMM22 |
(821) 0x442ff VMULSD %XMM2,%XMM1,%XMM1 |
(821) 0x44303 VMULSD %XMM7,%XMM7,%XMM2 |
(821) 0x44307 VMOVAPD 0x140(%RSP),%ZMM8 |
(821) 0x4430f MOV %RAX,0x10(%RSP) |
(821) 0x44314 LEA 0x3(%RBX),%RAX |
(821) 0x44318 MOV %RAX,0x50(%RSP) |
(821) 0x4431d MOV %RBX,%RAX |
(821) 0x44320 MOV 0x8(%RSP),%RBX |
(821) 0x44325 IMUL %R13,%RAX |
(821) 0x44329 IMUL %RCX,%RDX |
(821) 0x4432d SAL $0x3,%R13 |
(821) 0x44331 VSUBSD %XMM3,%XMM19,%XMM4 |
(821) 0x44337 VBLENDPD $0x2,0xc0(%RSP),%XMM4,%XMM4 |
(821) 0x44342 IMUL 0x68(%RSP),%RBX |
(821) 0x44348 VFMADD213SD %XMM19,%XMM6,%XMM0 |
(821) 0x4434e VBROADCASTSD %XMM2,%YMM2 |
(821) 0x44353 VBROADCASTSD %XMM3,%YMM3 |
(821) 0x44358 SALQ $0x3,0x68(%RSP) |
(821) 0x4435e SAL $0x3,%RAX |
(821) 0x44362 ADD %R9,%RDX |
(821) 0x44365 VFMADD213SD %XMM18,%XMM6,%XMM0 |
(821) 0x4436b LEA (%RAX,%RBX,8),%RSI |
(821) 0x4436f LEA (,%R8,8),%RAX |
(821) 0x44377 VMULPD %XMM5,%XMM4,%XMM4 |
(821) 0x4437b VUNPCKLPD %XMM2,%XMM5,%XMM5 |
(821) 0x4437f LEA (%RDX,%RSI,1),%RDI |
(821) 0x44383 MOV %RAX,%R14 |
(821) 0x44386 IMUL %RCX,%R14 |
(821) 0x4438a MOV %RDI,0x38(%RSP) |
(821) 0x4438f LEA 0x10(,%R8,8),%RDI |
(821) 0x44397 LEA 0x8(,%R8,8),%R8 |
(821) 0x4439f VPERMILPD $0x1,%XMM4,%XMM6 |
(821) 0x443a5 VADDPD %XMM20,%XMM4,%XMM4 |
(821) 0x443ab VSUBSD %XMM6,%XMM19,%XMM6 |
(821) 0x443b1 IMUL %RCX,%RDI |
(821) 0x443b5 LEA (%R9,%R14,1),%RAX |
(821) 0x443b9 IMUL %RCX,%R8 |
(821) 0x443bd ADD %RSI,%RAX |
(821) 0x443c0 VMULPD %XMM5,%XMM4,%XMM4 |
(821) 0x443c4 MOV %RAX,0x70(%RSP) |
(821) 0x443c9 MOV %R11,%RAX |
(821) 0x443cc IMUL %R13,%RAX |
(821) 0x443d0 VFMADD213SD %XMM19,%XMM7,%XMM6 |
(821) 0x443d6 ADD %R9,%RDI |
(821) 0x443d9 ADD %R9,%R8 |
(821) 0x443dc LEA (%RDI,%RSI,1),%R10 |
(821) 0x443e0 LEA (%R8,%RSI,1),%RCX |
(821) 0x443e4 MOV %R10,0x30(%RSP) |
(821) 0x443e9 MOV 0x10(%RSP),%R10 |
(821) 0x443ee LEA (%RAX,%RBX,8),%R11 |
(821) 0x443f2 ADD %R9,%RAX |
(821) 0x443f5 VMULSD %XMM7,%XMM6,%XMM5 |
(821) 0x443f9 LEA (%RDX,%R11,1),%RSI |
(821) 0x443fd MOV %RSI,0x8(%RSP) |
(821) 0x44402 LEA (%RDI,%R11,1),%RSI |
(821) 0x44406 ADD %R8,%R11 |
(821) 0x44409 MOV %RSI,0x28(%RSP) |
(821) 0x4440e LEA (%R14,%RBX,8),%RSI |
(821) 0x44412 VBROADCASTSD %XMM5,%YMM5 |
(821) 0x44417 IMUL %R13,%R10 |
(821) 0x4441b IMUL 0x50(%RSP),%R13 |
(821) 0x44421 MOV %RCX,0x50(%RSP) |
(821) 0x44426 ADD %RSI,%RAX |
(821) 0x44429 VBLENDPD $0x4,%YMM5,%YMM4,%YMM4 |
(821) 0x4442f VMOVAPD 0x180(%RSP),%ZMM5 |
(821) 0x44437 VBLENDPD $0x8,%YMM3,%YMM4,%YMM3 |
(821) 0x4443d VBLENDPD $0x7,0x100(%RSP),%YMM2,%YMM4 |
(821) 0x44448 LEA (%R10,%RBX,8),%R14 |
(821) 0x4444c MOV %R10,%RCX |
(821) 0x4444f ADD %R9,%RCX |
(821) 0x44452 ADD %RSI,%RCX |
(821) 0x44455 LEA (%R13,%RBX,8),%R10 |
(821) 0x4445a LEA (%RDX,%R14,1),%RBX |
(821) 0x4445e ADD %R9,%R13 |
(821) 0x44461 MOV %RBX,0x20(%RSP) |
(821) 0x44466 LEA (%RDI,%R14,1),%RBX |
(821) 0x4446a ADD %RSI,%R13 |
(821) 0x4446d MOV %R15,%RSI |
(821) 0x44470 AND $-0x8,%RSI |
(821) 0x44474 ADD %R8,%R14 |
(821) 0x44477 MOV %RBX,0x18(%RSP) |
(821) 0x4447c MOV 0x8(%RSP),%RBX |
(821) 0x44481 MOV %RSI,(%RSP) |
(821) 0x44485 MOV %R15,%RSI |
(821) 0x44488 AND $-0x4,%RSI |
(821) 0x4448c ADD %R10,%RDX |
(821) 0x4448f ADD %R10,%RDI |
(821) 0x44492 ADD %R10,%R8 |
(821) 0x44495 XOR %R10D,%R10D |
(821) 0x44498 MOV %RSI,0x40(%RSP) |
(821) 0x4449d VADDPD %YMM4,%YMM3,%YMM2 |
(821) 0x444a1 VMULPD %YMM4,%YMM3,%YMM13 |
(821) 0x444a5 VPERMPD %ZMM2,%ZMM5,%ZMM4 |
(821) 0x444ab VPERMPD %ZMM13,%ZMM8,%ZMM8 |
(821) 0x444b1 VEXTRACTF128 $0x1,%YMM2,%XMM6 |
(821) 0x444b7 VBLENDPD $0x8,%YMM13,%YMM2,%YMM3 |
(821) 0x444bd VPERMPD $-0x1,%YMM13,%YMM11 |
(821) 0x444c3 VEXTRACTF128 $0x1,%YMM13,%XMM13 |
(821) 0x444c9 VBROADCASTSD %XMM2,%ZMM5 |
(821) 0x444cf VPERMPD $0x55,%YMM2,%YMM9 |
(821) 0x444d5 VPERMPD $-0x56,%YMM2,%YMM10 |
(821) 0x444db VPERMILPD $0x1,%XMM2,%XMM12 |
(821) 0x444e1 VBROADCASTSD %XMM6,%ZMM7 |
(821) 0x444e7 VPERMILPD $0x1,%XMM13,%XMM13 |
(821) 0x444ed JMP 44540 |
0x444ef NOP |
(822) 0x444f0 MOV 0x68(%RSP),%RSI |
(822) 0x444f5 INC %R10 |
(822) 0x444f8 ADD %RSI,0x38(%RSP) |
(822) 0x444fd ADD %RSI,0x30(%RSP) |
(822) 0x44502 ADD %RSI,0x50(%RSP) |
(822) 0x44507 ADD %RSI,0x70(%RSP) |
(822) 0x4450c ADD %RSI,0x28(%RSP) |
(822) 0x44511 ADD %RSI,0x20(%RSP) |
(822) 0x44516 ADD %RSI,0x18(%RSP) |
(822) 0x4451b ADD %RSI,%RBX |
(822) 0x4451e ADD %RSI,%R11 |
(822) 0x44521 ADD %RSI,%RAX |
(822) 0x44524 ADD %RSI,%R14 |
(822) 0x44527 ADD %RSI,%RCX |
(822) 0x4452a ADD %RSI,%RDX |
(822) 0x4452d ADD %RSI,%RDI |
(822) 0x44530 ADD %RSI,%R8 |
(822) 0x44533 ADD %RSI,%R13 |
(822) 0x44536 CMP $0x4,%R10 |
(822) 0x4453a JE 43ff0 |
(822) 0x44540 TEST %R15D,%R15D |
(822) 0x44543 JE 444f0 |
(822) 0x44545 VMOVSD 0x120(%RSP,%R10,8),%XMM14 |
(822) 0x4454f MOV %RAX,0x48(%RSP) |
(822) 0x44554 MOV %R11,0x98(%RSP) |
(822) 0x4455c MOV %RCX,0x10(%RSP) |
(822) 0x44561 MOV %RBX,0x8(%RSP) |
(822) 0x44566 MOV %R14,0x90(%RSP) |
(822) 0x4456e VMULSD %XMM14,%XMM22,%XMM15 |
(822) 0x44574 CMP $0x4,%R15D |
(822) 0x44578 JAE 445a0 |
(822) 0x4457a MOV 0x38(%RSP),%R11 |
(822) 0x4457f MOV 0x30(%RSP),%R14 |
(822) 0x44584 MOV 0x70(%RSP),%RAX |
(822) 0x44589 MOV 0x50(%RSP),%RCX |
(822) 0x4458e XOR %R9D,%R9D |
(822) 0x44591 JMP 44680 |
0x44596 NOPW %CS:(%RAX,%RAX,1) |
(822) 0x445a0 CMP $0x8,%R15D |
(822) 0x445a4 JAE 445be |
(822) 0x445a6 MOV 0x38(%RSP),%R11 |
(822) 0x445ab MOV 0x30(%RSP),%R14 |
(822) 0x445b0 MOV 0x70(%RSP),%RAX |
(822) 0x445b5 MOV 0x50(%RSP),%RCX |
(822) 0x445ba XOR %ESI,%ESI |
(822) 0x445bc JMP 44629 |
(822) 0x445be MOV 0x38(%RSP),%R11 |
(822) 0x445c3 MOV 0x30(%RSP),%R14 |
(822) 0x445c8 MOV 0x70(%RSP),%RAX |
(822) 0x445cd MOV 0x50(%RSP),%RCX |
(822) 0x445d2 MOV (%RSP),%R9 |
(822) 0x445d6 VBROADCASTSD %XMM15,%ZMM16 |
(822) 0x445dc XOR %ESI,%ESI |
(822) 0x445de XCHG %AX,%AX |
(823) 0x445e0 VMULPD (%RAX,%RSI,8),%ZMM5,%ZMM17 |
(823) 0x445e7 VFMADD231PD (%RCX,%RSI,8),%ZMM4,%ZMM17 |
(823) 0x445ee VFMADD231PD (%R14,%RSI,8),%ZMM7,%ZMM17 |
(823) 0x445f5 VFMADD231PD (%R11,%RSI,8),%ZMM8,%ZMM17 |
(823) 0x445fc VFMADD213PD (%R12,%RSI,8),%ZMM16,%ZMM17 |
(823) 0x44603 VMOVUPD %ZMM17,(%R12,%RSI,8) |
(823) 0x4460a ADD $0x8,%RSI |
(823) 0x4460e CMP %RSI,%R9 |
(823) 0x44611 JNE 445e0 |
(822) 0x44613 CMP %R15,%R9 |
(822) 0x44616 JE 446d9 |
(822) 0x4461c MOV (%RSP),%R9 |
(822) 0x44620 MOV %R9,%RSI |
(822) 0x44623 TEST $0x4,%R15B |
(822) 0x44627 JE 44680 |
(822) 0x44629 MOV 0x40(%RSP),%R9 |
(822) 0x4462e VBROADCASTSD %XMM15,%YMM16 |
(822) 0x44634 NOPW %CS:(%RAX,%RAX,1) |
(834) 0x44640 VMULPD (%RAX,%RSI,8),%YMM5,%YMM17 |
(834) 0x44647 VFMADD231PD (%RCX,%RSI,8),%YMM9,%YMM17 |
(834) 0x4464e VFMADD231PD (%R14,%RSI,8),%YMM10,%YMM17 |
(834) 0x44655 VFMADD231PD (%R11,%RSI,8),%YMM11,%YMM17 |
(834) 0x4465c VFMADD213PD (%R12,%RSI,8),%YMM16,%YMM17 |
(834) 0x44663 VMOVUPD %YMM17,(%R12,%RSI,8) |
(834) 0x4466a ADD $0x4,%RSI |
(834) 0x4466e CMP %RSI,%R9 |
(834) 0x44671 JNE 44640 |
(822) 0x44673 MOV %R9,%RSI |
(822) 0x44676 CMP %R15,%R9 |
(822) 0x44679 JE 446d9 |
(822) 0x4467b NOPL (%RAX,%RAX,1) |
(833) 0x44680 VMOVSD (%R14,%R9,8),%XMM16 |
(833) 0x44687 VMOVSD (%RAX,%R9,8),%XMM17 |
(833) 0x4468e VMOVHPD (%R11,%R9,8),%XMM16,%XMM16 |
(833) 0x44695 VMOVHPD (%RCX,%R9,8),%XMM17,%XMM17 |
(833) 0x4469c VINSERTF32X4 $0x1,%XMM16,%YMM17,%YMM16 |
(833) 0x446a3 VMULPD %YMM16,%YMM3,%YMM16 |
(833) 0x446a9 VEXTRACTF32X4 $0x1,%YMM16,%XMM17 |
(833) 0x446b0 VADDPD %XMM17,%XMM16,%XMM16 |
(833) 0x446b6 VPERMILPD $0x1,%XMM16,%XMM17 |
(833) 0x446bd VADDSD %XMM17,%XMM16,%XMM16 |
(833) 0x446c3 VFMADD213SD (%R12,%R9,8),%XMM15,%XMM16 |
(833) 0x446ca VMOVSD %XMM16,(%R12,%R9,8) |
(833) 0x446d1 INC %R9 |
(833) 0x446d4 CMP %R9,%R15 |
(833) 0x446d7 JNE 44680 |
(822) 0x446d9 VMULSD %XMM14,%XMM23,%XMM15 |
(822) 0x446df CMP $0x4,%R15D |
(822) 0x446e3 JAE 44710 |
(822) 0x446e5 MOV 0x48(%RSP),%RAX |
(822) 0x446ea MOV 0x98(%RSP),%R11 |
(822) 0x446f2 MOV 0x10(%RSP),%RCX |
(822) 0x446f7 MOV 0x8(%RSP),%RBX |
(822) 0x446fc MOV 0x28(%RSP),%R14 |
(822) 0x44701 XOR %R9D,%R9D |
(822) 0x44704 JMP 447f0 |
0x44709 NOPL (%RAX) |
(822) 0x44710 MOV 0x48(%RSP),%RAX |
(822) 0x44715 MOV 0x98(%RSP),%R11 |
(822) 0x4471d MOV 0x10(%RSP),%RCX |
(822) 0x44722 MOV 0x8(%RSP),%RBX |
(822) 0x44727 CMP $0x8,%R15D |
(822) 0x4472b JAE 44736 |
(822) 0x4472d MOV 0x28(%RSP),%R14 |
(822) 0x44732 XOR %ESI,%ESI |
(822) 0x44734 JMP 44799 |
(822) 0x44736 MOV 0x28(%RSP),%R14 |
(822) 0x4473b MOV (%RSP),%R9 |
(822) 0x4473f VBROADCASTSD %XMM15,%ZMM16 |
(822) 0x44745 XOR %ESI,%ESI |
(822) 0x44747 NOPW (%RAX,%RAX,1) |
(824) 0x44750 VMULPD (%RAX,%RSI,8),%ZMM5,%ZMM17 |
(824) 0x44757 VFMADD231PD (%R11,%RSI,8),%ZMM4,%ZMM17 |
(824) 0x4475e VFMADD231PD (%R14,%RSI,8),%ZMM7,%ZMM17 |
(824) 0x44765 VFMADD231PD (%RBX,%RSI,8),%ZMM8,%ZMM17 |
(824) 0x4476c VFMADD213PD (%R12,%RSI,8),%ZMM16,%ZMM17 |
(824) 0x44773 VMOVUPD %ZMM17,(%R12,%RSI,8) |
(824) 0x4477a ADD $0x8,%RSI |
(824) 0x4477e CMP %RSI,%R9 |
(824) 0x44781 JNE 44750 |
(822) 0x44783 CMP %R15,%R9 |
(822) 0x44786 JE 44822 |
(822) 0x4478c MOV (%RSP),%R9 |
(822) 0x44790 MOV %R9,%RSI |
(822) 0x44793 TEST $0x4,%R15B |
(822) 0x44797 JE 447f0 |
(822) 0x44799 MOV 0x40(%RSP),%R9 |
(822) 0x4479e VBROADCASTSD %XMM15,%YMM16 |
(822) 0x447a4 NOPW %CS:(%RAX,%RAX,1) |
(832) 0x447b0 VMULPD (%RAX,%RSI,8),%YMM5,%YMM17 |
(832) 0x447b7 VFMADD231PD (%R11,%RSI,8),%YMM9,%YMM17 |
(832) 0x447be VFMADD231PD (%R14,%RSI,8),%YMM10,%YMM17 |
(832) 0x447c5 VFMADD231PD (%RBX,%RSI,8),%YMM11,%YMM17 |
(832) 0x447cc VFMADD213PD (%R12,%RSI,8),%YMM16,%YMM17 |
(832) 0x447d3 VMOVUPD %YMM17,(%R12,%RSI,8) |
(832) 0x447da ADD $0x4,%RSI |
(832) 0x447de CMP %RSI,%R9 |
(832) 0x447e1 JNE 447b0 |
(822) 0x447e3 MOV %R9,%RSI |
(822) 0x447e6 CMP %R15,%R9 |
(822) 0x447e9 JE 44822 |
(822) 0x447eb NOPL (%RAX,%RAX,1) |
(831) 0x447f0 VMULSD (%RAX,%R9,8),%XMM2,%XMM16 |
(831) 0x447f7 VFMADD231SD (%R11,%R9,8),%XMM12,%XMM16 |
(831) 0x447fe VFMADD231SD (%R14,%R9,8),%XMM6,%XMM16 |
(831) 0x44805 VFMADD231SD (%RBX,%R9,8),%XMM13,%XMM16 |
(831) 0x4480c VFMADD213SD (%R12,%R9,8),%XMM15,%XMM16 |
(831) 0x44813 VMOVSD %XMM16,(%R12,%R9,8) |
(831) 0x4481a INC %R9 |
(831) 0x4481d CMP %R9,%R15 |
(831) 0x44820 JNE 447f0 |
(822) 0x44822 VMULSD %XMM0,%XMM14,%XMM15 |
(822) 0x44826 MOV %R10,0x88(%RSP) |
(822) 0x4482e CMP $0x4,%R15D |
(822) 0x44832 JAE 44850 |
(822) 0x44834 MOV 0x90(%RSP),%R14 |
(822) 0x4483c MOV 0x20(%RSP),%R10 |
(822) 0x44841 MOV 0x18(%RSP),%RBX |
(822) 0x44846 XOR %R9D,%R9D |
(822) 0x44849 JMP 44930 |
0x4484e XCHG %AX,%AX |
(822) 0x44850 MOV 0x90(%RSP),%R14 |
(822) 0x44858 CMP $0x8,%R15D |
(822) 0x4485c JAE 4486c |
(822) 0x4485e MOV 0x20(%RSP),%R10 |
(822) 0x44863 MOV 0x18(%RSP),%RBX |
(822) 0x44868 XOR %ESI,%ESI |
(822) 0x4486a JMP 448d9 |
(822) 0x4486c MOV 0x20(%RSP),%R10 |
(822) 0x44871 MOV 0x18(%RSP),%RBX |
(822) 0x44876 MOV (%RSP),%R9 |
(822) 0x4487a VBROADCASTSD %XMM15,%ZMM16 |
(822) 0x44880 XOR %ESI,%ESI |
(822) 0x44882 NOPW %CS:(%RAX,%RAX,1) |
(825) 0x44890 VMULPD (%RCX,%RSI,8),%ZMM5,%ZMM17 |
(825) 0x44897 VFMADD231PD (%R14,%RSI,8),%ZMM4,%ZMM17 |
(825) 0x4489e VFMADD231PD (%RBX,%RSI,8),%ZMM7,%ZMM17 |
(825) 0x448a5 VFMADD231PD (%R10,%RSI,8),%ZMM8,%ZMM17 |
(825) 0x448ac VFMADD213PD (%R12,%RSI,8),%ZMM16,%ZMM17 |
(825) 0x448b3 VMOVUPD %ZMM17,(%R12,%RSI,8) |
(825) 0x448ba ADD $0x8,%RSI |
(825) 0x448be CMP %RSI,%R9 |
(825) 0x448c1 JNE 44890 |
(822) 0x448c3 CMP %R15,%R9 |
(822) 0x448c6 JE 44962 |
(822) 0x448cc MOV (%RSP),%R9 |
(822) 0x448d0 MOV %R9,%RSI |
(822) 0x448d3 TEST $0x4,%R15B |
(822) 0x448d7 JE 44930 |
(822) 0x448d9 MOV 0x40(%RSP),%R9 |
(822) 0x448de VBROADCASTSD %XMM15,%YMM16 |
(822) 0x448e4 NOPW %CS:(%RAX,%RAX,1) |
(830) 0x448f0 VMULPD (%RCX,%RSI,8),%YMM5,%YMM17 |
(830) 0x448f7 VFMADD231PD (%R14,%RSI,8),%YMM9,%YMM17 |
(830) 0x448fe VFMADD231PD (%RBX,%RSI,8),%YMM10,%YMM17 |
(830) 0x44905 VFMADD231PD (%R10,%RSI,8),%YMM11,%YMM17 |
(830) 0x4490c VFMADD213PD (%R12,%RSI,8),%YMM16,%YMM17 |
(830) 0x44913 VMOVUPD %YMM17,(%R12,%RSI,8) |
(830) 0x4491a ADD $0x4,%RSI |
(830) 0x4491e CMP %RSI,%R9 |
(830) 0x44921 JNE 448f0 |
(822) 0x44923 MOV %R9,%RSI |
(822) 0x44926 CMP %R15,%R9 |
(822) 0x44929 JE 44962 |
(822) 0x4492b NOPL (%RAX,%RAX,1) |
(829) 0x44930 VMULSD (%RCX,%R9,8),%XMM2,%XMM16 |
(829) 0x44937 VFMADD231SD (%R14,%R9,8),%XMM12,%XMM16 |
(829) 0x4493e VFMADD231SD (%RBX,%R9,8),%XMM6,%XMM16 |
(829) 0x44945 VFMADD231SD (%R10,%R9,8),%XMM13,%XMM16 |
(829) 0x4494c VFMADD213SD (%R12,%R9,8),%XMM15,%XMM16 |
(829) 0x44953 VMOVSD %XMM16,(%R12,%R9,8) |
(829) 0x4495a INC %R9 |
(829) 0x4495d CMP %R9,%R15 |
(829) 0x44960 JNE 44930 |
(822) 0x44962 MOV 0x8(%RSP),%RBX |
(822) 0x44967 VMULSD %XMM1,%XMM14,%XMM14 |
(822) 0x4496b CMP $0x4,%R15D |
(822) 0x4496f JAE 44990 |
(822) 0x44971 MOV 0x88(%RSP),%R10 |
(822) 0x44979 XOR %R9D,%R9D |
(822) 0x4497c JMP 44a50 |
0x44981 NOPW %CS:(%RAX,%RAX,1) |
(822) 0x44990 MOV 0x88(%RSP),%R10 |
(822) 0x44998 CMP $0x8,%R15D |
(822) 0x4499c JAE 449a2 |
(822) 0x4499e XOR %ESI,%ESI |
(822) 0x449a0 JMP 449fa |
(822) 0x449a2 MOV (%RSP),%R9 |
(822) 0x449a6 VBROADCASTSD %XMM14,%ZMM15 |
(822) 0x449ac XOR %ESI,%ESI |
(822) 0x449ae XCHG %AX,%AX |
(826) 0x449b0 VMULPD (%R13,%RSI,8),%ZMM5,%ZMM16 |
(826) 0x449b8 VFMADD231PD (%R8,%RSI,8),%ZMM4,%ZMM16 |
(826) 0x449bf VFMADD231PD (%RDI,%RSI,8),%ZMM7,%ZMM16 |
(826) 0x449c6 VFMADD231PD (%RDX,%RSI,8),%ZMM8,%ZMM16 |
(826) 0x449cd VFMADD213PD (%R12,%RSI,8),%ZMM15,%ZMM16 |
(826) 0x449d4 VMOVUPD %ZMM16,(%R12,%RSI,8) |
(826) 0x449db ADD $0x8,%RSI |
(826) 0x449df CMP %RSI,%R9 |
(826) 0x449e2 JNE 449b0 |
(822) 0x449e4 CMP %R15,%R9 |
(822) 0x449e7 JE 444f0 |
(822) 0x449ed MOV (%RSP),%R9 |
(822) 0x449f1 MOV %R9,%RSI |
(822) 0x449f4 TEST $0x4,%R15B |
(822) 0x449f8 JE 44a50 |
(822) 0x449fa MOV 0x40(%RSP),%R9 |
(822) 0x449ff VBROADCASTSD %XMM14,%YMM15 |
(822) 0x44a04 NOPW %CS:(%RAX,%RAX,1) |
(828) 0x44a10 VMULPD (%R13,%RSI,8),%YMM5,%YMM16 |
(828) 0x44a18 VFMADD231PD (%R8,%RSI,8),%YMM9,%YMM16 |
(828) 0x44a1f VFMADD231PD (%RDI,%RSI,8),%YMM10,%YMM16 |
(828) 0x44a26 VFMADD231PD (%RDX,%RSI,8),%YMM11,%YMM16 |
(828) 0x44a2d VFMADD213PD (%R12,%RSI,8),%YMM15,%YMM16 |
(828) 0x44a34 VMOVUPD %YMM16,(%R12,%RSI,8) |
(828) 0x44a3b ADD $0x4,%RSI |
(828) 0x44a3f CMP %RSI,%R9 |
(828) 0x44a42 JNE 44a10 |
(822) 0x44a44 MOV %R9,%RSI |
(822) 0x44a47 CMP %R15,%R9 |
(822) 0x44a4a JE 444f0 |
(827) 0x44a50 VMULSD (%R13,%R9,8),%XMM2,%XMM15 |
(827) 0x44a57 VFMADD231SD (%R8,%R9,8),%XMM12,%XMM15 |
(827) 0x44a5d VFMADD231SD (%RDI,%R9,8),%XMM6,%XMM15 |
(827) 0x44a63 VFMADD231SD (%RDX,%R9,8),%XMM13,%XMM15 |
(827) 0x44a69 VFMADD213SD (%R12,%R9,8),%XMM14,%XMM15 |
(827) 0x44a6f VMOVSD %XMM15,(%R12,%R9,8) |
(827) 0x44a75 INC %R9 |
(827) 0x44a78 CMP %R9,%R15 |
(827) 0x44a7b JNE 44a50 |
(822) 0x44a7d JMP 444f0 |
0x44a82 MOV 0xa8(%RSP),%RDI |
0x44a8a VZEROUPPER |
0x44a8d CALL 4ec00 <@plt_start@+0x260> |
0x44a92 MOV 0x30(%R13),%EAX |
0x44a96 MOV 0xa0(%RSP),%R15 |
0x44a9e TEST %EAX,%EAX |
0x44aa0 JLE 44b01 |
0x44aa2 XOR %EBX,%EBX |
0x44aa4 XOR %R14D,%R14D |
0x44aa7 JMP 44abc |
0x44aa9 NOPL (%RAX) |
(820) 0x44ab0 MOVSXD %EAX,%RCX |
(820) 0x44ab3 ADD $0x18,%RBX |
(820) 0x44ab7 CMP %RCX,%R14 |
(820) 0x44aba JGE 44b01 |
(820) 0x44abc MOV 0x40(%R13),%ECX |
(820) 0x44ac0 MOV 0x8(%R13),%ESI |
(820) 0x44ac4 MOV %R14D,%EDX |
(820) 0x44ac7 INC %R14 |
(820) 0x44aca IMUL %EAX,%EDX |
(820) 0x44acd IMUL %R14D,%ECX |
(820) 0x44ad1 CMP %ECX,%ESI |
(820) 0x44ad3 CMOVL %ESI,%ECX |
(820) 0x44ad6 SUB %EDX,%ECX |
(820) 0x44ad8 JLE 44ab0 |
(820) 0x44ada MOV 0x310(%R13),%RAX |
(820) 0x44ae1 MOVSXD %EDX,%RDI |
(820) 0x44ae4 MOV %ECX,%EDX |
(820) 0x44ae6 SAL $0x3,%RDX |
(820) 0x44aea SAL $0x3,%RDI |
(820) 0x44aee ADD 0x18(%R15),%RDI |
(820) 0x44af2 MOV (%RAX,%RBX,1),%RSI |
(820) 0x44af6 CALL 4f010 <@plt_start@+0x670> |
(820) 0x44afb MOV 0x30(%R13),%EAX |
(820) 0x44aff JMP 44ab0 |
0x44b01 LEA -0x28(%RBP),%RSP |
0x44b05 POP %RBX |
0x44b06 POP %R12 |
0x44b08 POP %R13 |
0x44b0a POP %R14 |
0x44b0c POP %R15 |
0x44b0e POP %RBP |
0x44b0f RET |
0x44b10 MOV %RAX,%RDI |
0x44b13 CALL 11a70 <__clang_call_terminate> |
0x44b18 INT $0x3 |
0x44b19 INT $0x3 |
0x44b1a INT $0x3 |
0x44b1b INT $0x3 |
0x44b1c INT $0x3 |
0x44b1d INT $0x3 |
0x44b1e INT $0x3 |
0x44b1f INT $0x3 |
Path / |
Source file and lines | einspline_spo_ref.hpp:172-189 |
Module | libqmcwfs.so |
nb instructions | 111 |
nb uops | 100 |
loop length | 590 |
used x86 registers | 12 |
used mmx registers | 0 |
used xmm registers | 10 |
used ymm registers | 1 |
used zmm registers | 2 |
nb stack references | 11 |
ADD-SUB / MUL ratio | 1.50 |
micro-operation queue | 16.67 cycles |
front end | 16.67 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 4.50 | 4.00 | 3.75 | 3.75 | 4.00 | 12.67 | 12.67 | 12.67 | 6.25 | 6.42 | 6.17 | 6.17 | 4.50 | 4.50 |
cycles | 4.50 | 4.00 | 3.75 | 3.75 | 4.00 | 12.67 | 12.67 | 12.67 | 6.25 | 6.42 | 6.17 | 6.17 | 4.50 | 4.50 |
Cycles executing div or sqrt instructions | NA |
Front-end | 16.67 |
Dispatch | 12.67 |
Overall L1 | 16.67 |
all | 18% |
load | 0% |
store | 25% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 16% |
all | 57% |
load | 44% |
store | 100% |
mul | 100% |
add-sub | 33% |
fma | 66% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 52% |
all | 49% |
load | 38% |
store | 70% |
mul | 100% |
add-sub | 33% |
fma | 66% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 44% |
all | 14% |
load | 8% |
store | 21% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 9% |
all | 23% |
load | 18% |
store | 50% |
mul | 25% |
add-sub | 16% |
fma | 20% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 19% |
all | 21% |
load | 16% |
store | 38% |
mul | 25% |
add-sub | 16% |
fma | 20% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 16% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
AND $-0x40,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB $0x200,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x358(%RDI),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %EDX,%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CALL 4ebf0 <@plt_start@+0x250> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVSXD %R12D,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x128(%R13),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA (%RCX,%RCX,2),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SAL $0x3,%RAX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD 0x40(%R13),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
CMP %ECX,0x124(%R13) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV %RBX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMOVE %RDX,%RAX | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMPL $0,0x30(%RBX) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
JLE 44a82 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0xc52> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
VMOVUPD 0x100(%R13),%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVUPD 0x8(%RAX),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVSD (%RAX),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVSD -0x3bbdf(%RIP),%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVSD -0x3bb41(%RIP),%XMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVAPD -0x3bc3b(%RIP),%XMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVSD -0x3bbd5(%RIP),%XMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVHPD 0x118(%R13),%XMM2,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
VMULPD %XMM1,%XMM2,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPERMILPD $0x1,%XMM2,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
VFMADD231SD 0xe8(%R13),%XMM0,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDSD %XMM3,%XMM2,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VROUNDSD $0x9,%XMM2,%XMM2,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VSUBSD %XMM3,%XMM2,%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VXORPD %XMM3,%XMM3,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VCMPSD $0x1,%XMM3,%XMM2,%K1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVAPD %XMM5,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD %XMM3,%XMM4,%XMM4{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
VCMPSD $0xe,-0x3bc19(%RIP),%XMM2,%K1 | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVDDUP %XMM1,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
VPERMILPD $0x3,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
VBROADCASTF128 -0x3bc9c(%RIP),%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVDQA %YMM3,0x100(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VMOVSD %XMM4,%XMM5,%XMM5{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
VMOVDDUP %XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
VMULPD 0xd8(%R13),%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVDDUP -0x3bbe0(%RIP),%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVAPD %XMM5,0xf0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VFMADD231PD 0xf0(%R13),%XMM2,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD -0x3bbec(%RIP),%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 5 | 1 |
VMOVAPD %XMM4,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VMOVAPD %ZMM2,0x180(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 1 | 1 | 5 | 2 |
VFMADD132PD 0x108(%R13),%XMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VCMPPD $0x1,%XMM0,%XMM1,%K1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VCMPPD $0xe,-0x3bc9c(%RIP){1to0},%XMM1,%K0{%K1} | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VROUNDPD $0x9,%XMM1,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
KNOTW %K0,%K1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VSUBPD %XMM0,%XMM1,%XMM0{%K1}{z} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VBROADCASTSD -0x3bc2e(%RIP),%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 5 | 1 |
VMOVAPD %XMM0,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VPERMILPD $0x1,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
VMOVAPD %XMM0,0xd0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VMOVAPD %ZMM1,0x140(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 1 | 1 | 5 | 2 |
JMP 44010 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x1e0> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOV 0xa8(%RSP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4ec00 <@plt_start@+0x260> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x30(%R13),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0xa0(%RSP),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
TEST %EAX,%EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 44b01 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0xcd1> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %R14D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
JMP 44abc <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0xc8c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
LEA -0x28(%RBP),%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 11a70 <__clang_call_terminate> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 |
Source file and lines | einspline_spo_ref.hpp:172-189 |
Module | libqmcwfs.so |
nb instructions | 111 |
nb uops | 100 |
loop length | 590 |
used x86 registers | 12 |
used mmx registers | 0 |
used xmm registers | 10 |
used ymm registers | 1 |
used zmm registers | 2 |
nb stack references | 11 |
ADD-SUB / MUL ratio | 1.50 |
micro-operation queue | 16.67 cycles |
front end | 16.67 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 4.50 | 4.00 | 3.75 | 3.75 | 4.00 | 12.67 | 12.67 | 12.67 | 6.25 | 6.42 | 6.17 | 6.17 | 4.50 | 4.50 |
cycles | 4.50 | 4.00 | 3.75 | 3.75 | 4.00 | 12.67 | 12.67 | 12.67 | 6.25 | 6.42 | 6.17 | 6.17 | 4.50 | 4.50 |
Cycles executing div or sqrt instructions | NA |
Front-end | 16.67 |
Dispatch | 12.67 |
Overall L1 | 16.67 |
all | 18% |
load | 0% |
store | 25% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 16% |
all | 57% |
load | 44% |
store | 100% |
mul | 100% |
add-sub | 33% |
fma | 66% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 52% |
all | 49% |
load | 38% |
store | 70% |
mul | 100% |
add-sub | 33% |
fma | 66% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 44% |
all | 14% |
load | 8% |
store | 21% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 9% |
all | 23% |
load | 18% |
store | 50% |
mul | 25% |
add-sub | 16% |
fma | 20% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 19% |
all | 21% |
load | 16% |
store | 38% |
mul | 25% |
add-sub | 16% |
fma | 20% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 16% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
AND $-0x40,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB $0x200,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x358(%RDI),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %EDX,%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CALL 4ebf0 <@plt_start@+0x250> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVSXD %R12D,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x128(%R13),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA (%RCX,%RCX,2),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SAL $0x3,%RAX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD 0x40(%R13),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
CMP %ECX,0x124(%R13) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV %RBX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMOVE %RDX,%RAX | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMPL $0,0x30(%RBX) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
JLE 44a82 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0xc52> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
VMOVUPD 0x100(%R13),%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVUPD 0x8(%RAX),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVSD (%RAX),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVSD -0x3bbdf(%RIP),%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVSD -0x3bb41(%RIP),%XMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVAPD -0x3bc3b(%RIP),%XMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVSD -0x3bbd5(%RIP),%XMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVHPD 0x118(%R13),%XMM2,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
VMULPD %XMM1,%XMM2,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPERMILPD $0x1,%XMM2,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
VFMADD231SD 0xe8(%R13),%XMM0,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDSD %XMM3,%XMM2,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VROUNDSD $0x9,%XMM2,%XMM2,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VSUBSD %XMM3,%XMM2,%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VXORPD %XMM3,%XMM3,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VCMPSD $0x1,%XMM3,%XMM2,%K1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVAPD %XMM5,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD %XMM3,%XMM4,%XMM4{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
VCMPSD $0xe,-0x3bc19(%RIP),%XMM2,%K1 | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVDDUP %XMM1,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
VPERMILPD $0x3,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
VBROADCASTF128 -0x3bc9c(%RIP),%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVDQA %YMM3,0x100(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VMOVSD %XMM4,%XMM5,%XMM5{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
VMOVDDUP %XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
VMULPD 0xd8(%R13),%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVDDUP -0x3bbe0(%RIP),%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVAPD %XMM5,0xf0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VFMADD231PD 0xf0(%R13),%XMM2,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD -0x3bbec(%RIP),%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 5 | 1 |
VMOVAPD %XMM4,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VMOVAPD %ZMM2,0x180(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 1 | 1 | 5 | 2 |
VFMADD132PD 0x108(%R13),%XMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VCMPPD $0x1,%XMM0,%XMM1,%K1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VCMPPD $0xe,-0x3bc9c(%RIP){1to0},%XMM1,%K0{%K1} | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VROUNDPD $0x9,%XMM1,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
KNOTW %K0,%K1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VSUBPD %XMM0,%XMM1,%XMM0{%K1}{z} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VBROADCASTSD -0x3bc2e(%RIP),%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 5 | 1 |
VMOVAPD %XMM0,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VPERMILPD $0x1,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
VMOVAPD %XMM0,0xd0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VMOVAPD %ZMM1,0x140(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 1 | 1 | 5 | 2 |
JMP 44010 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x1e0> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOV 0xa8(%RSP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4ec00 <@plt_start@+0x260> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x30(%R13),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0xa0(%RSP),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
TEST %EAX,%EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 44b01 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0xcd1> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %R14D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
JMP 44abc <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0xc8c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
LEA -0x28(%RBP),%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 11a70 <__clang_call_terminate> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
INT $0x3 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE– | 28.96 | 59.19 |
▼Loop 821 - MultiBsplineRef.hpp:42-71 - libqmcwfs.so– | 0.02 | 0.05 |
▼Loop 822 - MultiBsplineRef.hpp:63-71 - libqmcwfs.so– | 0.04 | 0.08 |
○Loop 826 - MultiBsplineRef.hpp:68-70 - libqmcwfs.so | 7.23 | 13.54 |
○Loop 825 - MultiBsplineRef.hpp:68-70 - libqmcwfs.so | 7.21 | 13.5 |
○Loop 823 - MultiBsplineRef.hpp:68-70 - libqmcwfs.so | 7.21 | 13.52 |
○Loop 824 - MultiBsplineRef.hpp:68-70 - libqmcwfs.so | 7.18 | 13.46 |
○Loop 834 - MultiBsplineRef.hpp:68-70 - libqmcwfs.so | 0 | 0 |
○Loop 829 - MultiBsplineRef.hpp:68-70 - libqmcwfs.so | 0 | 0 |
○Loop 832 - MultiBsplineRef.hpp:68-70 - libqmcwfs.so | 0 | 0 |
○Loop 831 - MultiBsplineRef.hpp:68-70 - libqmcwfs.so | 0 | 0 |
○Loop 830 - MultiBsplineRef.hpp:68-70 - libqmcwfs.so | 0 | 0 |
○Loop 833 - MultiBsplineRef.hpp:68-71 - libqmcwfs.so | 0 | 0 |
○Loop 828 - MultiBsplineRef.hpp:68-70 - libqmcwfs.so | 0 | 0 |
○Loop 827 - MultiBsplineRef.hpp:68-70 - libqmcwfs.so | 0 | 0 |
○Loop 820 - einspline_spo_ref.hpp:183-187 - libqmcwfs.so | 0.01 | 0.01 |