Function: _ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6 ... | Module: exec | Source: einspline_spo_ref.hpp:172-189 [...] | Coverage: 27.9% |
---|
Function: _ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6 ... | Module: exec | Source: einspline_spo_ref.hpp:172-189 [...] | Coverage: 27.9% |
---|
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/Utilities/NewTimer.h: 242 - 249 |
-------------------------------------------------------------------------------- |
242: ScopeGuard(TIMER& t) : timer(t) { timer.start(); } |
[...] |
249: ~ScopeGuard() { timer.stop(); } |
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/Particle/ParticleSet.h: 143 - 143 |
-------------------------------------------------------------------------------- |
143: return (active_ptcl_ == iat) ? active_pos_ : R[iat]; |
/cluster/comp/gcc/13.2.0/include/c++/13.2.0/bits/stl_algo.h: 731 - 757 |
-------------------------------------------------------------------------------- |
731: { return std::copy(__first, __first + __n, __result); } |
[...] |
757: if (__n2 <= 0) |
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/OhmmsVector.h: 229 - 229 |
-------------------------------------------------------------------------------- |
229: return X[i]; |
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/Numerics/Spline2/MultiBsplineEvalHelper.hpp: 53 - 63 |
-------------------------------------------------------------------------------- |
53: if (x < 0) |
[...] |
60: ind = static_cast<int>(x); |
61: dx = x - ind; |
62: // upper bound |
63: if (ind > nmax) |
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/Numerics/Spline2/MultiBsplineData.hpp: 54 - 57 |
-------------------------------------------------------------------------------- |
54: a[0] = ((A00 * tx + A01) * tx + A02) * tx + A03; |
55: a[1] = ((A10 * tx + A11) * tx + A12) * tx + A13; |
56: a[2] = ((A20 * tx + A21) * tx + A22) * tx + A23; |
57: a[3] = ((A30 * tx + A31) * tx + A32) * tx + A33; |
/cluster/comp/gcc/13.2.0/include/c++/13.2.0/bits/stl_vector.h: 1258 - 1258 |
-------------------------------------------------------------------------------- |
1258: { return _M_data_ptr(this->_M_impl._M_start); } |
/cluster/comp/gcc/13.2.0/include/c++/13.2.0/bits/stl_algobase.h: 238 - 931 |
-------------------------------------------------------------------------------- |
238: if (__b < __a) |
[...] |
398: { *__to = *__from; } |
[...] |
436: if (__builtin_expect(_Num > 1, true)) |
437: __builtin_memmove(__result, __first, sizeof(_Tp) * _Num); |
[...] |
930: for (; __first != __last; ++__first) |
931: *__first = __tmp; |
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/TinyVectorTensorOps.h: 150 - 152 |
-------------------------------------------------------------------------------- |
150: return TinyVector<Type_t, 3>(lhs[0] * rhs[0] + lhs[1] * rhs[3] + lhs[2] * rhs[6], |
151: lhs[0] * rhs[1] + lhs[1] * rhs[4] + lhs[2] * rhs[7], |
152: lhs[0] * rhs[2] + lhs[1] * rhs[5] + lhs[2] * rhs[8]); |
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/einspline_spo_ref.hpp: 172 - 189 |
-------------------------------------------------------------------------------- |
172: ScopedTimer local_timer(timer); |
173: |
174: auto u = Lattice.toUnit_floor(P.activeR(iat)); |
175: for (int i = 0; i < nBlocks; ++i) |
176: MultiBsplineEvalRef::evaluate_v(einsplines[i], u[0], u[1], u[2], psi[i].data(), nSplinesPerBlock); |
177: } |
178: |
179: inline void evaluate(const ParticleSet& P, int iat, ValueVector_t& psi_v) |
180: { |
181: evaluate_v(P, iat); |
182: |
183: for (int i = 0; i < nBlocks; ++i) |
184: { |
185: // in real simulation, phase needs to be applied. Here just fake computation |
186: const int first = i * nBlocks; |
187: std::copy_n(psi[i].data(), std::min((i + 1) * nSplinesPerBlock, OrbitalSetSize) - first, psi_v.data() + first); |
188: } |
189: } |
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/Particle/Lattice/CrystalLattice.h: 170 - 173 |
-------------------------------------------------------------------------------- |
170: if (-std::numeric_limits<T1>::epsilon() < val_dot[i] && val_dot[i] < 0) |
171: val_dot[i] = T1(0.0); |
172: else |
173: val_dot[i] -= std::floor(val_dot[i]); |
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/Numerics/Spline2/MultiBsplineRef.hpp: 42 - 71 |
-------------------------------------------------------------------------------- |
42: x -= spline_m->x_grid.start; |
43: y -= spline_m->y_grid.start; |
44: z -= spline_m->z_grid.start; |
45: T tx, ty, tz; |
46: int ix, iy, iz; |
47: spline2::getSplineBound(x * spline_m->x_grid.delta_inv, tx, ix, spline_m->x_grid.num - 1); |
48: spline2::getSplineBound(y * spline_m->y_grid.delta_inv, ty, iy, spline_m->y_grid.num - 1); |
49: spline2::getSplineBound(z * spline_m->z_grid.delta_inv, tz, iz, spline_m->z_grid.num - 1); |
[...] |
56: const intptr_t xs = spline_m->x_stride; |
57: const intptr_t ys = spline_m->y_stride; |
58: const intptr_t zs = spline_m->z_stride; |
59: |
60: constexpr T zero(0); |
61: std::fill(vals, vals + num_splines, zero); |
62: |
63: for (size_t i = 0; i < 4; i++) |
64: for (size_t j = 0; j < 4; j++) |
65: { |
66: const T pre00 = a[i] * b[j]; |
67: const T* restrict coefs = spline_m->coefs + (ix + i) * xs + (iy + j) * ys + iz * zs; |
68: for (size_t n = 0; n < num_splines; n++) |
69: vals[n] += pre00 * |
70: (c[0] * coefs[n] + c[1] * coefs[n + zs] + c[2] * coefs[n + 2 * zs] + |
71: c[3] * coefs[n + 3 * zs]); |
0x4773c0 PUSH %RBP |
0x4773c1 MOV %RSP,%RBP |
0x4773c4 PUSH %R15 |
0x4773c6 PUSH %R14 |
0x4773c8 PUSH %R13 |
0x4773ca PUSH %R12 |
0x4773cc PUSH %RBX |
0x4773cd MOV %RSI,%R12 |
0x4773d0 MOV %RDI,%RBX |
0x4773d3 AND $-0x40,%RSP |
0x4773d7 MOV %RCX,%R13 |
0x4773da MOVSXD %EDX,%R15 |
0x4773dd SUB $0x140,%RSP |
0x4773e4 MOV 0x358(%RDI),%R14 |
0x4773eb MOV %R14,%RDI |
0x4773ee CALL 51ed20 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE5startEv> |
0x4773f3 LEA 0x128(%R12),%RCX |
0x4773fb CMP 0x124(%R12),%R15D |
0x477403 JE 477412 |
0x477405 MOV 0x40(%R12),%RAX |
0x47740a LEA (%R15,%R15,2),%RDX |
0x47740e LEA (%RAX,%RDX,8),%RCX |
0x477412 VMOVUPD (%RCX),%XMM2 |
0x477416 VMOVSD 0x10(%RCX),%XMM4 |
0x47741b VXORPD %XMM5,%XMM5,%XMM5 |
0x47741f VMOVSD %XMM2,%XMM2,%XMM0 |
0x477423 VUNPCKHPD %XMM2,%XMM2,%XMM1 |
0x477427 VMULSD 0x100(%RBX),%XMM1,%XMM3 |
0x47742f VFMADD132SD 0xe8(%RBX),%XMM3,%XMM0 |
0x477438 VFMADD231SD 0x118(%RBX),%XMM4,%XMM0 |
0x477441 VCOMISD %XMM0,%XMM5 |
0x477445 JBE 477455 |
0x477447 VCOMISD 0x12d691(%RIP),%XMM0 |
0x47744f JA 477f15 |
0x477455 VRNDSCALESD $0x9,%XMM0,%XMM0,%XMM6 |
0x47745c VSUBSD %XMM6,%XMM0,%XMM7 |
0x477460 MOVSXD 0x30(%RBX),%RSI |
0x477464 TEST %ESI,%ESI |
0x477466 JLE 477ddc |
0x47746c VPERMILPD $0,%XMM2,%XMM10 |
0x477472 VMULPD 0xd8(%RBX),%XMM10,%XMM11 |
0x47747a VPERMILPD $0x3,%XMM2,%XMM9 |
0x477480 VMOVDDUP %XMM4,%XMM8 |
0x477484 VFMADD231PD 0xf0(%RBX),%XMM9,%XMM11 |
0x47748d VMOVDDUP 0x12d64b(%RIP),%XMM13 |
0x477495 VFMADD132PD 0x108(%RBX),%XMM11,%XMM8 |
0x47749e VCMPPD $0xe,%XMM13,%XMM8,%K1 |
0x4774a5 MOVSXD 0x40(%RBX),%RDI |
0x4774a9 VXORPD %XMM14,%XMM14,%XMM14 |
0x4774ae MOV 0x2f8(%RBX),%R9 |
0x4774b5 MOV 0x310(%RBX),%R11 |
0x4774bc MOV %R14,0x40(%RSP) |
0x4774c1 VMOVSD %XMM7,0x48(%RSP) |
0x4774c7 MOV %RBX,0x38(%RSP) |
0x4774cc MOV %R13,0x30(%RSP) |
0x4774d1 VRNDSCALEPD $0x9,%XMM8,%XMM12 |
0x4774d8 VCMPPD $0x1,%XMM14,%XMM8,%K0{%K1} |
0x4774df MOV %EDI,0x6c(%RSP) |
0x4774e3 MOV %RDI,0xd0(%RSP) |
0x4774eb MOV %R11,0x70(%RSP) |
0x4774f0 MOV %R9,0x80(%RSP) |
0x4774f8 KNOTB %K0,%K2 |
0x4774fc MOV %RDI,%R15 |
0x4774ff VSUBPD %XMM12,%XMM8,%XMM15{%K2}{z} |
0x477505 LEA (,%RDI,8),%R8 |
0x47750d LEA -0x1(%RDI),%R12 |
0x477511 SHR $0x3,%R15 |
0x477515 MOV %R8,0x78(%RSP) |
0x47751a MOV %R12,0xb0(%RSP) |
0x477522 SAL $0x6,%R15 |
0x477526 VMOVHPD %XMM15,0x50(%RSP) |
0x47752c LEA (%R9,%RSI,8),%R10 |
0x477530 AND $-0x8,%RDI |
0x477534 VMOVLPD %XMM15,0x58(%RSP) |
0x47753a MOV %R15,0xf0(%RSP) |
0x477542 MOV %R10,0x60(%RSP) |
0x477547 MOV %RDI,0x88(%RSP) |
(827) 0x47754f MOV 0x80(%RSP),%R13 |
(827) 0x477557 MOV 0x70(%RSP),%RBX |
(827) 0x47755c VMOVSD 0x50(%RSP),%XMM2 |
(827) 0x477562 VMOVSD 0x48(%RSP),%XMM0 |
(827) 0x477568 VMOVSD 0x58(%RSP),%XMM3 |
(827) 0x47756e VXORPD %XMM6,%XMM6,%XMM6 |
(827) 0x477572 MOV (%R13),%R14 |
(827) 0x477576 MOV (%RBX),%R15 |
(827) 0x477579 VSUBSD 0x28(%R14),%XMM3,%XMM4 |
(827) 0x47757f MOV 0x38(%R14),%EAX |
(827) 0x477583 VMULSD 0x48(%R14),%XMM4,%XMM5 |
(827) 0x477589 VSUBSD 0x50(%R14),%XMM2,%XMM1 |
(827) 0x47758f VSUBSD 0x78(%R14),%XMM0,%XMM7 |
(827) 0x477595 VCOMISD %XMM5,%XMM6 |
(827) 0x477599 JA 477e98 |
(827) 0x47759f DEC %EAX |
(827) 0x4775a1 VCVTTSD2SI %XMM5,%EDX |
(827) 0x4775a5 CMP %EDX,%EAX |
(827) 0x4775a7 JL 477efe |
(827) 0x4775ad VMOVSD 0x12d4bb(%RIP),%XMM14 |
(827) 0x4775b5 VRNDSCALESD $0xb,%XMM5,%XMM5,%XMM8 |
(827) 0x4775bc VSUBSD %XMM8,%XMM5,%XMM11 |
(827) 0x4775c1 VMOVSD %XMM11,%XMM11,%XMM9 |
(827) 0x4775c6 VFNMADD132SD %XMM14,%XMM14,%XMM9 |
(827) 0x4775cb VMOVSD 0x12d42d(%RIP),%XMM12 |
(827) 0x4775d3 VMOVSD %XMM11,%XMM11,%XMM0 |
(827) 0x4775d7 VMULSD %XMM12,%XMM11,%XMM13 |
(827) 0x4775dc VFMADD213SD 0x12d503(%RIP),%XMM14,%XMM0 |
(827) 0x4775e5 VSUBSD %XMM13,%XMM14,%XMM15 |
(827) 0x4775ea VMULSD %XMM11,%XMM11,%XMM10 |
(827) 0x4775ef VFMADD213SD 0x12d468(%RIP),%XMM11,%XMM15 |
(827) 0x4775f8 VFMADD132SD %XMM11,%XMM12,%XMM15 |
(827) 0x4775fd VFMADD213SD 0x12d402(%RIP),%XMM10,%XMM0 |
(827) 0x477606 VMULSD %XMM10,%XMM13,%XMM2 |
(827) 0x47760b MOVSXD %EDX,%RCX |
(827) 0x47760e MOV %RCX,0xf8(%RSP) |
(827) 0x477616 VFMADD231SD %XMM9,%XMM11,%XMM14 |
(827) 0x47761b VUNPCKLPD %XMM0,%XMM15,%XMM4 |
(827) 0x47761f VFMADD132SD %XMM14,%XMM12,%XMM11 |
(827) 0x477624 VUNPCKLPD %XMM2,%XMM11,%XMM3 |
(827) 0x477628 VINSERTF128 $0x1,%XMM3,%YMM4,%YMM11 |
(827) 0x47762e VMULSD 0x70(%R14),%XMM1,%XMM1 |
(827) 0x477634 VXORPD %XMM5,%XMM5,%XMM5 |
(827) 0x477638 MOV 0x60(%R14),%ESI |
(827) 0x47763c VCOMISD %XMM1,%XMM5 |
(827) 0x477640 JA 477eb1 |
(827) 0x477646 DEC %ESI |
(827) 0x477648 VCVTTSD2SI %XMM1,%EDI |
(827) 0x47764c CMP %EDI,%ESI |
(827) 0x47764e JL 477ec0 |
(827) 0x477654 VMOVSD 0x12d414(%RIP),%XMM14 |
(827) 0x47765c VRNDSCALESD $0xb,%XMM1,%XMM1,%XMM6 |
(827) 0x477663 VSUBSD %XMM6,%XMM1,%XMM12 |
(827) 0x477667 VMOVSD %XMM12,%XMM12,%XMM9 |
(827) 0x47766c VFNMADD132SD %XMM14,%XMM14,%XMM9 |
(827) 0x477671 VMOVSD 0x12d387(%RIP),%XMM8 |
(827) 0x477679 VMOVSD %XMM12,%XMM12,%XMM0 |
(827) 0x47767d VMULSD %XMM8,%XMM12,%XMM13 |
(827) 0x477682 VFMADD213SD 0x12d45d(%RIP),%XMM14,%XMM0 |
(827) 0x47768b VSUBSD %XMM13,%XMM14,%XMM15 |
(827) 0x477690 VMULSD %XMM12,%XMM12,%XMM10 |
(827) 0x477695 VFMADD213SD 0x12d3c2(%RIP),%XMM12,%XMM15 |
(827) 0x47769e VFMADD132SD %XMM12,%XMM8,%XMM15 |
(827) 0x4776a3 VFMADD213SD 0x12d35c(%RIP),%XMM10,%XMM0 |
(827) 0x4776ac VMULSD %XMM10,%XMM13,%XMM2 |
(827) 0x4776b1 MOVSXD %EDI,%RCX |
(827) 0x4776b4 VFMADD231SD %XMM9,%XMM12,%XMM14 |
(827) 0x4776b9 VUNPCKLPD %XMM0,%XMM15,%XMM4 |
(827) 0x4776bd VFMADD132SD %XMM14,%XMM8,%XMM12 |
(827) 0x4776c2 VUNPCKLPD %XMM2,%XMM12,%XMM3 |
(827) 0x4776c6 VINSERTF128 $0x1,%XMM3,%YMM4,%YMM1 |
(827) 0x4776cc VMULSD 0x98(%R14),%XMM7,%XMM7 |
(827) 0x4776d5 VXORPD %XMM5,%XMM5,%XMM5 |
(827) 0x4776d9 MOV 0x88(%R14),%R8D |
(827) 0x4776e0 VCOMISD %XMM7,%XMM5 |
(827) 0x4776e4 JA 477e6f |
(827) 0x4776ea DEC %R8D |
(827) 0x4776ed VCVTTSD2SI %XMM7,%R11D |
(827) 0x4776f1 CMP %R11D,%R8D |
(827) 0x4776f4 JL 477ed0 |
(827) 0x4776fa VMOVSD 0x12d36e(%RIP),%XMM10 |
(827) 0x477702 VRNDSCALESD $0xb,%XMM7,%XMM7,%XMM6 |
(827) 0x477709 VSUBSD %XMM6,%XMM7,%XMM13 |
(827) 0x47770d VMOVSD %XMM13,%XMM13,%XMM15 |
(827) 0x477712 VFNMADD132SD %XMM10,%XMM10,%XMM15 |
(827) 0x477717 VMULSD 0x12d3d1(%RIP),%XMM13,%XMM12 |
(827) 0x47771f VMOVSD %XMM13,%XMM13,%XMM18 |
(827) 0x477725 VADDSD %XMM10,%XMM12,%XMM17 |
(827) 0x47772b VFMADD213SD 0x12d3b3(%RIP),%XMM10,%XMM18 |
(827) 0x477735 VXORPD 0x12b983(%RIP),%XMM12,%XMM0 |
(827) 0x47773d VMULSD %XMM13,%XMM13,%XMM14 |
(827) 0x477742 VFMADD213SD 0x12d314(%RIP),%XMM13,%XMM17 |
(827) 0x47774c VMOVSD 0x12d2ac(%RIP),%XMM8 |
(827) 0x477754 VFMADD132SD %XMM13,%XMM8,%XMM17 |
(827) 0x47775a MOVSXD %R11D,%R13 |
(827) 0x47775d VFMADD213SD 0x12d2a1(%RIP),%XMM14,%XMM18 |
(827) 0x477767 VFMADD231SD %XMM15,%XMM13,%XMM10 |
(827) 0x47776c VMULSD %XMM14,%XMM0,%XMM16 |
(827) 0x477772 VFMADD132SD %XMM10,%XMM8,%XMM13 |
(827) 0x477777 MOV 0x10(%R14),%R12 |
(827) 0x47777b CMPQ $0,0x78(%RSP) |
(827) 0x477781 MOV 0x18(%R14),%R11 |
(827) 0x477785 VMOVAPD %YMM11,0x100(%RSP) |
(827) 0x47778e MOV 0x20(%R14),%RBX |
(827) 0x477792 VMOVAPD %YMM1,0x120(%RSP) |
(827) 0x47779b MOV %R12,0xc8(%RSP) |
(827) 0x4777a3 JE 477819 |
(827) 0x4777a5 MOV 0x78(%RSP),%RDX |
(827) 0x4777aa XOR %ESI,%ESI |
(827) 0x4777ac MOV %R15,%RDI |
(827) 0x4777af VMOVSD %XMM16,0xa8(%RSP) |
(827) 0x4777b7 VMOVSD %XMM13,0xb8(%RSP) |
(827) 0x4777c0 VMOVSD %XMM18,0xc0(%RSP) |
(827) 0x4777c8 VMOVSD %XMM17,0xd8(%RSP) |
(827) 0x4777d0 MOV %RCX,0xe0(%RSP) |
(827) 0x4777d8 MOV %R11,0xe8(%RSP) |
(827) 0x4777e0 VZEROUPPER |
(827) 0x4777e3 CALL 404140 <memset@plt> |
(827) 0x4777e8 MOV 0xe8(%RSP),%R11 |
(827) 0x4777f0 MOV 0xe0(%RSP),%RCX |
(827) 0x4777f8 VMOVSD 0xd8(%RSP),%XMM17 |
(827) 0x477800 VMOVSD 0xc0(%RSP),%XMM18 |
(827) 0x477808 VMOVSD 0xb8(%RSP),%XMM13 |
(827) 0x477811 VMOVSD 0xa8(%RSP),%XMM16 |
(827) 0x477819 IMUL %RBX,%R13 |
(827) 0x47781d CMPQ $0,0xd0(%RSP) |
(827) 0x477826 MOV 0x8(%R14),%R14 |
(827) 0x47782a JE 477da5 |
(827) 0x477830 MOV 0xf8(%RSP),%RAX |
(827) 0x477838 MOV 0xc8(%RSP),%RSI |
(827) 0x477840 MOV %RCX,%RDI |
(827) 0x477843 INC %RCX |
(827) 0x477846 LEA (%R11,%R11,1),%R9 |
(827) 0x47784a MOV %R11,%R8 |
(827) 0x47784d VBROADCASTSD %XMM17,%ZMM7 |
(827) 0x477853 VBROADCASTSD %XMM18,%ZMM6 |
(827) 0x477859 IMUL %R11,%RDI |
(827) 0x47785d LEA (,%RBX,8),%R12 |
(827) 0x477865 LEA 0x100(%RSP),%RDX |
(827) 0x47786d MOV %R9,0xb8(%RSP) |
(827) 0x477875 IMUL %R11,%RCX |
(827) 0x477879 MOV 0x6c(%RSP),%R11D |
(827) 0x47787e VMOVQ %R12,%XMM3 |
(827) 0x477883 VBROADCASTSD %XMM13,%ZMM5 |
(827) 0x477889 MOV %R15,%R12 |
(827) 0x47788c VBROADCASTSD %XMM16,%ZMM4 |
(827) 0x477892 MOV %RBX,%R15 |
(827) 0x477895 IMUL %RSI,%RAX |
(827) 0x477899 SAL $0x4,%R8 |
(827) 0x47789d ADD %RAX,%RDI |
(827) 0x4778a0 ADD %RAX,%RCX |
(827) 0x4778a3 AND $0x7,%R11D |
(827) 0x4778a7 MOV %R8,0xc0(%RSP) |
(827) 0x4778af LEA (%RDI,%R13,1),%R10 |
(827) 0x4778b3 ADD %RCX,%R13 |
(827) 0x4778b6 MOV %RDX,%R8 |
(827) 0x4778b9 MOV %R11D,0xa8(%RSP) |
(827) 0x4778c1 MOV %R13,%R9 |
(827) 0x4778c4 MOV %R14,%R13 |
(829) 0x4778c7 LEA 0x120(%RSP),%RDX |
(829) 0x4778cf LEA (%R13,%R10,8),%RDI |
(829) 0x4778d4 LEA (%R13,%R9,8),%RSI |
(829) 0x4778d9 VBROADCASTSD %XMM17,%YMM22 |
(829) 0x4778df VBROADCASTSD %XMM18,%YMM21 |
(829) 0x4778e5 VBROADCASTSD %XMM13,%YMM20 |
(829) 0x4778eb VMOVQ %XMM3,%RCX |
(829) 0x4778f0 VBROADCASTSD %XMM16,%YMM19 |
(829) 0x4778f6 VMOVSD (%R8),%XMM2 |
(829) 0x4778fb MOV %R9,0xd8(%RSP) |
(829) 0x477903 MOV %R8,0xa0(%RSP) |
(829) 0x47790b MOV %R10,0x98(%RSP) |
(829) 0x477913 MOV %R9,0x90(%RSP) |
(829) 0x47791b MOV %R10,0xf8(%RSP) |
(828) 0x477923 CMPQ $0x6,0xb0(%RSP) |
(828) 0x47792c VMULSD (%RDX),%XMM2,%XMM12 |
(828) 0x477930 JBE 477e5e |
(828) 0x477936 LEA (%RDI,%RCX,1),%R14 |
(828) 0x47793a LEA (%RCX,%RSI,1),%R11 |
(828) 0x47793e VMULSD 0x8(%RDX),%XMM2,%XMM9 |
(828) 0x477943 VBROADCASTSD %XMM12,%ZMM11 |
(828) 0x477949 LEA (%R14,%RCX,1),%RBX |
(828) 0x47794d LEA (%RCX,%R11,1),%R10 |
(828) 0x477951 VBROADCASTSD %XMM9,%ZMM10 |
(828) 0x477957 XOR %EAX,%EAX |
(828) 0x477959 LEA (%RBX,%RCX,1),%R9 |
(828) 0x47795d LEA (%R10,%RCX,1),%R8 |
(828) 0x477961 TESTB $0x40,0xf0(%RSP) |
(828) 0x477969 JE 4779d0 |
(828) 0x47796b VMULPD (%R11),%ZMM6,%ZMM8 |
(828) 0x477971 VMULPD (%R8),%ZMM4,%ZMM24 |
(828) 0x477977 CMPQ $0x40,0xf0(%RSP) |
(828) 0x477980 MOV $0x40,%EAX |
(828) 0x477985 VFMADD231PD (%RSI),%ZMM7,%ZMM8 |
(828) 0x47798b VFMADD231PD (%R10),%ZMM5,%ZMM24 |
(828) 0x477991 VADDPD %ZMM24,%ZMM8,%ZMM14 |
(828) 0x477997 VMULPD (%R14),%ZMM6,%ZMM23 |
(828) 0x47799d VMULPD (%R9),%ZMM4,%ZMM1 |
(828) 0x4779a3 VFMADD231PD (%RDI),%ZMM7,%ZMM23 |
(828) 0x4779a9 VFMADD231PD (%RBX),%ZMM5,%ZMM1 |
(828) 0x4779af VADDPD %ZMM1,%ZMM23,%ZMM25 |
(828) 0x4779b5 VFMADD213PD (%R12),%ZMM11,%ZMM25 |
(828) 0x4779bc VFMADD132PD %ZMM10,%ZMM25,%ZMM14 |
(828) 0x4779c2 VMOVUPD %ZMM14,(%R12) |
(828) 0x4779c9 JE 477a9c |
(828) 0x4779cf NOP |
(830) 0x4779d0 VMULPD (%R14,%RAX,1),%ZMM6,%ZMM26 |
(830) 0x4779d7 VMULPD (%R9,%RAX,1),%ZMM4,%ZMM15 |
(830) 0x4779de VMULPD (%R11,%RAX,1),%ZMM6,%ZMM0 |
(830) 0x4779e5 VMULPD (%R8,%RAX,1),%ZMM4,%ZMM28 |
(830) 0x4779ec VFMADD231PD (%RBX,%RAX,1),%ZMM5,%ZMM15 |
(830) 0x4779f3 VFMADD231PD (%RDI,%RAX,1),%ZMM7,%ZMM26 |
(830) 0x4779fa VADDPD %ZMM15,%ZMM26,%ZMM27 |
(830) 0x477a00 VFMADD213PD (%R12,%RAX,1),%ZMM11,%ZMM27 |
(830) 0x477a07 VMULPD 0x40(%RAX,%R11,1),%ZMM6,%ZMM14 |
(830) 0x477a0f VMULPD 0x40(%R8,%RAX,1),%ZMM4,%ZMM30 |
(830) 0x477a17 VFMADD231PD (%RSI,%RAX,1),%ZMM7,%ZMM0 |
(830) 0x477a1e VFMADD231PD (%R10,%RAX,1),%ZMM5,%ZMM28 |
(830) 0x477a25 VADDPD %ZMM28,%ZMM0,%ZMM9 |
(830) 0x477a2b VFMADD231PD 0x40(%RAX,%RSI,1),%ZMM7,%ZMM14 |
(830) 0x477a33 VFMADD231PD 0x40(%R10,%RAX,1),%ZMM5,%ZMM30 |
(830) 0x477a3b VADDPD %ZMM30,%ZMM14,%ZMM15 |
(830) 0x477a41 VMULPD 0x40(%R14,%RAX,1),%ZMM6,%ZMM1 |
(830) 0x477a49 VMULPD 0x40(%R9,%RAX,1),%ZMM4,%ZMM29 |
(830) 0x477a51 VFMADD231PD 0x40(%RDI,%RAX,1),%ZMM7,%ZMM1 |
(830) 0x477a59 VFMADD231PD 0x40(%RBX,%RAX,1),%ZMM5,%ZMM29 |
(830) 0x477a61 VFMADD132PD %ZMM10,%ZMM27,%ZMM9 |
(830) 0x477a67 VADDPD %ZMM29,%ZMM1,%ZMM8 |
(830) 0x477a6d VFMADD213PD 0x40(%R12,%RAX,1),%ZMM11,%ZMM8 |
(830) 0x477a75 VFMADD132PD %ZMM10,%ZMM8,%ZMM15 |
(830) 0x477a7b VMOVUPD %ZMM9,(%R12,%RAX,1) |
(830) 0x477a82 VMOVUPD %ZMM15,0x40(%R12,%RAX,1) |
(830) 0x477a8a SUB $-0x80,%RAX |
(830) 0x477a8e CMP %RAX,0xf0(%RSP) |
(830) 0x477a96 JNE 4779d0 |
(828) 0x477a9c MOV 0xa8(%RSP),%R14D |
(828) 0x477aa4 TEST %R14D,%R14D |
(828) 0x477aa7 JE 477d2f |
(828) 0x477aad MOV 0x88(%RSP),%RAX |
(828) 0x477ab5 MOV 0xd0(%RSP),%R10 |
(828) 0x477abd SUB %RAX,%R10 |
(828) 0x477ac0 LEA -0x1(%R10),%RBX |
(828) 0x477ac4 CMP $0x2,%RBX |
(828) 0x477ac8 JBE 477e65 |
(828) 0x477ace MOV 0xf8(%RSP),%R9 |
(828) 0x477ad6 VMOVSD 0x8(%RDX),%XMM10 |
(828) 0x477adb VMULSD %XMM10,%XMM2,%XMM8 |
(828) 0x477ae0 VBROADCASTSD %XMM8,%YMM15 |
(828) 0x477ae5 LEA (%R12,%RAX,8),%R8 |
(828) 0x477ae9 VBROADCASTSD %XMM12,%YMM0 |
(828) 0x477aee LEA (%R15,%R9,1),%R14 |
(828) 0x477af2 LEA (%R15,%R14,1),%R11 |
(828) 0x477af6 ADD %RAX,%R14 |
(828) 0x477af9 LEA (%R11,%RAX,1),%RBX |
(828) 0x477afd ADD %R15,%R11 |
(828) 0x477b00 VMULPD (%R13,%R14,8),%YMM21,%YMM9 |
(828) 0x477b08 VMOVQ %RBX,%XMM11 |
(828) 0x477b0d MOV 0xd8(%RSP),%RBX |
(828) 0x477b15 LEA (%R11,%RAX,1),%R9 |
(828) 0x477b19 MOV %R9,0xe8(%RSP) |
(828) 0x477b21 MOV 0xe8(%RSP),%R14 |
(828) 0x477b29 LEA (%RAX,%RBX,1),%R11 |
(828) 0x477b2d LEA (%R15,%RBX,1),%RBX |
(828) 0x477b31 LEA (%RBX,%RAX,1),%R9 |
(828) 0x477b35 ADD %R15,%RBX |
(828) 0x477b38 VMULPD (%R13,%R14,8),%YMM19,%YMM1 |
(828) 0x477b40 VMOVQ %R9,%XMM31 |
(828) 0x477b46 LEA (%RAX,%RBX,1),%R9 |
(828) 0x477b4a ADD %R15,%RBX |
(828) 0x477b4d ADD %RAX,%RBX |
(828) 0x477b50 VMOVQ %XMM31,%R14 |
(828) 0x477b56 MOV %RBX,0xe0(%RSP) |
(828) 0x477b5e MOV 0xf8(%RSP),%RBX |
(828) 0x477b66 ADD %RAX,%RBX |
(828) 0x477b69 VFMADD231PD (%R13,%RBX,8),%YMM22,%YMM9 |
(828) 0x477b71 VMOVQ %XMM11,%RBX |
(828) 0x477b76 VMULPD (%R13,%R14,8),%YMM21,%YMM11 |
(828) 0x477b7e VFMADD231PD (%R13,%R11,8),%YMM22,%YMM11 |
(828) 0x477b86 MOV 0xe0(%RSP),%R11 |
(828) 0x477b8e VFMADD231PD (%R13,%RBX,8),%YMM20,%YMM1 |
(828) 0x477b96 VADDPD %YMM1,%YMM9,%YMM14 |
(828) 0x477b9a VMULPD (%R13,%R11,8),%YMM19,%YMM23 |
(828) 0x477ba2 VFMADD231PD (%R13,%R9,8),%YMM20,%YMM23 |
(828) 0x477baa VADDPD %YMM23,%YMM11,%YMM9 |
(828) 0x477bb0 VMULPD %YMM15,%YMM9,%YMM1 |
(828) 0x477bb5 VFMADD132PD %YMM14,%YMM1,%YMM0 |
(828) 0x477bba VADDPD (%R8),%YMM0,%YMM0 |
(828) 0x477bbf VMOVUPD %YMM0,(%R8) |
(828) 0x477bc4 MOV %R10,%R8 |
(828) 0x477bc7 AND $-0x4,%R8 |
(828) 0x477bcb ADD %R8,%RAX |
(828) 0x477bce AND $0x3,%R10D |
(828) 0x477bd2 JE 477d2f |
(828) 0x477bd8 LEA (%R15,%RAX,1),%R10 |
(828) 0x477bdc LEA (,%RAX,8),%R11 |
(828) 0x477be4 VMULSD %XMM10,%XMM2,%XMM10 |
(828) 0x477be9 LEA (%R10,%R15,1),%RBX |
(828) 0x477bed LEA (%R12,%R11,1),%R9 |
(828) 0x477bf1 LEA (%RBX,%R15,1),%R14 |
(828) 0x477bf5 VMULSD (%RDI,%RBX,8),%XMM13,%XMM14 |
(828) 0x477bfa VMULSD (%RSI,%RBX,8),%XMM13,%XMM11 |
(828) 0x477bff VFMADD231SD (%RDI,%R10,8),%XMM18,%XMM14 |
(828) 0x477c06 VFMADD231SD (%RSI,%R10,8),%XMM18,%XMM11 |
(828) 0x477c0d VMULSD (%RDI,%R14,8),%XMM16,%XMM8 |
(828) 0x477c14 VMULSD (%RSI,%R14,8),%XMM16,%XMM9 |
(828) 0x477c1b VFMADD231SD (%RDI,%R11,1),%XMM17,%XMM8 |
(828) 0x477c22 VFMADD231SD (%RSI,%R11,1),%XMM17,%XMM9 |
(828) 0x477c29 VADDSD %XMM8,%XMM14,%XMM15 |
(828) 0x477c2e VADDSD %XMM9,%XMM11,%XMM1 |
(828) 0x477c33 VMULSD %XMM10,%XMM1,%XMM0 |
(828) 0x477c38 VFMADD132SD %XMM12,%XMM0,%XMM15 |
(828) 0x477c3d VADDSD (%R9),%XMM15,%XMM14 |
(828) 0x477c42 VMOVSD %XMM14,(%R9) |
(828) 0x477c47 MOV 0xd0(%RSP),%R9 |
(828) 0x477c4f LEA 0x1(%RAX),%R10 |
(828) 0x477c53 CMP %R9,%R10 |
(828) 0x477c56 JAE 477d2f |
(828) 0x477c5c ADD %R15,%R10 |
(828) 0x477c5f LEA 0x8(%R12,%R11,1),%R14 |
(828) 0x477c64 ADD $0x2,%RAX |
(828) 0x477c68 LEA (%R15,%R10,1),%RBX |
(828) 0x477c6c LEA (%R15,%RBX,1),%R8 |
(828) 0x477c70 VMULSD (%RDI,%RBX,8),%XMM13,%XMM15 |
(828) 0x477c75 VMULSD (%RSI,%RBX,8),%XMM13,%XMM1 |
(828) 0x477c7a VFMADD231SD (%RDI,%R10,8),%XMM18,%XMM15 |
(828) 0x477c81 VMULSD (%RDI,%R8,8),%XMM16,%XMM8 |
(828) 0x477c88 VFMADD231SD (%RSI,%R10,8),%XMM18,%XMM1 |
(828) 0x477c8f VFMADD231SD 0x8(%RDI,%R11,1),%XMM17,%XMM8 |
(828) 0x477c97 VMULSD (%RSI,%R8,8),%XMM16,%XMM9 |
(828) 0x477c9e VADDSD %XMM8,%XMM15,%XMM11 |
(828) 0x477ca3 VFMADD231SD 0x8(%RSI,%R11,1),%XMM17,%XMM9 |
(828) 0x477cab VADDSD %XMM9,%XMM1,%XMM0 |
(828) 0x477cb0 VMULSD %XMM10,%XMM0,%XMM14 |
(828) 0x477cb5 VFMADD132SD %XMM12,%XMM14,%XMM11 |
(828) 0x477cba VADDSD (%R14),%XMM11,%XMM15 |
(828) 0x477cbf VMOVSD %XMM15,(%R14) |
(828) 0x477cc4 CMP %R9,%RAX |
(828) 0x477cc7 JAE 477d2f |
(828) 0x477cc9 ADD %R15,%RAX |
(828) 0x477ccc LEA 0x10(%R12,%R11,1),%R9 |
(828) 0x477cd1 LEA (%R15,%RAX,1),%R10 |
(828) 0x477cd5 LEA (%R15,%R10,1),%R14 |
(828) 0x477cd9 VMULSD (%RDI,%R10,8),%XMM13,%XMM11 |
(828) 0x477cdf VMULSD (%RSI,%R10,8),%XMM13,%XMM0 |
(828) 0x477ce5 VFMADD231SD (%RDI,%RAX,8),%XMM18,%XMM11 |
(828) 0x477cec VMULSD (%RDI,%R14,8),%XMM16,%XMM8 |
(828) 0x477cf3 VFMADD231SD (%RSI,%RAX,8),%XMM18,%XMM0 |
(828) 0x477cfa VFMADD231SD 0x10(%RDI,%R11,1),%XMM17,%XMM8 |
(828) 0x477d02 VMULSD (%RSI,%R14,8),%XMM16,%XMM9 |
(828) 0x477d09 VADDSD %XMM8,%XMM11,%XMM1 |
(828) 0x477d0e VFMADD231SD 0x10(%RSI,%R11,1),%XMM17,%XMM9 |
(828) 0x477d16 VADDSD %XMM9,%XMM0,%XMM14 |
(828) 0x477d1b VMULSD %XMM10,%XMM14,%XMM10 |
(828) 0x477d20 VFMADD132SD %XMM12,%XMM10,%XMM1 |
(828) 0x477d25 VADDSD (%R9),%XMM1,%XMM12 |
(828) 0x477d2a VMOVSD %XMM12,(%R9) |
(828) 0x477d2f MOV 0xc0(%RSP),%RAX |
(828) 0x477d37 MOV 0xb8(%RSP),%R11 |
(828) 0x477d3f ADD $0x10,%RDX |
(828) 0x477d43 LEA 0x140(%RSP),%RBX |
(828) 0x477d4b ADD %R11,0xf8(%RSP) |
(828) 0x477d53 ADD %R11,0xd8(%RSP) |
(828) 0x477d5b ADD %RAX,%RDI |
(828) 0x477d5e ADD %RAX,%RSI |
(828) 0x477d61 CMP %RDX,%RBX |
(828) 0x477d64 JNE 477923 |
(829) 0x477d6a MOV 0xa0(%RSP),%R8 |
(829) 0x477d72 MOV 0xc8(%RSP),%RDI |
(829) 0x477d7a MOV 0x98(%RSP),%R10 |
(829) 0x477d82 LEA 0x120(%RSP),%RSI |
(829) 0x477d8a MOV 0x90(%RSP),%R9 |
(829) 0x477d92 ADD $0x8,%R8 |
(829) 0x477d96 ADD %RDI,%R10 |
(829) 0x477d99 ADD %RDI,%R9 |
(829) 0x477d9c CMP %R8,%RSI |
(829) 0x477d9f JNE 4778c7 |
(827) 0x477da5 ADDQ $0x8,0x80(%RSP) |
(827) 0x477dae MOV 0x60(%RSP),%RDX |
(827) 0x477db3 MOV 0x80(%RSP),%RCX |
(827) 0x477dbb ADDQ $0x18,0x70(%RSP) |
(827) 0x477dc1 CMP %RDX,%RCX |
(827) 0x477dc4 JNE 47754f |
0x477dca MOV 0x40(%RSP),%R14 |
0x477dcf MOV 0x38(%RSP),%RBX |
0x477dd4 MOV 0x30(%RSP),%R13 |
0x477dd9 VZEROUPPER |
0x477ddc MOV %R14,%RDI |
0x477ddf CALL 51ef50 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE4stopEv> |
0x477de4 MOV 0x30(%RBX),%ECX |
0x477de7 XOR %R15D,%R15D |
0x477dea XOR %R12D,%R12D |
0x477ded TEST %ECX,%ECX |
0x477def JLE 477e4f |
(826) 0x477df1 MOV 0x40(%RBX),%EAX |
(826) 0x477df4 MOV 0x8(%RBX),%R8D |
(826) 0x477df8 MOV %R12D,%R11D |
(826) 0x477dfb INC %R12D |
(826) 0x477dfe IMUL %ECX,%R11D |
(826) 0x477e02 IMUL %R12D,%EAX |
(826) 0x477e06 CMP %R8D,%EAX |
(826) 0x477e09 CMOVG %R8D,%EAX |
(826) 0x477e0d SUB %R11D,%EAX |
(826) 0x477e10 TEST %EAX,%EAX |
(826) 0x477e12 JLE 477e46 |
(826) 0x477e14 MOV 0x18(%R13),%R9 |
(826) 0x477e18 MOV 0x310(%RBX),%RSI |
(826) 0x477e1f CLTQ |
(826) 0x477e21 MOVSXD %R11D,%R10 |
(826) 0x477e24 LEA (,%RAX,8),%RDX |
(826) 0x477e2c MOV (%RSI,%R15,1),%RSI |
(826) 0x477e30 LEA (%R9,%R10,8),%RDI |
(826) 0x477e34 CMP $0x8,%RDX |
(826) 0x477e38 JE 477f1e |
(826) 0x477e3e CALL 4040d0 <memmove@plt> |
(826) 0x477e43 MOV 0x30(%RBX),%ECX |
(826) 0x477e46 ADD $0x18,%R15 |
(826) 0x477e4a CMP %ECX,%R12D |
(826) 0x477e4d JL 477df1 |
0x477e4f LEA -0x28(%RBP),%RSP |
0x477e53 POP %RBX |
0x477e54 POP %R12 |
0x477e56 POP %R13 |
0x477e58 POP %R14 |
0x477e5a POP %R15 |
0x477e5c POP %RBP |
0x477e5d RET |
(828) 0x477e5e XOR %EAX,%EAX |
(828) 0x477e60 JMP 477ab5 |
(828) 0x477e65 VMOVSD 0x8(%RDX),%XMM10 |
(828) 0x477e6a JMP 477bd8 |
(827) 0x477e6f MOV 0x12cb92(%RIP),%R10 |
(827) 0x477e76 VMOVSD 0x12cb82(%RIP),%XMM13 |
(827) 0x477e7e XOR %R13D,%R13D |
(827) 0x477e81 VXORPD %XMM16,%XMM16,%XMM16 |
(827) 0x477e87 VMOVSD %XMM13,%XMM13,%XMM17 |
(827) 0x477e8d VMOVQ %R10,%XMM18 |
(827) 0x477e93 JMP 477777 |
(827) 0x477e98 VMOVAPD 0x12cb60(%RIP),%YMM11 |
(827) 0x477ea0 MOVQ $0,0xf8(%RSP) |
(827) 0x477eac JMP 47762e |
(827) 0x477eb1 VMOVAPD 0x12cb47(%RIP),%YMM1 |
(827) 0x477eb9 XOR %ECX,%ECX |
(827) 0x477ebb JMP 4776cc |
(827) 0x477ec0 VMOVAPD 0x12cb58(%RIP),%YMM1 |
(827) 0x477ec8 MOVSXD %ESI,%RCX |
(827) 0x477ecb JMP 4776cc |
(827) 0x477ed0 MOV 0x12cb31(%RIP),%R9 |
(827) 0x477ed7 MOVSXD %R8D,%R13 |
(827) 0x477eda VMOVSD 0x12cb54(%RIP),%XMM16 |
(827) 0x477ee4 VMOVSD 0x12cb3a(%RIP),%XMM18 |
(827) 0x477eee VXORPD %XMM17,%XMM17,%XMM17 |
(827) 0x477ef4 VMOVQ %R9,%XMM13 |
(827) 0x477ef9 JMP 477777 |
(827) 0x477efe CLTQ |
(827) 0x477f00 VMOVAPD 0x12cb18(%RIP),%YMM11 |
(827) 0x477f08 MOV %RAX,0xf8(%RSP) |
(827) 0x477f10 JMP 47762e |
0x477f15 VMOVSD %XMM5,%XMM5,%XMM7 |
0x477f19 JMP 477460 |
(826) 0x477f1e VMOVSD (%RSI),%XMM2 |
(826) 0x477f22 VMOVSD %XMM2,(%RDI) |
(826) 0x477f26 JMP 477e46 |
0x477f2b NOPL (%RAX,%RAX,1) |
Path / |
Source file and lines | einspline_spo_ref.hpp:172-189 |
Module | exec |
nb instructions | 99 |
nb uops | 103 |
loop length | 467 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 16 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 16 |
ADD-SUB / MUL ratio | 1.00 |
micro-operation queue | 17.17 cycles |
front end | 17.17 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 5.75 | 5.75 | 5.50 | 5.50 | 4.50 | 12.67 | 12.67 | 12.67 | 5.50 | 5.58 | 5.50 | 5.42 | 2.50 | 2.50 |
cycles | 5.75 | 5.75 | 5.50 | 5.50 | 4.50 | 12.67 | 12.67 | 12.67 | 5.50 | 5.58 | 5.50 | 5.42 | 2.50 | 2.50 |
Cycles executing div or sqrt instructions | NA |
Front-end | 17.17 |
Dispatch | 12.67 |
Overall L1 | 17.17 |
all | 5% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 25% |
all | 42% |
load | 40% |
store | 0% |
mul | 50% |
add-sub | 50% |
fma | 50% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 50% |
all | 27% |
load | 26% |
store | 0% |
mul | 50% |
add-sub | 50% |
fma | 50% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 44% |
all | 12% |
load | 11% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 17% |
load | 17% |
store | 12% |
mul | 18% |
add-sub | 18% |
fma | 18% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 18% |
all | 15% |
load | 15% |
store | 12% |
mul | 18% |
add-sub | 18% |
fma | 18% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 17% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSI,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
AND $-0x40,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RCX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOVSXD %EDX,%R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB $0x140,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV 0x358(%RDI),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 51ed20 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE5startEv> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA 0x128(%R12),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP 0x124(%R12),%R15D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
JE 477412 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x52> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV 0x40(%R12),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
LEA (%R15,%R15,2),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA (%RAX,%RDX,8),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
VMOVUPD (%RCX),%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVSD 0x10(%RCX),%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VXORPD %XMM5,%XMM5,%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD %XMM2,%XMM2,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
VUNPCKHPD %XMM2,%XMM2,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
VMULSD 0x100(%RBX),%XMM1,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VFMADD132SD 0xe8(%RBX),%XMM3,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231SD 0x118(%RBX),%XMM4,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VCOMISD %XMM0,%XMM5 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0.50 | 6 | 1 |
JBE 477455 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x95> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
VCOMISD 0x12d691(%RIP),%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0.50 | 6 | 1 |
JA 477f15 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0xb55> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
VRNDSCALESD $0x9,%XMM0,%XMM0,%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VSUBSD %XMM6,%XMM0,%XMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
MOVSXD 0x30(%RBX),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
TEST %ESI,%ESI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 477ddc <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0xa1c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
VPERMILPD $0,%XMM2,%XMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
VMULPD 0xd8(%RBX),%XMM10,%XMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPERMILPD $0x3,%XMM2,%XMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
VMOVDDUP %XMM4,%XMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
VFMADD231PD 0xf0(%RBX),%XMM9,%XMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVDDUP 0x12d64b(%RIP),%XMM13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VFMADD132PD 0x108(%RBX),%XMM11,%XMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VCMPPD $0xe,%XMM13,%XMM8,%K1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOVSXD 0x40(%RBX),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VXORPD %XMM14,%XMM14,%XMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x2f8(%RBX),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x310(%RBX),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R14,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM7,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
MOV %RBX,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R13,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VRNDSCALEPD $0x9,%XMM8,%XMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VCMPPD $0x1,%XMM14,%XMM8,%K0{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOV %EDI,0x6c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDI,0xd0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R11,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R9,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
KNOTB %K0,%K2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VSUBPD %XMM12,%XMM8,%XMM15{%K2}{z} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
LEA (,%RDI,8),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x1(%RDI),%R12 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SHR $0x3,%R15 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R8,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R12,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SAL $0x6,%R15 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVHPD %XMM15,0x50(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 9-11 | 1 |
LEA (%R9,%RSI,8),%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
AND $-0x8,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
VMOVLPD %XMM15,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
MOV %R15,0xf0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R10,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDI,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x40(%RSP),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x38(%RSP),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x30(%RSP),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 51ef50 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE4stopEv> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x30(%RBX),%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
XOR %R15D,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %R12D,%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
TEST %ECX,%ECX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 477e4f <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0xa8f> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
LEA -0x28(%RBP),%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVSD %XMM5,%XMM5,%XMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
JMP 477460 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0xa0> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
Source file and lines | einspline_spo_ref.hpp:172-189 |
Module | exec |
nb instructions | 99 |
nb uops | 103 |
loop length | 467 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 16 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 16 |
ADD-SUB / MUL ratio | 1.00 |
micro-operation queue | 17.17 cycles |
front end | 17.17 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 5.75 | 5.75 | 5.50 | 5.50 | 4.50 | 12.67 | 12.67 | 12.67 | 5.50 | 5.58 | 5.50 | 5.42 | 2.50 | 2.50 |
cycles | 5.75 | 5.75 | 5.50 | 5.50 | 4.50 | 12.67 | 12.67 | 12.67 | 5.50 | 5.58 | 5.50 | 5.42 | 2.50 | 2.50 |
Cycles executing div or sqrt instructions | NA |
Front-end | 17.17 |
Dispatch | 12.67 |
Overall L1 | 17.17 |
all | 5% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 25% |
all | 42% |
load | 40% |
store | 0% |
mul | 50% |
add-sub | 50% |
fma | 50% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 50% |
all | 27% |
load | 26% |
store | 0% |
mul | 50% |
add-sub | 50% |
fma | 50% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 44% |
all | 12% |
load | 11% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 17% |
load | 17% |
store | 12% |
mul | 18% |
add-sub | 18% |
fma | 18% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 18% |
all | 15% |
load | 15% |
store | 12% |
mul | 18% |
add-sub | 18% |
fma | 18% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 17% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSI,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
AND $-0x40,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RCX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOVSXD %EDX,%R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB $0x140,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV 0x358(%RDI),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 51ed20 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE5startEv> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA 0x128(%R12),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP 0x124(%R12),%R15D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
JE 477412 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x52> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV 0x40(%R12),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
LEA (%R15,%R15,2),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA (%RAX,%RDX,8),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
VMOVUPD (%RCX),%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVSD 0x10(%RCX),%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VXORPD %XMM5,%XMM5,%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD %XMM2,%XMM2,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
VUNPCKHPD %XMM2,%XMM2,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
VMULSD 0x100(%RBX),%XMM1,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VFMADD132SD 0xe8(%RBX),%XMM3,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231SD 0x118(%RBX),%XMM4,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VCOMISD %XMM0,%XMM5 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0.50 | 6 | 1 |
JBE 477455 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x95> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
VCOMISD 0x12d691(%RIP),%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0.50 | 6 | 1 |
JA 477f15 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0xb55> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
VRNDSCALESD $0x9,%XMM0,%XMM0,%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VSUBSD %XMM6,%XMM0,%XMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
MOVSXD 0x30(%RBX),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
TEST %ESI,%ESI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 477ddc <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0xa1c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
VPERMILPD $0,%XMM2,%XMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
VMULPD 0xd8(%RBX),%XMM10,%XMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPERMILPD $0x3,%XMM2,%XMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
VMOVDDUP %XMM4,%XMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
VFMADD231PD 0xf0(%RBX),%XMM9,%XMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVDDUP 0x12d64b(%RIP),%XMM13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VFMADD132PD 0x108(%RBX),%XMM11,%XMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VCMPPD $0xe,%XMM13,%XMM8,%K1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOVSXD 0x40(%RBX),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VXORPD %XMM14,%XMM14,%XMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x2f8(%RBX),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x310(%RBX),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R14,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM7,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
MOV %RBX,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R13,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VRNDSCALEPD $0x9,%XMM8,%XMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VCMPPD $0x1,%XMM14,%XMM8,%K0{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOV %EDI,0x6c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDI,0xd0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R11,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R9,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
KNOTB %K0,%K2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VSUBPD %XMM12,%XMM8,%XMM15{%K2}{z} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
LEA (,%RDI,8),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x1(%RDI),%R12 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SHR $0x3,%R15 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R8,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R12,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SAL $0x6,%R15 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVHPD %XMM15,0x50(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 9-11 | 1 |
LEA (%R9,%RSI,8),%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
AND $-0x8,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
VMOVLPD %XMM15,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
MOV %R15,0xf0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R10,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDI,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x40(%RSP),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x38(%RSP),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x30(%RSP),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 51ef50 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE4stopEv> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x30(%RBX),%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
XOR %R15D,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %R12D,%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
TEST %ECX,%ECX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 477e4f <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0xa8f> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
LEA -0x28(%RBP),%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVSD %XMM5,%XMM5,%XMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
JMP 477460 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0xa0> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE– | 27.9 | 56.62 |
▼Loop 827 - einspline_spo_ref.hpp:175-176 - exec– | 0.02 | 0.03 |
▼Loop 829 - MultiBsplineRef.hpp:63-71 - exec– | 0 | 0.01 |
▼Loop 828 - MultiBsplineRef.hpp:64-71 - exec– | 0.01 | 0.01 |
○Loop 830 - MultiBsplineRef.hpp:68-71 - exec | 27.82 | 51.68 |
○Loop 826 - einspline_spo_ref.hpp:183-187 - exec | 0.01 | 0.02 |