Function: _ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6 ... | Module: exec | Source: einspline_spo_ref.hpp:172-189 [...] | Coverage: 27.39% |
---|
Function: _ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6 ... | Module: exec | Source: einspline_spo_ref.hpp:172-189 [...] | Coverage: 27.39% |
---|
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/Utilities/NewTimer.h: 242 - 249 |
-------------------------------------------------------------------------------- |
242: ScopeGuard(TIMER& t) : timer(t) { timer.start(); } |
[...] |
249: ~ScopeGuard() { timer.stop(); } |
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/TinyVector.h: 61 - 61 |
-------------------------------------------------------------------------------- |
61: for (size_t d = 0; d < D; ++d) |
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/Particle/ParticleSet.h: 143 - 143 |
-------------------------------------------------------------------------------- |
143: return (active_ptcl_ == iat) ? active_pos_ : R[iat]; |
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/Numerics/Spline2/MultiBsplineEvalHelper.hpp: 45 - 47 |
-------------------------------------------------------------------------------- |
45: T sf = std::floor(x); |
46: T dx2 = x - sf; |
47: int ind2 = std::min(std::max(0, static_cast<int>(sf)), nmax); |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/stl_vector.h: 1046 - 1169 |
-------------------------------------------------------------------------------- |
1046: return *(this->_M_impl._M_start + __n); |
[...] |
1169: { return _M_data_ptr(this->_M_impl._M_start); } |
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/Numerics/Spline2/MultiBsplineData.hpp: 54 - 57 |
-------------------------------------------------------------------------------- |
54: a[0] = ((A00 * tx + A01) * tx + A02) * tx + A03; |
55: a[1] = ((A10 * tx + A11) * tx + A12) * tx + A13; |
56: a[2] = ((A20 * tx + A21) * tx + A22) * tx + A23; |
57: a[3] = ((A30 * tx + A31) * tx + A32) * tx + A33; |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/stl_algobase.h: 235 - 924 |
-------------------------------------------------------------------------------- |
235: if (__b < __a) |
[...] |
429: const ptrdiff_t _Num = __last - __first; |
430: if (_Num) |
431: __builtin_memmove(__result, __first, sizeof(_Tp) * _Num); |
[...] |
923: for (; __first != __last; ++__first) |
924: *__first = __tmp; |
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/TinyVectorTensorOps.h: 150 - 152 |
-------------------------------------------------------------------------------- |
150: return TinyVector<Type_t, 3>(lhs[0] * rhs[0] + lhs[1] * rhs[3] + lhs[2] * rhs[6], |
151: lhs[0] * rhs[1] + lhs[1] * rhs[4] + lhs[2] * rhs[7], |
152: lhs[0] * rhs[2] + lhs[1] * rhs[5] + lhs[2] * rhs[8]); |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/stl_algo.h: 725 - 751 |
-------------------------------------------------------------------------------- |
725: { return std::copy(__first, __first + __n, __result); } |
[...] |
751: if (__n2 <= 0) |
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/einspline_spo_ref.hpp: 172 - 189 |
-------------------------------------------------------------------------------- |
172: ScopedTimer local_timer(timer); |
173: |
174: auto u = Lattice.toUnit_floor(P.activeR(iat)); |
175: for (int i = 0; i < nBlocks; ++i) |
176: MultiBsplineEvalRef::evaluate_v(einsplines[i], u[0], u[1], u[2], psi[i].data(), nSplinesPerBlock); |
177: } |
178: |
179: inline void evaluate(const ParticleSet& P, int iat, ValueVector_t& psi_v) |
180: { |
181: evaluate_v(P, iat); |
182: |
183: for (int i = 0; i < nBlocks; ++i) |
184: { |
185: // in real simulation, phase needs to be applied. Here just fake computation |
186: const int first = i * nBlocks; |
187: std::copy_n(psi[i].data(), std::min((i + 1) * nSplinesPerBlock, OrbitalSetSize) - first, psi_v.data() + first); |
188: } |
189: } |
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/Particle/Lattice/CrystalLattice.h: 170 - 173 |
-------------------------------------------------------------------------------- |
170: if (-std::numeric_limits<T1>::epsilon() < val_dot[i] && val_dot[i] < 0) |
171: val_dot[i] = T1(0.0); |
172: else |
173: val_dot[i] -= std::floor(val_dot[i]); |
/beegfs/hackathon/users/eoseret/qaas_runs/170-855-3059/intel/miniqmc/build/miniqmc/src/Numerics/Spline2/MultiBsplineRef.hpp: 42 - 71 |
-------------------------------------------------------------------------------- |
42: x -= spline_m->x_grid.start; |
43: y -= spline_m->y_grid.start; |
44: z -= spline_m->z_grid.start; |
45: T tx, ty, tz; |
46: int ix, iy, iz; |
47: spline2::getSplineBound(x * spline_m->x_grid.delta_inv, tx, ix, spline_m->x_grid.num - 1); |
48: spline2::getSplineBound(y * spline_m->y_grid.delta_inv, ty, iy, spline_m->y_grid.num - 1); |
49: spline2::getSplineBound(z * spline_m->z_grid.delta_inv, tz, iz, spline_m->z_grid.num - 1); |
[...] |
56: const intptr_t xs = spline_m->x_stride; |
57: const intptr_t ys = spline_m->y_stride; |
58: const intptr_t zs = spline_m->z_stride; |
59: |
60: constexpr T zero(0); |
61: std::fill(vals, vals + num_splines, zero); |
62: |
63: for (size_t i = 0; i < 4; i++) |
64: for (size_t j = 0; j < 4; j++) |
65: { |
66: const T pre00 = a[i] * b[j]; |
67: const T* restrict coefs = spline_m->coefs + (ix + i) * xs + (iy + j) * ys + iz * zs; |
68: for (size_t n = 0; n < num_splines; n++) |
69: vals[n] += pre00 * |
70: (c[0] * coefs[n] + c[1] * coefs[n + zs] + c[2] * coefs[n + 2 * zs] + |
71: c[3] * coefs[n + 3 * zs]); |
0x442320 PUSH %RBP |
0x442321 MOV %RSP,%RBP |
0x442324 PUSH %R15 |
0x442326 PUSH %R14 |
0x442328 PUSH %R13 |
0x44232a PUSH %R12 |
0x44232c PUSH %RBX |
0x44232d SUB $0x128,%RSP |
0x442334 MOV %RCX,%RBX |
0x442337 MOV %EDX,%R12D |
0x44233a MOV %RSI,%R13 |
0x44233d MOV %RDI,%R14 |
0x442340 MOV 0x358(%RDI),%RDI |
0x442347 MOV %RDI,-0xd0(%RBP) |
0x44234e CALL 497e00 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE5startEv> |
0x442353 MOVSXD %R12D,%RAX |
0x442356 LEA (%RAX,%RAX,2),%RCX |
0x44235a SAL $0x3,%RCX |
0x44235e ADD 0x40(%R13),%RCX |
0x442362 CMP %EAX,0x124(%R13) |
0x442369 LEA 0x128(%R13),%RAX |
0x442370 CMOVNE %RCX,%RAX |
0x442374 MOVSD (%RAX),%XMM0 |
0x442378 MOVSD 0x8(%RAX),%XMM3 |
0x44237d MOVSD 0xd8(%R14),%XMM1 |
0x442386 MULSD %XMM0,%XMM1 |
0x44238a MOVSD 0xf0(%R14),%XMM2 |
0x442393 MULSD %XMM3,%XMM2 |
0x442397 ADDSD %XMM1,%XMM2 |
0x44239b MOVSD 0x10(%RAX),%XMM4 |
0x4423a0 MOVSD 0x108(%R14),%XMM5 |
0x4423a9 MULSD %XMM4,%XMM5 |
0x4423ad ADDSD %XMM2,%XMM5 |
0x4423b1 MOVSD 0xe0(%R14),%XMM1 |
0x4423ba MULSD %XMM0,%XMM1 |
0x4423be MOVSD 0xf8(%R14),%XMM2 |
0x4423c7 MULSD %XMM3,%XMM2 |
0x4423cb ADDSD %XMM1,%XMM2 |
0x4423cf MOVSD 0x110(%R14),%XMM1 |
0x4423d8 MULSD %XMM4,%XMM1 |
0x4423dc ADDSD %XMM2,%XMM1 |
0x4423e0 MULSD 0xe8(%R14),%XMM0 |
0x4423e9 MULSD 0x100(%R14),%XMM3 |
0x4423f2 MULSD 0x118(%R14),%XMM4 |
0x4423fb ADDSD %XMM0,%XMM3 |
0x4423ff UCOMISD 0xd7a69(%RIP),%XMM5 |
0x442407 MOVSD %XMM1,-0x60(%RBP) |
0x44240c JBE 442420 |
0x44240e XORPD %XMM0,%XMM0 |
0x442412 MOVSD %XMM0,-0xb0(%RBP) |
0x44241a UCOMISD %XMM0,%XMM5 |
0x44241e JB 442458 |
0x442420 MOVAPD %XMM5,%XMM0 |
0x442424 MOVSD %XMM3,-0x50(%RBP) |
0x442429 MOVSD %XMM4,-0x38(%RBP) |
0x44242e MOVSD %XMM5,-0x30(%RBP) |
0x442433 CALL 4f2000 <floor> |
0x442438 MOVSD -0x38(%RBP),%XMM4 |
0x44243d MOVSD -0x60(%RBP),%XMM1 |
0x442442 MOVSD -0x50(%RBP),%XMM3 |
0x442447 MOVSD -0x30(%RBP),%XMM2 |
0x44244c SUBSD %XMM0,%XMM2 |
0x442450 MOVSD %XMM2,-0xb0(%RBP) |
0x442458 ADDSD %XMM4,%XMM3 |
0x44245c UCOMISD 0xd7a0c(%RIP),%XMM1 |
0x442464 MOVSD %XMM3,-0x50(%RBP) |
0x442469 JBE 44247d |
0x44246b XORPD %XMM0,%XMM0 |
0x44246f MOVSD %XMM0,-0xa8(%RBP) |
0x442477 UCOMISD %XMM0,%XMM1 |
0x44247b JB 44249c |
0x44247d MOVAPD %XMM1,%XMM0 |
0x442481 CALL 4f2000 <floor> |
0x442486 MOVSD -0x50(%RBP),%XMM3 |
0x44248b MOVSD -0x60(%RBP),%XMM1 |
0x442490 SUBSD %XMM0,%XMM1 |
0x442494 MOVSD %XMM1,-0xa8(%RBP) |
0x44249c MOV %RBX,-0xc8(%RBP) |
0x4424a3 UCOMISD 0xd79c5(%RIP),%XMM3 |
0x4424ab JBE 4424bf |
0x4424ad XORPD %XMM0,%XMM0 |
0x4424b1 MOVSD %XMM0,-0xa0(%RBP) |
0x4424b9 UCOMISD %XMM0,%XMM3 |
0x4424bd JB 4424d9 |
0x4424bf MOVAPD %XMM3,%XMM0 |
0x4424c3 CALL 4f2000 <floor> |
0x4424c8 MOVSD -0x50(%RBP),%XMM1 |
0x4424cd SUBSD %XMM0,%XMM1 |
0x4424d1 MOVSD %XMM1,-0xa0(%RBP) |
0x4424d9 MOV %R14,-0x98(%RBP) |
0x4424e0 MOV 0x30(%R14),%EAX |
0x4424e4 MOV %RAX,-0xb8(%RBP) |
0x4424eb TEST %EAX,%EAX |
0x4424ed JLE 442b14 |
0x4424f3 MOV -0x98(%RBP),%RAX |
0x4424fa MOV 0x2f8(%RAX),%RCX |
0x442501 MOV %RCX,-0xe8(%RBP) |
0x442508 MOV 0x310(%RAX),%RCX |
0x44250f MOV %RCX,-0xe0(%RBP) |
0x442516 MOVSXD 0x40(%RAX),%R14 |
0x44251a LEA (,%R14,8),%RAX |
0x442522 MOV %RAX,-0xd8(%RBP) |
0x442529 CMP $0x1,%R14 |
0x44252d MOV %R14,%R15 |
0x442530 ADC $0,%R15 |
0x442534 DECQ -0xb8(%RBP) |
0x44253b MOV %R15,%RAX |
0x44253e SHR $0x1,%RAX |
0x442541 MOV %RAX,-0x108(%RBP) |
0x442548 MOV %R15,%RBX |
0x44254b AND $-0x2,%RBX |
0x44254f XOR %R13D,%R13D |
0x442552 JMP 442578 |
0x442554 NOPW %CS:(%RAX,%RAX,1) |
(818) 0x442560 MOV -0xf0(%RBP),%RCX |
(818) 0x442567 LEA 0x1(%RCX),%R13 |
(818) 0x44256b CMP -0xb8(%RBP),%RCX |
(818) 0x442572 JE 442b14 |
(818) 0x442578 MOV -0xe8(%RBP),%RAX |
(818) 0x44257f MOV (%RAX,%R13,8),%R12 |
(818) 0x442583 MOVSD -0xb0(%RBP),%XMM0 |
(818) 0x44258b SUBSD 0x28(%R12),%XMM0 |
(818) 0x442592 MOVSD -0xa8(%RBP),%XMM1 |
(818) 0x44259a SUBSD 0x50(%R12),%XMM1 |
(818) 0x4425a1 MOVAPD %XMM1,-0x50(%RBP) |
(818) 0x4425a6 MOVSD -0xa0(%RBP),%XMM1 |
(818) 0x4425ae SUBSD 0x78(%R12),%XMM1 |
(818) 0x4425b5 MOVAPD %XMM1,-0x60(%RBP) |
(818) 0x4425ba MULSD 0x48(%R12),%XMM0 |
(818) 0x4425c1 MOVAPD %XMM0,-0x90(%RBP) |
(818) 0x4425c9 CALL 4f2000 <floor> |
(818) 0x4425ce MOVSD %XMM0,-0x38(%RBP) |
(818) 0x4425d3 MOVAPD -0x50(%RBP),%XMM0 |
(818) 0x4425d8 MULSD 0x70(%R12),%XMM0 |
(818) 0x4425df MOVAPD %XMM0,-0x50(%RBP) |
(818) 0x4425e4 CALL 4f2000 <floor> |
(818) 0x4425e9 MOVSD %XMM0,-0x30(%RBP) |
(818) 0x4425ee MOVAPD -0x60(%RBP),%XMM0 |
(818) 0x4425f3 MULSD 0x98(%R12),%XMM0 |
(818) 0x4425fd MOVAPD %XMM0,-0x60(%RBP) |
(818) 0x442602 CALL 4f2000 <floor> |
(818) 0x442607 MOV %R13,-0xf0(%RBP) |
(818) 0x44260e LEA (,%R13,2),%RAX |
(818) 0x442616 ADD %R13,%RAX |
(818) 0x442619 MOV -0xe0(%RBP),%RCX |
(818) 0x442620 MOV (%RCX,%RAX,8),%R13 |
(818) 0x442624 MOVSXD 0x38(%R12),%R9 |
(818) 0x442629 MOVAPD -0x90(%RBP),%XMM4 |
(818) 0x442631 SUBSD -0x38(%RBP),%XMM4 |
(818) 0x442636 MOVSXD 0x60(%R12),%R10 |
(818) 0x44263b MOVAPD -0x50(%RBP),%XMM12 |
(818) 0x442641 SUBSD -0x30(%RBP),%XMM12 |
(818) 0x442647 MOVSXD 0x88(%R12),%R11 |
(818) 0x44264f MOVAPD %XMM4,%XMM10 |
(818) 0x442654 MOVSD 0xd781c(%RIP),%XMM5 |
(818) 0x44265c MULSD %XMM5,%XMM10 |
(818) 0x442661 MOVSD 0xd3aaf(%RIP),%XMM6 |
(818) 0x442669 MOVAPD %XMM6,%XMM1 |
(818) 0x44266d SUBSD %XMM10,%XMM1 |
(818) 0x442672 MOVAPD %XMM4,%XMM2 |
(818) 0x442676 MULSD %XMM4,%XMM2 |
(818) 0x44267a MOVAPD %XMM4,%XMM3 |
(818) 0x44267e MOVAPD %XMM4,%XMM11 |
(818) 0x442683 UNPCKLPD %XMM4,%XMM3 |
(818) 0x442687 MOVAPD 0xd7771(%RIP),%XMM7 |
(818) 0x44268f SHUFPD $0x2,%XMM7,%XMM1 |
(818) 0x442694 MULPD %XMM3,%XMM1 |
(818) 0x442698 MOVAPD %XMM1,%XMM3 |
(818) 0x44269c MOVAPD 0xd776b(%RIP),%XMM8 |
(818) 0x4426a5 ADDPD %XMM8,%XMM3 |
(818) 0x4426aa UNPCKLPD %XMM2,%XMM4 |
(818) 0x4426ae MULPD %XMM3,%XMM4 |
(818) 0x4426b2 MOVAPD 0xd7765(%RIP),%XMM9 |
(818) 0x4426bb ADDPD %XMM9,%XMM4 |
(818) 0x4426c0 MOVAPD %XMM4,-0x150(%RBP) |
(818) 0x4426c8 UNPCKHPD %XMM1,%XMM1 |
(818) 0x4426cc MOVAPD %XMM6,%XMM3 |
(818) 0x4426d0 SUBSD %XMM1,%XMM3 |
(818) 0x4426d4 MULSD %XMM11,%XMM3 |
(818) 0x4426d9 ADDSD %XMM6,%XMM3 |
(818) 0x4426dd MULSD %XMM11,%XMM3 |
(818) 0x4426e2 ADDSD %XMM5,%XMM3 |
(818) 0x4426e6 MOVSD %XMM3,-0x140(%RBP) |
(818) 0x4426ee MULSD %XMM10,%XMM2 |
(818) 0x4426f3 MOVSD %XMM2,-0x138(%RBP) |
(818) 0x4426fb MOVAPD %XMM12,%XMM4 |
(818) 0x442700 MOVAPD %XMM12,%XMM11 |
(818) 0x442705 MULSD %XMM5,%XMM11 |
(818) 0x44270a MOVAPD %XMM6,%XMM1 |
(818) 0x44270e SUBSD %XMM11,%XMM1 |
(818) 0x442713 MOVAPD %XMM12,%XMM2 |
(818) 0x442718 MULSD %XMM12,%XMM2 |
(818) 0x44271d MOVAPD %XMM12,%XMM3 |
(818) 0x442722 MOVAPD %XMM12,%XMM10 |
(818) 0x442727 UNPCKLPD %XMM12,%XMM3 |
(818) 0x44272c SHUFPD $0x2,%XMM7,%XMM1 |
(818) 0x442731 MULPD %XMM3,%XMM1 |
(818) 0x442735 MOVAPD %XMM1,%XMM3 |
(818) 0x442739 ADDPD %XMM8,%XMM3 |
(818) 0x44273e UNPCKLPD %XMM2,%XMM4 |
(818) 0x442742 MULPD %XMM3,%XMM4 |
(818) 0x442746 ADDPD %XMM9,%XMM4 |
(818) 0x44274b MOVAPD %XMM4,-0x130(%RBP) |
(818) 0x442753 UNPCKHPD %XMM1,%XMM1 |
(818) 0x442757 MOVAPD %XMM6,%XMM3 |
(818) 0x44275b SUBSD %XMM1,%XMM3 |
(818) 0x44275f MULSD %XMM12,%XMM3 |
(818) 0x442764 ADDSD %XMM6,%XMM3 |
(818) 0x442768 MULSD %XMM12,%XMM3 |
(818) 0x44276d ADDSD %XMM5,%XMM3 |
(818) 0x442771 MOVSD %XMM3,-0x120(%RBP) |
(818) 0x442779 MULSD %XMM11,%XMM2 |
(818) 0x44277e MOVSD %XMM2,-0x118(%RBP) |
(818) 0x442786 MOV 0x10(%R12),%RAX |
(818) 0x44278b MOV %RAX,-0xc0(%RBP) |
(818) 0x442792 MOV 0x18(%R12),%RAX |
(818) 0x442797 MOV %RAX,-0x50(%RBP) |
(818) 0x44279b MOV %R12,-0x90(%RBP) |
(818) 0x4427a2 MOV 0x20(%R12),%R12 |
(818) 0x4427a7 MOV -0xd8(%RBP),%RDX |
(818) 0x4427ae TEST %RDX,%RDX |
(818) 0x4427b1 JE 4427df |
(818) 0x4427b3 MOV %R13,%RDI |
(818) 0x4427b6 XOR %ESI,%ESI |
(818) 0x4427b8 MOV %R9,-0x80(%RBP) |
(818) 0x4427bc MOV %R11,-0x78(%RBP) |
(818) 0x4427c0 MOV %R10,-0x70(%RBP) |
(818) 0x4427c4 MOVSD %XMM0,-0x68(%RBP) |
(818) 0x4427c9 CALL 5074e0 <_intel_fast_memset> |
(818) 0x4427ce MOVSD -0x68(%RBP),%XMM0 |
(818) 0x4427d3 MOV -0x70(%RBP),%R10 |
(818) 0x4427d7 MOV -0x78(%RBP),%R11 |
(818) 0x4427db MOV -0x80(%RBP),%R9 |
(818) 0x4427df CVTTSD2SI -0x38(%RBP),%EDX |
(818) 0x4427e4 CVTTSD2SI -0x30(%RBP),%ESI |
(818) 0x4427e9 MOVAPD -0x60(%RBP),%XMM7 |
(818) 0x4427ee SUBSD %XMM0,%XMM7 |
(818) 0x4427f2 CVTTSD2SI %XMM0,%ECX |
(818) 0x4427f6 MOVAPD %XMM7,%XMM3 |
(818) 0x4427fa MOVSD 0xd7676(%RIP),%XMM5 |
(818) 0x442802 MULSD %XMM5,%XMM3 |
(818) 0x442806 MOVSD 0xd390a(%RIP),%XMM6 |
(818) 0x44280e MOVAPD %XMM6,%XMM4 |
(818) 0x442812 SUBSD %XMM3,%XMM4 |
(818) 0x442816 MOVAPD %XMM7,%XMM0 |
(818) 0x44281a MULSD %XMM7,%XMM0 |
(818) 0x44281e MOVAPD %XMM7,%XMM1 |
(818) 0x442822 UNPCKLPD %XMM7,%XMM1 |
(818) 0x442826 SHUFPD $0x2,0xd75d1(%RIP),%XMM4 |
(818) 0x44282f MULPD %XMM1,%XMM4 |
(818) 0x442833 MOVAPD %XMM4,%XMM2 |
(818) 0x442837 ADDPD 0xd75d1(%RIP),%XMM2 |
(818) 0x44283f MOVAPD %XMM7,%XMM1 |
(818) 0x442843 UNPCKLPD %XMM0,%XMM1 |
(818) 0x442847 MULPD %XMM2,%XMM1 |
(818) 0x44284b ADDPD 0xd75cd(%RIP),%XMM1 |
(818) 0x442853 UNPCKHPD %XMM4,%XMM4 |
(818) 0x442857 MOVAPD %XMM6,%XMM2 |
(818) 0x44285b SUBSD %XMM4,%XMM2 |
(818) 0x44285f MULSD %XMM7,%XMM2 |
(818) 0x442863 ADDSD %XMM6,%XMM2 |
(818) 0x442867 MULSD %XMM7,%XMM2 |
(818) 0x44286b ADDSD %XMM5,%XMM2 |
(818) 0x44286f MOV -0x90(%RBP),%RAX |
(818) 0x442876 MOV 0x8(%RAX),%RAX |
(818) 0x44287a MULSD %XMM3,%XMM0 |
(818) 0x44287e MOVAPD %XMM1,%XMM3 |
(818) 0x442882 UNPCKHPD %XMM1,%XMM3 |
(818) 0x442886 MOVAPD %XMM1,%XMM4 |
(818) 0x44288a UNPCKLPD %XMM1,%XMM4 |
(818) 0x44288e MOVAPD %XMM2,%XMM5 |
(818) 0x442892 UNPCKLPD %XMM2,%XMM5 |
(818) 0x442896 MOVAPD %XMM0,%XMM6 |
(818) 0x44289a UNPCKLPD %XMM0,%XMM6 |
(818) 0x44289e DEC %R10 |
(818) 0x4428a1 TEST %ESI,%ESI |
(818) 0x4428a3 MOV $0,%EDI |
(818) 0x4428a8 CMOVLE %EDI,%ESI |
(818) 0x4428ab CMP %RSI,%R10 |
(818) 0x4428ae CMOVGE %RSI,%R10 |
(818) 0x4428b2 MOV -0x50(%RBP),%R8 |
(818) 0x4428b6 IMUL %R8,%R10 |
(818) 0x4428ba DEC %R9 |
(818) 0x4428bd TEST %EDX,%EDX |
(818) 0x4428bf CMOVLE %EDI,%EDX |
(818) 0x4428c2 CMP %RDX,%R9 |
(818) 0x4428c5 CMOVGE %RDX,%R9 |
(818) 0x4428c9 MOV -0xc0(%RBP),%RSI |
(818) 0x4428d0 IMUL %RSI,%R9 |
(818) 0x4428d4 DEC %R11 |
(818) 0x4428d7 TEST %ECX,%ECX |
(818) 0x4428d9 CMOVLE %EDI,%ECX |
(818) 0x4428dc CMP %RCX,%R11 |
(818) 0x4428df CMOVGE %RCX,%R11 |
(818) 0x4428e3 MOV %R12,%RCX |
(818) 0x4428e6 IMUL %R11,%RCX |
(818) 0x4428ea ADD %R10,%R9 |
(818) 0x4428ed ADD %R9,%RCX |
(818) 0x4428f0 LEA (%RCX,%RBX,1),%RDX |
(818) 0x4428f4 LEA (%RDX,%R12,1),%RDI |
(818) 0x4428f8 MOV %RDI,-0x38(%RBP) |
(818) 0x4428fc LEA (%RDX,%R12,2),%RDI |
(818) 0x442900 MOV %RDI,-0x30(%RBP) |
(818) 0x442904 LEA (%R12,%R12,2),%RDI |
(818) 0x442908 MOV %RDX,-0x60(%RBP) |
(818) 0x44290c ADD %RDX,%RDI |
(818) 0x44290f MOV %RDI,-0x90(%RBP) |
(818) 0x442916 LEA 0x3(%R11),%RDX |
(818) 0x44291a IMUL %R12,%RDX |
(818) 0x44291e ADD %R9,%RDX |
(818) 0x442921 LEA (%RAX,%RDX,8),%RDI |
(818) 0x442925 LEA (,%RSI,8),%RDX |
(818) 0x44292d MOV %RDX,-0xf8(%RBP) |
(818) 0x442934 LEA 0x2(%R11),%RDX |
(818) 0x442938 IMUL %R12,%RDX |
(818) 0x44293c INC %R11 |
(818) 0x44293f IMUL %R12,%R11 |
(818) 0x442943 LEA (,%R8,8),%R10 |
(818) 0x44294b ADD %R9,%RDX |
(818) 0x44294e LEA (%RAX,%RDX,8),%R8 |
(818) 0x442952 MOV %RDI,%RDX |
(818) 0x442955 ADD %R9,%R11 |
(818) 0x442958 LEA (%RAX,%R11,8),%R9 |
(818) 0x44295c LEA (%RAX,%RCX,8),%R12 |
(818) 0x442960 XOR %ECX,%ECX |
(818) 0x442962 JMP 4429a8 |
0x442964 NOPW %CS:(%RAX,%RAX,1) |
(819) 0x442970 MOV -0x100(%RBP),%RDI |
(819) 0x442977 LEA 0x1(%RDI),%RCX |
(819) 0x44297b MOV -0x80(%RBP),%RDX |
(819) 0x44297f MOV -0xf8(%RBP),%RSI |
(819) 0x442986 ADD %RSI,%RDX |
(819) 0x442989 MOV -0x78(%RBP),%R8 |
(819) 0x44298d ADD %RSI,%R8 |
(819) 0x442990 MOV -0x70(%RBP),%R9 |
(819) 0x442994 ADD %RSI,%R9 |
(819) 0x442997 MOV -0x68(%RBP),%R12 |
(819) 0x44299b ADD %RSI,%R12 |
(819) 0x44299e CMP $0x3,%RDI |
(819) 0x4429a2 JE 442560 |
(819) 0x4429a8 MOVSD -0x150(%RBP,%RCX,8),%XMM7 |
(819) 0x4429b1 MOV -0xc0(%RBP),%R11 |
(819) 0x4429b8 MOV %RCX,-0x100(%RBP) |
(819) 0x4429bf IMUL %RCX,%R11 |
(819) 0x4429c3 MOV %R12,-0x68(%RBP) |
(819) 0x4429c7 MOV %R9,-0x70(%RBP) |
(819) 0x4429cb MOV %R8,-0x78(%RBP) |
(819) 0x4429cf MOV %RDX,-0x80(%RBP) |
(819) 0x4429d3 XOR %ECX,%ECX |
(819) 0x4429d5 JMP 4429fd |
0x4429d7 NOPW (%RAX,%RAX,1) |
(820) 0x4429e0 LEA 0x1(%RCX),%RSI |
(820) 0x4429e4 ADD %R10,%RDX |
(820) 0x4429e7 ADD %R10,%R8 |
(820) 0x4429ea ADD %R10,%R9 |
(820) 0x4429ed ADD %R10,%R12 |
(820) 0x4429f0 CMP $0x3,%RCX |
(820) 0x4429f4 MOV %RSI,%RCX |
(820) 0x4429f7 JE 442970 |
(820) 0x4429fd TEST %R14D,%R14D |
(820) 0x442a00 JE 4429e0 |
(820) 0x442a02 MOVSD -0x130(%RBP,%RCX,8),%XMM8 |
(820) 0x442a0c MULSD %XMM7,%XMM8 |
(820) 0x442a11 CMP $0x2,%R15 |
(820) 0x442a15 JB 442a8c |
(820) 0x442a17 MOVAPD %XMM8,%XMM9 |
(820) 0x442a1c UNPCKLPD %XMM8,%XMM9 |
(820) 0x442a21 MOV -0x108(%RBP),%RSI |
(820) 0x442a28 XOR %EDI,%EDI |
(820) 0x442a2a NOPW (%RAX,%RAX,1) |
(821) 0x442a30 MOVUPD (%R12,%RDI,1),%XMM10 |
(821) 0x442a36 MULPD %XMM4,%XMM10 |
(821) 0x442a3b MOVUPD (%R9,%RDI,1),%XMM11 |
(821) 0x442a41 MULPD %XMM3,%XMM11 |
(821) 0x442a46 ADDPD %XMM10,%XMM11 |
(821) 0x442a4b MOVUPD (%R8,%RDI,1),%XMM10 |
(821) 0x442a51 MULPD %XMM5,%XMM10 |
(821) 0x442a56 MOVUPD (%RDX,%RDI,1),%XMM12 |
(821) 0x442a5c MULPD %XMM6,%XMM12 |
(821) 0x442a61 ADDPD %XMM10,%XMM12 |
(821) 0x442a66 ADDPD %XMM11,%XMM12 |
(821) 0x442a6b MULPD %XMM9,%XMM12 |
(821) 0x442a70 MOVUPD (%R13,%RDI,1),%XMM10 |
(821) 0x442a77 ADDPD %XMM12,%XMM10 |
(821) 0x442a7c MOVUPD %XMM10,(%R13,%RDI,1) |
(821) 0x442a83 ADD $0x10,%RDI |
(821) 0x442a87 DEC %RSI |
(821) 0x442a8a JNE 442a30 |
(820) 0x442a8c CMP %R15,%RBX |
(820) 0x442a8f JAE 4429e0 |
(820) 0x442a95 MOV -0x50(%RBP),%RSI |
(820) 0x442a99 IMUL %RCX,%RSI |
(820) 0x442a9d ADD %R11,%RSI |
(820) 0x442aa0 MOV -0x60(%RBP),%RDI |
(820) 0x442aa4 ADD %RSI,%RDI |
(820) 0x442aa7 MOVSD (%RAX,%RDI,8),%XMM9 |
(820) 0x442aad MOV -0x38(%RBP),%RDI |
(820) 0x442ab1 ADD %RSI,%RDI |
(820) 0x442ab4 MOVHPD (%RAX,%RDI,8),%XMM9 |
(820) 0x442aba MOV -0x30(%RBP),%RDI |
(820) 0x442abe ADD %RSI,%RDI |
(820) 0x442ac1 ADD -0x90(%RBP),%RSI |
(820) 0x442ac8 MOVAPD %XMM2,%XMM10 |
(820) 0x442acd MOVHPD (%RAX,%RSI,8),%XMM10 |
(820) 0x442ad3 MOVSD (%RAX,%RDI,8),%XMM11 |
(820) 0x442ad9 UNPCKLPD %XMM0,%XMM11 |
(820) 0x442ade MULPD %XMM11,%XMM10 |
(820) 0x442ae3 MULPD %XMM1,%XMM9 |
(820) 0x442ae8 ADDPD %XMM10,%XMM9 |
(820) 0x442aed MOVAPD %XMM9,%XMM10 |
(820) 0x442af2 UNPCKHPD %XMM9,%XMM10 |
(820) 0x442af7 ADDSD %XMM9,%XMM10 |
(820) 0x442afc MULSD %XMM10,%XMM8 |
(820) 0x442b01 ADDSD (%R13,%RBX,8),%XMM8 |
(820) 0x442b08 MOVSD %XMM8,(%R13,%RBX,8) |
(820) 0x442b0f JMP 4429e0 |
0x442b14 MOV -0xd0(%RBP),%RDI |
0x442b1b CALL 497fd0 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE4stopEv> |
0x442b20 MOV -0x98(%RBP),%R12 |
0x442b27 MOV 0x30(%R12),%EAX |
0x442b2c TEST %EAX,%EAX |
0x442b2e MOV -0xc8(%RBP),%R15 |
0x442b35 JLE 442b95 |
0x442b37 XOR %EBX,%EBX |
0x442b39 XOR %R14D,%R14D |
0x442b3c JMP 442b4c |
0x442b3e XCHG %AX,%AX |
(817) 0x442b40 MOVSXD %EAX,%RCX |
(817) 0x442b43 ADD $0x18,%RBX |
(817) 0x442b47 CMP %RCX,%R14 |
(817) 0x442b4a JGE 442b95 |
(817) 0x442b4c MOV %R14D,%EDX |
(817) 0x442b4f IMUL %EAX,%EDX |
(817) 0x442b52 INC %R14 |
(817) 0x442b55 MOV 0x40(%R12),%ECX |
(817) 0x442b5a IMUL %R14D,%ECX |
(817) 0x442b5e MOV 0x8(%R12),%ESI |
(817) 0x442b63 CMP %ECX,%ESI |
(817) 0x442b65 CMOVL %ESI,%ECX |
(817) 0x442b68 SUB %EDX,%ECX |
(817) 0x442b6a JLE 442b40 |
(817) 0x442b6c MOVSXD %EDX,%RDI |
(817) 0x442b6f SAL $0x3,%RDI |
(817) 0x442b73 ADD 0x18(%R15),%RDI |
(817) 0x442b77 MOV 0x310(%R12),%RAX |
(817) 0x442b7f MOV (%RAX,%RBX,1),%RSI |
(817) 0x442b83 MOV %ECX,%EDX |
(817) 0x442b85 SAL $0x3,%RDX |
(817) 0x442b89 CALL 4050e0 <memmove@plt> |
(817) 0x442b8e MOV 0x30(%R12),%EAX |
(817) 0x442b93 JMP 442b40 |
0x442b95 ADD $0x128,%RSP |
0x442b9c POP %RBX |
0x442b9d POP %R12 |
0x442b9f POP %R13 |
0x442ba1 POP %R14 |
0x442ba3 POP %R15 |
0x442ba5 POP %RBP |
0x442ba6 RET |
0x442ba7 MOV %RAX,%RDI |
0x442baa CALL 410010 <__clang_call_terminate> |
0x442baf NOP |
Path / |
Source file and lines | einspline_spo_ref.hpp:172-189 |
Module | exec |
nb instructions | 138 |
nb uops | 146 |
loop length | 668 |
used x86 registers | 12 |
used mmx registers | 0 |
used xmm registers | 6 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 15 |
ADD-SUB / MUL ratio | 1.00 |
micro-operation queue | 24.33 cycles |
front end | 24.33 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 9.00 | 6.00 | 5.75 | 5.75 | 8.50 | 20.00 | 20.00 | 20.00 | 4.50 | 4.50 | 7.50 | 7.50 | 8.50 | 8.50 |
cycles | 9.00 | 6.00 | 5.75 | 5.75 | 8.50 | 20.00 | 20.00 | 20.00 | 4.50 | 4.50 | 7.50 | 7.50 | 8.50 | 8.50 |
Cycles executing div or sqrt instructions | NA |
Front-end | 24.33 |
Dispatch | 20.00 |
Overall L1 | 24.33 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 0% |
all | 10% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 50% |
all | 7% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 27% |
all | 11% |
load | 11% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 10% |
all | 13% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 18% |
all | 13% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB $0x128,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RCX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %EDX,%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x358(%RDI),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDI,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CALL 497e00 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE5startEv> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVSXD %R12D,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA (%RAX,%RAX,2),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SAL $0x3,%RCX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD 0x40(%R13),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
CMP %EAX,0x124(%R13) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
LEA 0x128(%R13),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVNE %RCX,%RAX | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSD (%RAX),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSD 0x8(%RAX),%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSD 0xd8(%R14),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MULSD %XMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOVSD 0xf0(%R14),%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MULSD %XMM3,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
ADDSD %XMM1,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
MOVSD 0x10(%RAX),%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSD 0x108(%R14),%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MULSD %XMM4,%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
ADDSD %XMM2,%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
MOVSD 0xe0(%R14),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MULSD %XMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOVSD 0xf8(%R14),%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MULSD %XMM3,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
ADDSD %XMM1,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
MOVSD 0x110(%R14),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MULSD %XMM4,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
ADDSD %XMM2,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
MULSD 0xe8(%R14),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MULSD 0x100(%R14),%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MULSD 0x118(%R14),%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
ADDSD %XMM0,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
UCOMISD 0xd7a69(%RIP),%XMM5 | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0.50 | 7 | 1 |
MOVSD %XMM1,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
JBE 442420 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x100> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
XORPD %XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOVSD %XMM0,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
UCOMISD %XMM0,%XMM5 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0.50 | 7 | 1 |
JB 442458 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x138> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOVAPD %XMM5,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOVSD %XMM3,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
MOVSD %XMM4,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
MOVSD %XMM5,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
CALL 4f2000 <floor> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVSD -0x38(%RBP),%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSD -0x60(%RBP),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSD -0x50(%RBP),%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSD -0x30(%RBP),%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUBSD %XMM0,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
MOVSD %XMM2,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
ADDSD %XMM4,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
UCOMISD 0xd7a0c(%RIP),%XMM1 | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0.50 | 7 | 1 |
MOVSD %XMM3,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
JBE 44247d <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x15d> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
XORPD %XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOVSD %XMM0,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
UCOMISD %XMM0,%XMM1 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0.50 | 7 | 1 |
JB 44249c <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x17c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOVAPD %XMM1,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4f2000 <floor> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVSD -0x50(%RBP),%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSD -0x60(%RBP),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUBSD %XMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
MOVSD %XMM1,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
MOV %RBX,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
UCOMISD 0xd79c5(%RIP),%XMM3 | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0.50 | 7 | 1 |
JBE 4424bf <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x19f> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
XORPD %XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOVSD %XMM0,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
UCOMISD %XMM0,%XMM3 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0.50 | 7 | 1 |
JB 4424d9 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x1b9> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOVAPD %XMM3,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4f2000 <floor> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVSD -0x50(%RBP),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUBSD %XMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
MOVSD %XMM1,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
MOV %R14,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x30(%R14),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
TEST %EAX,%EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 442b14 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x7f4> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV -0x98(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x2f8(%RAX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,-0xe8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x310(%RAX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVSXD 0x40(%RAX),%R14 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
LEA (,%R14,8),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,-0xd8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CMP $0x1,%R14 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R14,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADC $0,%R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
DECQ -0xb8(%RBP) | 2 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SHR $0x1,%RAX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RAX,-0x108(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R15,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
AND $-0x2,%RBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
XOR %R13D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
JMP 442578 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x258> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOV -0xd0(%RBP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CALL 497fd0 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE4stopEv> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x98(%RBP),%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x30(%R12),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
TEST %EAX,%EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0xc8(%RBP),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
JLE 442b95 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x875> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %R14D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
JMP 442b4c <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x82c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
ADD $0x128,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 410010 <__clang_call_terminate> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
Source file and lines | einspline_spo_ref.hpp:172-189 |
Module | exec |
nb instructions | 138 |
nb uops | 146 |
loop length | 668 |
used x86 registers | 12 |
used mmx registers | 0 |
used xmm registers | 6 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 15 |
ADD-SUB / MUL ratio | 1.00 |
micro-operation queue | 24.33 cycles |
front end | 24.33 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 9.00 | 6.00 | 5.75 | 5.75 | 8.50 | 20.00 | 20.00 | 20.00 | 4.50 | 4.50 | 7.50 | 7.50 | 8.50 | 8.50 |
cycles | 9.00 | 6.00 | 5.75 | 5.75 | 8.50 | 20.00 | 20.00 | 20.00 | 4.50 | 4.50 | 7.50 | 7.50 | 8.50 | 8.50 |
Cycles executing div or sqrt instructions | NA |
Front-end | 24.33 |
Dispatch | 20.00 |
Overall L1 | 24.33 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 0% |
all | 10% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 50% |
all | 7% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 27% |
all | 11% |
load | 11% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 10% |
all | 13% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 18% |
all | 13% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB $0x128,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RCX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %EDX,%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x358(%RDI),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDI,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CALL 497e00 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE5startEv> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVSXD %R12D,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA (%RAX,%RAX,2),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SAL $0x3,%RCX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD 0x40(%R13),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
CMP %EAX,0x124(%R13) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
LEA 0x128(%R13),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVNE %RCX,%RAX | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSD (%RAX),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSD 0x8(%RAX),%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSD 0xd8(%R14),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MULSD %XMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOVSD 0xf0(%R14),%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MULSD %XMM3,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
ADDSD %XMM1,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
MOVSD 0x10(%RAX),%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSD 0x108(%R14),%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MULSD %XMM4,%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
ADDSD %XMM2,%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
MOVSD 0xe0(%R14),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MULSD %XMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOVSD 0xf8(%R14),%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MULSD %XMM3,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
ADDSD %XMM1,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
MOVSD 0x110(%R14),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MULSD %XMM4,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
ADDSD %XMM2,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
MULSD 0xe8(%R14),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MULSD 0x100(%R14),%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MULSD 0x118(%R14),%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
ADDSD %XMM0,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
UCOMISD 0xd7a69(%RIP),%XMM5 | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0.50 | 7 | 1 |
MOVSD %XMM1,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
JBE 442420 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x100> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
XORPD %XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOVSD %XMM0,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
UCOMISD %XMM0,%XMM5 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0.50 | 7 | 1 |
JB 442458 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x138> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOVAPD %XMM5,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOVSD %XMM3,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
MOVSD %XMM4,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
MOVSD %XMM5,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
CALL 4f2000 <floor> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVSD -0x38(%RBP),%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSD -0x60(%RBP),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSD -0x50(%RBP),%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSD -0x30(%RBP),%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUBSD %XMM0,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
MOVSD %XMM2,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
ADDSD %XMM4,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
UCOMISD 0xd7a0c(%RIP),%XMM1 | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0.50 | 7 | 1 |
MOVSD %XMM3,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
JBE 44247d <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x15d> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
XORPD %XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOVSD %XMM0,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
UCOMISD %XMM0,%XMM1 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0.50 | 7 | 1 |
JB 44249c <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x17c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOVAPD %XMM1,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4f2000 <floor> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVSD -0x50(%RBP),%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSD -0x60(%RBP),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUBSD %XMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
MOVSD %XMM1,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
MOV %RBX,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
UCOMISD 0xd79c5(%RIP),%XMM3 | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0.50 | 7 | 1 |
JBE 4424bf <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x19f> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
XORPD %XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOVSD %XMM0,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
UCOMISD %XMM0,%XMM3 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0.50 | 7 | 1 |
JB 4424d9 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x1b9> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOVAPD %XMM3,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4f2000 <floor> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVSD -0x50(%RBP),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUBSD %XMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
MOVSD %XMM1,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
MOV %R14,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x30(%R14),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
TEST %EAX,%EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 442b14 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x7f4> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV -0x98(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x2f8(%RAX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,-0xe8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x310(%RAX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVSXD 0x40(%RAX),%R14 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
LEA (,%R14,8),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,-0xd8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CMP $0x1,%R14 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R14,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADC $0,%R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
DECQ -0xb8(%RBP) | 2 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SHR $0x1,%RAX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RAX,-0x108(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R15,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
AND $-0x2,%RBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
XOR %R13D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
JMP 442578 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x258> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOV -0xd0(%RBP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CALL 497fd0 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE4stopEv> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x98(%RBP),%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x30(%R12),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
TEST %EAX,%EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0xc8(%RBP),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
JLE 442b95 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x875> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %R14D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
JMP 442b4c <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x82c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
ADD $0x128,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 410010 <__clang_call_terminate> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE– | 27.39 | 57.12 |
▼Loop 818 - MultiBsplineRef.hpp:42-71 - exec– | 0.04 | 0.07 |
▼Loop 819 - MultiBsplineRef.hpp:63-71 - exec– | 0.03 | 0.05 |
▼Loop 820 - MultiBsplineRef.hpp:64-71 - exec– | 0.02 | 0.03 |
○Loop 821 - MultiBsplineRef.hpp:68-71 - exec | 27.23 | 51.91 |
○Loop 817 - einspline_spo_ref.hpp:183-187 - exec | 0.01 | 0.01 |