Function: void qmcplusplus::DTD_BConds<double, 3u, 39>::computeDistances<qmcplusplus::TinyVector<dou ... | Module: exec | Source: ParticleBConds.h:166-219 [...] | Coverage: 13.35% |
---|
Function: void qmcplusplus::DTD_BConds<double, 3u, 39>::computeDistances<qmcplusplus::TinyVector<dou ... | Module: exec | Source: ParticleBConds.h:166-219 [...] | Coverage: 13.35% |
---|
/home/kcamus/qaas_runs/169-451-1869/intel/miniqmc/build/miniqmc/src/Particle/Lattice/ParticleBConds.h: 166 - 219 |
-------------------------------------------------------------------------------- |
166: { |
167: const T x0 = pos[0]; |
168: const T y0 = pos[1]; |
169: const T z0 = pos[2]; |
[...] |
185: #pragma omp simd aligned(temp_r, px, py, pz, dx, dy, dz: QMC_SIMD_ALIGNMENT) |
186: for (int iat = first; iat < last; ++iat) |
187: { |
188: const T flip = iat < flip_ind ? one : minusone; |
189: const T displ_0 = (px[iat] - x0) * flip; |
190: const T displ_1 = (py[iat] - y0) * flip; |
191: const T displ_2 = (pz[iat] - z0) * flip; |
192: |
193: const T ar_0 = -std::floor(displ_0 * g00 + displ_1 * g10 + displ_2 * g20); |
194: const T ar_1 = -std::floor(displ_0 * g01 + displ_1 * g11 + displ_2 * g21); |
195: const T ar_2 = -std::floor(displ_0 * g02 + displ_1 * g12 + displ_2 * g22); |
196: |
197: const T delx = displ_0 + ar_0 * r00 + ar_1 * r10 + ar_2 * r20; |
198: const T dely = displ_1 + ar_0 * r01 + ar_1 * r11 + ar_2 * r21; |
199: const T delz = displ_2 + ar_0 * r02 + ar_1 * r12 + ar_2 * r22; |
200: |
201: T rmin = delx * delx + dely * dely + delz * delz; |
202: int ic = 0; |
203: #pragma unroll(7) |
204: for (int c = 1; c < 8; ++c) |
205: { |
206: const T x = delx + cellx[c]; |
207: const T y = dely + celly[c]; |
208: const T z = delz + cellz[c]; |
209: const T r2 = x * x + y * y + z * z; |
210: ic = (r2 < rmin) ? c : ic; |
211: rmin = (r2 < rmin) ? r2 : rmin; |
212: } |
213: |
214: temp_r[iat] = std::sqrt(rmin); |
215: dx[iat] = flip * (delx + cellx[ic]); |
216: dy[iat] = flip * (dely + celly[ic]); |
217: dz[iat] = flip * (delz + cellz[ic]); |
218: } |
219: } |
/home/kcamus/qaas_runs/169-451-1869/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/VectorSoAContainer.h: 241 - 243 |
-------------------------------------------------------------------------------- |
241: T* restrict data(size_t i) { return myData + i * nGhosts; } |
242: ///return the const pointer of the i-th components |
243: const T* restrict data(size_t i) const { return myData + i * nGhosts; } |
0x457610 PUSH %RBP |
0x457611 MOV %RSP,%RBP |
0x457614 PUSH %R15 |
0x457616 PUSH %R14 |
0x457618 PUSH %R12 |
0x45761a PUSH %RBX |
0x45761b AND $-0x40,%RSP |
0x45761f SUB $0x800,%RSP |
0x457626 MOV 0x10(%RBP),%EAX |
0x457629 SUB %R9D,%EAX |
0x45762c JLE 45843d |
0x457632 MOV 0x18(%RBP),%EBX |
0x457635 VMOVSD (%RSI),%XMM0 |
0x457639 VMOVUPS %XMM0,0x40(%RSP) |
0x45763f VMOVSD 0x8(%RSI),%XMM0 |
0x457644 VMOVUPS %XMM0,0x50(%RSP) |
0x45764a VMOVSD 0x10(%RSI),%XMM0 |
0x45764f VMOVUPS %XMM0,0x60(%RSP) |
0x457655 MOV 0x8(%RDX),%RSI |
0x457659 MOV 0x18(%RDX),%R12 |
0x45765d LEA (%R12,%RSI,8),%R15 |
0x457661 SAL $0x4,%RSI |
0x457665 ADD %R12,%RSI |
0x457668 MOV 0x8(%R8),%R11 |
0x45766c MOV 0x18(%R8),%R10 |
0x457670 LEA (%R10,%R11,8),%R8 |
0x457674 SAL $0x4,%R11 |
0x457678 ADD %R10,%R11 |
0x45767b VMOVSD (%RDI),%XMM19 |
0x457681 VMOVSD 0x8(%RDI),%XMM20 |
0x457688 VMOVSD 0x10(%RDI),%XMM21 |
0x45768f VMOVSD 0x18(%RDI),%XMM22 |
0x457696 VMOVSD 0x20(%RDI),%XMM24 |
0x45769d VMOVSD 0x28(%RDI),%XMM25 |
0x4576a4 VMOVSD 0x30(%RDI),%XMM27 |
0x4576ab VMOVSD 0x38(%RDI),%XMM9 |
0x4576b0 VMOVSD 0x40(%RDI),%XMM8 |
0x4576b5 VMOVSD 0x48(%RDI),%XMM7 |
0x4576ba VMOVSD 0x50(%RDI),%XMM28 |
0x4576c1 VMOVSD 0x58(%RDI),%XMM26 |
0x4576c8 VMOVSD 0x60(%RDI),%XMM6 |
0x4576cd VMOVSD 0x68(%RDI),%XMM29 |
0x4576d4 VMOVSD 0x70(%RDI),%XMM0 |
0x4576d9 VMOVSD 0x78(%RDI),%XMM5 |
0x4576de VMOVSD 0x80(%RDI),%XMM4 |
0x4576e6 VMOVSD 0x88(%RDI),%XMM2 |
0x4576ee VMOVSD 0x98(%RDI),%XMM14 |
0x4576f6 VMOVSD 0xd8(%RDI),%XMM17 |
0x4576fd VMOVSD 0x118(%RDI),%XMM10 |
0x457705 VMOVSD 0xa0(%RDI),%XMM11 |
0x45770d VMOVSD 0xe0(%RDI),%XMM12 |
0x457715 VMOVSD 0x120(%RDI),%XMM13 |
0x45771d VMOVSD 0xa8(%RDI),%XMM1 |
0x457725 VMOVUPS %XMM1,0x70(%RSP) |
0x45772b VMOVSD 0xe8(%RDI),%XMM15 |
0x457733 VMOVSD 0x128(%RDI),%XMM16 |
0x45773a VMOVSD 0xb0(%RDI),%XMM1 |
0x457742 VMOVUPS %XMM1,0x80(%RSP) |
0x45774b VMOVSD 0xf0(%RDI),%XMM3 |
0x457753 VMOVUPS %XMM3,0xa0(%RSP) |
0x45775c MOV %EAX,%R14D |
0x45775f VMOVSD 0x130(%RDI),%XMM23 |
0x457766 VMOVSD 0xb8(%RDI),%XMM3 |
0x45776e VMOVUPS %XMM3,0x90(%RSP) |
0x457777 VMOVSD 0xf8(%RDI),%XMM3 |
0x45777f VMOVUPS %XMM3,0xb0(%RSP) |
0x457788 VMOVSD 0x138(%RDI),%XMM1 |
0x457790 VMOVUPS %XMM1,0xc0(%RSP) |
0x457799 VMOVSD 0xc0(%RDI),%XMM3 |
0x4577a1 VMOVUPS %XMM3,0xd0(%RSP) |
0x4577aa VMOVSD 0x100(%RDI),%XMM31 |
0x4577b1 VMOVSD 0x140(%RDI),%XMM30 |
0x4577b8 VMOVSD 0xc8(%RDI),%XMM3 |
0x4577c0 VMOVSD 0x108(%RDI),%XMM1 |
0x4577c8 VMOVUPS %XMM1,0xe0(%RSP) |
0x4577d1 VMOVSD 0x148(%RDI),%XMM1 |
0x4577d9 VMOVUPD %XMM1,0xf0(%RSP) |
0x4577e2 VPBROADCASTD %EBX,%YMM18 |
0x4577e8 VMOVDQU64 %YMM18,0x2e0(%RSP) |
0x4577f0 AND $-0x8,%R14D |
0x4577f4 VMOVUPD %XMM23,0x2d0(%RSP) |
0x4577fc VMOVUPS %XMM26,0x2c0(%RSP) |
0x457804 VMOVUPS %XMM0,0x2b0(%RSP) |
0x45780d VMOVUPS %XMM28,0x2a0(%RSP) |
0x457815 VMOVUPD %XMM2,0x290(%RSP) |
0x45781e VMOVUPD %XMM29,0x280(%RSP) |
0x457826 VMOVUPD %XMM4,0x270(%RSP) |
0x45782f VMOVUPD %XMM5,0x260(%RSP) |
0x457838 VMOVUPS %XMM6,0x250(%RSP) |
0x457841 VMOVUPS %XMM7,0x240(%RSP) |
0x45784a VMOVUPS %XMM8,0x230(%RSP) |
0x457853 VMOVUPS %XMM27,0x220(%RSP) |
0x45785b JE 457f51 |
0x457861 MOV %EAX,0x3c(%RSP) |
0x457865 LEA -0x1(%R14),%EBX |
0x457869 VBROADCASTSD 0x40(%RSP),%ZMM18 |
0x457871 VMOVUPS %ZMM18,0x780(%RSP) |
0x457879 VBROADCASTSD 0x50(%RSP),%ZMM18 |
0x457881 VMOVUPS %ZMM18,0x740(%RSP) |
0x457889 VBROADCASTSD 0x60(%RSP),%ZMM18 |
0x457891 VMOVUPS %ZMM18,0x700(%RSP) |
0x457899 VMOVUPD %XMM19,0x100(%RSP) |
0x4578a1 VBROADCASTSD %XMM19,%ZMM18 |
0x4578a7 VMOVUPD %ZMM18,0x6c0(%RSP) |
0x4578af VMOVUPD %XMM20,0x110(%RSP) |
0x4578b7 VBROADCASTSD %XMM20,%ZMM18 |
0x4578bd VMOVUPD %ZMM18,0x680(%RSP) |
0x4578c5 VMOVUPD %XMM21,0x120(%RSP) |
0x4578cd VBROADCASTSD %XMM21,%ZMM18 |
0x4578d3 VMOVUPD %ZMM18,0x640(%RSP) |
0x4578db VMOVUPD %XMM22,0x130(%RSP) |
0x4578e3 VBROADCASTSD %XMM22,%ZMM18 |
0x4578e9 VMOVUPD %ZMM18,0x600(%RSP) |
0x4578f1 VMOVUPD %XMM24,0x140(%RSP) |
0x4578f9 VBROADCASTSD %XMM24,%ZMM18 |
0x4578ff VMOVUPD %ZMM18,0x5c0(%RSP) |
0x457907 VMOVUPD %XMM25,0x150(%RSP) |
0x45790f VBROADCASTSD %XMM25,%ZMM18 |
0x457915 VMOVUPD %ZMM18,0x580(%RSP) |
0x45791d VBROADCASTSD %XMM27,%ZMM18 |
0x457923 VMOVUPS %ZMM18,0x540(%RSP) |
0x45792b VMOVUPD %XMM9,0x160(%RSP) |
0x457934 VBROADCASTSD %XMM9,%ZMM9 |
0x45793a VMOVUPD %ZMM9,0x500(%RSP) |
0x457942 VBROADCASTSD %XMM8,%ZMM8 |
0x457948 VMOVUPS %ZMM8,0x4c0(%RSP) |
0x457950 VBROADCASTSD %XMM7,%ZMM7 |
0x457956 VMOVUPS %ZMM7,0x480(%RSP) |
0x45795e VMOVAPD %XMM3,%XMM27 |
0x457964 VBROADCASTSD %XMM28,%ZMM1 |
0x45796a VMOVUPS %ZMM1,0x440(%RSP) |
0x457972 VBROADCASTSD %XMM26,%ZMM1 |
0x457978 VMOVUPS %ZMM1,0x400(%RSP) |
0x457980 VBROADCASTSD %XMM6,%ZMM1 |
0x457986 VMOVUPS %ZMM1,0x3c0(%RSP) |
0x45798e VBROADCASTSD %XMM29,%ZMM1 |
0x457994 VMOVUPD %ZMM1,0x380(%RSP) |
0x45799c VBROADCASTSD %XMM0,%ZMM0 |
0x4579a2 VMOVUPS %ZMM0,0x340(%RSP) |
0x4579aa VBROADCASTSD %XMM5,%ZMM0 |
0x4579b0 VMOVUPD %ZMM0,0x300(%RSP) |
0x4579b8 VBROADCASTSD %XMM4,%ZMM6 |
0x4579be VBROADCASTSD %XMM2,%ZMM7 |
0x4579c4 VMOVUPD %XMM14,0x170(%RSP) |
0x4579cd VBROADCASTSD %XMM14,%ZMM8 |
0x4579d3 VMOVUPD %XMM17,0x180(%RSP) |
0x4579db VBROADCASTSD %XMM17,%ZMM9 |
0x4579e1 VMOVUPD %XMM10,0x190(%RSP) |
0x4579ea VBROADCASTSD %XMM10,%ZMM10 |
0x4579f0 VMOVUPD %XMM11,0x1a0(%RSP) |
0x4579f9 VBROADCASTSD %XMM11,%ZMM11 |
0x4579ff VMOVUPD %XMM12,0x1b0(%RSP) |
0x457a08 VBROADCASTSD %XMM12,%ZMM12 |
0x457a0e VMOVUPD %XMM13,0x1c0(%RSP) |
0x457a17 VBROADCASTSD %XMM13,%ZMM13 |
0x457a1d VMOVUPD 0x70(%RSP),%XMM14 |
0x457a23 VBROADCASTSD %XMM14,%ZMM14 |
0x457a29 VMOVUPD %XMM15,0x1d0(%RSP) |
0x457a32 VBROADCASTSD %XMM15,%ZMM15 |
0x457a38 VMOVUPD %XMM16,0x1e0(%RSP) |
0x457a40 VBROADCASTSD %XMM16,%ZMM16 |
0x457a46 VMOVUPD 0x80(%RSP),%XMM17 |
0x457a4e VBROADCASTSD %XMM17,%ZMM17 |
0x457a54 VMOVUPD 0xa0(%RSP),%XMM18 |
0x457a5c VBROADCASTSD %XMM18,%ZMM18 |
0x457a62 XOR %EDX,%EDX |
0x457a64 VBROADCASTSD %XMM23,%ZMM19 |
0x457a6a VMOVUPD 0x90(%RSP),%XMM20 |
0x457a72 VBROADCASTSD %XMM20,%ZMM20 |
0x457a78 VMOVUPD 0xb0(%RSP),%XMM21 |
0x457a80 VBROADCASTSD %XMM21,%ZMM21 |
0x457a86 VMOVUPD 0xc0(%RSP),%XMM22 |
0x457a8e VBROADCASTSD %XMM22,%ZMM22 |
0x457a94 VMOVUPD 0xd0(%RSP),%XMM23 |
0x457a9c VBROADCASTSD %XMM23,%ZMM23 |
0x457aa2 VMOVUPD %XMM31,0x1f0(%RSP) |
0x457aaa VBROADCASTSD %XMM31,%ZMM24 |
0x457ab0 VMOVUPD %XMM30,0x200(%RSP) |
0x457ab8 VBROADCASTSD %XMM30,%ZMM25 |
0x457abe VMOVUPD %XMM3,0x210(%RSP) |
0x457ac7 VMOVAPD %XMM3,%XMM26 |
0x457acd VBROADCASTSD %XMM3,%ZMM26 |
0x457ad3 VMOVUPD 0xe0(%RSP),%XMM27 |
0x457adb VBROADCASTSD %XMM27,%ZMM27 |
0x457ae1 VMOVUPD 0xf0(%RSP),%XMM28 |
0x457ae9 VBROADCASTSD %XMM28,%ZMM28 |
0x457aef VMOVDQU 0x2e0(%RSP),%YMM5 |
0x457af8 NOPL (%RAX,%RAX,1) |
(971) 0x457b00 LEA (%R9,%RDX,1),%EAX |
(971) 0x457b04 VPBROADCASTD %EAX,%YMM0 |
(971) 0x457b0a VPADDD 0x3e32e(%RIP),%YMM0,%YMM0 |
(971) 0x457b12 VPCMPGTD %YMM0,%YMM5,%K1 |
(971) 0x457b18 CLTQ |
(971) 0x457b1a VMOVUPD (%R12,%RAX,8),%ZMM0 |
(971) 0x457b21 VBROADCASTSD 0x36505(%RIP),%ZMM1 |
(971) 0x457b2b VBROADCASTSD 0x364f3(%RIP),%ZMM2 |
(971) 0x457b35 VBLENDMPD %ZMM2,%ZMM1,%ZMM29{%K1} |
(971) 0x457b3b VSUBPD 0x780(%RSP),%ZMM0,%ZMM0 |
(971) 0x457b43 VMOVUPD (%R15,%RAX,8),%ZMM30 |
(971) 0x457b4a VSUBPD 0x740(%RSP),%ZMM30,%ZMM30 |
(971) 0x457b52 VMULPD %ZMM29,%ZMM0,%ZMM31 |
(971) 0x457b58 VMULPD %ZMM29,%ZMM30,%ZMM30 |
(971) 0x457b5e VMOVUPD (%RSI,%RAX,8),%ZMM0 |
(971) 0x457b65 VSUBPD 0x700(%RSP),%ZMM0,%ZMM0 |
(971) 0x457b6d VMULPD 0x6c0(%RSP),%ZMM31,%ZMM1 |
(971) 0x457b75 VMULPD %ZMM29,%ZMM0,%ZMM2 |
(971) 0x457b7b VFMADD231PD 0x680(%RSP),%ZMM30,%ZMM1 |
(971) 0x457b83 VFMADD231PD 0x640(%RSP),%ZMM2,%ZMM1 |
(971) 0x457b8b VMULPD 0x600(%RSP),%ZMM31,%ZMM3 |
(971) 0x457b93 VFMADD231PD 0x5c0(%RSP),%ZMM30,%ZMM3 |
(971) 0x457b9b VRNDSCALEPD $0x9,%ZMM1,%ZMM0 |
(971) 0x457ba2 VFMADD231PD 0x580(%RSP),%ZMM2,%ZMM3 |
(971) 0x457baa VMULPD 0x540(%RSP),%ZMM31,%ZMM1 |
(971) 0x457bb2 VFMADD231PD 0x500(%RSP),%ZMM30,%ZMM1 |
(971) 0x457bba VFMADD231PD 0x4c0(%RSP),%ZMM2,%ZMM1 |
(971) 0x457bc2 VRNDSCALEPD $0x9,%ZMM3,%ZMM3 |
(971) 0x457bc9 VRNDSCALEPD $0x9,%ZMM1,%ZMM1 |
(971) 0x457bd0 VFMSUB231PD 0x480(%RSP),%ZMM0,%ZMM31 |
(971) 0x457bd8 VFMADD231PD 0x440(%RSP),%ZMM3,%ZMM31 |
(971) 0x457be0 VFMSUB231PD 0x3c0(%RSP),%ZMM0,%ZMM30 |
(971) 0x457be8 VFNMSUB231PD 0x400(%RSP),%ZMM1,%ZMM31 |
(971) 0x457bf0 VFMADD231PD 0x380(%RSP),%ZMM3,%ZMM30 |
(971) 0x457bf8 VFNMSUB231PD 0x340(%RSP),%ZMM1,%ZMM30 |
(971) 0x457c00 VFMSUB132PD 0x300(%RSP),%ZMM2,%ZMM0 |
(971) 0x457c08 VFMADD231PD %ZMM3,%ZMM6,%ZMM0 |
(971) 0x457c0e VFNMSUB231PD %ZMM1,%ZMM7,%ZMM0 |
(971) 0x457c14 VMULPD %ZMM31,%ZMM31,%ZMM1 |
(971) 0x457c1a VFMADD231PD %ZMM30,%ZMM30,%ZMM1 |
(971) 0x457c20 VADDPD %ZMM31,%ZMM8,%ZMM2 |
(971) 0x457c26 VADDPD %ZMM30,%ZMM9,%ZMM3 |
(971) 0x457c2c VADDPD %ZMM0,%ZMM10,%ZMM4 |
(971) 0x457c32 VMULPD %ZMM2,%ZMM2,%ZMM2 |
(971) 0x457c38 VFMADD231PD %ZMM0,%ZMM0,%ZMM1 |
(971) 0x457c3e VFMADD231PD %ZMM3,%ZMM3,%ZMM2 |
(971) 0x457c44 VFMADD231PD %ZMM4,%ZMM4,%ZMM2 |
(971) 0x457c4a VCMPPD $0x1,%ZMM1,%ZMM2,%K0 |
(971) 0x457c51 VADDPD %ZMM31,%ZMM11,%ZMM3 |
(971) 0x457c57 VADDPD %ZMM30,%ZMM12,%ZMM4 |
(971) 0x457c5d VMINPD %ZMM1,%ZMM2,%ZMM1 |
(971) 0x457c63 VADDPD %ZMM0,%ZMM13,%ZMM2 |
(971) 0x457c69 VMULPD %ZMM3,%ZMM3,%ZMM3 |
(971) 0x457c6f VFMADD231PD %ZMM4,%ZMM4,%ZMM3 |
(971) 0x457c75 VFMADD231PD %ZMM2,%ZMM2,%ZMM3 |
(971) 0x457c7b VADDPD %ZMM31,%ZMM14,%ZMM2 |
(971) 0x457c81 VCMPPD $0x1,%ZMM1,%ZMM3,%K1 |
(971) 0x457c88 VADDPD %ZMM30,%ZMM15,%ZMM4 |
(971) 0x457c8e VMULPD %ZMM2,%ZMM2,%ZMM2 |
(971) 0x457c94 VFMADD231PD %ZMM4,%ZMM4,%ZMM2 |
(971) 0x457c9a VADDPD %ZMM0,%ZMM16,%ZMM4 |
(971) 0x457ca0 VFMADD231PD %ZMM4,%ZMM4,%ZMM2 |
(971) 0x457ca6 VMINPD %ZMM1,%ZMM3,%ZMM1 |
(971) 0x457cac VCMPPD $0x1,%ZMM1,%ZMM2,%K2 |
(971) 0x457cb3 VMINPD %ZMM1,%ZMM2,%ZMM1 |
(971) 0x457cb9 VADDPD %ZMM31,%ZMM17,%ZMM2 |
(971) 0x457cbf VADDPD %ZMM30,%ZMM18,%ZMM3 |
(971) 0x457cc5 VMULPD %ZMM2,%ZMM2,%ZMM2 |
(971) 0x457ccb VADDPD %ZMM0,%ZMM19,%ZMM4 |
(971) 0x457cd1 VFMADD231PD %ZMM3,%ZMM3,%ZMM2 |
(971) 0x457cd7 VFMADD231PD %ZMM4,%ZMM4,%ZMM2 |
(971) 0x457cdd VCMPPD $0x1,%ZMM1,%ZMM2,%K3 |
(971) 0x457ce4 VADDPD %ZMM31,%ZMM20,%ZMM3 |
(971) 0x457cea VADDPD %ZMM30,%ZMM21,%ZMM4 |
(971) 0x457cf0 VMINPD %ZMM1,%ZMM2,%ZMM1 |
(971) 0x457cf6 VADDPD %ZMM0,%ZMM22,%ZMM2 |
(971) 0x457cfc VMULPD %ZMM3,%ZMM3,%ZMM3 |
(971) 0x457d02 VFMADD231PD %ZMM4,%ZMM4,%ZMM3 |
(971) 0x457d08 VFMADD231PD %ZMM2,%ZMM2,%ZMM3 |
(971) 0x457d0e VADDPD %ZMM31,%ZMM23,%ZMM2 |
(971) 0x457d14 VCMPPD $0x1,%ZMM1,%ZMM3,%K4 |
(971) 0x457d1b VADDPD %ZMM30,%ZMM24,%ZMM4 |
(971) 0x457d21 VMULPD %ZMM2,%ZMM2,%ZMM2 |
(971) 0x457d27 VFMADD231PD %ZMM4,%ZMM4,%ZMM2 |
(971) 0x457d2d VADDPD %ZMM0,%ZMM25,%ZMM4 |
(971) 0x457d33 VFMADD231PD %ZMM4,%ZMM4,%ZMM2 |
(971) 0x457d39 VMINPD %ZMM1,%ZMM3,%ZMM1 |
(971) 0x457d3f VADDPD %ZMM31,%ZMM26,%ZMM3 |
(971) 0x457d45 VADDPD %ZMM30,%ZMM27,%ZMM4 |
(971) 0x457d4b VMULPD %ZMM3,%ZMM3,%ZMM3 |
(971) 0x457d51 VFMADD231PD %ZMM4,%ZMM4,%ZMM3 |
(971) 0x457d57 VCMPPD $0x1,%ZMM1,%ZMM2,%K5 |
(971) 0x457d5e VMINPD %ZMM1,%ZMM2,%ZMM1 |
(971) 0x457d64 VADDPD %ZMM0,%ZMM28,%ZMM2 |
(971) 0x457d6a VFMADD231PD %ZMM2,%ZMM2,%ZMM3 |
(971) 0x457d70 VMINPD %ZMM1,%ZMM3,%ZMM2 |
(971) 0x457d76 VSQRTPD %ZMM2,%ZMM2 |
(971) 0x457d7c VCMPPD $0x1,%ZMM1,%ZMM3,%K6 |
(971) 0x457d83 VPMOVM2Q %K0,%ZMM1 |
(971) 0x457d89 VPSRLQ $0x3f,%ZMM1,%ZMM1 |
(971) 0x457d90 VPBROADCASTQ 0x3dec6(%RIP),%ZMM1{%K1} |
(971) 0x457d9a VPBROADCASTQ 0x3dec4(%RIP),%ZMM1{%K2} |
(971) 0x457da4 VPBROADCASTQ 0x3dec2(%RIP),%ZMM1{%K3} |
(971) 0x457dae VPBROADCASTQ 0x39f48(%RIP),%ZMM1{%K4} |
(971) 0x457db8 VPBROADCASTQ 0x3deb6(%RIP),%ZMM1{%K5} |
(971) 0x457dc2 VPBROADCASTQ 0x3deb4(%RIP),%ZMM1{%K6} |
(971) 0x457dcc KXNORW %K0,%K0,%K1 |
(971) 0x457dd0 VMOVUPD %ZMM2,(%RCX,%RAX,8) |
(971) 0x457dd7 VXORPD %XMM2,%XMM2,%XMM2 |
(971) 0x457ddb VGATHERQPD 0x90(%RDI,%ZMM1,8),%ZMM2{%K1} |
(971) 0x457de3 VADDPD %ZMM31,%ZMM2,%ZMM2 |
(971) 0x457de9 VMULPD %ZMM29,%ZMM2,%ZMM2 |
(971) 0x457def KXNORW %K0,%K0,%K1 |
(971) 0x457df3 VMOVUPD %ZMM2,(%R10,%RAX,8) |
(971) 0x457dfa VXORPD %XMM2,%XMM2,%XMM2 |
(971) 0x457dfe VGATHERQPD 0xd0(%RDI,%ZMM1,8),%ZMM2{%K1} |
(971) 0x457e06 VADDPD %ZMM30,%ZMM2,%ZMM2 |
(971) 0x457e0c VMULPD %ZMM29,%ZMM2,%ZMM2 |
(971) 0x457e12 KXNORW %K0,%K0,%K1 |
(971) 0x457e16 VMOVUPD %ZMM2,(%R8,%RAX,8) |
(971) 0x457e1d VXORPD %XMM2,%XMM2,%XMM2 |
(971) 0x457e21 VGATHERQPD 0x110(%RDI,%ZMM1,8),%ZMM2{%K1} |
(971) 0x457e29 VADDPD %ZMM0,%ZMM2,%ZMM0 |
(971) 0x457e2f VMULPD %ZMM29,%ZMM0,%ZMM0 |
(971) 0x457e35 VMOVUPD %ZMM0,(%R11,%RAX,8) |
(971) 0x457e3c ADD $0x8,%EDX |
(971) 0x457e3f CMP %EBX,%EDX |
(971) 0x457e41 JBE 457b00 |
0x457e47 MOV 0x3c(%RSP),%EAX |
0x457e4b CMP %R14D,%EAX |
0x457e4e VMOVUPD 0xe0(%RSP),%XMM8 |
0x457e57 VMOVUPD 0x210(%RSP),%XMM9 |
0x457e60 VMOVUPD 0x200(%RSP),%XMM30 |
0x457e68 VMOVUPD 0x1f0(%RSP),%XMM31 |
0x457e70 VMOVUPD 0xd0(%RSP),%XMM2 |
0x457e79 VMOVUPD 0xc0(%RSP),%XMM3 |
0x457e82 VMOVUPD 0xb0(%RSP),%XMM4 |
0x457e8b VMOVUPD 0xa0(%RSP),%XMM7 |
0x457e94 VMOVUPD 0x90(%RSP),%XMM6 |
0x457e9d VMOVUPD 0x80(%RSP),%XMM29 |
0x457ea5 VMOVUPD 0x1e0(%RSP),%XMM16 |
0x457ead VMOVUPD 0x1d0(%RSP),%XMM15 |
0x457eb6 VMOVUPD 0x70(%RSP),%XMM27 |
0x457ebe VMOVUPD 0x1c0(%RSP),%XMM13 |
0x457ec7 VMOVUPD 0x1b0(%RSP),%XMM12 |
0x457ed0 VMOVUPD 0x1a0(%RSP),%XMM11 |
0x457ed9 VMOVUPD 0x190(%RSP),%XMM10 |
0x457ee2 VMOVUPD 0x180(%RSP),%XMM17 |
0x457eea VMOVUPD 0x170(%RSP),%XMM14 |
0x457ef3 VMOVUPD 0x160(%RSP),%XMM18 |
0x457efb VMOVUPD 0x60(%RSP),%XMM28 |
0x457f03 VMOVUPD 0x50(%RSP),%XMM26 |
0x457f0b VMOVUPD 0x150(%RSP),%XMM25 |
0x457f13 VMOVUPD 0x140(%RSP),%XMM24 |
0x457f1b VMOVUPD 0x40(%RSP),%XMM23 |
0x457f23 VMOVUPD 0x130(%RSP),%XMM22 |
0x457f2b VMOVUPD 0x120(%RSP),%XMM21 |
0x457f33 VMOVUPD 0x110(%RSP),%XMM20 |
0x457f3b VMOVUPD 0x100(%RSP),%XMM19 |
0x457f43 JE 45843d |
0x457f49 VPBROADCASTD %EAX,%YMM0 |
0x457f4f JMP 457fcb |
0x457f51 VMOVAPD %XMM9,%XMM18 |
0x457f57 VPBROADCASTD %EAX,%YMM0 |
0x457f5d XOR %R14D,%R14D |
0x457f60 VMOVUPD 0x60(%RSP),%XMM28 |
0x457f68 VMOVUPD 0x50(%RSP),%XMM26 |
0x457f70 VMOVUPD 0x40(%RSP),%XMM23 |
0x457f78 VMOVDQU 0x2e0(%RSP),%YMM5 |
0x457f81 VMOVUPD 0xe0(%RSP),%XMM8 |
0x457f8a VMOVAPD %XMM3,%XMM9 |
0x457f8e VMOVUPD 0xd0(%RSP),%XMM2 |
0x457f97 VMOVUPD 0xc0(%RSP),%XMM3 |
0x457fa0 VMOVUPD 0xb0(%RSP),%XMM4 |
0x457fa9 VMOVUPD 0x90(%RSP),%XMM6 |
0x457fb2 VMOVUPD 0xa0(%RSP),%XMM7 |
0x457fbb VMOVUPD 0x70(%RSP),%XMM27 |
0x457fc3 VMOVUPD 0x80(%RSP),%XMM29 |
0x457fcb VPBROADCASTD %R14D,%YMM1 |
0x457fd1 VPOR 0x3de67(%RIP),%YMM1,%YMM1 |
0x457fd9 VPCMPLTUD %YMM0,%YMM1,%K1 |
0x457fe0 KORTESTB %K1,%K1 |
0x457fe4 JE 45843d |
0x457fea ADD %R9D,%R14D |
0x457fed VPBROADCASTD %R14D,%YMM0 |
0x457ff3 VPADDD 0x3de45(%RIP),%YMM0,%YMM0 |
0x457ffb VPCMPGTD %YMM0,%YMM5,%K2 |
0x458001 MOVSXD %R14D,%RBX |
0x458004 VBROADCASTSD %XMM23,%ZMM0 |
0x45800a VMOVUPD (%R12,%RBX,8),%ZMM1{%K1}{z} |
0x458011 VSUBPD %ZMM0,%ZMM1,%ZMM1 |
0x458017 VBROADCASTSD %XMM26,%ZMM0 |
0x45801d VMOVAPD %XMM2,%XMM23 |
0x458023 VMOVUPD (%R15,%RBX,8),%ZMM2{%K1}{z} |
0x45802a VSUBPD %ZMM0,%ZMM2,%ZMM2 |
0x458030 VMOVUPD (%RSI,%RBX,8),%ZMM0{%K1}{z} |
0x458037 VMOVAPD %XMM3,%XMM26 |
0x45803d VBROADCASTSD %XMM28,%ZMM3 |
0x458043 VSUBPD %ZMM3,%ZMM0,%ZMM3 |
0x458049 VBROADCASTSD 0x35fdd(%RIP),%ZMM0 |
0x458053 VBROADCASTSD 0x35fcb(%RIP),%ZMM0{%K2} |
0x45805d VMOVAPD %XMM4,%XMM28 |
0x458063 VMULPD %ZMM0,%ZMM1,%ZMM4 |
0x458069 VMULPD %ZMM0,%ZMM2,%ZMM5 |
0x45806f VBROADCASTSD %XMM19,%ZMM1 |
0x458075 VMULPD %ZMM4,%ZMM1,%ZMM1 |
0x45807b VBROADCASTSD %XMM20,%ZMM2 |
0x458081 VFMADD213PD %ZMM1,%ZMM5,%ZMM2 |
0x458087 VMOVAPD %XMM6,%XMM19 |
0x45808d VMULPD %ZMM0,%ZMM3,%ZMM6 |
0x458093 VBROADCASTSD %XMM21,%ZMM1 |
0x458099 VFMADD213PD %ZMM2,%ZMM6,%ZMM1 |
0x45809f VBROADCASTSD %XMM22,%ZMM2 |
0x4580a5 VMULPD %ZMM4,%ZMM2,%ZMM2 |
0x4580ab VBROADCASTSD %XMM24,%ZMM3 |
0x4580b1 VFMADD213PD %ZMM2,%ZMM5,%ZMM3 |
0x4580b7 VMOVAPD %XMM7,%XMM20 |
0x4580bd VBROADCASTSD %XMM25,%ZMM7 |
0x4580c3 VFMADD213PD %ZMM3,%ZMM6,%ZMM7 |
0x4580c9 VBROADCASTSD 0x220(%RSP),%ZMM2 |
0x4580d1 VMULPD %ZMM4,%ZMM2,%ZMM2 |
0x4580d7 VBROADCASTSD %XMM18,%ZMM3 |
0x4580dd VFMADD213PD %ZMM2,%ZMM5,%ZMM3 |
0x4580e3 VMOVAPD %XMM8,%XMM21 |
0x4580e9 VBROADCASTSD 0x230(%RSP),%ZMM8 |
0x4580f1 VFMADD213PD %ZMM3,%ZMM6,%ZMM8 |
0x4580f7 VMOVAPD %XMM9,%XMM22 |
0x4580fd VRNDSCALEPD $0x9,%ZMM1,%ZMM9 |
0x458104 VBROADCASTSD 0x240(%RSP),%ZMM1 |
0x45810c VFMSUB213PD %ZMM4,%ZMM9,%ZMM1 |
0x458112 VBROADCASTSD 0x250(%RSP),%ZMM2 |
0x45811a VFMSUB213PD %ZMM5,%ZMM9,%ZMM2 |
0x458120 VRNDSCALEPD $0x9,%ZMM7,%ZMM4 |
0x458127 VBROADCASTSD 0x260(%RSP),%ZMM3 |
0x45812f VFMSUB213PD %ZMM6,%ZMM9,%ZMM3 |
0x458135 VBROADCASTSD 0x2a0(%RSP),%ZMM5 |
0x45813d VFMADD231PD %ZMM5,%ZMM4,%ZMM1 |
0x458143 VBROADCASTSD 0x280(%RSP),%ZMM5 |
0x45814b VFMADD231PD %ZMM5,%ZMM4,%ZMM2 |
0x458151 VBROADCASTSD 0x270(%RSP),%ZMM5 |
0x458159 VFMADD231PD %ZMM5,%ZMM4,%ZMM3 |
0x45815f VRNDSCALEPD $0x9,%ZMM8,%ZMM4 |
0x458166 VBROADCASTSD 0x2c0(%RSP),%ZMM5 |
0x45816e VFNMSUB231PD %ZMM5,%ZMM4,%ZMM1 |
0x458174 VBROADCASTSD 0x2b0(%RSP),%ZMM5 |
0x45817c VFNMSUB231PD %ZMM5,%ZMM4,%ZMM2 |
0x458182 VBROADCASTSD 0x290(%RSP),%ZMM5 |
0x45818a VFNMSUB231PD %ZMM5,%ZMM4,%ZMM3 |
0x458190 VBROADCASTSD %XMM14,%ZMM4 |
0x458196 VADDPD %ZMM1,%ZMM4,%ZMM4 |
0x45819c VBROADCASTSD %XMM17,%ZMM5 |
0x4581a2 VADDPD %ZMM2,%ZMM5,%ZMM5 |
0x4581a8 VMULPD %ZMM4,%ZMM4,%ZMM4 |
0x4581ae VFMADD231PD %ZMM5,%ZMM5,%ZMM4 |
0x4581b4 VBROADCASTSD %XMM10,%ZMM5 |
0x4581ba VADDPD %ZMM3,%ZMM5,%ZMM5 |
0x4581c0 VFMADD231PD %ZMM5,%ZMM5,%ZMM4 |
0x4581c6 VMULPD %ZMM1,%ZMM1,%ZMM5 |
0x4581cc VFMADD231PD %ZMM2,%ZMM2,%ZMM5 |
0x4581d2 VFMADD231PD %ZMM3,%ZMM3,%ZMM5 |
0x4581d8 VCMPPD $0x1,%ZMM5,%ZMM4,%K0 |
0x4581df VMINPD %ZMM5,%ZMM4,%ZMM4 |
0x4581e5 VBROADCASTSD %XMM11,%ZMM5 |
0x4581eb VADDPD %ZMM1,%ZMM5,%ZMM5 |
0x4581f1 VBROADCASTSD %XMM12,%ZMM6 |
0x4581f7 VADDPD %ZMM2,%ZMM6,%ZMM6 |
0x4581fd VMULPD %ZMM5,%ZMM5,%ZMM5 |
0x458203 VFMADD231PD %ZMM6,%ZMM6,%ZMM5 |
0x458209 VBROADCASTSD %XMM13,%ZMM6 |
0x45820f VADDPD %ZMM3,%ZMM6,%ZMM6 |
0x458215 VFMADD231PD %ZMM6,%ZMM6,%ZMM5 |
0x45821b VCMPPD $0x1,%ZMM4,%ZMM5,%K2 |
0x458222 VMINPD %ZMM4,%ZMM5,%ZMM4 |
0x458228 VBROADCASTSD %XMM27,%ZMM5 |
0x45822e VADDPD %ZMM1,%ZMM5,%ZMM5 |
0x458234 VBROADCASTSD %XMM15,%ZMM6 |
0x45823a VADDPD %ZMM2,%ZMM6,%ZMM6 |
0x458240 VMULPD %ZMM5,%ZMM5,%ZMM5 |
0x458246 VFMADD231PD %ZMM6,%ZMM6,%ZMM5 |
0x45824c VBROADCASTSD %XMM16,%ZMM6 |
0x458252 VADDPD %ZMM3,%ZMM6,%ZMM6 |
0x458258 VFMADD231PD %ZMM6,%ZMM6,%ZMM5 |
0x45825e VCMPPD $0x1,%ZMM4,%ZMM5,%K3 |
0x458265 VMINPD %ZMM4,%ZMM5,%ZMM4 |
0x45826b VBROADCASTSD %XMM29,%ZMM5 |
0x458271 VADDPD %ZMM1,%ZMM5,%ZMM5 |
0x458277 VBROADCASTSD %XMM20,%ZMM6 |
0x45827d VADDPD %ZMM2,%ZMM6,%ZMM6 |
0x458283 VMULPD %ZMM5,%ZMM5,%ZMM5 |
0x458289 VFMADD231PD %ZMM6,%ZMM6,%ZMM5 |
0x45828f VBROADCASTSD 0x2d0(%RSP),%ZMM6 |
0x458297 VADDPD %ZMM3,%ZMM6,%ZMM6 |
0x45829d VFMADD231PD %ZMM6,%ZMM6,%ZMM5 |
0x4582a3 VCMPPD $0x1,%ZMM4,%ZMM5,%K4 |
0x4582aa VMINPD %ZMM4,%ZMM5,%ZMM4 |
0x4582b0 VBROADCASTSD %XMM19,%ZMM5 |
0x4582b6 VADDPD %ZMM1,%ZMM5,%ZMM5 |
0x4582bc VBROADCASTSD %XMM28,%ZMM6 |
0x4582c2 VADDPD %ZMM2,%ZMM6,%ZMM6 |
0x4582c8 VMULPD %ZMM5,%ZMM5,%ZMM5 |
0x4582ce VFMADD231PD %ZMM6,%ZMM6,%ZMM5 |
0x4582d4 VBROADCASTSD %XMM26,%ZMM6 |
0x4582da VADDPD %ZMM3,%ZMM6,%ZMM6 |
0x4582e0 VFMADD231PD %ZMM6,%ZMM6,%ZMM5 |
0x4582e6 VCMPPD $0x1,%ZMM4,%ZMM5,%K5 |
0x4582ed VMINPD %ZMM4,%ZMM5,%ZMM4 |
0x4582f3 VBROADCASTSD %XMM23,%ZMM5 |
0x4582f9 VADDPD %ZMM1,%ZMM5,%ZMM5 |
0x4582ff VBROADCASTSD %XMM31,%ZMM6 |
0x458305 VADDPD %ZMM2,%ZMM6,%ZMM6 |
0x45830b VMULPD %ZMM5,%ZMM5,%ZMM5 |
0x458311 VFMADD231PD %ZMM6,%ZMM6,%ZMM5 |
0x458317 VBROADCASTSD %XMM30,%ZMM6 |
0x45831d VADDPD %ZMM3,%ZMM6,%ZMM6 |
0x458323 VFMADD231PD %ZMM6,%ZMM6,%ZMM5 |
0x458329 VBROADCASTSD %XMM22,%ZMM6 |
0x45832f VADDPD %ZMM1,%ZMM6,%ZMM6 |
0x458335 VBROADCASTSD %XMM21,%ZMM7 |
0x45833b VADDPD %ZMM2,%ZMM7,%ZMM7 |
0x458341 VMULPD %ZMM6,%ZMM6,%ZMM6 |
0x458347 VFMADD231PD %ZMM7,%ZMM7,%ZMM6 |
0x45834d VMINPD %ZMM4,%ZMM5,%ZMM7 |
0x458353 VBROADCASTSD 0xf0(%RSP),%ZMM8 |
0x45835b VADDPD %ZMM3,%ZMM8,%ZMM8 |
0x458361 VFMADD231PD %ZMM8,%ZMM8,%ZMM6 |
0x458367 VMINPD %ZMM7,%ZMM6,%ZMM8 |
0x45836d VSQRTPD %ZMM8,%ZMM8 |
0x458373 VCMPPD $0x1,%ZMM4,%ZMM5,%K6 |
0x45837a VCMPPD $0x1,%ZMM7,%ZMM6,%K7 |
0x458381 VMOVUPD %ZMM8,(%RCX,%RBX,8){%K1} |
0x458388 VPMOVM2Q %K0,%ZMM4 |
0x45838e VPSRLQ $0x3f,%ZMM4,%ZMM4 |
0x458395 VPBROADCASTQ 0x3d8c1(%RIP),%ZMM4{%K2} |
0x45839f VPBROADCASTQ 0x3d8bf(%RIP),%ZMM4{%K3} |
0x4583a9 VPBROADCASTQ 0x3d8bd(%RIP),%ZMM4{%K4} |
0x4583b3 VPBROADCASTQ 0x39943(%RIP),%ZMM4{%K5} |
0x4583bd VPBROADCASTQ 0x3d8b1(%RIP),%ZMM4{%K6} |
0x4583c7 VPBROADCASTQ 0x3d8af(%RIP),%ZMM4{%K7} |
0x4583d1 KMOVQ %K1,%K2 |
0x4583d6 VXORPD %XMM5,%XMM5,%XMM5 |
0x4583da VGATHERQPD 0x90(%RDI,%ZMM4,8),%ZMM5{%K2} |
0x4583e2 VADDPD %ZMM1,%ZMM5,%ZMM1 |
0x4583e8 VMULPD %ZMM0,%ZMM1,%ZMM1 |
0x4583ee VMOVUPD %ZMM1,(%R10,%RBX,8){%K1} |
0x4583f5 KMOVQ %K1,%K2 |
0x4583fa VXORPD %XMM1,%XMM1,%XMM1 |
0x4583fe VGATHERQPD 0xd0(%RDI,%ZMM4,8),%ZMM1{%K2} |
0x458406 VADDPD %ZMM2,%ZMM1,%ZMM1 |
0x45840c VMULPD %ZMM0,%ZMM1,%ZMM1 |
0x458412 VMOVUPD %ZMM1,(%R8,%RBX,8){%K1} |
0x458419 VXORPD %XMM1,%XMM1,%XMM1 |
0x45841d KMOVQ %K1,%K2 |
0x458422 VGATHERQPD 0x110(%RDI,%ZMM4,8),%ZMM1{%K2} |
0x45842a VADDPD %ZMM3,%ZMM1,%ZMM1 |
0x458430 VMULPD %ZMM0,%ZMM1,%ZMM0 |
0x458436 VMOVUPD %ZMM0,(%R11,%RBX,8){%K1} |
0x45843d LEA -0x20(%RBP),%RSP |
0x458441 POP %RBX |
0x458442 POP %R12 |
0x458444 POP %R14 |
0x458446 POP %R15 |
0x458448 POP %RBP |
0x458449 VZEROUPPER |
0x45844c RET |
0x45844d NOPL (%RAX) |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►51.38+ | qmcplusplus::DistanceTableAA<d[...] | DistanceTableAA.h:83 | exec |
○ | qmcplusplus::ParticleSet::make[...] | ParticleSet.cpp:290 | exec |
○ | main.extracted.104 | miniqmc.cpp:482 | exec |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_fork_call | libiomp5.so | |
○ | __kmpc_fork_call | libiomp5.so | |
○ | main | miniqmc.cpp:404 | exec |
○ | __libc_init_first | libc.so.6 | |
►22.24+ | qmcplusplus::DistanceTableAA<d[...] | DistanceTableAA.h:76 | exec |
○ | qmcplusplus::ParticleSet::setA[...] | ParticleSet.cpp:259 | exec |
○ | main.extracted.104 | stl_vector.h:1126 | exec |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_fork_call | libiomp5.so | |
○ | __kmpc_fork_call | libiomp5.so | |
○ | main | miniqmc.cpp:404 | exec |
○ | __libc_init_first | libc.so.6 | |
►13.66+ | qmcplusplus::DistanceTableAA<d[...] | DistanceTableAA.h:83 | exec |
○ | qmcplusplus::ParticleSet::make[...] | ParticleSet.cpp:290 | exec |
○ | main.extracted.104 | stl_vector.h:1126 | exec |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_fork_call | libiomp5.so | |
○ | __kmpc_fork_call | libiomp5.so | |
○ | main | miniqmc.cpp:404 | exec |
○ | __libc_init_first | libc.so.6 | |
►4.76+ | qmcplusplus::DistanceTableBA<d[...] | DistanceTableBA.h:119 | exec |
○ | qmcplusplus::ParticleSet::make[...] | ParticleSet.cpp:290 | exec |
○ | main.extracted.104 | miniqmc.cpp:482 | exec |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_fork_call | libiomp5.so | |
○ | __kmpc_fork_call | libiomp5.so | |
○ | main | miniqmc.cpp:404 | exec |
○ | __libc_init_first | libc.so.6 | |
►4.45+ | qmcplusplus::DistanceTableAA<d[...] | DistanceTableAA.h:69 | exec |
○ | qmcplusplus::ParticleSet::upda[...] | ParticleSet.cpp:250 | exec |
○ | main.extracted.107 | miniqmc.cpp:390 | exec |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_fork_call | libiomp5.so | |
○ | __kmpc_fork_call | libiomp5.so | |
○ | main | miniqmc.cpp:374 | exec |
○ | __libc_init_first | libc.so.6 | |
►1.88+ | qmcplusplus::DistanceTableBA<d[...] | DistanceTableBA.h:119 | exec |
○ | qmcplusplus::ParticleSet::make[...] | ParticleSet.cpp:290 | exec |
○ | main.extracted.104 | stl_vector.h:1126 | exec |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_fork_call | libiomp5.so | |
○ | __kmpc_fork_call | libiomp5.so | |
○ | main | miniqmc.cpp:404 | exec |
○ | __libc_init_first | libc.so.6 | |
►1.63+ | qmcplusplus::DistanceTableBA<d[...] | DistanceTableBA.h:113 | exec |
○ | qmcplusplus::ParticleSet::setA[...] | ParticleSet.cpp:259 | exec |
○ | main.extracted.104 | stl_vector.h:1126 | exec |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_fork_call | libiomp5.so | |
○ | __kmpc_fork_call | libiomp5.so | |
○ | main | miniqmc.cpp:404 | exec |
○ | __libc_init_first | libc.so.6 |
Path / |
Source file and lines | ParticleBConds.h:166-219 |
Module | exec |
nb instructions | 425 |
nb uops | 441 |
loop length | 2809 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 32 |
used ymm registers | 4 |
used zmm registers | 29 |
nb stack references | 66 |
ADD-SUB / MUL ratio | 1.59 |
micro-operation queue | 110.25 cycles |
front end | 110.25 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | |
---|---|---|---|---|---|---|---|---|
uops | 92.00 | 11.50 | 79.00 | 79.00 | 72.00 | 92.00 | 11.50 | 73.00 |
cycles | 92.00 | 37.50 | 79.00 | 79.00 | 72.00 | 92.00 | 11.50 | 73.00 |
Cycles executing div or sqrt instructions | 18.00-24.00 |
FE+BE cycles | 290.27 |
Stall cycles | 181.92 |
ROB full (events) | 1.00 |
RS full (events) | 23.99 |
LM full (events) | 3.01 |
SB full (events) | 174.90 |
Front-end | 110.25 |
Dispatch | 92.00 |
DIV/SQRT | 18.00-24.00 |
Overall L1 | 110.25 |
all | 39% |
load | 40% |
store | 50% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 100% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 27% |
all | 63% |
load | 47% |
store | 100% |
mul | 100% |
add-sub | 100% |
fma | 100% |
div/sqrt | 100% |
other | 28% |
all | 62% |
load | 47% |
store | 98% |
mul | 100% |
add-sub | 100% |
fma | 100% |
div/sqrt | 100% |
other | 28% |
all | 25% |
load | 27% |
store | 28% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 50% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 21% |
all | 46% |
load | 22% |
store | 51% |
mul | 100% |
add-sub | 100% |
fma | 100% |
div/sqrt | 100% |
other | 28% |
all | 45% |
load | 22% |
store | 50% |
mul | 100% |
add-sub | 98% |
fma | 100% |
div/sqrt | 100% |
other | 27% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSH %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
AND $-0x40,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SUB $0x800,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV 0x10(%RBP),%EAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
SUB %R9D,%EAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JLE 45843d | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV 0x18(%RBP),%EBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD (%RSI),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM0,0x40(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0x8(%RSI),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM0,0x50(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0x10(%RSI),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM0,0x60(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x8(%RDX),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x18(%RDX),%R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%R12,%RSI,8),%R15 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
SAL $0x4,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
ADD %R12,%RSI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV 0x8(%R8),%R11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x18(%R8),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%R10,%R11,8),%R8 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
SAL $0x4,%R11 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
ADD %R10,%R11 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVSD (%RDI),%XMM19 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x8(%RDI),%XMM20 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x10(%RDI),%XMM21 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x18(%RDI),%XMM22 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x20(%RDI),%XMM24 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x28(%RDI),%XMM25 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x30(%RDI),%XMM27 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x38(%RDI),%XMM9 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x40(%RDI),%XMM8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x48(%RDI),%XMM7 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x50(%RDI),%XMM28 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x58(%RDI),%XMM26 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x60(%RDI),%XMM6 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x68(%RDI),%XMM29 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x70(%RDI),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x78(%RDI),%XMM5 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x80(%RDI),%XMM4 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x88(%RDI),%XMM2 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x98(%RDI),%XMM14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0xd8(%RDI),%XMM17 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x118(%RDI),%XMM10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0xa0(%RDI),%XMM11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0xe0(%RDI),%XMM12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x120(%RDI),%XMM13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0xa8(%RDI),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM1,0x70(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0xe8(%RDI),%XMM15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x128(%RDI),%XMM16 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0xb0(%RDI),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM1,0x80(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0xf0(%RDI),%XMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM3,0xa0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %EAX,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVSD 0x130(%RDI),%XMM23 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0xb8(%RDI),%XMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM3,0x90(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0xf8(%RDI),%XMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM3,0xb0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0x138(%RDI),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM1,0xc0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0xc0(%RDI),%XMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM3,0xd0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0x100(%RDI),%XMM31 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x140(%RDI),%XMM30 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0xc8(%RDI),%XMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x108(%RDI),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM1,0xe0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0x148(%RDI),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD %XMM1,0xf0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VPBROADCASTD %EBX,%YMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VMOVDQU64 %YMM18,0x2e0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 4 | 1 |
AND $-0x8,%R14D | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVUPD %XMM23,0x2d0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPS %XMM26,0x2c0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPS %XMM0,0x2b0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPS %XMM28,0x2a0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %XMM2,0x290(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %XMM29,0x280(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %XMM4,0x270(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %XMM5,0x260(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPS %XMM6,0x250(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPS %XMM7,0x240(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPS %XMM8,0x230(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPS %XMM27,0x220(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
JE 457f51 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV %EAX,0x3c(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA -0x1(%R14),%EBX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
VBROADCASTSD 0x40(%RSP),%ZMM18 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMOVUPS %ZMM18,0x780(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD 0x50(%RSP),%ZMM18 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMOVUPS %ZMM18,0x740(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD 0x60(%RSP),%ZMM18 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMOVUPS %ZMM18,0x700(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %XMM19,0x100(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM19,%ZMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM18,0x6c0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %XMM20,0x110(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM20,%ZMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM18,0x680(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %XMM21,0x120(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM21,%ZMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM18,0x640(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %XMM22,0x130(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM22,%ZMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM18,0x600(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %XMM24,0x140(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM24,%ZMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM18,0x5c0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %XMM25,0x150(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM25,%ZMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM18,0x580(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM27,%ZMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPS %ZMM18,0x540(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %XMM9,0x160(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM9,%ZMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM9,0x500(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM8,%ZMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPS %ZMM8,0x4c0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM7,%ZMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPS %ZMM7,0x480(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVAPD %XMM3,%XMM27 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD %XMM28,%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPS %ZMM1,0x440(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM26,%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPS %ZMM1,0x400(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM6,%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPS %ZMM1,0x3c0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM29,%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM1,0x380(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM0,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPS %ZMM0,0x340(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM5,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM0,0x300(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM4,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM2,%ZMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %XMM14,0x170(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM14,%ZMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %XMM17,0x180(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM17,%ZMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %XMM10,0x190(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM10,%ZMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %XMM11,0x1a0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM11,%ZMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %XMM12,0x1b0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM12,%ZMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %XMM13,0x1c0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM13,%ZMM13 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD 0x70(%RSP),%XMM14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VBROADCASTSD %XMM14,%ZMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %XMM15,0x1d0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM15,%ZMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %XMM16,0x1e0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM16,%ZMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD 0x80(%RSP),%XMM17 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VBROADCASTSD %XMM17,%ZMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD 0xa0(%RSP),%XMM18 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VBROADCASTSD %XMM18,%ZMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD %XMM23,%ZMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD 0x90(%RSP),%XMM20 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VBROADCASTSD %XMM20,%ZMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD 0xb0(%RSP),%XMM21 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VBROADCASTSD %XMM21,%ZMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD 0xc0(%RSP),%XMM22 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VBROADCASTSD %XMM22,%ZMM22 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD 0xd0(%RSP),%XMM23 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VBROADCASTSD %XMM23,%ZMM23 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %XMM31,0x1f0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM31,%ZMM24 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %XMM30,0x200(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM30,%ZMM25 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %XMM3,0x210(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVAPD %XMM3,%XMM26 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD %XMM3,%ZMM26 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD 0xe0(%RSP),%XMM27 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VBROADCASTSD %XMM27,%ZMM27 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD 0xf0(%RSP),%XMM28 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VBROADCASTSD %XMM28,%ZMM28 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVDQU 0x2e0(%RSP),%YMM5 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV 0x3c(%RSP),%EAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
CMP %R14D,%EAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVUPD 0xe0(%RSP),%XMM8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x210(%RSP),%XMM9 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x200(%RSP),%XMM30 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x1f0(%RSP),%XMM31 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0xd0(%RSP),%XMM2 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0xc0(%RSP),%XMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0xb0(%RSP),%XMM4 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0xa0(%RSP),%XMM7 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x90(%RSP),%XMM6 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x80(%RSP),%XMM29 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x1e0(%RSP),%XMM16 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x1d0(%RSP),%XMM15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x70(%RSP),%XMM27 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x1c0(%RSP),%XMM13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x1b0(%RSP),%XMM12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x1a0(%RSP),%XMM11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x190(%RSP),%XMM10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x180(%RSP),%XMM17 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x170(%RSP),%XMM14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x160(%RSP),%XMM18 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x60(%RSP),%XMM28 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x50(%RSP),%XMM26 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x150(%RSP),%XMM25 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x140(%RSP),%XMM24 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x40(%RSP),%XMM23 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x130(%RSP),%XMM22 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x120(%RSP),%XMM21 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x110(%RSP),%XMM20 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x100(%RSP),%XMM19 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
JE 45843d | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
VPBROADCASTD %EAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
JMP 457fcb | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
VMOVAPD %XMM9,%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VPBROADCASTD %EAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
XOR %R14D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVUPD 0x60(%RSP),%XMM28 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x50(%RSP),%XMM26 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x40(%RSP),%XMM23 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVDQU 0x2e0(%RSP),%YMM5 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMOVUPD 0xe0(%RSP),%XMM8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVAPD %XMM3,%XMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVUPD 0xd0(%RSP),%XMM2 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0xc0(%RSP),%XMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0xb0(%RSP),%XMM4 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x90(%RSP),%XMM6 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0xa0(%RSP),%XMM7 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x70(%RSP),%XMM27 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x80(%RSP),%XMM29 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VPBROADCASTD %R14D,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VPOR 0x3de67(%RIP),%YMM1,%YMM1 | 1 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0.33 | 0 | 0 | 1 | 0.50 |
VPCMPLTUD %YMM0,%YMM1,%K1 | |||||||||||
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JE 45843d | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
ADD %R9D,%R14D | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VPBROADCASTD %R14D,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VPADDD 0x3de45(%RIP),%YMM0,%YMM0 | 1 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0.33 | 0 | 0 | 1 | 0.50 |
VPCMPGTD %YMM0,%YMM5,%K2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
MOVSXD %R14D,%RBX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VBROADCASTSD %XMM23,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD (%R12,%RBX,8),%ZMM1{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VSUBPD %ZMM0,%ZMM1,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM26,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVAPD %XMM2,%XMM23 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVUPD (%R15,%RBX,8),%ZMM2{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VSUBPD %ZMM0,%ZMM2,%ZMM2 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD (%RSI,%RBX,8),%ZMM0{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVAPD %XMM3,%XMM26 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD %XMM28,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VSUBPD %ZMM3,%ZMM0,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD 0x35fdd(%RIP),%ZMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VBROADCASTSD 0x35fcb(%RIP),%ZMM0{%K2} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMOVAPD %XMM4,%XMM28 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMULPD %ZMM0,%ZMM1,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMULPD %ZMM0,%ZMM2,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM19,%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMULPD %ZMM4,%ZMM1,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM20,%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VFMADD213PD %ZMM1,%ZMM5,%ZMM2 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVAPD %XMM6,%XMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMULPD %ZMM0,%ZMM3,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM21,%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VFMADD213PD %ZMM2,%ZMM6,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM22,%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMULPD %ZMM4,%ZMM2,%ZMM2 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM24,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VFMADD213PD %ZMM2,%ZMM5,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVAPD %XMM7,%XMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD %XMM25,%ZMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VFMADD213PD %ZMM3,%ZMM6,%ZMM7 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD 0x220(%RSP),%ZMM2 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMULPD %ZMM4,%ZMM2,%ZMM2 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM18,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VFMADD213PD %ZMM2,%ZMM5,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVAPD %XMM8,%XMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD 0x230(%RSP),%ZMM8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VFMADD213PD %ZMM3,%ZMM6,%ZMM8 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVAPD %XMM9,%XMM22 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VRNDSCALEPD $0x9,%ZMM1,%ZMM9 | 2 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 8 | 1 |
VBROADCASTSD 0x240(%RSP),%ZMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VFMSUB213PD %ZMM4,%ZMM9,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD 0x250(%RSP),%ZMM2 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VFMSUB213PD %ZMM5,%ZMM9,%ZMM2 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VRNDSCALEPD $0x9,%ZMM7,%ZMM4 | 2 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 8 | 1 |
VBROADCASTSD 0x260(%RSP),%ZMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VFMSUB213PD %ZMM6,%ZMM9,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD 0x2a0(%RSP),%ZMM5 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VFMADD231PD %ZMM5,%ZMM4,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD 0x280(%RSP),%ZMM5 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VFMADD231PD %ZMM5,%ZMM4,%ZMM2 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD 0x270(%RSP),%ZMM5 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VFMADD231PD %ZMM5,%ZMM4,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VRNDSCALEPD $0x9,%ZMM8,%ZMM4 | 2 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 8 | 1 |
VBROADCASTSD 0x2c0(%RSP),%ZMM5 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VFNMSUB231PD %ZMM5,%ZMM4,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD 0x2b0(%RSP),%ZMM5 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VFNMSUB231PD %ZMM5,%ZMM4,%ZMM2 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD 0x290(%RSP),%ZMM5 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VFNMSUB231PD %ZMM5,%ZMM4,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM14,%ZMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM1,%ZMM4,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM17,%ZMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM2,%ZMM5,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMULPD %ZMM4,%ZMM4,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %ZMM5,%ZMM5,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM10,%ZMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM3,%ZMM5,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %ZMM5,%ZMM5,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMULPD %ZMM1,%ZMM1,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %ZMM2,%ZMM2,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %ZMM3,%ZMM3,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VCMPPD $0x1,%ZMM5,%ZMM4,%K0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMINPD %ZMM5,%ZMM4,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM11,%ZMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM1,%ZMM5,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM12,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM2,%ZMM6,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMULPD %ZMM5,%ZMM5,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %ZMM6,%ZMM6,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM13,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM3,%ZMM6,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %ZMM6,%ZMM6,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VCMPPD $0x1,%ZMM4,%ZMM5,%K2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMINPD %ZMM4,%ZMM5,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM27,%ZMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM1,%ZMM5,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM15,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM2,%ZMM6,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMULPD %ZMM5,%ZMM5,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %ZMM6,%ZMM6,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM16,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM3,%ZMM6,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %ZMM6,%ZMM6,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VCMPPD $0x1,%ZMM4,%ZMM5,%K3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMINPD %ZMM4,%ZMM5,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM29,%ZMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM1,%ZMM5,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM20,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM2,%ZMM6,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMULPD %ZMM5,%ZMM5,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %ZMM6,%ZMM6,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD 0x2d0(%RSP),%ZMM6 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VADDPD %ZMM3,%ZMM6,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %ZMM6,%ZMM6,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VCMPPD $0x1,%ZMM4,%ZMM5,%K4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMINPD %ZMM4,%ZMM5,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM19,%ZMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM1,%ZMM5,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM28,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM2,%ZMM6,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMULPD %ZMM5,%ZMM5,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %ZMM6,%ZMM6,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM26,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM3,%ZMM6,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %ZMM6,%ZMM6,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VCMPPD $0x1,%ZMM4,%ZMM5,%K5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMINPD %ZMM4,%ZMM5,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM23,%ZMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM1,%ZMM5,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM31,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM2,%ZMM6,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMULPD %ZMM5,%ZMM5,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %ZMM6,%ZMM6,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM30,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM3,%ZMM6,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %ZMM6,%ZMM6,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM22,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM1,%ZMM6,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM21,%ZMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM2,%ZMM7,%ZMM7 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMULPD %ZMM6,%ZMM6,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %ZMM7,%ZMM7,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMINPD %ZMM4,%ZMM5,%ZMM7 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD 0xf0(%RSP),%ZMM8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VADDPD %ZMM3,%ZMM8,%ZMM8 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %ZMM8,%ZMM8,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMINPD %ZMM7,%ZMM6,%ZMM8 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VSQRTPD %ZMM8,%ZMM8 | 3 | 2 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 24-33 | 18-24 |
VCMPPD $0x1,%ZMM4,%ZMM5,%K6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VCMPPD $0x1,%ZMM7,%ZMM6,%K7 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM8,(%RCX,%RBX,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VPMOVM2Q %K0,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
VPSRLQ $0x3f,%ZMM4,%ZMM4 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTQ 0x3d8c1(%RIP),%ZMM4{%K2} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPBROADCASTQ 0x3d8bf(%RIP),%ZMM4{%K3} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPBROADCASTQ 0x3d8bd(%RIP),%ZMM4{%K4} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPBROADCASTQ 0x39943(%RIP),%ZMM4{%K5} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPBROADCASTQ 0x3d8b1(%RIP),%ZMM4{%K6} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPBROADCASTQ 0x3d8af(%RIP),%ZMM4{%K7} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VXORPD %XMM5,%XMM5,%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VGATHERQPD 0x90(%RDI,%ZMM4,8),%ZMM5{%K2} | 4 | 1 | 0 | 4 | 4 | 0 | 1 | 0 | 0 | 21 | 5 |
VADDPD %ZMM1,%ZMM5,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMULPD %ZMM0,%ZMM1,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD %ZMM1,(%R10,%RBX,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VGATHERQPD 0xd0(%RDI,%ZMM4,8),%ZMM1{%K2} | 4 | 1 | 0 | 4 | 4 | 0 | 1 | 0 | 0 | 21 | 5 |
VADDPD %ZMM2,%ZMM1,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMULPD %ZMM0,%ZMM1,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD %ZMM1,(%R8,%RBX,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VGATHERQPD 0x110(%RDI,%ZMM4,8),%ZMM1{%K2} | 4 | 1 | 0 | 4 | 4 | 0 | 1 | 0 | 0 | 21 | 5 |
VADDPD %ZMM3,%ZMM1,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMULPD %ZMM0,%ZMM1,%ZMM0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD %ZMM0,(%R11,%RBX,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA -0x20(%RBP),%RSP | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
POP %RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %RBP | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
VZEROUPPER | 4 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 | 0 | 1 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
Source file and lines | ParticleBConds.h:166-219 |
Module | exec |
nb instructions | 425 |
nb uops | 441 |
loop length | 2809 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 32 |
used ymm registers | 4 |
used zmm registers | 29 |
nb stack references | 66 |
ADD-SUB / MUL ratio | 1.59 |
micro-operation queue | 110.25 cycles |
front end | 110.25 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | |
---|---|---|---|---|---|---|---|---|
uops | 92.00 | 11.50 | 79.00 | 79.00 | 72.00 | 92.00 | 11.50 | 73.00 |
cycles | 92.00 | 37.50 | 79.00 | 79.00 | 72.00 | 92.00 | 11.50 | 73.00 |
Cycles executing div or sqrt instructions | 18.00-24.00 |
FE+BE cycles | 290.27 |
Stall cycles | 181.92 |
ROB full (events) | 1.00 |
RS full (events) | 23.99 |
LM full (events) | 3.01 |
SB full (events) | 174.90 |
Front-end | 110.25 |
Dispatch | 92.00 |
DIV/SQRT | 18.00-24.00 |
Overall L1 | 110.25 |
all | 39% |
load | 40% |
store | 50% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 100% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 27% |
all | 63% |
load | 47% |
store | 100% |
mul | 100% |
add-sub | 100% |
fma | 100% |
div/sqrt | 100% |
other | 28% |
all | 62% |
load | 47% |
store | 98% |
mul | 100% |
add-sub | 100% |
fma | 100% |
div/sqrt | 100% |
other | 28% |
all | 25% |
load | 27% |
store | 28% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 50% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 21% |
all | 46% |
load | 22% |
store | 51% |
mul | 100% |
add-sub | 100% |
fma | 100% |
div/sqrt | 100% |
other | 28% |
all | 45% |
load | 22% |
store | 50% |
mul | 100% |
add-sub | 98% |
fma | 100% |
div/sqrt | 100% |
other | 27% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSH %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
AND $-0x40,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SUB $0x800,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV 0x10(%RBP),%EAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
SUB %R9D,%EAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JLE 45843d | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV 0x18(%RBP),%EBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD (%RSI),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM0,0x40(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0x8(%RSI),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM0,0x50(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0x10(%RSI),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM0,0x60(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x8(%RDX),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x18(%RDX),%R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%R12,%RSI,8),%R15 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
SAL $0x4,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
ADD %R12,%RSI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV 0x8(%R8),%R11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x18(%R8),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%R10,%R11,8),%R8 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
SAL $0x4,%R11 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
ADD %R10,%R11 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVSD (%RDI),%XMM19 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x8(%RDI),%XMM20 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x10(%RDI),%XMM21 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x18(%RDI),%XMM22 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x20(%RDI),%XMM24 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x28(%RDI),%XMM25 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x30(%RDI),%XMM27 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x38(%RDI),%XMM9 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x40(%RDI),%XMM8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x48(%RDI),%XMM7 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x50(%RDI),%XMM28 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x58(%RDI),%XMM26 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x60(%RDI),%XMM6 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x68(%RDI),%XMM29 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x70(%RDI),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x78(%RDI),%XMM5 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x80(%RDI),%XMM4 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x88(%RDI),%XMM2 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x98(%RDI),%XMM14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0xd8(%RDI),%XMM17 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x118(%RDI),%XMM10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0xa0(%RDI),%XMM11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0xe0(%RDI),%XMM12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x120(%RDI),%XMM13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0xa8(%RDI),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM1,0x70(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0xe8(%RDI),%XMM15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x128(%RDI),%XMM16 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0xb0(%RDI),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM1,0x80(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0xf0(%RDI),%XMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM3,0xa0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %EAX,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVSD 0x130(%RDI),%XMM23 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0xb8(%RDI),%XMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM3,0x90(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0xf8(%RDI),%XMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM3,0xb0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0x138(%RDI),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM1,0xc0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0xc0(%RDI),%XMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM3,0xd0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0x100(%RDI),%XMM31 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x140(%RDI),%XMM30 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0xc8(%RDI),%XMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x108(%RDI),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM1,0xe0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0x148(%RDI),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD %XMM1,0xf0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VPBROADCASTD %EBX,%YMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VMOVDQU64 %YMM18,0x2e0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 4 | 1 |
AND $-0x8,%R14D | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVUPD %XMM23,0x2d0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPS %XMM26,0x2c0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPS %XMM0,0x2b0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPS %XMM28,0x2a0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %XMM2,0x290(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %XMM29,0x280(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %XMM4,0x270(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %XMM5,0x260(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPS %XMM6,0x250(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPS %XMM7,0x240(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPS %XMM8,0x230(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPS %XMM27,0x220(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
JE 457f51 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV %EAX,0x3c(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA -0x1(%R14),%EBX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
VBROADCASTSD 0x40(%RSP),%ZMM18 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMOVUPS %ZMM18,0x780(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD 0x50(%RSP),%ZMM18 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMOVUPS %ZMM18,0x740(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD 0x60(%RSP),%ZMM18 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMOVUPS %ZMM18,0x700(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %XMM19,0x100(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM19,%ZMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM18,0x6c0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %XMM20,0x110(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM20,%ZMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM18,0x680(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %XMM21,0x120(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM21,%ZMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM18,0x640(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %XMM22,0x130(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM22,%ZMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM18,0x600(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %XMM24,0x140(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM24,%ZMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM18,0x5c0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %XMM25,0x150(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM25,%ZMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM18,0x580(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM27,%ZMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPS %ZMM18,0x540(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %XMM9,0x160(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM9,%ZMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM9,0x500(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM8,%ZMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPS %ZMM8,0x4c0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM7,%ZMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPS %ZMM7,0x480(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVAPD %XMM3,%XMM27 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD %XMM28,%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPS %ZMM1,0x440(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM26,%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPS %ZMM1,0x400(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM6,%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPS %ZMM1,0x3c0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM29,%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM1,0x380(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM0,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPS %ZMM0,0x340(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM5,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM0,0x300(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM4,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM2,%ZMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %XMM14,0x170(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM14,%ZMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %XMM17,0x180(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM17,%ZMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %XMM10,0x190(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM10,%ZMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %XMM11,0x1a0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM11,%ZMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %XMM12,0x1b0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM12,%ZMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %XMM13,0x1c0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM13,%ZMM13 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD 0x70(%RSP),%XMM14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VBROADCASTSD %XMM14,%ZMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %XMM15,0x1d0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM15,%ZMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %XMM16,0x1e0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM16,%ZMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD 0x80(%RSP),%XMM17 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VBROADCASTSD %XMM17,%ZMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD 0xa0(%RSP),%XMM18 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VBROADCASTSD %XMM18,%ZMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD %XMM23,%ZMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD 0x90(%RSP),%XMM20 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VBROADCASTSD %XMM20,%ZMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD 0xb0(%RSP),%XMM21 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VBROADCASTSD %XMM21,%ZMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD 0xc0(%RSP),%XMM22 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VBROADCASTSD %XMM22,%ZMM22 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD 0xd0(%RSP),%XMM23 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VBROADCASTSD %XMM23,%ZMM23 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %XMM31,0x1f0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM31,%ZMM24 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %XMM30,0x200(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM30,%ZMM25 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %XMM3,0x210(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVAPD %XMM3,%XMM26 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD %XMM3,%ZMM26 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD 0xe0(%RSP),%XMM27 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VBROADCASTSD %XMM27,%ZMM27 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD 0xf0(%RSP),%XMM28 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VBROADCASTSD %XMM28,%ZMM28 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVDQU 0x2e0(%RSP),%YMM5 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV 0x3c(%RSP),%EAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
CMP %R14D,%EAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVUPD 0xe0(%RSP),%XMM8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x210(%RSP),%XMM9 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x200(%RSP),%XMM30 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x1f0(%RSP),%XMM31 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0xd0(%RSP),%XMM2 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0xc0(%RSP),%XMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0xb0(%RSP),%XMM4 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0xa0(%RSP),%XMM7 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x90(%RSP),%XMM6 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x80(%RSP),%XMM29 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x1e0(%RSP),%XMM16 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x1d0(%RSP),%XMM15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x70(%RSP),%XMM27 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x1c0(%RSP),%XMM13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x1b0(%RSP),%XMM12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x1a0(%RSP),%XMM11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x190(%RSP),%XMM10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x180(%RSP),%XMM17 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x170(%RSP),%XMM14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x160(%RSP),%XMM18 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x60(%RSP),%XMM28 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x50(%RSP),%XMM26 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x150(%RSP),%XMM25 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x140(%RSP),%XMM24 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x40(%RSP),%XMM23 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x130(%RSP),%XMM22 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x120(%RSP),%XMM21 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x110(%RSP),%XMM20 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x100(%RSP),%XMM19 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
JE 45843d | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
VPBROADCASTD %EAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
JMP 457fcb | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
VMOVAPD %XMM9,%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VPBROADCASTD %EAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
XOR %R14D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVUPD 0x60(%RSP),%XMM28 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x50(%RSP),%XMM26 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x40(%RSP),%XMM23 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVDQU 0x2e0(%RSP),%YMM5 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMOVUPD 0xe0(%RSP),%XMM8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVAPD %XMM3,%XMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVUPD 0xd0(%RSP),%XMM2 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0xc0(%RSP),%XMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0xb0(%RSP),%XMM4 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x90(%RSP),%XMM6 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0xa0(%RSP),%XMM7 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x70(%RSP),%XMM27 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x80(%RSP),%XMM29 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VPBROADCASTD %R14D,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VPOR 0x3de67(%RIP),%YMM1,%YMM1 | 1 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0.33 | 0 | 0 | 1 | 0.50 |
VPCMPLTUD %YMM0,%YMM1,%K1 | |||||||||||
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JE 45843d | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
ADD %R9D,%R14D | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VPBROADCASTD %R14D,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VPADDD 0x3de45(%RIP),%YMM0,%YMM0 | 1 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0.33 | 0 | 0 | 1 | 0.50 |
VPCMPGTD %YMM0,%YMM5,%K2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
MOVSXD %R14D,%RBX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VBROADCASTSD %XMM23,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD (%R12,%RBX,8),%ZMM1{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VSUBPD %ZMM0,%ZMM1,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM26,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVAPD %XMM2,%XMM23 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVUPD (%R15,%RBX,8),%ZMM2{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VSUBPD %ZMM0,%ZMM2,%ZMM2 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD (%RSI,%RBX,8),%ZMM0{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVAPD %XMM3,%XMM26 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD %XMM28,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VSUBPD %ZMM3,%ZMM0,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD 0x35fdd(%RIP),%ZMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VBROADCASTSD 0x35fcb(%RIP),%ZMM0{%K2} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMOVAPD %XMM4,%XMM28 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMULPD %ZMM0,%ZMM1,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMULPD %ZMM0,%ZMM2,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM19,%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMULPD %ZMM4,%ZMM1,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM20,%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VFMADD213PD %ZMM1,%ZMM5,%ZMM2 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVAPD %XMM6,%XMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMULPD %ZMM0,%ZMM3,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM21,%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VFMADD213PD %ZMM2,%ZMM6,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM22,%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMULPD %ZMM4,%ZMM2,%ZMM2 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM24,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VFMADD213PD %ZMM2,%ZMM5,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVAPD %XMM7,%XMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD %XMM25,%ZMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VFMADD213PD %ZMM3,%ZMM6,%ZMM7 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD 0x220(%RSP),%ZMM2 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMULPD %ZMM4,%ZMM2,%ZMM2 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM18,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VFMADD213PD %ZMM2,%ZMM5,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVAPD %XMM8,%XMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD 0x230(%RSP),%ZMM8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VFMADD213PD %ZMM3,%ZMM6,%ZMM8 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVAPD %XMM9,%XMM22 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VRNDSCALEPD $0x9,%ZMM1,%ZMM9 | 2 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 8 | 1 |
VBROADCASTSD 0x240(%RSP),%ZMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VFMSUB213PD %ZMM4,%ZMM9,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD 0x250(%RSP),%ZMM2 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VFMSUB213PD %ZMM5,%ZMM9,%ZMM2 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VRNDSCALEPD $0x9,%ZMM7,%ZMM4 | 2 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 8 | 1 |
VBROADCASTSD 0x260(%RSP),%ZMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VFMSUB213PD %ZMM6,%ZMM9,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD 0x2a0(%RSP),%ZMM5 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VFMADD231PD %ZMM5,%ZMM4,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD 0x280(%RSP),%ZMM5 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VFMADD231PD %ZMM5,%ZMM4,%ZMM2 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD 0x270(%RSP),%ZMM5 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VFMADD231PD %ZMM5,%ZMM4,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VRNDSCALEPD $0x9,%ZMM8,%ZMM4 | 2 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 8 | 1 |
VBROADCASTSD 0x2c0(%RSP),%ZMM5 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VFNMSUB231PD %ZMM5,%ZMM4,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD 0x2b0(%RSP),%ZMM5 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VFNMSUB231PD %ZMM5,%ZMM4,%ZMM2 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD 0x290(%RSP),%ZMM5 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VFNMSUB231PD %ZMM5,%ZMM4,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM14,%ZMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM1,%ZMM4,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM17,%ZMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM2,%ZMM5,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMULPD %ZMM4,%ZMM4,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %ZMM5,%ZMM5,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM10,%ZMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM3,%ZMM5,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %ZMM5,%ZMM5,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMULPD %ZMM1,%ZMM1,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %ZMM2,%ZMM2,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %ZMM3,%ZMM3,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VCMPPD $0x1,%ZMM5,%ZMM4,%K0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMINPD %ZMM5,%ZMM4,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM11,%ZMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM1,%ZMM5,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM12,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM2,%ZMM6,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMULPD %ZMM5,%ZMM5,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %ZMM6,%ZMM6,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM13,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM3,%ZMM6,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %ZMM6,%ZMM6,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VCMPPD $0x1,%ZMM4,%ZMM5,%K2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMINPD %ZMM4,%ZMM5,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM27,%ZMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM1,%ZMM5,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM15,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM2,%ZMM6,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMULPD %ZMM5,%ZMM5,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %ZMM6,%ZMM6,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM16,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM3,%ZMM6,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %ZMM6,%ZMM6,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VCMPPD $0x1,%ZMM4,%ZMM5,%K3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMINPD %ZMM4,%ZMM5,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM29,%ZMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM1,%ZMM5,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM20,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM2,%ZMM6,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMULPD %ZMM5,%ZMM5,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %ZMM6,%ZMM6,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD 0x2d0(%RSP),%ZMM6 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VADDPD %ZMM3,%ZMM6,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %ZMM6,%ZMM6,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VCMPPD $0x1,%ZMM4,%ZMM5,%K4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMINPD %ZMM4,%ZMM5,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM19,%ZMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM1,%ZMM5,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM28,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM2,%ZMM6,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMULPD %ZMM5,%ZMM5,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %ZMM6,%ZMM6,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM26,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM3,%ZMM6,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %ZMM6,%ZMM6,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VCMPPD $0x1,%ZMM4,%ZMM5,%K5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMINPD %ZMM4,%ZMM5,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM23,%ZMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM1,%ZMM5,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM31,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM2,%ZMM6,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMULPD %ZMM5,%ZMM5,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %ZMM6,%ZMM6,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM30,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM3,%ZMM6,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %ZMM6,%ZMM6,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM22,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM1,%ZMM6,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD %XMM21,%ZMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VADDPD %ZMM2,%ZMM7,%ZMM7 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMULPD %ZMM6,%ZMM6,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %ZMM7,%ZMM7,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMINPD %ZMM4,%ZMM5,%ZMM7 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD 0xf0(%RSP),%ZMM8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VADDPD %ZMM3,%ZMM8,%ZMM8 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %ZMM8,%ZMM8,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMINPD %ZMM7,%ZMM6,%ZMM8 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VSQRTPD %ZMM8,%ZMM8 | 3 | 2 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 24-33 | 18-24 |
VCMPPD $0x1,%ZMM4,%ZMM5,%K6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VCMPPD $0x1,%ZMM7,%ZMM6,%K7 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM8,(%RCX,%RBX,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VPMOVM2Q %K0,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
VPSRLQ $0x3f,%ZMM4,%ZMM4 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTQ 0x3d8c1(%RIP),%ZMM4{%K2} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPBROADCASTQ 0x3d8bf(%RIP),%ZMM4{%K3} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPBROADCASTQ 0x3d8bd(%RIP),%ZMM4{%K4} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPBROADCASTQ 0x39943(%RIP),%ZMM4{%K5} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPBROADCASTQ 0x3d8b1(%RIP),%ZMM4{%K6} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPBROADCASTQ 0x3d8af(%RIP),%ZMM4{%K7} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VXORPD %XMM5,%XMM5,%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VGATHERQPD 0x90(%RDI,%ZMM4,8),%ZMM5{%K2} | 4 | 1 | 0 | 4 | 4 | 0 | 1 | 0 | 0 | 21 | 5 |
VADDPD %ZMM1,%ZMM5,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMULPD %ZMM0,%ZMM1,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD %ZMM1,(%R10,%RBX,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VGATHERQPD 0xd0(%RDI,%ZMM4,8),%ZMM1{%K2} | 4 | 1 | 0 | 4 | 4 | 0 | 1 | 0 | 0 | 21 | 5 |
VADDPD %ZMM2,%ZMM1,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMULPD %ZMM0,%ZMM1,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD %ZMM1,(%R8,%RBX,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VGATHERQPD 0x110(%RDI,%ZMM4,8),%ZMM1{%K2} | 4 | 1 | 0 | 4 | 4 | 0 | 1 | 0 | 0 | 21 | 5 |
VADDPD %ZMM3,%ZMM1,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMULPD %ZMM0,%ZMM1,%ZMM0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD %ZMM0,(%R11,%RBX,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA -0x20(%RBP),%RSP | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
POP %RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %RBP | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
VZEROUPPER | 4 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 | 0 | 1 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼void qmcplusplus::DTD_BConds | 13.35 | 7.98 |
○Loop 971 - ParticleBConds.h:185-217 - exec | 13.24 | 7.91 |