Function: void qmcplusplus::DTD_BConds<double, 3u, 39>::computeDistances<qmcplusplus::TinyVector<dou ... | Module: exec | Source: ParticleBConds.h:166-219 [...] | Coverage: 23.44% |
---|
Function: void qmcplusplus::DTD_BConds<double, 3u, 39>::computeDistances<qmcplusplus::TinyVector<dou ... | Module: exec | Source: ParticleBConds.h:166-219 [...] | Coverage: 23.44% |
---|
/home/kcamus/qaas_runs/169-390-4082/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/TinyVector.h: 177 - 177 |
-------------------------------------------------------------------------------- |
177: inline const Type_t& operator[](unsigned int i) const { return X[i]; } |
/home/kcamus/qaas_runs/169-390-4082/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/VectorSoAContainer.h: 241 - 243 |
-------------------------------------------------------------------------------- |
241: T* restrict data(size_t i) { return myData + i * nGhosts; } |
242: ///return the const pointer of the i-th components |
243: const T* restrict data(size_t i) const { return myData + i * nGhosts; } |
/home/kcamus/qaas_runs/169-390-4082/intel/miniqmc/build/miniqmc/src/Particle/Lattice/ParticleBConds.h: 166 - 219 |
-------------------------------------------------------------------------------- |
166: { |
167: const T x0 = pos[0]; |
168: const T y0 = pos[1]; |
169: const T z0 = pos[2]; |
[...] |
185: #pragma omp simd aligned(temp_r, px, py, pz, dx, dy, dz: QMC_SIMD_ALIGNMENT) |
186: for (int iat = first; iat < last; ++iat) |
187: { |
188: const T flip = iat < flip_ind ? one : minusone; |
189: const T displ_0 = (px[iat] - x0) * flip; |
190: const T displ_1 = (py[iat] - y0) * flip; |
191: const T displ_2 = (pz[iat] - z0) * flip; |
192: |
193: const T ar_0 = -std::floor(displ_0 * g00 + displ_1 * g10 + displ_2 * g20); |
194: const T ar_1 = -std::floor(displ_0 * g01 + displ_1 * g11 + displ_2 * g21); |
195: const T ar_2 = -std::floor(displ_0 * g02 + displ_1 * g12 + displ_2 * g22); |
196: |
197: const T delx = displ_0 + ar_0 * r00 + ar_1 * r10 + ar_2 * r20; |
198: const T dely = displ_1 + ar_0 * r01 + ar_1 * r11 + ar_2 * r21; |
199: const T delz = displ_2 + ar_0 * r02 + ar_1 * r12 + ar_2 * r22; |
200: |
201: T rmin = delx * delx + dely * dely + delz * delz; |
202: int ic = 0; |
203: #pragma unroll(7) |
204: for (int c = 1; c < 8; ++c) |
205: { |
206: const T x = delx + cellx[c]; |
207: const T y = dely + celly[c]; |
208: const T z = delz + cellz[c]; |
209: const T r2 = x * x + y * y + z * z; |
210: ic = (r2 < rmin) ? c : ic; |
211: rmin = (r2 < rmin) ? r2 : rmin; |
212: } |
213: |
214: temp_r[iat] = std::sqrt(rmin); |
215: dx[iat] = flip * (delx + cellx[ic]); |
216: dy[iat] = flip * (dely + celly[ic]); |
217: dz[iat] = flip * (delz + cellz[ic]); |
218: } |
219: } |
0x45e060 PUSH %RBP |
0x45e061 MOV %RSP,%RBP |
0x45e064 PUSH %R15 |
0x45e066 PUSH %R14 |
0x45e068 PUSH %R13 |
0x45e06a PUSH %R12 |
0x45e06c PUSH %RBX |
0x45e06d AND $-0x20,%RSP |
0x45e071 SUB $0x4a0,%RSP |
0x45e078 MOV 0x10(%RBP),%R15D |
0x45e07c SUB %R9D,%R15D |
0x45e07f JLE 45edd3 |
0x45e085 VMOVSD (%RSI),%XMM10 |
0x45e089 VMOVSD 0x8(%RSI),%XMM9 |
0x45e08e VMOVSD 0x10(%RSI),%XMM8 |
0x45e093 MOV 0x18(%RBP),%EAX |
0x45e096 MOV 0x8(%RDX),%RSI |
0x45e09a MOV 0x18(%RDX),%R13 |
0x45e09e LEA (,%RSI,8),%R12 |
0x45e0a6 ADD %R13,%R12 |
0x45e0a9 SAL $0x4,%RSI |
0x45e0ad ADD %R13,%RSI |
0x45e0b0 MOV 0x8(%R8),%R11 |
0x45e0b4 MOV 0x18(%R8),%R10 |
0x45e0b8 LEA (%R10,%R11,8),%R8 |
0x45e0bc SAL $0x4,%R11 |
0x45e0c0 VMOVSD (%RDI),%XMM4 |
0x45e0c4 VMOVSD 0x8(%RDI),%XMM5 |
0x45e0c9 VMOVSD 0x10(%RDI),%XMM2 |
0x45e0ce VMOVSD 0x18(%RDI),%XMM1 |
0x45e0d3 VMOVSD 0x20(%RDI),%XMM3 |
0x45e0d8 VMOVSD 0x28(%RDI),%XMM7 |
0x45e0dd VMOVSD 0x30(%RDI),%XMM6 |
0x45e0e2 VMOVSD 0x38(%RDI),%XMM22 |
0x45e0e9 VMOVSD 0x40(%RDI),%XMM30 |
0x45e0f0 VMOVSD 0x48(%RDI),%XMM25 |
0x45e0f7 VMOVSD 0x50(%RDI),%XMM24 |
0x45e0fe VMOVSD 0x58(%RDI),%XMM23 |
0x45e105 VMOVSD 0x60(%RDI),%XMM11 |
0x45e10a VMOVSD 0x68(%RDI),%XMM21 |
0x45e111 VMOVSD 0x70(%RDI),%XMM28 |
0x45e118 VMOVSD 0x78(%RDI),%XMM27 |
0x45e11f VMOVSD 0x80(%RDI),%XMM26 |
0x45e126 VMOVSD 0x88(%RDI),%XMM19 |
0x45e12d VMOVSD 0x98(%RDI),%XMM18 |
0x45e134 VMOVSD 0xd8(%RDI),%XMM20 |
0x45e13b VMOVSD 0x118(%RDI),%XMM17 |
0x45e142 VMOVSD 0xa0(%RDI),%XMM16 |
0x45e149 VMOVSD 0xe0(%RDI),%XMM15 |
0x45e151 VMOVSD 0x120(%RDI),%XMM14 |
0x45e159 VMOVSD 0xa8(%RDI),%XMM0 |
0x45e161 VMOVUPS %XMM0,0x120(%RSP) |
0x45e16a VMOVSD 0xe8(%RDI),%XMM0 |
0x45e172 VMOVUPS %XMM0,(%RSP) |
0x45e177 VMOVSD 0x128(%RDI),%XMM0 |
0x45e17f VMOVUPS %XMM0,0x20(%RSP) |
0x45e185 VMOVSD 0xb0(%RDI),%XMM0 |
0x45e18d VMOVUPS %XMM0,0x40(%RSP) |
0x45e193 VMOVSD 0xf0(%RDI),%XMM0 |
0x45e19b VMOVUPS %XMM0,0x60(%RSP) |
0x45e1a1 VMOVSD 0x130(%RDI),%XMM0 |
0x45e1a9 VMOVUPS %XMM0,0x80(%RSP) |
0x45e1b2 VMOVSD 0xb8(%RDI),%XMM13 |
0x45e1ba VMOVSD 0xf8(%RDI),%XMM0 |
0x45e1c2 VMOVUPS %XMM0,0xa0(%RSP) |
0x45e1cb VMOVSD 0x138(%RDI),%XMM0 |
0x45e1d3 VMOVUPS %XMM0,0xc0(%RSP) |
0x45e1dc VMOVSD 0xc0(%RDI),%XMM0 |
0x45e1e4 VMOVUPS %XMM0,0xe0(%RSP) |
0x45e1ed VMOVSD 0x100(%RDI),%XMM12 |
0x45e1f5 VMOVSD 0x140(%RDI),%XMM0 |
0x45e1fd VMOVUPS %XMM0,0x100(%RSP) |
0x45e206 VMOVSD 0xc8(%RDI),%XMM29 |
0x45e20d ADD %R10,%R11 |
0x45e210 MOV %R15D,%R14D |
0x45e213 VMOVSD 0x108(%RDI),%XMM0 |
0x45e21b VMOVUPS %XMM0,0x140(%RSP) |
0x45e224 VMOVSD 0x148(%RDI),%XMM31 |
0x45e22b AND $-0x4,%R14D |
0x45e22f JE 45e8dd |
0x45e235 LEA -0x1(%R14),%EBX |
0x45e239 VBROADCASTSD %XMM10,%YMM10 |
0x45e23e VMOVUPD %YMM10,0x300(%RSP) |
0x45e247 VBROADCASTSD %XMM9,%YMM9 |
0x45e24c VMOVUPD %YMM9,0x340(%RSP) |
0x45e255 VBROADCASTSD %XMM8,%YMM8 |
0x45e25a VMOVUPD %YMM8,0x360(%RSP) |
0x45e263 VBROADCASTSD %XMM4,%YMM4 |
0x45e268 VMOVUPD %YMM4,0x320(%RSP) |
0x45e271 VBROADCASTSD %XMM5,%YMM4 |
0x45e276 VMOVUPD %YMM4,0x380(%RSP) |
0x45e27f VBROADCASTSD %XMM2,%YMM2 |
0x45e284 VMOVUPS %YMM2,0x1a0(%RSP) |
0x45e28d VBROADCASTSD %XMM1,%YMM1 |
0x45e292 VMOVUPD %YMM1,0x2c0(%RSP) |
0x45e29b VBROADCASTSD %XMM3,%YMM1 |
0x45e2a0 VMOVUPD %YMM1,0x2e0(%RSP) |
0x45e2a9 VBROADCASTSD %XMM7,%YMM1 |
0x45e2ae VMOVUPS %YMM1,0x1c0(%RSP) |
0x45e2b7 VBROADCASTSD %XMM6,%YMM1 |
0x45e2bc VMOVUPS %YMM1,0x1e0(%RSP) |
0x45e2c5 VBROADCASTSD %XMM22,%YMM0 |
0x45e2cb VMOVUPD %YMM0,0x200(%RSP) |
0x45e2d4 VBROADCASTSD %XMM30,%YMM0 |
0x45e2da VMOVUPD %YMM0,0x3c0(%RSP) |
0x45e2e3 VBROADCASTSD %XMM25,%YMM2 |
0x45e2e9 VBROADCASTSD %XMM24,%YMM0 |
0x45e2ef VMOVUPS %YMM0,0x180(%RSP) |
0x45e2f8 VBROADCASTSD %XMM23,%YMM7 |
0x45e2fe VBROADCASTSD %XMM11,%YMM1 |
0x45e303 VBROADCASTSD %XMM21,%YMM0 |
0x45e309 VMOVUPD %YMM0,0x160(%RSP) |
0x45e312 VBROADCASTSD %XMM28,%YMM24 |
0x45e318 VBROADCASTSD %XMM27,%YMM0 |
0x45e31e VBROADCASTSD %XMM26,%YMM3 |
0x45e324 VMOVUPD %YMM3,0x3a0(%RSP) |
0x45e32d VBROADCASTSD %XMM19,%YMM3 |
0x45e333 VMOVUPD %YMM3,0x3e0(%RSP) |
0x45e33c VBROADCASTSD %XMM18,%YMM3 |
0x45e342 VMOVUPD %YMM3,0x420(%RSP) |
0x45e34b VBROADCASTSD %XMM20,%YMM3 |
0x45e351 VMOVUPD %YMM3,0x400(%RSP) |
0x45e35a VBROADCASTSD %XMM17,%YMM3 |
0x45e360 VMOVUPD %YMM3,0x460(%RSP) |
0x45e369 VBROADCASTSD %XMM16,%YMM5 |
0x45e36f VBROADCASTSD %XMM15,%YMM6 |
0x45e374 VBROADCASTSD %XMM14,%YMM3 |
0x45e379 VMOVUPD %YMM3,0x440(%RSP) |
0x45e382 VBROADCASTSD 0x120(%RSP),%YMM3 |
0x45e38c VMOVUPS %YMM3,0x120(%RSP) |
0x45e395 VBROADCASTSD (%RSP),%YMM23 |
0x45e39c VBROADCASTSD 0x20(%RSP),%YMM19 |
0x45e3a4 VBROADCASTSD 0x40(%RSP),%YMM17 |
0x45e3ac VBROADCASTSD 0x60(%RSP),%YMM18 |
0x45e3b4 VBROADCASTSD 0x80(%RSP),%YMM16 |
0x45e3bc VBROADCASTSD %XMM13,%YMM13 |
0x45e3c1 VBROADCASTSD 0xa0(%RSP),%YMM15 |
0x45e3cb VBROADCASTSD 0xc0(%RSP),%YMM30 |
0x45e3d3 VBROADCASTSD 0xe0(%RSP),%YMM11 |
0x45e3dd VBROADCASTSD %XMM12,%YMM12 |
0x45e3e2 VBROADCASTSD 0x100(%RSP),%YMM10 |
0x45e3ec VBROADCASTSD %XMM29,%YMM8 |
0x45e3f2 VBROADCASTSD 0x140(%RSP),%YMM9 |
0x45e3fc VBROADCASTSD %XMM31,%YMM31 |
0x45e402 XOR %EDX,%EDX |
0x45e404 VPBROADCASTD %EAX,%XMM21 |
0x45e40a VPBROADCASTQ %RDI,%YMM3 |
0x45e410 VMOVDQU %YMM3,0x140(%RSP) |
0x45e419 NOPL (%RAX) |
(1167) 0x45e420 LEA (%R9,%RDX,1),%EAX |
(1167) 0x45e424 VPBROADCASTD %EAX,%XMM3 |
(1167) 0x45e42a VPADDD 0x3df4e(%RIP),%XMM3,%XMM3 |
(1167) 0x45e432 CLTQ |
(1167) 0x45e434 VPCMPGTD %XMM3,%XMM21,%K1 |
(1167) 0x45e43a VMOVUPD (%R13,%RAX,8),%YMM3 |
(1167) 0x45e441 VSUBPD 0x300(%RSP),%YMM3,%YMM3 |
(1167) 0x45e44a VMOVUPD (%R12,%RAX,8),%YMM4 |
(1167) 0x45e450 VBROADCASTSD 0x37bd7(%RIP),%YMM14 |
(1167) 0x45e459 VBROADCASTSD 0x37bc5(%RIP),%YMM20 |
(1167) 0x45e463 VBLENDMPD %YMM20,%YMM14,%YMM25{%K1} |
(1167) 0x45e469 VMULPD %YMM25,%YMM3,%YMM28 |
(1167) 0x45e46f VSUBPD 0x340(%RSP),%YMM4,%YMM3 |
(1167) 0x45e478 VMOVUPD (%RSI,%RAX,8),%YMM4 |
(1167) 0x45e47d VSUBPD 0x360(%RSP),%YMM4,%YMM4 |
(1167) 0x45e486 VMULPD %YMM25,%YMM3,%YMM26 |
(1167) 0x45e48c VMULPD %YMM25,%YMM4,%YMM3 |
(1167) 0x45e492 VMULPD 0x320(%RSP),%YMM28,%YMM4 |
(1167) 0x45e49a VFMADD231PD 0x380(%RSP),%YMM26,%YMM4 |
(1167) 0x45e4a2 VFMADD231PD 0x1a0(%RSP),%YMM3,%YMM4 |
(1167) 0x45e4ac VRNDSCALEPD $0x9,%YMM4,%YMM27 |
(1167) 0x45e4b3 VMULPD 0x2c0(%RSP),%YMM28,%YMM4 |
(1167) 0x45e4bb VFMADD231PD 0x2e0(%RSP),%YMM26,%YMM4 |
(1167) 0x45e4c3 VFMADD231PD 0x1c0(%RSP),%YMM3,%YMM4 |
(1167) 0x45e4cd VROUNDPD $0x9,%YMM4,%YMM4 |
(1167) 0x45e4d3 VMULPD 0x1e0(%RSP),%YMM28,%YMM29 |
(1167) 0x45e4db VFMADD231PD 0x200(%RSP),%YMM26,%YMM29 |
(1167) 0x45e4e3 VFMADD231PD 0x3c0(%RSP),%YMM3,%YMM29 |
(1167) 0x45e4eb VRNDSCALEPD $0x9,%YMM29,%YMM29 |
(1167) 0x45e4f2 VFMSUB231PD %YMM2,%YMM27,%YMM28 |
(1167) 0x45e4f8 VFMADD231PD 0x180(%RSP),%YMM4,%YMM28 |
(1167) 0x45e500 VFNMSUB231PD %YMM29,%YMM7,%YMM28 |
(1167) 0x45e506 VFMSUB231PD %YMM1,%YMM27,%YMM26 |
(1167) 0x45e50c VFMADD231PD 0x160(%RSP),%YMM4,%YMM26 |
(1167) 0x45e514 VFMSUB213PD %YMM3,%YMM0,%YMM27 |
(1167) 0x45e51a VFNMSUB231PD %YMM24,%YMM29,%YMM26 |
(1167) 0x45e520 VFMADD231PD 0x3a0(%RSP),%YMM4,%YMM27 |
(1167) 0x45e528 VFNMSUB231PD 0x3e0(%RSP),%YMM29,%YMM27 |
(1167) 0x45e530 VMULPD %YMM28,%YMM28,%YMM3 |
(1167) 0x45e536 VFMADD231PD %YMM26,%YMM26,%YMM3 |
(1167) 0x45e53c VADDPD 0x420(%RSP),%YMM28,%YMM4 |
(1167) 0x45e544 VFMADD231PD %YMM27,%YMM27,%YMM3 |
(1167) 0x45e54a VADDPD 0x400(%RSP),%YMM26,%YMM29 |
(1167) 0x45e552 VMOVAPD %YMM7,%YMM20 |
(1167) 0x45e558 VMOVAPD %YMM31,%YMM7 |
(1167) 0x45e55e VADDPD 0x460(%RSP),%YMM27,%YMM31 |
(1167) 0x45e566 VMULPD %YMM4,%YMM4,%YMM4 |
(1167) 0x45e56a VFMADD231PD %YMM29,%YMM29,%YMM4 |
(1167) 0x45e570 VADDPD %YMM28,%YMM5,%YMM29 |
(1167) 0x45e576 VFMADD231PD %YMM31,%YMM31,%YMM4 |
(1167) 0x45e57c VADDPD %YMM26,%YMM6,%YMM31 |
(1167) 0x45e582 VMOVAPD %YMM2,%YMM14 |
(1167) 0x45e586 VMOVAPD %YMM1,%YMM2 |
(1167) 0x45e58a VMOVAPD %YMM0,%YMM1 |
(1167) 0x45e58e VMOVAPD %YMM5,%YMM0 |
(1167) 0x45e592 VADDPD 0x440(%RSP),%YMM27,%YMM5 |
(1167) 0x45e59a VMULPD %YMM29,%YMM29,%YMM29 |
(1167) 0x45e5a0 VFMADD231PD %YMM31,%YMM31,%YMM29 |
(1167) 0x45e5a6 VFMADD231PD %YMM5,%YMM5,%YMM29 |
(1167) 0x45e5ac VMINPD %YMM3,%YMM4,%YMM5 |
(1167) 0x45e5b0 VCMPPD $0x1,%YMM5,%YMM29,%K1 |
(1167) 0x45e5b7 VMINPD %YMM5,%YMM29,%YMM5 |
(1167) 0x45e5bd VADDPD 0x120(%RSP),%YMM28,%YMM29 |
(1167) 0x45e5c5 VADDPD %YMM26,%YMM23,%YMM31 |
(1167) 0x45e5cb VMULPD %YMM29,%YMM29,%YMM29 |
(1167) 0x45e5d1 VMOVAPD %YMM6,%YMM22 |
(1167) 0x45e5d7 VADDPD %YMM27,%YMM19,%YMM6 |
(1167) 0x45e5dd VFMADD231PD %YMM31,%YMM31,%YMM29 |
(1167) 0x45e5e3 VFMADD231PD %YMM6,%YMM6,%YMM29 |
(1167) 0x45e5e9 VCMPPD $0x1,%YMM5,%YMM29,%K2 |
(1167) 0x45e5f0 VADDPD %YMM28,%YMM17,%YMM6 |
(1167) 0x45e5f6 VADDPD %YMM26,%YMM18,%YMM31 |
(1167) 0x45e5fc VMINPD %YMM5,%YMM29,%YMM5 |
(1167) 0x45e602 VADDPD %YMM27,%YMM16,%YMM29 |
(1167) 0x45e608 VMULPD %YMM6,%YMM6,%YMM6 |
(1167) 0x45e60c VFMADD231PD %YMM31,%YMM31,%YMM6 |
(1167) 0x45e612 VFMADD231PD %YMM29,%YMM29,%YMM6 |
(1167) 0x45e618 VADDPD %YMM28,%YMM13,%YMM29 |
(1167) 0x45e61e VCMPPD $0x1,%YMM5,%YMM6,%K3 |
(1167) 0x45e625 VADDPD %YMM26,%YMM15,%YMM31 |
(1167) 0x45e62b VMULPD %YMM29,%YMM29,%YMM29 |
(1167) 0x45e631 VFMADD231PD %YMM31,%YMM31,%YMM29 |
(1167) 0x45e637 VADDPD %YMM27,%YMM30,%YMM31 |
(1167) 0x45e63d VFMADD231PD %YMM31,%YMM31,%YMM29 |
(1167) 0x45e643 VMINPD %YMM5,%YMM6,%YMM5 |
(1167) 0x45e647 VADDPD %YMM28,%YMM11,%YMM6 |
(1167) 0x45e64d VADDPD %YMM26,%YMM12,%YMM31 |
(1167) 0x45e653 VMULPD %YMM6,%YMM6,%YMM6 |
(1167) 0x45e657 VFMADD231PD %YMM31,%YMM31,%YMM6 |
(1167) 0x45e65d VMOVAPD %YMM7,%YMM31 |
(1167) 0x45e663 VMOVAPD %YMM20,%YMM7 |
(1167) 0x45e669 VCMPPD $0x1,%YMM5,%YMM29,%K4 |
(1167) 0x45e670 VMINPD %YMM5,%YMM29,%YMM5 |
(1167) 0x45e676 VADDPD %YMM27,%YMM10,%YMM29 |
(1167) 0x45e67c VFMADD231PD %YMM29,%YMM29,%YMM6 |
(1167) 0x45e682 VCMPPD $0x1,%YMM5,%YMM6,%K5 |
(1167) 0x45e689 VMINPD %YMM5,%YMM6,%YMM5 |
(1167) 0x45e68d VADDPD %YMM28,%YMM8,%YMM6 |
(1167) 0x45e693 VADDPD %YMM26,%YMM9,%YMM29 |
(1167) 0x45e699 VMULPD %YMM6,%YMM6,%YMM6 |
(1167) 0x45e69d VFMADD231PD %YMM29,%YMM29,%YMM6 |
(1167) 0x45e6a3 VADDPD %YMM27,%YMM31,%YMM29 |
(1167) 0x45e6a9 VFMADD231PD %YMM29,%YMM29,%YMM6 |
(1167) 0x45e6af VCMPPD $0x1,%YMM5,%YMM6,%K6 |
(1167) 0x45e6b6 VMINPD %YMM5,%YMM6,%YMM5 |
(1167) 0x45e6ba VMOVAPD %YMM22,%YMM6 |
(1167) 0x45e6c0 VCMPPD $0x1,%YMM3,%YMM4,%YMM3 |
(1167) 0x45e6c5 VSQRTPD %YMM5,%YMM4 |
(1167) 0x45e6c9 VMOVAPD %YMM0,%YMM5 |
(1167) 0x45e6cd VMOVAPD %YMM1,%YMM0 |
(1167) 0x45e6d1 VMOVAPD %YMM2,%YMM1 |
(1167) 0x45e6d5 VMOVAPD %YMM14,%YMM2 |
(1167) 0x45e6d9 VANDPD 0x37965(%RIP){1to4},%YMM3,%YMM3 |
(1167) 0x45e6e3 VPBROADCASTQ 0x3dc63(%RIP),%YMM3{%K1} |
(1167) 0x45e6ed VPBROADCASTQ 0x3dc61(%RIP),%YMM3{%K2} |
(1167) 0x45e6f7 VPBROADCASTQ 0x3dc5f(%RIP),%YMM3{%K3} |
(1167) 0x45e701 VPBROADCASTQ 0x3dc5d(%RIP),%YMM3{%K4} |
(1167) 0x45e70b VPBROADCASTQ 0x3dc5b(%RIP),%YMM3{%K5} |
(1167) 0x45e715 VPBROADCASTQ 0x3dc59(%RIP),%YMM3{%K6} |
(1167) 0x45e71f KXNORW %K0,%K0,%K1 |
(1167) 0x45e723 VMOVUPD %YMM4,(%RCX,%RAX,8) |
(1167) 0x45e728 VXORPD %XMM4,%XMM4,%XMM4 |
(1167) 0x45e72c VGATHERQPD 0x90(%RDI,%YMM3,8),%YMM4{%K1} |
(1167) 0x45e734 VADDPD %YMM28,%YMM4,%YMM4 |
(1167) 0x45e73a VMULPD %YMM25,%YMM4,%YMM4 |
(1167) 0x45e740 KXNORW %K0,%K0,%K1 |
(1167) 0x45e744 VMOVUPD %YMM4,(%R10,%RAX,8) |
(1167) 0x45e74a VXORPD %XMM4,%XMM4,%XMM4 |
(1167) 0x45e74e VGATHERQPD 0xd0(%RDI,%YMM3,8),%YMM4{%K1} |
(1167) 0x45e756 VADDPD %YMM26,%YMM4,%YMM4 |
(1167) 0x45e75c VMULPD %YMM25,%YMM4,%YMM4 |
(1167) 0x45e762 KXNORW %K0,%K0,%K1 |
(1167) 0x45e766 VMOVUPD %YMM4,(%R8,%RAX,8) |
(1167) 0x45e76c VXORPD %XMM4,%XMM4,%XMM4 |
(1167) 0x45e770 VGATHERQPD 0x110(%RDI,%YMM3,8),%YMM4{%K1} |
(1167) 0x45e778 VADDPD %YMM27,%YMM4,%YMM3 |
(1167) 0x45e77e VMULPD %YMM25,%YMM3,%YMM3 |
(1167) 0x45e784 VMOVUPD %YMM3,(%R11,%RAX,8) |
(1167) 0x45e78a ADD $0x4,%EDX |
(1167) 0x45e78d CMP %EBX,%EDX |
(1167) 0x45e78f JBE 45e420 |
0x45e795 VMOVDQU64 %XMM21,0x230(%RSP) |
0x45e79d VMOVUPD 0x160(%RSP),%YMM20 |
0x45e7a5 VMOVUPD 0x460(%RSP),%YMM14 |
0x45e7ae VMOVUPD 0x440(%RSP),%YMM4 |
0x45e7b7 VMOVUPD 0x120(%RSP),%YMM27 |
0x45e7bf CMP %R14D,%R15D |
0x45e7c2 JE 45edd3 |
0x45e7c8 VMOVAPD %YMM23,%YMM28 |
0x45e7ce VMOVAPD %YMM15,%YMM23 |
0x45e7d4 VPBROADCASTD %R15D,%XMM15 |
0x45e7da VMOVDQU64 0x140(%RSP),%YMM21 |
0x45e7e2 VMOVUPD %YMM8,0xe0(%RSP) |
0x45e7eb VMOVUPD %YMM9,0x100(%RSP) |
0x45e7f4 VMOVUPD %YMM10,0xc0(%RSP) |
0x45e7fd VMOVUPD %YMM11,0xa0(%RSP) |
0x45e806 VMOVUPD %YMM12,0x80(%RSP) |
0x45e80f VMOVUPD %YMM30,0x60(%RSP) |
0x45e817 VMOVUPD %YMM24,0x240(%RSP) |
0x45e81f VMOVUPD %YMM13,0x20(%RSP) |
0x45e825 VMOVUPD %YMM23,0x40(%RSP) |
0x45e82d VMOVUPD %YMM16,(%RSP) |
0x45e834 VMOVUPD %YMM17,0x2a0(%RSP) |
0x45e83c VMOVUPD %YMM18,0x280(%RSP) |
0x45e844 VMOVUPD %YMM19,0x260(%RSP) |
0x45e84c VMOVAPD %YMM4,%YMM18 |
0x45e852 VMOVAPD %YMM5,%YMM16 |
0x45e858 VMOVAPD %YMM6,%YMM17 |
0x45e85e VMOVAPD %YMM14,%YMM19 |
0x45e864 VMOVAPD %YMM20,%YMM23 |
0x45e86a VMOVUPD 0x420(%RSP),%YMM26 |
0x45e872 VMOVUPD 0x400(%RSP),%YMM20 |
0x45e87a VMOVUPD 0x3e0(%RSP),%YMM24 |
0x45e882 VMOVUPD 0x3c0(%RSP),%YMM30 |
0x45e88a VMOVUPD 0x3a0(%RSP),%YMM25 |
0x45e892 VMOVUPD 0x380(%RSP),%YMM5 |
0x45e89b VMOVUPD 0x360(%RSP),%YMM8 |
0x45e8a4 VMOVUPD 0x340(%RSP),%YMM9 |
0x45e8ad VMOVUPD 0x320(%RSP),%YMM11 |
0x45e8b6 VMOVUPD 0x300(%RSP),%YMM10 |
0x45e8bf VMOVUPD 0x2e0(%RSP),%YMM22 |
0x45e8c7 VMOVUPD 0x2c0(%RSP),%YMM29 |
0x45e8cf VMOVDQU 0x230(%RSP),%XMM6 |
0x45e8d8 JMP 45eabb |
0x45e8dd VMOVUPD %XMM31,0x160(%RSP) |
0x45e8e5 VBROADCASTSD %XMM10,%YMM31 |
0x45e8eb VBROADCASTSD %XMM9,%YMM9 |
0x45e8f0 VBROADCASTSD %XMM8,%YMM10 |
0x45e8f5 VBROADCASTSD %XMM4,%YMM8 |
0x45e8fa VBROADCASTSD %XMM5,%YMM5 |
0x45e8ff VBROADCASTSD %XMM2,%YMM0 |
0x45e904 VMOVUPS %YMM0,0x1a0(%RSP) |
0x45e90d VMOVAPD %XMM29,%XMM4 |
0x45e913 VBROADCASTSD %XMM1,%YMM29 |
0x45e919 VBROADCASTSD %XMM3,%YMM2 |
0x45e91e VBROADCASTSD %XMM7,%YMM1 |
0x45e923 VMOVUPS %YMM1,0x1c0(%RSP) |
0x45e92c VBROADCASTSD %XMM6,%YMM1 |
0x45e931 VMOVUPS %YMM1,0x1e0(%RSP) |
0x45e93a VBROADCASTSD %XMM22,%YMM0 |
0x45e940 VMOVAPD %YMM2,%YMM22 |
0x45e946 VMOVUPD %YMM0,0x200(%RSP) |
0x45e94f VBROADCASTSD %XMM30,%YMM30 |
0x45e955 VBROADCASTSD %XMM25,%YMM2 |
0x45e95b VBROADCASTSD %XMM24,%YMM0 |
0x45e961 VMOVUPS %YMM0,0x180(%RSP) |
0x45e96a VBROADCASTSD %XMM23,%YMM7 |
0x45e970 VBROADCASTSD %XMM11,%YMM1 |
0x45e975 VMOVAPD %YMM8,%YMM11 |
0x45e97a VMOVAPD %YMM10,%YMM8 |
0x45e97f VMOVAPD %YMM31,%YMM10 |
0x45e985 VBROADCASTSD %XMM21,%YMM23 |
0x45e98b VBROADCASTSD %XMM28,%YMM0 |
0x45e991 VMOVUPD %YMM0,0x240(%RSP) |
0x45e99a VBROADCASTSD %XMM27,%YMM0 |
0x45e9a0 VBROADCASTSD %XMM26,%YMM25 |
0x45e9a6 VBROADCASTSD %XMM19,%YMM24 |
0x45e9ac VBROADCASTSD %XMM18,%YMM26 |
0x45e9b2 VBROADCASTSD %XMM20,%YMM20 |
0x45e9b8 VBROADCASTSD %XMM17,%YMM19 |
0x45e9be VBROADCASTSD %XMM16,%YMM16 |
0x45e9c4 VBROADCASTSD %XMM15,%YMM17 |
0x45e9ca VBROADCASTSD %XMM14,%YMM18 |
0x45e9d0 VBROADCASTSD 0x120(%RSP),%YMM27 |
0x45e9d8 VBROADCASTSD (%RSP),%YMM28 |
0x45e9df VBROADCASTSD 0x20(%RSP),%YMM3 |
0x45e9e6 VMOVUPS %YMM3,0x260(%RSP) |
0x45e9ef VBROADCASTSD 0x40(%RSP),%YMM3 |
0x45e9f6 VMOVUPS %YMM3,0x2a0(%RSP) |
0x45e9ff VBROADCASTSD 0x60(%RSP),%YMM3 |
0x45ea06 VMOVUPS %YMM3,0x280(%RSP) |
0x45ea0f VBROADCASTSD 0x80(%RSP),%YMM3 |
0x45ea19 VMOVUPS %YMM3,(%RSP) |
0x45ea1e VBROADCASTSD %XMM13,%YMM3 |
0x45ea23 VMOVUPD %YMM3,0x20(%RSP) |
0x45ea29 VBROADCASTSD 0xa0(%RSP),%YMM3 |
0x45ea33 VMOVUPS %YMM3,0x40(%RSP) |
0x45ea39 VBROADCASTSD 0xc0(%RSP),%YMM3 |
0x45ea43 VMOVUPS %YMM3,0x60(%RSP) |
0x45ea49 VBROADCASTSD 0xe0(%RSP),%YMM3 |
0x45ea53 VMOVUPS %YMM3,0xa0(%RSP) |
0x45ea5c VBROADCASTSD %XMM12,%YMM3 |
0x45ea61 VMOVUPD %YMM3,0x80(%RSP) |
0x45ea6a VBROADCASTSD 0x100(%RSP),%YMM3 |
0x45ea74 VMOVUPS %YMM3,0xc0(%RSP) |
0x45ea7d VBROADCASTSD %XMM4,%YMM3 |
0x45ea82 VMOVUPD %YMM3,0xe0(%RSP) |
0x45ea8b VPBROADCASTQ 0x140(%RSP),%YMM3 |
0x45ea95 VMOVDQU %YMM3,0x100(%RSP) |
0x45ea9e VBROADCASTSD 0x160(%RSP),%YMM31 |
0x45eaa6 XOR %R14D,%R14D |
0x45eaa9 VPBROADCASTD %R15D,%XMM15 |
0x45eaaf VPBROADCASTD %EAX,%XMM6 |
0x45eab5 VPBROADCASTQ %RDI,%YMM21 |
0x45eabb VMOVDQU 0x3d8bd(%RIP),%XMM3 |
0x45eac3 VPBROADCASTD %R14D,%XMM4 |
0x45eac9 VPADDD %XMM3,%XMM4,%XMM4 |
0x45eacd VPCMPLTUD %XMM15,%XMM4,%K1 |
0x45ead4 ADD %R14D,%R9D |
0x45ead7 VPBROADCASTD %R9D,%XMM4 |
0x45eadd VPADDD %XMM3,%XMM4,%XMM3 |
0x45eae1 VPCMPGTD %XMM3,%XMM6,%K2 |
0x45eae7 MOVSXD %R9D,%RDX |
0x45eaea VMOVUPD (%R13,%RDX,8),%YMM3{%K1}{z} |
0x45eaf2 VMOVUPD (%R12,%RDX,8),%YMM4{%K1}{z} |
0x45eaf9 VSUBPD %YMM10,%YMM3,%YMM14 |
0x45eafe VSUBPD %YMM9,%YMM4,%YMM4 |
0x45eb03 VBROADCASTSD 0x37524(%RIP),%YMM3 |
0x45eb0c VMOVUPD (%RSI,%RDX,8),%YMM13{%K1}{z} |
0x45eb13 VSUBPD %YMM8,%YMM13,%YMM12 |
0x45eb18 VBROADCASTSD 0x37506(%RIP),%YMM3{%K2} |
0x45eb22 VMULPD %YMM3,%YMM14,%YMM13 |
0x45eb26 VMULPD %YMM3,%YMM4,%YMM4 |
0x45eb2a VMULPD %YMM13,%YMM11,%YMM14 |
0x45eb2f VFMADD231PD %YMM5,%YMM4,%YMM14 |
0x45eb34 VMULPD %YMM3,%YMM12,%YMM11 |
0x45eb38 VFMADD231PD 0x1a0(%RSP),%YMM11,%YMM14 |
0x45eb42 VMULPD %YMM13,%YMM29,%YMM9 |
0x45eb48 VFMADD231PD %YMM22,%YMM4,%YMM9 |
0x45eb4e VFMADD231PD 0x1c0(%RSP),%YMM11,%YMM9 |
0x45eb58 VMULPD 0x1e0(%RSP),%YMM13,%YMM6 |
0x45eb61 VFMADD231PD 0x200(%RSP),%YMM4,%YMM6 |
0x45eb6b VFMADD231PD %YMM30,%YMM11,%YMM6 |
0x45eb71 VROUNDPD $0x9,%YMM14,%YMM5 |
0x45eb77 VFMSUB213PD %YMM13,%YMM5,%YMM2 |
0x45eb7c VFMSUB213PD %YMM4,%YMM5,%YMM1 |
0x45eb81 VFMSUB213PD %YMM11,%YMM5,%YMM0 |
0x45eb86 VROUNDPD $0x9,%YMM9,%YMM4 |
0x45eb8c VFMADD231PD 0x180(%RSP),%YMM4,%YMM2 |
0x45eb96 VFMADD231PD %YMM23,%YMM4,%YMM1 |
0x45eb9c VFMADD231PD %YMM25,%YMM4,%YMM0 |
0x45eba2 VROUNDPD $0x9,%YMM6,%YMM4 |
0x45eba8 VFNMSUB231PD %YMM7,%YMM4,%YMM2 |
0x45ebad VFNMSUB231PD 0x240(%RSP),%YMM4,%YMM1 |
0x45ebb7 VFNMSUB231PD %YMM24,%YMM4,%YMM0 |
0x45ebbd VADDPD %YMM2,%YMM26,%YMM4 |
0x45ebc3 VADDPD %YMM1,%YMM20,%YMM5 |
0x45ebc9 VMULPD %YMM4,%YMM4,%YMM4 |
0x45ebcd VFMADD231PD %YMM5,%YMM5,%YMM4 |
0x45ebd2 VADDPD %YMM0,%YMM19,%YMM5 |
0x45ebd8 VFMADD231PD %YMM5,%YMM5,%YMM4 |
0x45ebdd VADDPD %YMM2,%YMM16,%YMM5 |
0x45ebe3 VADDPD %YMM1,%YMM17,%YMM6 |
0x45ebe9 VMULPD %YMM5,%YMM5,%YMM7 |
0x45ebed VFMADD231PD %YMM6,%YMM6,%YMM7 |
0x45ebf2 VMULPD %YMM2,%YMM2,%YMM5 |
0x45ebf6 VFMADD231PD %YMM1,%YMM1,%YMM5 |
0x45ebfb VFMADD231PD %YMM0,%YMM0,%YMM5 |
0x45ec00 VADDPD %YMM0,%YMM18,%YMM6 |
0x45ec06 VFMADD231PD %YMM6,%YMM6,%YMM7 |
0x45ec0b VMINPD %YMM5,%YMM4,%YMM6 |
0x45ec0f VCMPPD $0x1,%YMM6,%YMM7,%K2 |
0x45ec16 VMINPD %YMM6,%YMM7,%YMM6 |
0x45ec1a VADDPD %YMM2,%YMM27,%YMM7 |
0x45ec20 VADDPD %YMM1,%YMM28,%YMM8 |
0x45ec26 VMULPD %YMM7,%YMM7,%YMM7 |
0x45ec2a VFMADD231PD %YMM8,%YMM8,%YMM7 |
0x45ec2f VADDPD 0x260(%RSP),%YMM0,%YMM8 |
0x45ec38 VFMADD231PD %YMM8,%YMM8,%YMM7 |
0x45ec3d VCMPPD $0x1,%YMM6,%YMM7,%K3 |
0x45ec44 VMINPD %YMM6,%YMM7,%YMM6 |
0x45ec48 VADDPD 0x2a0(%RSP),%YMM2,%YMM7 |
0x45ec51 VADDPD 0x280(%RSP),%YMM1,%YMM8 |
0x45ec5a VMULPD %YMM7,%YMM7,%YMM7 |
0x45ec5e VFMADD231PD %YMM8,%YMM8,%YMM7 |
0x45ec63 VADDPD (%RSP),%YMM0,%YMM8 |
0x45ec68 VFMADD231PD %YMM8,%YMM8,%YMM7 |
0x45ec6d VCMPPD $0x1,%YMM6,%YMM7,%K4 |
0x45ec74 VMINPD %YMM6,%YMM7,%YMM6 |
0x45ec78 VADDPD 0x20(%RSP),%YMM2,%YMM7 |
0x45ec7e VADDPD 0x40(%RSP),%YMM1,%YMM8 |
0x45ec84 VMULPD %YMM7,%YMM7,%YMM7 |
0x45ec88 VFMADD231PD %YMM8,%YMM8,%YMM7 |
0x45ec8d VADDPD 0x60(%RSP),%YMM0,%YMM8 |
0x45ec93 VFMADD231PD %YMM8,%YMM8,%YMM7 |
0x45ec98 VCMPPD $0x1,%YMM6,%YMM7,%K5 |
0x45ec9f VMINPD %YMM6,%YMM7,%YMM6 |
0x45eca3 VADDPD 0xa0(%RSP),%YMM2,%YMM7 |
0x45ecac VADDPD 0x80(%RSP),%YMM1,%YMM8 |
0x45ecb5 VMULPD %YMM7,%YMM7,%YMM7 |
0x45ecb9 VFMADD231PD %YMM8,%YMM8,%YMM7 |
0x45ecbe VADDPD 0xc0(%RSP),%YMM0,%YMM8 |
0x45ecc7 VFMADD231PD %YMM8,%YMM8,%YMM7 |
0x45eccc VCMPPD $0x1,%YMM6,%YMM7,%K6 |
0x45ecd3 VMINPD %YMM6,%YMM7,%YMM6 |
0x45ecd7 VADDPD 0xe0(%RSP),%YMM2,%YMM7 |
0x45ece0 VADDPD 0x100(%RSP),%YMM1,%YMM8 |
0x45ece9 VMULPD %YMM7,%YMM7,%YMM7 |
0x45eced VFMADD231PD %YMM8,%YMM8,%YMM7 |
0x45ecf2 VADDPD %YMM0,%YMM31,%YMM8 |
0x45ecf8 VFMADD231PD %YMM8,%YMM8,%YMM7 |
0x45ecfd VMINPD %YMM6,%YMM7,%YMM8 |
0x45ed01 VSQRTPD %YMM8,%YMM8 |
0x45ed06 VMOVUPD %YMM8,(%RCX,%RDX,8){%K1} |
0x45ed0d VCMPPD $0x1,%YMM6,%YMM7,%K7 |
0x45ed14 VCMPPD $0x1,%YMM5,%YMM4,%YMM4 |
0x45ed19 VANDPD 0x37325(%RIP){1to4},%YMM4,%YMM4 |
0x45ed23 VPBROADCASTQ 0x3d623(%RIP),%YMM4{%K2} |
0x45ed2d VPBROADCASTQ 0x3d621(%RIP),%YMM4{%K3} |
0x45ed37 VPBROADCASTQ 0x3d61f(%RIP),%YMM4{%K4} |
0x45ed41 VPBROADCASTQ 0x3d61d(%RIP),%YMM4{%K5} |
0x45ed4b VPBROADCASTQ 0x3d61b(%RIP),%YMM4{%K6} |
0x45ed55 VPBROADCASTQ 0x3d619(%RIP),%YMM4{%K7} |
0x45ed5f VPSLLQ $0x3,%YMM4,%YMM4 |
0x45ed64 VPADDQ %YMM4,%YMM21,%YMM4 |
0x45ed6a VXORPD %XMM5,%XMM5,%XMM5 |
0x45ed6e KMOVQ %K1,%K2 |
0x45ed73 VGATHERQPD 0x90(,%YMM4,1),%YMM5{%K2} |
0x45ed7e VADDPD %YMM2,%YMM5,%YMM2 |
0x45ed82 VMULPD %YMM3,%YMM2,%YMM2 |
0x45ed86 VMOVUPD %YMM2,(%R10,%RDX,8){%K1} |
0x45ed8d VXORPD %XMM2,%XMM2,%XMM2 |
0x45ed91 KMOVQ %K1,%K2 |
0x45ed96 VGATHERQPD 0xd0(,%YMM4,1),%YMM2{%K2} |
0x45eda1 VADDPD %YMM1,%YMM2,%YMM1 |
0x45eda5 VMULPD %YMM3,%YMM1,%YMM1 |
0x45eda9 VMOVUPD %YMM1,(%R8,%RDX,8){%K1} |
0x45edb0 VXORPD %XMM1,%XMM1,%XMM1 |
0x45edb4 KMOVQ %K1,%K2 |
0x45edb9 VGATHERQPD 0x110(,%YMM4,1),%YMM1{%K2} |
0x45edc4 VADDPD %YMM0,%YMM1,%YMM0 |
0x45edc8 VMULPD %YMM3,%YMM0,%YMM0 |
0x45edcc VMOVUPD %YMM0,(%R11,%RDX,8){%K1} |
0x45edd3 LEA -0x28(%RBP),%RSP |
0x45edd7 POP %RBX |
0x45edd8 POP %R12 |
0x45edda POP %R13 |
0x45eddc POP %R14 |
0x45edde POP %R15 |
0x45ede0 POP %RBP |
0x45ede1 VZEROUPPER |
0x45ede4 RET |
0x45ede5 NOPW %CS:(%RAX,%RAX,1) |
0x45edef NOP |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►64.44+ | qmcplusplus::DistanceTableAA<d[...] | DistanceTableAA.h:83 | exec |
○ | qmcplusplus::ParticleSet::make[...] | ParticleSet.cpp:290 | exec |
○ | main.extracted.104 | miniqmc.cpp:482 | exec |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_fork_call | libiomp5.so | |
○ | __kmpc_fork_call | libiomp5.so | |
○ | main | miniqmc.cpp:404 | exec |
○ | __libc_init_first | libc.so.6 | |
►15.56+ | qmcplusplus::DistanceTableAA<d[...] | DistanceTableAA.h:83 | exec |
○ | qmcplusplus::ParticleSet::make[...] | ParticleSet.cpp:290 | exec |
○ | main.extracted.104 | refwrap.h:347 | exec |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_fork_call | libiomp5.so | |
○ | __kmpc_fork_call | libiomp5.so | |
○ | main | miniqmc.cpp:404 | exec |
○ | __libc_init_first | libc.so.6 | |
►8.89+ | qmcplusplus::DistanceTableBA<d[...] | DistanceTableBA.h:119 | exec |
○ | qmcplusplus::ParticleSet::make[...] | ParticleSet.cpp:290 | exec |
○ | main.extracted.104 | miniqmc.cpp:482 | exec |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_fork_call | libiomp5.so | |
○ | __kmpc_fork_call | libiomp5.so | |
○ | main | miniqmc.cpp:404 | exec |
○ | __libc_init_first | libc.so.6 | |
►6.67+ | qmcplusplus::DistanceTableAA<d[...] | DistanceTableAA.h:76 | exec |
○ | qmcplusplus::ParticleSet::setA[...] | ParticleSet.cpp:259 | exec |
○ | main.extracted.104 | refwrap.h:347 | exec |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_fork_call | libiomp5.so | |
○ | __kmpc_fork_call | libiomp5.so | |
○ | main | miniqmc.cpp:404 | exec |
○ | __libc_init_first | libc.so.6 | |
►2.22+ | qmcplusplus::DistanceTableAA<d[...] | DistanceTableAA.h:69 | exec |
○ | qmcplusplus::ParticleSet::upda[...] | stl_vector.h:990 | exec |
○ | main.extracted.107 | miniqmc.cpp:390 | exec |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_fork_call | libiomp5.so | |
○ | __kmpc_fork_call | libiomp5.so | |
○ | main | miniqmc.cpp:374 | exec |
○ | __libc_init_first | libc.so.6 | |
►2.22+ | qmcplusplus::DistanceTableBA<d[...] | DistanceTableBA.h:113 | exec |
○ | qmcplusplus::ParticleSet::setA[...] | ParticleSet.cpp:259 | exec |
○ | main.extracted.104 | refwrap.h:347 | exec |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_fork_call | libiomp5.so | |
○ | __kmpc_fork_call | libiomp5.so | |
○ | main | miniqmc.cpp:404 | exec |
○ | __libc_init_first | libc.so.6 |
Path / |
Source file and lines | ParticleBConds.h:166-219 |
Module | exec |
nb instructions | 402 |
nb uops | 416 |
loop length | 2587 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 32 |
used ymm registers | 32 |
used zmm registers | 0 |
nb stack references | 39 |
ADD-SUB / MUL ratio | 1.59 |
micro-operation queue | 104.00 cycles |
front end | 104.00 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | |
---|---|---|---|---|---|---|---|---|
uops | 52.33 | 52.67 | 71.67 | 71.67 | 76.00 | 79.00 | 17.00 | 71.67 |
cycles | 52.33 | 52.67 | 71.67 | 71.67 | 76.00 | 79.00 | 17.00 | 71.67 |
Cycles executing div or sqrt instructions | 9.00-12.00 |
FE+BE cycles | 250.45 |
Stall cycles | 148.24 |
RS full (events) | 21.03 |
LB full (events) | 142.98 |
Front-end | 104.00 |
Dispatch | 79.00 |
DIV/SQRT | 9.00-12.00 |
Overall L1 | 104.00 |
all | 41% |
load | 27% |
store | 100% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 75% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 20% |
all | 60% |
load | 38% |
store | 100% |
mul | 100% |
add-sub | 100% |
fma | 100% |
div/sqrt | 100% |
other | 29% |
all | 59% |
load | 37% |
store | 100% |
mul | 100% |
add-sub | 96% |
fma | 100% |
div/sqrt | 100% |
other | 28% |
all | 19% |
load | 17% |
store | 41% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 26% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 14% |
all | 34% |
load | 26% |
store | 45% |
mul | 50% |
add-sub | 50% |
fma | 50% |
div/sqrt | 50% |
other | 22% |
all | 32% |
load | 26% |
store | 45% |
mul | 50% |
add-sub | 46% |
fma | 50% |
div/sqrt | 50% |
other | 21% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSH %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
AND $-0x20,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SUB $0x4a0,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV 0x10(%RBP),%R15D | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
SUB %R9D,%R15D | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JLE 45edd3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
VMOVSD (%RSI),%XMM10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x8(%RSI),%XMM9 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x10(%RSI),%XMM8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x18(%RBP),%EAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x8(%RDX),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x18(%RDX),%R13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (,%RSI,8),%R12 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %R13,%R12 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SAL $0x4,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
ADD %R13,%RSI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV 0x8(%R8),%R11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x18(%R8),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%R10,%R11,8),%R8 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
SAL $0x4,%R11 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
VMOVSD (%RDI),%XMM4 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x8(%RDI),%XMM5 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x10(%RDI),%XMM2 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x18(%RDI),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x20(%RDI),%XMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x28(%RDI),%XMM7 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x30(%RDI),%XMM6 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x38(%RDI),%XMM22 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x40(%RDI),%XMM30 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x48(%RDI),%XMM25 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x50(%RDI),%XMM24 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x58(%RDI),%XMM23 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x60(%RDI),%XMM11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x68(%RDI),%XMM21 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x70(%RDI),%XMM28 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x78(%RDI),%XMM27 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x80(%RDI),%XMM26 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x88(%RDI),%XMM19 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x98(%RDI),%XMM18 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0xd8(%RDI),%XMM20 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x118(%RDI),%XMM17 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0xa0(%RDI),%XMM16 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0xe0(%RDI),%XMM15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x120(%RDI),%XMM14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0xa8(%RDI),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM0,0x120(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0xe8(%RDI),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM0,(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0x128(%RDI),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM0,0x20(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0xb0(%RDI),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM0,0x40(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0xf0(%RDI),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM0,0x60(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0x130(%RDI),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM0,0x80(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0xb8(%RDI),%XMM13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0xf8(%RDI),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM0,0xa0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0x138(%RDI),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM0,0xc0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0xc0(%RDI),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM0,0xe0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0x100(%RDI),%XMM12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x140(%RDI),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM0,0x100(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0xc8(%RDI),%XMM29 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD %R10,%R11 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %R15D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVSD 0x108(%RDI),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM0,0x140(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0x148(%RDI),%XMM31 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
AND $-0x4,%R14D | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 45e8dd | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
LEA -0x1(%R14),%EBX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
VBROADCASTSD %XMM10,%YMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM10,0x300(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM9,%YMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM9,0x340(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM8,%YMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM8,0x360(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM4,%YMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM4,0x320(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM5,%YMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM4,0x380(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM2,%YMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM2,0x1a0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM1,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM1,0x2c0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM3,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM1,0x2e0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM7,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM1,0x1c0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM6,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM1,0x1e0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM22,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x200(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM30,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x3c0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM25,%YMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM24,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM0,0x180(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM23,%YMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM11,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM21,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x160(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM28,%YMM24 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM27,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM26,%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM3,0x3a0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM19,%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM3,0x3e0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM18,%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM3,0x420(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM20,%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM3,0x400(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM17,%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM3,0x460(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM16,%YMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM15,%YMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM14,%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM3,0x440(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD 0x120(%RSP),%YMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMOVUPS %YMM3,0x120(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD (%RSP),%YMM23 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VBROADCASTSD 0x20(%RSP),%YMM19 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VBROADCASTSD 0x40(%RSP),%YMM17 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VBROADCASTSD 0x60(%RSP),%YMM18 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VBROADCASTSD 0x80(%RSP),%YMM16 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VBROADCASTSD %XMM13,%YMM13 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD 0xa0(%RSP),%YMM15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VBROADCASTSD 0xc0(%RSP),%YMM30 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VBROADCASTSD 0xe0(%RSP),%YMM11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VBROADCASTSD %XMM12,%YMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD 0x100(%RSP),%YMM10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VBROADCASTSD %XMM29,%YMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD 0x140(%RSP),%YMM9 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VBROADCASTSD %XMM31,%YMM31 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VPBROADCASTD %EAX,%XMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VPBROADCASTQ %RDI,%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VMOVDQU %YMM3,0x140(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 4 | 1 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVDQU64 %XMM21,0x230(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 4 | 1 |
VMOVUPD 0x160(%RSP),%YMM20 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x460(%RSP),%YMM14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x440(%RSP),%YMM4 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x120(%RSP),%YMM27 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
CMP %R14D,%R15D | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 45edd3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
VMOVAPD %YMM23,%YMM28 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVAPD %YMM15,%YMM23 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VPBROADCASTD %R15D,%XMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VMOVDQU64 0x140(%RSP),%YMM21 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMOVUPD %YMM8,0xe0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %YMM9,0x100(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %YMM10,0xc0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %YMM11,0xa0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %YMM12,0x80(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %YMM30,0x60(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %YMM24,0x240(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %YMM13,0x20(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %YMM23,0x40(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %YMM16,(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %YMM17,0x2a0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %YMM18,0x280(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %YMM19,0x260(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVAPD %YMM4,%YMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVAPD %YMM5,%YMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVAPD %YMM6,%YMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVAPD %YMM14,%YMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVAPD %YMM20,%YMM23 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVUPD 0x420(%RSP),%YMM26 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x400(%RSP),%YMM20 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x3e0(%RSP),%YMM24 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x3c0(%RSP),%YMM30 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x3a0(%RSP),%YMM25 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x380(%RSP),%YMM5 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x360(%RSP),%YMM8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x340(%RSP),%YMM9 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x320(%RSP),%YMM11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x300(%RSP),%YMM10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x2e0(%RSP),%YMM22 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x2c0(%RSP),%YMM29 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVDQU 0x230(%RSP),%XMM6 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
JMP 45eabb | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
VMOVUPD %XMM31,0x160(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM10,%YMM31 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM9,%YMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM8,%YMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM4,%YMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM5,%YMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM2,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM0,0x1a0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVAPD %XMM29,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD %XMM1,%YMM29 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM3,%YMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM7,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM1,0x1c0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM6,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM1,0x1e0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM22,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVAPD %YMM2,%YMM22 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVUPD %YMM0,0x200(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM30,%YMM30 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM25,%YMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM24,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM0,0x180(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM23,%YMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM11,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVAPD %YMM8,%YMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVAPD %YMM10,%YMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVAPD %YMM31,%YMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD %XMM21,%YMM23 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM28,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x240(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM27,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM26,%YMM25 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM19,%YMM24 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM18,%YMM26 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM20,%YMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM17,%YMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM16,%YMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM15,%YMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM14,%YMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD 0x120(%RSP),%YMM27 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VBROADCASTSD (%RSP),%YMM28 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VBROADCASTSD 0x20(%RSP),%YMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMOVUPS %YMM3,0x260(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD 0x40(%RSP),%YMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMOVUPS %YMM3,0x2a0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD 0x60(%RSP),%YMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMOVUPS %YMM3,0x280(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD 0x80(%RSP),%YMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMOVUPS %YMM3,(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM13,%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM3,0x20(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD 0xa0(%RSP),%YMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMOVUPS %YMM3,0x40(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD 0xc0(%RSP),%YMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMOVUPS %YMM3,0x60(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD 0xe0(%RSP),%YMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMOVUPS %YMM3,0xa0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM12,%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM3,0x80(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD 0x100(%RSP),%YMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMOVUPS %YMM3,0xc0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM4,%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM3,0xe0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VPBROADCASTQ 0x140(%RSP),%YMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVDQU %YMM3,0x100(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 4 | 1 |
VBROADCASTSD 0x160(%RSP),%YMM31 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
XOR %R14D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VPBROADCASTD %R15D,%XMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VPBROADCASTD %EAX,%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VPBROADCASTQ %RDI,%YMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VMOVDQU 0x3d8bd(%RIP),%XMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VPBROADCASTD %R14D,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VPADDD %XMM3,%XMM4,%XMM4 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 1 | 0.33 |
VPCMPLTUD %XMM15,%XMM4,%K1 | |||||||||||
ADD %R14D,%R9D | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VPBROADCASTD %R9D,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VPADDD %XMM3,%XMM4,%XMM3 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 1 | 0.33 |
VPCMPGTD %XMM3,%XMM6,%K2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
MOVSXD %R9D,%RDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVUPD (%R13,%RDX,8),%YMM3{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD (%R12,%RDX,8),%YMM4{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VSUBPD %YMM10,%YMM3,%YMM14 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VSUBPD %YMM9,%YMM4,%YMM4 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD 0x37524(%RIP),%YMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMOVUPD (%RSI,%RDX,8),%YMM13{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VSUBPD %YMM8,%YMM13,%YMM12 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD 0x37506(%RIP),%YMM3{%K2} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMULPD %YMM3,%YMM14,%YMM13 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD %YMM3,%YMM4,%YMM4 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD %YMM13,%YMM11,%YMM14 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM5,%YMM4,%YMM14 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD %YMM3,%YMM12,%YMM11 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD 0x1a0(%RSP),%YMM11,%YMM14 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD %YMM13,%YMM29,%YMM9 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM22,%YMM4,%YMM9 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD 0x1c0(%RSP),%YMM11,%YMM9 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD 0x1e0(%RSP),%YMM13,%YMM6 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD 0x200(%RSP),%YMM4,%YMM6 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM30,%YMM11,%YMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VROUNDPD $0x9,%YMM14,%YMM5 | 2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 8 | 1 |
VFMSUB213PD %YMM13,%YMM5,%YMM2 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMSUB213PD %YMM4,%YMM5,%YMM1 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMSUB213PD %YMM11,%YMM5,%YMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VROUNDPD $0x9,%YMM9,%YMM4 | 2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 8 | 1 |
VFMADD231PD 0x180(%RSP),%YMM4,%YMM2 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM23,%YMM4,%YMM1 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM25,%YMM4,%YMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VROUNDPD $0x9,%YMM6,%YMM4 | 2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 8 | 1 |
VFNMSUB231PD %YMM7,%YMM4,%YMM2 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFNMSUB231PD 0x240(%RSP),%YMM4,%YMM1 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFNMSUB231PD %YMM24,%YMM4,%YMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD %YMM2,%YMM26,%YMM4 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD %YMM1,%YMM20,%YMM5 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD %YMM4,%YMM4,%YMM4 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM5,%YMM5,%YMM4 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD %YMM0,%YMM19,%YMM5 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM5,%YMM5,%YMM4 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD %YMM2,%YMM16,%YMM5 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD %YMM1,%YMM17,%YMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD %YMM5,%YMM5,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM6,%YMM6,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD %YMM2,%YMM2,%YMM5 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM1,%YMM1,%YMM5 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM0,%YMM0,%YMM5 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD %YMM0,%YMM18,%YMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM6,%YMM6,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMINPD %YMM5,%YMM4,%YMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VCMPPD $0x1,%YMM6,%YMM7,%K2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMINPD %YMM6,%YMM7,%YMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD %YMM2,%YMM27,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD %YMM1,%YMM28,%YMM8 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD %YMM7,%YMM7,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM8,%YMM8,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD 0x260(%RSP),%YMM0,%YMM8 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM8,%YMM8,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VCMPPD $0x1,%YMM6,%YMM7,%K3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMINPD %YMM6,%YMM7,%YMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD 0x2a0(%RSP),%YMM2,%YMM7 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD 0x280(%RSP),%YMM1,%YMM8 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD %YMM7,%YMM7,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM8,%YMM8,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD (%RSP),%YMM0,%YMM8 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM8,%YMM8,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VCMPPD $0x1,%YMM6,%YMM7,%K4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMINPD %YMM6,%YMM7,%YMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD 0x20(%RSP),%YMM2,%YMM7 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD 0x40(%RSP),%YMM1,%YMM8 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD %YMM7,%YMM7,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM8,%YMM8,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD 0x60(%RSP),%YMM0,%YMM8 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM8,%YMM8,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VCMPPD $0x1,%YMM6,%YMM7,%K5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMINPD %YMM6,%YMM7,%YMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD 0xa0(%RSP),%YMM2,%YMM7 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD 0x80(%RSP),%YMM1,%YMM8 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD %YMM7,%YMM7,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM8,%YMM8,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD 0xc0(%RSP),%YMM0,%YMM8 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM8,%YMM8,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VCMPPD $0x1,%YMM6,%YMM7,%K6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMINPD %YMM6,%YMM7,%YMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD 0xe0(%RSP),%YMM2,%YMM7 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD 0x100(%RSP),%YMM1,%YMM8 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD %YMM7,%YMM7,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM8,%YMM8,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD %YMM0,%YMM31,%YMM8 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM8,%YMM8,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMINPD %YMM6,%YMM7,%YMM8 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VSQRTPD %YMM8,%YMM8 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 13-19 | 9-12 |
VMOVUPD %YMM8,(%RCX,%RDX,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VCMPPD $0x1,%YMM6,%YMM7,%K7 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VCMPPD $0x1,%YMM5,%YMM4,%YMM4 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VANDPD 0x37325(%RIP){1to4},%YMM4,%YMM4 | 1 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0.33 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ 0x3d623(%RIP),%YMM4{%K2} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPBROADCASTQ 0x3d621(%RIP),%YMM4{%K3} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPBROADCASTQ 0x3d61f(%RIP),%YMM4{%K4} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPBROADCASTQ 0x3d61d(%RIP),%YMM4{%K5} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPBROADCASTQ 0x3d61b(%RIP),%YMM4{%K6} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPBROADCASTQ 0x3d619(%RIP),%YMM4{%K7} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPSLLQ $0x3,%YMM4,%YMM4 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %YMM4,%YMM21,%YMM4 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 1 | 0.33 |
VXORPD %XMM5,%XMM5,%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VGATHERQPD 0x90(,%YMM4,1),%YMM5{%K2} | 4 | 1 | 0 | 2 | 2 | 0 | 1 | 0 | 0 | 20 | 4 |
VADDPD %YMM2,%YMM5,%YMM2 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD %YMM3,%YMM2,%YMM2 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVUPD %YMM2,(%R10,%RDX,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VXORPD %XMM2,%XMM2,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VGATHERQPD 0xd0(,%YMM4,1),%YMM2{%K2} | 4 | 1 | 0 | 2 | 2 | 0 | 1 | 0 | 0 | 20 | 4 |
VADDPD %YMM1,%YMM2,%YMM1 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD %YMM3,%YMM1,%YMM1 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVUPD %YMM1,(%R8,%RDX,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VGATHERQPD 0x110(,%YMM4,1),%YMM1{%K2} | 4 | 1 | 0 | 2 | 2 | 0 | 1 | 0 | 0 | 20 | 4 |
VADDPD %YMM0,%YMM1,%YMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD %YMM3,%YMM0,%YMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVUPD %YMM0,(%R11,%RDX,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
POP %RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %RBP | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
VZEROUPPER | 4 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 | 0 | 1 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
Source file and lines | ParticleBConds.h:166-219 |
Module | exec |
nb instructions | 402 |
nb uops | 416 |
loop length | 2587 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 32 |
used ymm registers | 32 |
used zmm registers | 0 |
nb stack references | 39 |
ADD-SUB / MUL ratio | 1.59 |
micro-operation queue | 104.00 cycles |
front end | 104.00 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | |
---|---|---|---|---|---|---|---|---|
uops | 52.33 | 52.67 | 71.67 | 71.67 | 76.00 | 79.00 | 17.00 | 71.67 |
cycles | 52.33 | 52.67 | 71.67 | 71.67 | 76.00 | 79.00 | 17.00 | 71.67 |
Cycles executing div or sqrt instructions | 9.00-12.00 |
FE+BE cycles | 250.45 |
Stall cycles | 148.24 |
RS full (events) | 21.03 |
LB full (events) | 142.98 |
Front-end | 104.00 |
Dispatch | 79.00 |
DIV/SQRT | 9.00-12.00 |
Overall L1 | 104.00 |
all | 41% |
load | 27% |
store | 100% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 75% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 20% |
all | 60% |
load | 38% |
store | 100% |
mul | 100% |
add-sub | 100% |
fma | 100% |
div/sqrt | 100% |
other | 29% |
all | 59% |
load | 37% |
store | 100% |
mul | 100% |
add-sub | 96% |
fma | 100% |
div/sqrt | 100% |
other | 28% |
all | 19% |
load | 17% |
store | 41% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 26% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 14% |
all | 34% |
load | 26% |
store | 45% |
mul | 50% |
add-sub | 50% |
fma | 50% |
div/sqrt | 50% |
other | 22% |
all | 32% |
load | 26% |
store | 45% |
mul | 50% |
add-sub | 46% |
fma | 50% |
div/sqrt | 50% |
other | 21% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSH %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
AND $-0x20,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SUB $0x4a0,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV 0x10(%RBP),%R15D | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
SUB %R9D,%R15D | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JLE 45edd3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
VMOVSD (%RSI),%XMM10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x8(%RSI),%XMM9 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x10(%RSI),%XMM8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x18(%RBP),%EAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x8(%RDX),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x18(%RDX),%R13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (,%RSI,8),%R12 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %R13,%R12 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SAL $0x4,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
ADD %R13,%RSI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV 0x8(%R8),%R11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x18(%R8),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%R10,%R11,8),%R8 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
SAL $0x4,%R11 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
VMOVSD (%RDI),%XMM4 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x8(%RDI),%XMM5 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x10(%RDI),%XMM2 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x18(%RDI),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x20(%RDI),%XMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x28(%RDI),%XMM7 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x30(%RDI),%XMM6 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x38(%RDI),%XMM22 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x40(%RDI),%XMM30 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x48(%RDI),%XMM25 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x50(%RDI),%XMM24 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x58(%RDI),%XMM23 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x60(%RDI),%XMM11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x68(%RDI),%XMM21 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x70(%RDI),%XMM28 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x78(%RDI),%XMM27 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x80(%RDI),%XMM26 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x88(%RDI),%XMM19 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x98(%RDI),%XMM18 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0xd8(%RDI),%XMM20 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x118(%RDI),%XMM17 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0xa0(%RDI),%XMM16 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0xe0(%RDI),%XMM15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x120(%RDI),%XMM14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0xa8(%RDI),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM0,0x120(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0xe8(%RDI),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM0,(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0x128(%RDI),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM0,0x20(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0xb0(%RDI),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM0,0x40(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0xf0(%RDI),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM0,0x60(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0x130(%RDI),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM0,0x80(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0xb8(%RDI),%XMM13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0xf8(%RDI),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM0,0xa0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0x138(%RDI),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM0,0xc0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0xc0(%RDI),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM0,0xe0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0x100(%RDI),%XMM12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x140(%RDI),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM0,0x100(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0xc8(%RDI),%XMM29 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD %R10,%R11 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %R15D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVSD 0x108(%RDI),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPS %XMM0,0x140(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD 0x148(%RDI),%XMM31 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
AND $-0x4,%R14D | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 45e8dd | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
LEA -0x1(%R14),%EBX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
VBROADCASTSD %XMM10,%YMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM10,0x300(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM9,%YMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM9,0x340(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM8,%YMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM8,0x360(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM4,%YMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM4,0x320(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM5,%YMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM4,0x380(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM2,%YMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM2,0x1a0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM1,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM1,0x2c0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM3,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM1,0x2e0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM7,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM1,0x1c0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM6,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM1,0x1e0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM22,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x200(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM30,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x3c0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM25,%YMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM24,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM0,0x180(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM23,%YMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM11,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM21,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x160(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM28,%YMM24 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM27,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM26,%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM3,0x3a0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM19,%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM3,0x3e0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM18,%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM3,0x420(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM20,%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM3,0x400(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM17,%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM3,0x460(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM16,%YMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM15,%YMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM14,%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM3,0x440(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD 0x120(%RSP),%YMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMOVUPS %YMM3,0x120(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD (%RSP),%YMM23 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VBROADCASTSD 0x20(%RSP),%YMM19 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VBROADCASTSD 0x40(%RSP),%YMM17 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VBROADCASTSD 0x60(%RSP),%YMM18 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VBROADCASTSD 0x80(%RSP),%YMM16 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VBROADCASTSD %XMM13,%YMM13 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD 0xa0(%RSP),%YMM15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VBROADCASTSD 0xc0(%RSP),%YMM30 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VBROADCASTSD 0xe0(%RSP),%YMM11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VBROADCASTSD %XMM12,%YMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD 0x100(%RSP),%YMM10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VBROADCASTSD %XMM29,%YMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD 0x140(%RSP),%YMM9 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VBROADCASTSD %XMM31,%YMM31 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VPBROADCASTD %EAX,%XMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VPBROADCASTQ %RDI,%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VMOVDQU %YMM3,0x140(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 4 | 1 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVDQU64 %XMM21,0x230(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 4 | 1 |
VMOVUPD 0x160(%RSP),%YMM20 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x460(%RSP),%YMM14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x440(%RSP),%YMM4 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x120(%RSP),%YMM27 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
CMP %R14D,%R15D | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 45edd3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
VMOVAPD %YMM23,%YMM28 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVAPD %YMM15,%YMM23 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VPBROADCASTD %R15D,%XMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VMOVDQU64 0x140(%RSP),%YMM21 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMOVUPD %YMM8,0xe0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %YMM9,0x100(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %YMM10,0xc0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %YMM11,0xa0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %YMM12,0x80(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %YMM30,0x60(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %YMM24,0x240(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %YMM13,0x20(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %YMM23,0x40(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %YMM16,(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %YMM17,0x2a0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %YMM18,0x280(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %YMM19,0x260(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVAPD %YMM4,%YMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVAPD %YMM5,%YMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVAPD %YMM6,%YMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVAPD %YMM14,%YMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVAPD %YMM20,%YMM23 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVUPD 0x420(%RSP),%YMM26 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x400(%RSP),%YMM20 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x3e0(%RSP),%YMM24 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x3c0(%RSP),%YMM30 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x3a0(%RSP),%YMM25 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x380(%RSP),%YMM5 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x360(%RSP),%YMM8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x340(%RSP),%YMM9 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x320(%RSP),%YMM11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x300(%RSP),%YMM10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x2e0(%RSP),%YMM22 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x2c0(%RSP),%YMM29 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVDQU 0x230(%RSP),%XMM6 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
JMP 45eabb | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
VMOVUPD %XMM31,0x160(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM10,%YMM31 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM9,%YMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM8,%YMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM4,%YMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM5,%YMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM2,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM0,0x1a0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVAPD %XMM29,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD %XMM1,%YMM29 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM3,%YMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM7,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM1,0x1c0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM6,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM1,0x1e0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM22,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVAPD %YMM2,%YMM22 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVUPD %YMM0,0x200(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM30,%YMM30 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM25,%YMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM24,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM0,0x180(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM23,%YMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM11,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVAPD %YMM8,%YMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVAPD %YMM10,%YMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVAPD %YMM31,%YMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD %XMM21,%YMM23 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM28,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x240(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM27,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM26,%YMM25 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM19,%YMM24 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM18,%YMM26 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM20,%YMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM17,%YMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM16,%YMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM15,%YMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM14,%YMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD 0x120(%RSP),%YMM27 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VBROADCASTSD (%RSP),%YMM28 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VBROADCASTSD 0x20(%RSP),%YMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMOVUPS %YMM3,0x260(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD 0x40(%RSP),%YMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMOVUPS %YMM3,0x2a0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD 0x60(%RSP),%YMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMOVUPS %YMM3,0x280(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD 0x80(%RSP),%YMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMOVUPS %YMM3,(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM13,%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM3,0x20(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD 0xa0(%RSP),%YMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMOVUPS %YMM3,0x40(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD 0xc0(%RSP),%YMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMOVUPS %YMM3,0x60(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD 0xe0(%RSP),%YMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMOVUPS %YMM3,0xa0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM12,%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM3,0x80(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD 0x100(%RSP),%YMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMOVUPS %YMM3,0xc0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM4,%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM3,0xe0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VPBROADCASTQ 0x140(%RSP),%YMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMOVDQU %YMM3,0x100(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 4 | 1 |
VBROADCASTSD 0x160(%RSP),%YMM31 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
XOR %R14D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VPBROADCASTD %R15D,%XMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VPBROADCASTD %EAX,%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VPBROADCASTQ %RDI,%YMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VMOVDQU 0x3d8bd(%RIP),%XMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VPBROADCASTD %R14D,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VPADDD %XMM3,%XMM4,%XMM4 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 1 | 0.33 |
VPCMPLTUD %XMM15,%XMM4,%K1 | |||||||||||
ADD %R14D,%R9D | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VPBROADCASTD %R9D,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VPADDD %XMM3,%XMM4,%XMM3 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 1 | 0.33 |
VPCMPGTD %XMM3,%XMM6,%K2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
MOVSXD %R9D,%RDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVUPD (%R13,%RDX,8),%YMM3{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD (%R12,%RDX,8),%YMM4{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VSUBPD %YMM10,%YMM3,%YMM14 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VSUBPD %YMM9,%YMM4,%YMM4 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD 0x37524(%RIP),%YMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMOVUPD (%RSI,%RDX,8),%YMM13{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VSUBPD %YMM8,%YMM13,%YMM12 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD 0x37506(%RIP),%YMM3{%K2} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 0.50 |
VMULPD %YMM3,%YMM14,%YMM13 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD %YMM3,%YMM4,%YMM4 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD %YMM13,%YMM11,%YMM14 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM5,%YMM4,%YMM14 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD %YMM3,%YMM12,%YMM11 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD 0x1a0(%RSP),%YMM11,%YMM14 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD %YMM13,%YMM29,%YMM9 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM22,%YMM4,%YMM9 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD 0x1c0(%RSP),%YMM11,%YMM9 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD 0x1e0(%RSP),%YMM13,%YMM6 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD 0x200(%RSP),%YMM4,%YMM6 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM30,%YMM11,%YMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VROUNDPD $0x9,%YMM14,%YMM5 | 2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 8 | 1 |
VFMSUB213PD %YMM13,%YMM5,%YMM2 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMSUB213PD %YMM4,%YMM5,%YMM1 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMSUB213PD %YMM11,%YMM5,%YMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VROUNDPD $0x9,%YMM9,%YMM4 | 2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 8 | 1 |
VFMADD231PD 0x180(%RSP),%YMM4,%YMM2 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM23,%YMM4,%YMM1 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM25,%YMM4,%YMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VROUNDPD $0x9,%YMM6,%YMM4 | 2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 8 | 1 |
VFNMSUB231PD %YMM7,%YMM4,%YMM2 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFNMSUB231PD 0x240(%RSP),%YMM4,%YMM1 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFNMSUB231PD %YMM24,%YMM4,%YMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD %YMM2,%YMM26,%YMM4 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD %YMM1,%YMM20,%YMM5 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD %YMM4,%YMM4,%YMM4 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM5,%YMM5,%YMM4 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD %YMM0,%YMM19,%YMM5 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM5,%YMM5,%YMM4 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD %YMM2,%YMM16,%YMM5 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD %YMM1,%YMM17,%YMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD %YMM5,%YMM5,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM6,%YMM6,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD %YMM2,%YMM2,%YMM5 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM1,%YMM1,%YMM5 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM0,%YMM0,%YMM5 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD %YMM0,%YMM18,%YMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM6,%YMM6,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMINPD %YMM5,%YMM4,%YMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VCMPPD $0x1,%YMM6,%YMM7,%K2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMINPD %YMM6,%YMM7,%YMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD %YMM2,%YMM27,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD %YMM1,%YMM28,%YMM8 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD %YMM7,%YMM7,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM8,%YMM8,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD 0x260(%RSP),%YMM0,%YMM8 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM8,%YMM8,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VCMPPD $0x1,%YMM6,%YMM7,%K3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMINPD %YMM6,%YMM7,%YMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD 0x2a0(%RSP),%YMM2,%YMM7 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD 0x280(%RSP),%YMM1,%YMM8 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD %YMM7,%YMM7,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM8,%YMM8,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD (%RSP),%YMM0,%YMM8 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM8,%YMM8,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VCMPPD $0x1,%YMM6,%YMM7,%K4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMINPD %YMM6,%YMM7,%YMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD 0x20(%RSP),%YMM2,%YMM7 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD 0x40(%RSP),%YMM1,%YMM8 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD %YMM7,%YMM7,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM8,%YMM8,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD 0x60(%RSP),%YMM0,%YMM8 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM8,%YMM8,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VCMPPD $0x1,%YMM6,%YMM7,%K5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMINPD %YMM6,%YMM7,%YMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD 0xa0(%RSP),%YMM2,%YMM7 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD 0x80(%RSP),%YMM1,%YMM8 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD %YMM7,%YMM7,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM8,%YMM8,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD 0xc0(%RSP),%YMM0,%YMM8 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM8,%YMM8,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VCMPPD $0x1,%YMM6,%YMM7,%K6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMINPD %YMM6,%YMM7,%YMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD 0xe0(%RSP),%YMM2,%YMM7 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD 0x100(%RSP),%YMM1,%YMM8 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD %YMM7,%YMM7,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM8,%YMM8,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD %YMM0,%YMM31,%YMM8 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD231PD %YMM8,%YMM8,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMINPD %YMM6,%YMM7,%YMM8 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VSQRTPD %YMM8,%YMM8 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 13-19 | 9-12 |
VMOVUPD %YMM8,(%RCX,%RDX,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VCMPPD $0x1,%YMM6,%YMM7,%K7 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VCMPPD $0x1,%YMM5,%YMM4,%YMM4 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VANDPD 0x37325(%RIP){1to4},%YMM4,%YMM4 | 1 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0.33 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ 0x3d623(%RIP),%YMM4{%K2} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPBROADCASTQ 0x3d621(%RIP),%YMM4{%K3} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPBROADCASTQ 0x3d61f(%RIP),%YMM4{%K4} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPBROADCASTQ 0x3d61d(%RIP),%YMM4{%K5} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPBROADCASTQ 0x3d61b(%RIP),%YMM4{%K6} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPBROADCASTQ 0x3d619(%RIP),%YMM4{%K7} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPSLLQ $0x3,%YMM4,%YMM4 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %YMM4,%YMM21,%YMM4 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 1 | 0.33 |
VXORPD %XMM5,%XMM5,%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VGATHERQPD 0x90(,%YMM4,1),%YMM5{%K2} | 4 | 1 | 0 | 2 | 2 | 0 | 1 | 0 | 0 | 20 | 4 |
VADDPD %YMM2,%YMM5,%YMM2 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD %YMM3,%YMM2,%YMM2 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVUPD %YMM2,(%R10,%RDX,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VXORPD %XMM2,%XMM2,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VGATHERQPD 0xd0(,%YMM4,1),%YMM2{%K2} | 4 | 1 | 0 | 2 | 2 | 0 | 1 | 0 | 0 | 20 | 4 |
VADDPD %YMM1,%YMM2,%YMM1 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD %YMM3,%YMM1,%YMM1 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVUPD %YMM1,(%R8,%RDX,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VGATHERQPD 0x110(,%YMM4,1),%YMM1{%K2} | 4 | 1 | 0 | 2 | 2 | 0 | 1 | 0 | 0 | 20 | 4 |
VADDPD %YMM0,%YMM1,%YMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD %YMM3,%YMM0,%YMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVUPD %YMM0,(%R11,%RDX,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
POP %RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %RBP | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
VZEROUPPER | 4 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 | 0 | 1 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼void qmcplusplus::DTD_BConds | 23.44 | 0.22 |
○Loop 1167 - ParticleBConds.h:185-217 - exec | 23.44 | 0.22 |