| Loop Id: 274 | Module: exec | Source: advec_mom.cpp:96-100 [...] | Coverage: 2.98% |
|---|
| Loop Id: 274 | Module: exec | Source: advec_mom.cpp:96-100 [...] | Coverage: 2.98% |
|---|
0x239840 VEXTRACTI128 $0x1,%YMM0,%XMM14 |
0x239846 VPEXTRQ $0x1,%XMM10,%RSI |
0x23984c VMOVQ %XMM10,%RDI |
0x239851 VPEXTRQ $0x1,%XMM14,%RAX |
0x239857 CQTO |
0x239859 IDIV %RSI |
0x23985c MOV %RAX,%RSI |
0x23985f VMOVQ %XMM14,%RAX |
0x239864 VMOVQ %RSI,%XMM14 |
0x239869 VPEXTRQ $0x1,%XMM1,%RSI |
0x23986f CQTO |
0x239871 IDIV %RDI |
0x239874 VPEXTRQ $0x1,%XMM0,%RDX |
0x23987a VMOVQ %XMM1,%RDI |
0x23987f VMOVQ %RAX,%XMM15 |
0x239884 MOV %RDX,%RAX |
0x239887 CQTO |
0x239889 IDIV %RSI |
0x23988c VPUNPCKLQDQ %XMM14,%XMM15,%XMM14 |
0x239891 MOV %RAX,%RSI |
0x239894 VMOVQ %XMM0,%RAX |
0x239899 VMOVQ %RSI,%XMM15 |
0x23989e CQTO |
0x2398a0 IDIV %RDI |
0x2398a3 ADD $-0x4,%R13 |
0x2398a7 VMOVQ %RAX,%XMM16 |
0x2398ad VPUNPCKLQDQ %XMM15,%XMM16,%XMM15 |
0x2398b3 VINSERTI128 $0x1,%XMM14,%YMM15,%YMM14 |
0x2398b9 VPMOVQD %YMM14,%XMM15 |
0x2398bf VPMULLQ %YMM1,%YMM14,%YMM14 |
0x2398c5 VPSUBQ %YMM14,%YMM0,%YMM14 |
0x2398ca VPADDQ %YMM0,%YMM13,%YMM0 |
0x2398ce VPMOVQD %YMM14,%XMM14 |
0x2398d4 VPADDD %XMM15,%XMM2,%XMM16 |
0x2398da VPADDD %XMM14,%XMM3,%XMM17 |
0x2398e0 VPADDD %XMM4,%XMM15,%XMM14 |
0x2398e4 VPMOVSXDQ %XMM14,%YMM15 |
0x2398e9 VPMOVSXDQ %XMM17,%YMM14 |
0x2398ef VPMULLQ %YMM15,%YMM5,%YMM18 |
0x2398f5 VPMULLQ %YMM15,%YMM6,%YMM20 |
0x2398fb VPADDQ %YMM14,%YMM18,%YMM19 |
0x239901 VPADDQ %YMM14,%YMM20,%YMM15 |
0x239907 VMOVQ %XMM19,%RDX |
0x23990d VPEXTRQ $0x1,%XMM19,%RSI |
0x239914 VEXTRACTI32X4 $0x1,%YMM19,%XMM19 |
0x23991b VPEXTRQ $0x1,%XMM15,%R9 |
0x239921 VMOVQ %XMM19,%RDI |
0x239927 VPEXTRQ $0x1,%XMM19,%RAX |
0x23992e VMOVSD (%R8,%RDX,8),%XMM19 [7] |
0x239935 VMOVSD (%R8,%RDI,8),%XMM21 [5] |
0x23993c VMOVQ %XMM15,%RDI |
0x239941 VEXTRACTI128 $0x1,%YMM15,%XMM15 |
0x239947 VMOVHPD (%R8,%RSI,8),%XMM19,%XMM19 [47] |
0x23994e VMOVQ %XMM15,%RBX |
0x239953 VPEXTRQ $0x1,%XMM15,%RDX |
0x239959 VPMOVSXDQ %XMM16,%YMM15 |
0x23995f VMOVSD (%R10,%RDI,8),%XMM22 [28] |
0x239966 VMOVHPD (%R8,%RAX,8),%XMM21,%XMM21 [9] |
0x23996d VMOVHPD (%R10,%R9,8),%XMM22,%XMM22 [3] |
0x239974 VMOVSD (%R10,%RBX,8),%XMM24 [27] |
0x23997b VPMULLQ %YMM15,%YMM5,%YMM23 |
0x239981 VPMULLQ %YMM15,%YMM6,%YMM27 |
0x239987 VPADDQ %YMM14,%YMM23,%YMM16 |
0x23998d VMOVQ %XMM16,%RSI |
0x239993 VPEXTRQ $0x1,%XMM16,%RDI |
0x23999a VEXTRACTI32X4 $0x1,%YMM16,%XMM16 |
0x2399a1 VMOVQ %XMM16,%R9 |
0x2399a7 VMOVSD (%R8,%R9,8),%XMM25 [39] |
0x2399ae VPEXTRQ $0x1,%XMM16,%R9 |
0x2399b5 VMOVSD (%R8,%RSI,8),%XMM16 [23] |
0x2399bc VINSERTF32X4 $0x1,%XMM21,%YMM19,%YMM19 |
0x2399c3 VMOVHPD (%R8,%RDI,8),%XMM16,%XMM26 [26] |
0x2399ca VPADDQ %YMM14,%YMM27,%YMM16 |
0x2399d0 VMOVHPD (%R8,%R9,8),%XMM25,%XMM25 [41] |
0x2399d7 MOV -0x70(%RBP),%R9 [38] |
0x2399db VMOVQ %XMM16,%RSI |
0x2399e1 VPEXTRQ $0x1,%XMM16,%RDI |
0x2399e8 VEXTRACTI32X4 $0x1,%YMM16,%XMM16 |
0x2399ef VMOVQ %XMM16,%RAX |
0x2399f5 VMOVSD (%R10,%RAX,8),%XMM28 [29] |
0x2399fc VPEXTRQ $0x1,%XMM16,%RAX |
0x239a03 VMOVSD (%R10,%RSI,8),%XMM16 [21] |
0x239a0a VMOVHPD (%R10,%RDI,8),%XMM16,%XMM29 [44] |
0x239a11 VPADDD %XMM11,%XMM17,%XMM16 |
0x239a17 VMOVHPD (%R10,%RDX,8),%XMM24,%XMM17 [36] |
0x239a1e VMOVHPD (%R10,%RAX,8),%XMM28,%XMM28 [46] |
0x239a25 VPMOVSXDQ %XMM16,%YMM16 |
0x239a2b VPADDQ %YMM16,%YMM18,%YMM18 |
0x239a31 VPADDQ %YMM16,%YMM20,%YMM20 |
0x239a37 VPADDQ %YMM16,%YMM23,%YMM23 |
0x239a3d VMOVQ %XMM18,%RAX |
0x239a43 VPEXTRQ $0x1,%XMM18,%RDX |
0x239a4a VEXTRACTI32X4 $0x1,%YMM18,%XMM18 |
0x239a51 VMOVSD (%R8,%RAX,8),%XMM21 [49] |
0x239a58 VMOVQ %XMM18,%RSI |
0x239a5e VPEXTRQ $0x1,%XMM18,%RDI |
0x239a65 VPEXTRQ $0x1,%XMM20,%RAX |
0x239a6c VMOVSD (%R8,%RSI,8),%XMM18 [48] |
0x239a73 VMOVHPD (%R8,%RDX,8),%XMM21,%XMM21 [35] |
0x239a7a VMOVQ %XMM20,%RDX |
0x239a80 VEXTRACTI32X4 $0x1,%YMM20,%XMM20 |
0x239a87 VMOVHPD (%R8,%RDI,8),%XMM18,%XMM18 [20] |
0x239a8e VMOVQ %XMM20,%RSI |
0x239a94 VPEXTRQ $0x1,%XMM20,%RDI |
0x239a9b VMOVSD (%R10,%RSI,8),%XMM24 [16] |
0x239aa2 VINSERTF32X4 $0x1,%XMM17,%YMM22,%YMM17 |
0x239aa9 VINSERTF32X4 $0x1,%XMM25,%YMM26,%YMM22 |
0x239ab0 VMOVSD (%R10,%RDX,8),%XMM25 [40] |
0x239ab7 VINSERTF32X4 $0x1,%XMM28,%YMM29,%YMM20 |
0x239abe VPEXTRQ $0x1,%XMM23,%RDX |
0x239ac5 VMOVHPD (%R10,%RAX,8),%XMM25,%XMM25 [45] |
0x239acc VMOVHPD (%R10,%RDI,8),%XMM24,%XMM24 [11] |
0x239ad3 VMOVQ %XMM23,%RAX |
0x239ad9 VMULPD %YMM20,%YMM22,%YMM20 |
0x239adf VFMADD231PD %YMM17,%YMM19,%YMM20 |
0x239ae5 VPMULLQ %YMM15,%YMM8,%YMM19 |
0x239aeb VINSERTF32X4 $0x1,%XMM18,%YMM21,%YMM18 |
0x239af2 VEXTRACTI32X4 $0x1,%YMM23,%XMM21 |
0x239af9 VMOVQ %XMM21,%RSI |
0x239aff VPEXTRQ $0x1,%XMM21,%RDI |
0x239b06 VINSERTF32X4 $0x1,%XMM24,%YMM25,%YMM23 |
0x239b0d VMOVSD (%R8,%RSI,8),%XMM21 [31] |
0x239b14 VMOVSD (%R8,%RAX,8),%XMM25 [25] |
0x239b1b VMOVHPD (%R8,%RDI,8),%XMM21,%XMM21 [19] |
0x239b22 VMOVHPD (%R8,%RDX,8),%XMM25,%XMM22 [34] |
0x239b29 VFMADD213PD %YMM20,%YMM18,%YMM23 |
0x239b2f VINSERTF32X4 $0x1,%XMM21,%YMM22,%YMM21 |
0x239b36 VPADDQ %YMM16,%YMM27,%YMM22 |
0x239b3c VPADDQ %YMM16,%YMM19,%YMM16 |
0x239b42 VPADDQ %YMM14,%YMM19,%YMM19 |
0x239b48 VEXTRACTI32X4 $0x1,%YMM22,%XMM17 |
0x239b4f VMOVQ %XMM22,%RDX |
0x239b55 VPEXTRQ $0x1,%XMM22,%RAX |
0x239b5c VMOVQ %XMM17,%RSI |
0x239b62 VMOVSD (%R10,%RDX,8),%XMM18 [22] |
0x239b69 VPEXTRQ $0x1,%XMM17,%RDI |
0x239b70 VMOVSD (%R10,%RSI,8),%XMM17 [32] |
0x239b77 VMOVHPD (%R10,%RAX,8),%XMM18,%XMM18 [33] |
0x239b7e VMOVHPD (%R10,%RDI,8),%XMM17,%XMM17 [10] |
0x239b85 VINSERTF32X4 $0x1,%XMM17,%YMM18,%YMM17 |
0x239b8c VPMULLQ %YMM15,%YMM7,%YMM18 |
0x239b92 VPMULLQ %YMM15,%YMM9,%YMM15 |
0x239b98 VFMADD213PD %YMM23,%YMM21,%YMM17 |
0x239b9e VPADDQ %YMM14,%YMM18,%YMM18 |
0x239ba4 VPADDQ %YMM14,%YMM15,%YMM14 |
0x239ba9 VMOVQ %XMM18,%RAX |
0x239baf VPEXTRQ $0x1,%XMM18,%RDX |
0x239bb6 VEXTRACTI32X4 $0x1,%YMM18,%XMM18 |
0x239bbd VMOVQ %XMM18,%RSI |
0x239bc3 VPEXTRQ $0x1,%XMM18,%RDI |
0x239bca VMULPD %YMM12,%YMM17,%YMM17 |
0x239bd0 VEXTRACTF32X4 $0x1,%YMM17,%XMM18 |
0x239bd7 VMOVLPD %XMM17,(%R9,%RAX,8) [13] |
0x239bde VMOVHPD %XMM17,(%R9,%RDX,8) [24] |
0x239be5 VMOVQ %XMM16,%RAX |
0x239beb VPEXTRQ $0x1,%XMM16,%RDX |
0x239bf2 VEXTRACTI32X4 $0x1,%YMM16,%XMM16 |
0x239bf9 VMOVLPD %XMM18,(%R9,%RSI,8) [12] |
0x239c00 VMOVHPD %XMM18,(%R9,%RDI,8) [8] |
0x239c07 VMOVQ %XMM16,%RSI |
0x239c0d VPEXTRQ $0x1,%XMM16,%RDI |
0x239c14 MOV -0x38(%RBP),%R9 [38] |
0x239c18 VMOVSD (%R14,%RAX,8),%XMM18 [6] |
0x239c1f VMOVSD (%R14,%RSI,8),%XMM16 [4] |
0x239c26 VMOVQ %XMM19,%RAX |
0x239c2c VMOVHPD (%R14,%RDX,8),%XMM18,%XMM18 [43] |
0x239c33 VMOVHPD (%R14,%RDI,8),%XMM16,%XMM16 [30] |
0x239c3a VPEXTRQ $0x1,%XMM19,%RDX |
0x239c41 VEXTRACTI32X4 $0x1,%YMM19,%XMM19 |
0x239c48 VMOVQ %XMM19,%RDI |
0x239c4e VPEXTRQ $0x1,%XMM19,%RSI |
0x239c55 VMOVSD (%R14,%RAX,8),%XMM19 [2] |
0x239c5c VPEXTRQ $0x1,%XMM14,%RAX |
0x239c62 VMOVHPD (%R14,%RDX,8),%XMM19,%XMM19 [42] |
0x239c69 VMOVQ %XMM14,%RDX |
0x239c6e VEXTRACTI128 $0x1,%YMM14,%XMM14 |
0x239c74 VINSERTF32X4 $0x1,%XMM16,%YMM18,%YMM16 |
0x239c7b VMOVSD (%R14,%RDI,8),%XMM18 [1] |
0x239c82 VPEXTRQ $0x1,%XMM14,%RDI |
0x239c88 VMOVHPD (%R14,%RSI,8),%XMM18,%XMM18 [14] |
0x239c8f VMOVQ %XMM14,%RSI |
0x239c94 VSUBPD %YMM16,%YMM17,%YMM16 |
0x239c9a VINSERTF32X4 $0x1,%XMM18,%YMM19,%YMM17 |
0x239ca1 VADDPD %YMM17,%YMM16,%YMM16 |
0x239ca7 VMOVLPD %XMM16,(%R9,%RDX,8) [18] |
0x239cae MOV -0x38(%RBP),%R9 [38] |
0x239cb2 VEXTRACTF32X4 $0x1,%YMM16,%XMM14 |
0x239cb9 VMOVHPD %XMM16,(%R9,%RAX,8) [15] |
0x239cc0 VMOVLPD %XMM14,(%R9,%RSI,8) [17] |
0x239cc6 VMOVHPD %XMM14,(%R9,%RDI,8) [37] |
0x239ccc JNE 239840 |
/beegfs/hackathon/users/eoseret/qaas_runs/170-854-8685/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/advec_mom.cpp: 96 - 100 |
-------------------------------------------------------------------------------- |
96: for (int j = (y_min + 1); j < (y_max + 1 + 2); j++) { |
97: for (int i = (x_min - 1 + 1); i < (x_max + 2 + 2); i++) { |
98: node_mass_post(i, j) = 0.25 * (density1(i + 0, j - 1) * post_vol(i + 0, j - 1) + density1(i, j) * post_vol(i, j) + |
99: density1(i - 1, j - 1) * post_vol(i - 1, j - 1) + density1(i - 1, j + 0) * post_vol(i - 1, j + 0)); |
100: node_mass_pre(i, j) = node_mass_post(i, j) - node_flux(i - 1, j + 0) + node_flux(i, j); |
/beegfs/hackathon/users/eoseret/qaas_runs/170-854-8685/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/context.h: 69 - 69 |
-------------------------------------------------------------------------------- |
69: T &operator()(size_t i, size_t j) const { return data[i + j * sizeX]; } |
| Path / |
| Metric | Value |
|---|---|
| CQA speedup if no scalar integer | 1.07 - 1.38 |
| CQA speedup if FP arith vectorized | 1.00 |
| CQA speedup if fully vectorized | 4.31 - 4.00 |
| CQA speedup if no inter-iteration dependency | NA |
| CQA speedup if next bottleneck killed | 1.16 - 1.29 |
| Bottlenecks | P8, P9, |
| Function | .omp_outlined..10#0x239680 |
| Source | advec_mom.cpp:96-100,context.h:69-69 |
| Source loop unroll info | unrolled by 4 |
| Source loop unroll confidence level | max |
| Unroll/vectorization loop type | main |
| Unroll factor | 4 |
| CQA cycles | 37.17 - 48.00 |
| CQA cycles if no scalar integer | 34.83 |
| CQA cycles if FP arith vectorized | 32.01 - 48.00 |
| CQA cycles if fully vectorized | 8.63 - 12.00 |
| Front-end cycles | 37.17 |
| DIV/SQRT cycles | 8.00 |
| P0 cycles | 0.50 |
| P1 cycles | 4.00 |
| P2 cycles | 0.50 |
| P3 cycles | 1.00 |
| P4 cycles | 17.00 |
| P5 cycles | 17.00 |
| P6 cycles | 17.00 |
| P7 cycles | 29.75 |
| P8 cycles | 29.83 |
| P9 cycles | 29.83 |
| P10 cycles | 29.58 |
| P11 cycles | 32.00 |
| P12 cycles | 32.00 |
| P13 cycles | 28.00 - 48.00 |
| Inter-iter dependencies cycles | 1 |
| FE+BE cycles (UFS) | NA |
| Stall cycles (UFS) | NA |
| Nb insns | 191.00 |
| Nb uops | 223.00 |
| Nb loads | 47.00 |
| Nb stores | 8.00 |
| Nb stack references | 2.00 |
| FLOP/cycle | 1.08 - 0.83 |
| Nb FLOP add-sub | 8.00 |
| Nb FLOP mul | 8.00 |
| Nb FLOP fma | 12.00 |
| Nb FLOP div | 0.00 |
| Nb FLOP rcp | 0.00 |
| Nb FLOP sqrt | 0.00 |
| Nb FLOP rsqrt | 0.00 |
| Bytes/cycle | 8.50 - 10.98 |
| Bytes prefetched | 0.00 |
| Bytes loaded | 344.00 |
| Bytes stored | 64.00 |
| Stride 0 | 1.00 |
| Stride 1 | 0.00 |
| Stride n | 0.00 |
| Stride unknown | 0.00 |
| Stride indirect | 19.00 |
| Vectorization ratio all | 35.52 |
| Vectorization ratio load | 0.00 |
| Vectorization ratio store | 0.00 |
| Vectorization ratio mul | 100.00 |
| Vectorization ratio add_sub | 100.00 |
| Vectorization ratio fma | 100.00 |
| Vectorization ratio div_sqrt | 0.00 |
| Vectorization ratio other | 32.65 |
| Vector-efficiency ratio all | 21.17 |
| Vector-efficiency ratio load | 12.50 |
| Vector-efficiency ratio store | 12.50 |
| Vector-efficiency ratio mul | 50.00 |
| Vector-efficiency ratio add_sub | 45.00 |
| Vector-efficiency ratio fma | 50.00 |
| Vector-efficiency ratio div_sqrt | 12.50 |
| Vector-efficiency ratio other | 17.09 |
| Metric | Value |
|---|---|
| CQA speedup if no scalar integer | 1.07 - 1.38 |
| CQA speedup if FP arith vectorized | 1.00 |
| CQA speedup if fully vectorized | 4.31 - 4.00 |
| CQA speedup if no inter-iteration dependency | NA |
| CQA speedup if next bottleneck killed | 1.16 - 1.29 |
| Bottlenecks | P8, P9, |
| Function | .omp_outlined..10#0x239680 |
| Source | advec_mom.cpp:96-100,context.h:69-69 |
| Source loop unroll info | unrolled by 4 |
| Source loop unroll confidence level | max |
| Unroll/vectorization loop type | main |
| Unroll factor | 4 |
| CQA cycles | 37.17 - 48.00 |
| CQA cycles if no scalar integer | 34.83 |
| CQA cycles if FP arith vectorized | 32.01 - 48.00 |
| CQA cycles if fully vectorized | 8.63 - 12.00 |
| Front-end cycles | 37.17 |
| DIV/SQRT cycles | 8.00 |
| P0 cycles | 0.50 |
| P1 cycles | 4.00 |
| P2 cycles | 0.50 |
| P3 cycles | 1.00 |
| P4 cycles | 17.00 |
| P5 cycles | 17.00 |
| P6 cycles | 17.00 |
| P7 cycles | 29.75 |
| P8 cycles | 29.83 |
| P9 cycles | 29.83 |
| P10 cycles | 29.58 |
| P11 cycles | 32.00 |
| P12 cycles | 32.00 |
| P13 cycles | 28.00 - 48.00 |
| Inter-iter dependencies cycles | 1 |
| FE+BE cycles (UFS) | NA |
| Stall cycles (UFS) | NA |
| Nb insns | 191.00 |
| Nb uops | 223.00 |
| Nb loads | 47.00 |
| Nb stores | 8.00 |
| Nb stack references | 2.00 |
| FLOP/cycle | 1.08 - 0.83 |
| Nb FLOP add-sub | 8.00 |
| Nb FLOP mul | 8.00 |
| Nb FLOP fma | 12.00 |
| Nb FLOP div | 0.00 |
| Nb FLOP rcp | 0.00 |
| Nb FLOP sqrt | 0.00 |
| Nb FLOP rsqrt | 0.00 |
| Bytes/cycle | 8.50 - 10.98 |
| Bytes prefetched | 0.00 |
| Bytes loaded | 344.00 |
| Bytes stored | 64.00 |
| Stride 0 | 1.00 |
| Stride 1 | 0.00 |
| Stride n | 0.00 |
| Stride unknown | 0.00 |
| Stride indirect | 19.00 |
| Vectorization ratio all | 35.52 |
| Vectorization ratio load | 0.00 |
| Vectorization ratio store | 0.00 |
| Vectorization ratio mul | 100.00 |
| Vectorization ratio add_sub | 100.00 |
| Vectorization ratio fma | 100.00 |
| Vectorization ratio div_sqrt | 0.00 |
| Vectorization ratio other | 32.65 |
| Vector-efficiency ratio all | 21.17 |
| Vector-efficiency ratio load | 12.50 |
| Vector-efficiency ratio store | 12.50 |
| Vector-efficiency ratio mul | 50.00 |
| Vector-efficiency ratio add_sub | 45.00 |
| Vector-efficiency ratio fma | 50.00 |
| Vector-efficiency ratio div_sqrt | 12.50 |
| Vector-efficiency ratio other | 17.09 |
| Path / |
| Function | .omp_outlined..10#0x239680 |
| Source file and lines | advec_mom.cpp:96-100 |
| Module | exec |
| nb instructions | 191 |
| nb uops | 223 |
| loop length | 1170 |
| used x86 registers | 11 |
| used mmx registers | 0 |
| used xmm registers | 22 |
| used ymm registers | 23 |
| used zmm registers | 0 |
| nb stack references | 2 |
| ADD-SUB / MUL ratio | 1.00 |
| micro-operation queue | 37.17 cycles |
| front end | 37.17 cycles |
| ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| uops | 8.00 | 0.50 | 4.00 | 0.50 | 1.00 | 17.00 | 17.00 | 17.00 | 29.75 | 29.83 | 29.83 | 29.58 | 32.00 | 32.00 |
| cycles | 8.00 | 0.50 | 4.00 | 0.50 | 1.00 | 17.00 | 17.00 | 17.00 | 29.75 | 29.83 | 29.83 | 29.58 | 32.00 | 32.00 |
| Cycles executing div or sqrt instructions | 28.00-48.00 |
| Longest recurrence chain latency (RecMII) | 1.00 |
| Front-end | 37.17 |
| Dispatch | 32.00 |
| DIV/SQRT | 28.00-48.00 |
| Data deps. | 1.00 |
| Overall L1 | 37.17-48.00 |
| all | 39% |
| load | NA (no load vectorizable/vectorized instructions) |
| store | NA (no store vectorizable/vectorized instructions) |
| mul | 100% |
| add-sub | 100% |
| fma | NA (no fma vectorizable/vectorized instructions) |
| other | 22% |
| all | 28% |
| load | 0% |
| store | 0% |
| mul | 100% |
| add-sub | 100% |
| fma | 100% |
| div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
| other | 100% |
| all | 35% |
| load | 0% |
| store | 0% |
| mul | 100% |
| add-sub | 100% |
| fma | 100% |
| div/sqrt | 0% |
| other | 32% |
| all | 22% |
| load | NA (no load vectorizable/vectorized instructions) |
| store | NA (no store vectorizable/vectorized instructions) |
| mul | 50% |
| add-sub | 44% |
| fma | NA (no fma vectorizable/vectorized instructions) |
| other | 15% |
| all | 18% |
| load | 12% |
| store | 12% |
| mul | 50% |
| add-sub | 50% |
| fma | 50% |
| div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
| other | 25% |
| all | 21% |
| load | 12% |
| store | 12% |
| mul | 50% |
| add-sub | 45% |
| fma | 50% |
| div/sqrt | 12% |
| other | 17% |
| Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| VEXTRACTI128 $0x1,%YMM0,%XMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VPEXTRQ $0x1,%XMM10,%RSI | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VMOVQ %XMM10,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VPEXTRQ $0x1,%XMM14,%RAX | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| CQTO | |||||||||||||||||
| IDIV %RSI | 2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 9-19 | 7-12 |
| MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
| VMOVQ %XMM14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VMOVQ %RSI,%XMM14 | 1 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
| VPEXTRQ $0x1,%XMM1,%RSI | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| CQTO | |||||||||||||||||
| IDIV %RDI | 2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 9-19 | 7-12 |
| VPEXTRQ $0x1,%XMM0,%RDX | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VMOVQ %XMM1,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VMOVQ %RAX,%XMM15 | 1 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
| MOV %RDX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
| CQTO | |||||||||||||||||
| IDIV %RSI | 2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 9-19 | 7-12 |
| VPUNPCKLQDQ %XMM14,%XMM15,%XMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
| MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
| VMOVQ %XMM0,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VMOVQ %RSI,%XMM15 | 1 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
| CQTO | |||||||||||||||||
| IDIV %RDI | 2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 9-19 | 7-12 |
| ADD $-0x4,%R13 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
| VMOVQ %RAX,%XMM16 | 1 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
| VPUNPCKLQDQ %XMM15,%XMM16,%XMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
| VINSERTI128 $0x1,%XMM14,%YMM15,%YMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 |
| VPMOVQD %YMM14,%XMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 4 | 0.50 |
| VPMULLQ %YMM1,%YMM14,%YMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| VPSUBQ %YMM14,%YMM0,%YMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VPADDQ %YMM0,%YMM13,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VPMOVQD %YMM14,%XMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 4 | 0.50 |
| VPADDD %XMM15,%XMM2,%XMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VPADDD %XMM14,%XMM3,%XMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VPADDD %XMM4,%XMM15,%XMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VPMOVSXDQ %XMM14,%YMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
| VPMOVSXDQ %XMM17,%YMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
| VPMULLQ %YMM15,%YMM5,%YMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| VPMULLQ %YMM15,%YMM6,%YMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| VPADDQ %YMM14,%YMM18,%YMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VPADDQ %YMM14,%YMM20,%YMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VMOVQ %XMM19,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VPEXTRQ $0x1,%XMM19,%RSI | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VEXTRACTI32X4 $0x1,%YMM19,%XMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 4 | 0.25 |
| VPEXTRQ $0x1,%XMM15,%R9 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VMOVQ %XMM19,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VPEXTRQ $0x1,%XMM19,%RAX | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VMOVSD (%R8,%RDX,8),%XMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VMOVSD (%R8,%RDI,8),%XMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VMOVQ %XMM15,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VEXTRACTI128 $0x1,%YMM15,%XMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VMOVHPD (%R8,%RSI,8),%XMM19,%XMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VMOVQ %XMM15,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VPEXTRQ $0x1,%XMM15,%RDX | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VPMOVSXDQ %XMM16,%YMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
| VMOVSD (%R10,%RDI,8),%XMM22 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VMOVHPD (%R8,%RAX,8),%XMM21,%XMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VMOVHPD (%R10,%R9,8),%XMM22,%XMM22 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VMOVSD (%R10,%RBX,8),%XMM24 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VPMULLQ %YMM15,%YMM5,%YMM23 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| VPMULLQ %YMM15,%YMM6,%YMM27 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| VPADDQ %YMM14,%YMM23,%YMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VMOVQ %XMM16,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VPEXTRQ $0x1,%XMM16,%RDI | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VEXTRACTI32X4 $0x1,%YMM16,%XMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 4 | 0.25 |
| VMOVQ %XMM16,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VMOVSD (%R8,%R9,8),%XMM25 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VPEXTRQ $0x1,%XMM16,%R9 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VMOVSD (%R8,%RSI,8),%XMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VINSERTF32X4 $0x1,%XMM21,%YMM19,%YMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 |
| VMOVHPD (%R8,%RDI,8),%XMM16,%XMM26 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VPADDQ %YMM14,%YMM27,%YMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VMOVHPD (%R8,%R9,8),%XMM25,%XMM25 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| MOV -0x70(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
| VMOVQ %XMM16,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VPEXTRQ $0x1,%XMM16,%RDI | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VEXTRACTI32X4 $0x1,%YMM16,%XMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 4 | 0.25 |
| VMOVQ %XMM16,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VMOVSD (%R10,%RAX,8),%XMM28 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VPEXTRQ $0x1,%XMM16,%RAX | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VMOVSD (%R10,%RSI,8),%XMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VMOVHPD (%R10,%RDI,8),%XMM16,%XMM29 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VPADDD %XMM11,%XMM17,%XMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VMOVHPD (%R10,%RDX,8),%XMM24,%XMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VMOVHPD (%R10,%RAX,8),%XMM28,%XMM28 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VPMOVSXDQ %XMM16,%YMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
| VPADDQ %YMM16,%YMM18,%YMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VPADDQ %YMM16,%YMM20,%YMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VPADDQ %YMM16,%YMM23,%YMM23 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VMOVQ %XMM18,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VPEXTRQ $0x1,%XMM18,%RDX | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VEXTRACTI32X4 $0x1,%YMM18,%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 4 | 0.25 |
| VMOVSD (%R8,%RAX,8),%XMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VMOVQ %XMM18,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VPEXTRQ $0x1,%XMM18,%RDI | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VPEXTRQ $0x1,%XMM20,%RAX | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VMOVSD (%R8,%RSI,8),%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VMOVHPD (%R8,%RDX,8),%XMM21,%XMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VMOVQ %XMM20,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VEXTRACTI32X4 $0x1,%YMM20,%XMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 4 | 0.25 |
| VMOVHPD (%R8,%RDI,8),%XMM18,%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VMOVQ %XMM20,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VPEXTRQ $0x1,%XMM20,%RDI | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VMOVSD (%R10,%RSI,8),%XMM24 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VINSERTF32X4 $0x1,%XMM17,%YMM22,%YMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 |
| VINSERTF32X4 $0x1,%XMM25,%YMM26,%YMM22 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 |
| VMOVSD (%R10,%RDX,8),%XMM25 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VINSERTF32X4 $0x1,%XMM28,%YMM29,%YMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 |
| VPEXTRQ $0x1,%XMM23,%RDX | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VMOVHPD (%R10,%RAX,8),%XMM25,%XMM25 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VMOVHPD (%R10,%RDI,8),%XMM24,%XMM24 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VMOVQ %XMM23,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VMULPD %YMM20,%YMM22,%YMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| VFMADD231PD %YMM17,%YMM19,%YMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
| VPMULLQ %YMM15,%YMM8,%YMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| VINSERTF32X4 $0x1,%XMM18,%YMM21,%YMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 |
| VEXTRACTI32X4 $0x1,%YMM23,%XMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 4 | 0.25 |
| VMOVQ %XMM21,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VPEXTRQ $0x1,%XMM21,%RDI | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VINSERTF32X4 $0x1,%XMM24,%YMM25,%YMM23 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 |
| VMOVSD (%R8,%RSI,8),%XMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VMOVSD (%R8,%RAX,8),%XMM25 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VMOVHPD (%R8,%RDI,8),%XMM21,%XMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VMOVHPD (%R8,%RDX,8),%XMM25,%XMM22 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VFMADD213PD %YMM20,%YMM18,%YMM23 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
| VINSERTF32X4 $0x1,%XMM21,%YMM22,%YMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 |
| VPADDQ %YMM16,%YMM27,%YMM22 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VPADDQ %YMM16,%YMM19,%YMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VPADDQ %YMM14,%YMM19,%YMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VEXTRACTI32X4 $0x1,%YMM22,%XMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 4 | 0.25 |
| VMOVQ %XMM22,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VPEXTRQ $0x1,%XMM22,%RAX | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VMOVQ %XMM17,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VMOVSD (%R10,%RDX,8),%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VPEXTRQ $0x1,%XMM17,%RDI | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VMOVSD (%R10,%RSI,8),%XMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VMOVHPD (%R10,%RAX,8),%XMM18,%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VMOVHPD (%R10,%RDI,8),%XMM17,%XMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VINSERTF32X4 $0x1,%XMM17,%YMM18,%YMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 |
| VPMULLQ %YMM15,%YMM7,%YMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| VPMULLQ %YMM15,%YMM9,%YMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| VFMADD213PD %YMM23,%YMM21,%YMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
| VPADDQ %YMM14,%YMM18,%YMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VPADDQ %YMM14,%YMM15,%YMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VMOVQ %XMM18,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VPEXTRQ $0x1,%XMM18,%RDX | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VEXTRACTI32X4 $0x1,%YMM18,%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 4 | 0.25 |
| VMOVQ %XMM18,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VPEXTRQ $0x1,%XMM18,%RDI | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VMULPD %YMM12,%YMM17,%YMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| VEXTRACTF32X4 $0x1,%YMM17,%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 4 | 0.25 |
| VMOVLPD %XMM17,(%R9,%RAX,8) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VMOVHPD %XMM17,(%R9,%RDX,8) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 9-11 | 1 |
| VMOVQ %XMM16,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VPEXTRQ $0x1,%XMM16,%RDX | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VEXTRACTI32X4 $0x1,%YMM16,%XMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 4 | 0.25 |
| VMOVLPD %XMM18,(%R9,%RSI,8) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VMOVHPD %XMM18,(%R9,%RDI,8) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 9-11 | 1 |
| VMOVQ %XMM16,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VPEXTRQ $0x1,%XMM16,%RDI | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| MOV -0x38(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
| VMOVSD (%R14,%RAX,8),%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VMOVSD (%R14,%RSI,8),%XMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VMOVQ %XMM19,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VMOVHPD (%R14,%RDX,8),%XMM18,%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VMOVHPD (%R14,%RDI,8),%XMM16,%XMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VPEXTRQ $0x1,%XMM19,%RDX | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VEXTRACTI32X4 $0x1,%YMM19,%XMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 4 | 0.25 |
| VMOVQ %XMM19,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VPEXTRQ $0x1,%XMM19,%RSI | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VMOVSD (%R14,%RAX,8),%XMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VPEXTRQ $0x1,%XMM14,%RAX | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VMOVHPD (%R14,%RDX,8),%XMM19,%XMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VMOVQ %XMM14,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VEXTRACTI128 $0x1,%YMM14,%XMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VINSERTF32X4 $0x1,%XMM16,%YMM18,%YMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 |
| VMOVSD (%R14,%RDI,8),%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VPEXTRQ $0x1,%XMM14,%RDI | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VMOVHPD (%R14,%RSI,8),%XMM18,%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VMOVQ %XMM14,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VSUBPD %YMM16,%YMM17,%YMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
| VINSERTF32X4 $0x1,%XMM18,%YMM19,%YMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 |
| VADDPD %YMM17,%YMM16,%YMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
| VMOVLPD %XMM16,(%R9,%RDX,8) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| MOV -0x38(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
| VEXTRACTF32X4 $0x1,%YMM16,%XMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 4 | 0.25 |
| VMOVHPD %XMM16,(%R9,%RAX,8) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 9-11 | 1 |
| VMOVLPD %XMM14,(%R9,%RSI,8) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VMOVHPD %XMM14,(%R9,%RDI,8) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 9-11 | 1 |
| JNE 239840 <.omp_outlined..10+0x1c0> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
| Function | .omp_outlined..10#0x239680 |
| Source file and lines | advec_mom.cpp:96-100 |
| Module | exec |
| nb instructions | 191 |
| nb uops | 223 |
| loop length | 1170 |
| used x86 registers | 11 |
| used mmx registers | 0 |
| used xmm registers | 22 |
| used ymm registers | 23 |
| used zmm registers | 0 |
| nb stack references | 2 |
| ADD-SUB / MUL ratio | 1.00 |
| micro-operation queue | 37.17 cycles |
| front end | 37.17 cycles |
| | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| uops | 8.00 | 0.50 | 4.00 | 0.50 | 1.00 | 17.00 | 17.00 | 17.00 | 29.75 | 29.83 | 29.83 | 29.58 | 32.00 | 32.00 |
| cycles | 8.00 | 0.50 | 4.00 | 0.50 | 1.00 | 17.00 | 17.00 | 17.00 | 29.75 | 29.83 | 29.83 | 29.58 | 32.00 | 32.00 |
| Cycles executing div or sqrt instructions | 28.00-48.00 |
| Longest recurrence chain latency (RecMII) | 1.00 |
| Front-end | 37.17 |
| Dispatch | 32.00 |
| DIV/SQRT | 28.00-48.00 |
| Data deps. | 1.00 |
| Overall L1 | 37.17-48.00 |
| all | 39% |
| load | NA (no load vectorizable/vectorized instructions) |
| store | NA (no store vectorizable/vectorized instructions) |
| mul | 100% |
| add-sub | 100% |
| fma | NA (no fma vectorizable/vectorized instructions) |
| other | 22% |
| all | 28% |
| load | 0% |
| store | 0% |
| mul | 100% |
| add-sub | 100% |
| fma | 100% |
| div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
| other | 100% |
| all | 35% |
| load | 0% |
| store | 0% |
| mul | 100% |
| add-sub | 100% |
| fma | 100% |
| div/sqrt | 0% |
| other | 32% |
| all | 22% |
| load | NA (no load vectorizable/vectorized instructions) |
| store | NA (no store vectorizable/vectorized instructions) |
| mul | 50% |
| add-sub | 44% |
| fma | NA (no fma vectorizable/vectorized instructions) |
| other | 15% |
| all | 18% |
| load | 12% |
| store | 12% |
| mul | 50% |
| add-sub | 50% |
| fma | 50% |
| div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
| other | 25% |
| all | 21% |
| load | 12% |
| store | 12% |
| mul | 50% |
| add-sub | 45% |
| fma | 50% |
| div/sqrt | 12% |
| other | 17% |
| Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| VEXTRACTI128 $0x1,%YMM0,%XMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VPEXTRQ $0x1,%XMM10,%RSI | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VMOVQ %XMM10,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VPEXTRQ $0x1,%XMM14,%RAX | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| CQTO | |||||||||||||||||
| IDIV %RSI | 2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 9-19 | 7-12 |
| MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
| VMOVQ %XMM14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VMOVQ %RSI,%XMM14 | 1 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
| VPEXTRQ $0x1,%XMM1,%RSI | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| CQTO | |||||||||||||||||
| IDIV %RDI | 2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 9-19 | 7-12 |
| VPEXTRQ $0x1,%XMM0,%RDX | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VMOVQ %XMM1,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VMOVQ %RAX,%XMM15 | 1 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
| MOV %RDX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
| CQTO | |||||||||||||||||
| IDIV %RSI | 2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 9-19 | 7-12 |
| VPUNPCKLQDQ %XMM14,%XMM15,%XMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
| MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
| VMOVQ %XMM0,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VMOVQ %RSI,%XMM15 | 1 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
| CQTO | |||||||||||||||||
| IDIV %RDI | 2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 9-19 | 7-12 |
| ADD $-0x4,%R13 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
| VMOVQ %RAX,%XMM16 | 1 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
| VPUNPCKLQDQ %XMM15,%XMM16,%XMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
| VINSERTI128 $0x1,%XMM14,%YMM15,%YMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 |
| VPMOVQD %YMM14,%XMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 4 | 0.50 |
| VPMULLQ %YMM1,%YMM14,%YMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| VPSUBQ %YMM14,%YMM0,%YMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VPADDQ %YMM0,%YMM13,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VPMOVQD %YMM14,%XMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 4 | 0.50 |
| VPADDD %XMM15,%XMM2,%XMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VPADDD %XMM14,%XMM3,%XMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VPADDD %XMM4,%XMM15,%XMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VPMOVSXDQ %XMM14,%YMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
| VPMOVSXDQ %XMM17,%YMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
| VPMULLQ %YMM15,%YMM5,%YMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| VPMULLQ %YMM15,%YMM6,%YMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| VPADDQ %YMM14,%YMM18,%YMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VPADDQ %YMM14,%YMM20,%YMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VMOVQ %XMM19,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VPEXTRQ $0x1,%XMM19,%RSI | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VEXTRACTI32X4 $0x1,%YMM19,%XMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 4 | 0.25 |
| VPEXTRQ $0x1,%XMM15,%R9 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VMOVQ %XMM19,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VPEXTRQ $0x1,%XMM19,%RAX | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VMOVSD (%R8,%RDX,8),%XMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VMOVSD (%R8,%RDI,8),%XMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VMOVQ %XMM15,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VEXTRACTI128 $0x1,%YMM15,%XMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VMOVHPD (%R8,%RSI,8),%XMM19,%XMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VMOVQ %XMM15,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VPEXTRQ $0x1,%XMM15,%RDX | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VPMOVSXDQ %XMM16,%YMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
| VMOVSD (%R10,%RDI,8),%XMM22 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VMOVHPD (%R8,%RAX,8),%XMM21,%XMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VMOVHPD (%R10,%R9,8),%XMM22,%XMM22 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VMOVSD (%R10,%RBX,8),%XMM24 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VPMULLQ %YMM15,%YMM5,%YMM23 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| VPMULLQ %YMM15,%YMM6,%YMM27 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| VPADDQ %YMM14,%YMM23,%YMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VMOVQ %XMM16,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VPEXTRQ $0x1,%XMM16,%RDI | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VEXTRACTI32X4 $0x1,%YMM16,%XMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 4 | 0.25 |
| VMOVQ %XMM16,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VMOVSD (%R8,%R9,8),%XMM25 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VPEXTRQ $0x1,%XMM16,%R9 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VMOVSD (%R8,%RSI,8),%XMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VINSERTF32X4 $0x1,%XMM21,%YMM19,%YMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 |
| VMOVHPD (%R8,%RDI,8),%XMM16,%XMM26 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VPADDQ %YMM14,%YMM27,%YMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VMOVHPD (%R8,%R9,8),%XMM25,%XMM25 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| MOV -0x70(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
| VMOVQ %XMM16,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VPEXTRQ $0x1,%XMM16,%RDI | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VEXTRACTI32X4 $0x1,%YMM16,%XMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 4 | 0.25 |
| VMOVQ %XMM16,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VMOVSD (%R10,%RAX,8),%XMM28 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VPEXTRQ $0x1,%XMM16,%RAX | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VMOVSD (%R10,%RSI,8),%XMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VMOVHPD (%R10,%RDI,8),%XMM16,%XMM29 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VPADDD %XMM11,%XMM17,%XMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VMOVHPD (%R10,%RDX,8),%XMM24,%XMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VMOVHPD (%R10,%RAX,8),%XMM28,%XMM28 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VPMOVSXDQ %XMM16,%YMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
| VPADDQ %YMM16,%YMM18,%YMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VPADDQ %YMM16,%YMM20,%YMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VPADDQ %YMM16,%YMM23,%YMM23 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VMOVQ %XMM18,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VPEXTRQ $0x1,%XMM18,%RDX | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VEXTRACTI32X4 $0x1,%YMM18,%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 4 | 0.25 |
| VMOVSD (%R8,%RAX,8),%XMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VMOVQ %XMM18,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VPEXTRQ $0x1,%XMM18,%RDI | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VPEXTRQ $0x1,%XMM20,%RAX | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VMOVSD (%R8,%RSI,8),%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VMOVHPD (%R8,%RDX,8),%XMM21,%XMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VMOVQ %XMM20,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VEXTRACTI32X4 $0x1,%YMM20,%XMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 4 | 0.25 |
| VMOVHPD (%R8,%RDI,8),%XMM18,%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VMOVQ %XMM20,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VPEXTRQ $0x1,%XMM20,%RDI | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VMOVSD (%R10,%RSI,8),%XMM24 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VINSERTF32X4 $0x1,%XMM17,%YMM22,%YMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 |
| VINSERTF32X4 $0x1,%XMM25,%YMM26,%YMM22 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 |
| VMOVSD (%R10,%RDX,8),%XMM25 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VINSERTF32X4 $0x1,%XMM28,%YMM29,%YMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 |
| VPEXTRQ $0x1,%XMM23,%RDX | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VMOVHPD (%R10,%RAX,8),%XMM25,%XMM25 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VMOVHPD (%R10,%RDI,8),%XMM24,%XMM24 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VMOVQ %XMM23,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VMULPD %YMM20,%YMM22,%YMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| VFMADD231PD %YMM17,%YMM19,%YMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
| VPMULLQ %YMM15,%YMM8,%YMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| VINSERTF32X4 $0x1,%XMM18,%YMM21,%YMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 |
| VEXTRACTI32X4 $0x1,%YMM23,%XMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 4 | 0.25 |
| VMOVQ %XMM21,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VPEXTRQ $0x1,%XMM21,%RDI | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VINSERTF32X4 $0x1,%XMM24,%YMM25,%YMM23 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 |
| VMOVSD (%R8,%RSI,8),%XMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VMOVSD (%R8,%RAX,8),%XMM25 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VMOVHPD (%R8,%RDI,8),%XMM21,%XMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VMOVHPD (%R8,%RDX,8),%XMM25,%XMM22 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VFMADD213PD %YMM20,%YMM18,%YMM23 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
| VINSERTF32X4 $0x1,%XMM21,%YMM22,%YMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 |
| VPADDQ %YMM16,%YMM27,%YMM22 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VPADDQ %YMM16,%YMM19,%YMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VPADDQ %YMM14,%YMM19,%YMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VEXTRACTI32X4 $0x1,%YMM22,%XMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 4 | 0.25 |
| VMOVQ %XMM22,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VPEXTRQ $0x1,%XMM22,%RAX | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VMOVQ %XMM17,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VMOVSD (%R10,%RDX,8),%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VPEXTRQ $0x1,%XMM17,%RDI | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VMOVSD (%R10,%RSI,8),%XMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VMOVHPD (%R10,%RAX,8),%XMM18,%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VMOVHPD (%R10,%RDI,8),%XMM17,%XMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VINSERTF32X4 $0x1,%XMM17,%YMM18,%YMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 |
| VPMULLQ %YMM15,%YMM7,%YMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| VPMULLQ %YMM15,%YMM9,%YMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| VFMADD213PD %YMM23,%YMM21,%YMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
| VPADDQ %YMM14,%YMM18,%YMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VPADDQ %YMM14,%YMM15,%YMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VMOVQ %XMM18,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VPEXTRQ $0x1,%XMM18,%RDX | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VEXTRACTI32X4 $0x1,%YMM18,%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 4 | 0.25 |
| VMOVQ %XMM18,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VPEXTRQ $0x1,%XMM18,%RDI | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VMULPD %YMM12,%YMM17,%YMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| VEXTRACTF32X4 $0x1,%YMM17,%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 4 | 0.25 |
| VMOVLPD %XMM17,(%R9,%RAX,8) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VMOVHPD %XMM17,(%R9,%RDX,8) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 9-11 | 1 |
| VMOVQ %XMM16,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VPEXTRQ $0x1,%XMM16,%RDX | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VEXTRACTI32X4 $0x1,%YMM16,%XMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 4 | 0.25 |
| VMOVLPD %XMM18,(%R9,%RSI,8) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VMOVHPD %XMM18,(%R9,%RDI,8) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 9-11 | 1 |
| VMOVQ %XMM16,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VPEXTRQ $0x1,%XMM16,%RDI | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| MOV -0x38(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
| VMOVSD (%R14,%RAX,8),%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VMOVSD (%R14,%RSI,8),%XMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VMOVQ %XMM19,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VMOVHPD (%R14,%RDX,8),%XMM18,%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VMOVHPD (%R14,%RDI,8),%XMM16,%XMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VPEXTRQ $0x1,%XMM19,%RDX | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VEXTRACTI32X4 $0x1,%YMM19,%XMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 4 | 0.25 |
| VMOVQ %XMM19,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VPEXTRQ $0x1,%XMM19,%RSI | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VMOVSD (%R14,%RAX,8),%XMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VPEXTRQ $0x1,%XMM14,%RAX | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VMOVHPD (%R14,%RDX,8),%XMM19,%XMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VMOVQ %XMM14,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VEXTRACTI128 $0x1,%YMM14,%XMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| VINSERTF32X4 $0x1,%XMM16,%YMM18,%YMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 |
| VMOVSD (%R14,%RDI,8),%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| VPEXTRQ $0x1,%XMM14,%RDI | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 |
| VMOVHPD (%R14,%RSI,8),%XMM18,%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 9 | 0.50 |
| VMOVQ %XMM14,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VSUBPD %YMM16,%YMM17,%YMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
| VINSERTF32X4 $0x1,%XMM18,%YMM19,%YMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 |
| VADDPD %YMM17,%YMM16,%YMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
| VMOVLPD %XMM16,(%R9,%RDX,8) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| MOV -0x38(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
| VEXTRACTF32X4 $0x1,%YMM16,%XMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 4 | 0.25 |
| VMOVHPD %XMM16,(%R9,%RAX,8) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 9-11 | 1 |
| VMOVLPD %XMM14,(%R9,%RSI,8) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
| VMOVHPD %XMM14,(%R9,%RDI,8) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 9-11 | 1 |
| JNE 239840 <.omp_outlined..10+0x1c0> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
