| Loop Id: 372 | Module: exec | Source: field_summary.cpp:80-82 [...] | Coverage: 0.05% |
|---|
| Loop Id: 372 | Module: exec | Source: field_summary.cpp:80-82 [...] | Coverage: 0.05% |
|---|
0x444b20 INC %RAX |
0x444b23 MOVQ %RAX,%XMM0 |
0x444b28 PSHUFD $0x44,%XMM0,%XMM0 |
0x444b2d PXOR 0x4996b(%RIP),%XMM0 |
0x444b35 MOVDQA -0x3d0(%RBP),%XMM4 |
0x444b3d MOVDQA %XMM4,%XMM1 |
0x444b41 PCMPGTD %XMM0,%XMM1 |
0x444b45 PSHUFD $-0x60,%XMM1,%XMM3 |
0x444b4a PCMPEQD %XMM0,%XMM4 |
0x444b4e PSHUFD $-0xb,%XMM4,%XMM4 |
0x444b53 PAND %XMM3,%XMM4 |
0x444b57 PSHUFD $-0xb,%XMM1,%XMM1 |
0x444b5c POR %XMM4,%XMM1 |
0x444b60 MOVDQA -0x3c0(%RBP),%XMM6 |
0x444b68 MOVDQA %XMM6,%XMM3 |
0x444b6c PCMPGTD %XMM0,%XMM3 |
0x444b70 PSHUFD $-0x60,%XMM3,%XMM4 |
0x444b75 PCMPEQD %XMM6,%XMM0 |
0x444b79 PSHUFD $-0xb,%XMM0,%XMM6 |
0x444b7e PAND %XMM4,%XMM6 |
0x444b82 PSHUFD $-0xb,%XMM3,%XMM0 |
0x444b87 POR %XMM6,%XMM0 |
0x444b8b PACKSSDW %XMM1,%XMM0 |
0x444b8f MOVAPD -0x130(%RBP),%XMM4 |
0x444b97 MOVAPD -0x400(%RBP),%XMM6 |
0x444b9f PSHUFD $-0x6,%XMM8,%XMM1 |
0x444ba5 PSLLD $0x1f,%XMM1 |
0x444baa PSRAD $0x1f,%XMM1 |
0x444baf MOVAPD %XMM5,%XMM3 |
0x444bb3 ANDPD %XMM1,%XMM3 |
0x444bb7 ANDNPD %XMM6,%XMM1 |
0x444bbb MOVAPD %XMM1,%XMM6 |
0x444bbf ORPD %XMM3,%XMM6 |
0x444bc3 PSHUFD $0x50,%XMM8,%XMM1 |
0x444bc9 PSLLD $0x1f,%XMM1 |
0x444bce PSRAD $0x1f,%XMM1 |
0x444bd3 MOVAPD %XMM2,%XMM3 |
0x444bd7 ANDPD %XMM1,%XMM3 |
0x444bdb ANDNPD %XMM4,%XMM1 |
0x444bdf MOVAPD %XMM1,%XMM4 |
0x444be3 ORPD %XMM3,%XMM4 |
0x444be7 PAND %XMM0,%XMM8 |
0x444bec MOVDQA %XMM8,%XMM0 |
0x444bf1 PSLLD $0x1f,%XMM0 |
0x444bf6 MOVMSKPS %XMM0,%ECX |
0x444bf9 MOVAPD %XMM2,%XMM7 |
0x444bfd MOVAPD %XMM5,%XMM11 |
0x444c02 TEST %ECX,%ECX |
0x444c04 JE 4442b0 |
0x444c0a MOVDQA %XMM8,%XMM0 |
0x444c0f PSLLD $0x1f,%XMM0 |
0x444c14 MOVMSKPS %XMM0,%ECX |
0x444c17 TEST %ECX,%ECX |
0x444c19 JE 444fb0 |
0x444c1f MOVAPS %XMM6,-0x400(%RBP) |
0x444c26 MOVAPS %XMM4,-0x130(%RBP) |
0x444c2d MOVQ %RAX,%XMM0 |
0x444c32 PSHUFD $0x44,%XMM0,%XMM4 |
0x444c37 MOVDQA -0x3b0(%RBP),%XMM0 |
0x444c3f PMULUDQ %XMM4,%XMM0 |
0x444c43 MOVDQA %XMM4,%XMM1 |
0x444c47 PSRLQ $0x20,%XMM1 |
0x444c4c MOVDQA -0x1d0(%RBP),%XMM3 |
0x444c54 MOVDQA %XMM3,%XMM2 |
0x444c58 PMULUDQ %XMM1,%XMM2 |
0x444c5c PADDQ %XMM0,%XMM2 |
0x444c60 PSLLQ $0x20,%XMM2 |
0x444c65 PMULUDQ %XMM4,%XMM3 |
0x444c69 PADDQ %XMM2,%XMM3 |
0x444c6d MOVDQA -0x3a0(%RBP),%XMM0 |
0x444c75 PADDQ %XMM3,%XMM0 |
0x444c79 MOVDQA %XMM0,-0x150(%RBP) |
0x444c81 PADDQ -0x390(%RBP),%XMM3 |
0x444c89 MOVDQA %XMM3,-0x160(%RBP) |
0x444c91 MOVDQA -0x380(%RBP),%XMM0 |
0x444c99 PMULUDQ %XMM4,%XMM0 |
0x444c9d MOVDQA -0x1c0(%RBP),%XMM2 |
0x444ca5 PMULUDQ %XMM2,%XMM1 |
0x444ca9 PADDQ %XMM0,%XMM1 |
0x444cad PSLLQ $0x20,%XMM1 |
0x444cb2 PMULUDQ %XMM2,%XMM4 |
0x444cb6 PADDQ %XMM1,%XMM4 |
0x444cba MOVDQA -0x3f0(%RBP),%XMM0 |
0x444cc2 PADDQ %XMM4,%XMM0 |
0x444cc6 MOVDQA %XMM0,-0x140(%RBP) |
0x444cce PADDQ -0x3e0(%RBP),%XMM4 |
0x444cd6 MOVDQA %XMM4,-0x170(%RBP) |
0x444cde MOV $0x1,%ECX |
0x444ce3 MOVDQA 0x465e4(%RIP),%XMM15 |
0x444cec MOVDQA %XMM8,-0x100(%RBP) |
0x444cf5 JMP 444e33 |
(373) 0x444d00 MOVDQA -0x1e0(%RBP),%XMM10 |
(373) 0x444d09 PAND %XMM14,%XMM6 |
(373) 0x444d0e PANDN %XMM13,%XMM14 |
(373) 0x444d13 MOVDQA %XMM14,%XMM13 |
(373) 0x444d18 POR %XMM6,%XMM13 |
(373) 0x444d1d PAND %XMM1,%XMM0 |
(373) 0x444d21 PANDN %XMM12,%XMM1 |
(373) 0x444d26 MOVDQA %XMM1,%XMM12 |
(373) 0x444d2b POR %XMM0,%XMM12 |
(373) 0x444d30 MOVDQA %XMM12,%XMM0 |
(373) 0x444d35 MULPD %XMM12,%XMM0 |
(373) 0x444d3a ADDPD %XMM9,%XMM0 |
(373) 0x444d3f MOVDQA %XMM13,%XMM1 |
(373) 0x444d44 MULPD %XMM13,%XMM1 |
(373) 0x444d49 ADDPD %XMM3,%XMM1 |
(373) 0x444d4d MOVAPD 0x4684b(%RIP),%XMM3 |
(373) 0x444d55 MULPD %XMM3,%XMM0 |
(373) 0x444d59 ADDPD %XMM0,%XMM11 |
(373) 0x444d5e MULPD %XMM3,%XMM1 |
(373) 0x444d62 ADDPD %XMM1,%XMM7 |
(373) 0x444d66 MOVQ %RCX,%XMM0 |
(373) 0x444d6b PSHUFD $0x44,%XMM0,%XMM1 |
(373) 0x444d70 PXOR 0x49728(%RIP),%XMM1 |
(373) 0x444d78 MOVDQA -0x430(%RBP),%XMM4 |
(373) 0x444d80 MOVDQA %XMM4,%XMM3 |
(373) 0x444d84 PCMPGTD %XMM1,%XMM3 |
(373) 0x444d88 MOVDQA -0x420(%RBP),%XMM6 |
(373) 0x444d90 MOVDQA %XMM6,%XMM0 |
(373) 0x444d94 PCMPGTD %XMM1,%XMM0 |
(373) 0x444d98 PCMPEQD %XMM1,%XMM4 |
(373) 0x444d9c PCMPEQD %XMM6,%XMM1 |
(373) 0x444da0 SHUFPS $-0x23,%XMM4,%XMM1 |
(373) 0x444da4 MOVDQA %XMM0,%XMM4 |
(373) 0x444da8 SHUFPS $-0x78,%XMM3,%XMM4 |
(373) 0x444dac ANDPS %XMM4,%XMM1 |
(373) 0x444daf SHUFPS $-0x23,%XMM3,%XMM0 |
(373) 0x444db3 ORPS %XMM1,%XMM0 |
(373) 0x444db6 PSHUFD $-0x6,%XMM15,%XMM1 |
(373) 0x444dbc PSLLD $0x1f,%XMM1 |
(373) 0x444dc1 PSRAD $0x1f,%XMM1 |
(373) 0x444dc6 MOVAPD %XMM11,%XMM3 |
(373) 0x444dcb ANDPD %XMM1,%XMM3 |
(373) 0x444dcf ANDNPD %XMM5,%XMM1 |
(373) 0x444dd3 MOVAPD %XMM1,%XMM5 |
(373) 0x444dd7 ORPD %XMM3,%XMM5 |
(373) 0x444ddb PSHUFD $0x50,%XMM15,%XMM1 |
(373) 0x444de1 PSLLD $0x1f,%XMM1 |
(373) 0x444de6 PSRAD $0x1f,%XMM1 |
(373) 0x444deb MOVAPD %XMM7,%XMM3 |
(373) 0x444def ANDPD %XMM1,%XMM3 |
(373) 0x444df3 ANDNPD %XMM2,%XMM1 |
(373) 0x444df7 MOVAPD %XMM1,%XMM2 |
(373) 0x444dfb ORPD %XMM3,%XMM2 |
(373) 0x444dff PAND %XMM0,%XMM15 |
(373) 0x444e04 MOVDQA -0x100(%RBP),%XMM8 |
(373) 0x444e0d MOVDQA %XMM8,%XMM0 |
(373) 0x444e12 PAND %XMM15,%XMM0 |
(373) 0x444e17 PSLLD $0x1f,%XMM0 |
(373) 0x444e1c MOVMSKPS %XMM0,%EDX |
(373) 0x444e1f INC %RCX |
(373) 0x444e22 TEST %EDX,%EDX |
(373) 0x444e24 MOVDQA -0x410(%RBP),%XMM14 |
(373) 0x444e2d JE 444b20 |
(373) 0x444e33 LEA -0x1(%RCX),%RDX |
(373) 0x444e37 MOVDQA %XMM8,%XMM1 |
(373) 0x444e3c PAND %XMM15,%XMM1 |
(373) 0x444e41 MOVQ %RDX,%XMM0 |
(373) 0x444e46 PSHUFD $0x44,%XMM0,%XMM8 |
(373) 0x444e4c MOVDQA -0x160(%RBP),%XMM0 |
(373) 0x444e54 PADDQ %XMM8,%XMM0 |
(373) 0x444e59 PSLLQ $0x3,%XMM0 |
(373) 0x444e5e PADDQ %XMM10,%XMM0 |
(373) 0x444e63 MOVDQA %XMM1,%XMM3 |
(373) 0x444e67 PSLLD $0x1f,%XMM3 |
(373) 0x444e6c MOVMSKPS %XMM3,%EDX |
(373) 0x444e6f TEST $0x1,%DL |
(373) 0x444e72 JE 444e7d |
(373) 0x444e74 MOVQ %XMM0,%RDI |
(373) 0x444e79 MOVSD (%RDI),%XMM3 |
(373) 0x444e7d TEST $0x2,%DL |
(373) 0x444e80 JE 444e8f |
(373) 0x444e82 PSHUFD $-0x12,%XMM0,%XMM0 |
(373) 0x444e87 MOVQ %XMM0,%RDI |
(373) 0x444e8c MOVHPS (%RDI),%XMM3 |
(373) 0x444e8f MOVDQA -0x150(%RBP),%XMM0 |
(373) 0x444e97 PADDQ %XMM8,%XMM0 |
(373) 0x444e9c PSLLQ $0x3,%XMM0 |
(373) 0x444ea1 PADDQ %XMM10,%XMM0 |
(373) 0x444ea6 TEST $0x4,%DL |
(373) 0x444ea9 JE 444ec0 |
(373) 0x444eab MOVQ %XMM0,%RDI |
(373) 0x444eb0 MOVLPS (%RDI),%XMM9 |
(373) 0x444eb4 TEST $0x8,%DL |
(373) 0x444eb7 JNE 444ec5 |
(373) 0x444eb9 JMP 444ed3 |
(373) 0x444ec0 TEST $0x8,%DL |
(373) 0x444ec3 JE 444ed3 |
(373) 0x444ec5 PSHUFD $-0x12,%XMM0,%XMM0 |
(373) 0x444eca MOVQ %XMM0,%RDI |
(373) 0x444ecf MOVHPS (%RDI),%XMM9 |
(373) 0x444ed3 MOVDQA -0x170(%RBP),%XMM0 |
(373) 0x444edb PADDQ %XMM8,%XMM0 |
(373) 0x444ee0 PSLLQ $0x3,%XMM0 |
(373) 0x444ee5 PADDQ %XMM14,%XMM0 |
(373) 0x444eea TEST $0x1,%DL |
(373) 0x444eed JE 444ef8 |
(373) 0x444eef MOVQ %XMM0,%RDI |
(373) 0x444ef4 MOVSD (%RDI),%XMM6 |
(373) 0x444ef8 TEST $0x2,%DL |
(373) 0x444efb JE 444f0a |
(373) 0x444efd PSHUFD $-0x12,%XMM0,%XMM0 |
(373) 0x444f02 MOVQ %XMM0,%RDI |
(373) 0x444f07 MOVHPS (%RDI),%XMM6 |
(373) 0x444f0a PADDQ -0x140(%RBP),%XMM8 |
(373) 0x444f13 PSLLQ $0x3,%XMM8 |
(373) 0x444f19 PADDQ %XMM14,%XMM8 |
(373) 0x444f1e TEST $0x4,%DL |
(373) 0x444f21 JE 444f30 |
(373) 0x444f23 MOVQ %XMM8,%RDI |
(373) 0x444f28 MOVLPS (%RDI),%XMM0 |
(373) 0x444f2b JMP 444f30 |
(373) 0x444f30 PSHUFD $0x50,%XMM1,%XMM14 |
(373) 0x444f36 PSLLD $0x1f,%XMM14 |
(373) 0x444f3c PSRAD $0x1f,%XMM14 |
(373) 0x444f42 MOVDQA %XMM14,%XMM10 |
(373) 0x444f47 PANDN -0x50(%RBP),%XMM10 |
(373) 0x444f4d PAND %XMM14,%XMM3 |
(373) 0x444f52 POR %XMM10,%XMM3 |
(373) 0x444f57 PSHUFD $-0x6,%XMM1,%XMM1 |
(373) 0x444f5c PSLLD $0x1f,%XMM1 |
(373) 0x444f61 PSRAD $0x1f,%XMM1 |
(373) 0x444f66 MOVDQA %XMM1,%XMM4 |
(373) 0x444f6a PANDN -0xa0(%RBP),%XMM4 |
(373) 0x444f72 PAND %XMM1,%XMM9 |
(373) 0x444f77 POR %XMM4,%XMM9 |
(373) 0x444f7c MOVDQA %XMM9,-0xa0(%RBP) |
(373) 0x444f85 MULPD %XMM9,%XMM9 |
(373) 0x444f8a MOVDQA %XMM3,-0x50(%RBP) |
(373) 0x444f8f MULPD %XMM3,%XMM3 |
(373) 0x444f93 TEST $0x8,%DL |
(373) 0x444f96 JE 444d00 |
(373) 0x444f9c PSHUFD $-0x12,%XMM8,%XMM8 |
(373) 0x444fa2 MOVQ %XMM8,%RDX |
(373) 0x444fa7 MOVHPS (%RDX),%XMM0 |
(373) 0x444faa JMP 444d00 |
0x444fb0 PXOR %XMM2,%XMM2 |
0x444fb4 PXOR %XMM5,%XMM5 |
0x444fb8 XOR %EAX,%EAX |
0x444fba PXOR %XMM0,%XMM0 |
0x444fbe JMP 444b9f |
/beegfs/hackathon/users/eoseret/qaas_runs/170-854-8685/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/field_summary.cpp: 80 - 82 |
-------------------------------------------------------------------------------- |
80: for (int kv = k; kv <= k + 1; ++kv) { |
81: for (int jv = j; jv <= j + 1; ++jv) { |
82: vsqrd += 0.25 * (field.xvel0(jv, kv) * field.xvel0(jv, kv) + field.yvel0(jv, kv) * field.yvel0(jv, kv)); |
/beegfs/hackathon/users/eoseret/qaas_runs/170-854-8685/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/context.h: 69 - 69 |
-------------------------------------------------------------------------------- |
69: T &operator()(size_t i, size_t j) const { return data[i + j * sizeX]; } |
| Path / |
| Metric | Value |
|---|---|
| CQA speedup if no scalar integer | 1.05 |
| CQA speedup if FP arith vectorized | 1.00 |
| CQA speedup if fully vectorized | 5.21 |
| CQA speedup if no inter-iteration dependency | NA |
| CQA speedup if next bottleneck killed | 1.25 |
| Bottlenecks | micro-operation queue, |
| Function | _Z13field_summaryR16global_variablesR9parallel_.extracted |
| Source | field_summary.cpp:80-82 |
| Source loop unroll info | NA |
| Source loop unroll confidence level | NA |
| Unroll/vectorization loop type | NA |
| Unroll factor | NA |
| CQA cycles | 16.33 |
| CQA cycles if no scalar integer | 15.50 |
| CQA cycles if FP arith vectorized | 16.33 |
| CQA cycles if fully vectorized | 3.14 |
| Front-end cycles | 16.33 |
| DIV/SQRT cycles | 2.00 |
| P0 cycles | 1.50 |
| P1 cycles | 1.25 |
| P2 cycles | 1.25 |
| P3 cycles | 2.00 |
| P4 cycles | 7.00 |
| P5 cycles | 7.00 |
| P6 cycles | 7.00 |
| P7 cycles | 13.00 |
| P8 cycles | 12.92 |
| P9 cycles | 13.08 |
| P10 cycles | 13.00 |
| P11 cycles | 4.50 |
| P12 cycles | 4.50 |
| P13 cycles | 0.00 |
| Inter-iter dependencies cycles | NA |
| FE+BE cycles (UFS) | NA |
| Stall cycles (UFS) | NA |
| Nb insns | 96.00 |
| Nb uops | 98.00 |
| Nb loads | 14.00 |
| Nb stores | 7.00 |
| Nb stack references | 17.00 |
| FLOP/cycle | 0.00 |
| Nb FLOP add-sub | 0.00 |
| Nb FLOP mul | 0.00 |
| Nb FLOP fma | 0.00 |
| Nb FLOP div | 0.00 |
| Nb FLOP rcp | 0.00 |
| Nb FLOP sqrt | 0.00 |
| Nb FLOP rsqrt | 0.00 |
| Bytes/cycle | 20.57 |
| Bytes prefetched | 0.00 |
| Bytes loaded | 224.00 |
| Bytes stored | 112.00 |
| Stride 0 | NA |
| Stride 1 | NA |
| Stride n | NA |
| Stride unknown | NA |
| Stride indirect | NA |
| Vectorization ratio all | 94.44 |
| Vectorization ratio load | 100.00 |
| Vectorization ratio store | 100.00 |
| Vectorization ratio mul | 100.00 |
| Vectorization ratio add_sub | 88.89 |
| Vectorization ratio fma | NA |
| Vectorization ratio div_sqrt | NA |
| Vectorization ratio other | 92.98 |
| Vector-efficiency ratio all | 24.17 |
| Vector-efficiency ratio load | 25.00 |
| Vector-efficiency ratio store | 25.00 |
| Vector-efficiency ratio mul | 25.00 |
| Vector-efficiency ratio add_sub | 23.61 |
| Vector-efficiency ratio fma | NA |
| Vector-efficiency ratio div_sqrt | NA |
| Vector-efficiency ratio other | 23.90 |
| Metric | Value |
|---|---|
| CQA speedup if no scalar integer | 1.05 |
| CQA speedup if FP arith vectorized | 1.00 |
| CQA speedup if fully vectorized | 5.21 |
| CQA speedup if no inter-iteration dependency | NA |
| CQA speedup if next bottleneck killed | 1.25 |
| Bottlenecks | micro-operation queue, |
| Function | _Z13field_summaryR16global_variablesR9parallel_.extracted |
| Source | field_summary.cpp:80-82 |
| Source loop unroll info | NA |
| Source loop unroll confidence level | NA |
| Unroll/vectorization loop type | NA |
| Unroll factor | NA |
| CQA cycles | 16.33 |
| CQA cycles if no scalar integer | 15.50 |
| CQA cycles if FP arith vectorized | 16.33 |
| CQA cycles if fully vectorized | 3.14 |
| Front-end cycles | 16.33 |
| DIV/SQRT cycles | 2.00 |
| P0 cycles | 1.50 |
| P1 cycles | 1.25 |
| P2 cycles | 1.25 |
| P3 cycles | 2.00 |
| P4 cycles | 7.00 |
| P5 cycles | 7.00 |
| P6 cycles | 7.00 |
| P7 cycles | 13.00 |
| P8 cycles | 12.92 |
| P9 cycles | 13.08 |
| P10 cycles | 13.00 |
| P11 cycles | 4.50 |
| P12 cycles | 4.50 |
| P13 cycles | 0.00 |
| Inter-iter dependencies cycles | NA |
| FE+BE cycles (UFS) | NA |
| Stall cycles (UFS) | NA |
| Nb insns | 96.00 |
| Nb uops | 98.00 |
| Nb loads | 14.00 |
| Nb stores | 7.00 |
| Nb stack references | 17.00 |
| FLOP/cycle | 0.00 |
| Nb FLOP add-sub | 0.00 |
| Nb FLOP mul | 0.00 |
| Nb FLOP fma | 0.00 |
| Nb FLOP div | 0.00 |
| Nb FLOP rcp | 0.00 |
| Nb FLOP sqrt | 0.00 |
| Nb FLOP rsqrt | 0.00 |
| Bytes/cycle | 20.57 |
| Bytes prefetched | 0.00 |
| Bytes loaded | 224.00 |
| Bytes stored | 112.00 |
| Stride 0 | NA |
| Stride 1 | NA |
| Stride n | NA |
| Stride unknown | NA |
| Stride indirect | NA |
| Vectorization ratio all | 94.44 |
| Vectorization ratio load | 100.00 |
| Vectorization ratio store | 100.00 |
| Vectorization ratio mul | 100.00 |
| Vectorization ratio add_sub | 88.89 |
| Vectorization ratio fma | NA |
| Vectorization ratio div_sqrt | NA |
| Vectorization ratio other | 92.98 |
| Vector-efficiency ratio all | 24.17 |
| Vector-efficiency ratio load | 25.00 |
| Vector-efficiency ratio store | 25.00 |
| Vector-efficiency ratio mul | 25.00 |
| Vector-efficiency ratio add_sub | 23.61 |
| Vector-efficiency ratio fma | NA |
| Vector-efficiency ratio div_sqrt | NA |
| Vector-efficiency ratio other | 23.90 |
| Path / |
| Function | _Z13field_summaryR16global_variablesR9parallel_.extracted |
| Source file and lines | field_summary.cpp:80-82 |
| Module | exec |
| nb instructions | 96 |
| nb uops | 98 |
| loop length | 493 |
| used x86 registers | 3 |
| used mmx registers | 0 |
| used xmm registers | 11 |
| used ymm registers | 0 |
| used zmm registers | 0 |
| nb stack references | 17 |
| micro-operation queue | 16.33 cycles |
| front end | 16.33 cycles |
| ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| uops | 2.00 | 1.50 | 1.25 | 1.25 | 2.00 | 7.00 | 7.00 | 7.00 | 13.00 | 12.92 | 13.08 | 13.00 | 4.50 | 4.50 |
| cycles | 2.00 | 1.50 | 1.25 | 1.25 | 2.00 | 7.00 | 7.00 | 7.00 | 13.00 | 12.92 | 13.08 | 13.00 | 4.50 | 4.50 |
| Cycles executing div or sqrt instructions | NA |
| Front-end | 16.33 |
| Dispatch | 13.08 |
| Overall L1 | 16.33 |
| all | 93% |
| load | 100% |
| store | 100% |
| mul | 100% |
| add-sub | 88% |
| fma | NA (no fma vectorizable/vectorized instructions) |
| other | 90% |
| all | 100% |
| load | 100% |
| store | 100% |
| mul | NA (no mul vectorizable/vectorized instructions) |
| add-sub | NA (no add-sub vectorizable/vectorized instructions) |
| fma | NA (no fma vectorizable/vectorized instructions) |
| div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
| other | 100% |
| all | 94% |
| load | 100% |
| store | 100% |
| mul | 100% |
| add-sub | 88% |
| fma | NA (no fma vectorizable/vectorized instructions) |
| div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
| other | 92% |
| all | 23% |
| load | 25% |
| store | 25% |
| mul | 25% |
| add-sub | 23% |
| fma | NA (no fma vectorizable/vectorized instructions) |
| other | 23% |
| all | 25% |
| load | 25% |
| store | 25% |
| mul | NA (no mul vectorizable/vectorized instructions) |
| add-sub | NA (no add-sub vectorizable/vectorized instructions) |
| fma | NA (no fma vectorizable/vectorized instructions) |
| div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
| other | 25% |
| all | 24% |
| load | 25% |
| store | 25% |
| mul | 25% |
| add-sub | 23% |
| fma | NA (no fma vectorizable/vectorized instructions) |
| div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
| other | 23% |
| Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| INC %RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
| MOVQ %RAX,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
| PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
| PXOR 0x4996b(%RIP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.50 |
| MOVDQA -0x3d0(%RBP),%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| MOVDQA %XMM4,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
| PCMPGTD %XMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| PSHUFD $-0x60,%XMM1,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
| PCMPEQD %XMM0,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| PSHUFD $-0xb,%XMM4,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
| PAND %XMM3,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| PSHUFD $-0xb,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
| POR %XMM4,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| MOVDQA -0x3c0(%RBP),%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| MOVDQA %XMM6,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
| PCMPGTD %XMM0,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| PSHUFD $-0x60,%XMM3,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
| PCMPEQD %XMM6,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| PSHUFD $-0xb,%XMM0,%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
| PAND %XMM4,%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| PSHUFD $-0xb,%XMM3,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
| POR %XMM6,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| PACKSSDW %XMM1,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
| MOVAPD -0x130(%RBP),%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| MOVAPD -0x400(%RBP),%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| PSHUFD $-0x6,%XMM8,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
| PSLLD $0x1f,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
| PSRAD $0x1f,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
| MOVAPD %XMM5,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
| ANDPD %XMM1,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| ANDNPD %XMM6,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| MOVAPD %XMM1,%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
| ORPD %XMM3,%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| PSHUFD $0x50,%XMM8,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
| PSLLD $0x1f,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
| PSRAD $0x1f,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
| MOVAPD %XMM2,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
| ANDPD %XMM1,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| ANDNPD %XMM4,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| MOVAPD %XMM1,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
| ORPD %XMM3,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| PAND %XMM0,%XMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| MOVDQA %XMM8,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
| PSLLD $0x1f,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
| MOVMSKPS %XMM0,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 6 | 1 |
| MOVAPD %XMM2,%XMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
| MOVAPD %XMM5,%XMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
| TEST %ECX,%ECX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
| JE 4442b0 <_Z13field_summaryR16global_variablesR9parallel_.extracted+0x300> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
| MOVDQA %XMM8,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
| PSLLD $0x1f,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
| MOVMSKPS %XMM0,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 6 | 1 |
| TEST %ECX,%ECX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
| JE 444fb0 <_Z13field_summaryR16global_variablesR9parallel_.extracted+0x1000> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
| MOVAPS %XMM6,-0x400(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
| MOVAPS %XMM4,-0x130(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
| MOVQ %RAX,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
| PSHUFD $0x44,%XMM0,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
| MOVDQA -0x3b0(%RBP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| PMULUDQ %XMM4,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| MOVDQA %XMM4,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
| PSRLQ $0x20,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
| MOVDQA -0x1d0(%RBP),%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| MOVDQA %XMM3,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
| PMULUDQ %XMM1,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| PADDQ %XMM0,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| PSLLQ $0x20,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
| PMULUDQ %XMM4,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| PADDQ %XMM2,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| MOVDQA -0x3a0(%RBP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| PADDQ %XMM3,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| MOVDQA %XMM0,-0x150(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
| PADDQ -0x390(%RBP),%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.50 |
| MOVDQA %XMM3,-0x160(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
| MOVDQA -0x380(%RBP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| PMULUDQ %XMM4,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| MOVDQA -0x1c0(%RBP),%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| PMULUDQ %XMM2,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| PADDQ %XMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| PSLLQ $0x20,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
| PMULUDQ %XMM2,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| PADDQ %XMM1,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| MOVDQA -0x3f0(%RBP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| PADDQ %XMM4,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| MOVDQA %XMM0,-0x140(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
| PADDQ -0x3e0(%RBP),%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.50 |
| MOVDQA %XMM4,-0x170(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
| MOV $0x1,%ECX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
| MOVDQA 0x465e4(%RIP),%XMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| MOVDQA %XMM8,-0x100(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
| JMP 444e33 <_Z13field_summaryR16global_variablesR9parallel_.extracted+0xe83> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
| PXOR %XMM2,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
| PXOR %XMM5,%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
| XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
| PXOR %XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
| JMP 444b9f <_Z13field_summaryR16global_variablesR9parallel_.extracted+0xbef> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
| Function | _Z13field_summaryR16global_variablesR9parallel_.extracted |
| Source file and lines | field_summary.cpp:80-82 |
| Module | exec |
| nb instructions | 96 |
| nb uops | 98 |
| loop length | 493 |
| used x86 registers | 3 |
| used mmx registers | 0 |
| used xmm registers | 11 |
| used ymm registers | 0 |
| used zmm registers | 0 |
| nb stack references | 17 |
| micro-operation queue | 16.33 cycles |
| front end | 16.33 cycles |
| ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| uops | 2.00 | 1.50 | 1.25 | 1.25 | 2.00 | 7.00 | 7.00 | 7.00 | 13.00 | 12.92 | 13.08 | 13.00 | 4.50 | 4.50 |
| cycles | 2.00 | 1.50 | 1.25 | 1.25 | 2.00 | 7.00 | 7.00 | 7.00 | 13.00 | 12.92 | 13.08 | 13.00 | 4.50 | 4.50 |
| Cycles executing div or sqrt instructions | NA |
| Front-end | 16.33 |
| Dispatch | 13.08 |
| Overall L1 | 16.33 |
| all | 93% |
| load | 100% |
| store | 100% |
| mul | 100% |
| add-sub | 88% |
| fma | NA (no fma vectorizable/vectorized instructions) |
| other | 90% |
| all | 100% |
| load | 100% |
| store | 100% |
| mul | NA (no mul vectorizable/vectorized instructions) |
| add-sub | NA (no add-sub vectorizable/vectorized instructions) |
| fma | NA (no fma vectorizable/vectorized instructions) |
| div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
| other | 100% |
| all | 94% |
| load | 100% |
| store | 100% |
| mul | 100% |
| add-sub | 88% |
| fma | NA (no fma vectorizable/vectorized instructions) |
| div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
| other | 92% |
| all | 23% |
| load | 25% |
| store | 25% |
| mul | 25% |
| add-sub | 23% |
| fma | NA (no fma vectorizable/vectorized instructions) |
| other | 23% |
| all | 25% |
| load | 25% |
| store | 25% |
| mul | NA (no mul vectorizable/vectorized instructions) |
| add-sub | NA (no add-sub vectorizable/vectorized instructions) |
| fma | NA (no fma vectorizable/vectorized instructions) |
| div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
| other | 25% |
| all | 24% |
| load | 25% |
| store | 25% |
| mul | 25% |
| add-sub | 23% |
| fma | NA (no fma vectorizable/vectorized instructions) |
| div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
| other | 23% |
| Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| INC %RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
| MOVQ %RAX,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
| PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
| PXOR 0x4996b(%RIP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.50 |
| MOVDQA -0x3d0(%RBP),%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| MOVDQA %XMM4,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
| PCMPGTD %XMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| PSHUFD $-0x60,%XMM1,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
| PCMPEQD %XMM0,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| PSHUFD $-0xb,%XMM4,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
| PAND %XMM3,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| PSHUFD $-0xb,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
| POR %XMM4,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| MOVDQA -0x3c0(%RBP),%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| MOVDQA %XMM6,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
| PCMPGTD %XMM0,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| PSHUFD $-0x60,%XMM3,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
| PCMPEQD %XMM6,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| PSHUFD $-0xb,%XMM0,%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
| PAND %XMM4,%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| PSHUFD $-0xb,%XMM3,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
| POR %XMM6,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| PACKSSDW %XMM1,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
| MOVAPD -0x130(%RBP),%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| MOVAPD -0x400(%RBP),%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| PSHUFD $-0x6,%XMM8,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
| PSLLD $0x1f,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
| PSRAD $0x1f,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
| MOVAPD %XMM5,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
| ANDPD %XMM1,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| ANDNPD %XMM6,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| MOVAPD %XMM1,%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
| ORPD %XMM3,%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| PSHUFD $0x50,%XMM8,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
| PSLLD $0x1f,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
| PSRAD $0x1f,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
| MOVAPD %XMM2,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
| ANDPD %XMM1,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| ANDNPD %XMM4,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| MOVAPD %XMM1,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
| ORPD %XMM3,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| PAND %XMM0,%XMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| MOVDQA %XMM8,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
| PSLLD $0x1f,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
| MOVMSKPS %XMM0,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 6 | 1 |
| MOVAPD %XMM2,%XMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
| MOVAPD %XMM5,%XMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
| TEST %ECX,%ECX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
| JE 4442b0 <_Z13field_summaryR16global_variablesR9parallel_.extracted+0x300> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
| MOVDQA %XMM8,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
| PSLLD $0x1f,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
| MOVMSKPS %XMM0,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 6 | 1 |
| TEST %ECX,%ECX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
| JE 444fb0 <_Z13field_summaryR16global_variablesR9parallel_.extracted+0x1000> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
| MOVAPS %XMM6,-0x400(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
| MOVAPS %XMM4,-0x130(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
| MOVQ %RAX,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
| PSHUFD $0x44,%XMM0,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
| MOVDQA -0x3b0(%RBP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| PMULUDQ %XMM4,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| MOVDQA %XMM4,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
| PSRLQ $0x20,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
| MOVDQA -0x1d0(%RBP),%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| MOVDQA %XMM3,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
| PMULUDQ %XMM1,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| PADDQ %XMM0,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| PSLLQ $0x20,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
| PMULUDQ %XMM4,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| PADDQ %XMM2,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| MOVDQA -0x3a0(%RBP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| PADDQ %XMM3,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| MOVDQA %XMM0,-0x150(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
| PADDQ -0x390(%RBP),%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.50 |
| MOVDQA %XMM3,-0x160(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
| MOVDQA -0x380(%RBP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| PMULUDQ %XMM4,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| MOVDQA -0x1c0(%RBP),%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| PMULUDQ %XMM2,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| PADDQ %XMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| PSLLQ $0x20,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
| PMULUDQ %XMM2,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| PADDQ %XMM1,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| MOVDQA -0x3f0(%RBP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| PADDQ %XMM4,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
| MOVDQA %XMM0,-0x140(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
| PADDQ -0x3e0(%RBP),%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.50 |
| MOVDQA %XMM4,-0x170(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
| MOV $0x1,%ECX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
| MOVDQA 0x465e4(%RIP),%XMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
| MOVDQA %XMM8,-0x100(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
| JMP 444e33 <_Z13field_summaryR16global_variablesR9parallel_.extracted+0xe83> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
| PXOR %XMM2,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
| PXOR %XMM5,%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
| XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
| PXOR %XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
| JMP 444b9f <_Z13field_summaryR16global_variablesR9parallel_.extracted+0xbef> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
