Loop Id: 1246 | Module: exec | Source: par_lr_interp.c:1221-1675 [...] | Coverage: 0.07% |
---|
Loop Id: 1246 | Module: exec | Source: par_lr_interp.c:1221-1675 [...] | Coverage: 0.07% |
---|
0x452650 MOV -0x98(%RBP),%RCX |
0x452657 MOV (%RCX),%RCX |
0x45265a VMOVSD (%RCX,%RAX,8),%XMM5 |
0x45265f MOV -0x50(%RBP),%RDX |
0x452663 VADDSD (%RDX,%R9,8),%XMM5,%XMM5 |
0x452669 VMOVSD %XMM5,(%RCX,%RAX,8) |
0x45266e INC %R9 |
0x452671 CMP -0x68(%RBP),%R9 |
0x452675 JE 4525a2 |
0x45267b MOV (%RBX,%R9,8),%R10 |
0x45267f MOV (%R13,%R10,8),%RAX |
0x452684 CMP %RDI,%RAX |
0x452687 JGE 452650 |
0x452689 CMP -0x80(%RBP),%RAX |
0x45268d JNE 452820 |
0x452693 MOV -0x188(%RBP),%RCX |
0x45269a MOV (%RCX,%R10,8),%R15 |
0x45269e VPXOR %XMM5,%XMM5,%XMM5 |
0x4526a2 XOR %EAX,%EAX |
0x4526a4 MOV -0x50(%RBP),%RDX |
0x4526a8 VUCOMISD (%RDX,%R15,8),%XMM5 |
0x4526ae MOV %R10,-0xf0(%RBP) |
0x4526b5 MOV 0x8(%RCX,%R10,8),%RCX |
0x4526ba SETBE %AL |
0x4526bd LEA -0x1(%RAX,%RAX,1),%RAX |
0x4526c2 MOV %RAX,-0xa8(%RBP) |
0x4526c9 LEA 0x1(%R15),%R10 |
0x4526cd CMP %RCX,%R10 |
0x4526d0 MOV %R15,-0x58(%RBP) |
0x4526d4 JGE 4526ff |
0x4526d6 VCVTSI2SDQ -0xa8(%RBP),%XMM9,%XMM6 |
0x4526df NOT %R15 |
0x4526e2 ADD %RCX,%R15 |
0x4526e5 CMP $0x4,%R15 |
0x4526e9 JAE 452865 |
0x4526ef MOV %R15,%RAX |
0x4526f2 AND $-0x4,%RAX |
0x4526f6 CMP %R15,%RAX |
0x4526f9 JNE 452958 |
0x4526ff MOV -0xc0(%RBP),%RAX |
0x452706 MOV (%RAX),%RAX |
0x452709 MOV %RAX,-0xe8(%RBP) |
0x452710 CMP $0x2,%RAX |
0x452714 JL 452770 |
0x452716 MOV -0x168(%RBP),%RAX |
0x45271d MOV -0xf0(%RBP),%RDX |
0x452724 MOV (%RAX,%RDX,8),%R12 |
0x452728 MOV 0x8(%RAX,%RDX,8),%R15 |
0x45272d MOV %R15,%RAX |
0x452730 SUB %R12,%RAX |
0x452733 JLE 452770 |
0x452735 VCVTSI2SDQ -0xa8(%RBP),%XMM9,%XMM6 |
0x45273e CMP $0x4,%RAX |
0x452742 MOV %RAX,-0xe0(%RBP) |
0x452749 JAE 4529ac |
0x45274f MOV -0xe0(%RBP),%RDX |
0x452756 MOV %RDX,%RAX |
0x452759 AND $-0x4,%RAX |
0x45275d CMP %RDX,%RAX |
0x452760 JNE 452a9c |
0x452766 MOV -0x30(%RBP),%R11 |
0x45276a NOPW (%RAX,%RAX,1) |
0x452770 VUCOMISD %XMM0,%XMM5 |
0x452774 MOV -0x50(%RBP),%RAX |
0x452778 VMOVSD (%RAX,%R9,8),%XMM6 |
0x45277e JE 452859 |
0x452784 VDIVSD %XMM5,%XMM6,%XMM5 |
0x452788 CMP %RCX,%R10 |
0x45278b MOV %R8,%R15 |
0x45278e JGE 452aff |
0x452794 VCVTSI2SDQ -0xa8(%RBP),%XMM9,%XMM6 |
0x45279d MOV -0x58(%RBP),%RDX |
0x4527a1 MOV %EDX,%EAX |
0x4527a3 NOT %EAX |
0x4527a5 ADD %ECX,%EAX |
0x4527a7 TEST $0x1,%AL |
0x4527a9 JE 452af6 |
0x4527af MOV 0x8(%RBX,%RDX,8),%RAX |
0x4527b4 MOV (%R13,%RAX,8),%RDX |
0x4527b9 CMP %RDI,%RDX |
0x4527bc JL 4527ed |
0x4527be MOV -0x50(%RBP),%R10 |
0x4527c2 MOV -0x58(%RBP),%R12 |
0x4527c6 VMOVSD 0x8(%R10,%R12,8),%XMM7 |
0x4527cd VMULSD %XMM6,%XMM7,%XMM8 |
0x4527d1 VUCOMISD %XMM0,%XMM8 |
0x4527d5 JAE 4527ed |
0x4527d7 MOV -0x98(%RBP),%R10 |
0x4527de MOV (%R10),%R10 |
0x4527e1 VFMADD213SD (%R10,%RDX,8),%XMM5,%XMM7 |
0x4527e7 VMOVSD %XMM7,(%R10,%RDX,8) |
0x4527ed CMP %R15,%RAX |
0x4527f0 JNE 452aee |
0x4527f6 MOV -0x50(%RBP),%RAX |
0x4527fa MOV -0x58(%RBP),%RDX |
0x4527fe VMOVSD 0x8(%RAX,%RDX,8),%XMM7 |
0x452804 VMULSD %XMM6,%XMM7,%XMM8 |
0x452808 VFMADD213SD %XMM4,%XMM5,%XMM7 |
0x45280d VCMPSD $0x1,%XMM0,%XMM8,%K1 |
0x452814 VMOVSD %XMM7,%XMM4,%XMM4{%K1} |
0x45281a JMP 452af2 |
0x452820 CMPQ $-0x3,(%R11,%R10,8) |
0x452825 JE 45266e |
0x45282b CMPQ $0x1,-0x180(%RBP) |
0x452833 JE 45284a |
0x452835 MOV -0x178(%RBP),%RCX |
0x45283c MOV (%RCX,%R15,8),%RAX |
0x452840 CMP (%RCX,%R10,8),%RAX |
0x452844 JNE 45266e |
0x45284a MOV -0x50(%RBP),%RAX |
0x45284e VADDSD (%RAX,%R9,8),%XMM4,%XMM4 |
0x452854 JMP 45266e |
0x452859 VADDSD %XMM4,%XMM6,%XMM4 |
0x45285d MOV %R8,%R15 |
0x452860 JMP 45266e |
0x452865 MOV %R15,%R12 |
0x452868 SHR $0x2,%R12 |
0x45286c MOV -0x58(%RBP),%RAX |
0x452870 LEA 0x20(,%RAX,8),%RAX |
0x452878 JMP 4528ab |
(1253) 0x452880 MOV -0x50(%RBP),%RDX |
(1253) 0x452884 VMOVSD (%RDX,%RAX,1),%XMM7 |
(1253) 0x452889 VMULSD %XMM6,%XMM7,%XMM8 |
(1253) 0x45288d VADDSD %XMM5,%XMM7,%XMM7 |
(1253) 0x452891 VCMPSD $0x1,%XMM0,%XMM8,%K1 |
(1253) 0x452898 VMOVSD %XMM7,%XMM5,%XMM5{%K1} |
(1253) 0x45289e ADD $0x20,%RAX |
(1253) 0x4528a2 DEC %R12 |
(1253) 0x4528a5 JE 4526ef |
(1253) 0x4528ab MOV -0x18(%RBX,%RAX,1),%RDX |
(1253) 0x4528b0 CMP %R8,%RDX |
(1253) 0x4528b3 JE 4528bc |
(1253) 0x4528b5 CMP %RDI,(%R13,%RDX,8) |
(1253) 0x4528ba JL 4528db |
(1253) 0x4528bc MOV -0x50(%RBP),%RDX |
(1253) 0x4528c0 VMOVSD -0x18(%RDX,%RAX,1),%XMM7 |
(1253) 0x4528c6 VMULSD %XMM6,%XMM7,%XMM8 |
(1253) 0x4528ca VADDSD %XMM5,%XMM7,%XMM7 |
(1253) 0x4528ce VCMPSD $0x1,%XMM0,%XMM8,%K1 |
(1253) 0x4528d5 VMOVSD %XMM7,%XMM5,%XMM5{%K1} |
(1253) 0x4528db MOV -0x10(%RBX,%RAX,1),%RDX |
(1253) 0x4528e0 CMP %R8,%RDX |
(1253) 0x4528e3 JE 4528ec |
(1253) 0x4528e5 CMP %RDI,(%R13,%RDX,8) |
(1253) 0x4528ea JL 45290b |
(1253) 0x4528ec MOV -0x50(%RBP),%RDX |
(1253) 0x4528f0 VMOVSD -0x10(%RDX,%RAX,1),%XMM7 |
(1253) 0x4528f6 VMULSD %XMM6,%XMM7,%XMM8 |
(1253) 0x4528fa VADDSD %XMM5,%XMM7,%XMM7 |
(1253) 0x4528fe VCMPSD $0x1,%XMM0,%XMM8,%K1 |
(1253) 0x452905 VMOVSD %XMM7,%XMM5,%XMM5{%K1} |
(1253) 0x45290b MOV -0x8(%RBX,%RAX,1),%RDX |
(1253) 0x452910 CMP %R8,%RDX |
(1253) 0x452913 JE 45291c |
(1253) 0x452915 CMP %RDI,(%R13,%RDX,8) |
(1253) 0x45291a JL 45293b |
(1253) 0x45291c MOV -0x50(%RBP),%RDX |
(1253) 0x452920 VMOVSD -0x8(%RDX,%RAX,1),%XMM7 |
(1253) 0x452926 VMULSD %XMM6,%XMM7,%XMM8 |
(1253) 0x45292a VADDSD %XMM5,%XMM7,%XMM7 |
(1253) 0x45292e VCMPSD $0x1,%XMM0,%XMM8,%K1 |
(1253) 0x452935 VMOVSD %XMM7,%XMM5,%XMM5{%K1} |
(1253) 0x45293b MOV (%RBX,%RAX,1),%RDX |
(1253) 0x45293f CMP %R8,%RDX |
(1253) 0x452942 JE 452880 |
(1253) 0x452948 CMP %RDI,(%R13,%RDX,8) |
(1253) 0x45294d JL 45289e |
(1253) 0x452953 JMP 452880 |
0x452958 MOV -0x58(%RBP),%RDX |
0x45295c LEA 0x1(%RDX,%RAX,1),%RAX |
0x452961 MOV %R8,%R15 |
0x452964 JMP 45299a |
(1252) 0x452970 MOV -0x50(%RBP),%RDX |
(1252) 0x452974 VMOVSD (%RDX,%RAX,8),%XMM7 |
(1252) 0x452979 VMULSD %XMM6,%XMM7,%XMM8 |
(1252) 0x45297d VADDSD %XMM5,%XMM7,%XMM7 |
(1252) 0x452981 VCMPSD $0x1,%XMM0,%XMM8,%K1 |
(1252) 0x452988 VMOVSD %XMM7,%XMM5,%XMM5{%K1} |
(1252) 0x45298e INC %RAX |
(1252) 0x452991 CMP %RAX,%RCX |
(1252) 0x452994 JE 4526ff |
(1252) 0x45299a MOV (%RBX,%RAX,8),%RDX |
(1252) 0x45299e CMP %R15,%RDX |
(1252) 0x4529a1 JE 452970 |
(1252) 0x4529a3 CMP %RDI,(%R13,%RDX,8) |
(1252) 0x4529a8 JL 45298e |
(1252) 0x4529aa JMP 452970 |
0x4529ac SHR $0x2,%RAX |
0x4529b0 LEA 0x18(,%R12,8),%RDX |
0x4529b8 JMP 4529cd |
(1251) 0x4529c0 ADD $0x20,%RDX |
(1251) 0x4529c4 DEC %RAX |
(1251) 0x4529c7 JE 45274f |
(1251) 0x4529cd MOV -0xa0(%RBP),%R11 |
(1251) 0x4529d4 MOV -0x18(%R11,%RDX,1),%R11 |
(1251) 0x4529d9 CMP %RSI,(%R14,%R11,8) |
(1251) 0x4529dd JL 4529ff |
(1251) 0x4529df MOV -0x70(%RBP),%R11 |
(1251) 0x4529e3 VMOVSD -0x18(%R11,%RDX,1),%XMM7 |
(1251) 0x4529ea VMULSD %XMM6,%XMM7,%XMM8 |
(1251) 0x4529ee VADDSD %XMM5,%XMM7,%XMM7 |
(1251) 0x4529f2 VCMPSD $0x1,%XMM0,%XMM8,%K1 |
(1251) 0x4529f9 VMOVSD %XMM7,%XMM5,%XMM5{%K1} |
(1251) 0x4529ff MOV -0xa0(%RBP),%R11 |
(1251) 0x452a06 MOV -0x10(%R11,%RDX,1),%R11 |
(1251) 0x452a0b CMP %RSI,(%R14,%R11,8) |
(1251) 0x452a0f JL 452a31 |
(1251) 0x452a11 MOV -0x70(%RBP),%R11 |
(1251) 0x452a15 VMOVSD -0x10(%R11,%RDX,1),%XMM7 |
(1251) 0x452a1c VMULSD %XMM6,%XMM7,%XMM8 |
(1251) 0x452a20 VADDSD %XMM5,%XMM7,%XMM7 |
(1251) 0x452a24 VCMPSD $0x1,%XMM0,%XMM8,%K1 |
(1251) 0x452a2b VMOVSD %XMM7,%XMM5,%XMM5{%K1} |
(1251) 0x452a31 MOV -0xa0(%RBP),%R11 |
(1251) 0x452a38 MOV -0x8(%R11,%RDX,1),%R11 |
(1251) 0x452a3d CMP %RSI,(%R14,%R11,8) |
(1251) 0x452a41 JL 452a63 |
(1251) 0x452a43 MOV -0x70(%RBP),%R11 |
(1251) 0x452a47 VMOVSD -0x8(%R11,%RDX,1),%XMM7 |
(1251) 0x452a4e VMULSD %XMM6,%XMM7,%XMM8 |
(1251) 0x452a52 VADDSD %XMM5,%XMM7,%XMM7 |
(1251) 0x452a56 VCMPSD $0x1,%XMM0,%XMM8,%K1 |
(1251) 0x452a5d VMOVSD %XMM7,%XMM5,%XMM5{%K1} |
(1251) 0x452a63 MOV -0xa0(%RBP),%R11 |
(1251) 0x452a6a MOV (%R11,%RDX,1),%R11 |
(1251) 0x452a6e CMP %RSI,(%R14,%R11,8) |
(1251) 0x452a72 JL 4529c0 |
(1251) 0x452a78 MOV -0x70(%RBP),%R11 |
(1251) 0x452a7c VMOVSD (%R11,%RDX,1),%XMM7 |
(1251) 0x452a82 VMULSD %XMM6,%XMM7,%XMM8 |
(1251) 0x452a86 VADDSD %XMM5,%XMM7,%XMM7 |
(1251) 0x452a8a VCMPSD $0x1,%XMM0,%XMM8,%K1 |
(1251) 0x452a91 VMOVSD %XMM7,%XMM5,%XMM5{%K1} |
(1251) 0x452a97 JMP 4529c0 |
0x452a9c ADD %RAX,%R12 |
0x452a9f MOV -0x30(%RBP),%R11 |
0x452aa3 JMP 452abc |
(1250) 0x452ab0 INC %R12 |
(1250) 0x452ab3 CMP %R12,%R15 |
(1250) 0x452ab6 JE 452770 |
(1250) 0x452abc MOV -0xa0(%RBP),%RAX |
(1250) 0x452ac3 MOV (%RAX,%R12,8),%RAX |
(1250) 0x452ac7 CMP %RSI,(%R14,%RAX,8) |
(1250) 0x452acb JL 452ab0 |
(1250) 0x452acd MOV -0x70(%RBP),%RAX |
(1250) 0x452ad1 VMOVSD (%RAX,%R12,8),%XMM7 |
(1250) 0x452ad7 VMULSD %XMM6,%XMM7,%XMM8 |
(1250) 0x452adb VADDSD %XMM5,%XMM7,%XMM7 |
(1250) 0x452adf VCMPSD $0x1,%XMM0,%XMM8,%K1 |
(1250) 0x452ae6 VMOVSD %XMM7,%XMM5,%XMM5{%K1} |
(1250) 0x452aec JMP 452ab0 |
0x452aee MOV -0x58(%RBP),%RDX |
0x452af2 LEA 0x2(%RDX),%R10 |
0x452af6 LEA -0x2(%RCX),%RAX |
0x452afa CMP %RDX,%RAX |
0x452afd JNE 452b79 |
0x452aff CMPQ $0x2,-0xe8(%RBP) |
0x452b07 JL 45266e |
0x452b0d MOV -0x168(%RBP),%RCX |
0x452b14 MOV -0xf0(%RBP),%RDX |
0x452b1b MOV (%RCX,%RDX,8),%RAX |
0x452b1f MOV 0x8(%RCX,%RDX,8),%RCX |
0x452b24 MOV %RCX,%R10 |
0x452b27 SUB %RAX,%R10 |
0x452b2a JLE 45266e |
0x452b30 VCVTSI2SDQ -0xa8(%RBP),%XMM9,%XMM6 |
0x452b39 CMP $0x4,%R10 |
0x452b3d JAE 452c4b |
0x452b43 MOV %R10,%RDX |
0x452b46 AND $-0x4,%RDX |
0x452b4a CMP %R10,%RDX |
0x452b4d JNE 452d78 |
0x452b53 MOV -0x30(%RBP),%R11 |
0x452b57 MOV -0xf8(%RBP),%RBX |
0x452b5e MOV %R8,%R15 |
0x452b61 JMP 45266e |
(1249) 0x452b70 ADD $0x2,%R10 |
(1249) 0x452b74 CMP %R10,%RCX |
(1249) 0x452b77 JE 452aff |
(1249) 0x452b79 MOV (%RBX,%R10,8),%RAX |
(1249) 0x452b7d MOV (%R13,%RAX,8),%RDX |
(1249) 0x452b82 CMP %RDI,%RDX |
(1249) 0x452b85 JL 452bb7 |
(1249) 0x452b87 MOV -0x50(%RBP),%R15 |
(1249) 0x452b8b VMOVSD (%R15,%R10,8),%XMM7 |
(1249) 0x452b91 MOV %R8,%R15 |
(1249) 0x452b94 VMULSD %XMM6,%XMM7,%XMM8 |
(1249) 0x452b98 VUCOMISD %XMM0,%XMM8 |
(1249) 0x452b9c JAE 452bb7 |
(1249) 0x452b9e MOV -0x98(%RBP),%R15 |
(1249) 0x452ba5 MOV (%R15),%R15 |
(1249) 0x452ba8 VFMADD213SD (%R15,%RDX,8),%XMM5,%XMM7 |
(1249) 0x452bae VMOVSD %XMM7,(%R15,%RDX,8) |
(1249) 0x452bb4 MOV %R8,%R15 |
(1249) 0x452bb7 CMP %R15,%RAX |
(1249) 0x452bba JNE 452bdc |
(1249) 0x452bbc MOV -0x50(%RBP),%RAX |
(1249) 0x452bc0 VMOVSD (%RAX,%R10,8),%XMM7 |
(1249) 0x452bc6 VMULSD %XMM6,%XMM7,%XMM8 |
(1249) 0x452bca VFMADD213SD %XMM4,%XMM5,%XMM7 |
(1249) 0x452bcf VCMPSD $0x1,%XMM0,%XMM8,%K1 |
(1249) 0x452bd6 VMOVSD %XMM7,%XMM4,%XMM4{%K1} |
(1249) 0x452bdc MOV 0x8(%RBX,%R10,8),%RAX |
(1249) 0x452be1 MOV (%R13,%RAX,8),%RDX |
(1249) 0x452be6 CMP %RDI,%RDX |
(1249) 0x452be9 JL 452c1c |
(1249) 0x452beb MOV -0x50(%RBP),%R15 |
(1249) 0x452bef VMOVSD 0x8(%R15,%R10,8),%XMM7 |
(1249) 0x452bf6 MOV %R8,%R15 |
(1249) 0x452bf9 VMULSD %XMM6,%XMM7,%XMM8 |
(1249) 0x452bfd VUCOMISD %XMM0,%XMM8 |
(1249) 0x452c01 JAE 452c1c |
(1249) 0x452c03 MOV -0x98(%RBP),%R15 |
(1249) 0x452c0a MOV (%R15),%R15 |
(1249) 0x452c0d VFMADD213SD (%R15,%RDX,8),%XMM5,%XMM7 |
(1249) 0x452c13 VMOVSD %XMM7,(%R15,%RDX,8) |
(1249) 0x452c19 MOV %R8,%R15 |
(1249) 0x452c1c CMP %R15,%RAX |
(1249) 0x452c1f JNE 452b70 |
(1249) 0x452c25 MOV -0x50(%RBP),%RAX |
(1249) 0x452c29 VMOVSD 0x8(%RAX,%R10,8),%XMM7 |
(1249) 0x452c30 VMULSD %XMM6,%XMM7,%XMM8 |
(1249) 0x452c34 VFMADD213SD %XMM4,%XMM5,%XMM7 |
(1249) 0x452c39 VCMPSD $0x1,%XMM0,%XMM8,%K1 |
(1249) 0x452c40 VMOVSD %XMM7,%XMM4,%XMM4{%K1} |
(1249) 0x452c46 JMP 452b70 |
0x452c4b MOV %R10,%RDX |
0x452c4e SHR $0x2,%RDX |
0x452c52 LEA 0x18(,%RAX,8),%R11 |
0x452c5a JMP 452c6d |
(1248) 0x452c60 ADD $0x20,%R11 |
(1248) 0x452c64 DEC %RDX |
(1248) 0x452c67 JE 452b43 |
(1248) 0x452c6d MOV -0xa0(%RBP),%R15 |
(1248) 0x452c74 MOV -0x18(%R15,%R11,1),%R15 |
(1248) 0x452c79 MOV (%R14,%R15,8),%R15 |
(1248) 0x452c7d CMP %RSI,%R15 |
(1248) 0x452c80 JL 452cad |
(1248) 0x452c82 MOV -0x70(%RBP),%RBX |
(1248) 0x452c86 VMOVSD -0x18(%RBX,%R11,1),%XMM7 |
(1248) 0x452c8d VMULSD %XMM6,%XMM7,%XMM8 |
(1248) 0x452c91 VUCOMISD %XMM0,%XMM8 |
(1248) 0x452c95 JAE 452cad |
(1248) 0x452c97 MOV -0x88(%RBP),%RBX |
(1248) 0x452c9e MOV (%RBX),%R12 |
(1248) 0x452ca1 VFMADD213SD (%R12,%R15,8),%XMM5,%XMM7 |
(1248) 0x452ca7 VMOVSD %XMM7,(%R12,%R15,8) |
(1248) 0x452cad MOV -0xa0(%RBP),%R15 |
(1248) 0x452cb4 MOV -0x10(%R15,%R11,1),%R15 |
(1248) 0x452cb9 MOV (%R14,%R15,8),%R15 |
(1248) 0x452cbd CMP %RSI,%R15 |
(1248) 0x452cc0 JL 452ced |
(1248) 0x452cc2 MOV -0x70(%RBP),%RBX |
(1248) 0x452cc6 VMOVSD -0x10(%RBX,%R11,1),%XMM7 |
(1248) 0x452ccd VMULSD %XMM6,%XMM7,%XMM8 |
(1248) 0x452cd1 VUCOMISD %XMM0,%XMM8 |
(1248) 0x452cd5 JAE 452ced |
(1248) 0x452cd7 MOV -0x88(%RBP),%RBX |
(1248) 0x452cde MOV (%RBX),%R12 |
(1248) 0x452ce1 VFMADD213SD (%R12,%R15,8),%XMM5,%XMM7 |
(1248) 0x452ce7 VMOVSD %XMM7,(%R12,%R15,8) |
(1248) 0x452ced MOV -0xa0(%RBP),%R15 |
(1248) 0x452cf4 MOV -0x8(%R15,%R11,1),%R15 |
(1248) 0x452cf9 MOV (%R14,%R15,8),%R15 |
(1248) 0x452cfd CMP %RSI,%R15 |
(1248) 0x452d00 JL 452d2d |
(1248) 0x452d02 MOV -0x70(%RBP),%RBX |
(1248) 0x452d06 VMOVSD -0x8(%RBX,%R11,1),%XMM7 |
(1248) 0x452d0d VMULSD %XMM6,%XMM7,%XMM8 |
(1248) 0x452d11 VUCOMISD %XMM0,%XMM8 |
(1248) 0x452d15 JAE 452d2d |
(1248) 0x452d17 MOV -0x88(%RBP),%RBX |
(1248) 0x452d1e MOV (%RBX),%R12 |
(1248) 0x452d21 VFMADD213SD (%R12,%R15,8),%XMM5,%XMM7 |
(1248) 0x452d27 VMOVSD %XMM7,(%R12,%R15,8) |
(1248) 0x452d2d MOV -0xa0(%RBP),%R15 |
(1248) 0x452d34 MOV (%R15,%R11,1),%R15 |
(1248) 0x452d38 MOV (%R14,%R15,8),%R15 |
(1248) 0x452d3c CMP %RSI,%R15 |
(1248) 0x452d3f JL 452c60 |
(1248) 0x452d45 MOV -0x70(%RBP),%RBX |
(1248) 0x452d49 VMOVSD (%RBX,%R11,1),%XMM7 |
(1248) 0x452d4f VMULSD %XMM6,%XMM7,%XMM8 |
(1248) 0x452d53 VUCOMISD %XMM0,%XMM8 |
(1248) 0x452d57 JAE 452c60 |
(1248) 0x452d5d MOV -0x88(%RBP),%RBX |
(1248) 0x452d64 MOV (%RBX),%R12 |
(1248) 0x452d67 VFMADD213SD (%R12,%R15,8),%XMM5,%XMM7 |
(1248) 0x452d6d VMOVSD %XMM7,(%R12,%R15,8) |
(1248) 0x452d73 JMP 452c60 |
0x452d78 ADD %RDX,%RAX |
0x452d7b MOV -0x30(%RBP),%R11 |
0x452d7f MOV -0xf8(%RBP),%RBX |
0x452d86 MOV %R8,%R15 |
0x452d89 JMP 452d9c |
(1247) 0x452d90 INC %RAX |
(1247) 0x452d93 CMP %RAX,%RCX |
(1247) 0x452d96 JE 45266e |
(1247) 0x452d9c MOV -0xa0(%RBP),%RDX |
(1247) 0x452da3 MOV (%RDX,%RAX,8),%RDX |
(1247) 0x452da7 MOV (%R14,%RDX,8),%RDX |
(1247) 0x452dab CMP %RSI,%RDX |
(1247) 0x452dae JL 452d90 |
(1247) 0x452db0 MOV -0x70(%RBP),%R10 |
(1247) 0x452db4 VMOVSD (%R10,%RAX,8),%XMM7 |
(1247) 0x452dba VMULSD %XMM6,%XMM7,%XMM8 |
(1247) 0x452dbe VUCOMISD %XMM0,%XMM8 |
(1247) 0x452dc2 JAE 452d90 |
(1247) 0x452dc4 MOV -0x88(%RBP),%R10 |
(1247) 0x452dcb MOV (%R10),%R10 |
(1247) 0x452dce VFMADD213SD (%R10,%RDX,8),%XMM5,%XMM7 |
(1247) 0x452dd4 VMOVSD %XMM7,(%R10,%RDX,8) |
(1247) 0x452dda JMP 452d90 |
/scratch_na/users/xoserete/qaas_runs/171-415-3661/intel/AMG/build/AMG/AMG/parcsr_ls/par_lr_interp.c: 1221 - 1675 |
-------------------------------------------------------------------------------- |
1221: if (n_fine) |
[...] |
1609: for (jj = A_diag_i[i]+1; jj < A_diag_i[i+1]; jj++) |
1610: { /* i1 is a c-point and strongly influences i, accumulate |
1611: * a_(i,i1) into interpolation weight */ |
1612: i1 = A_diag_j[jj]; |
1613: if (P_marker[i1] >= jj_begin_row) |
1614: { |
1615: P_diag_data[P_marker[i1]] += A_diag_data[jj]; |
1616: } |
1617: else if(P_marker[i1] == strong_f_marker) |
1618: { |
1619: sum = zero; |
1620: sgn = 1; |
1621: if(A_diag_data[A_diag_i[i1]] < 0) sgn = -1; |
1622: /* Loop over row of A for point i1 and calculate the sum |
1623: * of the connections to c-points that strongly influence i. */ |
1624: for(jj1 = A_diag_i[i1]+1; jj1 < A_diag_i[i1+1]; jj1++) |
1625: { |
1626: i2 = A_diag_j[jj1]; |
1627: if((P_marker[i2] >= jj_begin_row || i2 == i) && (sgn*A_diag_data[jj1]) < 0) |
1628: sum += A_diag_data[jj1]; |
1629: } |
1630: if(num_procs > 1) |
1631: { |
1632: for(jj1 = A_offd_i[i1]; jj1< A_offd_i[i1+1]; jj1++) |
1633: { |
1634: i2 = A_offd_j[jj1]; |
1635: if(P_marker_offd[i2] >= jj_begin_row_offd && |
1636: (sgn*A_offd_data[jj1]) < 0) |
1637: sum += A_offd_data[jj1]; |
1638: } |
1639: } |
1640: if(sum != 0) |
1641: { |
1642: distribute = A_diag_data[jj]/sum; |
1643: /* Loop over row of A for point i1 and do the distribution */ |
1644: for(jj1 = A_diag_i[i1]+1; jj1 < A_diag_i[i1+1]; jj1++) |
1645: { |
1646: i2 = A_diag_j[jj1]; |
1647: if(P_marker[i2] >= jj_begin_row && (sgn*A_diag_data[jj1]) < 0) |
1648: P_diag_data[P_marker[i2]] += |
1649: distribute*A_diag_data[jj1]; |
1650: if(i2 == i && (sgn*A_diag_data[jj1]) < 0) |
1651: diagonal += distribute*A_diag_data[jj1]; |
1652: } |
1653: if(num_procs > 1) |
1654: { |
1655: for(jj1 = A_offd_i[i1]; jj1 < A_offd_i[i1+1]; jj1++) |
1656: { |
1657: i2 = A_offd_j[jj1]; |
1658: if(P_marker_offd[i2] >= jj_begin_row_offd && |
1659: (sgn*A_offd_data[jj1]) < 0) |
1660: P_offd_data[P_marker_offd[i2]] += |
[...] |
1667: diagonal += A_diag_data[jj]; |
1668: } |
1669: } |
1670: /* neighbor i1 weakly influences i, accumulate a_(i,i1) into |
1671: * diagonal */ |
1672: else if (CF_marker[i1] != -3) |
1673: { |
1674: if(num_functions == 1 || dof_func[i] == dof_func[i1]) |
1675: diagonal += A_diag_data[jj]; |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►100.00+ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Path / |
Metric | Value |
---|---|
CQA speedup if no scalar integer | 1.89 |
CQA speedup if FP arith vectorized | 2.98 |
CQA speedup if fully vectorized | 8.00 |
CQA speedup if no inter-iteration dependency | NA |
CQA speedup if next bottleneck killed | 1.42 |
Bottlenecks | micro-operation queue |
Function | hypre_BoomerAMGBuildExtPIInterp.extracted |
Source | par_lr_interp.c:1221-1221,par_lr_interp.c:1609-1609,par_lr_interp.c:1612-1617,par_lr_interp.c:1621-1621,par_lr_interp.c:1624-1624,par_lr_interp.c:1627-1627,par_lr_interp.c:1630-1632,par_lr_interp.c:1635-1636,par_lr_interp.c:1640-1650,par_lr_interp.c:1653-1655,par_lr_interp.c:1659-1660,par_lr_interp.c:1667-1667,par_lr_interp.c:1672-1675 |
Source loop unroll info | NA |
Source loop unroll confidence level | NA |
Unroll/vectorization loop type | NA |
Unroll factor | NA |
CQA cycles | 28.33 |
CQA cycles if no scalar integer | 15.00 |
CQA cycles if FP arith vectorized | 9.51 |
CQA cycles if fully vectorized | 3.54 |
Front-end cycles | 28.33 |
DIV/SQRT cycles | 4.00 |
P0 cycles | 16.50 |
P1 cycles | 15.20 |
P2 cycles | 20.00 |
P3 cycles | 20.00 |
P4 cycles | 3.50 |
P5 cycles | 15.40 |
P6 cycles | 16.50 |
P7 cycles | 3.50 |
P8 cycles | 3.50 |
P9 cycles | 3.50 |
P10 cycles | 15.40 |
P11 cycles | 20.00 |
Inter-iter dependencies cycles | NA |
FE+BE cycles (UFS) | 28.63 - 28.66 |
Stall cycles (UFS) | 0.00 |
Nb insns | 164.00 |
Nb uops | 166.00 |
Nb loads | 60.00 |
Nb stores | 7.00 |
Nb stack references | 16.00 |
FLOP/cycle | 0.35 |
Nb FLOP add-sub | 3.00 |
Nb FLOP mul | 2.00 |
Nb FLOP fma | 2.00 |
Nb FLOP div | 1.00 |
Nb FLOP rcp | 0.00 |
Nb FLOP sqrt | 0.00 |
Nb FLOP rsqrt | 0.00 |
Bytes/cycle | 18.92 |
Bytes prefetched | 0.00 |
Bytes loaded | 480.00 |
Bytes stored | 56.00 |
Stride 0 | NA |
Stride 1 | NA |
Stride n | NA |
Stride unknown | NA |
Stride indirect | NA |
Vectorization ratio all | 2.08 |
Vectorization ratio load | 0.00 |
Vectorization ratio store | 0.00 |
Vectorization ratio mul | 0.00 |
Vectorization ratio add_sub | 0.00 |
Vectorization ratio fma | 0.00 |
Vectorization ratio div_sqrt | 0.00 |
Vectorization ratio other | 3.45 |
Vector-efficiency ratio all | 12.76 |
Vector-efficiency ratio load | 12.50 |
Vector-efficiency ratio store | 12.50 |
Vector-efficiency ratio mul | 12.50 |
Vector-efficiency ratio add_sub | 12.50 |
Vector-efficiency ratio fma | 12.50 |
Vector-efficiency ratio div_sqrt | 12.50 |
Vector-efficiency ratio other | 12.93 |
Metric | Value |
---|---|
CQA speedup if no scalar integer | 1.89 |
CQA speedup if FP arith vectorized | 2.98 |
CQA speedup if fully vectorized | 8.00 |
CQA speedup if no inter-iteration dependency | NA |
CQA speedup if next bottleneck killed | 1.42 |
Bottlenecks | micro-operation queue |
Function | hypre_BoomerAMGBuildExtPIInterp.extracted |
Source | par_lr_interp.c:1221-1221,par_lr_interp.c:1609-1609,par_lr_interp.c:1612-1617,par_lr_interp.c:1621-1621,par_lr_interp.c:1624-1624,par_lr_interp.c:1627-1627,par_lr_interp.c:1630-1632,par_lr_interp.c:1635-1636,par_lr_interp.c:1640-1650,par_lr_interp.c:1653-1655,par_lr_interp.c:1659-1660,par_lr_interp.c:1667-1667,par_lr_interp.c:1672-1675 |
Source loop unroll info | NA |
Source loop unroll confidence level | NA |
Unroll/vectorization loop type | NA |
Unroll factor | NA |
CQA cycles | 28.33 |
CQA cycles if no scalar integer | 15.00 |
CQA cycles if FP arith vectorized | 9.51 |
CQA cycles if fully vectorized | 3.54 |
Front-end cycles | 28.33 |
DIV/SQRT cycles | 4.00 |
P0 cycles | 16.50 |
P1 cycles | 15.20 |
P2 cycles | 20.00 |
P3 cycles | 20.00 |
P4 cycles | 3.50 |
P5 cycles | 15.40 |
P6 cycles | 16.50 |
P7 cycles | 3.50 |
P8 cycles | 3.50 |
P9 cycles | 3.50 |
P10 cycles | 15.40 |
P11 cycles | 20.00 |
Inter-iter dependencies cycles | NA |
FE+BE cycles (UFS) | 28.63 - 28.66 |
Stall cycles (UFS) | 0.00 |
Nb insns | 164.00 |
Nb uops | 166.00 |
Nb loads | 60.00 |
Nb stores | 7.00 |
Nb stack references | 16.00 |
FLOP/cycle | 0.35 |
Nb FLOP add-sub | 3.00 |
Nb FLOP mul | 2.00 |
Nb FLOP fma | 2.00 |
Nb FLOP div | 1.00 |
Nb FLOP rcp | 0.00 |
Nb FLOP sqrt | 0.00 |
Nb FLOP rsqrt | 0.00 |
Bytes/cycle | 18.92 |
Bytes prefetched | 0.00 |
Bytes loaded | 480.00 |
Bytes stored | 56.00 |
Stride 0 | NA |
Stride 1 | NA |
Stride n | NA |
Stride unknown | NA |
Stride indirect | NA |
Vectorization ratio all | 2.08 |
Vectorization ratio load | 0.00 |
Vectorization ratio store | 0.00 |
Vectorization ratio mul | 0.00 |
Vectorization ratio add_sub | 0.00 |
Vectorization ratio fma | 0.00 |
Vectorization ratio div_sqrt | 0.00 |
Vectorization ratio other | 3.45 |
Vector-efficiency ratio all | 12.76 |
Vector-efficiency ratio load | 12.50 |
Vector-efficiency ratio store | 12.50 |
Vector-efficiency ratio mul | 12.50 |
Vector-efficiency ratio add_sub | 12.50 |
Vector-efficiency ratio fma | 12.50 |
Vector-efficiency ratio div_sqrt | 12.50 |
Vector-efficiency ratio other | 12.93 |
Path / |
Function | hypre_BoomerAMGBuildExtPIInterp.extracted |
Source file and lines | par_lr_interp.c:1221-1675 |
Module | exec |
nb instructions | 164 |
nb uops | 166 |
loop length | 746 |
used x86 registers | 13 |
used mmx registers | 0 |
used xmm registers | 7 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 16 |
ADD-SUB / MUL ratio | 1.50 |
micro-operation queue | 28.33 cycles |
front end | 28.33 cycles |
Port | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 16.50 | 15.20 | 20.00 | 20.00 | 3.50 | 15.40 | 16.50 | 3.50 | 3.50 | 3.50 | 15.40 | 20.00 |
cycles | 16.50 | 15.20 | 20.00 | 20.00 | 3.50 | 15.40 | 16.50 | 3.50 | 3.50 | 3.50 | 15.40 | 20.00 |
Cycles executing div or sqrt instructions | 4.00 |
FE+BE cycles | 28.63-28.66 |
Stall cycles | 0.00 |
Front-end | 28.33 |
Dispatch | 20.00 |
DIV/SQRT | 4.00 |
Overall L1 | 28.33 |
all | 3% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 4% |
all | 0% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | 0% |
div/sqrt | 0% |
other | 0% |
all | 2% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | 0% |
div/sqrt | 0% |
other | 3% |
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 13% |
all | 12% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | 12% |
div/sqrt | 12% |
other | 12% |
all | 12% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | 12% |
div/sqrt | 12% |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
MOV -0x98(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD (%RCX,%RAX,8),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x50(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RDX,%R9,8),%XMM5,%XMM5 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM5,(%RCX,%RAX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
INC %R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP -0x68(%RBP),%R9 | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 4525a2 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1382> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%RBX,%R9,8),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R13,%R10,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDI,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 452650 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1430> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP -0x80(%RBP),%RAX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JNE 452820 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1600> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x188(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX,%R10,8),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPXOR %XMM5,%XMM5,%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x50(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VUCOMISD (%RDX,%R15,8),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R10,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x8(%RCX,%R10,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SETBE %AL | 2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 1-2 | 1 |
LEA -0x1(%RAX,%RAX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x1(%R15),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RCX,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R15,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4526ff <hypre_BoomerAMGBuildExtPIInterp.extracted+0x14df> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VCVTSI2SDQ -0xa8(%RBP),%XMM9,%XMM6 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 0.50 |
NOT %R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RCX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMP $0x4,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 452865 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1645> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %R15,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 452958 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1738> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xc0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xe8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP $0x2,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 452770 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1550> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x168(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xf0(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX,%RDX,8),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX,%RDX,8),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 452770 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1550> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VCVTSI2SDQ -0xa8(%RBP),%XMM9,%XMM6 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 0.50 |
CMP $0x4,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JAE 4529ac <hypre_BoomerAMGBuildExtPIInterp.extracted+0x178c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xe0(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 452a9c <hypre_BoomerAMGBuildExtPIInterp.extracted+0x187c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD %XMM0,%XMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD (%RAX,%R9,8),%XMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JE 452859 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1639> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VDIVSD %XMM5,%XMM6,%XMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 13-15 | 4 |
CMP %RCX,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R8,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JGE 452aff <hypre_BoomerAMGBuildExtPIInterp.extracted+0x18df> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VCVTSI2SDQ -0xa8(%RBP),%XMM9,%XMM6 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 0.50 |
MOV -0x58(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %EDX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %ECX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
TEST $0x1,%AL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 452af6 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x18d6> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x8(%RBX,%RDX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R13,%RAX,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDI,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 4527ed <hypre_BoomerAMGBuildExtPIInterp.extracted+0x15cd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x50(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x58(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x8(%R10,%R12,8),%XMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD %XMM6,%XMM7,%XMM8 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VUCOMISD %XMM0,%XMM8 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JAE 4527ed <hypre_BoomerAMGBuildExtPIInterp.extracted+0x15cd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x98(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VFMADD213SD (%R10,%RDX,8),%XMM5,%XMM7 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VMOVSD %XMM7,(%R10,%RDX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %R15,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 452aee <hypre_BoomerAMGBuildExtPIInterp.extracted+0x18ce> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x58(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x8(%RAX,%RDX,8),%XMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD %XMM6,%XMM7,%XMM8 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD213SD %XMM4,%XMM5,%XMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VCMPSD $0x1,%XMM0,%XMM8,%K1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVSD %XMM7,%XMM4,%XMM4{%K1} | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
JMP 452af2 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x18d2> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
CMPQ $-0x3,(%R11,%R10,8) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 45266e <hypre_BoomerAMGBuildExtPIInterp.extracted+0x144e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMPQ $0x1,-0x180(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 45284a <hypre_BoomerAMGBuildExtPIInterp.extracted+0x162a> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x178(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX,%R15,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP (%RCX,%R10,8),%RAX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JNE 45266e <hypre_BoomerAMGBuildExtPIInterp.extracted+0x144e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RAX,%R9,8),%XMM4,%XMM4 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
JMP 45266e <hypre_BoomerAMGBuildExtPIInterp.extracted+0x144e> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
VADDSD %XMM4,%XMM6,%XMM4 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOV %R8,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 45266e <hypre_BoomerAMGBuildExtPIInterp.extracted+0x144e> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R15,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x2,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV -0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x20(,%RAX,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4528ab <hypre_BoomerAMGBuildExtPIInterp.extracted+0x168b> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV -0x58(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%RDX,%RAX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R8,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 45299a <hypre_BoomerAMGBuildExtPIInterp.extracted+0x177a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
SHR $0x2,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
LEA 0x18(,%R12,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4529cd <hypre_BoomerAMGBuildExtPIInterp.extracted+0x17ad> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD %RAX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x30(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 452abc <hypre_BoomerAMGBuildExtPIInterp.extracted+0x189c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV -0x58(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x2(%RDX),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x2(%RCX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 452b79 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1959> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMPQ $0x2,-0xe8(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JL 45266e <hypre_BoomerAMGBuildExtPIInterp.extracted+0x144e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x168(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xf0(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX,%RDX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RCX,%RDX,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RAX,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 45266e <hypre_BoomerAMGBuildExtPIInterp.extracted+0x144e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VCVTSI2SDQ -0xa8(%RBP),%XMM9,%XMM6 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 0.50 |
CMP $0x4,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 452c4b <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1a2b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R10,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %R10,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 452d78 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1b58> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xf8(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R8,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 45266e <hypre_BoomerAMGBuildExtPIInterp.extracted+0x144e> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R10,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x2,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
LEA 0x18(,%RAX,8),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 452c6d <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1a4d> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x30(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xf8(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R8,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 452d9c <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1b7c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
Function | hypre_BoomerAMGBuildExtPIInterp.extracted |
Source file and lines | par_lr_interp.c:1221-1675 |
Module | exec |
nb instructions | 164 |
nb uops | 166 |
loop length | 746 |
used x86 registers | 13 |
used mmx registers | 0 |
used xmm registers | 7 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 16 |
ADD-SUB / MUL ratio | 1.50 |
micro-operation queue | 28.33 cycles |
front end | 28.33 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 16.50 | 15.20 | 20.00 | 20.00 | 3.50 | 15.40 | 16.50 | 3.50 | 3.50 | 3.50 | 15.40 | 20.00 |
cycles | 16.50 | 15.20 | 20.00 | 20.00 | 3.50 | 15.40 | 16.50 | 3.50 | 3.50 | 3.50 | 15.40 | 20.00 |
Cycles executing div or sqrt instructions | 4.00 |
FE+BE cycles | 28.63-28.66 |
Stall cycles | 0.00 |
Front-end | 28.33 |
Dispatch | 20.00 |
DIV/SQRT | 4.00 |
Overall L1 | 28.33 |
all | 3% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 4% |
all | 0% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | 0% |
div/sqrt | 0% |
other | 0% |
all | 2% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | 0% |
div/sqrt | 0% |
other | 3% |
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 13% |
all | 12% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | 12% |
div/sqrt | 12% |
other | 12% |
all | 12% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | 12% |
div/sqrt | 12% |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
MOV -0x98(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD (%RCX,%RAX,8),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x50(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RDX,%R9,8),%XMM5,%XMM5 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM5,(%RCX,%RAX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
INC %R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP -0x68(%RBP),%R9 | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 4525a2 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1382> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%RBX,%R9,8),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R13,%R10,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDI,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 452650 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1430> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP -0x80(%RBP),%RAX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JNE 452820 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1600> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x188(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX,%R10,8),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPXOR %XMM5,%XMM5,%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x50(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VUCOMISD (%RDX,%R15,8),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R10,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x8(%RCX,%R10,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SETBE %AL | 2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 1-2 | 1 |
LEA -0x1(%RAX,%RAX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x1(%R15),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RCX,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R15,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4526ff <hypre_BoomerAMGBuildExtPIInterp.extracted+0x14df> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VCVTSI2SDQ -0xa8(%RBP),%XMM9,%XMM6 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 0.50 |
NOT %R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RCX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMP $0x4,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 452865 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1645> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %R15,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 452958 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1738> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xc0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xe8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP $0x2,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 452770 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1550> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x168(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xf0(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX,%RDX,8),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX,%RDX,8),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 452770 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1550> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VCVTSI2SDQ -0xa8(%RBP),%XMM9,%XMM6 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 0.50 |
CMP $0x4,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JAE 4529ac <hypre_BoomerAMGBuildExtPIInterp.extracted+0x178c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xe0(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 452a9c <hypre_BoomerAMGBuildExtPIInterp.extracted+0x187c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD %XMM0,%XMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD (%RAX,%R9,8),%XMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JE 452859 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1639> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VDIVSD %XMM5,%XMM6,%XMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 13-15 | 4 |
CMP %RCX,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R8,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JGE 452aff <hypre_BoomerAMGBuildExtPIInterp.extracted+0x18df> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VCVTSI2SDQ -0xa8(%RBP),%XMM9,%XMM6 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 0.50 |
MOV -0x58(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %EDX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %ECX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
TEST $0x1,%AL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 452af6 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x18d6> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x8(%RBX,%RDX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R13,%RAX,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDI,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 4527ed <hypre_BoomerAMGBuildExtPIInterp.extracted+0x15cd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x50(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x58(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x8(%R10,%R12,8),%XMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD %XMM6,%XMM7,%XMM8 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VUCOMISD %XMM0,%XMM8 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JAE 4527ed <hypre_BoomerAMGBuildExtPIInterp.extracted+0x15cd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x98(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VFMADD213SD (%R10,%RDX,8),%XMM5,%XMM7 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VMOVSD %XMM7,(%R10,%RDX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %R15,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 452aee <hypre_BoomerAMGBuildExtPIInterp.extracted+0x18ce> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x58(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x8(%RAX,%RDX,8),%XMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD %XMM6,%XMM7,%XMM8 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD213SD %XMM4,%XMM5,%XMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VCMPSD $0x1,%XMM0,%XMM8,%K1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVSD %XMM7,%XMM4,%XMM4{%K1} | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
JMP 452af2 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x18d2> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
CMPQ $-0x3,(%R11,%R10,8) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 45266e <hypre_BoomerAMGBuildExtPIInterp.extracted+0x144e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMPQ $0x1,-0x180(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 45284a <hypre_BoomerAMGBuildExtPIInterp.extracted+0x162a> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x178(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX,%R15,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP (%RCX,%R10,8),%RAX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JNE 45266e <hypre_BoomerAMGBuildExtPIInterp.extracted+0x144e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RAX,%R9,8),%XMM4,%XMM4 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
JMP 45266e <hypre_BoomerAMGBuildExtPIInterp.extracted+0x144e> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
VADDSD %XMM4,%XMM6,%XMM4 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOV %R8,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 45266e <hypre_BoomerAMGBuildExtPIInterp.extracted+0x144e> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R15,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x2,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV -0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x20(,%RAX,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4528ab <hypre_BoomerAMGBuildExtPIInterp.extracted+0x168b> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV -0x58(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%RDX,%RAX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R8,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 45299a <hypre_BoomerAMGBuildExtPIInterp.extracted+0x177a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
SHR $0x2,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
LEA 0x18(,%R12,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4529cd <hypre_BoomerAMGBuildExtPIInterp.extracted+0x17ad> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD %RAX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x30(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 452abc <hypre_BoomerAMGBuildExtPIInterp.extracted+0x189c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV -0x58(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x2(%RDX),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x2(%RCX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 452b79 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1959> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMPQ $0x2,-0xe8(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JL 45266e <hypre_BoomerAMGBuildExtPIInterp.extracted+0x144e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x168(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xf0(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX,%RDX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RCX,%RDX,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RAX,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 45266e <hypre_BoomerAMGBuildExtPIInterp.extracted+0x144e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VCVTSI2SDQ -0xa8(%RBP),%XMM9,%XMM6 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 0.50 |
CMP $0x4,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 452c4b <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1a2b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R10,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %R10,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 452d78 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1b58> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xf8(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R8,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 45266e <hypre_BoomerAMGBuildExtPIInterp.extracted+0x144e> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R10,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x2,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
LEA 0x18(,%RAX,8),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 452c6d <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1a4d> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x30(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xf8(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R8,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 452d9c <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1b7c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |