Loop Id: 675 | Module: exec | Source: TinyVectorOps.h:59-59 [...] | Coverage: 0.03% |
---|
Loop Id: 675 | Module: exec | Source: TinyVectorOps.h:59-59 [...] | Coverage: 0.03% |
---|
0x438420 MOV 0x78(%RSP),%RDX |
0x438425 INC %RDX |
0x438428 MOV 0x128(%RSP),%R15 |
0x438430 MOVSXD 0x30(%R15),%RAX |
0x438434 CMP %RAX,%RDX |
0x438437 JGE 43957b |
0x43843d MOV 0x2e8(%R15),%RAX |
0x438444 MOV 0x300(%R15),%RCX |
0x43844b MOV (%RAX,%RDX,8),%R11 |
0x43844f LEA (%RDX,%RDX,2),%RAX |
0x438453 MOV (%RCX,%RAX,8),%R12 |
0x438457 MOV 0x318(%R15),%RAX |
0x43845e MOV %RDX,0x78(%RSP) |
0x438463 LEA (,%RDX,8),%RCX |
0x43846b LEA (%RCX,%RCX,4),%RCX |
0x43846f MOV 0x18(%RAX,%RCX,1),%RAX |
0x438474 MOV %RAX,0x18(%RSP) |
0x438479 MOV 0x330(%R15),%RAX |
0x438480 MOV 0x18(%RAX,%RCX,1),%R14 |
0x438485 VMOVUPD 0x1f0(%RSP),%XMM0 |
0x43848e VSUBSD 0x78(%R11),%XMM0,%XMM0 |
0x438494 MOVSXD 0x40(%R15),%RDX |
0x438498 VMOVSD 0x98(%R11),%XMM1 |
0x4384a1 VMOVUPD %XMM1,0x230(%RSP) |
0x4384aa VMULSD %XMM0,%XMM1,%XMM8 |
0x4384ae MOV 0x88(%R11),%ESI |
0x4384b5 DEC %ESI |
0x4384b7 VROUNDSD $0x9,%XMM8,%XMM8,%XMM9 |
0x4384bd VCVTTSD2SI %XMM9,%EAX |
0x4384c2 MOV %EAX,%ECX |
0x4384c4 SAR $0x1f,%ECX |
0x4384c7 ANDN %EAX,%ECX,%EAX |
0x4384cc CMP %EAX,%ESI |
0x4384ce VMOVSD 0x28(%R11),%XMM2 |
0x4384d4 VMOVHPD 0x50(%R11),%XMM2,%XMM2 |
0x4384da VMOVUPD 0x200(%RSP),%XMM0 |
0x4384e3 VSUBPD %XMM2,%XMM0,%XMM2 |
0x4384e7 VMOVSD 0x48(%R11),%XMM1 |
0x4384ed VMOVSD 0x70(%R11),%XMM0 |
0x4384f3 VMOVUPD %XMM0,0x220(%RSP) |
0x4384fc VMOVUPD %XMM1,0x210(%RSP) |
0x438505 VUNPCKLPD %XMM0,%XMM1,%XMM3 |
0x438509 VMULPD %XMM2,%XMM3,%XMM2 |
0x43850d VRNDSCALEPD $0x9,%XMM2,%XMM18 |
0x438514 VMOVD 0x38(%R11),%XMM3 |
0x43851a VPINSRD $0x1,0x60(%R11),%XMM3,%XMM19 |
0x438522 VSUBPD %XMM18,%XMM2,%XMM2 |
0x438528 VMOVSD 0x597b8(%RIP),%XMM10 |
0x438530 VMULSD %XMM2,%XMM10,%XMM3 |
0x438534 VMOVSD 0x55ad4(%RIP),%XMM12 |
0x43853c VSUBSD %XMM3,%XMM12,%XMM4 |
0x438540 VMULPD %XMM2,%XMM2,%XMM5 |
0x438544 VMOVDDUP %XMM2,%XMM6 |
0x438548 VMOVUPD 0x1e0(%RSP),%XMM0 |
0x438551 VBLENDPD $0x1,%XMM4,%XMM0,%XMM4 |
0x438557 VMULPD %XMM4,%XMM6,%XMM4 |
0x43855b VMOVUPD 0x59eed(%RIP),%XMM11 |
0x438563 VADDPD %XMM4,%XMM11,%XMM6 |
0x438567 VUNPCKLPD %XMM5,%XMM2,%XMM7 |
0x43856b VMOVUPD 0x59eed(%RIP),%XMM13 |
0x438573 VFMADD213PD %XMM13,%XMM6,%XMM7 |
0x438578 VMOVUPD %XMM7,0x260(%RSP) |
0x438581 VMOVAPD %XMM2,%XMM6 |
0x438585 VMOVSD 0x55aeb(%RIP),%XMM14 |
0x43858d VFMADD213SD %XMM12,%XMM14,%XMM6 |
0x438592 VFMADD213SD %XMM12,%XMM2,%XMM6 |
0x438597 VFMADD213SD %XMM10,%XMM2,%XMM6 |
0x43859c VMOVSD %XMM6,0x270(%RSP) |
0x4385a5 VMULSD %XMM5,%XMM3,%XMM3 |
0x4385a9 VMOVSD %XMM3,0x278(%RSP) |
0x4385b2 VMOVAPD %XMM2,%XMM3 |
0x4385b6 VMOVSD 0x55a6a(%RIP),%XMM1 |
0x4385be VFMADD213SD %XMM1,%XMM14,%XMM3 |
0x4385c3 VFMADD213SD %XMM14,%XMM2,%XMM3 |
0x4385c8 VMOVSD %XMM3,0x1c0(%RSP) |
0x4385d1 VMOVAPD %XMM2,%XMM3 |
0x4385d5 VMOVSD 0x5971b(%RIP),%XMM15 |
0x4385dd VMOVSD 0x55a79(%RIP),%XMM16 |
0x4385e7 VFMADD213SD %XMM16,%XMM15,%XMM3 |
0x4385ed VMULSD %XMM2,%XMM3,%XMM3 |
0x4385f1 VMOVSD %XMM3,0x1c8(%RSP) |
0x4385fa VMOVAPD %XMM2,%XMM3 |
0x4385fe VFMSUB213SD %XMM1,%XMM15,%XMM3 |
0x438603 VFNMADD213SD %XMM12,%XMM2,%XMM3 |
0x438608 VMOVSD %XMM3,0x1d0(%RSP) |
0x438611 VPERMILPD $0x1,%XMM4,%XMM3 |
0x438617 VMULSD %XMM2,%XMM3,%XMM3 |
0x43861b VMOVSD %XMM3,0x1d8(%RSP) |
0x438624 VSUBSD %XMM2,%XMM1,%XMM3 |
0x438628 VMOVSD %XMM3,0x180(%RSP) |
0x438631 VMOVAPD %XMM2,%XMM3 |
0x438635 VMOVSD 0x58939(%RIP),%XMM17 |
0x43863f VFMADD213SD %XMM16,%XMM17,%XMM3 |
0x438645 VMOVSD %XMM3,0x188(%RSP) |
0x43864e CMOVGE %EAX,%ESI |
0x438651 VMOVAPD %XMM2,%XMM3 |
0x438655 VFNMADD213SD %XMM1,%XMM17,%XMM3 |
0x43865b VMOVSD %XMM3,0x190(%RSP) |
0x438664 VMOVLPD %XMM2,0x198(%RSP) |
0x43866d VPERMILPD $0x1,%XMM2,%XMM3 |
0x438673 VMULSD %XMM3,%XMM10,%XMM4 |
0x438677 VSUBSD %XMM4,%XMM12,%XMM5 |
0x43867b VMULSD %XMM3,%XMM3,%XMM6 |
0x43867f VPERMILPD $0x3,%XMM2,%XMM7 |
0x438685 VBLENDPD $0x1,%XMM5,%XMM0,%XMM5 |
0x43868b VMULPD %XMM5,%XMM7,%XMM5 |
0x43868f VADDPD %XMM5,%XMM11,%XMM7 |
0x438693 VSHUFPD $0x1,%XMM6,%XMM2,%XMM0 |
0x438698 VFMADD213PD %XMM13,%XMM7,%XMM0 |
0x43869d VMOVUPD %XMM0,0x240(%RSP) |
0x4386a6 VMOVAPD %XMM3,%XMM0 |
0x4386aa VFMADD213SD %XMM12,%XMM14,%XMM0 |
0x4386af VFMADD213SD %XMM12,%XMM3,%XMM0 |
0x4386b4 VFMADD213SD %XMM10,%XMM3,%XMM0 |
0x4386b9 VMOVSD %XMM0,0x250(%RSP) |
0x4386c2 VMULSD %XMM6,%XMM4,%XMM0 |
0x4386c6 VMOVSD %XMM0,0x258(%RSP) |
0x4386cf VMOVAPD %XMM3,%XMM0 |
0x4386d3 VFMADD213SD %XMM1,%XMM14,%XMM0 |
0x4386d8 VFMADD213SD %XMM14,%XMM3,%XMM0 |
0x4386dd VMOVSD %XMM0,0x1a0(%RSP) |
0x4386e6 VMOVAPD %XMM3,%XMM0 |
0x4386ea VFMADD213SD %XMM16,%XMM15,%XMM0 |
0x4386f0 VMULSD %XMM3,%XMM0,%XMM0 |
0x4386f4 VMOVSD %XMM0,0x1a8(%RSP) |
0x4386fd VMOVAPD %XMM3,%XMM0 |
0x438701 VFMSUB213SD %XMM1,%XMM15,%XMM0 |
0x438706 VFNMADD213SD %XMM12,%XMM3,%XMM0 |
0x43870b VMOVSD %XMM0,0x1b0(%RSP) |
0x438714 VMULPD %XMM2,%XMM5,%XMM0 |
0x438718 VMOVHPD %XMM0,0x1b8(%RSP) |
0x438721 VSUBSD %XMM3,%XMM1,%XMM0 |
0x438725 VMOVSD %XMM0,0x160(%RSP) |
0x43872e VMOVAPD %XMM3,%XMM0 |
0x438732 VFMADD213SD %XMM16,%XMM17,%XMM0 |
0x438738 VMOVSD %XMM0,0x168(%RSP) |
0x438741 VFNMADD213SD %XMM1,%XMM17,%XMM3 |
0x438747 VMOVSD %XMM3,0x170(%RSP) |
0x438750 VMOVHPD %XMM2,0x178(%RSP) |
0x438759 MOVSXD 0xe8(%R11),%RBX |
0x438760 LEA (%RBX,%RBX,1),%RCX |
0x438764 LEA (,%RBX,4),%R8 |
0x43876c VSUBSD %XMM9,%XMM8,%XMM14 |
0x438771 VMULSD %XMM12,%XMM14,%XMM13 |
0x438776 VADDSD 0x558b2(%RIP),%XMM13,%XMM15 |
0x43877e VMULSD %XMM14,%XMM14,%XMM17 |
0x438784 VFMADD213SD 0x59562(%RIP),%XMM17,%XMM15 |
0x43878e VMOVDQU64 0x10(%R11),%XMM16 |
0x438795 MOV 0x20(%R11),%RDI |
0x438799 LEA (%RBX,%RBX,2),%R9 |
0x43879d LEA (%RBX,%RBX,4),%R10 |
0x4387a1 MOV %RDX,%RAX |
0x4387a4 MOV %RDX,0x10(%RSP) |
0x4387a9 TEST %RDX,%RDX |
0x4387ac MOV %RCX,0x48(%RSP) |
0x4387b1 MOV %R8,0xa8(%RSP) |
0x4387b9 MOV %R10,0x40(%RSP) |
0x4387be MOV %R9,0x38(%RSP) |
0x4387c3 JE 438969 |
0x4387c9 LEA (%R14,%R10,8),%RAX |
0x4387cd MOV %RAX,0x280(%RSP) |
0x4387d5 LEA (%R14,%R8,8),%RAX |
0x4387d9 MOV %RAX,0x30(%RSP) |
0x4387de LEA (%R14,%R9,8),%RAX |
0x4387e2 MOV %RAX,0xa0(%RSP) |
0x4387ea LEA (%R14,%RCX,8),%RAX |
0x4387ee MOV %RAX,0x98(%RSP) |
0x4387f6 LEA (%R14,%RBX,8),%RAX |
0x4387fa MOV %RAX,0x90(%RSP) |
0x438802 MOV 0x18(%RSP),%R15 |
0x438807 LEA (%R15,%RCX,8),%RAX |
0x43880b MOV %RAX,0x88(%RSP) |
0x438813 LEA (%R15,%RBX,8),%RAX |
0x438817 MOV %RAX,0x80(%RSP) |
0x43881f MOV 0x10(%RSP),%RAX |
0x438824 LEA (,%RAX,8),%R13 |
0x43882c MOV %RDI,0x28(%RSP) |
0x438831 MOV %R12,%RDI |
0x438834 MOV %ESI,0x20(%RSP) |
0x438838 XOR %ESI,%ESI |
0x43883a MOV %R13,%RDX |
0x43883d VMOVUPD %XMM18,0x60(%RSP) |
0x438845 VMOVDQU64 %XMM19,0x50(%RSP) |
0x43884d VMOVUPD %XMM13,0xf0(%RSP) |
0x438856 VMOVUPD %XMM14,0xe0(%RSP) |
0x43885f VMOVUPD %XMM15,0xd0(%RSP) |
0x438868 VMOVDQU64 %XMM16,0xc0(%RSP) |
0x438870 VMOVSD %XMM17,0xb8(%RSP) |
0x438878 MOV %R11,0xb0(%RSP) |
0x438880 VZEROUPPER |
0x438883 CALL 47ebf0 <_intel_fast_memset> |
0x438888 MOV %R15,%RDI |
0x43888b XOR %ESI,%ESI |
0x43888d MOV %R13,%RDX |
0x438890 CALL 47ebf0 <_intel_fast_memset> |
0x438895 MOV 0x80(%RSP),%RDI |
0x43889d XOR %ESI,%ESI |
0x43889f MOV %R13,%RDX |
0x4388a2 CALL 47ebf0 <_intel_fast_memset> |
0x4388a7 MOV 0x88(%RSP),%RDI |
0x4388af XOR %ESI,%ESI |
0x4388b1 MOV %R13,%RDX |
0x4388b4 CALL 47ebf0 <_intel_fast_memset> |
0x4388b9 MOV %R14,%RDI |
0x4388bc XOR %ESI,%ESI |
0x4388be MOV %R13,%RDX |
0x4388c1 CALL 47ebf0 <_intel_fast_memset> |
0x4388c6 MOV 0x90(%RSP),%RDI |
0x4388ce XOR %ESI,%ESI |
0x4388d0 MOV %R13,%RDX |
0x4388d3 CALL 47ebf0 <_intel_fast_memset> |
0x4388d8 MOV 0x98(%RSP),%RDI |
0x4388e0 XOR %ESI,%ESI |
0x4388e2 MOV %R13,%RDX |
0x4388e5 CALL 47ebf0 <_intel_fast_memset> |
0x4388ea MOV 0xa0(%RSP),%RDI |
0x4388f2 XOR %ESI,%ESI |
0x4388f4 MOV %R13,%RDX |
0x4388f7 CALL 47ebf0 <_intel_fast_memset> |
0x4388fc MOV 0x30(%RSP),%RDI |
0x438901 XOR %ESI,%ESI |
0x438903 MOV %R13,%RDX |
0x438906 CALL 47ebf0 <_intel_fast_memset> |
0x43890b MOV 0x280(%RSP),%RDI |
0x438913 XOR %ESI,%ESI |
0x438915 MOV %R13,%RDX |
0x438918 CALL 47ebf0 <_intel_fast_memset> |
0x43891d MOV 0xb0(%RSP),%R11 |
0x438925 VMOVSD 0xb8(%RSP),%XMM17 |
0x43892d VMOVDQU64 0xc0(%RSP),%XMM16 |
0x438935 MOV 0x28(%RSP),%RDI |
0x43893a VMOVUPD 0xd0(%RSP),%XMM15 |
0x438943 VMOVUPD 0xe0(%RSP),%XMM14 |
0x43894c VMOVUPD 0xf0(%RSP),%XMM13 |
0x438955 VMOVDQU64 0x50(%RSP),%XMM19 |
0x43895d VMOVUPD 0x60(%RSP),%XMM18 |
0x438965 MOV 0x20(%RSP),%ESI |
0x438969 VMOVSD 0x59377(%RIP),%XMM4 |
0x438971 VMOVAPD %XMM4,%XMM0 |
0x438975 VMOVSD 0x55693(%RIP),%XMM1 |
0x43897d VFMSUB213SD %XMM1,%XMM14,%XMM0 |
0x438982 VMOVSD 0x556ee(%RIP),%XMM2 |
0x43898a VFMSUB213SD %XMM2,%XMM14,%XMM0 |
0x43898f VFNMADD213SD %XMM4,%XMM14,%XMM0 |
0x438994 VMOVAPD %XMM14,%XMM3 |
0x438998 VFMADD213SD %XMM1,%XMM2,%XMM3 |
0x43899d VFMADD213SD %XMM1,%XMM14,%XMM3 |
0x4389a2 VFMADD213SD %XMM4,%XMM14,%XMM3 |
0x4389a7 VMOVAPD %XMM14,%XMM6 |
0x4389ab VMOVSD 0x55675(%RIP),%XMM5 |
0x4389b3 VFMADD213SD %XMM5,%XMM2,%XMM6 |
0x4389b8 VFMADD213SD %XMM2,%XMM14,%XMM6 |
0x4389bd VMOVAPD %XMM14,%XMM9 |
0x4389c2 VMOVSD 0x5932e(%RIP),%XMM2 |
0x4389ca VMOVSD 0x5568e(%RIP),%XMM7 |
0x4389d2 VFMADD213SD %XMM7,%XMM2,%XMM9 |
0x4389d7 VMOVAPD %XMM14,%XMM8 |
0x4389dc VFMSUB213SD %XMM5,%XMM2,%XMM8 |
0x4389e1 VFNMADD213SD %XMM1,%XMM14,%XMM8 |
0x4389e6 VSUBSD %XMM14,%XMM5,%XMM10 |
0x4389eb VMOVAPD %XMM14,%XMM11 |
0x4389f0 VMOVSD 0x58580(%RIP),%XMM1 |
0x4389f8 VFMADD213SD %XMM7,%XMM1,%XMM11 |
0x4389fd VMOVAPD %XMM14,%XMM12 |
0x438a02 VFNMADD213SD %XMM5,%XMM1,%XMM12 |
0x438a07 VCVTTPD2DQ %XMM18,%XMM1 |
0x438a0d VPCMPEQD %XMM2,%XMM2,%XMM2 |
0x438a11 VPADDD %XMM2,%XMM19,%XMM2 |
0x438a17 VPMAXSD 0x55de0(%RIP),%XMM1,%XMM1 |
0x438a20 VPMINSD %XMM1,%XMM2,%XMM1 |
0x438a25 MOV 0x8(%R11),%R10 |
0x438a29 MOVSXD %ESI,%RAX |
0x438a2c MOV %RDI,%R11 |
0x438a2f IMUL %RAX,%R11 |
0x438a33 VPMOVSXDQ %XMM1,%XMM1 |
0x438a38 VPMULLQ %XMM1,%XMM16,%XMM1 |
0x438a3e VPEXTRQ $0x1,%XMM1,%RCX |
0x438a44 VMULSD %XMM4,%XMM17,%XMM5 |
0x438a4a LEA (%R11,%RCX,1),%RDX |
0x438a4e VMOVQ %XMM1,%RSI |
0x438a53 ADD %RSI,%RDX |
0x438a56 MOV %RDX,0x98(%RSP) |
0x438a5e VPEXTRQ $0x1,%XMM16,0x30(%RSP) |
0x438a67 VMOVQ %XMM16,%R13 |
0x438a6d LEA (%RCX,%RSI,1),%R9 |
0x438a71 LEA 0x2(%RAX),%R8 |
0x438a75 IMUL %RDI,%R8 |
0x438a79 LEA (%R8,%RCX,1),%RDX |
0x438a7d ADD %RSI,%RDX |
0x438a80 MOV %RDX,0x90(%RSP) |
0x438a88 LEA 0x3(%RAX),%RDX |
0x438a8c IMUL %RDI,%RDX |
0x438a90 ADD %RDX,%RCX |
0x438a93 ADD %RSI,%RCX |
0x438a96 MOV %RCX,0xa0(%RSP) |
0x438a9e LEA (%RDI,%R11,1),%RCX |
0x438aa2 ADD %R9,%RCX |
0x438aa5 MOV %RCX,0x88(%RSP) |
0x438aad INC %RAX |
0x438ab0 IMUL %RDI,%RAX |
0x438ab4 MOV 0x18(%RSP),%RDI |
0x438ab9 MOV 0x10(%RSP),%RSI |
0x438abe MOV %RSI,%RCX |
0x438ac1 AND $-0x8,%RCX |
0x438ac5 MOV %RCX,0x20(%RSP) |
0x438aca VBROADCASTSD %XMM0,%ZMM29 |
0x438ad0 VBROADCASTSD %XMM15,%ZMM17 |
0x438ad6 VBROADCASTSD %XMM3,%ZMM18 |
0x438adc VBROADCASTSD %XMM14,%ZMM4 |
0x438ae2 VBROADCASTSD %XMM5,%ZMM5 |
0x438ae8 VBROADCASTSD %XMM6,%ZMM6 |
0x438aee VBROADCASTSD %XMM9,%ZMM7 |
0x438af4 VBROADCASTSD %XMM8,%ZMM8 |
0x438afa VBROADCASTSD %XMM13,%ZMM9 |
0x438b00 VBROADCASTSD %XMM10,%ZMM10 |
0x438b06 VBROADCASTSD %XMM11,%ZMM11 |
0x438b0c VBROADCASTSD %XMM12,%ZMM12 |
0x438b12 VPBROADCASTQ %RSI,%ZMM0 |
0x438b18 VMOVDQU64 %ZMM0,0x280(%RSP) |
0x438b20 ADD %R9,%RDX |
0x438b23 ADD %R9,%R8 |
0x438b26 ADD %R9,%RAX |
0x438b29 ADD %R9,%R11 |
0x438b2c MOV 0x48(%RSP),%RCX |
0x438b31 MOV %R12,%RSI |
0x438b34 LEA (%RDI,%RCX,8),%R12 |
0x438b38 LEA (%R10,%RDX,8),%RDX |
0x438b3c LEA (%R10,%R8,8),%RCX |
0x438b40 LEA (%R10,%RAX,8),%R9 |
0x438b44 MOV %R10,0x50(%RSP) |
0x438b49 LEA (%R10,%R11,8),%R8 |
0x438b4d MOV %RCX,%R10 |
0x438b50 MOV %RDX,%R11 |
0x438b53 LEA (%RDI,%RBX,8),%RDX |
0x438b57 MOV %R13,0x138(%RSP) |
0x438b5f LEA (,%R13,8),%RDI |
0x438b67 MOV %RDI,0x130(%RSP) |
0x438b6f MOV 0x30(%RSP),%RAX |
0x438b74 LEA (,%RAX,8),%RAX |
0x438b7c MOV %RAX,0xe0(%RSP) |
0x438b84 MOV %R9,%R13 |
0x438b87 LEA (,%RBX,8),%R9 |
0x438b8f XOR %EAX,%EAX |
0x438b91 MOV %RSI,0x158(%RSP) |
0x438b99 MOV 0x18(%RSP),%RCX |
0x438b9e JMP 438be5 |
(677) 0x438ba0 LEA 0x1(%RDI),%R15 |
(677) 0x438ba4 MOV 0x80(%RSP),%R11 |
(677) 0x438bac MOV 0x130(%RSP),%RAX |
(677) 0x438bb4 ADD %RAX,%R11 |
(677) 0x438bb7 MOV 0x150(%RSP),%R10 |
(677) 0x438bbf ADD %RAX,%R10 |
(677) 0x438bc2 MOV 0x148(%RSP),%R13 |
(677) 0x438bca ADD %RAX,%R13 |
(677) 0x438bcd MOV 0x140(%RSP),%R8 |
(677) 0x438bd5 ADD %RAX,%R8 |
(677) 0x438bd8 CMP $0x3,%RDI |
(677) 0x438bdc MOV %R15,%RAX |
(677) 0x438bdf JE 439200 |
(677) 0x438be5 MOV %RAX,0xf0(%RSP) |
(677) 0x438bed VMOVSD 0x180(%RSP,%RAX,8),%XMM0 |
(677) 0x438bf6 VMOVSD %XMM0,0xd0(%RSP) |
(677) 0x438bff VMOVSD 0x1c0(%RSP,%RAX,8),%XMM0 |
(677) 0x438c08 VMOVSD %XMM0,0x28(%RSP) |
(677) 0x438c0e VMOVSD 0x260(%RSP,%RAX,8),%XMM0 |
(677) 0x438c17 VMOVSD %XMM0,0xc0(%RSP) |
(677) 0x438c20 MOV 0x138(%RSP),%RDI |
(677) 0x438c28 IMUL %RAX,%RDI |
(677) 0x438c2c MOV %RDI,0xb0(%RSP) |
(677) 0x438c34 MOV %R8,0x140(%RSP) |
(677) 0x438c3c MOV %R13,0x148(%RSP) |
(677) 0x438c44 MOV %R10,0x150(%RSP) |
(677) 0x438c4c MOV %R11,0x80(%RSP) |
(677) 0x438c54 XOR %EAX,%EAX |
(677) 0x438c56 JMP 438c8d |
(678) 0x438c60 LEA 0x1(%RAX),%R15 |
(678) 0x438c64 MOV 0xe0(%RSP),%RDI |
(678) 0x438c6c ADD %RDI,%R11 |
(678) 0x438c6f ADD %RDI,%R10 |
(678) 0x438c72 ADD %RDI,%R13 |
(678) 0x438c75 ADD %RDI,%R8 |
(678) 0x438c78 CMP $0x3,%RAX |
(678) 0x438c7c MOV %R15,%RAX |
(678) 0x438c7f MOV 0xf0(%RSP),%RDI |
(678) 0x438c87 JE 438ba0 |
(678) 0x438c8d CMPL $0,0x10(%RSP) |
(678) 0x438c92 JLE 438c60 |
(678) 0x438c94 VMOVSD 0x240(%RSP,%RAX,8),%XMM0 |
(678) 0x438c9d VMULSD 0xd0(%RSP),%XMM0,%XMM28 |
(678) 0x438ca5 VMOVSD 0x28(%RSP),%XMM2 |
(678) 0x438cab VMULSD %XMM2,%XMM0,%XMM20 |
(678) 0x438cb1 VMOVSD 0x1a0(%RSP,%RAX,8),%XMM1 |
(678) 0x438cba VMOVSD 0xc0(%RSP),%XMM3 |
(678) 0x438cc3 VMULSD %XMM3,%XMM0,%XMM27 |
(678) 0x438cc9 VMULSD %XMM2,%XMM1,%XMM21 |
(678) 0x438ccf VMULSD %XMM3,%XMM1,%XMM2 |
(678) 0x438cd3 VMULSD 0x160(%RSP,%RAX,8),%XMM3,%XMM19 |
(678) 0x438cdb CMPQ $0,0x20(%RSP) |
(678) 0x438ce1 MOV %RAX,0x60(%RSP) |
(678) 0x438ce6 JE 438e90 |
(678) 0x438cec VBROADCASTSD %XMM28,%ZMM22 |
(678) 0x438cf2 VBROADCASTSD %XMM21,%ZMM23 |
(678) 0x438cf8 VBROADCASTSD %XMM20,%ZMM24 |
(678) 0x438cfe VBROADCASTSD %XMM19,%ZMM25 |
(678) 0x438d04 VBROADCASTSD %XMM2,%ZMM26 |
(678) 0x438d0a VMOVAPD %XMM27,%XMM3 |
(678) 0x438d10 VBROADCASTSD %XMM27,%ZMM27 |
(678) 0x438d16 XOR %EAX,%EAX |
(678) 0x438d18 NOPL (%RAX,%RAX,1) |
(679) 0x438d20 VMOVUPD (%R8,%RAX,8),%ZMM0 |
(679) 0x438d27 VMOVUPD (%R13,%RAX,8),%ZMM1 |
(679) 0x438d2f VMOVUPD (%R10,%RAX,8),%ZMM30 |
(679) 0x438d36 VMOVUPD (%R11,%RAX,8),%ZMM31 |
(679) 0x438d3d VMULPD %ZMM29,%ZMM0,%ZMM13 |
(679) 0x438d43 VMULPD %ZMM4,%ZMM31,%ZMM14 |
(679) 0x438d49 VFMADD231PD %ZMM17,%ZMM1,%ZMM13 |
(679) 0x438d4f VFMADD231PD %ZMM18,%ZMM30,%ZMM13 |
(679) 0x438d55 VFMADD231PD %ZMM14,%ZMM5,%ZMM13 |
(679) 0x438d5b VMULPD %ZMM6,%ZMM0,%ZMM15 |
(679) 0x438d61 VMULPD %ZMM7,%ZMM1,%ZMM16 |
(679) 0x438d67 VFMADD231PD %ZMM31,%ZMM9,%ZMM16 |
(679) 0x438d6d VFMADD231PD %ZMM8,%ZMM30,%ZMM15 |
(679) 0x438d73 VFMADD231PD %ZMM16,%ZMM4,%ZMM15 |
(679) 0x438d79 LEA (%R14,%RAX,8),%RDI |
(679) 0x438d7d VMOVUPD (%R14,%RAX,8),%ZMM16 |
(679) 0x438d84 VFMADD231PD %ZMM13,%ZMM22,%ZMM16 |
(679) 0x438d8a VMOVUPD %ZMM16,(%R14,%RAX,8) |
(679) 0x438d91 VMOVUPD (%RDI,%RBX,8),%ZMM16 |
(679) 0x438d98 VFMADD231PD %ZMM13,%ZMM23,%ZMM16 |
(679) 0x438d9e VMOVUPD %ZMM16,(%RDI,%RBX,8) |
(679) 0x438da5 LEA (%RDI,%RBX,8),%RDI |
(679) 0x438da9 VMOVUPD (%R9,%RDI,1),%ZMM16 |
(679) 0x438db0 VFMADD231PD %ZMM24,%ZMM15,%ZMM16 |
(679) 0x438db6 VMOVUPD %ZMM16,(%R9,%RDI,1) |
(679) 0x438dbd LEA (%RDI,%R9,1),%RDI |
(679) 0x438dc1 VMOVUPD (%R9,%RDI,1),%ZMM16 |
(679) 0x438dc8 VFMADD231PD %ZMM13,%ZMM25,%ZMM16 |
(679) 0x438dce VMOVUPD %ZMM16,(%R9,%RDI,1) |
(679) 0x438dd5 LEA (%RDI,%R9,1),%RDI |
(679) 0x438dd9 VMOVUPD (%R9,%RDI,1),%ZMM16 |
(679) 0x438de0 VFMADD231PD %ZMM26,%ZMM15,%ZMM16 |
(679) 0x438de6 VMOVUPD %ZMM16,(%R9,%RDI,1) |
(679) 0x438ded LEA (%RDI,%R9,1),%RDI |
(679) 0x438df1 VFMADD213PD %ZMM14,%ZMM10,%ZMM0 |
(679) 0x438df7 VFMADD231PD %ZMM1,%ZMM11,%ZMM0 |
(679) 0x438dfd VFMADD231PD %ZMM30,%ZMM12,%ZMM0 |
(679) 0x438e03 VFMADD213PD (%R9,%RDI,1),%ZMM27,%ZMM0 |
(679) 0x438e0a VMOVUPD %ZMM0,(%R9,%RDI,1) |
(679) 0x438e11 VMOVUPD (%RCX,%RAX,8),%ZMM0 |
(679) 0x438e18 VFMADD231PD %ZMM24,%ZMM13,%ZMM0 |
(679) 0x438e1e VMOVUPD %ZMM0,(%RCX,%RAX,8) |
(679) 0x438e25 VMOVUPD (%RDX,%RAX,8),%ZMM0 |
(679) 0x438e2c VFMADD231PD %ZMM26,%ZMM13,%ZMM0 |
(679) 0x438e32 VMOVUPD %ZMM0,(%RDX,%RAX,8) |
(679) 0x438e39 VFMADD213PD (%R12,%RAX,8),%ZMM27,%ZMM15 |
(679) 0x438e40 VMOVUPD %ZMM15,(%R12,%RAX,8) |
(679) 0x438e47 VFMADD213PD (%RSI,%RAX,8),%ZMM27,%ZMM13 |
(679) 0x438e4e VMOVUPD %ZMM13,(%RSI,%RAX,8) |
(679) 0x438e55 ADD $0x8,%RAX |
(679) 0x438e59 CMP 0x20(%RSP),%RAX |
(679) 0x438e5e JL 438d20 |
(678) 0x438e64 MOV 0x20(%RSP),%RAX |
(678) 0x438e69 MOV %RAX,%R15 |
(678) 0x438e6c CMP 0x10(%RSP),%RAX |
(678) 0x438e71 MOV 0x60(%RSP),%RAX |
(678) 0x438e76 VMOVAPD %XMM3,%XMM27 |
(678) 0x438e7c JE 438c60 |
(678) 0x438e82 JMP 438e93 |
(678) 0x438e90 XOR %R15D,%R15D |
(678) 0x438e93 VPBROADCASTQ %R15,%ZMM0 |
(678) 0x438e99 VPORQ 0x58f9d(%RIP),%ZMM0,%ZMM0 |
(678) 0x438ea3 VPCMPLTUQ 0x280(%RSP),%ZMM0,%K1 |
(678) 0x438eac KORTESTB %K1,%K1 |
(678) 0x438eb0 JE 438c60 |
(678) 0x438eb6 MOV 0x30(%RSP),%RAX |
(678) 0x438ebb IMUL 0x60(%RSP),%RAX |
(678) 0x438ec1 ADD 0xb0(%RSP),%RAX |
(678) 0x438ec9 MOV 0x98(%RSP),%RDI |
(678) 0x438ed1 ADD %R15,%RDI |
(678) 0x438ed4 ADD %RAX,%RDI |
(678) 0x438ed7 MOV 0x50(%RSP),%RSI |
(678) 0x438edc VMOVUPD (%RSI,%RDI,8),%ZMM0{%K1}{z} |
(678) 0x438ee3 VMOVUPD 0x500(%RSP),%ZMM25 |
(678) 0x438eeb VMOVAPD %ZMM0,%ZMM25{%K1} |
(678) 0x438ef1 MOV 0x88(%RSP),%RDI |
(678) 0x438ef9 ADD %R15,%RDI |
(678) 0x438efc ADD %RAX,%RDI |
(678) 0x438eff MOV 0x50(%RSP),%RSI |
(678) 0x438f04 VMOVUPD (%RSI,%RDI,8),%ZMM0{%K1}{z} |
(678) 0x438f0b VMOVUPD 0x540(%RSP),%ZMM16 |
(678) 0x438f13 VMOVAPD %ZMM0,%ZMM16{%K1} |
(678) 0x438f19 MOV 0x90(%RSP),%RDI |
(678) 0x438f21 ADD %R15,%RDI |
(678) 0x438f24 ADD %RAX,%RDI |
(678) 0x438f27 MOV 0x50(%RSP),%RSI |
(678) 0x438f2c VMOVUPD (%RSI,%RDI,8),%ZMM0{%K1}{z} |
(678) 0x438f33 VMOVUPD 0x580(%RSP),%ZMM15 |
(678) 0x438f3b VMOVAPD %ZMM0,%ZMM15{%K1} |
(678) 0x438f41 MOV 0xa0(%RSP),%RDI |
(678) 0x438f49 ADD %R15,%RDI |
(678) 0x438f4c ADD %RDI,%RAX |
(678) 0x438f4f MOV 0x50(%RSP),%RSI |
(678) 0x438f54 VMOVUPD (%RSI,%RAX,8),%ZMM0{%K1}{z} |
(678) 0x438f5b MOV 0x158(%RSP),%RSI |
(678) 0x438f63 VMOVUPD 0x5c0(%RSP),%ZMM1 |
(678) 0x438f6b VMOVAPD %ZMM0,%ZMM1{%K1} |
(678) 0x438f71 VMULPD %ZMM29,%ZMM25,%ZMM22 |
(678) 0x438f77 VMULPD %ZMM4,%ZMM1,%ZMM24 |
(678) 0x438f7d VFMADD231PD %ZMM17,%ZMM16,%ZMM22 |
(678) 0x438f83 VFMADD231PD %ZMM18,%ZMM15,%ZMM22 |
(678) 0x438f89 VFMADD231PD %ZMM24,%ZMM5,%ZMM22 |
(678) 0x438f8f VMOVUPD (%R14,%R15,8),%ZMM0{%K1}{z} |
(678) 0x438f96 VMULPD %ZMM6,%ZMM25,%ZMM23 |
(678) 0x438f9c VMOVUPD 0x600(%RSP),%ZMM13 |
(678) 0x438fa4 VMOVAPD %ZMM0,%ZMM13{%K1} |
(678) 0x438faa VMULPD %ZMM7,%ZMM16,%ZMM0 |
(678) 0x438fb0 VMOVUPD %ZMM1,0x5c0(%RSP) |
(678) 0x438fb8 VFMADD231PD %ZMM9,%ZMM1,%ZMM0 |
(678) 0x438fbe VFMADD231PD %ZMM8,%ZMM15,%ZMM23 |
(678) 0x438fc4 VBROADCASTSD %XMM28,%ZMM1 |
(678) 0x438fca VMOVUPD %ZMM13,0x600(%RSP) |
(678) 0x438fd2 VFMADD213PD %ZMM13,%ZMM22,%ZMM1 |
(678) 0x438fd8 VMOVUPD %ZMM1,(%R14,%R15,8){%K1} |
(678) 0x438fdf LEA (%R15,%RBX,1),%RAX |
(678) 0x438fe3 MOV %RAX,0xb8(%RSP) |
(678) 0x438feb VMOVUPD (%R14,%RAX,8),%ZMM1{%K1}{z} |
(678) 0x438ff2 VFMADD231PD %ZMM0,%ZMM4,%ZMM23 |
(678) 0x438ff8 VMOVUPD 0x640(%RSP),%ZMM13 |
(678) 0x439000 VMOVAPD %ZMM1,%ZMM13{%K1} |
(678) 0x439006 VBROADCASTSD %XMM21,%ZMM0 |
(678) 0x43900c VMOVUPD %ZMM13,0x640(%RSP) |
(678) 0x439014 VFMADD213PD %ZMM13,%ZMM22,%ZMM0 |
(678) 0x43901a VMOVUPD %ZMM0,(%R14,%RAX,8){%K1} |
(678) 0x439021 VBROADCASTSD %XMM20,%ZMM0 |
(678) 0x439027 MOV 0x48(%RSP),%RAX |
(678) 0x43902c LEA (%RAX,%R15,1),%RAX |
(678) 0x439030 VMOVUPD (%R14,%RAX,8),%ZMM1{%K1}{z} |
(678) 0x439037 VMOVUPD 0x680(%RSP),%ZMM13 |
(678) 0x43903f VMOVAPD %ZMM1,%ZMM13{%K1} |
(678) 0x439045 VMOVAPD %ZMM0,%ZMM1 |
(678) 0x43904b VMOVUPD %ZMM13,0x680(%RSP) |
(678) 0x439053 VFMADD213PD %ZMM13,%ZMM23,%ZMM1 |
(678) 0x439059 VMOVUPD %ZMM1,(%R14,%RAX,8){%K1} |
(678) 0x439060 MOV 0x38(%RSP),%RDI |
(678) 0x439065 LEA (%RDI,%R15,1),%RDI |
(678) 0x439069 VMOVUPD (%R14,%RDI,8),%ZMM1{%K1}{z} |
(678) 0x439070 VMOVUPD 0x6c0(%RSP),%ZMM13 |
(678) 0x439078 VMOVAPD %ZMM1,%ZMM13{%K1} |
(678) 0x43907e VBROADCASTSD %XMM19,%ZMM1 |
(678) 0x439084 VMOVUPD %ZMM13,0x6c0(%RSP) |
(678) 0x43908c VFMADD213PD %ZMM13,%ZMM22,%ZMM1 |
(678) 0x439092 VMOVUPD %ZMM1,(%R14,%RDI,8){%K1} |
(678) 0x439099 VBROADCASTSD %XMM2,%ZMM1 |
(678) 0x43909f MOV 0xa8(%RSP),%RDI |
(678) 0x4390a7 LEA (%RDI,%R15,1),%RDI |
(678) 0x4390ab VMOVUPD (%R14,%RDI,8),%ZMM13{%K1}{z} |
(678) 0x4390b2 VMOVUPD 0x700(%RSP),%ZMM14 |
(678) 0x4390ba VMOVAPD %ZMM13,%ZMM14{%K1} |
(678) 0x4390c0 VMOVAPD %ZMM1,%ZMM13 |
(678) 0x4390c6 VMOVUPD %ZMM14,0x700(%RSP) |
(678) 0x4390ce VFMADD213PD %ZMM14,%ZMM23,%ZMM13 |
(678) 0x4390d4 VMOVUPD %ZMM13,(%R14,%RDI,8){%K1} |
(678) 0x4390db MOV 0x40(%RSP),%RDI |
(678) 0x4390e0 LEA (%RDI,%R15,1),%RDI |
(678) 0x4390e4 VMOVUPD (%R14,%RDI,8),%ZMM13{%K1}{z} |
(678) 0x4390eb VMOVUPD 0x740(%RSP),%ZMM14 |
(678) 0x4390f3 VMOVAPD %ZMM13,%ZMM14{%K1} |
(678) 0x4390f9 VBROADCASTSD %XMM27,%ZMM13 |
(678) 0x4390ff VMOVUPD %ZMM25,0x500(%RSP) |
(678) 0x439107 VFMADD231PD %ZMM25,%ZMM10,%ZMM24 |
(678) 0x43910d VMOVUPD %ZMM16,0x540(%RSP) |
(678) 0x439115 VFMADD231PD %ZMM16,%ZMM11,%ZMM24 |
(678) 0x43911b VMOVUPD %ZMM15,0x580(%RSP) |
(678) 0x439123 VFMADD231PD %ZMM15,%ZMM12,%ZMM24 |
(678) 0x439129 VMOVUPD %ZMM14,0x740(%RSP) |
(678) 0x439131 VFMADD213PD %ZMM14,%ZMM13,%ZMM24 |
(678) 0x439137 VMOVUPD %ZMM24,(%R14,%RDI,8){%K1} |
(678) 0x43913e VMOVUPD (%RCX,%R15,8),%ZMM14{%K1}{z} |
(678) 0x439145 VMOVUPD 0x780(%RSP),%ZMM15 |
(678) 0x43914d VMOVAPD %ZMM14,%ZMM15{%K1} |
(678) 0x439153 VMOVUPD %ZMM15,0x780(%RSP) |
(678) 0x43915b VFMADD213PD %ZMM15,%ZMM22,%ZMM0 |
(678) 0x439161 VMOVUPD %ZMM0,(%RCX,%R15,8){%K1} |
(678) 0x439168 MOV 0xb8(%RSP),%RDI |
(678) 0x439170 VMOVUPD (%RCX,%RDI,8),%ZMM0{%K1}{z} |
(678) 0x439177 VMOVUPD 0x7c0(%RSP),%ZMM14 |
(678) 0x43917f VMOVAPD %ZMM0,%ZMM14{%K1} |
(678) 0x439185 VMOVUPD %ZMM14,0x7c0(%RSP) |
(678) 0x43918d VFMADD213PD %ZMM14,%ZMM22,%ZMM1 |
(678) 0x439193 VMOVUPD %ZMM1,(%RCX,%RDI,8){%K1} |
(678) 0x43919a VMOVUPD (%RCX,%RAX,8),%ZMM0{%K1}{z} |
(678) 0x4391a1 VMOVUPD 0x800(%RSP),%ZMM1 |
(678) 0x4391a9 VMOVAPD %ZMM0,%ZMM1{%K1} |
(678) 0x4391af VMOVUPD %ZMM1,0x800(%RSP) |
(678) 0x4391b7 VFMADD213PD %ZMM1,%ZMM13,%ZMM23 |
(678) 0x4391bd VMOVUPD %ZMM23,(%RCX,%RAX,8){%K1} |
(678) 0x4391c4 MOV 0x60(%RSP),%RAX |
(678) 0x4391c9 VMOVUPD (%RSI,%R15,8),%ZMM0{%K1}{z} |
(678) 0x4391d0 VMOVUPD 0x840(%RSP),%ZMM1 |
(678) 0x4391d8 VMOVAPD %ZMM0,%ZMM1{%K1} |
(678) 0x4391de VMOVUPD %ZMM1,0x840(%RSP) |
(678) 0x4391e6 VFMADD213PD %ZMM1,%ZMM13,%ZMM22 |
(678) 0x4391ec VMOVUPD %ZMM22,(%RSI,%R15,8){%K1} |
(678) 0x4391f3 JMP 438c60 |
0x439200 CMPL $0,0x10(%RSP) |
0x439205 JLE 438420 |
0x43920b VMOVUPD 0x210(%RSP),%XMM2 |
0x439214 VMULSD %XMM2,%XMM2,%XMM5 |
0x439218 VMOVUPD 0x220(%RSP),%XMM1 |
0x439221 VMULSD %XMM1,%XMM1,%XMM4 |
0x439225 VMOVUPD 0x230(%RSP),%XMM0 |
0x43922e VMULSD %XMM0,%XMM0,%XMM3 |
0x439232 VMULSD %XMM2,%XMM1,%XMM18 |
0x439238 VMULSD %XMM2,%XMM0,%XMM17 |
0x43923e VMULSD %XMM1,%XMM0,%XMM16 |
0x439244 MOV 0x10(%RSP),%R8 |
0x439249 AND $-0x8,%R8 |
0x43924d JE 439370 |
0x439253 VBROADCASTSD %XMM2,%ZMM6 |
0x439259 VBROADCASTSD %XMM1,%ZMM7 |
0x43925f VBROADCASTSD %XMM0,%ZMM8 |
0x439265 VBROADCASTSD %XMM5,%ZMM9 |
0x43926b VBROADCASTSD %XMM4,%ZMM10 |
0x439271 VBROADCASTSD %XMM3,%ZMM11 |
0x439277 VBROADCASTSD %XMM18,%ZMM12 |
0x43927d VBROADCASTSD %XMM17,%ZMM14 |
0x439283 VBROADCASTSD %XMM16,%ZMM15 |
0x439289 MOV 0xa8(%RSP),%R13 |
0x439291 LEA (%R14,%R13,8),%R9 |
0x439295 MOV 0x40(%RSP),%RAX |
0x43929a LEA (%R14,%RAX,8),%R10 |
0x43929e MOV 0x38(%RSP),%RAX |
0x4392a3 LEA (%R14,%RAX,8),%R11 |
0x4392a7 MOV 0x48(%RSP),%RAX |
0x4392ac LEA (%R14,%RAX,8),%RCX |
0x4392b0 LEA (%R14,%RBX,8),%RDI |
0x4392b4 XOR %EAX,%EAX |
0x4392b6 MOV 0x18(%RSP),%R15 |
0x4392bb NOPL (%RAX,%RAX,1) |
(676) 0x4392c0 VMULPD (%R15,%RAX,8),%ZMM6,%ZMM13 |
(676) 0x4392c7 VMOVUPD %ZMM13,(%R15,%RAX,8) |
(676) 0x4392ce VMULPD (%RDX,%RAX,8),%ZMM7,%ZMM13 |
(676) 0x4392d5 VMOVUPD %ZMM13,(%RDX,%RAX,8) |
(676) 0x4392dc VMULPD (%R12,%RAX,8),%ZMM8,%ZMM13 |
(676) 0x4392e3 VMOVUPD %ZMM13,(%R12,%RAX,8) |
(676) 0x4392ea VMULPD (%R14,%RAX,8),%ZMM9,%ZMM13 |
(676) 0x4392f1 VMOVUPD %ZMM13,(%R14,%RAX,8) |
(676) 0x4392f8 VMULPD (%R11,%RAX,8),%ZMM10,%ZMM13 |
(676) 0x4392ff VMOVUPD %ZMM13,(%R11,%RAX,8) |
(676) 0x439306 VMULPD (%R10,%RAX,8),%ZMM11,%ZMM13 |
(676) 0x43930d VMOVUPD %ZMM13,(%R10,%RAX,8) |
(676) 0x439314 VMULPD (%RDI,%RAX,8),%ZMM12,%ZMM13 |
(676) 0x43931b VMOVUPD %ZMM13,(%RDI,%RAX,8) |
(676) 0x439322 VMULPD (%RCX,%RAX,8),%ZMM14,%ZMM13 |
(676) 0x439329 VMOVUPD %ZMM13,(%RCX,%RAX,8) |
(676) 0x439330 VMULPD (%R9,%RAX,8),%ZMM15,%ZMM13 |
(676) 0x439337 VMOVUPD %ZMM13,(%R9,%RAX,8) |
(676) 0x43933e ADD $0x8,%RAX |
(676) 0x439342 CMP %R8,%RAX |
(676) 0x439345 JL 4392c0 |
0x43934b CMP 0x10(%RSP),%R8 |
0x439350 MOV 0x78(%RSP),%RDX |
0x439355 MOV 0x40(%RSP),%RCX |
0x43935a MOV 0x38(%RSP),%RSI |
0x43935f JE 438425 |
0x439365 JMP 43938f |
0x439370 XOR %R8D,%R8D |
0x439373 MOV 0x78(%RSP),%RDX |
0x439378 MOV 0xa8(%RSP),%R13 |
0x439380 MOV 0x40(%RSP),%RCX |
0x439385 MOV 0x38(%RSP),%RSI |
0x43938a MOV 0x18(%RSP),%R15 |
0x43938f VPBROADCASTQ %R8,%ZMM6 |
0x439395 VPORQ 0x58aa1(%RIP),%ZMM6,%ZMM6 |
0x43939f VPCMPLTUQ 0x280(%RSP),%ZMM6,%K1 |
0x4393a8 KORTESTB %K1,%K1 |
0x4393ac JE 438425 |
0x4393b2 VMOVUPD (%R15,%R8,8),%ZMM6{%K1}{z} |
0x4393b9 VMOVUPD 0x2c0(%RSP),%ZMM7 |
0x4393c1 VMOVAPD %ZMM6,%ZMM7{%K1} |
0x4393c7 VBROADCASTSD %XMM2,%ZMM6 |
0x4393cd VMOVUPD %ZMM7,0x2c0(%RSP) |
0x4393d5 VMULPD %ZMM6,%ZMM7,%ZMM6 |
0x4393db VMOVUPD %ZMM6,(%R15,%R8,8){%K1} |
0x4393e2 ADD %R8,%RBX |
0x4393e5 VMOVUPD (%R15,%RBX,8),%ZMM6{%K1}{z} |
0x4393ec VMOVUPD 0x300(%RSP),%ZMM7 |
0x4393f4 VMOVAPD %ZMM6,%ZMM7{%K1} |
0x4393fa VBROADCASTSD %XMM1,%ZMM6 |
0x439400 VMOVUPD %ZMM7,0x300(%RSP) |
0x439408 VMULPD %ZMM6,%ZMM7,%ZMM6 |
0x43940e VMOVUPD %ZMM6,(%R15,%RBX,8){%K1} |
0x439415 MOV 0x48(%RSP),%RAX |
0x43941a ADD %R8,%RAX |
0x43941d VMOVUPD (%R15,%RAX,8),%ZMM6{%K1}{z} |
0x439424 VMOVUPD 0x340(%RSP),%ZMM7 |
0x43942c VMOVAPD %ZMM6,%ZMM7{%K1} |
0x439432 VBROADCASTSD %XMM0,%ZMM6 |
0x439438 VMOVUPD %ZMM7,0x340(%RSP) |
0x439440 VMULPD %ZMM6,%ZMM7,%ZMM6 |
0x439446 VMOVUPD %ZMM6,(%R15,%RAX,8){%K1} |
0x43944d VMOVUPD (%R14,%R8,8),%ZMM6{%K1}{z} |
0x439454 VMOVUPD 0x380(%RSP),%ZMM7 |
0x43945c VMOVAPD %ZMM6,%ZMM7{%K1} |
0x439462 VBROADCASTSD %XMM5,%ZMM5 |
0x439468 VMOVUPD %ZMM7,0x380(%RSP) |
0x439470 VMULPD %ZMM7,%ZMM5,%ZMM5 |
0x439476 VMOVUPD %ZMM5,(%R14,%R8,8){%K1} |
0x43947d ADD %R8,%RSI |
0x439480 VMOVUPD (%R14,%RSI,8),%ZMM5{%K1}{z} |
0x439487 VMOVUPD 0x3c0(%RSP),%ZMM6 |
0x43948f VMOVAPD %ZMM5,%ZMM6{%K1} |
0x439495 VBROADCASTSD %XMM4,%ZMM4 |
0x43949b VMOVUPD %ZMM6,0x3c0(%RSP) |
0x4394a3 VMULPD %ZMM6,%ZMM4,%ZMM4 |
0x4394a9 VMOVUPD %ZMM4,(%R14,%RSI,8){%K1} |
0x4394b0 ADD %R8,%RCX |
0x4394b3 VMOVUPD (%R14,%RCX,8),%ZMM4{%K1}{z} |
0x4394ba VMOVUPD 0x400(%RSP),%ZMM5 |
0x4394c2 VMOVAPD %ZMM4,%ZMM5{%K1} |
0x4394c8 VBROADCASTSD %XMM3,%ZMM3 |
0x4394ce VMOVUPD %ZMM5,0x400(%RSP) |
0x4394d6 VMULPD %ZMM5,%ZMM3,%ZMM3 |
0x4394dc VMOVUPD %ZMM3,(%R14,%RCX,8){%K1} |
0x4394e3 VMOVUPD (%R14,%RBX,8),%ZMM3{%K1}{z} |
0x4394ea VMOVUPD 0x440(%RSP),%ZMM4 |
0x4394f2 VMOVAPD %ZMM3,%ZMM4{%K1} |
0x4394f8 VBROADCASTSD %XMM18,%ZMM2 |
0x4394fe VMOVUPD %ZMM4,0x440(%RSP) |
0x439506 VMULPD %ZMM4,%ZMM2,%ZMM2 |
0x43950c VMOVUPD %ZMM2,(%R14,%RBX,8){%K1} |
0x439513 VMOVUPD (%R14,%RAX,8),%ZMM2{%K1}{z} |
0x43951a VMOVUPD 0x480(%RSP),%ZMM3 |
0x439522 VMOVAPD %ZMM2,%ZMM3{%K1} |
0x439528 VBROADCASTSD %XMM17,%ZMM1 |
0x43952e VMOVUPD %ZMM3,0x480(%RSP) |
0x439536 VMULPD %ZMM3,%ZMM1,%ZMM1 |
0x43953c VMOVUPD %ZMM1,(%R14,%RAX,8){%K1} |
0x439543 ADD %R8,%R13 |
0x439546 VMOVUPD (%R14,%R13,8),%ZMM1{%K1}{z} |
0x43954d VMOVUPD 0x4c0(%RSP),%ZMM2 |
0x439555 VMOVAPD %ZMM1,%ZMM2{%K1} |
0x43955b VBROADCASTSD %XMM16,%ZMM0 |
0x439561 VMOVUPD %ZMM2,0x4c0(%RSP) |
0x439569 VMULPD %ZMM2,%ZMM0,%ZMM0 |
0x43956f VMOVUPD %ZMM0,(%R14,%R13,8){%K1} |
0x439576 JMP 438425 |
/home/kcamus/qaas_runs/169-451-1869/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/TinyVectorOps.h: 59 - 59 |
-------------------------------------------------------------------------------- |
59: for (unsigned d = 0; d < D; ++d) |
/home/kcamus/qaas_runs/169-451-1869/intel/miniqmc/build/miniqmc/src/Numerics/Spline2/MultiBsplineEvalHelper.hpp: 47 - 49 |
-------------------------------------------------------------------------------- |
47: T sf = std::floor(x); |
48: T dx2 = x - sf; |
49: int ind2 = std::min(std::max(0, static_cast<int>(sf)), nmax); |
/home/kcamus/qaas_runs/169-451-1869/intel/miniqmc/build/miniqmc/src/Numerics/Spline2/MultiBsplineRef.hpp: 193 - 295 |
-------------------------------------------------------------------------------- |
193: y -= spline_m->y_grid.start; |
194: z -= spline_m->z_grid.start; |
195: spline2::getSplineBound(x * spline_m->x_grid.delta_inv, tx, ix, spline_m->x_grid.num - 1); |
196: spline2::getSplineBound(y * spline_m->y_grid.delta_inv, ty, iy, spline_m->y_grid.num - 1); |
197: spline2::getSplineBound(z * spline_m->z_grid.delta_inv, tz, iz, spline_m->z_grid.num - 1); |
[...] |
203: const intptr_t xs = spline_m->x_stride; |
204: const intptr_t ys = spline_m->y_stride; |
205: const intptr_t zs = spline_m->z_stride; |
206: |
207: const size_t out_offset = spline_m->num_splines; |
208: |
209: T* restrict gx = grads; |
210: T* restrict gy = grads + out_offset; |
211: T* restrict gz = grads + 2 * out_offset; |
212: |
213: T* restrict hxx = hess; |
214: T* restrict hxy = hess + out_offset; |
215: T* restrict hxz = hess + 2 * out_offset; |
216: T* restrict hyy = hess + 3 * out_offset; |
217: T* restrict hyz = hess + 4 * out_offset; |
218: T* restrict hzz = hess + 5 * out_offset; |
[...] |
233: for (int i = 0; i < 4; i++) |
234: for (int j = 0; j < 4; j++) |
235: { |
236: const T* restrict coefs = spline_m->coefs + (ix + i) * xs + (iy + j) * ys + iz * zs; |
237: const T* restrict coefszs = coefs + zs; |
238: const T* restrict coefs2zs = coefs + 2 * zs; |
239: const T* restrict coefs3zs = coefs + 3 * zs; |
240: |
241: const T pre20 = d2a[i] * b[j]; |
242: const T pre10 = da[i] * b[j]; |
243: const T pre00 = a[i] * b[j]; |
244: const T pre11 = da[i] * db[j]; |
245: const T pre01 = a[i] * db[j]; |
246: const T pre02 = a[i] * d2b[j]; |
247: |
248: const int iSplitPoint = num_splines; |
249: #pragma omp simd aligned(coefs, coefszs, coefs2zs, coefs3zs: QMC_SIMD_ALIGNMENT) simdlen(simdlen_) |
250: for (int n = 0; n < iSplitPoint; n++) |
251: { |
252: T coefsv = coefs[n]; |
253: T coefsvzs = coefszs[n]; |
254: T coefsv2zs = coefs2zs[n]; |
255: T coefsv3zs = coefs3zs[n]; |
256: |
257: T sum0 = c[0] * coefsv + c[1] * coefsvzs + c[2] * coefsv2zs + c[3] * coefsv3zs; |
258: T sum1 = dc[0] * coefsv + dc[1] * coefsvzs + dc[2] * coefsv2zs + dc[3] * coefsv3zs; |
259: T sum2 = d2c[0] * coefsv + d2c[1] * coefsvzs + d2c[2] * coefsv2zs + d2c[3] * coefsv3zs; |
260: |
261: hxx[n] += pre20 * sum0; |
262: hxy[n] += pre11 * sum0; |
263: hxz[n] += pre10 * sum1; |
264: hyy[n] += pre02 * sum0; |
265: hyz[n] += pre01 * sum1; |
266: hzz[n] += pre00 * sum2; |
267: gx[n] += pre10 * sum0; |
268: gy[n] += pre01 * sum0; |
269: gz[n] += pre00 * sum1; |
270: vals[n] += pre00 * sum0; |
[...] |
277: const T dxx = dxInv * dxInv; |
278: const T dyy = dyInv * dyInv; |
279: const T dzz = dzInv * dzInv; |
280: const T dxy = dxInv * dyInv; |
281: const T dxz = dxInv * dzInv; |
282: const T dyz = dyInv * dzInv; |
283: |
284: #pragma omp simd simdlen(simdlen_) |
285: for (int n = 0; n < num_splines; n++) |
286: { |
287: gx[n] *= dxInv; |
288: gy[n] *= dyInv; |
289: gz[n] *= dzInv; |
290: hxx[n] *= dxx; |
291: hyy[n] *= dyy; |
292: hzz[n] *= dzz; |
293: hxy[n] *= dxy; |
294: hxz[n] *= dxz; |
295: hyz[n] *= dyz; |
/home/kcamus/qaas_runs/169-451-1869/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/einspline_spo_ref.hpp: 206 - 208 |
-------------------------------------------------------------------------------- |
206: for (int i = 0; i < nBlocks; ++i) |
207: MultiBsplineEvalRef::evaluate_vgh(einsplines[i], u[0], u[1], u[2], psi[i].data(), grad[i].data(), hess[i].data(), |
208: nSplinesPerBlock); |
/home/kcamus/qaas_runs/169-451-1869/intel/miniqmc/build/miniqmc/src/Numerics/Spline2/MultiBsplineData.hpp: 68 - 79 |
-------------------------------------------------------------------------------- |
68: a[0] = ((A00 * tx + A01) * tx + A02) * tx + A03; |
69: a[1] = ((A10 * tx + A11) * tx + A12) * tx + A13; |
70: a[2] = ((A20 * tx + A21) * tx + A22) * tx + A23; |
71: a[3] = ((A30 * tx + A31) * tx + A32) * tx + A33; |
72: da[0] = (dA01 * tx + dA02) * tx + dA03; |
73: da[1] = (dA11 * tx + dA12) * tx + dA13; |
74: da[2] = (dA21 * tx + dA22) * tx + dA23; |
75: da[3] = (dA31 * tx + dA32) * tx + dA33; |
76: d2a[0] = d2A02 * tx + d2A03; |
77: d2a[1] = d2A12 * tx + d2A13; |
78: d2a[2] = d2A22 * tx + d2A23; |
79: d2a[3] = d2A32 * tx + d2A33; |
/home/kcamus/qaas_runs/169-451-1869/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/VectorSoAContainer.h: 237 - 237 |
-------------------------------------------------------------------------------- |
237: T* data() { return myData; } |
/usr/lib64/gcc/x86_64-pc-linux-gnu/13.1.1/../../../../include/c++/13.1.1/bits/stl_algobase.h: 238 - 931 |
-------------------------------------------------------------------------------- |
238: if (__b < __a) |
[...] |
930: for (; __first != __last; ++__first) |
931: *__first = __tmp; |
/usr/lib64/gcc/x86_64-pc-linux-gnu/13.1.1/../../../../include/c++/13.1.1/bits/stl_vector.h: 1126 - 1258 |
-------------------------------------------------------------------------------- |
1126: return *(this->_M_impl._M_start + __n); |
[...] |
1258: { return _M_data_ptr(this->_M_impl._M_start); } |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►66.67+ | miniqmcreference::DiracDetermi[...] | DiracDeterminantRef.cpp:100 | exec |
○ | qmcplusplus::WaveFunction::rat[...] | WaveFunction.cpp:202 | exec |
○ | main.extracted.104 | stl_vector.h:1126 | exec |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_fork_call | libiomp5.so | |
○ | __kmpc_fork_call | libiomp5.so | |
○ | main | miniqmc.cpp:404 | exec |
○ | __libc_init_first | libc.so.6 | |
►33.33+ | qmcplusplus::SPOSet::evaluate_[...] | OhmmsVector.h:144 | exec |
○ | miniqmcreference::DiracDetermi[...] | DiracDeterminantRef.cpp:263 | exec |
○ | miniqmcreference::DiracDetermi[...] | DiracDeterminantRef.cpp:238 | exec |
○ | qmcplusplus::WaveFunction::eva[...] | WaveFunction.cpp:176 | exec |
○ | main.extracted.107 | miniqmc.cpp:375 | exec |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_fork_call | libiomp5.so | |
○ | __kmpc_fork_call | libiomp5.so | |
○ | main | miniqmc.cpp:374 | exec |
○ | __libc_init_first | libc.so.6 |
Path / |
Metric | Value |
---|---|
CQA speedup if no scalar integer | 1.61 |
CQA speedup if FP arith vectorized | 1.15 |
CQA speedup if fully vectorized | 1.69 |
CQA speedup if no inter-iteration dependency | NA |
CQA speedup if next bottleneck killed | 1.37 |
Bottlenecks | micro-operation queue, |
Function | miniqmcreference::einspline_spo_ref |
Source | TinyVectorOps.h:59-59,MultiBsplineEvalHelper.hpp:47-49,MultiBsplineRef.hpp:193-295,einspline_spo_ref.hpp:206-208,MultiBsplineData.hpp:68-79,VectorSoAContainer.h:237-237,stl_algobase.h:238-931,stl_vector.h:1126-1258 |
Source loop unroll info | NA |
Source loop unroll confidence level | NA |
Unroll/vectorization loop type | NA |
Unroll factor | NA |
CQA cycles | 122.25 |
CQA cycles if no scalar integer | 76.00 |
CQA cycles if FP arith vectorized | 106.72 |
CQA cycles if fully vectorized | 72.41 |
Front-end cycles | 122.25 |
DIV/SQRT cycles | 63.00 |
P0 cycles | 62.00 |
P1 cycles | 66.33 |
P2 cycles | 66.33 |
P3 cycles | 89.00 |
P4 cycles | 63.00 |
P5 cycles | 44.00 |
P6 cycles | 66.33 |
P7 cycles | 0.00 |
Inter-iter dependencies cycles | NA |
FE+BE cycles (UFS) | 136.54 |
Stall cycles (UFS) | 17.03 |
Nb insns | 468.00 |
Nb uops | 489.00 |
Nb loads | 111.00 |
Nb stores | 79.00 |
Nb stack references | 65.00 |
FLOP/cycle | 1.57 |
Nb FLOP add-sub | 16.00 |
Nb FLOP mul | 100.00 |
Nb FLOP fma | 38.00 |
Nb FLOP div | 0.00 |
Nb FLOP rcp | 0.00 |
Nb FLOP sqrt | 0.00 |
Nb FLOP rsqrt | 0.00 |
Bytes/cycle | 31.77 |
Bytes prefetched | 0.00 |
Bytes loaded | 2104.00 |
Bytes stored | 1780.00 |
Stride 0 | NA |
Stride 1 | NA |
Stride n | NA |
Stride unknown | NA |
Stride indirect | NA |
Vectorization ratio all | 41.78 |
Vectorization ratio load | 56.25 |
Vectorization ratio store | 37.97 |
Vectorization ratio mul | 45.45 |
Vectorization ratio add_sub | 38.46 |
Vectorization ratio fma | 5.56 |
Vectorization ratio div_sqrt | NA |
Vectorization ratio other | 47.73 |
Vector-efficiency ratio all | 31.64 |
Vector-efficiency ratio load | 42.68 |
Vector-efficiency ratio store | 35.21 |
Vector-efficiency ratio mul | 38.64 |
Vector-efficiency ratio add_sub | 17.31 |
Vector-efficiency ratio fma | 13.19 |
Vector-efficiency ratio div_sqrt | NA |
Vector-efficiency ratio other | 27.49 |
Metric | Value |
---|---|
CQA speedup if no scalar integer | 1.61 |
CQA speedup if FP arith vectorized | 1.15 |
CQA speedup if fully vectorized | 1.69 |
CQA speedup if no inter-iteration dependency | NA |
CQA speedup if next bottleneck killed | 1.37 |
Bottlenecks | micro-operation queue, |
Function | miniqmcreference::einspline_spo_ref |
Source | TinyVectorOps.h:59-59,MultiBsplineEvalHelper.hpp:47-49,MultiBsplineRef.hpp:193-295,einspline_spo_ref.hpp:206-208,MultiBsplineData.hpp:68-79,VectorSoAContainer.h:237-237,stl_algobase.h:238-931,stl_vector.h:1126-1258 |
Source loop unroll info | NA |
Source loop unroll confidence level | NA |
Unroll/vectorization loop type | NA |
Unroll factor | NA |
CQA cycles | 122.25 |
CQA cycles if no scalar integer | 76.00 |
CQA cycles if FP arith vectorized | 106.72 |
CQA cycles if fully vectorized | 72.41 |
Front-end cycles | 122.25 |
DIV/SQRT cycles | 63.00 |
P0 cycles | 62.00 |
P1 cycles | 66.33 |
P2 cycles | 66.33 |
P3 cycles | 89.00 |
P4 cycles | 63.00 |
P5 cycles | 44.00 |
P6 cycles | 66.33 |
P7 cycles | 0.00 |
Inter-iter dependencies cycles | NA |
FE+BE cycles (UFS) | 136.54 |
Stall cycles (UFS) | 17.03 |
Nb insns | 468.00 |
Nb uops | 489.00 |
Nb loads | 111.00 |
Nb stores | 79.00 |
Nb stack references | 65.00 |
FLOP/cycle | 1.57 |
Nb FLOP add-sub | 16.00 |
Nb FLOP mul | 100.00 |
Nb FLOP fma | 38.00 |
Nb FLOP div | 0.00 |
Nb FLOP rcp | 0.00 |
Nb FLOP sqrt | 0.00 |
Nb FLOP rsqrt | 0.00 |
Bytes/cycle | 31.77 |
Bytes prefetched | 0.00 |
Bytes loaded | 2104.00 |
Bytes stored | 1780.00 |
Stride 0 | NA |
Stride 1 | NA |
Stride n | NA |
Stride unknown | NA |
Stride indirect | NA |
Vectorization ratio all | 41.78 |
Vectorization ratio load | 56.25 |
Vectorization ratio store | 37.97 |
Vectorization ratio mul | 45.45 |
Vectorization ratio add_sub | 38.46 |
Vectorization ratio fma | 5.56 |
Vectorization ratio div_sqrt | NA |
Vectorization ratio other | 47.73 |
Vector-efficiency ratio all | 31.64 |
Vector-efficiency ratio load | 42.68 |
Vector-efficiency ratio store | 35.21 |
Vector-efficiency ratio mul | 38.64 |
Vector-efficiency ratio add_sub | 17.31 |
Vector-efficiency ratio fma | 13.19 |
Vector-efficiency ratio div_sqrt | NA |
Vector-efficiency ratio other | 27.49 |
Path / |
Function | miniqmcreference::einspline_spo_ref |
Source file and lines | TinyVectorOps.h:59-59 |
Module | exec |
nb instructions | 468 |
nb uops | 489 |
loop length | 2663 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 20 |
used ymm registers | 0 |
used zmm registers | 18 |
nb stack references | 65 |
ADD-SUB / MUL ratio | 0.38 |
micro-operation queue | 122.25 cycles |
front end | 122.25 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | |
---|---|---|---|---|---|---|---|---|
uops | 63.00 | 62.00 | 66.33 | 66.33 | 89.00 | 63.00 | 44.00 | 66.33 |
cycles | 63.00 | 62.00 | 66.33 | 66.33 | 89.00 | 63.00 | 44.00 | 66.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 136.54 |
Stall cycles | 17.03 |
ROB full (events) | 14.98 |
RS full (events) | 4.11 |
LB full (events) | 3.00 |
Front-end | 122.25 |
Dispatch | 89.00 |
Overall L1 | 122.25 |
all | 26% |
load | 54% |
store | 9% |
mul | 100% |
add-sub | 100% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 38% |
all | 45% |
load | 56% |
store | 56% |
mul | 43% |
add-sub | 33% |
fma | 5% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 50% |
all | 41% |
load | 56% |
store | 37% |
mul | 45% |
add-sub | 38% |
fma | 5% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 47% |
all | 19% |
load | 31% |
store | 15% |
mul | 25% |
add-sub | 25% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 23% |
all | 34% |
load | 45% |
store | 47% |
mul | 39% |
add-sub | 16% |
fma | 13% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 28% |
all | 31% |
load | 42% |
store | 35% |
mul | 38% |
add-sub | 17% |
fma | 13% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 27% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|
MOV 0x78(%RSP),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
INC %RDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV 0x128(%RSP),%R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOVSXD 0x30(%R15),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
CMP %RAX,%RDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JGE 43957b | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV 0x2e8(%R15),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x300(%R15),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV (%RAX,%RDX,8),%R11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%RDX,%RDX,2),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RCX,%RAX,8),%R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x318(%R15),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RDX,0x78(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA (,%RDX,8),%RCX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%RCX,%RCX,4),%RCX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x18(%RAX,%RCX,1),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RAX,0x18(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x330(%R15),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x18(%RAX,%RCX,1),%R14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x1f0(%RSP),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VSUBSD 0x78(%R11),%XMM0,%XMM0 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVSXD 0x40(%R15),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x98(%R11),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD %XMM1,0x230(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMULSD %XMM0,%XMM1,%XMM8 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x88(%R11),%ESI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
DEC %ESI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VROUNDSD $0x9,%XMM8,%XMM8,%XMM9 | 2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 8 | 1 |
VCVTTSD2SI %XMM9,%EAX | 2 | 1.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 6 | 1 |
MOV %EAX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
SAR $0x1f,%ECX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
ANDN %EAX,%ECX,%EAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %EAX,%ESI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVSD 0x28(%R11),%XMM2 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVHPD 0x50(%R11),%XMM2,%XMM2 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 1 | 0 | 0 | 4 | 1 |
VMOVUPD 0x200(%RSP),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VSUBPD %XMM2,%XMM0,%XMM2 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD 0x48(%R11),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x70(%R11),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD %XMM0,0x220(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %XMM1,0x210(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VUNPCKLPD %XMM0,%XMM1,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VMULPD %XMM2,%XMM3,%XMM2 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VRNDSCALEPD $0x9,%XMM2,%XMM18 | 2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 8 | 1 |
VMOVD 0x38(%R11),%XMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VPINSRD $0x1,0x60(%R11),%XMM3,%XMM19 | 2 | 0 | 0 | 0.50 | 0.50 | 0 | 1 | 0 | 0 | 3 | 1 |
VSUBPD %XMM18,%XMM2,%XMM2 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD 0x597b8(%RIP),%XMM10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMULSD %XMM2,%XMM10,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD 0x55ad4(%RIP),%XMM12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VSUBSD %XMM3,%XMM12,%XMM4 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD %XMM2,%XMM2,%XMM5 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVDDUP %XMM2,%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VMOVUPD 0x1e0(%RSP),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VBLENDPD $0x1,%XMM4,%XMM0,%XMM4 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 1 | 0.33 |
VMULPD %XMM4,%XMM6,%XMM4 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVUPD 0x59eed(%RIP),%XMM11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VADDPD %XMM4,%XMM11,%XMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VUNPCKLPD %XMM5,%XMM2,%XMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VMOVUPD 0x59eed(%RIP),%XMM13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VFMADD213PD %XMM13,%XMM6,%XMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVUPD %XMM7,0x260(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVAPD %XMM2,%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVSD 0x55aeb(%RIP),%XMM14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VFMADD213SD %XMM12,%XMM14,%XMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD213SD %XMM12,%XMM2,%XMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD213SD %XMM10,%XMM2,%XMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM6,0x270(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMULSD %XMM5,%XMM3,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM3,0x278(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVAPD %XMM2,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVSD 0x55a6a(%RIP),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VFMADD213SD %XMM1,%XMM14,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD213SD %XMM14,%XMM2,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM3,0x1c0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVAPD %XMM2,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVSD 0x5971b(%RIP),%XMM15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x55a79(%RIP),%XMM16 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VFMADD213SD %XMM16,%XMM15,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULSD %XMM2,%XMM3,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM3,0x1c8(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVAPD %XMM2,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VFMSUB213SD %XMM1,%XMM15,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFNMADD213SD %XMM12,%XMM2,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM3,0x1d0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VPERMILPD $0x1,%XMM4,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VMULSD %XMM2,%XMM3,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM3,0x1d8(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VSUBSD %XMM2,%XMM1,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM3,0x180(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVAPD %XMM2,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVSD 0x58939(%RIP),%XMM17 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VFMADD213SD %XMM16,%XMM17,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM3,0x188(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CMOVGE %EAX,%ESI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
VMOVAPD %XMM2,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VFNMADD213SD %XMM1,%XMM17,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM3,0x190(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVLPD %XMM2,0x198(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VPERMILPD $0x1,%XMM2,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VMULSD %XMM3,%XMM10,%XMM4 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VSUBSD %XMM4,%XMM12,%XMM5 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULSD %XMM3,%XMM3,%XMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VPERMILPD $0x3,%XMM2,%XMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VBLENDPD $0x1,%XMM5,%XMM0,%XMM5 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 1 | 0.33 |
VMULPD %XMM5,%XMM7,%XMM5 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD %XMM5,%XMM11,%XMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VSHUFPD $0x1,%XMM6,%XMM2,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VFMADD213PD %XMM13,%XMM7,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVUPD %XMM0,0x240(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVAPD %XMM3,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VFMADD213SD %XMM12,%XMM14,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD213SD %XMM12,%XMM3,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD213SD %XMM10,%XMM3,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM0,0x250(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMULSD %XMM6,%XMM4,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM0,0x258(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVAPD %XMM3,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VFMADD213SD %XMM1,%XMM14,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD213SD %XMM14,%XMM3,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM0,0x1a0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVAPD %XMM3,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VFMADD213SD %XMM16,%XMM15,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULSD %XMM3,%XMM0,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM0,0x1a8(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVAPD %XMM3,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VFMSUB213SD %XMM1,%XMM15,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFNMADD213SD %XMM12,%XMM3,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM0,0x1b0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMULPD %XMM2,%XMM5,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVHPD %XMM0,0x1b8(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VSUBSD %XMM3,%XMM1,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM0,0x160(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVAPD %XMM3,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VFMADD213SD %XMM16,%XMM17,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM0,0x168(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VFNMADD213SD %XMM1,%XMM17,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM3,0x170(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVHPD %XMM2,0x178(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOVSXD 0xe8(%R11),%RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%RBX,%RBX,1),%RCX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (,%RBX,4),%R8 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
VSUBSD %XMM9,%XMM8,%XMM14 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULSD %XMM12,%XMM14,%XMM13 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDSD 0x558b2(%RIP),%XMM13,%XMM15 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULSD %XMM14,%XMM14,%XMM17 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD213SD 0x59562(%RIP),%XMM17,%XMM15 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVDQU64 0x10(%R11),%XMM16 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x20(%R11),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%RBX,%RBX,2),%R9 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%RBX,%RBX,4),%R10 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RDX,0x10(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
TEST %RDX,%RDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RCX,0x48(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R8,0xa8(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R10,0x40(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R9,0x38(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
JE 438969 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
LEA (%R14,%R10,8),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x280(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA (%R14,%R8,8),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x30(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA (%R14,%R9,8),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0xa0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA (%R14,%RCX,8),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x98(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA (%R14,%RBX,8),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x90(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x18(%RSP),%R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%R15,%RCX,8),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x88(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA (%R15,%RBX,8),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x80(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x10(%RSP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (,%RAX,8),%R13 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,0x28(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %ESI,0x20(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVUPD %XMM18,0x60(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVDQU64 %XMM19,0x50(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 4 | 1 |
VMOVUPD %XMM13,0xf0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %XMM14,0xe0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %XMM15,0xd0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVDQU64 %XMM16,0xc0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 4 | 1 |
VMOVSD %XMM17,0xb8(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R11,0xb0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VZEROUPPER | 4 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 47ebf0 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV %R15,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 47ebf0 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV 0x80(%RSP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 47ebf0 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV 0x88(%RSP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 47ebf0 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 47ebf0 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV 0x90(%RSP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 47ebf0 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV 0x98(%RSP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 47ebf0 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV 0xa0(%RSP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 47ebf0 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV 0x30(%RSP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 47ebf0 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV 0x280(%RSP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 47ebf0 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV 0xb0(%RSP),%R11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0xb8(%RSP),%XMM17 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVDQU64 0xc0(%RSP),%XMM16 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x28(%RSP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0xd0(%RSP),%XMM15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0xe0(%RSP),%XMM14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0xf0(%RSP),%XMM13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVDQU64 0x50(%RSP),%XMM19 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVUPD 0x60(%RSP),%XMM18 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x20(%RSP),%ESI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x59377(%RIP),%XMM4 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVAPD %XMM4,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVSD 0x55693(%RIP),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VFMSUB213SD %XMM1,%XMM14,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD 0x556ee(%RIP),%XMM2 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VFMSUB213SD %XMM2,%XMM14,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFNMADD213SD %XMM4,%XMM14,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVAPD %XMM14,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VFMADD213SD %XMM1,%XMM2,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD213SD %XMM1,%XMM14,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD213SD %XMM4,%XMM14,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVAPD %XMM14,%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVSD 0x55675(%RIP),%XMM5 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VFMADD213SD %XMM5,%XMM2,%XMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD213SD %XMM2,%XMM14,%XMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVAPD %XMM14,%XMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVSD 0x5932e(%RIP),%XMM2 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x5568e(%RIP),%XMM7 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VFMADD213SD %XMM7,%XMM2,%XMM9 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVAPD %XMM14,%XMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VFMSUB213SD %XMM5,%XMM2,%XMM8 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFNMADD213SD %XMM1,%XMM14,%XMM8 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VSUBSD %XMM14,%XMM5,%XMM10 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVAPD %XMM14,%XMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVSD 0x58580(%RIP),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VFMADD213SD %XMM7,%XMM1,%XMM11 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVAPD %XMM14,%XMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VFNMADD213SD %XMM5,%XMM1,%XMM12 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VCVTTPD2DQ %XMM18,%XMM1 | 2 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0 | 0 | 5 | 1 |
VPCMPEQD %XMM2,%XMM2,%XMM2 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDD %XMM2,%XMM19,%XMM2 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 1 | 0.33 |
VPMAXSD 0x55de0(%RIP),%XMM1,%XMM1 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPMINSD %XMM1,%XMM2,%XMM1 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV 0x8(%R11),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOVSXD %ESI,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RDI,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
IMUL %RAX,%R11 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPMOVSXDQ %XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VPMULLQ %XMM1,%XMM16,%XMM1 | 3 | 1.50 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPEXTRQ $0x1,%XMM1,%RCX | 2 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMULSD %XMM4,%XMM17,%XMM5 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
LEA (%R11,%RCX,1),%RDX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVQ %XMM1,%RSI | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
ADD %RSI,%RDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RDX,0x98(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VPEXTRQ $0x1,%XMM16,0x30(%RSP) | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 1 | 0 | 0.33 | 3 | 1 |
VMOVQ %XMM16,%R13 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
LEA (%RCX,%RSI,1),%R9 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x2(%RAX),%R8 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
IMUL %RDI,%R8 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%R8,%RCX,1),%RDX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RSI,%RDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RDX,0x90(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA 0x3(%RAX),%RDX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
IMUL %RDI,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RDX,%RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD %RSI,%RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RCX,0xa0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA (%RDI,%R11,1),%RCX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %R9,%RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RCX,0x88(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
INC %RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
IMUL %RDI,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0x18(%RSP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x10(%RSP),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RSI,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
AND $-0x8,%RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RCX,0x20(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM0,%ZMM29 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM15,%ZMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM3,%ZMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM14,%ZMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM5,%ZMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM6,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM9,%ZMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM8,%ZMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM13,%ZMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM10,%ZMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM11,%ZMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM12,%ZMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %RSI,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VMOVDQU64 %ZMM0,0x280(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 4 | 1 |
ADD %R9,%RDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD %R9,%R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD %R9,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD %R9,%R11 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV 0x48(%RSP),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %R12,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
LEA (%RDI,%RCX,8),%R12 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R10,%RDX,8),%RDX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R10,%R8,8),%RCX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R10,%RAX,8),%R9 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,0x50(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA (%R10,%R11,8),%R8 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RDX,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
LEA (%RDI,%RBX,8),%RDX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,0x138(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA (,%R13,8),%RDI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,0x130(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x30(%RSP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (,%RAX,8),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0xe0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R9,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
LEA (,%RBX,8),%R9 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RSI,0x158(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x18(%RSP),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
JMP 438be5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
CMPL $0,0x10(%RSP) | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
JLE 438420 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
VMOVUPD 0x210(%RSP),%XMM2 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMULSD %XMM2,%XMM2,%XMM5 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVUPD 0x220(%RSP),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMULSD %XMM1,%XMM1,%XMM4 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVUPD 0x230(%RSP),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMULSD %XMM0,%XMM0,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULSD %XMM2,%XMM1,%XMM18 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULSD %XMM2,%XMM0,%XMM17 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULSD %XMM1,%XMM0,%XMM16 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%RSP),%R8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
AND $-0x8,%R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 439370 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
VBROADCASTSD %XMM2,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM1,%ZMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM0,%ZMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM5,%ZMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM4,%ZMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM3,%ZMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM18,%ZMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM17,%ZMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM16,%ZMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
MOV 0xa8(%RSP),%R13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%R14,%R13,8),%R9 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RSP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%R14,%RAX,8),%R10 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x38(%RSP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%R14,%RAX,8),%R11 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x48(%RSP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%R14,%RAX,8),%RCX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R14,%RBX,8),%RDI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV 0x18(%RSP),%R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CMP 0x10(%RSP),%R8 | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
MOV 0x78(%RSP),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x40(%RSP),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x38(%RSP),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
JE 438425 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
JMP 43938f | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV 0x78(%RSP),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0xa8(%RSP),%R13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x40(%RSP),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x38(%RSP),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x18(%RSP),%R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VPBROADCASTQ %R8,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VPORQ 0x58aa1(%RIP),%ZMM6,%ZMM6 | 1 | 0.50 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
VPCMPLTUQ 0x280(%RSP),%ZMM6,%K1 | |||||||||||
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JE 438425 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
VMOVUPD (%R15,%R8,8),%ZMM6{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x2c0(%RSP),%ZMM7 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVAPD %ZMM6,%ZMM7{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD %XMM2,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM7,0x2c0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMULPD %ZMM6,%ZMM7,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD %ZMM6,(%R15,%R8,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
ADD %R8,%RBX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVUPD (%R15,%RBX,8),%ZMM6{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x300(%RSP),%ZMM7 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVAPD %ZMM6,%ZMM7{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD %XMM1,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM7,0x300(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMULPD %ZMM6,%ZMM7,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD %ZMM6,(%R15,%RBX,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x48(%RSP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD %R8,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVUPD (%R15,%RAX,8),%ZMM6{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x340(%RSP),%ZMM7 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVAPD %ZMM6,%ZMM7{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD %XMM0,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM7,0x340(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMULPD %ZMM6,%ZMM7,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD %ZMM6,(%R15,%RAX,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD (%R14,%R8,8),%ZMM6{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x380(%RSP),%ZMM7 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVAPD %ZMM6,%ZMM7{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD %XMM5,%ZMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM7,0x380(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMULPD %ZMM7,%ZMM5,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD %ZMM5,(%R14,%R8,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
ADD %R8,%RSI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVUPD (%R14,%RSI,8),%ZMM5{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x3c0(%RSP),%ZMM6 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVAPD %ZMM5,%ZMM6{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD %XMM4,%ZMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM6,0x3c0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMULPD %ZMM6,%ZMM4,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD %ZMM4,(%R14,%RSI,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
ADD %R8,%RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVUPD (%R14,%RCX,8),%ZMM4{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x400(%RSP),%ZMM5 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVAPD %ZMM4,%ZMM5{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD %XMM3,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM5,0x400(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMULPD %ZMM5,%ZMM3,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD %ZMM3,(%R14,%RCX,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD (%R14,%RBX,8),%ZMM3{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x440(%RSP),%ZMM4 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVAPD %ZMM3,%ZMM4{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD %XMM18,%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM4,0x440(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMULPD %ZMM4,%ZMM2,%ZMM2 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD %ZMM2,(%R14,%RBX,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD (%R14,%RAX,8),%ZMM2{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x480(%RSP),%ZMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVAPD %ZMM2,%ZMM3{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD %XMM17,%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM3,0x480(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMULPD %ZMM3,%ZMM1,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD %ZMM1,(%R14,%RAX,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
ADD %R8,%R13 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVUPD (%R14,%R13,8),%ZMM1{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x4c0(%RSP),%ZMM2 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVAPD %ZMM1,%ZMM2{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD %XMM16,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM2,0x4c0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMULPD %ZMM2,%ZMM0,%ZMM0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD %ZMM0,(%R14,%R13,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
JMP 438425 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
Function | miniqmcreference::einspline_spo_ref |
Source file and lines | TinyVectorOps.h:59-59 |
Module | exec |
nb instructions | 468 |
nb uops | 489 |
loop length | 2663 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 20 |
used ymm registers | 0 |
used zmm registers | 18 |
nb stack references | 65 |
ADD-SUB / MUL ratio | 0.38 |
micro-operation queue | 122.25 cycles |
front end | 122.25 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | |
---|---|---|---|---|---|---|---|---|
uops | 63.00 | 62.00 | 66.33 | 66.33 | 89.00 | 63.00 | 44.00 | 66.33 |
cycles | 63.00 | 62.00 | 66.33 | 66.33 | 89.00 | 63.00 | 44.00 | 66.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 136.54 |
Stall cycles | 17.03 |
ROB full (events) | 14.98 |
RS full (events) | 4.11 |
LB full (events) | 3.00 |
Front-end | 122.25 |
Dispatch | 89.00 |
Overall L1 | 122.25 |
all | 26% |
load | 54% |
store | 9% |
mul | 100% |
add-sub | 100% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 38% |
all | 45% |
load | 56% |
store | 56% |
mul | 43% |
add-sub | 33% |
fma | 5% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 50% |
all | 41% |
load | 56% |
store | 37% |
mul | 45% |
add-sub | 38% |
fma | 5% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 47% |
all | 19% |
load | 31% |
store | 15% |
mul | 25% |
add-sub | 25% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 23% |
all | 34% |
load | 45% |
store | 47% |
mul | 39% |
add-sub | 16% |
fma | 13% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 28% |
all | 31% |
load | 42% |
store | 35% |
mul | 38% |
add-sub | 17% |
fma | 13% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 27% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|
MOV 0x78(%RSP),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
INC %RDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV 0x128(%RSP),%R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOVSXD 0x30(%R15),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
CMP %RAX,%RDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JGE 43957b | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV 0x2e8(%R15),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x300(%R15),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV (%RAX,%RDX,8),%R11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%RDX,%RDX,2),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RCX,%RAX,8),%R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x318(%R15),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RDX,0x78(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA (,%RDX,8),%RCX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%RCX,%RCX,4),%RCX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x18(%RAX,%RCX,1),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RAX,0x18(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x330(%R15),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x18(%RAX,%RCX,1),%R14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0x1f0(%RSP),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VSUBSD 0x78(%R11),%XMM0,%XMM0 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVSXD 0x40(%R15),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x98(%R11),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD %XMM1,0x230(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMULSD %XMM0,%XMM1,%XMM8 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x88(%R11),%ESI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
DEC %ESI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VROUNDSD $0x9,%XMM8,%XMM8,%XMM9 | 2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 8 | 1 |
VCVTTSD2SI %XMM9,%EAX | 2 | 1.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 6 | 1 |
MOV %EAX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
SAR $0x1f,%ECX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
ANDN %EAX,%ECX,%EAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %EAX,%ESI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVSD 0x28(%R11),%XMM2 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVHPD 0x50(%R11),%XMM2,%XMM2 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 1 | 0 | 0 | 4 | 1 |
VMOVUPD 0x200(%RSP),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VSUBPD %XMM2,%XMM0,%XMM2 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD 0x48(%R11),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x70(%R11),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD %XMM0,0x220(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %XMM1,0x210(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VUNPCKLPD %XMM0,%XMM1,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VMULPD %XMM2,%XMM3,%XMM2 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VRNDSCALEPD $0x9,%XMM2,%XMM18 | 2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 8 | 1 |
VMOVD 0x38(%R11),%XMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VPINSRD $0x1,0x60(%R11),%XMM3,%XMM19 | 2 | 0 | 0 | 0.50 | 0.50 | 0 | 1 | 0 | 0 | 3 | 1 |
VSUBPD %XMM18,%XMM2,%XMM2 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD 0x597b8(%RIP),%XMM10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMULSD %XMM2,%XMM10,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD 0x55ad4(%RIP),%XMM12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VSUBSD %XMM3,%XMM12,%XMM4 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULPD %XMM2,%XMM2,%XMM5 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVDDUP %XMM2,%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VMOVUPD 0x1e0(%RSP),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VBLENDPD $0x1,%XMM4,%XMM0,%XMM4 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 1 | 0.33 |
VMULPD %XMM4,%XMM6,%XMM4 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVUPD 0x59eed(%RIP),%XMM11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VADDPD %XMM4,%XMM11,%XMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VUNPCKLPD %XMM5,%XMM2,%XMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VMOVUPD 0x59eed(%RIP),%XMM13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VFMADD213PD %XMM13,%XMM6,%XMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVUPD %XMM7,0x260(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVAPD %XMM2,%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVSD 0x55aeb(%RIP),%XMM14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VFMADD213SD %XMM12,%XMM14,%XMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD213SD %XMM12,%XMM2,%XMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD213SD %XMM10,%XMM2,%XMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM6,0x270(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMULSD %XMM5,%XMM3,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM3,0x278(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVAPD %XMM2,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVSD 0x55a6a(%RIP),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VFMADD213SD %XMM1,%XMM14,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD213SD %XMM14,%XMM2,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM3,0x1c0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVAPD %XMM2,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVSD 0x5971b(%RIP),%XMM15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x55a79(%RIP),%XMM16 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VFMADD213SD %XMM16,%XMM15,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULSD %XMM2,%XMM3,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM3,0x1c8(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVAPD %XMM2,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VFMSUB213SD %XMM1,%XMM15,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFNMADD213SD %XMM12,%XMM2,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM3,0x1d0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VPERMILPD $0x1,%XMM4,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VMULSD %XMM2,%XMM3,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM3,0x1d8(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VSUBSD %XMM2,%XMM1,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM3,0x180(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVAPD %XMM2,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVSD 0x58939(%RIP),%XMM17 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VFMADD213SD %XMM16,%XMM17,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM3,0x188(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CMOVGE %EAX,%ESI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
VMOVAPD %XMM2,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VFNMADD213SD %XMM1,%XMM17,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM3,0x190(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVLPD %XMM2,0x198(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VPERMILPD $0x1,%XMM2,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VMULSD %XMM3,%XMM10,%XMM4 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VSUBSD %XMM4,%XMM12,%XMM5 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULSD %XMM3,%XMM3,%XMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VPERMILPD $0x3,%XMM2,%XMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VBLENDPD $0x1,%XMM5,%XMM0,%XMM5 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 1 | 0.33 |
VMULPD %XMM5,%XMM7,%XMM5 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDPD %XMM5,%XMM11,%XMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VSHUFPD $0x1,%XMM6,%XMM2,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VFMADD213PD %XMM13,%XMM7,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVUPD %XMM0,0x240(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVAPD %XMM3,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VFMADD213SD %XMM12,%XMM14,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD213SD %XMM12,%XMM3,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD213SD %XMM10,%XMM3,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM0,0x250(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMULSD %XMM6,%XMM4,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM0,0x258(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVAPD %XMM3,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VFMADD213SD %XMM1,%XMM14,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD213SD %XMM14,%XMM3,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM0,0x1a0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVAPD %XMM3,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VFMADD213SD %XMM16,%XMM15,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULSD %XMM3,%XMM0,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM0,0x1a8(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVAPD %XMM3,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VFMSUB213SD %XMM1,%XMM15,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFNMADD213SD %XMM12,%XMM3,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM0,0x1b0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMULPD %XMM2,%XMM5,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVHPD %XMM0,0x1b8(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VSUBSD %XMM3,%XMM1,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM0,0x160(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVAPD %XMM3,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VFMADD213SD %XMM16,%XMM17,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM0,0x168(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VFNMADD213SD %XMM1,%XMM17,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD %XMM3,0x170(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVHPD %XMM2,0x178(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOVSXD 0xe8(%R11),%RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%RBX,%RBX,1),%RCX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (,%RBX,4),%R8 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
VSUBSD %XMM9,%XMM8,%XMM14 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULSD %XMM12,%XMM14,%XMM13 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VADDSD 0x558b2(%RIP),%XMM13,%XMM15 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULSD %XMM14,%XMM14,%XMM17 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD213SD 0x59562(%RIP),%XMM17,%XMM15 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVDQU64 0x10(%R11),%XMM16 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x20(%R11),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%RBX,%RBX,2),%R9 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%RBX,%RBX,4),%R10 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RDX,0x10(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
TEST %RDX,%RDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RCX,0x48(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R8,0xa8(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R10,0x40(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R9,0x38(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
JE 438969 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
LEA (%R14,%R10,8),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x280(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA (%R14,%R8,8),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x30(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA (%R14,%R9,8),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0xa0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA (%R14,%RCX,8),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x98(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA (%R14,%RBX,8),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x90(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x18(%RSP),%R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%R15,%RCX,8),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x88(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA (%R15,%RBX,8),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x80(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x10(%RSP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (,%RAX,8),%R13 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,0x28(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %ESI,0x20(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVUPD %XMM18,0x60(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVDQU64 %XMM19,0x50(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 4 | 1 |
VMOVUPD %XMM13,0xf0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %XMM14,0xe0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD %XMM15,0xd0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVDQU64 %XMM16,0xc0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 4 | 1 |
VMOVSD %XMM17,0xb8(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R11,0xb0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VZEROUPPER | 4 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 47ebf0 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV %R15,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 47ebf0 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV 0x80(%RSP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 47ebf0 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV 0x88(%RSP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 47ebf0 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 47ebf0 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV 0x90(%RSP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 47ebf0 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV 0x98(%RSP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 47ebf0 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV 0xa0(%RSP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 47ebf0 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV 0x30(%RSP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 47ebf0 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV 0x280(%RSP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 47ebf0 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV 0xb0(%RSP),%R11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0xb8(%RSP),%XMM17 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVDQU64 0xc0(%RSP),%XMM16 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x28(%RSP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0xd0(%RSP),%XMM15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0xe0(%RSP),%XMM14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVUPD 0xf0(%RSP),%XMM13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVDQU64 0x50(%RSP),%XMM19 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVUPD 0x60(%RSP),%XMM18 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x20(%RSP),%ESI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x59377(%RIP),%XMM4 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVAPD %XMM4,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVSD 0x55693(%RIP),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VFMSUB213SD %XMM1,%XMM14,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD 0x556ee(%RIP),%XMM2 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VFMSUB213SD %XMM2,%XMM14,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFNMADD213SD %XMM4,%XMM14,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVAPD %XMM14,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VFMADD213SD %XMM1,%XMM2,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD213SD %XMM1,%XMM14,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD213SD %XMM4,%XMM14,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVAPD %XMM14,%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVSD 0x55675(%RIP),%XMM5 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VFMADD213SD %XMM5,%XMM2,%XMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD213SD %XMM2,%XMM14,%XMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVAPD %XMM14,%XMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVSD 0x5932e(%RIP),%XMM2 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD 0x5568e(%RIP),%XMM7 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VFMADD213SD %XMM7,%XMM2,%XMM9 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVAPD %XMM14,%XMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VFMSUB213SD %XMM5,%XMM2,%XMM8 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFNMADD213SD %XMM1,%XMM14,%XMM8 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VSUBSD %XMM14,%XMM5,%XMM10 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVAPD %XMM14,%XMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVSD 0x58580(%RIP),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VFMADD213SD %XMM7,%XMM1,%XMM11 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVAPD %XMM14,%XMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VFNMADD213SD %XMM5,%XMM1,%XMM12 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VCVTTPD2DQ %XMM18,%XMM1 | 2 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0 | 0 | 5 | 1 |
VPCMPEQD %XMM2,%XMM2,%XMM2 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDD %XMM2,%XMM19,%XMM2 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 1 | 0.33 |
VPMAXSD 0x55de0(%RIP),%XMM1,%XMM1 | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPMINSD %XMM1,%XMM2,%XMM1 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV 0x8(%R11),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOVSXD %ESI,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RDI,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
IMUL %RAX,%R11 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPMOVSXDQ %XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VPMULLQ %XMM1,%XMM16,%XMM1 | 3 | 1.50 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPEXTRQ $0x1,%XMM1,%RCX | 2 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMULSD %XMM4,%XMM17,%XMM5 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
LEA (%R11,%RCX,1),%RDX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVQ %XMM1,%RSI | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
ADD %RSI,%RDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RDX,0x98(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VPEXTRQ $0x1,%XMM16,0x30(%RSP) | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 1 | 0 | 0.33 | 3 | 1 |
VMOVQ %XMM16,%R13 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
LEA (%RCX,%RSI,1),%R9 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x2(%RAX),%R8 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
IMUL %RDI,%R8 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%R8,%RCX,1),%RDX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RSI,%RDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RDX,0x90(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA 0x3(%RAX),%RDX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
IMUL %RDI,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RDX,%RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD %RSI,%RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RCX,0xa0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA (%RDI,%R11,1),%RCX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %R9,%RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RCX,0x88(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
INC %RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
IMUL %RDI,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0x18(%RSP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x10(%RSP),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RSI,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
AND $-0x8,%RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RCX,0x20(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VBROADCASTSD %XMM0,%ZMM29 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM15,%ZMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM3,%ZMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM14,%ZMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM5,%ZMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM6,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM9,%ZMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM8,%ZMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM13,%ZMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM10,%ZMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM11,%ZMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM12,%ZMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %RSI,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VMOVDQU64 %ZMM0,0x280(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 4 | 1 |
ADD %R9,%RDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD %R9,%R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD %R9,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD %R9,%R11 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV 0x48(%RSP),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %R12,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
LEA (%RDI,%RCX,8),%R12 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R10,%RDX,8),%RDX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R10,%R8,8),%RCX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R10,%RAX,8),%R9 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,0x50(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA (%R10,%R11,8),%R8 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RDX,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
LEA (%RDI,%RBX,8),%RDX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,0x138(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA (,%R13,8),%RDI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,0x130(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x30(%RSP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (,%RAX,8),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0xe0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R9,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
LEA (,%RBX,8),%R9 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RSI,0x158(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x18(%RSP),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
JMP 438be5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
CMPL $0,0x10(%RSP) | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
JLE 438420 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
VMOVUPD 0x210(%RSP),%XMM2 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMULSD %XMM2,%XMM2,%XMM5 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVUPD 0x220(%RSP),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMULSD %XMM1,%XMM1,%XMM4 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVUPD 0x230(%RSP),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMULSD %XMM0,%XMM0,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULSD %XMM2,%XMM1,%XMM18 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULSD %XMM2,%XMM0,%XMM17 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULSD %XMM1,%XMM0,%XMM16 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%RSP),%R8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
AND $-0x8,%R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JE 439370 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
VBROADCASTSD %XMM2,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM1,%ZMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM0,%ZMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM5,%ZMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM4,%ZMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM3,%ZMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM18,%ZMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM17,%ZMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM16,%ZMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
MOV 0xa8(%RSP),%R13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%R14,%R13,8),%R9 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RSP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%R14,%RAX,8),%R10 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x38(%RSP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%R14,%RAX,8),%R11 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x48(%RSP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA (%R14,%RAX,8),%RCX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R14,%RBX,8),%RDI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV 0x18(%RSP),%R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CMP 0x10(%RSP),%R8 | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
MOV 0x78(%RSP),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x40(%RSP),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x38(%RSP),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
JE 438425 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
JMP 43938f | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV 0x78(%RSP),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0xa8(%RSP),%R13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x40(%RSP),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x38(%RSP),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x18(%RSP),%R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VPBROADCASTQ %R8,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1 | 1 |
VPORQ 0x58aa1(%RIP),%ZMM6,%ZMM6 | 1 | 0.50 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
VPCMPLTUQ 0x280(%RSP),%ZMM6,%K1 | |||||||||||
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JE 438425 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
VMOVUPD (%R15,%R8,8),%ZMM6{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x2c0(%RSP),%ZMM7 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVAPD %ZMM6,%ZMM7{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD %XMM2,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM7,0x2c0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMULPD %ZMM6,%ZMM7,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD %ZMM6,(%R15,%R8,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
ADD %R8,%RBX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVUPD (%R15,%RBX,8),%ZMM6{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x300(%RSP),%ZMM7 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVAPD %ZMM6,%ZMM7{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD %XMM1,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM7,0x300(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMULPD %ZMM6,%ZMM7,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD %ZMM6,(%R15,%RBX,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x48(%RSP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD %R8,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVUPD (%R15,%RAX,8),%ZMM6{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x340(%RSP),%ZMM7 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVAPD %ZMM6,%ZMM7{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD %XMM0,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM7,0x340(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMULPD %ZMM6,%ZMM7,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD %ZMM6,(%R15,%RAX,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD (%R14,%R8,8),%ZMM6{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x380(%RSP),%ZMM7 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVAPD %ZMM6,%ZMM7{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD %XMM5,%ZMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM7,0x380(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMULPD %ZMM7,%ZMM5,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD %ZMM5,(%R14,%R8,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
ADD %R8,%RSI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVUPD (%R14,%RSI,8),%ZMM5{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x3c0(%RSP),%ZMM6 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVAPD %ZMM5,%ZMM6{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD %XMM4,%ZMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM6,0x3c0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMULPD %ZMM6,%ZMM4,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD %ZMM4,(%R14,%RSI,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
ADD %R8,%RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVUPD (%R14,%RCX,8),%ZMM4{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x400(%RSP),%ZMM5 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVAPD %ZMM4,%ZMM5{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD %XMM3,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM5,0x400(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMULPD %ZMM5,%ZMM3,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD %ZMM3,(%R14,%RCX,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD (%R14,%RBX,8),%ZMM3{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x440(%RSP),%ZMM4 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVAPD %ZMM3,%ZMM4{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD %XMM18,%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM4,0x440(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMULPD %ZMM4,%ZMM2,%ZMM2 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD %ZMM2,(%R14,%RBX,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVUPD (%R14,%RAX,8),%ZMM2{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x480(%RSP),%ZMM3 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVAPD %ZMM2,%ZMM3{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD %XMM17,%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM3,0x480(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMULPD %ZMM3,%ZMM1,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD %ZMM1,(%R14,%RAX,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
ADD %R8,%R13 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVUPD (%R14,%R13,8),%ZMM1{%K1}{z} | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVUPD 0x4c0(%RSP),%ZMM2 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5-6 | 0.50 |
VMOVAPD %ZMM1,%ZMM2{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VBROADCASTSD %XMM16,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM2,0x4c0(%RSP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMULPD %ZMM2,%ZMM0,%ZMM0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 4 | 0.50 |
VMOVUPD %ZMM0,(%R14,%R13,8){%K1} | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
JMP 438425 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |