Function: viscosity_kernel_.DIR.OMP.PARALLEL.2 | Module: exec | Source: viscosity_kernel.f90:50-94 | Coverage: 2.89% |
---|
Function: viscosity_kernel_.DIR.OMP.PARALLEL.2 | Module: exec | Source: viscosity_kernel.f90:50-94 | Coverage: 2.89% |
---|
/beegfs/hackathon/users/eoseret/qaas_runs/170-861-0321/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/viscosity_kernel.f90: 50 - 94 |
-------------------------------------------------------------------------------- |
50: !$OMP PARALLEL |
51: |
52: !$OMP DO PRIVATE(ugrad,vgrad,div,strain2,pgradx,pgrady,pgradx2,pgrady2,limiter,pgrad,xgrad,ygrad,grad,grad2,dirx,diry) |
53: DO k=y_min,y_max |
54: !$OMP SIMD |
55: DO j=x_min,x_max |
56: ugrad=(xvel0(j+1,k )+xvel0(j+1,k+1))-(xvel0(j ,k )+xvel0(j ,k+1)) |
57: |
58: vgrad=(yvel0(j ,k+1)+yvel0(j+1,k+1))-(yvel0(j ,k )+yvel0(j+1,k )) |
59: |
60: div = (celldx(j)*(ugrad)+ celldy(k)*(vgrad)) |
61: |
62: strain2 = 0.5_8*(xvel0(j, k+1) + xvel0(j+1,k+1)-xvel0(j ,k )-xvel0(j+1,k ))/celldy(k) & |
63: + 0.5_8*(yvel0(j+1,k ) + yvel0(j+1,k+1)-yvel0(j ,k )-yvel0(j ,k+1))/celldx(j) |
64: |
65: pgradx=(pressure(j+1,k)-pressure(j-1,k))/(celldx(j)+celldx(j+1)) |
66: pgrady=(pressure(j,k+1)-pressure(j,k-1))/(celldy(k)+celldy(k+1)) |
67: |
68: pgradx2 = pgradx*pgradx |
69: pgrady2 = pgrady*pgrady |
70: |
71: limiter = ((0.5_8*(ugrad)/celldx(j))*pgradx2+(0.5_8*(vgrad)/celldy(k))*pgrady2+strain2*pgradx*pgrady) & |
72: /MAX(pgradx2+pgrady2,1.0e-16_8) |
73: |
74: IF ((limiter.GT.0.0).OR.(div.GE.0.0))THEN |
75: viscosity(j,k) = 0.0 |
76: ELSE |
77: dirx=1.0_8 |
78: IF(pgradx.LT.0.0) dirx=-1.0_8 |
79: pgradx = dirx*MAX(1.0e-16_8,ABS(pgradx)) |
80: diry=1.0_8 |
81: IF(pgradx.LT.0.0) diry=-1.0_8 |
82: pgrady = diry*MAX(1.0e-16_8,ABS(pgrady)) |
83: pgrad = SQRT(pgradx**2+pgrady**2) |
84: xgrad = ABS(celldx(j)*pgrad/pgradx) |
85: ygrad = ABS(celldy(k)*pgrad/pgrady) |
86: grad = MIN(xgrad,ygrad) |
87: grad2 = grad*grad |
88: |
89: viscosity(j,k)=2.0_8*density0(j,k)*grad2*limiter*limiter |
90: ENDIF |
91: |
92: ENDDO |
93: ENDDO |
94: !$OMP END DO |
0x46d430 PUSH %RBP |
0x46d431 MOV %RSP,%RBP |
0x46d434 PUSH %R15 |
0x46d436 PUSH %R14 |
0x46d438 PUSH %R13 |
0x46d43a PUSH %R12 |
0x46d43c PUSH %RBX |
0x46d43d AND $-0x20,%RSP |
0x46d441 SUB $0x300,%RSP |
0x46d448 MOV %R9,0x30(%RSP) |
0x46d44d MOV %R8,0x28(%RSP) |
0x46d452 MOV 0x40(%RBP),%EBX |
0x46d455 MOV 0x38(%RBP),%EAX |
0x46d458 SUB %EBX,%EAX |
0x46d45a MOVL $0,0x24(%RSP) |
0x46d462 JS 46d4df |
0x46d464 MOV %RCX,%R12 |
0x46d467 MOV %RDX,%R13 |
0x46d46a MOV %RDI,0x48(%RSP) |
0x46d46f MOV (%RDI),%ESI |
0x46d471 MOVL $0,0x10(%RSP) |
0x46d479 MOV %EAX,0xc(%RSP) |
0x46d47d MOVL $0x1,0x20(%RSP) |
0x46d485 SUB $0x8,%RSP |
0x46d489 LEA 0x28(%RSP),%RAX |
0x46d48e LEA 0x2c(%RSP),%RCX |
0x46d493 LEA 0x18(%RSP),%R8 |
0x46d498 LEA 0x14(%RSP),%R9 |
0x46d49d MOV $0x542630,%EDI |
0x46d4a2 MOV %ESI,0x1c(%RSP) |
0x46d4a6 MOV $0x22,%EDX |
0x46d4ab PUSH $0x1 |
0x46d4ad PUSH $0x1 |
0x46d4af PUSH %RAX |
0x46d4b0 CALL 404670 <__kmpc_for_static_init_4@plt> |
0x46d4b5 ADD $0x20,%RSP |
0x46d4b9 MOV 0x10(%RSP),%EAX |
0x46d4bd MOV 0xc(%RSP),%ECX |
0x46d4c1 SUB %EAX,%ECX |
0x46d4c3 MOV %ECX,0x18(%RSP) |
0x46d4c7 JAE 46d4fa |
0x46d4c9 MOV $0x542650,%EDI |
0x46d4ce MOV 0x14(%RSP),%ESI |
0x46d4d2 VZEROUPPER |
0x46d4d5 CALL 404230 <__kmpc_for_static_fini@plt> |
0x46d4da MOV 0x48(%RSP),%RDI |
0x46d4df MOV (%RDI),%ESI |
0x46d4e1 MOV $0x542670,%EDI |
0x46d4e6 CALL 404740 <__kmpc_barrier@plt> |
0x46d4eb LEA -0x28(%RBP),%RSP |
0x46d4ef POP %RBX |
0x46d4f0 POP %R12 |
0x46d4f2 POP %R13 |
0x46d4f4 POP %R14 |
0x46d4f6 POP %R15 |
0x46d4f8 POP %RBP |
0x46d4f9 RET |
0x46d4fa MOV %RAX,%RDI |
0x46d4fd MOV 0x50(%RBP),%RDX |
0x46d501 MOV 0x48(%RBP),%RSI |
0x46d505 SAL $0x20,%R12 |
0x46d509 MOV $-0x200000000,%RAX |
0x46d513 LEA (%R12,%RAX,1),%RCX |
0x46d517 MOV %RCX,%R8 |
0x46d51a SAR $0x20,%R8 |
0x46d51e SAL $0x20,%R13 |
0x46d522 ADD %R13,%RAX |
0x46d525 MOV %RAX,%R9 |
0x46d528 SAR $0x20,%R9 |
0x46d52c MOVSXD (%RDX),%R10 |
0x46d52f MOV (%RSI),%EDX |
0x46d531 SUB %R10D,%EDX |
0x46d534 ADD %EBX,%EDI |
0x46d536 MOV %RDX,0x130(%RSP) |
0x46d53e INC %EDX |
0x46d540 CMP $0x2,%EDX |
0x46d543 MOV $0x1,%ESI |
0x46d548 CMOVGE %EDX,%ESI |
0x46d54b MOV %RSI,0x38(%RSP) |
0x46d550 AND $0x7ffffffc,%ESI |
0x46d556 MOV %RSI,0xd8(%RSP) |
0x46d55e TEST %RCX,%RCX |
0x46d561 MOV $-0x1,%RSI |
0x46d568 CMOVNS %RCX,%RSI |
0x46d56c TEST %RSI,%RSI |
0x46d56f MOV $0x1,%R11D |
0x46d575 CMOVG %R11,%RSI |
0x46d579 MOV $0x200000000,%RBX |
0x46d583 MOV %RBX,%RDX |
0x46d586 SUB %R12,%RDX |
0x46d589 CMP %RDX,%RCX |
0x46d58c CMOVG %RCX,%RDX |
0x46d590 LEA (,%R10,8),%RCX |
0x46d598 SHR $0x20,%RDX |
0x46d59c IMUL %RSI,%RDX |
0x46d5a0 MOV $-0x1,%RSI |
0x46d5a7 SAL $0x3,%RDX |
0x46d5ab SUB %RDX,%RCX |
0x46d5ae TEST %RAX,%RAX |
0x46d5b1 CMOVNS %RAX,%RSI |
0x46d5b5 TEST %RSI,%RSI |
0x46d5b8 CMOVG %R11,%RSI |
0x46d5bc SUB %R13,%RBX |
0x46d5bf MOV 0x30(%RBP),%R14 |
0x46d5c3 CMP %RBX,%RAX |
0x46d5c6 CMOVG %RAX,%RBX |
0x46d5ca MOV %R8,%RAX |
0x46d5cd NOT %RAX |
0x46d5d0 MOV %RAX,0xa8(%RSP) |
0x46d5d8 SHR $0x20,%RBX |
0x46d5dc IMUL %RSI,%RBX |
0x46d5e0 NEG %RBX |
0x46d5e3 MOV %RBX,0xc8(%RSP) |
0x46d5eb MOV $0x8,%ESI |
0x46d5f0 SUB %RDX,%RSI |
0x46d5f3 MOV %R9,%RAX |
0x46d5f6 NOT %RAX |
0x46d5f9 MOV %RAX,0xc0(%RSP) |
0x46d601 MOV %R9,0xe0(%RSP) |
0x46d609 SUB %R9,%R11 |
0x46d60c MOV %R11,0xd0(%RSP) |
0x46d614 MOV 0x20(%RBP),%RAX |
0x46d618 MOV 0x18(%RBP),%R9 |
0x46d61c MOV 0x10(%RBP),%RDX |
0x46d620 LEA 0x8(%R9,%RCX,1),%R11 |
0x46d625 MOV %R11,0x78(%RSP) |
0x46d62a ADD %RCX,%RDX |
0x46d62d MOV %RDX,0x70(%RSP) |
0x46d632 LEA (%RAX,%RCX,1),%RAX |
0x46d636 MOV %RAX,0x68(%RSP) |
0x46d63b LEA (%R9,%RCX,1),%RAX |
0x46d63f MOV %RAX,0x60(%RSP) |
0x46d644 LEA 0x8(%R14,%RCX,1),%RAX |
0x46d649 MOV %RAX,0x158(%RSP) |
0x46d651 MOV 0x28(%RSP),%RDX |
0x46d656 LEA 0x8(%RDX,%RCX,1),%RAX |
0x46d65b MOV %RAX,0x58(%RSP) |
0x46d660 MOV 0x30(%RSP),%RAX |
0x46d665 LEA 0x8(%RAX,%RCX,1),%RCX |
0x46d66a MOV %RCX,0x50(%RSP) |
0x46d66f MOV %R10,0xb0(%RSP) |
0x46d677 MOV %R8,0xb8(%RSP) |
0x46d67f SUB %R8,%R10 |
0x46d682 MOV %R10,0x98(%RSP) |
0x46d68a LEA (%R14,%RSI,1),%RCX |
0x46d68e MOV %RCX,0x90(%RSP) |
0x46d696 LEA (%R9,%RSI,1),%RCX |
0x46d69a MOV %RCX,0x88(%RSP) |
0x46d6a2 LEA (%RDX,%RSI,1),%RCX |
0x46d6a6 MOV %RCX,0x80(%RSP) |
0x46d6ae ADD %RAX,%RSI |
0x46d6b1 MOV %RSI,0xa0(%RSP) |
0x46d6b9 VMOVSD 0x8aded(%RIP),%XMM21 |
0x46d6c3 VMOVSD 0x8bafb(%RIP),%XMM22 |
0x46d6cd VMOVSD 0xa9ce1(%RIP),%XMM23 |
0x46d6d7 VMOVSD 0xa9cdf(%RIP),%XMM25 |
0x46d6e1 VBROADCASTSD 0x8adc6(%RIP),%YMM14 |
0x46d6ea VXORPD %XMM18,%XMM18,%XMM18 |
0x46d6f0 XOR %R9D,%R9D |
0x46d6f3 MOV %RDI,0xe8(%RSP) |
0x46d6fb MOV %EDI,%ESI |
0x46d6fd JMP 46d71e |
0x46d6ff NOP |
(923) 0x46d700 MOV 0x150(%RSP),%RCX |
(923) 0x46d708 LEA 0x1(%RCX),%EAX |
(923) 0x46d70b MOV 0x1c(%RSP),%ESI |
(923) 0x46d70f INC %ESI |
(923) 0x46d711 CMP 0x18(%RSP),%ECX |
(923) 0x46d715 MOV %EAX,%R9D |
(923) 0x46d718 JE 46d4c9 |
(923) 0x46d71e CMPL $0,0x130(%RSP) |
(923) 0x46d726 MOV %ESI,0x1c(%RSP) |
(923) 0x46d72a MOV %R9,0x150(%RSP) |
(923) 0x46d732 JS 46d700 |
(923) 0x46d734 MOVSXD %ESI,%R8 |
(923) 0x46d737 MOV 0xc8(%RSP),%RAX |
(923) 0x46d73f LEA (%RAX,%R8,1),%RBX |
(923) 0x46d743 MOV 0xc0(%RSP),%RAX |
(923) 0x46d74b LEA (%RAX,%R8,1),%R13 |
(923) 0x46d74f ADD 0xd0(%RSP),%R8 |
(923) 0x46d757 MOV 0xe8(%RSP),%RCX |
(923) 0x46d75f LEA (%RCX,%R9,1),%EAX |
(923) 0x46d763 MOVSXD %EAX,%R10 |
(923) 0x46d766 MOV 0xe0(%RSP),%RDX |
(923) 0x46d76e SUB %RDX,%R10 |
(923) 0x46d771 LEA (%RCX,%R9,1),%EAX |
(923) 0x46d775 INC %EAX |
(923) 0x46d777 CLTQ |
(923) 0x46d779 SUB %RDX,%RAX |
(923) 0x46d77c MOV 0x58(%RBP),%RCX |
(923) 0x46d780 MOV (%RCX),%R15 |
(923) 0x46d783 MOV 0x28(%RBP),%RDX |
(923) 0x46d787 VMOVSD (%RDX,%R10,8),%XMM20 |
(923) 0x46d78e MOV 0x60(%RBP),%RCX |
(923) 0x46d792 MOV (%RCX),%R14 |
(923) 0x46d795 MOV 0x68(%RBP),%RCX |
(923) 0x46d799 MOV (%RCX),%R11 |
(923) 0x46d79c VADDSD (%RDX,%RAX,8),%XMM20,%XMM1 |
(923) 0x46d7a3 MOV 0x70(%RBP),%RAX |
(923) 0x46d7a7 MOV (%RAX),%R12 |
(923) 0x46d7aa MOV 0xd8(%RSP),%RDI |
(923) 0x46d7b2 TEST %RDI,%RDI |
(923) 0x46d7b5 VMOVAPD %XMM20,0x170(%RSP) |
(923) 0x46d7bd MOV %R8,0x148(%RSP) |
(923) 0x46d7c5 MOV %R12,0x140(%RSP) |
(923) 0x46d7cd MOV %R14,0x138(%RSP) |
(923) 0x46d7d5 JE 46df30 |
(923) 0x46d7db VMOVAPD %XMM8,0x1f0(%RSP) |
(923) 0x46d7e4 VBROADCASTSD %XMM8,%YMM4 |
(923) 0x46d7e9 VMOVAPD %XMM26,0x1e0(%RSP) |
(923) 0x46d7f1 VBROADCASTSD %XMM26,%YMM17 |
(923) 0x46d7f7 VMOVAPD %XMM27,0x1d0(%RSP) |
(923) 0x46d7ff VBROADCASTSD %XMM27,%YMM16 |
(923) 0x46d805 VMOVAPD %XMM28,0x1c0(%RSP) |
(923) 0x46d80d VBROADCASTSD %XMM28,%YMM15 |
(923) 0x46d813 VMOVAPD %XMM31,0x1b0(%RSP) |
(923) 0x46d81b VBROADCASTSD %XMM31,%YMM19 |
(923) 0x46d821 VMOVAPD %XMM29,0x160(%RSP) |
(923) 0x46d829 VBROADCASTSD %XMM29,%YMM0 |
(923) 0x46d82f VMOVAPD %XMM30,0x1a0(%RSP) |
(923) 0x46d837 VBROADCASTSD %XMM30,%YMM27 |
(923) 0x46d83d MOV %R15,%RAX |
(923) 0x46d840 IMUL %R10,%RAX |
(923) 0x46d844 MOV %RAX,0x100(%RSP) |
(923) 0x46d84c LEA 0x1(%R10),%RCX |
(923) 0x46d850 MOV %R15,%RAX |
(923) 0x46d853 IMUL %RCX,%RAX |
(923) 0x46d857 MOV %RAX,0x108(%RSP) |
(923) 0x46d85f IMUL %R14,%RCX |
(923) 0x46d863 MOV %RCX,0xf8(%RSP) |
(923) 0x46d86b MOV %R14,%RAX |
(923) 0x46d86e IMUL %R10,%RAX |
(923) 0x46d872 MOV %RAX,0xf0(%RSP) |
(923) 0x46d87a VBROADCASTSD %XMM20,%YMM24 |
(923) 0x46d880 VDIVSD %XMM20,%XMM21,%XMM2 |
(923) 0x46d886 VBROADCASTSD %XMM2,%YMM26 |
(923) 0x46d88c IMUL %R11,%R10 |
(923) 0x46d890 MOV %R10,0x40(%RSP) |
(923) 0x46d895 VMOVSD %XMM1,0x118(%RSP) |
(923) 0x46d89e VDIVSD %XMM1,%XMM21,%XMM2 |
(923) 0x46d8a4 VBROADCASTSD %XMM2,%YMM1 |
(923) 0x46d8a9 VMOVAPD %YMM1,0x180(%RSP) |
(923) 0x46d8b2 MOV %R11,%RAX |
(923) 0x46d8b5 IMUL %RBX,%RAX |
(923) 0x46d8b9 ADD 0x78(%RSP),%RAX |
(923) 0x46d8be IMUL %RBX,%R12 |
(923) 0x46d8c2 ADD 0x70(%RSP),%R12 |
(923) 0x46d8c7 MOV %R11,%RDX |
(923) 0x46d8ca MOV %R13,0x128(%RSP) |
(923) 0x46d8d2 IMUL %R13,%R11 |
(923) 0x46d8d6 MOV 0x60(%RSP),%RCX |
(923) 0x46d8db ADD %RCX,%R11 |
(923) 0x46d8de MOV %R15,%R10 |
(923) 0x46d8e1 MOV %RDX,0x110(%RSP) |
(923) 0x46d8e9 MOV %RDX,%R15 |
(923) 0x46d8ec IMUL %R8,%R15 |
(923) 0x46d8f0 ADD %RCX,%R15 |
(923) 0x46d8f3 MOV %R14,%RSI |
(923) 0x46d8f6 IMUL %RBX,%RSI |
(923) 0x46d8fa MOV 0x58(%RSP),%RCX |
(923) 0x46d8ff ADD %RCX,%RSI |
(923) 0x46d902 MOV %R14,%RDX |
(923) 0x46d905 IMUL %R8,%RDX |
(923) 0x46d909 ADD %RCX,%RDX |
(923) 0x46d90c MOV %R10,%R14 |
(923) 0x46d90f IMUL %R8,%R14 |
(923) 0x46d913 MOV 0x50(%RSP),%RCX |
(923) 0x46d918 ADD %RCX,%R14 |
(923) 0x46d91b MOV %R10,0x120(%RSP) |
(923) 0x46d923 MOV %RBX,%R8 |
(923) 0x46d926 IMUL %RBX,%R10 |
(923) 0x46d92a ADD %RCX,%R10 |
(923) 0x46d92d VPCMPEQD %YMM7,%YMM7,%YMM7 |
(923) 0x46d931 XOR %R13D,%R13D |
(923) 0x46d934 VPCMPEQD %YMM12,%YMM12,%YMM12 |
(923) 0x46d939 VPCMPEQD %YMM11,%YMM11,%YMM11 |
(923) 0x46d93e VPCMPEQD %YMM3,%YMM3,%YMM3 |
(923) 0x46d942 VPCMPEQD %YMM6,%YMM6,%YMM6 |
(923) 0x46d946 VPCMPEQD %YMM9,%YMM9,%YMM9 |
(923) 0x46d94b VPCMPEQD %YMM5,%YMM5,%YMM5 |
(923) 0x46d94f MOV 0x68(%RSP),%R9 |
(923) 0x46d954 VMOVAPD %YMM14,%YMM18 |
(923) 0x46d95a VBROADCASTSD 0xa9a55(%RIP),%YMM8 |
(923) 0x46d963 VXORPD %XMM28,%XMM28,%XMM28 |
(923) 0x46d969 JMP 46dad9 |
0x46d96e XCHG %AX,%AX |
(925) 0x46d970 VCMPPD $0x1,%YMM13,%YMM22,%K3 |
(925) 0x46d977 VBROADCASTSD 0xa9a40(%RIP),%YMM8 |
(925) 0x46d980 VBLENDMPD %YMM8,%YMM18,%YMM31{%K3} |
(925) 0x46d986 VBROADCASTSD 0x8a9a0(%RIP),%YMM29 |
(925) 0x46d990 VANDPD %YMM29,%YMM22,%YMM1 |
(925) 0x46d996 VMAXPD %YMM1,%YMM14,%YMM1 |
(925) 0x46d99a VMULPD %YMM31,%YMM1,%YMM1 |
(925) 0x46d9a0 VCMPPD $0x1,%YMM13,%YMM1,%K3 |
(925) 0x46d9a7 VBLENDMPD %YMM8,%YMM18,%YMM25{%K3} |
(925) 0x46d9ad VANDPD %YMM29,%YMM21,%YMM13 |
(925) 0x46d9b3 VMAXPD %YMM13,%YMM14,%YMM13 |
(925) 0x46d9b8 VMULPD %YMM25,%YMM13,%YMM13 |
(925) 0x46d9be VMULPD %YMM1,%YMM1,%YMM20 |
(925) 0x46d9c4 VFMADD231PD %YMM13,%YMM13,%YMM20 |
(925) 0x46d9ca VXORPD %XMM28,%XMM28,%XMM28 |
(925) 0x46d9d0 VSQRTPD %YMM20,%YMM23 |
(925) 0x46d9d6 VMULPD %YMM2,%YMM23,%YMM2 |
(925) 0x46d9dc VDIVPD %YMM1,%YMM2,%YMM1 |
(925) 0x46d9e0 VANDPD %YMM29,%YMM1,%YMM22 |
(925) 0x46d9e6 VMULPD %YMM24,%YMM23,%YMM1 |
(925) 0x46d9ec VDIVPD %YMM13,%YMM1,%YMM1 |
(925) 0x46d9f1 VANDPD %YMM29,%YMM1,%YMM21 |
(925) 0x46d9f7 VCMPPD $0x2,%YMM21,%YMM22,%K3 |
(925) 0x46d9fe VBLENDMPD %YMM22,%YMM21,%YMM30{%K3} |
(925) 0x46da04 VMULPD %YMM30,%YMM30,%YMM29 |
(925) 0x46da0a VMULPD %YMM10,%YMM10,%YMM1 |
(925) 0x46da0f IMUL %R8,%RCX |
(925) 0x46da13 ADD %R9,%RCX |
(925) 0x46da16 VMOVUPD (%RCX,%R13,8),%YMM2{%K2}{z} |
(925) 0x46da1d VADDPD %YMM29,%YMM29,%YMM10 |
(925) 0x46da23 VMULPD %YMM2,%YMM1,%YMM1 |
(925) 0x46da27 VMULPD %YMM1,%YMM10,%YMM1 |
(925) 0x46da2b VPBROADCASTQ %R13,%YMM2 |
(925) 0x46da31 VPADDQ 0x8a707(%RIP),%YMM2,%YMM2 |
(925) 0x46da39 VPBLENDMQ %YMM5,%YMM2,%YMM5{%K1} |
(925) 0x46da3f VMOVAPD %YMM4,%YMM31{%K1} |
(925) 0x46da45 VPBLENDMQ %YMM9,%YMM2,%YMM9{%K1} |
(925) 0x46da4b VMOVAPD %YMM17,%YMM25{%K1} |
(925) 0x46da51 VPBLENDMQ %YMM6,%YMM2,%YMM6{%K1} |
(925) 0x46da57 VMOVAPD %YMM16,%YMM23{%K1} |
(925) 0x46da5d VPBLENDMQ %YMM3,%YMM2,%YMM3{%K1} |
(925) 0x46da63 VMOVAPD %YMM15,%YMM22{%K1} |
(925) 0x46da69 VPBLENDMQ %YMM11,%YMM2,%YMM11{%K1} |
(925) 0x46da6f VMOVAPD %YMM19,%YMM21{%K1} |
(925) 0x46da75 VPBLENDMQ %YMM12,%YMM2,%YMM12{%K1} |
(925) 0x46da7b VMOVAPD %YMM0,%YMM30{%K1} |
(925) 0x46da81 VMOVDQA64 %YMM7,%YMM2{%K1} |
(925) 0x46da87 VMOVAPD %YMM27,%YMM29{%K1} |
(925) 0x46da8d VMOVAPD %YMM28,%YMM1{%K1} |
(925) 0x46da93 VMOVUPD %YMM1,(%R12,%R13,8) |
(925) 0x46da99 ADD $0x4,%R13 |
(925) 0x46da9d VMOVDQA %YMM2,%YMM7 |
(925) 0x46daa1 VMOVAPD %YMM29,%YMM27 |
(925) 0x46daa7 VMOVAPD %YMM30,%YMM0 |
(925) 0x46daad VMOVAPD %YMM21,%YMM19 |
(925) 0x46dab3 VMOVAPD %YMM22,%YMM15 |
(925) 0x46dab9 VMOVAPD %YMM23,%YMM16 |
(925) 0x46dabf VMOVAPD %YMM25,%YMM17 |
(925) 0x46dac5 VMOVAPD %YMM31,%YMM4 |
(925) 0x46dacb CMP %RDI,%R13 |
(925) 0x46dace VMOVAPD %YMM14,%YMM8 |
(925) 0x46dad3 JAE 46dc70 |
(925) 0x46dad9 VMOVUPD -0x8(%R10,%R13,8),%YMM10 |
(925) 0x46dae0 VMOVUPD (%R10,%R13,8),%YMM21 |
(925) 0x46dae7 VMOVUPD -0x8(%R14,%R13,8),%YMM22 |
(925) 0x46daf2 VMOVUPD (%R14,%R13,8),%YMM23 |
(925) 0x46daf9 VADDPD %YMM21,%YMM23,%YMM2 |
(925) 0x46daff VADDPD %YMM22,%YMM10,%YMM25 |
(925) 0x46db05 VMOVUPD -0x8(%RDX,%R13,8),%YMM29 |
(925) 0x46db10 VMOVUPD (%RDX,%R13,8),%YMM30 |
(925) 0x46db17 VSUBPD %YMM25,%YMM2,%YMM25 |
(925) 0x46db1d VMOVUPD -0x8(%RSI,%R13,8),%YMM31 |
(925) 0x46db28 VMOVUPD (%RSI,%R13,8),%YMM20 |
(925) 0x46db2f VADDPD %YMM29,%YMM30,%YMM2 |
(925) 0x46db35 VADDPD %YMM20,%YMM31,%YMM1 |
(925) 0x46db3b VSUBPD %YMM1,%YMM2,%YMM1 |
(925) 0x46db3f MOV 0x158(%RSP),%RCX |
(925) 0x46db47 VMOVUPD -0x8(%RCX,%R13,8),%YMM2 |
(925) 0x46db4e VMULPD %YMM25,%YMM2,%YMM13 |
(925) 0x46db54 VFMADD231PD %YMM1,%YMM24,%YMM13 |
(925) 0x46db5a VADDPD %YMM10,%YMM21,%YMM10 |
(925) 0x46db60 VSUBPD %YMM10,%YMM23,%YMM10 |
(925) 0x46db66 VADDPD %YMM22,%YMM10,%YMM10 |
(925) 0x46db6c VBROADCASTSD 0x8b653(%RIP),%YMM14 |
(925) 0x46db75 VMULPD %YMM14,%YMM10,%YMM10 |
(925) 0x46db7a VADDPD %YMM31,%YMM29,%YMM21 |
(925) 0x46db80 VSUBPD %YMM21,%YMM30,%YMM21 |
(925) 0x46db86 VADDPD %YMM20,%YMM21,%YMM20 |
(925) 0x46db8c VMULPD %YMM14,%YMM20,%YMM20 |
(925) 0x46db92 VDIVPD %YMM2,%YMM18,%YMM23 |
(925) 0x46db98 VMULPD %YMM23,%YMM20,%YMM20 |
(925) 0x46db9e VMOVUPD (%RAX,%R13,8),%YMM21 |
(925) 0x46dba5 VFMADD231PD %YMM10,%YMM26,%YMM20 |
(925) 0x46dbab VSUBPD -0x10(%RAX,%R13,8),%YMM21,%YMM10 |
(925) 0x46dbb6 VADDPD (%RCX,%R13,8),%YMM2,%YMM21 |
(925) 0x46dbbd VDIVPD %YMM21,%YMM10,%YMM22 |
(925) 0x46dbc3 VMOVUPD (%R15,%R13,8),%YMM10 |
(925) 0x46dbc9 VSUBPD (%R11,%R13,8),%YMM10,%YMM10 |
(925) 0x46dbcf VMULPD 0x180(%RSP),%YMM10,%YMM21 |
(925) 0x46dbd7 VMULPD %YMM22,%YMM22,%YMM10 |
(925) 0x46dbdd VMULPD %YMM21,%YMM21,%YMM29 |
(925) 0x46dbe3 VMULPD %YMM14,%YMM25,%YMM25 |
(925) 0x46dbe9 VMULPD %YMM23,%YMM25,%YMM23 |
(925) 0x46dbef VMULPD %YMM10,%YMM23,%YMM23 |
(925) 0x46dbf5 VMULPD %YMM1,%YMM14,%YMM1 |
(925) 0x46dbf9 VMULPD %YMM29,%YMM1,%YMM1 |
(925) 0x46dbff VMULPD %YMM20,%YMM22,%YMM20 |
(925) 0x46dc05 VFMADD213PD %YMM23,%YMM21,%YMM20 |
(925) 0x46dc0b VFMADD231PD %YMM1,%YMM26,%YMM20 |
(925) 0x46dc11 VADDPD %YMM10,%YMM29,%YMM1 |
(925) 0x46dc17 VMAXPD %YMM8,%YMM1,%YMM1 |
(925) 0x46dc1c VDIVPD %YMM1,%YMM20,%YMM10 |
(925) 0x46dc22 VCMPPD $0x1,%YMM10,%YMM28,%K1 |
(925) 0x46dc29 VCMPPD $0x2,%YMM13,%YMM28,%K0 |
(925) 0x46dc30 VCMPPD $0x6,%YMM13,%YMM28,%K1{%K1} |
(925) 0x46dc37 KORW %K1,%K0,%K1 |
(925) 0x46dc3b KNOTW %K1,%K2 |
(925) 0x46dc3f KMOVD %K2,%EBX |
(925) 0x46dc43 TEST $0xf,%BL |
(925) 0x46dc46 VMOVAPD %YMM8,%YMM14 |
(925) 0x46dc4b VXORPD %XMM13,%XMM13,%XMM13 |
(925) 0x46dc50 JE 46d970 |
(925) 0x46dc56 MOV 0x78(%RBP),%RCX |
(925) 0x46dc5a MOV (%RCX),%RCX |
(925) 0x46dc5d JMP 46d970 |
0x46dc62 NOPW %CS:(%RAX,%RAX,1) |
(923) 0x46dc70 VMOVAPD %YMM18,%YMM14 |
(923) 0x46dc76 VPCMPEQD %YMM4,%YMM4,%YMM4 |
(923) 0x46dc7a VPTEST %YMM4,%YMM5 |
(923) 0x46dc7f VMOVAPD 0x1f0(%RSP),%XMM8 |
(923) 0x46dc88 JB 46dcc8 |
(923) 0x46dc8a VEXTRACTI128 $0x1,%YMM5,%XMM0 |
(923) 0x46dc90 VPMAXSQ %XMM0,%XMM5,%XMM0 |
(923) 0x46dc96 VPSHUFD $-0x12,%XMM0,%XMM1 |
(923) 0x46dc9b VPMAXSQ %XMM1,%XMM0,%XMM0 |
(923) 0x46dca1 VPBROADCASTQ %XMM0,%YMM0 |
(923) 0x46dca6 VPCMPEQQ %YMM0,%YMM5,%K0 |
(923) 0x46dcac KMOVD %K0,%EAX |
(923) 0x46dcb0 TZCNT %EAX,%EAX |
(923) 0x46dcb4 VMOVAPD %YMM31,0x2c0(%RSP) |
(923) 0x46dcbc AND $0x3,%EAX |
(923) 0x46dcbf VMOVSD 0x2c0(%RSP,%RAX,8),%XMM8 |
(923) 0x46dcc8 VPTEST %YMM4,%YMM9 |
(923) 0x46dccd VXORPD %XMM18,%XMM18,%XMM18 |
(923) 0x46dcd3 VMOVAPD 0x1e0(%RSP),%XMM26 |
(923) 0x46dcdb VMOVAPD 0x1d0(%RSP),%XMM27 |
(923) 0x46dce3 VMOVAPD 0x1c0(%RSP),%XMM28 |
(923) 0x46dceb MOV 0x128(%RSP),%R13 |
(923) 0x46dcf3 MOV 0x120(%RSP),%R15 |
(923) 0x46dcfb MOV 0x110(%RSP),%R11 |
(923) 0x46dd03 MOV 0x108(%RSP),%RSI |
(923) 0x46dd0b MOV 0xf8(%RSP),%R9 |
(923) 0x46dd13 MOV 0xf0(%RSP),%RBX |
(923) 0x46dd1b JB 46dd5a |
(923) 0x46dd1d VEXTRACTI128 $0x1,%YMM9,%XMM0 |
(923) 0x46dd23 VPMAXSQ %XMM0,%XMM9,%XMM0 |
(923) 0x46dd29 VPSHUFD $-0x12,%XMM0,%XMM1 |
(923) 0x46dd2e VPMAXSQ %XMM1,%XMM0,%XMM0 |
(923) 0x46dd34 VPBROADCASTQ %XMM0,%YMM0 |
(923) 0x46dd39 VPCMPEQQ %YMM0,%YMM9,%K0 |
(923) 0x46dd3f KMOVD %K0,%EAX |
(923) 0x46dd43 TZCNT %EAX,%EAX |
(923) 0x46dd47 VMOVAPD %YMM25,0x2a0(%RSP) |
(923) 0x46dd4f AND $0x3,%EAX |
(923) 0x46dd52 VMOVSD 0x2a0(%RSP,%RAX,8),%XMM26 |
(923) 0x46dd5a VPTEST %YMM4,%YMM6 |
(923) 0x46dd5f VMOVAPD 0x1b0(%RSP),%XMM31 |
(923) 0x46dd67 JB 46dda6 |
(923) 0x46dd69 VEXTRACTI128 $0x1,%YMM6,%XMM0 |
(923) 0x46dd6f VPMAXSQ %XMM0,%XMM6,%XMM0 |
(923) 0x46dd75 VPSHUFD $-0x12,%XMM0,%XMM1 |
(923) 0x46dd7a VPMAXSQ %XMM1,%XMM0,%XMM0 |
(923) 0x46dd80 VPBROADCASTQ %XMM0,%YMM0 |
(923) 0x46dd85 VPCMPEQQ %YMM0,%YMM6,%K0 |
(923) 0x46dd8b KMOVD %K0,%EAX |
(923) 0x46dd8f TZCNT %EAX,%EAX |
(923) 0x46dd93 VMOVAPD %YMM23,0x280(%RSP) |
(923) 0x46dd9b AND $0x3,%EAX |
(923) 0x46dd9e VMOVSD 0x280(%RSP,%RAX,8),%XMM27 |
(923) 0x46dda6 VPTEST %YMM4,%YMM3 |
(923) 0x46ddab VMOVSD 0xa960b(%RIP),%XMM25 |
(923) 0x46ddb5 VMOVAPD 0x170(%RSP),%XMM20 |
(923) 0x46ddbd JB 46ddfc |
(923) 0x46ddbf VEXTRACTI128 $0x1,%YMM3,%XMM0 |
(923) 0x46ddc5 VPMAXSQ %XMM0,%XMM3,%XMM0 |
(923) 0x46ddcb VPSHUFD $-0x12,%XMM0,%XMM1 |
(923) 0x46ddd0 VPMAXSQ %XMM1,%XMM0,%XMM0 |
(923) 0x46ddd6 VPBROADCASTQ %XMM0,%YMM0 |
(923) 0x46dddb VPCMPEQQ %YMM0,%YMM3,%K0 |
(923) 0x46dde1 KMOVD %K0,%EAX |
(923) 0x46dde5 TZCNT %EAX,%EAX |
(923) 0x46dde9 VMOVAPD %YMM22,0x260(%RSP) |
(923) 0x46ddf1 AND $0x3,%EAX |
(923) 0x46ddf4 VMOVSD 0x260(%RSP,%RAX,8),%XMM28 |
(923) 0x46ddfc VPTEST %YMM4,%YMM11 |
(923) 0x46de01 VMOVSD 0xa95ad(%RIP),%XMM23 |
(923) 0x46de0b JB 46de4a |
(923) 0x46de0d VEXTRACTI128 $0x1,%YMM11,%XMM0 |
(923) 0x46de13 VPMAXSQ %XMM0,%XMM11,%XMM0 |
(923) 0x46de19 VPSHUFD $-0x12,%XMM0,%XMM1 |
(923) 0x46de1e VPMAXSQ %XMM1,%XMM0,%XMM0 |
(923) 0x46de24 VPBROADCASTQ %XMM0,%YMM0 |
(923) 0x46de29 VPCMPEQQ %YMM0,%YMM11,%K0 |
(923) 0x46de2f KMOVD %K0,%EAX |
(923) 0x46de33 TZCNT %EAX,%EAX |
(923) 0x46de37 VMOVAPD %YMM21,0x240(%RSP) |
(923) 0x46de3f AND $0x3,%EAX |
(923) 0x46de42 VMOVSD 0x240(%RSP,%RAX,8),%XMM31 |
(923) 0x46de4a VPTEST %YMM4,%YMM12 |
(923) 0x46de4f VMOVSD 0x8b36f(%RIP),%XMM22 |
(923) 0x46de59 JB 46dea2 |
(923) 0x46de5b VEXTRACTI128 $0x1,%YMM12,%XMM0 |
(923) 0x46de61 VPMAXSQ %XMM0,%XMM12,%XMM0 |
(923) 0x46de67 VPSHUFD $-0x12,%XMM0,%XMM1 |
(923) 0x46de6c VPMAXSQ %XMM1,%XMM0,%XMM0 |
(923) 0x46de72 VPBROADCASTQ %XMM0,%YMM0 |
(923) 0x46de77 VPCMPEQQ %YMM0,%YMM12,%K0 |
(923) 0x46de7d KMOVD %K0,%EAX |
(923) 0x46de81 TZCNT %EAX,%EAX |
(923) 0x46de85 VMOVAPD %YMM30,0x220(%RSP) |
(923) 0x46de8d AND $0x3,%EAX |
(923) 0x46de90 VMOVSD 0x220(%RSP,%RAX,8),%XMM0 |
(923) 0x46de99 VMOVAPD %XMM0,0x160(%RSP) |
(923) 0x46dea2 VPTEST %YMM4,%YMM2 |
(923) 0x46dea7 VMOVSD 0x8a5ff(%RIP),%XMM21 |
(923) 0x46deb1 VMOVAPD 0x1a0(%RSP),%XMM30 |
(923) 0x46deb9 JB 46def8 |
(923) 0x46debb VEXTRACTI128 $0x1,%YMM2,%XMM0 |
(923) 0x46dec1 VPMAXSQ %XMM0,%XMM2,%XMM0 |
(923) 0x46dec7 VPSHUFD $-0x12,%XMM0,%XMM1 |
(923) 0x46decc VPMAXSQ %XMM1,%XMM0,%XMM0 |
(923) 0x46ded2 VPBROADCASTQ %XMM0,%YMM0 |
(923) 0x46ded7 VPCMPEQQ %YMM0,%YMM2,%K0 |
(923) 0x46dedd KMOVD %K0,%EAX |
(923) 0x46dee1 TZCNT %EAX,%EAX |
(923) 0x46dee5 VMOVAPD %YMM29,0x200(%RSP) |
(923) 0x46deed AND $0x3,%EAX |
(923) 0x46def0 VMOVSD 0x200(%RSP,%RAX,8),%XMM30 |
(923) 0x46def8 MOV %RDI,%RDX |
(923) 0x46defb CMP 0x38(%RSP),%RDI |
(923) 0x46df00 VMOVAPD 0x160(%RSP),%XMM29 |
(923) 0x46df08 VMOVSD 0x118(%RSP),%XMM1 |
(923) 0x46df11 MOV 0x100(%RSP),%RDI |
(923) 0x46df19 JE 46d700 |
(923) 0x46df1f JMP 46df5b |
0x46df21 NOPW %CS:(%RAX,%RAX,1) |
(923) 0x46df30 MOV %RBX,%R8 |
(923) 0x46df33 MOV %R14,%RBX |
(923) 0x46df36 IMUL %R10,%RBX |
(923) 0x46df3a LEA 0x1(%R10),%RSI |
(923) 0x46df3e MOV %R14,%R9 |
(923) 0x46df41 IMUL %RSI,%R9 |
(923) 0x46df45 MOV %R15,%RDI |
(923) 0x46df48 IMUL %R10,%RDI |
(923) 0x46df4c IMUL %R15,%RSI |
(923) 0x46df50 IMUL %R11,%R10 |
(923) 0x46df54 MOV %R10,0x40(%RSP) |
(923) 0x46df59 XOR %EDX,%EDX |
(923) 0x46df5b MOV 0x28(%RSP),%RAX |
(923) 0x46df60 ADD %RAX,%RBX |
(923) 0x46df63 MOV 0xb0(%RSP),%RCX |
(923) 0x46df6b LEA (%RCX,%RDX,1),%R10 |
(923) 0x46df6f MOV %R10,%R14 |
(923) 0x46df72 SUB 0xb8(%RSP),%R14 |
(923) 0x46df7a VMOVSD (%RBX,%R14,8),%XMM3 |
(923) 0x46df80 ADD %RAX,%R9 |
(923) 0x46df83 VMOVSD (%R9,%R14,8),%XMM11 |
(923) 0x46df89 MOV 0x30(%RSP),%RAX |
(923) 0x46df8e ADD %RAX,%RDI |
(923) 0x46df91 VMOVSD (%RDI,%R14,8),%XMM12 |
(923) 0x46df97 MOV 0xa8(%RSP),%RCX |
(923) 0x46df9f ADD %R10,%RCX |
(923) 0x46dfa2 ADD %RAX,%RSI |
(923) 0x46dfa5 VMOVSD (%RSI,%R14,8),%XMM24 |
(923) 0x46dfac IMUL %R11,%R13 |
(923) 0x46dfb0 MOV %R11,%R9 |
(923) 0x46dfb3 MOV %R8,%R12 |
(923) 0x46dfb6 IMUL %R8,%R11 |
(923) 0x46dfba LEA (%R11,%R10,8),%RAX |
(923) 0x46dfbe MOV 0x18(%RBP),%RSI |
(923) 0x46dfc2 MOV 0x40(%RSP),%R8 |
(923) 0x46dfc7 ADD %RSI,%R8 |
(923) 0x46dfca VMOVSD (%R8,%RCX,8),%XMM4 |
(923) 0x46dfd0 MOV 0x138(%RSP),%RSI |
(923) 0x46dfd8 MOV %RSI,%RCX |
(923) 0x46dfdb IMUL %R12,%RCX |
(923) 0x46dfdf LEA (%RCX,%R10,8),%R11 |
(923) 0x46dfe3 MOV 0x148(%RSP),%RCX |
(923) 0x46dfeb IMUL %RCX,%RSI |
(923) 0x46dfef LEA (%RSI,%R10,8),%RSI |
(923) 0x46dff3 IMUL %RCX,%R9 |
(923) 0x46dff7 IMUL %R15,%RCX |
(923) 0x46dffb LEA (%RCX,%R10,8),%RBX |
(923) 0x46dfff IMUL %R12,%R15 |
(923) 0x46e003 LEA (%R15,%R10,8),%RCX |
(923) 0x46e007 MOV 0x90(%RSP),%RDI |
(923) 0x46e00f LEA (%RDI,%R10,8),%R15 |
(923) 0x46e013 VMOVQ (%R8,%R14,8),%XMM9 |
(923) 0x46e019 MOV 0x30(%RBP),%RDI |
(923) 0x46e01d VMOVSD (%RDI,%R14,8),%XMM0 |
(923) 0x46e023 VDIVSD %XMM20,%XMM21,%XMM6 |
(923) 0x46e029 VDIVSD %XMM1,%XMM21,%XMM2 |
(923) 0x46e02f MOV 0x38(%RSP),%R8 |
(923) 0x46e034 SUB %RDX,%R8 |
(923) 0x46e037 MOV %R12,0x180(%RSP) |
(923) 0x46e03f MOV 0x140(%RSP),%RDI |
(923) 0x46e047 IMUL %R12,%RDI |
(923) 0x46e04b ADD 0x98(%RSP),%RDX |
(923) 0x46e053 LEA (%RDI,%RDX,8),%R12 |
(923) 0x46e057 ADD 0x10(%RBP),%R12 |
(923) 0x46e05b MOV 0x20(%RBP),%RDI |
(923) 0x46e05f LEA (%RDI,%RDX,8),%R14 |
(923) 0x46e063 LEA (%R13,%RDX,8),%R13 |
(923) 0x46e068 MOV 0x18(%RBP),%RDI |
(923) 0x46e06c ADD %RDI,%R13 |
(923) 0x46e06f LEA (%R9,%RDX,8),%RDX |
(923) 0x46e073 ADD %RDI,%RDX |
(923) 0x46e076 ADD 0x88(%RSP),%RAX |
(923) 0x46e07e MOV 0x80(%RSP),%RDI |
(923) 0x46e086 ADD %RDI,%R11 |
(923) 0x46e089 ADD %RDI,%RSI |
(923) 0x46e08c MOV 0xa0(%RSP),%RDI |
(923) 0x46e094 ADD %RDI,%RBX |
(923) 0x46e097 ADD %RDI,%RCX |
(923) 0x46e09a XOR %R10D,%R10D |
(923) 0x46e09d JMP 46e0bf |
0x46e09f NOP |
(924) 0x46e0a0 VMOVSD %XMM17,(%R12,%R10,8) |
(924) 0x46e0a7 INC %R10 |
(924) 0x46e0aa VMOVDQA %XMM9,%XMM4 |
(924) 0x46e0ae VMOVAPD %XMM5,%XMM9 |
(924) 0x46e0b2 VMOVAPD %XMM7,%XMM0 |
(924) 0x46e0b6 CMP %R10,%R8 |
(924) 0x46e0b9 JE 46d700 |
(924) 0x46e0bf VMOVAPD %XMM24,%XMM1 |
(924) 0x46e0c5 VMOVAPD %XMM12,%XMM5 |
(924) 0x46e0c9 VMOVSD (%RCX,%R10,8),%XMM12 |
(924) 0x46e0cf VMOVSD (%RBX,%R10,8),%XMM24 |
(924) 0x46e0d6 VMOVAPD %XMM11,%XMM7 |
(924) 0x46e0da VMOVAPD %XMM3,%XMM10 |
(924) 0x46e0de VADDSD %XMM12,%XMM24,%XMM3 |
(924) 0x46e0e4 VADDSD %XMM1,%XMM5,%XMM11 |
(924) 0x46e0e8 VSUBSD %XMM11,%XMM3,%XMM13 |
(924) 0x46e0ed VMOVSD (%RSI,%R10,8),%XMM11 |
(924) 0x46e0f3 VMOVSD (%R11,%R10,8),%XMM3 |
(924) 0x46e0f9 VADDSD %XMM7,%XMM11,%XMM15 |
(924) 0x46e0fd VADDSD %XMM3,%XMM10,%XMM16 |
(924) 0x46e103 VSUBSD %XMM16,%XMM15,%XMM17 |
(924) 0x46e109 VMULSD %XMM13,%XMM0,%XMM19 |
(924) 0x46e10f VFMADD231SD %XMM17,%XMM20,%XMM19 |
(924) 0x46e115 VADDSD %XMM5,%XMM12,%XMM5 |
(924) 0x46e119 VSUBSD %XMM5,%XMM24,%XMM5 |
(924) 0x46e11f VADDSD %XMM1,%XMM5,%XMM1 |
(924) 0x46e123 VMULSD %XMM22,%XMM1,%XMM1 |
(924) 0x46e129 VADDSD %XMM7,%XMM10,%XMM5 |
(924) 0x46e12d VSUBSD %XMM5,%XMM11,%XMM5 |
(924) 0x46e131 VADDSD %XMM3,%XMM5,%XMM5 |
(924) 0x46e135 VMULSD %XMM22,%XMM5,%XMM5 |
(924) 0x46e13b VDIVSD %XMM0,%XMM21,%XMM10 |
(924) 0x46e141 VMULSD %XMM10,%XMM5,%XMM20 |
(924) 0x46e147 VFMADD231SD %XMM1,%XMM6,%XMM20 |
(924) 0x46e14d VMOVSD (%RAX,%R10,8),%XMM5 |
(924) 0x46e153 VSUBSD %XMM4,%XMM5,%XMM1 |
(924) 0x46e157 VMOVSD (%R15,%R10,8),%XMM7 |
(924) 0x46e15d VADDSD %XMM0,%XMM7,%XMM4 |
(924) 0x46e161 VDIVSD %XMM4,%XMM1,%XMM16 |
(924) 0x46e167 VMOVSD (%RDX,%R10,8),%XMM1 |
(924) 0x46e16d VSUBSD (%R13,%R10,8),%XMM1,%XMM1 |
(924) 0x46e174 VMULSD %XMM2,%XMM1,%XMM15 |
(924) 0x46e178 VMULSD %XMM16,%XMM16,%XMM1 |
(924) 0x46e17e VMULSD %XMM15,%XMM15,%XMM4 |
(924) 0x46e183 VMULSD %XMM22,%XMM13,%XMM13 |
(924) 0x46e189 VMULSD %XMM10,%XMM13,%XMM10 |
(924) 0x46e18e VMULSD %XMM1,%XMM10,%XMM10 |
(924) 0x46e192 VMULSD %XMM22,%XMM17,%XMM13 |
(924) 0x46e198 VMULSD %XMM4,%XMM13,%XMM13 |
(924) 0x46e19c VMULSD %XMM20,%XMM16,%XMM17 |
(924) 0x46e1a2 VMOVAPD 0x170(%RSP),%XMM20 |
(924) 0x46e1aa VFMADD213SD %XMM10,%XMM15,%XMM17 |
(924) 0x46e1b0 VFMADD231SD %XMM13,%XMM6,%XMM17 |
(924) 0x46e1b6 VADDSD %XMM1,%XMM4,%XMM1 |
(924) 0x46e1ba VMAXSD %XMM23,%XMM1,%XMM1 |
(924) 0x46e1c0 VDIVSD %XMM1,%XMM17,%XMM4 |
(924) 0x46e1c6 VXORPD %XMM17,%XMM17,%XMM17 |
(924) 0x46e1cc XOR %EDI,%EDI |
(924) 0x46e1ce VUCOMISD %XMM17,%XMM4 |
(924) 0x46e1d4 SETBE %DIL |
(924) 0x46e1d8 XOR %R9D,%R9D |
(924) 0x46e1db VUCOMISD %XMM17,%XMM19 |
(924) 0x46e1e1 SETB %R9B |
(924) 0x46e1e5 CMP %R9B,%DIL |
(924) 0x46e1e8 CMOVB %EDI,%R9D |
(924) 0x46e1ec CMP $0x1,%R9B |
(924) 0x46e1f0 JNE 46e0a0 |
(924) 0x46e1f6 VCMPSD $0x1,%XMM18,%XMM16,%K1 |
(924) 0x46e1fd VMOVAPD %XMM21,%XMM8 |
(924) 0x46e203 VMOVSD %XMM25,%XMM8,%XMM8{%K1} |
(924) 0x46e209 VMOVDDUP 0x8a11f(%RIP),%XMM1 |
(924) 0x46e211 VANDPD %XMM1,%XMM16,%XMM10 |
(924) 0x46e217 VMAXSD %XMM10,%XMM23,%XMM10 |
(924) 0x46e21d VMULSD %XMM8,%XMM10,%XMM10 |
(924) 0x46e222 VCMPSD $0x1,%XMM18,%XMM10,%K1 |
(924) 0x46e229 VMOVAPD %XMM21,%XMM26 |
(924) 0x46e22f VMOVSD %XMM25,%XMM26,%XMM26{%K1} |
(924) 0x46e235 VANDPD %XMM1,%XMM15,%XMM13 |
(924) 0x46e239 VMAXSD %XMM13,%XMM23,%XMM13 |
(924) 0x46e23f VMULSD %XMM26,%XMM13,%XMM13 |
(924) 0x46e245 VMULSD %XMM10,%XMM10,%XMM15 |
(924) 0x46e24a VFMADD231SD %XMM13,%XMM13,%XMM15 |
(924) 0x46e24f VSQRTSD %XMM15,%XMM15,%XMM27 |
(924) 0x46e255 VMULSD %XMM0,%XMM27,%XMM0 |
(924) 0x46e25b VDIVSD %XMM10,%XMM0,%XMM0 |
(924) 0x46e260 VANDPD %XMM1,%XMM0,%XMM28 |
(924) 0x46e266 VMULSD %XMM20,%XMM27,%XMM0 |
(924) 0x46e26c VDIVSD %XMM13,%XMM0,%XMM0 |
(924) 0x46e271 VANDPD %XMM1,%XMM0,%XMM31 |
(924) 0x46e277 VCMPSD $0x2,%XMM31,%XMM28,%K1 |
(924) 0x46e27e VMOVAPD %XMM31,%XMM29 |
(924) 0x46e284 VMOVSD %XMM28,%XMM29,%XMM29{%K1} |
(924) 0x46e28a VMULSD %XMM29,%XMM29,%XMM30 |
(924) 0x46e290 VMULSD %XMM4,%XMM4,%XMM0 |
(924) 0x46e294 VADDSD %XMM30,%XMM30,%XMM1 |
(924) 0x46e29a VMULSD %XMM1,%XMM0,%XMM0 |
(924) 0x46e29e MOV 0x78(%RBP),%RDI |
(924) 0x46e2a2 MOV (%RDI),%RDI |
(924) 0x46e2a5 IMUL 0x180(%RSP),%RDI |
(924) 0x46e2ae ADD %R14,%RDI |
(924) 0x46e2b1 VMULSD (%RDI,%R10,8),%XMM0,%XMM17 |
(924) 0x46e2b8 JMP 46e0a0 |
0x46e2bd NOPL (%RAX) |
Path / |
Source file and lines | viscosity_kernel.f90:50-94 |
Module | exec |
nb instructions | 168 |
nb uops | 169 |
loop length | 755 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 5 |
used ymm registers | 1 |
used zmm registers | 0 |
nb stack references | 43 |
micro-operation queue | 28.17 cycles |
front end | 28.17 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 19.00 | 19.00 | 19.00 | 19.00 | 4.00 | 20.67 | 20.67 | 20.67 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
cycles | 19.00 | 19.00 | 19.00 | 19.00 | 4.00 | 20.67 | 20.67 | 20.67 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 28.17 |
Dispatch | 20.67 |
Overall L1 | 28.17 |
all | 1% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 5% |
all | 16% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 50% |
all | 3% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 10% |
all | 11% |
load | 6% |
store | 11% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 14% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 18% |
all | 11% |
load | 11% |
store | 11% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 13% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
AND $-0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB $0x300,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R9,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R8,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x40(%RBP),%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x38(%RBP),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %EBX,%EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVL $0,0x24(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
JS 46d4df <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0xaf> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVL $0,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %EAX,0xc(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVL $0x1,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x28(%RSP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x2c(%RSP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x18(%RSP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x14(%RSP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x542630,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %ESI,0x1c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CALL 404670 <__kmpc_for_static_init_4@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV 0x10(%RSP),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0xc(%RSP),%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %EAX,%ECX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %ECX,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
JAE 46d4fa <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0xca> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV $0x542650,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV 0x14(%RSP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 404230 <__kmpc_for_static_fini@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x48(%RSP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV $0x542670,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CALL 404740 <__kmpc_barrier@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x28(%RBP),%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x50(%RBP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x48(%RBP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SAL $0x20,%R12 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV $-0x200000000,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
LEA (%R12,%RAX,1),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RCX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAR $0x20,%R8 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SAL $0x20,%R13 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD %R13,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAR $0x20,%R9 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSXD (%RDX),%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV (%RSI),%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %R10D,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD %EBX,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDX,0x130(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
INC %EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP $0x2,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x1,%ESI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVGE %EDX,%ESI | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSI,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
AND $0x7ffffffc,%ESI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RSI,0xd8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
TEST %RCX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $-0x1,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVNS %RCX,%RSI | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %RSI,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x1,%R11D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVG %R11,%RSI | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV $0x200000000,%RBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV %RBX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SUB %R12,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP %RDX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVG %RCX,%RDX | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LEA (,%R10,8),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SHR $0x20,%RDX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IMUL %RSI,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV $-0x1,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SAL $0x3,%RDX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB %RDX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
TEST %RAX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVNS %RAX,%RSI | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %RSI,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVG %R11,%RSI | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB %R13,%RBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV 0x30(%RBP),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %RBX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVG %RAX,%RBX | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R8,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOT %RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SHR $0x20,%RBX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IMUL %RSI,%RBX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
NEG %RBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RBX,0xc8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV $0x8,%ESI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB %RDX,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R9,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOT %RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R9,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB %R9,%R11 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R11,0xd0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x18(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RBP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
LEA 0x8(%R9,%RCX,1),%R11 | 2 | 0 | 0 | 0.50 | 0.50 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 |
MOV %R11,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
ADD %RCX,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDX,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
LEA (%RAX,%RCX,1),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
LEA (%R9,%RCX,1),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
LEA 0x8(%R14,%RCX,1),%RAX | 2 | 0 | 0 | 0.50 | 0.50 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 |
MOV %RAX,0x158(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x28(%RSP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
LEA 0x8(%RDX,%RCX,1),%RAX | 2 | 0 | 0 | 0.50 | 0.50 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 |
MOV %RAX,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x30(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
LEA 0x8(%RAX,%RCX,1),%RCX | 2 | 0 | 0 | 0.50 | 0.50 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 |
MOV %RCX,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R10,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R8,0xb8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB %R8,%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R10,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
LEA (%R14,%RSI,1),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RCX,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
LEA (%R9,%RSI,1),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RCX,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
LEA (%RDX,%RSI,1),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RCX,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
ADD %RAX,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RSI,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD 0x8aded(%RIP),%XMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVSD 0x8bafb(%RIP),%XMM22 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVSD 0xa9ce1(%RIP),%XMM23 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVSD 0xa9cdf(%RIP),%XMM25 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VBROADCASTSD 0x8adc6(%RIP),%YMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VXORPD %XMM18,%XMM18,%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RDI,0xe8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %EDI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 46d71e <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0x2ee> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
Source file and lines | viscosity_kernel.f90:50-94 |
Module | exec |
nb instructions | 168 |
nb uops | 169 |
loop length | 755 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 5 |
used ymm registers | 1 |
used zmm registers | 0 |
nb stack references | 43 |
micro-operation queue | 28.17 cycles |
front end | 28.17 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 19.00 | 19.00 | 19.00 | 19.00 | 4.00 | 20.67 | 20.67 | 20.67 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
cycles | 19.00 | 19.00 | 19.00 | 19.00 | 4.00 | 20.67 | 20.67 | 20.67 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 28.17 |
Dispatch | 20.67 |
Overall L1 | 28.17 |
all | 1% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 5% |
all | 16% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 50% |
all | 3% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 10% |
all | 11% |
load | 6% |
store | 11% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 14% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 18% |
all | 11% |
load | 11% |
store | 11% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 13% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
AND $-0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB $0x300,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R9,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R8,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x40(%RBP),%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x38(%RBP),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %EBX,%EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVL $0,0x24(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
JS 46d4df <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0xaf> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVL $0,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %EAX,0xc(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVL $0x1,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x28(%RSP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x2c(%RSP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x18(%RSP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x14(%RSP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x542630,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %ESI,0x1c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CALL 404670 <__kmpc_for_static_init_4@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV 0x10(%RSP),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0xc(%RSP),%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %EAX,%ECX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %ECX,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
JAE 46d4fa <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0xca> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV $0x542650,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV 0x14(%RSP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 404230 <__kmpc_for_static_fini@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x48(%RSP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV $0x542670,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CALL 404740 <__kmpc_barrier@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x28(%RBP),%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x50(%RBP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x48(%RBP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SAL $0x20,%R12 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV $-0x200000000,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
LEA (%R12,%RAX,1),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RCX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAR $0x20,%R8 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SAL $0x20,%R13 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD %R13,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAR $0x20,%R9 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSXD (%RDX),%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV (%RSI),%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %R10D,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD %EBX,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDX,0x130(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
INC %EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP $0x2,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x1,%ESI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVGE %EDX,%ESI | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSI,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
AND $0x7ffffffc,%ESI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RSI,0xd8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
TEST %RCX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $-0x1,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVNS %RCX,%RSI | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %RSI,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x1,%R11D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVG %R11,%RSI | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV $0x200000000,%RBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV %RBX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SUB %R12,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP %RDX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVG %RCX,%RDX | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LEA (,%R10,8),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SHR $0x20,%RDX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IMUL %RSI,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV $-0x1,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SAL $0x3,%RDX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB %RDX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
TEST %RAX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVNS %RAX,%RSI | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %RSI,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVG %R11,%RSI | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB %R13,%RBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV 0x30(%RBP),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %RBX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVG %RAX,%RBX | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R8,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOT %RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SHR $0x20,%RBX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IMUL %RSI,%RBX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
NEG %RBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RBX,0xc8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV $0x8,%ESI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB %RDX,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R9,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOT %RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R9,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB %R9,%R11 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R11,0xd0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x18(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RBP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
LEA 0x8(%R9,%RCX,1),%R11 | 2 | 0 | 0 | 0.50 | 0.50 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 |
MOV %R11,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
ADD %RCX,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDX,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
LEA (%RAX,%RCX,1),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
LEA (%R9,%RCX,1),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
LEA 0x8(%R14,%RCX,1),%RAX | 2 | 0 | 0 | 0.50 | 0.50 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 |
MOV %RAX,0x158(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x28(%RSP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
LEA 0x8(%RDX,%RCX,1),%RAX | 2 | 0 | 0 | 0.50 | 0.50 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 |
MOV %RAX,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x30(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
LEA 0x8(%RAX,%RCX,1),%RCX | 2 | 0 | 0 | 0.50 | 0.50 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 |
MOV %RCX,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R10,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R8,0xb8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB %R8,%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R10,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
LEA (%R14,%RSI,1),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RCX,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
LEA (%R9,%RSI,1),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RCX,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
LEA (%RDX,%RSI,1),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RCX,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
ADD %RAX,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RSI,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD 0x8aded(%RIP),%XMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVSD 0x8bafb(%RIP),%XMM22 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVSD 0xa9ce1(%RIP),%XMM23 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVSD 0xa9cdf(%RIP),%XMM25 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VBROADCASTSD 0x8adc6(%RIP),%YMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VXORPD %XMM18,%XMM18,%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RDI,0xe8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %EDI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 46d71e <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0x2ee> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼viscosity_kernel_.DIR.OMP.PARALLEL.2– | 2.89 | 1.5 |
▼Loop 923 - viscosity_kernel.f90:53-89 - exec– | 0 | 0 |
○Loop 925 - viscosity_kernel.f90:53-89 - exec | 2.89 | 1.49 |
○Loop 924 - viscosity_kernel.f90:55-89 - exec | 0 | 0 |