Function: hypre_ParTMatmul.extracted | Module: libparcsr_mv.so | Source: par_csr_matop.c:3454-3640 [...] | Coverage: 0.08% |
---|
Function: hypre_ParTMatmul.extracted | Module: libparcsr_mv.so | Source: par_csr_matop.c:3454-3640 [...] | Coverage: 0.08% |
---|
/scratch_na/users/xoserete/qaas_runs/171-587-0005/intel/AMG/build/AMG/AMG/parcsr_mv/par_csr_matop.c: 3454 - 3640 |
-------------------------------------------------------------------------------- |
3454: #pragma omp parallel |
[...] |
3462: HYPRE_Int num_threads = hypre_NumActiveThreads(); |
3463: |
3464: size = num_cols_diag_A/num_threads; |
3465: rest = num_cols_diag_A - size*num_threads; |
3466: ii = hypre_GetThreadNum(); |
3467: if (ii < rest) |
3468: { |
3469: ns = ii*size+ii; |
3470: ne = (ii+1)*size+ii+1; |
3471: } |
3472: else |
3473: { |
3474: ns = ii*size+rest; |
3475: ne = (ii+1)*size+rest; |
3476: } |
3477: |
3478: B_marker = hypre_CTAlloc(HYPRE_Int, num_cols_diag_B); |
3479: B_marker_offd = hypre_CTAlloc(HYPRE_Int, num_cols_offd_C); |
3480: |
3481: for (ik = 0; ik < num_cols_diag_B; ik++) |
3482: B_marker[ik] = -1; |
3483: |
3484: for (ik = 0; ik < num_cols_offd_C; ik++) |
3485: B_marker_offd[ik] = -1; |
3486: |
3487: nnz_d = 0; |
3488: nnz_o = 0; |
3489: for (ik = ns; ik < ne; ik++) |
3490: { |
3491: for (jk = C_tmp_diag_i[ik]; jk < C_tmp_diag_i[ik+1]; jk++) |
3492: { |
3493: jcol = C_tmp_diag_j[jk]; |
3494: B_marker[jcol] = ik; |
3495: nnz_d++; |
3496: } |
3497: for (jk = C_tmp_offd_i[ik]; jk < C_tmp_offd_i[ik+1]; jk++) |
3498: { |
3499: jcol = C_tmp_offd_j[jk]; |
3500: B_marker_offd[jcol] = ik; |
3501: nnz_o++; |
3502: } |
3503: for (jk = 0; jk < num_sends_A; jk++) |
3504: for (j1 = send_map_starts_A[jk]; j1 < send_map_starts_A[jk+1]; j1++) |
3505: if (send_map_elmts_A[j1] == ik) |
3506: { |
3507: for (j2 = C_ext_diag_i[j1]; j2 < C_ext_diag_i[j1+1]; j2++) |
3508: { |
3509: jcol = C_ext_diag_j[j2]; |
3510: if (B_marker[jcol] < ik) |
3511: { |
3512: B_marker[jcol] = ik; |
3513: nnz_d++; |
3514: } |
3515: } |
3516: for (j2 = C_ext_offd_i[j1]; j2 < C_ext_offd_i[j1+1]; j2++) |
3517: { |
3518: jcol = C_ext_offd_j[j2]; |
3519: if (B_marker_offd[jcol] < ik) |
3520: { |
3521: B_marker_offd[jcol] = ik; |
3522: nnz_o++; |
3523: } |
3524: } |
3525: break; |
3526: } |
3527: C_diag_array[ii] = nnz_d; |
3528: C_offd_array[ii] = nnz_o; |
3529: } |
3530: #ifdef HYPRE_USING_OPENMP |
3531: #pragma omp barrier |
3532: #endif |
3533: if (ii == 0) |
3534: { |
3535: nnz_d = 0; |
3536: nnz_o = 0; |
3537: for (ik = 0; ik < num_threads-1; ik++) |
3538: { |
3539: C_diag_array[ik+1] += C_diag_array[ik]; |
3540: C_offd_array[ik+1] += C_offd_array[ik]; |
3541: } |
3542: nnz_d = C_diag_array[num_threads-1]; |
3543: nnz_o = C_offd_array[num_threads-1]; |
3544: C_diag_i[num_cols_diag_A] = nnz_d; |
3545: C_offd_i[num_cols_diag_A] = nnz_o; |
3546: |
3547: C_diag = hypre_CSRMatrixCreate(num_cols_diag_A, num_cols_diag_A, nnz_d); |
3548: C_offd = hypre_CSRMatrixCreate(num_cols_diag_A, num_cols_offd_C, nnz_o); |
3549: hypre_CSRMatrixI(C_diag) = C_diag_i; |
3550: hypre_CSRMatrixInitialize(C_diag); |
3551: C_diag_j = hypre_CSRMatrixJ(C_diag); |
3552: C_diag_data = hypre_CSRMatrixData(C_diag); |
3553: hypre_CSRMatrixI(C_offd) = C_offd_i; |
3554: hypre_CSRMatrixInitialize(C_offd); |
3555: C_offd_j = hypre_CSRMatrixJ(C_offd); |
3556: C_offd_data = hypre_CSRMatrixData(C_offd); |
[...] |
3568: for (ik = 0; ik < num_cols_diag_B; ik++) |
3569: B_marker[ik] = -1; |
3570: |
3571: for (ik = 0; ik < num_cols_offd_C; ik++) |
3572: B_marker_offd[ik] = -1; |
[...] |
3581: if (ii) |
3582: { |
3583: nnz_d = C_diag_array[ii-1]; |
3584: nnz_o = C_offd_array[ii-1]; |
3585: } |
3586: for (ik = ns; ik < ne; ik++) |
3587: { |
3588: C_diag_i[ik] = nnz_d; |
3589: C_offd_i[ik] = nnz_o; |
3590: for (jk = C_tmp_diag_i[ik]; jk < C_tmp_diag_i[ik+1]; jk++) |
3591: { |
3592: jcol = C_tmp_diag_j[jk]; |
3593: C_diag_j[nnz_d] = jcol; |
3594: C_diag_data[nnz_d] = C_tmp_diag_data[jk]; |
3595: B_marker[jcol] = nnz_d; |
3596: nnz_d++; |
3597: } |
3598: for (jk = C_tmp_offd_i[ik]; jk < C_tmp_offd_i[ik+1]; jk++) |
3599: { |
3600: jcol = C_tmp_offd_j[jk]; |
3601: C_offd_j[nnz_o] = jcol; |
3602: C_offd_data[nnz_o] = C_tmp_offd_data[jk]; |
3603: B_marker_offd[jcol] = nnz_o; |
3604: nnz_o++; |
3605: } |
3606: for (jk = 0; jk < num_sends_A; jk++) |
3607: for (j1 = send_map_starts_A[jk]; j1 < send_map_starts_A[jk+1]; j1++) |
3608: if (send_map_elmts_A[j1] == ik) |
3609: { |
3610: for (j2 = C_ext_diag_i[j1]; j2 < C_ext_diag_i[j1+1]; j2++) |
3611: { |
3612: jcol = C_ext_diag_j[j2]; |
3613: if (B_marker[jcol] < C_diag_i[ik]) |
3614: { |
3615: C_diag_j[nnz_d] = jcol; |
3616: C_diag_data[nnz_d] = C_ext_diag_data[j2]; |
3617: B_marker[jcol] = nnz_d; |
3618: nnz_d++; |
3619: } |
3620: else |
3621: C_diag_data[B_marker[jcol]] += C_ext_diag_data[j2]; |
3622: } |
3623: for (j2 = C_ext_offd_i[j1]; j2 < C_ext_offd_i[j1+1]; j2++) |
3624: { |
3625: jcol = C_ext_offd_j[j2]; |
3626: if (B_marker_offd[jcol] < C_offd_i[ik]) |
3627: { |
3628: C_offd_j[nnz_o] = jcol; |
3629: C_offd_data[nnz_o] = C_ext_offd_data[j2]; |
3630: B_marker_offd[jcol] = nnz_o; |
3631: nnz_o++; |
3632: } |
3633: else |
3634: C_offd_data[B_marker_offd[jcol]] += C_ext_offd_data[j2]; |
3635: } |
3636: break; |
3637: } |
3638: } |
3639: hypre_TFree(B_marker); |
3640: hypre_TFree(B_marker_offd); |
0x12bb0 PUSH %RBP |
0x12bb1 MOV %RSP,%RBP |
0x12bb4 PUSH %R15 |
0x12bb6 PUSH %R14 |
0x12bb8 PUSH %R13 |
0x12bba PUSH %R12 |
0x12bbc PUSH %RBX |
0x12bbd SUB $0x118,%RSP |
0x12bc4 MOV %R9,-0xb0(%RBP) |
0x12bcb MOV %R8,-0xd0(%RBP) |
0x12bd2 MOV %RCX,%R13 |
0x12bd5 MOV %RDX,%R14 |
0x12bd8 MOV %RDI,-0x50(%RBP) |
0x12bdc MOV 0xc8(%RBP),%RBX |
0x12be3 MOV 0xc0(%RBP),%RAX |
0x12bea MOV %RAX,-0xd8(%RBP) |
0x12bf1 MOV 0xb8(%RBP),%RAX |
0x12bf8 MOV %RAX,-0xa0(%RBP) |
0x12bff MOV 0xb0(%RBP),%RAX |
0x12c06 MOV %RAX,-0xa8(%RBP) |
0x12c0d MOV 0xa8(%RBP),%RAX |
0x12c14 MOV %RAX,-0x78(%RBP) |
0x12c18 MOV 0xa0(%RBP),%RAX |
0x12c1f MOV %RAX,-0x48(%RBP) |
0x12c23 MOV 0x98(%RBP),%RAX |
0x12c2a MOV %RAX,-0x108(%RBP) |
0x12c31 MOV 0x90(%RBP),%RAX |
0x12c38 MOV %RAX,-0x38(%RBP) |
0x12c3c MOV 0x88(%RBP),%RAX |
0x12c43 MOV %RAX,-0x40(%RBP) |
0x12c47 MOV 0x80(%RBP),%RAX |
0x12c4e MOV %RAX,-0x88(%RBP) |
0x12c55 MOV 0x78(%RBP),%RAX |
0x12c59 MOV %RAX,-0x110(%RBP) |
0x12c60 MOV 0x70(%RBP),%RAX |
0x12c64 MOV %RAX,-0xf8(%RBP) |
0x12c6b MOV 0x68(%RBP),%RAX |
0x12c6f MOV %RAX,-0x70(%RBP) |
0x12c73 MOV 0x60(%RBP),%RAX |
0x12c77 MOV %RAX,-0x68(%RBP) |
0x12c7b MOV 0x58(%RBP),%R12 |
0x12c7f MOV 0x50(%RBP),%RAX |
0x12c83 MOV %RAX,-0xf0(%RBP) |
0x12c8a MOV 0x48(%RBP),%RAX |
0x12c8e MOV %RAX,-0x120(%RBP) |
0x12c95 MOV 0x40(%RBP),%RAX |
0x12c99 MOV %RAX,-0xc8(%RBP) |
0x12ca0 MOV 0x38(%RBP),%RAX |
0x12ca4 MOV %RAX,-0x118(%RBP) |
0x12cab MOV 0x30(%RBP),%RAX |
0x12caf MOV %RAX,-0x98(%RBP) |
0x12cb6 MOV 0x28(%RBP),%RAX |
0x12cba MOV %RAX,-0xc0(%RBP) |
0x12cc1 MOV 0x20(%RBP),%RAX |
0x12cc5 MOV %RAX,-0x138(%RBP) |
0x12ccc MOV 0x18(%RBP),%RAX |
0x12cd0 MOV %RAX,-0x100(%RBP) |
0x12cd7 MOV 0x10(%RBP),%RAX |
0x12cdb MOV %RAX,-0xb8(%RBP) |
0x12ce2 CALL 45b0 <hypre_NumActiveThreads@plt> |
0x12ce7 MOV %RAX,%RCX |
0x12cea MOV %R14,%RAX |
0x12ced OR %RCX,%RAX |
0x12cf0 SHR $0x20,%RAX |
0x12cf4 MOV %R14,-0x130(%RBP) |
0x12cfb MOV %RCX,-0x128(%RBP) |
0x12d02 JE 12d14 |
0x12d04 MOV %R14,%RAX |
0x12d07 CQTO |
0x12d09 IDIV %RCX |
0x12d0c MOV %RDX,%R15 |
0x12d0f MOV %RAX,%R14 |
0x12d12 JMP 12d21 |
0x12d14 MOV %R14D,%EAX |
0x12d17 XOR %EDX,%EDX |
0x12d19 DIV %ECX |
0x12d1b MOV %EDX,%R15D |
0x12d1e MOV %EAX,%R14D |
0x12d21 CALL 4180 <hypre_GetThreadNum@plt> |
0x12d26 LEA 0x1(%RAX),%RCX |
0x12d2a CMP %R15,%RAX |
0x12d2d MOV %RBX,-0xe0(%RBP) |
0x12d34 MOV %RAX,-0xe8(%RBP) |
0x12d3b JGE 12d4e |
0x12d3d INC %R14 |
0x12d40 IMUL %R14,%RAX |
0x12d44 MOV %RAX,-0x58(%RBP) |
0x12d48 IMUL %R14,%RCX |
0x12d4c JMP 12d60 |
0x12d4e IMUL %R14,%RAX |
0x12d52 ADD %R15,%RAX |
0x12d55 MOV %RAX,-0x58(%RBP) |
0x12d59 IMUL %R14,%RCX |
0x12d5d ADD %R15,%RCX |
0x12d60 MOV %RCX,-0x90(%RBP) |
0x12d67 MOV $0x8,%ESI |
0x12d6c MOV %R13,%RDI |
0x12d6f CALL 4660 <hypre_CAlloc@plt> |
0x12d74 MOV %RAX,-0x30(%RBP) |
0x12d78 MOV -0xa0(%RBP),%RAX |
0x12d7f MOV (%RAX),%RDI |
0x12d82 MOV $0x8,%ESI |
0x12d87 CALL 4660 <hypre_CAlloc@plt> |
0x12d8c MOV %RAX,%R15 |
0x12d8f TEST %R13,%R13 |
0x12d92 MOV -0x40(%RBP),%RBX |
0x12d96 MOV -0x38(%RBP),%R14 |
0x12d9a JLE 12db2 |
0x12d9c LEA (,%R13,8),%RDX |
0x12da4 MOV -0x30(%RBP),%RDI |
0x12da8 MOV $0xff,%ESI |
0x12dad CALL 4590 <_intel_fast_memset@plt> |
0x12db2 MOV %R13,-0x140(%RBP) |
0x12db9 MOV -0xa0(%RBP),%RDX |
0x12dc0 CMPQ $0,(%RDX) |
0x12dc4 MOV -0x90(%RBP),%RCX |
0x12dcb MOV -0x58(%RBP),%RSI |
0x12dcf JLE 12df0 |
0x12dd1 XOR %EAX,%EAX |
0x12dd3 NOPW %CS:(%RAX,%RAX,1) |
(336) 0x12de0 MOVQ $-0x1,(%R15,%RAX,8) |
(336) 0x12de8 INC %RAX |
(336) 0x12deb CMP (%RDX),%RAX |
(336) 0x12dee JL 12de0 |
0x12df0 CMP %RCX,%RSI |
0x12df3 MOV -0x68(%RBP),%R11 |
0x12df7 MOV %R12,-0x80(%RBP) |
0x12dfb MOV -0x30(%RBP),%R13 |
0x12dff MOV -0x50(%RBP),%R8 |
0x12e03 JGE 13141 |
0x12e09 XOR %EAX,%EAX |
0x12e0b MOV -0x58(%RBP),%RDX |
0x12e0f XOR %ECX,%ECX |
0x12e11 JMP 12e51 |
0x12e13 NOPW %CS:(%RAX,%RAX,1) |
(327) 0x12e20 MOV -0x50(%RBP),%R8 |
(327) 0x12e24 MOV -0xd8(%RBP),%RDX |
(327) 0x12e2b MOV -0xe8(%RBP),%RSI |
(327) 0x12e32 MOV %RCX,(%RDX,%RSI,8) |
(327) 0x12e36 MOV -0xe0(%RBP),%RDX |
(327) 0x12e3d MOV %RAX,(%RDX,%RSI,8) |
(327) 0x12e41 MOV %R10,%RDX |
(327) 0x12e44 CMP -0x90(%RBP),%R10 |
(327) 0x12e4b JGE 13141 |
(327) 0x12e51 MOV (%R12,%RDX,8),%RSI |
(327) 0x12e55 LEA 0x1(%RDX),%R10 |
(327) 0x12e59 CMP 0x8(%R12,%RDX,8),%RSI |
(327) 0x12e5e MOV -0x110(%RBP),%R8 |
(327) 0x12e65 MOV -0xf8(%RBP),%R9 |
(327) 0x12e6c JGE 12e85 |
(327) 0x12e6e XCHG %AX,%AX |
(335) 0x12e70 MOV (%R11,%RSI,8),%RDI |
(335) 0x12e74 MOV %RDX,(%R13,%RDI,8) |
(335) 0x12e79 INC %RCX |
(335) 0x12e7c INC %RSI |
(335) 0x12e7f CMP (%R12,%R10,8),%RSI |
(335) 0x12e83 JL 12e70 |
(327) 0x12e85 MOV (%R9,%RDX,8),%RSI |
(327) 0x12e89 CMP (%R9,%R10,8),%RSI |
(327) 0x12e8d JGE 12ea4 |
(327) 0x12e8f NOP |
(334) 0x12e90 MOV (%R8,%RSI,8),%RDI |
(334) 0x12e94 MOV %RDX,(%R15,%RDI,8) |
(334) 0x12e98 INC %RAX |
(334) 0x12e9b INC %RSI |
(334) 0x12e9e CMP (%R9,%R10,8),%RSI |
(334) 0x12ea2 JL 12e90 |
(327) 0x12ea4 CMPQ $0,-0xa8(%RBP) |
(327) 0x12eac JLE 12e20 |
(327) 0x12eb2 VMOVQ %RDX,%XMM0 |
(327) 0x12eb7 VPBROADCASTQ %XMM0,%YMM0 |
(327) 0x12ebc XOR %EDI,%EDI |
(327) 0x12ebe MOV -0x48(%RBP),%RSI |
(327) 0x12ec2 MOV -0x50(%RBP),%R8 |
(327) 0x12ec6 MOV %R10,-0x60(%RBP) |
(327) 0x12eca NOPW (%RAX,%RAX,1) |
(328) 0x12ed0 MOV (%RSI,%RDI,8),%R10 |
(328) 0x12ed4 MOV 0x8(%RSI,%RDI,8),%R9 |
(328) 0x12ed9 MOV %R9,%R11 |
(328) 0x12edc SUB %R10,%R11 |
(328) 0x12edf JLE 12fc0 |
(328) 0x12ee5 MOV -0x78(%RBP),%RSI |
(328) 0x12ee9 LEA (%RSI,%R10,8),%ESI |
(328) 0x12eed AND $0x7f,%ESI |
(328) 0x12ef0 MOV $0x80,%EBX |
(328) 0x12ef5 SUB %ESI,%EBX |
(328) 0x12ef7 SHR $0x3,%EBX |
(328) 0x12efa CMP %RBX,%R11 |
(328) 0x12efd MOV %R11,%RSI |
(328) 0x12f00 CMOVA %RBX,%RSI |
(328) 0x12f04 TEST %RSI,%RSI |
(328) 0x12f07 JE 12f33 |
(328) 0x12f09 MOV %R10,%R8 |
(328) 0x12f0c MOV %RSI,%R14 |
(328) 0x12f0f MOV -0x78(%RBP),%R13 |
(328) 0x12f13 NOPW %CS:(%RAX,%RAX,1) |
(333) 0x12f20 CMP %RDX,(%R13,%R8,8) |
(333) 0x12f25 JE 12fe2 |
(333) 0x12f2b INC %R8 |
(333) 0x12f2e DEC %R14 |
(333) 0x12f31 JNE 12f20 |
(328) 0x12f33 CMP %RBX,%R11 |
(328) 0x12f36 MOV -0x30(%RBP),%R13 |
(328) 0x12f3a JBE 12fc9 |
(328) 0x12f40 SUB %RSI,%R11 |
(328) 0x12f43 MOV %R11,%RBX |
(328) 0x12f46 AND $-0x10,%RBX |
(328) 0x12f4a JE 12f9b |
(328) 0x12f4c LEA -0x1(%RBX),%R13 |
(328) 0x12f50 LEA (%R10,%RSI,1),%R8 |
(328) 0x12f54 MOV -0x78(%RBP),%R14 |
(328) 0x12f58 LEA (%R14,%R8,8),%R14 |
(328) 0x12f5c XOR %R12D,%R12D |
(328) 0x12f5f NOP |
(332) 0x12f60 VPCMPEQQ (%R14,%R12,8),%YMM0,%YMM1 |
(332) 0x12f66 VPCMPEQQ 0x20(%R14,%R12,8),%YMM0,%YMM3 |
(332) 0x12f6d VPCMPEQQ 0x40(%R14,%R12,8),%YMM0,%YMM2 |
(332) 0x12f74 VPCMPEQQ 0x60(%R14,%R12,8),%YMM0,%YMM4 |
(332) 0x12f7b VPOR %YMM3,%YMM1,%YMM5 |
(332) 0x12f7f VPOR %YMM4,%YMM2,%YMM6 |
(332) 0x12f83 VPOR %YMM5,%YMM6,%YMM5 |
(332) 0x12f87 VTESTPD %YMM5,%YMM5 |
(332) 0x12f8c JNE 1303b |
(332) 0x12f92 ADD $0x10,%R12 |
(332) 0x12f96 CMP %R13,%R12 |
(332) 0x12f99 JBE 12f60 |
(328) 0x12f9b CMP %R11,%RBX |
(328) 0x12f9e JNE 12ffb |
(328) 0x12fa0 MOV -0x48(%RBP),%RSI |
(328) 0x12fa4 MOV -0x38(%RBP),%R14 |
(328) 0x12fa8 MOV -0x40(%RBP),%RBX |
(328) 0x12fac MOV -0x68(%RBP),%R11 |
(328) 0x12fb0 MOV -0x80(%RBP),%R12 |
(328) 0x12fb4 MOV -0x30(%RBP),%R13 |
(328) 0x12fb8 JMP 13124 |
0x12fbd NOPL (%RAX) |
(328) 0x12fc0 MOV -0x68(%RBP),%R11 |
(328) 0x12fc4 JMP 13128 |
(328) 0x12fc9 MOV -0x48(%RBP),%RSI |
(328) 0x12fcd MOV -0x38(%RBP),%R14 |
(328) 0x12fd1 MOV -0x40(%RBP),%RBX |
(328) 0x12fd5 MOV -0x68(%RBP),%R11 |
(328) 0x12fd9 MOV -0x80(%RBP),%R12 |
(328) 0x12fdd JMP 13124 |
(328) 0x12fe2 MOV -0x38(%RBP),%R14 |
(328) 0x12fe6 MOV -0x40(%RBP),%RBX |
(328) 0x12fea MOV -0x68(%RBP),%R11 |
(328) 0x12fee MOV -0x30(%RBP),%R13 |
(328) 0x12ff2 MOV -0x80(%RBP),%R12 |
(328) 0x12ff6 JMP 13084 |
(328) 0x12ffb ADD %RSI,%R10 |
(328) 0x12ffe ADD %RBX,%R10 |
(328) 0x13001 MOV %R10,%R8 |
(328) 0x13004 MOV -0x38(%RBP),%R14 |
(328) 0x13008 MOV -0x40(%RBP),%RBX |
(328) 0x1300c MOV -0x68(%RBP),%R11 |
(328) 0x13010 MOV -0x80(%RBP),%R12 |
(328) 0x13014 MOV -0x30(%RBP),%R13 |
(328) 0x13018 MOV -0x60(%RBP),%R10 |
(328) 0x1301c MOV -0x78(%RBP),%RSI |
(331) 0x13020 CMP %RDX,(%RSI,%R8,8) |
(331) 0x13024 JE 13084 |
(331) 0x13026 INC %R8 |
(331) 0x13029 CMP %R8,%R9 |
(331) 0x1302c JNE 13020 |
(328) 0x1302e MOV -0x48(%RBP),%RSI |
(328) 0x13032 MOV -0x50(%RBP),%R8 |
(328) 0x13036 JMP 1312c |
(328) 0x1303b VPACKSSDW %YMM3,%YMM1,%YMM1 |
(328) 0x1303f VPERMQ $-0x28,%YMM1,%YMM1 |
(328) 0x13045 VPACKSSDW %YMM4,%YMM2,%YMM2 |
(328) 0x13049 VPERMQ $-0x28,%YMM2,%YMM2 |
(328) 0x1304f VPACKSSDW %YMM2,%YMM1,%YMM1 |
(328) 0x13053 VEXTRACTI128 $0x1,%YMM1,%XMM2 |
(328) 0x13059 VPACKSSWB %XMM2,%XMM1,%XMM1 |
(328) 0x1305d VPSHUFD $-0x28,%XMM1,%XMM1 |
(328) 0x13062 VPMOVMSKB %XMM1,%ESI |
(328) 0x13066 TZCNT %ESI,%ESI |
(328) 0x1306a ADD %R12,%R8 |
(328) 0x1306d ADD %RSI,%R8 |
(328) 0x13070 MOV -0x38(%RBP),%R14 |
(328) 0x13074 MOV -0x40(%RBP),%RBX |
(328) 0x13078 MOV -0x68(%RBP),%R11 |
(328) 0x1307c MOV -0x80(%RBP),%R12 |
(328) 0x13080 MOV -0x30(%RBP),%R13 |
(328) 0x13084 MOV -0xc0(%RBP),%R9 |
(328) 0x1308b MOV (%R9,%R8,8),%RSI |
(328) 0x1308f MOV 0x8(%R9,%R8,8),%R9 |
(328) 0x13094 JMP 130a3 |
0x13096 NOPW %CS:(%RAX,%RAX,1) |
(330) 0x130a0 INC %RSI |
(330) 0x130a3 CMP %R9,%RSI |
(330) 0x130a6 JGE 130d0 |
(330) 0x130a8 MOV -0x98(%RBP),%R10 |
(330) 0x130af MOV (%R10,%RSI,8),%R10 |
(330) 0x130b3 CMP %RDX,(%R13,%R10,8) |
(330) 0x130b8 JGE 130a0 |
(330) 0x130ba MOV %RDX,(%R13,%R10,8) |
(330) 0x130bf INC %RCX |
(330) 0x130c2 MOV -0xc0(%RBP),%R9 |
(330) 0x130c9 MOV 0x8(%R9,%R8,8),%R9 |
(330) 0x130ce JMP 130a0 |
(328) 0x130d0 MOV -0xc8(%RBP),%R9 |
(328) 0x130d7 MOV (%R9,%R8,8),%RSI |
(328) 0x130db MOV 0x8(%R9,%R8,8),%R9 |
(328) 0x130e0 JMP 130f3 |
0x130e2 NOPW %CS:(%RAX,%RAX,1) |
(329) 0x130f0 INC %RSI |
(329) 0x130f3 CMP %R9,%RSI |
(329) 0x130f6 JGE 13120 |
(329) 0x130f8 MOV -0x120(%RBP),%R10 |
(329) 0x130ff MOV (%R10,%RSI,8),%R10 |
(329) 0x13103 CMP %RDX,(%R15,%R10,8) |
(329) 0x13107 JGE 130f0 |
(329) 0x13109 MOV %RDX,(%R15,%R10,8) |
(329) 0x1310d INC %RAX |
(329) 0x13110 MOV -0xc8(%RBP),%R9 |
(329) 0x13117 MOV 0x8(%R9,%R8,8),%R9 |
(329) 0x1311c JMP 130f0 |
0x1311e XCHG %AX,%AX |
(328) 0x13120 MOV -0x48(%RBP),%RSI |
(328) 0x13124 MOV -0x50(%RBP),%R8 |
(328) 0x13128 MOV -0x60(%RBP),%R10 |
(328) 0x1312c INC %RDI |
(328) 0x1312f CMP -0xa8(%RBP),%RDI |
(328) 0x13136 JNE 12ed0 |
(327) 0x1313c JMP 12e24 |
0x13141 MOV (%R8),%ESI |
0x13144 LEA 0x20c375(%RIP),%RDI |
0x1314b VZEROUPPER |
0x1314e CALL 4680 <__kmpc_barrier@plt> |
0x13153 MOV -0x50(%RBP),%RAX |
0x13157 CMPQ $0,-0xe8(%RBP) |
0x1315f JNE 1343b |
0x13165 MOV -0x128(%RBP),%R10 |
0x1316c CMP $0x2,%R10 |
0x13170 MOV -0xe0(%RBP),%R8 |
0x13177 MOV -0xd8(%RBP),%R9 |
0x1317e JL 13378 |
0x13184 LEA -0x1(%R10),%RAX |
0x13188 LEA (%R8,%R10,8),%RCX |
0x1318c CMP %R9,%RCX |
0x1318f JBE 131df |
0x13191 LEA (%R9,%R10,8),%RCX |
0x13195 CMP %R8,%RCX |
0x13198 JBE 131df |
0x1319a LEA (%R9,%RAX,8),%RCX |
0x1319e CMP %R8,%RCX |
0x131a1 JB 132cd |
0x131a7 LEA (%R8,%RAX,8),%RCX |
0x131ab CMP %R9,%RCX |
0x131ae JB 132cd |
0x131b4 MOV $0x1,%EAX |
0x131b9 NOPL (%RAX) |
(326) 0x131c0 MOV -0x8(%R9,%RAX,8),%RCX |
(326) 0x131c5 ADD %RCX,(%R9,%RAX,8) |
(326) 0x131c9 MOV -0x8(%R8,%RAX,8),%RCX |
(326) 0x131ce ADD %RCX,(%R8,%RAX,8) |
(326) 0x131d2 INC %RAX |
(326) 0x131d5 CMP %RAX,%R10 |
(326) 0x131d8 JNE 131c0 |
0x131da JMP 13378 |
0x131df MOV (%R9),%RCX |
0x131e2 MOV (%R8),%RDX |
0x131e5 LEA (%R9,%RAX,8),%RSI |
0x131e9 LEA 0x8(%R8),%RDI |
0x131ed CMP %RDI,%RSI |
0x131f0 JB 1322d |
0x131f2 LEA 0x8(%R9),%RSI |
0x131f6 LEA (%R8,%RAX,8),%RDI |
0x131fa CMP %RSI,%RDI |
0x131fd JB 1322d |
0x131ff MOV $0x1,%EAX |
0x13204 NOPW %CS:(%RAX,%RAX,1) |
(323) 0x13210 ADD (%R9,%RAX,8),%RCX |
(323) 0x13214 MOV %RCX,(%R9,%RAX,8) |
(323) 0x13218 ADD (%R8,%RAX,8),%RDX |
(323) 0x1321c MOV %RDX,(%R8,%RAX,8) |
(323) 0x13220 INC %RAX |
(323) 0x13223 CMP %RAX,%R10 |
(323) 0x13226 JNE 13210 |
0x13228 JMP 13378 |
0x1322d CMP $0x5,%R10 |
0x13231 JB 13295 |
0x13233 MOV %RAX,%RSI |
0x13236 SHR $0x2,%RSI |
0x1323a MOV $0x20,%EDI |
0x1323f NOP |
(322) 0x13240 ADD -0x18(%R9,%RDI,1),%RCX |
(322) 0x13245 MOV %RCX,-0x18(%R9,%RDI,1) |
(322) 0x1324a ADD -0x18(%R8,%RDI,1),%RDX |
(322) 0x1324f MOV %RDX,-0x18(%R8,%RDI,1) |
(322) 0x13254 ADD -0x10(%R9,%RDI,1),%RCX |
(322) 0x13259 MOV %RCX,-0x10(%R9,%RDI,1) |
(322) 0x1325e ADD -0x10(%R8,%RDI,1),%RDX |
(322) 0x13263 MOV %RDX,-0x10(%R8,%RDI,1) |
(322) 0x13268 ADD -0x8(%R9,%RDI,1),%RCX |
(322) 0x1326d MOV %RCX,-0x8(%R9,%RDI,1) |
(322) 0x13272 ADD -0x8(%R8,%RDI,1),%RDX |
(322) 0x13277 MOV %RDX,-0x8(%R8,%RDI,1) |
(322) 0x1327c ADD (%R9,%RDI,1),%RCX |
(322) 0x13280 MOV %RCX,(%R9,%RDI,1) |
(322) 0x13284 ADD (%R8,%RDI,1),%RDX |
(322) 0x13288 MOV %RDX,(%R8,%RDI,1) |
(322) 0x1328c ADD $0x20,%RDI |
(322) 0x13290 DEC %RSI |
(322) 0x13293 JNE 13240 |
0x13295 MOV %RAX,%RSI |
0x13298 AND $-0x4,%RSI |
0x1329c CMP %RAX,%RSI |
0x1329f JE 13378 |
0x132a5 INC %RSI |
0x132a8 NOPL (%RAX,%RAX,1) |
(321) 0x132b0 ADD (%R9,%RSI,8),%RCX |
(321) 0x132b4 MOV %RCX,(%R9,%RSI,8) |
(321) 0x132b8 ADD (%R8,%RSI,8),%RDX |
(321) 0x132bc MOV %RDX,(%R8,%RSI,8) |
(321) 0x132c0 INC %RSI |
(321) 0x132c3 CMP %RSI,%R10 |
(321) 0x132c6 JNE 132b0 |
0x132c8 JMP 13378 |
0x132cd CMP $0x5,%R10 |
0x132d1 JB 13345 |
0x132d3 MOV %RAX,%RCX |
0x132d6 SHR $0x2,%RCX |
0x132da MOV (%R9),%RDX |
0x132dd MOV (%R8),%RSI |
0x132e0 MOV $0x20,%EDI |
0x132e5 NOPW %CS:(%RAX,%RAX,1) |
(325) 0x132f0 ADD -0x18(%R9,%RDI,1),%RDX |
(325) 0x132f5 MOV %RDX,-0x18(%R9,%RDI,1) |
(325) 0x132fa ADD -0x18(%R8,%RDI,1),%RSI |
(325) 0x132ff MOV %RSI,-0x18(%R8,%RDI,1) |
(325) 0x13304 ADD -0x10(%R9,%RDI,1),%RDX |
(325) 0x13309 MOV %RDX,-0x10(%R9,%RDI,1) |
(325) 0x1330e ADD -0x10(%R8,%RDI,1),%RSI |
(325) 0x13313 MOV %RSI,-0x10(%R8,%RDI,1) |
(325) 0x13318 ADD -0x8(%R9,%RDI,1),%RDX |
(325) 0x1331d MOV %RDX,-0x8(%R9,%RDI,1) |
(325) 0x13322 ADD -0x8(%R8,%RDI,1),%RSI |
(325) 0x13327 MOV %RSI,-0x8(%R8,%RDI,1) |
(325) 0x1332c ADD (%R9,%RDI,1),%RDX |
(325) 0x13330 MOV %RDX,(%R9,%RDI,1) |
(325) 0x13334 ADD (%R8,%RDI,1),%RSI |
(325) 0x13338 MOV %RSI,(%R8,%RDI,1) |
(325) 0x1333c ADD $0x20,%RDI |
(325) 0x13340 DEC %RCX |
(325) 0x13343 JNE 132f0 |
0x13345 MOV %RAX,%RCX |
0x13348 AND $-0x4,%RCX |
0x1334c CMP %RAX,%RCX |
0x1334f JE 13378 |
0x13351 MOV (%R9,%RCX,8),%RAX |
0x13355 MOV (%R8,%RCX,8),%RDX |
0x13359 INC %RCX |
0x1335c NOPL (%RAX) |
(324) 0x13360 ADD (%R9,%RCX,8),%RAX |
(324) 0x13364 MOV %RAX,(%R9,%RCX,8) |
(324) 0x13368 ADD (%R8,%RCX,8),%RDX |
(324) 0x1336c MOV %RDX,(%R8,%RCX,8) |
(324) 0x13370 INC %RCX |
(324) 0x13373 CMP %RCX,%R10 |
(324) 0x13376 JNE 13360 |
0x13378 MOV -0x8(%R9,%R10,8),%RDX |
0x1337d MOV -0x8(%R8,%R10,8),%RCX |
0x13382 MOV %RCX,-0x60(%RBP) |
0x13386 MOV -0x130(%RBP),%RBX |
0x1338d MOV -0xb8(%RBP),%RAX |
0x13394 MOV %RDX,(%RAX,%RBX,8) |
0x13398 MOV %RCX,(%R14,%RBX,8) |
0x1339c MOV %RBX,%RDI |
0x1339f MOV %RBX,%RSI |
0x133a2 CALL 4710 <hypre_CSRMatrixCreate@plt> |
0x133a7 MOV -0xd0(%RBP),%RCX |
0x133ae MOV %RAX,(%RCX) |
0x133b1 MOV -0xa0(%RBP),%RAX |
0x133b8 MOV (%RAX),%RSI |
0x133bb MOV %RBX,%RDI |
0x133be MOV -0x60(%RBP),%RDX |
0x133c2 CALL 4710 <hypre_CSRMatrixCreate@plt> |
0x133c7 MOV -0x138(%RBP),%RBX |
0x133ce MOV %RAX,(%RBX) |
0x133d1 MOV -0xd0(%RBP),%RAX |
0x133d8 MOV (%RAX),%RDI |
0x133db MOV -0xb8(%RBP),%RAX |
0x133e2 MOV %RAX,(%RDI) |
0x133e5 CALL 4460 <hypre_CSRMatrixInitialize@plt> |
0x133ea MOV -0xd0(%RBP),%RAX |
0x133f1 MOV (%RAX),%RAX |
0x133f4 MOV 0x8(%RAX),%RCX |
0x133f8 MOV -0x100(%RBP),%RDX |
0x133ff MOV %RCX,(%RDX) |
0x13402 MOV 0x30(%RAX),%RAX |
0x13406 MOV -0xb0(%RBP),%RCX |
0x1340d MOV %RAX,(%RCX) |
0x13410 MOV (%RBX),%RDI |
0x13413 MOV %R14,(%RDI) |
0x13416 CALL 4460 <hypre_CSRMatrixInitialize@plt> |
0x1341b MOV (%RBX),%RAX |
0x1341e MOV 0x8(%RAX),%RCX |
0x13422 MOV -0x108(%RBP),%RDX |
0x13429 MOV %RCX,(%RDX) |
0x1342c MOV 0x30(%RAX),%RAX |
0x13430 MOV -0x40(%RBP),%RBX |
0x13434 MOV %RAX,(%RBX) |
0x13437 MOV -0x50(%RBP),%RAX |
0x1343b MOV (%RAX),%ESI |
0x1343d LEA 0x20c09c(%RIP),%RDI |
0x13444 CALL 4680 <__kmpc_barrier@plt> |
0x13449 MOV -0x140(%RBP),%RDX |
0x13450 TEST %RDX,%RDX |
0x13453 JLE 13466 |
0x13455 SAL $0x3,%RDX |
0x13459 MOV %R13,%RDI |
0x1345c MOV $0xff,%ESI |
0x13461 CALL 4590 <_intel_fast_memset@plt> |
0x13466 MOV -0xa0(%RBP),%RCX |
0x1346d CMPQ $0,(%RCX) |
0x13471 MOV -0xe8(%RBP),%RSI |
0x13478 JLE 13490 |
0x1347a XOR %EAX,%EAX |
0x1347c NOPL (%RAX) |
(320) 0x13480 MOVQ $-0x1,(%R15,%RAX,8) |
(320) 0x13488 INC %RAX |
(320) 0x1348b CMP (%RCX),%RAX |
(320) 0x1348e JL 13480 |
0x13490 TEST %RSI,%RSI |
0x13493 MOV -0x70(%RBP),%R10 |
0x13497 MOV -0x90(%RBP),%RDX |
0x1349e MOV -0x58(%RBP),%R11 |
0x134a2 JE 134c3 |
0x134a4 MOV -0xd8(%RBP),%RAX |
0x134ab MOV -0x8(%RAX,%RSI,8),%RAX |
0x134b0 MOV -0xe0(%RBP),%RCX |
0x134b7 MOV -0x8(%RCX,%RSI,8),%RCX |
0x134bc CMP %RDX,%R11 |
0x134bf JL 13505 |
0x134c1 JMP 134cc |
0x134c3 XOR %EAX,%EAX |
0x134c5 XOR %ECX,%ECX |
0x134c7 CMP %RDX,%R11 |
0x134ca JL 13505 |
0x134cc MOV %R13,%RDI |
0x134cf VZEROUPPER |
0x134d2 CALL 43b0 <hypre_Free@plt> |
0x134d7 MOV %R15,%RDI |
0x134da ADD $0x118,%RSP |
0x134e1 POP %RBX |
0x134e2 POP %R12 |
0x134e4 POP %R13 |
0x134e6 POP %R14 |
0x134e8 POP %R15 |
0x134ea POP %RBP |
0x134eb JMP 43b0 |
(311) 0x134f0 MOV -0x70(%RBP),%R10 |
(311) 0x134f4 MOV -0x38(%RBP),%R14 |
(311) 0x134f8 CMP -0x90(%RBP),%R11 |
(311) 0x134ff MOV -0x80(%RBP),%R12 |
(311) 0x13503 JGE 134cc |
(311) 0x13505 MOV %R11,%RDX |
(311) 0x13508 MOV -0xb8(%RBP),%RSI |
(311) 0x1350f MOV %RAX,(%RSI,%R11,8) |
(311) 0x13513 MOV %RCX,(%R14,%R11,8) |
(311) 0x13517 MOV (%R12,%R11,8),%RSI |
(311) 0x1351b INC %R11 |
(311) 0x1351e CMP 0x8(%R12,%RDX,8),%RSI |
(311) 0x13523 JGE 13575 |
(311) 0x13525 MOV -0x100(%RBP),%RDI |
(311) 0x1352c MOV (%RDI),%RDI |
(311) 0x1352f MOV -0xb0(%RBP),%R8 |
(311) 0x13536 MOV (%R8),%R8 |
(311) 0x13539 MOV -0x68(%RBP),%R12 |
(311) 0x1353d MOV -0x80(%RBP),%R13 |
(311) 0x13541 MOV -0x30(%RBP),%R14 |
(311) 0x13545 NOPW %CS:(%RAX,%RAX,1) |
(319) 0x13550 MOV (%R12,%RSI,8),%R9 |
(319) 0x13554 MOV %R9,(%RDI,%RAX,8) |
(319) 0x13558 VMOVQ (%R10,%RSI,8),%XMM0 |
(319) 0x1355e VMOVQ %XMM0,(%R8,%RAX,8) |
(319) 0x13564 MOV %RAX,(%R14,%R9,8) |
(319) 0x13568 INC %RAX |
(319) 0x1356b INC %RSI |
(319) 0x1356e CMP (%R13,%R11,8),%RSI |
(319) 0x13573 JL 13550 |
(311) 0x13575 MOV -0xf8(%RBP),%RDI |
(311) 0x1357c MOV (%RDI,%RDX,8),%RSI |
(311) 0x13580 CMP (%RDI,%R11,8),%RSI |
(311) 0x13584 JGE 135f0 |
(311) 0x13586 MOV -0x108(%RBP),%RDI |
(311) 0x1358d MOV (%RDI),%RDI |
(311) 0x13590 MOV (%RBX),%R8 |
(311) 0x13593 MOV -0x110(%RBP),%R10 |
(311) 0x1359a MOV -0x30(%RBP),%R13 |
(311) 0x1359e MOV -0x88(%RBP),%R14 |
(311) 0x135a5 NOPW %CS:(%RAX,%RAX,1) |
(318) 0x135b0 MOV (%R10,%RSI,8),%R9 |
(318) 0x135b4 MOV %R9,(%RDI,%RCX,8) |
(318) 0x135b8 VMOVQ (%R14,%RSI,8),%XMM0 |
(318) 0x135be VMOVQ %XMM0,(%R8,%RCX,8) |
(318) 0x135c4 MOV %RCX,(%R15,%R9,8) |
(318) 0x135c8 INC %RCX |
(318) 0x135cb INC %RSI |
(318) 0x135ce MOV -0xf8(%RBP),%R9 |
(318) 0x135d5 CMP (%R9,%R11,8),%RSI |
(318) 0x135d9 JL 135b0 |
(311) 0x135db CMPQ $0,-0xa8(%RBP) |
(311) 0x135e3 JG 13602 |
(311) 0x135e5 JMP 134f0 |
0x135ea NOPW (%RAX,%RAX,1) |
(311) 0x135f0 MOV -0x30(%RBP),%R13 |
(311) 0x135f4 CMPQ $0,-0xa8(%RBP) |
(311) 0x135fc JLE 134f0 |
(311) 0x13602 VMOVQ %RDX,%XMM0 |
(311) 0x13607 VPBROADCASTQ %XMM0,%YMM0 |
(311) 0x1360c XOR %ESI,%ESI |
(311) 0x1360e MOV -0x48(%RBP),%RDI |
(311) 0x13612 MOV -0x88(%RBP),%R8 |
(311) 0x13619 MOV -0x38(%RBP),%R14 |
(311) 0x1361d MOV %R11,-0x58(%RBP) |
(311) 0x13621 JMP 1365f |
0x13623 NOPW %CS:(%RAX,%RAX,1) |
(312) 0x13630 MOV %R13,%R15 |
(312) 0x13633 MOV %RBX,%R13 |
(312) 0x13636 MOV %R14,%RBX |
(312) 0x13639 MOV %RDI,%R14 |
(312) 0x1363c MOV -0x70(%RBP),%R10 |
(312) 0x13640 MOV %RBX,%R14 |
(312) 0x13643 MOV %R13,%RBX |
(312) 0x13646 MOV %R15,%R13 |
(312) 0x13649 MOV %R12,%R15 |
(312) 0x1364c MOV %R9,%R8 |
(312) 0x1364f INC %RSI |
(312) 0x13652 CMP -0xa8(%RBP),%RSI |
(312) 0x13659 JE 134f8 |
(312) 0x1365f MOV %RSI,%R10 |
(312) 0x13662 MOV %R8,%R9 |
(312) 0x13665 MOV %R15,%R12 |
(312) 0x13668 MOV (%RDI,%RSI,8),%R8 |
(312) 0x1366c MOV 0x8(%RDI,%RSI,8),%R10 |
(312) 0x13671 MOV %R10,-0x60(%RBP) |
(312) 0x13675 SUB %R8,%R10 |
(312) 0x13678 JLE 13630 |
(312) 0x1367a MOV -0x78(%RBP),%RDI |
(312) 0x1367e LEA (%RDI,%R8,8),%EDI |
(312) 0x13682 AND $0x7f,%EDI |
(312) 0x13685 MOV $0x80,%EBX |
(312) 0x1368a SUB %EDI,%EBX |
(312) 0x1368c SHR $0x3,%EBX |
(312) 0x1368f CMP %RBX,%R10 |
(312) 0x13692 MOV %R10,%R11 |
(312) 0x13695 CMOVA %RBX,%R11 |
(312) 0x13699 TEST %R11,%R11 |
(312) 0x1369c MOV %R12,%R15 |
(312) 0x1369f MOV -0x98(%RBP),%R12 |
(312) 0x136a6 JE 136d3 |
(312) 0x136a8 MOV %R8,%RDI |
(312) 0x136ab MOV %R11,%R14 |
(312) 0x136ae MOV -0x78(%RBP),%R13 |
(312) 0x136b2 NOPW %CS:(%RAX,%RAX,1) |
(317) 0x136c0 CMP %RDX,(%R13,%RDI,8) |
(317) 0x136c5 JE 13764 |
(317) 0x136cb INC %RDI |
(317) 0x136ce DEC %R14 |
(317) 0x136d1 JNE 136c0 |
(312) 0x136d3 CMP %RBX,%R10 |
(312) 0x136d6 JBE 13740 |
(312) 0x136d8 SUB %R11,%R10 |
(312) 0x136db MOV %R10,%RBX |
(312) 0x136de AND $-0x10,%RBX |
(312) 0x136e2 JE 1373b |
(312) 0x136e4 LEA -0x1(%RBX),%R13 |
(312) 0x136e8 LEA (%R8,%R11,1),%RDI |
(312) 0x136ec MOV -0x78(%RBP),%R14 |
(312) 0x136f0 LEA (%R14,%RDI,8),%R14 |
(312) 0x136f4 XOR %R12D,%R12D |
(312) 0x136f7 NOPW (%RAX,%RAX,1) |
(316) 0x13700 VPCMPEQQ (%R14,%R12,8),%YMM0,%YMM1 |
(316) 0x13706 VPCMPEQQ 0x20(%R14,%R12,8),%YMM0,%YMM3 |
(316) 0x1370d VPCMPEQQ 0x40(%R14,%R12,8),%YMM0,%YMM2 |
(316) 0x13714 VPCMPEQQ 0x60(%R14,%R12,8),%YMM0,%YMM4 |
(316) 0x1371b VPOR %YMM3,%YMM1,%YMM5 |
(316) 0x1371f VPOR %YMM4,%YMM2,%YMM6 |
(316) 0x13723 VPOR %YMM5,%YMM6,%YMM5 |
(316) 0x13727 VTESTPD %YMM5,%YMM5 |
(316) 0x1372c JNE 137cc |
(316) 0x13732 ADD $0x10,%R12 |
(316) 0x13736 CMP %R13,%R12 |
(316) 0x13739 JBE 13700 |
(312) 0x1373b CMP %R10,%RBX |
(312) 0x1373e JNE 13770 |
(312) 0x13740 MOV -0x48(%RBP),%RDI |
(312) 0x13744 MOV -0x38(%RBP),%R14 |
(312) 0x13748 MOV -0x40(%RBP),%RBX |
(312) 0x1374c MOV -0x88(%RBP),%R8 |
(312) 0x13753 MOV -0x70(%RBP),%R10 |
(312) 0x13757 MOV -0x58(%RBP),%R11 |
(312) 0x1375b MOV -0x30(%RBP),%R13 |
(312) 0x1375f JMP 1364f |
(312) 0x13764 MOV -0xf0(%RBP),%R13 |
(312) 0x1376b JMP 13810 |
(312) 0x13770 ADD %R11,%R8 |
(312) 0x13773 ADD %RBX,%R8 |
(312) 0x13776 MOV %R8,%RDI |
(312) 0x13779 MOV -0x38(%RBP),%R14 |
(312) 0x1377d MOV -0x40(%RBP),%RBX |
(312) 0x13781 MOV -0x88(%RBP),%R8 |
(312) 0x13788 MOV -0x70(%RBP),%R10 |
(312) 0x1378c MOV -0xf0(%RBP),%R13 |
(312) 0x13793 MOV -0x98(%RBP),%R12 |
(312) 0x1379a MOV -0x58(%RBP),%R11 |
(312) 0x1379e MOV -0x78(%RBP),%R9 |
(312) 0x137a2 NOPW %CS:(%RAX,%RAX,1) |
(315) 0x137b0 CMP %RDX,(%R9,%RDI,8) |
(315) 0x137b4 JE 13810 |
(315) 0x137b6 INC %RDI |
(315) 0x137b9 CMP %RDI,-0x60(%RBP) |
(315) 0x137bd JNE 137b0 |
(312) 0x137bf MOV -0x30(%RBP),%R13 |
(312) 0x137c3 MOV -0x48(%RBP),%RDI |
(312) 0x137c7 JMP 1364f |
(312) 0x137cc VPACKSSDW %YMM3,%YMM1,%YMM1 |
(312) 0x137d0 VPERMQ $-0x28,%YMM1,%YMM1 |
(312) 0x137d6 VPACKSSDW %YMM4,%YMM2,%YMM2 |
(312) 0x137da VPERMQ $-0x28,%YMM2,%YMM2 |
(312) 0x137e0 VPACKSSDW %YMM2,%YMM1,%YMM1 |
(312) 0x137e4 VEXTRACTI128 $0x1,%YMM1,%XMM2 |
(312) 0x137ea VPACKSSWB %XMM2,%XMM1,%XMM1 |
(312) 0x137ee VPSHUFD $-0x28,%XMM1,%XMM1 |
(312) 0x137f3 VPMOVMSKB %XMM1,%R8D |
(312) 0x137f7 TZCNT %R8D,%R8D |
(312) 0x137fc ADD %R12,%RDI |
(312) 0x137ff ADD %R8,%RDI |
(312) 0x13802 MOV -0xf0(%RBP),%R13 |
(312) 0x13809 MOV -0x98(%RBP),%R12 |
(312) 0x13810 MOV -0xc0(%RBP),%R9 |
(312) 0x13817 MOV (%R9,%RDI,8),%R8 |
(312) 0x1381b MOV 0x8(%R9,%RDI,8),%R9 |
(312) 0x13820 CMP %R9,%R8 |
(312) 0x13823 JGE 138c0 |
(312) 0x13829 MOV -0x30(%RBP),%R14 |
(312) 0x1382d MOV -0xb8(%RBP),%RBX |
(312) 0x13834 JMP 13872 |
0x13836 NOPW %CS:(%RAX,%RAX,1) |
(314) 0x13840 MOV -0xb0(%RBP),%R10 |
(314) 0x13847 MOV (%R10),%R10 |
(314) 0x1384a VMOVSD (%R10,%R11,8),%XMM1 |
(314) 0x13850 MOV -0x118(%RBP),%R12 |
(314) 0x13857 VADDSD (%R12,%R8,8),%XMM1,%XMM1 |
(314) 0x1385d MOV -0x98(%RBP),%R12 |
(314) 0x13864 VMOVSD %XMM1,(%R10,%R11,8) |
(314) 0x1386a INC %R8 |
(314) 0x1386d CMP %R9,%R8 |
(314) 0x13870 JGE 138c0 |
(314) 0x13872 MOV (%R12,%R8,8),%R10 |
(314) 0x13876 MOV (%R14,%R10,8),%R11 |
(314) 0x1387a CMP (%RBX,%RDX,8),%R11 |
(314) 0x1387e JGE 13840 |
(314) 0x13880 MOV -0x100(%RBP),%R9 |
(314) 0x13887 MOV (%R9),%R9 |
(314) 0x1388a MOV %R10,(%R9,%RAX,8) |
(314) 0x1388e MOV -0x118(%RBP),%R9 |
(314) 0x13895 VMOVSD (%R9,%R8,8),%XMM1 |
(314) 0x1389b MOV -0xb0(%RBP),%R9 |
(314) 0x138a2 MOV (%R9),%R9 |
(314) 0x138a5 VMOVSD %XMM1,(%R9,%RAX,8) |
(314) 0x138ab MOV %RAX,(%R14,%R10,8) |
(314) 0x138af INC %RAX |
(314) 0x138b2 MOV -0xc0(%RBP),%R9 |
(314) 0x138b9 MOV 0x8(%R9,%RDI,8),%R9 |
(314) 0x138be JMP 1386a |
(312) 0x138c0 MOV -0xc8(%RBP),%R9 |
(312) 0x138c7 MOV (%R9,%RDI,8),%R8 |
(312) 0x138cb MOV 0x8(%R9,%RDI,8),%R9 |
(312) 0x138d0 CMP %R9,%R8 |
(312) 0x138d3 JGE 13946 |
(312) 0x138d5 MOV -0x38(%RBP),%R14 |
(312) 0x138d9 MOV -0x40(%RBP),%RBX |
(312) 0x138dd JMP 138fe |
0x138df NOP |
(313) 0x138e0 MOV (%RBX),%R10 |
(313) 0x138e3 VMOVSD (%R10,%R11,8),%XMM1 |
(313) 0x138e9 VADDSD (%R13,%R8,8),%XMM1,%XMM1 |
(313) 0x138f0 VMOVSD %XMM1,(%R10,%R11,8) |
(313) 0x138f6 INC %R8 |
(313) 0x138f9 CMP %R9,%R8 |
(313) 0x138fc JGE 1396a |
(313) 0x138fe MOV -0x120(%RBP),%R10 |
(313) 0x13905 MOV (%R10,%R8,8),%R10 |
(313) 0x13909 MOV (%R15,%R10,8),%R11 |
(313) 0x1390d CMP (%R14,%RDX,8),%R11 |
(313) 0x13911 JGE 138e0 |
(313) 0x13913 MOV -0x108(%RBP),%R9 |
(313) 0x1391a MOV (%R9),%R9 |
(313) 0x1391d MOV %R10,(%R9,%RCX,8) |
(313) 0x13921 VMOVSD (%R13,%R8,8),%XMM1 |
(313) 0x13928 MOV (%RBX),%R9 |
(313) 0x1392b VMOVSD %XMM1,(%R9,%RCX,8) |
(313) 0x13931 MOV %RCX,(%R15,%R10,8) |
(313) 0x13935 INC %RCX |
(313) 0x13938 MOV -0xc8(%RBP),%R9 |
(313) 0x1393f MOV 0x8(%R9,%RDI,8),%R9 |
(313) 0x13944 JMP 138f6 |
(312) 0x13946 MOV -0x88(%RBP),%R8 |
(312) 0x1394d MOV -0x70(%RBP),%R10 |
(312) 0x13951 MOV -0x58(%RBP),%R11 |
(312) 0x13955 MOV -0x30(%RBP),%R13 |
(312) 0x13959 MOV -0x48(%RBP),%RDI |
(312) 0x1395d MOV -0x38(%RBP),%R14 |
(312) 0x13961 MOV -0x40(%RBP),%RBX |
(312) 0x13965 JMP 1364f |
(312) 0x1396a MOV -0x88(%RBP),%R8 |
(312) 0x13971 MOV -0x70(%RBP),%R10 |
(312) 0x13975 MOV -0x30(%RBP),%R13 |
(312) 0x13979 MOV -0x48(%RBP),%RDI |
(312) 0x1397d MOV -0x58(%RBP),%R11 |
(312) 0x13981 JMP 1364f |
0x13986 NOPW %CS:(%RAX,%RAX,1) |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►100.00+ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Path / |
Source file and lines | par_csr_matop.c:3454-3640 |
Module | libparcsr_mv.so |
nb instructions | 297 |
nb uops | 319 |
loop length | 1336 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 59 |
micro-operation queue | 53.17 cycles |
front end | 53.17 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 14.70 | 14.60 | 30.67 | 30.67 | 32.50 | 14.60 | 14.50 | 32.50 | 32.50 | 32.50 | 14.60 | 30.67 |
cycles | 14.70 | 17.20 | 30.67 | 30.67 | 32.50 | 14.60 | 14.50 | 32.50 | 32.50 | 32.50 | 14.60 | 30.67 |
Cycles executing div or sqrt instructions | 16.00 |
FE+BE cycles | 50.35-50.40 |
Stall cycles | 0.00 |
Front-end | 53.17 |
Dispatch | 32.50 |
DIV/SQRT | 16.00 |
Overall L1 | 53.17 |
all | 2% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 7% |
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 13% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x118,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc8(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xc0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xd8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xb8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xb0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x98(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x108(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x90(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x88(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x80(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x78(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x110(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x70(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xf8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x68(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x60(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x58(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x120(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x118(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x138(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x18(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x100(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 45b0 <hypre_NumActiveThreads@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %RCX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R14,-0x130(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x128(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 12d14 <hypre_ParTMatmul.extracted+0x164> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %RCX | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 12d21 <hypre_ParTMatmul.extracted+0x171> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %R14D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %ECX | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV %EDX,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %EAX,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4180 <hypre_GetThreadNum@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x1(%RAX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,-0xe8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 12d4e <hypre_ParTMatmul.extracted+0x19e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INC %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
IMUL %R14,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JMP 12d60 <hypre_ParTMatmul.extracted+0x1b0> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
IMUL %R14,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %R15,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
IMUL %R14,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %R15,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4660 <hypre_CAlloc@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4660 <hypre_CAlloc@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
TEST %R13,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV -0x40(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 12db2 <hypre_ParTMatmul.extracted+0x202> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (,%R13,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x30(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4590 <_intel_fast_memset@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R13,-0x140(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xa0(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMPQ $0,(%RDX) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV -0x90(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x58(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 12df0 <hypre_ParTMatmul.extracted+0x240> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RCX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x68(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x30(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x50(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JGE 13141 <hypre_ParTMatmul.extracted+0x591> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x58(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 12e51 <hypre_ParTMatmul.extracted+0x2a1> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV (%R8),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x20c375(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4680 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMPQ $0,-0xe8(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JNE 1343b <hypre_ParTMatmul.extracted+0x88b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x128(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x2,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0xe0(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xd8(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JL 13378 <hypre_ParTMatmul.extracted+0x7c8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%R10),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R8,%R10,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R9,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JBE 131df <hypre_ParTMatmul.extracted+0x62f> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R9,%R10,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R8,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JBE 131df <hypre_ParTMatmul.extracted+0x62f> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R9,%RAX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R8,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 132cd <hypre_ParTMatmul.extracted+0x71d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R8,%RAX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R9,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 132cd <hypre_ParTMatmul.extracted+0x71d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x1,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 13378 <hypre_ParTMatmul.extracted+0x7c8> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV (%R9),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R9,%RAX,8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x8(%R8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDI,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 1322d <hypre_ParTMatmul.extracted+0x67d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA 0x8(%R9),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R8,%RAX,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RSI,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 1322d <hypre_ParTMatmul.extracted+0x67d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x1,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 13378 <hypre_ParTMatmul.extracted+0x7c8> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
CMP $0x5,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 13295 <hypre_ParTMatmul.extracted+0x6e5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x2,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV $0x20,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JE 13378 <hypre_ParTMatmul.extracted+0x7c8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INC %RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 13378 <hypre_ParTMatmul.extracted+0x7c8> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
CMP $0x5,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 13345 <hypre_ParTMatmul.extracted+0x795> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x2,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV (%R9),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R8),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x20,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JE 13378 <hypre_ParTMatmul.extracted+0x7c8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R9,%RCX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R8,%RCX,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
INC %RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x8(%R9,%R10,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%R8,%R10,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x130(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xb8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,(%RAX,%RBX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,(%R14,%RBX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RBX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4710 <hypre_CSRMatrixCreate@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0xd0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x60(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 4710 <hypre_CSRMatrixCreate@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x138(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RBX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xd0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xb8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RDI) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 4460 <hypre_CSRMatrixInitialize@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0xd0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x100(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,(%RDX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xb0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RBX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,(%RDI) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 4460 <hypre_CSRMatrixInitialize@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%RBX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x108(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,(%RDX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x40(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RBX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x20c09c(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4680 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x140(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 13466 <hypre_ParTMatmul.extracted+0x8b6> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4590 <_intel_fast_memset@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0xa0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMPQ $0,(%RCX) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV -0xe8(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 13490 <hypre_ParTMatmul.extracted+0x8e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %RSI,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV -0x70(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x90(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x58(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JE 134c3 <hypre_ParTMatmul.extracted+0x913> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xd8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%RAX,%RSI,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xe0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%RCX,%RSI,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDX,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 13505 <hypre_ParTMatmul.extracted+0x955> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 134cc <hypre_ParTMatmul.extracted+0x91c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDX,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 13505 <hypre_ParTMatmul.extracted+0x955> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 43b0 <hypre_Free@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R15,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
ADD $0x118,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
JMP 43b0 <hypre_Free@plt> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | par_csr_matop.c:3454-3640 |
Module | libparcsr_mv.so |
nb instructions | 297 |
nb uops | 319 |
loop length | 1336 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 59 |
micro-operation queue | 53.17 cycles |
front end | 53.17 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 14.70 | 14.60 | 30.67 | 30.67 | 32.50 | 14.60 | 14.50 | 32.50 | 32.50 | 32.50 | 14.60 | 30.67 |
cycles | 14.70 | 17.20 | 30.67 | 30.67 | 32.50 | 14.60 | 14.50 | 32.50 | 32.50 | 32.50 | 14.60 | 30.67 |
Cycles executing div or sqrt instructions | 16.00 |
FE+BE cycles | 50.35-50.40 |
Stall cycles | 0.00 |
Front-end | 53.17 |
Dispatch | 32.50 |
DIV/SQRT | 16.00 |
Overall L1 | 53.17 |
all | 2% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 7% |
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 13% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x118,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc8(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xc0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xd8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xb8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xb0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x98(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x108(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x90(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x88(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x80(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x78(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x110(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x70(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xf8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x68(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x60(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x58(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x120(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x118(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x138(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x18(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x100(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 45b0 <hypre_NumActiveThreads@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %RCX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R14,-0x130(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x128(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 12d14 <hypre_ParTMatmul.extracted+0x164> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %RCX | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 12d21 <hypre_ParTMatmul.extracted+0x171> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %R14D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %ECX | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV %EDX,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %EAX,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4180 <hypre_GetThreadNum@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x1(%RAX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,-0xe8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 12d4e <hypre_ParTMatmul.extracted+0x19e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INC %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
IMUL %R14,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JMP 12d60 <hypre_ParTMatmul.extracted+0x1b0> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
IMUL %R14,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %R15,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
IMUL %R14,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %R15,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4660 <hypre_CAlloc@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4660 <hypre_CAlloc@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
TEST %R13,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV -0x40(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 12db2 <hypre_ParTMatmul.extracted+0x202> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (,%R13,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x30(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4590 <_intel_fast_memset@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R13,-0x140(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xa0(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMPQ $0,(%RDX) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV -0x90(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x58(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 12df0 <hypre_ParTMatmul.extracted+0x240> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RCX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x68(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x30(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x50(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JGE 13141 <hypre_ParTMatmul.extracted+0x591> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x58(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 12e51 <hypre_ParTMatmul.extracted+0x2a1> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV (%R8),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x20c375(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4680 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMPQ $0,-0xe8(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JNE 1343b <hypre_ParTMatmul.extracted+0x88b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x128(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x2,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0xe0(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xd8(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JL 13378 <hypre_ParTMatmul.extracted+0x7c8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%R10),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R8,%R10,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R9,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JBE 131df <hypre_ParTMatmul.extracted+0x62f> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R9,%R10,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R8,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JBE 131df <hypre_ParTMatmul.extracted+0x62f> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R9,%RAX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R8,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 132cd <hypre_ParTMatmul.extracted+0x71d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R8,%RAX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R9,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 132cd <hypre_ParTMatmul.extracted+0x71d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x1,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 13378 <hypre_ParTMatmul.extracted+0x7c8> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV (%R9),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R9,%RAX,8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x8(%R8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDI,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 1322d <hypre_ParTMatmul.extracted+0x67d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA 0x8(%R9),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R8,%RAX,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RSI,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 1322d <hypre_ParTMatmul.extracted+0x67d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x1,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 13378 <hypre_ParTMatmul.extracted+0x7c8> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
CMP $0x5,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 13295 <hypre_ParTMatmul.extracted+0x6e5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x2,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV $0x20,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JE 13378 <hypre_ParTMatmul.extracted+0x7c8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INC %RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 13378 <hypre_ParTMatmul.extracted+0x7c8> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
CMP $0x5,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 13345 <hypre_ParTMatmul.extracted+0x795> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x2,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV (%R9),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R8),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x20,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JE 13378 <hypre_ParTMatmul.extracted+0x7c8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R9,%RCX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R8,%RCX,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
INC %RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x8(%R9,%R10,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%R8,%R10,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x130(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xb8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,(%RAX,%RBX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,(%R14,%RBX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RBX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4710 <hypre_CSRMatrixCreate@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0xd0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x60(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 4710 <hypre_CSRMatrixCreate@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x138(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RBX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xd0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xb8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RDI) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 4460 <hypre_CSRMatrixInitialize@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0xd0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x100(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,(%RDX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xb0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RBX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,(%RDI) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 4460 <hypre_CSRMatrixInitialize@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%RBX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x108(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,(%RDX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x40(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RBX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x20c09c(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4680 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x140(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 13466 <hypre_ParTMatmul.extracted+0x8b6> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4590 <_intel_fast_memset@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0xa0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMPQ $0,(%RCX) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV -0xe8(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 13490 <hypre_ParTMatmul.extracted+0x8e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %RSI,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV -0x70(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x90(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x58(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JE 134c3 <hypre_ParTMatmul.extracted+0x913> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xd8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%RAX,%RSI,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xe0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%RCX,%RSI,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDX,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 13505 <hypre_ParTMatmul.extracted+0x955> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 134cc <hypre_ParTMatmul.extracted+0x91c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDX,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 13505 <hypre_ParTMatmul.extracted+0x955> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 43b0 <hypre_Free@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R15,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
ADD $0x118,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
JMP 43b0 <hypre_Free@plt> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_ParTMatmul.extracted– | 0.08 | 0.03 |
○Loop 324 - par_csr_matop.c:3537-3540 - libparcsr_mv.so | 0 | 0 |
▼Loop 327 - par_csr_matop.c:3467-3528 - libparcsr_mv.so– | 0 | 0 |
○Loop 335 - par_csr_matop.c:3491-3495 - libparcsr_mv.so | 0 | 0.01 |
○Loop 334 - par_csr_matop.c:3497-3501 - libparcsr_mv.so | 0 | 0 |
▼Loop 328 - par_csr_matop.c:3467-3522 - libparcsr_mv.so– | 0 | 0.01 |
○Loop 332 - par_csr_matop.c:3467-3504 - libparcsr_mv.so | 0.03 | 0.01 |
○Loop 331 - par_csr_matop.c:3504-3505 - libparcsr_mv.so | 0 | 0 |
○Loop 330 - par_csr_matop.c:3507-3513 - libparcsr_mv.so | 0 | 0 |
○Loop 329 - par_csr_matop.c:3516-3522 - libparcsr_mv.so | 0 | 0 |
○Loop 333 - par_csr_matop.c:3504-3505 - libparcsr_mv.so | 0 | 0.01 |
○Loop 321 - par_csr_matop.c:3537-3540 - libparcsr_mv.so | 0 | 0 |
○Loop 323 - par_csr_matop.c:3537-3540 - libparcsr_mv.so | 0 | 0 |
▼Loop 311 - par_csr_matop.c:3467-3640 - libparcsr_mv.so– | 0 | 0 |
○Loop 319 - par_csr_matop.c:3590-3596 - libparcsr_mv.so | 0.01 | 0.01 |
▼Loop 312 - par_csr_matop.c:3467-3634 - libparcsr_mv.so– | 0 | 0 |
○Loop 316 - par_csr_matop.c:3467-3607 - libparcsr_mv.so | 0.03 | 0.01 |
○Loop 315 - par_csr_matop.c:3607-3608 - libparcsr_mv.so | 0 | 0 |
○Loop 314 - par_csr_matop.c:3610-3621 - libparcsr_mv.so | 0 | 0 |
○Loop 313 - par_csr_matop.c:3623-3634 - libparcsr_mv.so | 0 | 0 |
○Loop 317 - par_csr_matop.c:3607-3608 - libparcsr_mv.so | 0 | 0.01 |
○Loop 318 - par_csr_matop.c:3598-3604 - libparcsr_mv.so | 0 | 0 |
○Loop 325 - par_csr_matop.c:3537-3540 - libparcsr_mv.so | 0 | 0 |
○Loop 320 - par_csr_matop.c:3571-3572 - libparcsr_mv.so | 0 | 0 |
○Loop 322 - par_csr_matop.c:3537-3540 - libparcsr_mv.so | 0 | 0 |
○Loop 326 - par_csr_matop.c:3537-3540 - libparcsr_mv.so | 0 | 0 |
○Loop 336 - par_csr_matop.c:3484-3485 - libparcsr_mv.so | 0 | 0 |