Function: hypre_ParTMatmul.extracted | Module: exec | Source: par_csr_matop.c:3454-3640 [...] | Coverage: 0.09% |
---|
Function: hypre_ParTMatmul.extracted | Module: exec | Source: par_csr_matop.c:3454-3640 [...] | Coverage: 0.09% |
---|
/scratch_na/users/xoserete/qaas_runs/171-415-3661/intel/AMG/build/AMG/AMG/parcsr_mv/par_csr_matop.c: 3454 - 3640 |
-------------------------------------------------------------------------------- |
3454: #pragma omp parallel |
[...] |
3462: HYPRE_Int num_threads = hypre_NumActiveThreads(); |
3463: |
3464: size = num_cols_diag_A/num_threads; |
3465: rest = num_cols_diag_A - size*num_threads; |
3466: ii = hypre_GetThreadNum(); |
3467: if (ii < rest) |
3468: { |
3469: ns = ii*size+ii; |
3470: ne = (ii+1)*size+ii+1; |
3471: } |
3472: else |
3473: { |
3474: ns = ii*size+rest; |
3475: ne = (ii+1)*size+rest; |
3476: } |
3477: |
3478: B_marker = hypre_CTAlloc(HYPRE_Int, num_cols_diag_B); |
3479: B_marker_offd = hypre_CTAlloc(HYPRE_Int, num_cols_offd_C); |
3480: |
3481: for (ik = 0; ik < num_cols_diag_B; ik++) |
3482: B_marker[ik] = -1; |
3483: |
3484: for (ik = 0; ik < num_cols_offd_C; ik++) |
3485: B_marker_offd[ik] = -1; |
3486: |
3487: nnz_d = 0; |
3488: nnz_o = 0; |
3489: for (ik = ns; ik < ne; ik++) |
3490: { |
3491: for (jk = C_tmp_diag_i[ik]; jk < C_tmp_diag_i[ik+1]; jk++) |
3492: { |
3493: jcol = C_tmp_diag_j[jk]; |
3494: B_marker[jcol] = ik; |
3495: nnz_d++; |
3496: } |
3497: for (jk = C_tmp_offd_i[ik]; jk < C_tmp_offd_i[ik+1]; jk++) |
3498: { |
3499: jcol = C_tmp_offd_j[jk]; |
3500: B_marker_offd[jcol] = ik; |
3501: nnz_o++; |
3502: } |
3503: for (jk = 0; jk < num_sends_A; jk++) |
3504: for (j1 = send_map_starts_A[jk]; j1 < send_map_starts_A[jk+1]; j1++) |
3505: if (send_map_elmts_A[j1] == ik) |
3506: { |
3507: for (j2 = C_ext_diag_i[j1]; j2 < C_ext_diag_i[j1+1]; j2++) |
3508: { |
3509: jcol = C_ext_diag_j[j2]; |
3510: if (B_marker[jcol] < ik) |
3511: { |
3512: B_marker[jcol] = ik; |
3513: nnz_d++; |
3514: } |
3515: } |
3516: for (j2 = C_ext_offd_i[j1]; j2 < C_ext_offd_i[j1+1]; j2++) |
3517: { |
3518: jcol = C_ext_offd_j[j2]; |
3519: if (B_marker_offd[jcol] < ik) |
3520: { |
3521: B_marker_offd[jcol] = ik; |
3522: nnz_o++; |
3523: } |
3524: } |
3525: break; |
3526: } |
3527: C_diag_array[ii] = nnz_d; |
3528: C_offd_array[ii] = nnz_o; |
3529: } |
3530: #ifdef HYPRE_USING_OPENMP |
3531: #pragma omp barrier |
3532: #endif |
3533: if (ii == 0) |
3534: { |
3535: nnz_d = 0; |
3536: nnz_o = 0; |
3537: for (ik = 0; ik < num_threads-1; ik++) |
3538: { |
3539: C_diag_array[ik+1] += C_diag_array[ik]; |
3540: C_offd_array[ik+1] += C_offd_array[ik]; |
3541: } |
3542: nnz_d = C_diag_array[num_threads-1]; |
3543: nnz_o = C_offd_array[num_threads-1]; |
3544: C_diag_i[num_cols_diag_A] = nnz_d; |
3545: C_offd_i[num_cols_diag_A] = nnz_o; |
3546: |
3547: C_diag = hypre_CSRMatrixCreate(num_cols_diag_A, num_cols_diag_A, nnz_d); |
3548: C_offd = hypre_CSRMatrixCreate(num_cols_diag_A, num_cols_offd_C, nnz_o); |
3549: hypre_CSRMatrixI(C_diag) = C_diag_i; |
3550: hypre_CSRMatrixInitialize(C_diag); |
3551: C_diag_j = hypre_CSRMatrixJ(C_diag); |
3552: C_diag_data = hypre_CSRMatrixData(C_diag); |
3553: hypre_CSRMatrixI(C_offd) = C_offd_i; |
3554: hypre_CSRMatrixInitialize(C_offd); |
3555: C_offd_j = hypre_CSRMatrixJ(C_offd); |
3556: C_offd_data = hypre_CSRMatrixData(C_offd); |
[...] |
3568: for (ik = 0; ik < num_cols_diag_B; ik++) |
3569: B_marker[ik] = -1; |
3570: |
3571: for (ik = 0; ik < num_cols_offd_C; ik++) |
3572: B_marker_offd[ik] = -1; |
[...] |
3581: if (ii) |
3582: { |
3583: nnz_d = C_diag_array[ii-1]; |
3584: nnz_o = C_offd_array[ii-1]; |
3585: } |
3586: for (ik = ns; ik < ne; ik++) |
3587: { |
3588: C_diag_i[ik] = nnz_d; |
3589: C_offd_i[ik] = nnz_o; |
3590: for (jk = C_tmp_diag_i[ik]; jk < C_tmp_diag_i[ik+1]; jk++) |
3591: { |
3592: jcol = C_tmp_diag_j[jk]; |
3593: C_diag_j[nnz_d] = jcol; |
3594: C_diag_data[nnz_d] = C_tmp_diag_data[jk]; |
3595: B_marker[jcol] = nnz_d; |
3596: nnz_d++; |
3597: } |
3598: for (jk = C_tmp_offd_i[ik]; jk < C_tmp_offd_i[ik+1]; jk++) |
3599: { |
3600: jcol = C_tmp_offd_j[jk]; |
3601: C_offd_j[nnz_o] = jcol; |
3602: C_offd_data[nnz_o] = C_tmp_offd_data[jk]; |
3603: B_marker_offd[jcol] = nnz_o; |
3604: nnz_o++; |
3605: } |
3606: for (jk = 0; jk < num_sends_A; jk++) |
3607: for (j1 = send_map_starts_A[jk]; j1 < send_map_starts_A[jk+1]; j1++) |
3608: if (send_map_elmts_A[j1] == ik) |
3609: { |
3610: for (j2 = C_ext_diag_i[j1]; j2 < C_ext_diag_i[j1+1]; j2++) |
3611: { |
3612: jcol = C_ext_diag_j[j2]; |
3613: if (B_marker[jcol] < C_diag_i[ik]) |
3614: { |
3615: C_diag_j[nnz_d] = jcol; |
3616: C_diag_data[nnz_d] = C_ext_diag_data[j2]; |
3617: B_marker[jcol] = nnz_d; |
3618: nnz_d++; |
3619: } |
3620: else |
3621: C_diag_data[B_marker[jcol]] += C_ext_diag_data[j2]; |
3622: } |
3623: for (j2 = C_ext_offd_i[j1]; j2 < C_ext_offd_i[j1+1]; j2++) |
3624: { |
3625: jcol = C_ext_offd_j[j2]; |
3626: if (B_marker_offd[jcol] < C_offd_i[ik]) |
3627: { |
3628: C_offd_j[nnz_o] = jcol; |
3629: C_offd_data[nnz_o] = C_ext_offd_data[j2]; |
3630: B_marker_offd[jcol] = nnz_o; |
3631: nnz_o++; |
3632: } |
3633: else |
3634: C_offd_data[B_marker_offd[jcol]] += C_ext_offd_data[j2]; |
3635: } |
3636: break; |
3637: } |
3638: } |
3639: hypre_TFree(B_marker); |
3640: hypre_TFree(B_marker_offd); |
0x4b23c0 PUSH %RBP |
0x4b23c1 MOV %RSP,%RBP |
0x4b23c4 PUSH %R15 |
0x4b23c6 PUSH %R14 |
0x4b23c8 PUSH %R13 |
0x4b23ca PUSH %R12 |
0x4b23cc PUSH %RBX |
0x4b23cd SUB $0x118,%RSP |
0x4b23d4 MOV %R9,-0xa0(%RBP) |
0x4b23db MOV %R8,-0x138(%RBP) |
0x4b23e2 MOV %RCX,%RBX |
0x4b23e5 MOV %RDX,%R14 |
0x4b23e8 MOV %RDI,%R13 |
0x4b23eb MOV 0xc8(%RBP),%RAX |
0x4b23f2 MOV %RAX,-0xd0(%RBP) |
0x4b23f9 MOV 0xc0(%RBP),%RAX |
0x4b2400 MOV %RAX,-0xc8(%RBP) |
0x4b2407 MOV 0xb8(%RBP),%RAX |
0x4b240e MOV %RAX,-0x90(%RBP) |
0x4b2415 MOV 0xb0(%RBP),%RAX |
0x4b241c MOV %RAX,-0x38(%RBP) |
0x4b2420 MOV 0xa8(%RBP),%RAX |
0x4b2427 MOV %RAX,-0x68(%RBP) |
0x4b242b MOV 0xa0(%RBP),%RAX |
0x4b2432 MOV %RAX,-0x40(%RBP) |
0x4b2436 MOV 0x98(%RBP),%RAX |
0x4b243d MOV %RAX,-0xf8(%RBP) |
0x4b2444 MOV 0x90(%RBP),%RAX |
0x4b244b MOV %RAX,-0xb0(%RBP) |
0x4b2452 MOV 0x88(%RBP),%RAX |
0x4b2459 MOV %RAX,-0x98(%RBP) |
0x4b2460 MOV 0x80(%RBP),%RAX |
0x4b2467 MOV %RAX,-0x78(%RBP) |
0x4b246b MOV 0x78(%RBP),%RAX |
0x4b246f MOV %RAX,-0x108(%RBP) |
0x4b2476 MOV 0x70(%RBP),%RAX |
0x4b247a MOV %RAX,-0xe8(%RBP) |
0x4b2481 MOV 0x68(%RBP),%RAX |
0x4b2485 MOV %RAX,-0x58(%RBP) |
0x4b2489 MOV 0x60(%RBP),%RAX |
0x4b248d MOV %RAX,-0x50(%RBP) |
0x4b2491 MOV 0x58(%RBP),%R12 |
0x4b2495 MOV 0x50(%RBP),%RAX |
0x4b2499 MOV %RAX,-0xe0(%RBP) |
0x4b24a0 MOV 0x48(%RBP),%RAX |
0x4b24a4 MOV %RAX,-0x118(%RBP) |
0x4b24ab MOV 0x40(%RBP),%RAX |
0x4b24af MOV %RAX,-0xc0(%RBP) |
0x4b24b6 MOV 0x38(%RBP),%RAX |
0x4b24ba MOV %RAX,-0x110(%RBP) |
0x4b24c1 MOV 0x30(%RBP),%RAX |
0x4b24c5 MOV %RAX,-0x70(%RBP) |
0x4b24c9 MOV 0x28(%RBP),%RAX |
0x4b24cd MOV %RAX,-0xb8(%RBP) |
0x4b24d4 MOV 0x20(%RBP),%RAX |
0x4b24d8 MOV %RAX,-0x130(%RBP) |
0x4b24df MOV 0x18(%RBP),%RAX |
0x4b24e3 MOV %RAX,-0xf0(%RBP) |
0x4b24ea MOV 0x10(%RBP),%RAX |
0x4b24ee MOV %RAX,-0xa8(%RBP) |
0x4b24f5 CALL 4d6de0 <hypre_NumActiveThreads> |
0x4b24fa MOV %RAX,%RCX |
0x4b24fd MOV %R14,%RAX |
0x4b2500 OR %RCX,%RAX |
0x4b2503 SHR $0x20,%RAX |
0x4b2507 MOV %R14,-0x128(%RBP) |
0x4b250e MOV %RCX,-0x120(%RBP) |
0x4b2515 JE 4b2527 |
0x4b2517 MOV %R14,%RAX |
0x4b251a CQTO |
0x4b251c IDIV %RCX |
0x4b251f MOV %RDX,%R15 |
0x4b2522 MOV %RAX,%R14 |
0x4b2525 JMP 4b2534 |
0x4b2527 MOV %R14D,%EAX |
0x4b252a XOR %EDX,%EDX |
0x4b252c DIV %ECX |
0x4b252e MOV %EDX,%R15D |
0x4b2531 MOV %EAX,%R14D |
0x4b2534 CALL 4d6df0 <hypre_GetThreadNum> |
0x4b2539 LEA 0x1(%RAX),%RCX |
0x4b253d CMP %R15,%RAX |
0x4b2540 MOV %RAX,-0xd8(%RBP) |
0x4b2547 MOV %R13,-0x100(%RBP) |
0x4b254e JGE 4b2561 |
0x4b2550 INC %R14 |
0x4b2553 IMUL %R14,%RAX |
0x4b2557 MOV %RAX,-0x48(%RBP) |
0x4b255b IMUL %R14,%RCX |
0x4b255f JMP 4b2573 |
0x4b2561 IMUL %R14,%RAX |
0x4b2565 ADD %R15,%RAX |
0x4b2568 MOV %RAX,-0x48(%RBP) |
0x4b256c IMUL %R14,%RCX |
0x4b2570 ADD %R15,%RCX |
0x4b2573 MOV %RCX,-0x80(%RBP) |
0x4b2577 MOV $0x8,%ESI |
0x4b257c MOV %RBX,%RDI |
0x4b257f CALL 4d5130 <hypre_CAlloc> |
0x4b2584 MOV %RAX,%R13 |
0x4b2587 MOV -0x90(%RBP),%RAX |
0x4b258e MOV (%RAX),%RDI |
0x4b2591 MOV $0x8,%ESI |
0x4b2596 CALL 4d5130 <hypre_CAlloc> |
0x4b259b MOV %RAX,%R15 |
0x4b259e TEST %RBX,%RBX |
0x4b25a1 MOV -0x40(%RBP),%R14 |
0x4b25a5 JLE 4b25bc |
0x4b25a7 LEA (,%RBX,8),%RDX |
0x4b25af MOV %R13,%RDI |
0x4b25b2 MOV $0xff,%ESI |
0x4b25b7 CALL 4e0070 <__intel_avx_rep_memset> |
0x4b25bc MOV %RBX,-0x140(%RBP) |
0x4b25c3 MOV %R13,-0x30(%RBP) |
0x4b25c7 MOV -0x90(%RBP),%RDX |
0x4b25ce CMPQ $0,(%RDX) |
0x4b25d2 MOV -0x80(%RBP),%RCX |
0x4b25d6 JLE 4b25f0 |
0x4b25d8 XOR %EAX,%EAX |
0x4b25da NOPW (%RAX,%RAX,1) |
(3474) 0x4b25e0 MOVQ $-0x1,(%R15,%RAX,8) |
(3474) 0x4b25e8 INC %RAX |
(3474) 0x4b25eb CMP (%RDX),%RAX |
(3474) 0x4b25ee JL 4b25e0 |
0x4b25f0 MOV -0x48(%RBP),%RAX |
0x4b25f4 CMP %RCX,%RAX |
0x4b25f7 MOV -0x38(%RBP),%RBX |
0x4b25fb MOV -0x50(%RBP),%R11 |
0x4b25ff MOV %R12,-0x88(%RBP) |
0x4b2606 MOV -0x30(%RBP),%R13 |
0x4b260a JGE 4b2902 |
0x4b2610 XOR %EAX,%EAX |
0x4b2612 MOV -0x48(%RBP),%RDX |
0x4b2616 XOR %ECX,%ECX |
0x4b2618 JMP 4b264a |
0x4b261a NOPW (%RAX,%RAX,1) |
(3465) 0x4b2620 MOV -0xc8(%RBP),%RDX |
(3465) 0x4b2627 MOV -0xd8(%RBP),%RSI |
(3465) 0x4b262e MOV %RCX,(%RDX,%RSI,8) |
(3465) 0x4b2632 MOV -0xd0(%RBP),%RDX |
(3465) 0x4b2639 MOV %RAX,(%RDX,%RSI,8) |
(3465) 0x4b263d MOV %R10,%RDX |
(3465) 0x4b2640 CMP -0x80(%RBP),%R10 |
(3465) 0x4b2644 JGE 4b2902 |
(3465) 0x4b264a MOV (%R12,%RDX,8),%RSI |
(3465) 0x4b264e LEA 0x1(%RDX),%R10 |
(3465) 0x4b2652 CMP 0x8(%R12,%RDX,8),%RSI |
(3465) 0x4b2657 MOV -0x108(%RBP),%R8 |
(3465) 0x4b265e MOV -0xe8(%RBP),%R9 |
(3465) 0x4b2665 JGE 4b2685 |
(3465) 0x4b2667 NOPW (%RAX,%RAX,1) |
(3473) 0x4b2670 MOV (%R11,%RSI,8),%RDI |
(3473) 0x4b2674 MOV %RDX,(%R13,%RDI,8) |
(3473) 0x4b2679 INC %RCX |
(3473) 0x4b267c INC %RSI |
(3473) 0x4b267f CMP (%R12,%R10,8),%RSI |
(3473) 0x4b2683 JL 4b2670 |
(3465) 0x4b2685 MOV (%R9,%RDX,8),%RSI |
(3465) 0x4b2689 CMP (%R9,%R10,8),%RSI |
(3465) 0x4b268d JGE 4b26a4 |
(3465) 0x4b268f NOP |
(3472) 0x4b2690 MOV (%R8,%RSI,8),%RDI |
(3472) 0x4b2694 MOV %RDX,(%R15,%RDI,8) |
(3472) 0x4b2698 INC %RAX |
(3472) 0x4b269b INC %RSI |
(3472) 0x4b269e CMP (%R9,%R10,8),%RSI |
(3472) 0x4b26a2 JL 4b2690 |
(3465) 0x4b26a4 TEST %RBX,%RBX |
(3465) 0x4b26a7 JLE 4b2620 |
(3465) 0x4b26ad VPBROADCASTQ %RDX,%YMM0 |
(3465) 0x4b26b3 XOR %EDI,%EDI |
(3465) 0x4b26b5 MOV %R10,-0x60(%RBP) |
(3465) 0x4b26b9 NOPL (%RAX) |
(3466) 0x4b26c0 MOV (%R14,%RDI,8),%R10 |
(3466) 0x4b26c4 MOV 0x8(%R14,%RDI,8),%R9 |
(3466) 0x4b26c9 MOV %R9,%R11 |
(3466) 0x4b26cc SUB %R10,%R11 |
(3466) 0x4b26cf JLE 4b27b0 |
(3466) 0x4b26d5 MOV -0x68(%RBP),%RSI |
(3466) 0x4b26d9 LEA (%RSI,%R10,8),%ESI |
(3466) 0x4b26dd AND $0x7f,%ESI |
(3466) 0x4b26e0 MOV $0x80,%EBX |
(3466) 0x4b26e5 SUB %ESI,%EBX |
(3466) 0x4b26e7 SHR $0x3,%EBX |
(3466) 0x4b26ea CMP %RBX,%R11 |
(3466) 0x4b26ed MOV %RBX,%RSI |
(3466) 0x4b26f0 CMOVB %R11,%RSI |
(3466) 0x4b26f4 TEST %RSI,%RSI |
(3466) 0x4b26f7 JE 4b2723 |
(3466) 0x4b26f9 MOV %R10,%R8 |
(3466) 0x4b26fc MOV %RSI,%R14 |
(3466) 0x4b26ff MOV -0x68(%RBP),%R13 |
(3466) 0x4b2703 NOPW %CS:(%RAX,%RAX,1) |
(3471) 0x4b2710 CMP %RDX,(%R13,%R8,8) |
(3471) 0x4b2715 JE 4b27e5 |
(3471) 0x4b271b INC %R8 |
(3471) 0x4b271e DEC %R14 |
(3471) 0x4b2721 JNE 4b2710 |
(3466) 0x4b2723 CMP %R11,%RBX |
(3466) 0x4b2726 MOV -0x30(%RBP),%R13 |
(3466) 0x4b272a JAE 4b27b6 |
(3466) 0x4b2730 SUB %RSI,%R11 |
(3466) 0x4b2733 MOV %R11,%RBX |
(3466) 0x4b2736 AND $-0x10,%RBX |
(3466) 0x4b273a JE 4b278a |
(3466) 0x4b273c LEA -0x1(%RBX),%R13 |
(3466) 0x4b2740 LEA (%R10,%RSI,1),%R8 |
(3466) 0x4b2744 MOV -0x68(%RBP),%R14 |
(3466) 0x4b2748 LEA (%R14,%R8,8),%R14 |
(3466) 0x4b274c XOR %R12D,%R12D |
(3466) 0x4b274f NOP |
(3470) 0x4b2750 VPCMPEQQ 0x20(%R14,%R12,8),%YMM0,%K0 |
(3470) 0x4b2758 VPCMPEQQ (%R14,%R12,8),%YMM0,%K1 |
(3470) 0x4b275f VPCMPEQQ 0x60(%R14,%R12,8),%YMM0,%K2 |
(3470) 0x4b2767 VPCMPEQQ 0x40(%R14,%R12,8),%YMM0,%K3 |
(3470) 0x4b276f KORB %K0,%K1,%K4 |
(3470) 0x4b2773 KORB %K2,%K3,%K5 |
(3470) 0x4b2777 KORTESTB %K5,%K4 |
(3470) 0x4b277b JNE 4b2830 |
(3470) 0x4b2781 ADD $0x10,%R12 |
(3470) 0x4b2785 CMP %R13,%R12 |
(3470) 0x4b2788 JBE 4b2750 |
(3466) 0x4b278a CMP %R11,%RBX |
(3466) 0x4b278d JNE 4b27f7 |
(3466) 0x4b278f MOV -0x38(%RBP),%RBX |
(3466) 0x4b2793 MOV -0x40(%RBP),%R14 |
(3466) 0x4b2797 MOV -0x50(%RBP),%R11 |
(3466) 0x4b279b MOV -0x88(%RBP),%R12 |
(3466) 0x4b27a2 MOV -0x30(%RBP),%R13 |
(3466) 0x4b27a6 JMP 4b27d0 |
0x4b27a8 NOPL (%RAX,%RAX,1) |
(3466) 0x4b27b0 MOV -0x50(%RBP),%R11 |
(3466) 0x4b27b4 JMP 4b27d0 |
(3466) 0x4b27b6 MOV -0x40(%RBP),%R14 |
(3466) 0x4b27ba MOV -0x50(%RBP),%R11 |
(3466) 0x4b27be MOV -0x38(%RBP),%RBX |
(3466) 0x4b27c2 NOPW %CS:(%RAX,%RAX,1) |
(3466) 0x4b27d0 MOV -0x60(%RBP),%R10 |
(3466) 0x4b27d4 INC %RDI |
(3466) 0x4b27d7 CMP %RBX,%RDI |
(3466) 0x4b27da JNE 4b26c0 |
(3465) 0x4b27e0 JMP 4b2620 |
(3466) 0x4b27e5 MOV -0x40(%RBP),%R14 |
(3466) 0x4b27e9 MOV -0x50(%RBP),%R11 |
(3466) 0x4b27ed MOV -0x30(%RBP),%R13 |
(3466) 0x4b27f1 MOV -0x38(%RBP),%RBX |
(3466) 0x4b27f5 JMP 4b286d |
(3466) 0x4b27f7 ADD %RSI,%R10 |
(3466) 0x4b27fa ADD %RBX,%R10 |
(3466) 0x4b27fd MOV %R10,%R8 |
(3466) 0x4b2800 MOV -0x38(%RBP),%RBX |
(3466) 0x4b2804 MOV -0x40(%RBP),%R14 |
(3466) 0x4b2808 MOV -0x50(%RBP),%R11 |
(3466) 0x4b280c MOV -0x88(%RBP),%R12 |
(3466) 0x4b2813 MOV -0x30(%RBP),%R13 |
(3466) 0x4b2817 MOV -0x60(%RBP),%R10 |
(3466) 0x4b281b MOV -0x68(%RBP),%RSI |
(3466) 0x4b281f NOP |
(3469) 0x4b2820 CMP %RDX,(%RSI,%R8,8) |
(3469) 0x4b2824 JE 4b286d |
(3469) 0x4b2826 INC %R8 |
(3469) 0x4b2829 CMP %R8,%R9 |
(3469) 0x4b282c JNE 4b2820 |
(3466) 0x4b282e JMP 4b27d4 |
(3466) 0x4b2830 KSHIFTLB $0x4,%K0,%K0 |
(3466) 0x4b2836 KORB %K0,%K1,%K0 |
(3466) 0x4b283a KSHIFTLB $0x4,%K2,%K1 |
(3466) 0x4b2840 KORB %K1,%K3,%K1 |
(3466) 0x4b2844 KUNPCKBW %K0,%K1,%K0 |
(3466) 0x4b2848 KMOVD %K0,%ESI |
(3466) 0x4b284c TZCNT %ESI,%ESI |
(3466) 0x4b2850 ADD %R12,%R8 |
(3466) 0x4b2853 ADD %RSI,%R8 |
(3466) 0x4b2856 MOV -0x38(%RBP),%RBX |
(3466) 0x4b285a MOV -0x40(%RBP),%R14 |
(3466) 0x4b285e MOV -0x50(%RBP),%R11 |
(3466) 0x4b2862 MOV -0x88(%RBP),%R12 |
(3466) 0x4b2869 MOV -0x30(%RBP),%R13 |
(3466) 0x4b286d MOV -0xb8(%RBP),%R9 |
(3466) 0x4b2874 MOV (%R9,%R8,8),%RSI |
(3466) 0x4b2878 MOV 0x8(%R9,%R8,8),%R9 |
(3466) 0x4b287d JMP 4b2883 |
0x4b287f NOP |
(3468) 0x4b2880 INC %RSI |
(3468) 0x4b2883 CMP %R9,%RSI |
(3468) 0x4b2886 JGE 4b28b0 |
(3468) 0x4b2888 MOV -0x70(%RBP),%R10 |
(3468) 0x4b288c MOV (%R10,%RSI,8),%R10 |
(3468) 0x4b2890 CMP %RDX,(%R13,%R10,8) |
(3468) 0x4b2895 JGE 4b2880 |
(3468) 0x4b2897 MOV %RDX,(%R13,%R10,8) |
(3468) 0x4b289c INC %RCX |
(3468) 0x4b289f MOV -0xb8(%RBP),%R9 |
(3468) 0x4b28a6 MOV 0x8(%R9,%R8,8),%R9 |
(3468) 0x4b28ab JMP 4b2880 |
0x4b28ad NOPL (%RAX) |
(3466) 0x4b28b0 MOV -0xc0(%RBP),%R9 |
(3466) 0x4b28b7 MOV (%R9,%R8,8),%RSI |
(3466) 0x4b28bb MOV 0x8(%R9,%R8,8),%R9 |
(3466) 0x4b28c0 JMP 4b28d3 |
0x4b28c2 NOPW %CS:(%RAX,%RAX,1) |
(3467) 0x4b28d0 INC %RSI |
(3467) 0x4b28d3 CMP %R9,%RSI |
(3467) 0x4b28d6 JGE 4b27d0 |
(3467) 0x4b28dc MOV -0x118(%RBP),%R10 |
(3467) 0x4b28e3 MOV (%R10,%RSI,8),%R10 |
(3467) 0x4b28e7 CMP %RDX,(%R15,%R10,8) |
(3467) 0x4b28eb JGE 4b28d0 |
(3467) 0x4b28ed MOV %RDX,(%R15,%R10,8) |
(3467) 0x4b28f1 INC %RAX |
(3467) 0x4b28f4 MOV -0xc0(%RBP),%R9 |
(3467) 0x4b28fb MOV 0x8(%R9,%R8,8),%R9 |
(3467) 0x4b2900 JMP 4b28d0 |
0x4b2902 MOV -0x100(%RBP),%RBX |
0x4b2909 MOV (%RBX),%ESI |
0x4b290b MOV $0x7192b0,%EDI |
0x4b2910 VZEROUPPER |
0x4b2913 CALL 40fef0 <__kmpc_barrier@plt> |
0x4b2918 CMPQ $0,-0xd8(%RBP) |
0x4b2920 JNE 4b2b55 |
0x4b2926 MOV -0x120(%RBP),%RDI |
0x4b292d CMP $0x1,%RDI |
0x4b2931 MOV -0xd0(%RBP),%R10 |
0x4b2938 MOV -0xc8(%RBP),%R11 |
0x4b293f JLE 4b2a8c |
0x4b2945 LEA -0x1(%RDI),%RAX |
0x4b2949 LEA (%R11,%RAX,8),%RCX |
0x4b294d CMP %R10,%RCX |
0x4b2950 JB 4b29b1 |
0x4b2952 LEA (%R10,%RAX,8),%RCX |
0x4b2956 CMP %R11,%RCX |
0x4b2959 JB 4b29b1 |
0x4b295b LEA (%R10,%RDI,8),%RAX |
0x4b295f CMP %R11,%RAX |
0x4b2962 JBE 4b2a5e |
0x4b2968 LEA (%R11,%RDI,8),%RAX |
0x4b296c CMP %R10,%RAX |
0x4b296f JBE 4b2a5e |
0x4b2975 MOV $0x1,%EAX |
0x4b297a NOPW (%RAX,%RAX,1) |
(3464) 0x4b2980 MOV -0x8(%R11,%RAX,8),%RCX |
(3464) 0x4b2985 LEA (%R11,%RAX,8),%RDX |
(3464) 0x4b2989 MOV (%RDX),%RSI |
(3464) 0x4b298c ADD %RCX,%RSI |
(3464) 0x4b298f MOV %RSI,(%RDX) |
(3464) 0x4b2992 MOV -0x8(%R10,%RAX,8),%RCX |
(3464) 0x4b2997 LEA (%R10,%RAX,8),%RDX |
(3464) 0x4b299b MOV (%RDX),%RSI |
(3464) 0x4b299e ADD %RCX,%RSI |
(3464) 0x4b29a1 MOV %RSI,(%RDX) |
(3464) 0x4b29a4 INC %RAX |
(3464) 0x4b29a7 CMP %RAX,%RDI |
(3464) 0x4b29aa JNE 4b2980 |
0x4b29ac JMP 4b2a8c |
0x4b29b1 MOV %RDI,%RBX |
0x4b29b4 CMP $0x5,%RDI |
0x4b29b8 JB 4b2a1d |
0x4b29ba MOV %RAX,%RCX |
0x4b29bd SHR $0x2,%RCX |
0x4b29c1 MOV (%R11),%RDX |
0x4b29c4 MOV (%R10),%RSI |
0x4b29c7 MOV $0x20,%EDI |
0x4b29cc NOPL (%RAX) |
(3462) 0x4b29d0 LEA (%R11,%RDI,1),%R8 |
(3462) 0x4b29d4 ADD -0x18(%R8),%RDX |
(3462) 0x4b29d8 MOV %RDX,-0x18(%R8) |
(3462) 0x4b29dc LEA (%R10,%RDI,1),%R9 |
(3462) 0x4b29e0 ADD -0x18(%R9),%RSI |
(3462) 0x4b29e4 MOV %RSI,-0x18(%R9) |
(3462) 0x4b29e8 ADD -0x10(%R8),%RDX |
(3462) 0x4b29ec MOV %RDX,-0x10(%R8) |
(3462) 0x4b29f0 ADD -0x10(%R9),%RSI |
(3462) 0x4b29f4 MOV %RSI,-0x10(%R9) |
(3462) 0x4b29f8 ADD -0x8(%R8),%RDX |
(3462) 0x4b29fc MOV %RDX,-0x8(%R8) |
(3462) 0x4b2a00 ADD -0x8(%R9),%RSI |
(3462) 0x4b2a04 MOV %RSI,-0x8(%R9) |
(3462) 0x4b2a08 ADD (%R8),%RDX |
(3462) 0x4b2a0b MOV %RDX,(%R8) |
(3462) 0x4b2a0e ADD (%R9),%RSI |
(3462) 0x4b2a11 MOV %RSI,(%R9) |
(3462) 0x4b2a14 ADD $0x20,%RDI |
(3462) 0x4b2a18 DEC %RCX |
(3462) 0x4b2a1b JNE 4b29d0 |
0x4b2a1d MOV %RAX,%RCX |
0x4b2a20 AND $-0x4,%RCX |
0x4b2a24 CMP %RAX,%RCX |
0x4b2a27 MOV %RBX,%RDI |
0x4b2a2a JE 4b2a8c |
0x4b2a2c MOV (%R11,%RCX,8),%RAX |
0x4b2a30 MOV (%R10,%RCX,8),%RDX |
0x4b2a34 INC %RCX |
0x4b2a37 NOPW (%RAX,%RAX,1) |
(3461) 0x4b2a40 LEA (%R11,%RCX,8),%RSI |
(3461) 0x4b2a44 ADD (%RSI),%RAX |
(3461) 0x4b2a47 MOV %RAX,(%RSI) |
(3461) 0x4b2a4a LEA (%R10,%RCX,8),%RSI |
(3461) 0x4b2a4e ADD (%RSI),%RDX |
(3461) 0x4b2a51 MOV %RDX,(%RSI) |
(3461) 0x4b2a54 INC %RCX |
(3461) 0x4b2a57 CMP %RCX,%RDI |
(3461) 0x4b2a5a JNE 4b2a40 |
0x4b2a5c JMP 4b2a8c |
0x4b2a5e MOV (%R11),%RAX |
0x4b2a61 MOV (%R10),%RCX |
0x4b2a64 MOV $0x1,%EDX |
0x4b2a69 NOPL (%RAX) |
(3463) 0x4b2a70 LEA (%R11,%RDX,8),%RSI |
(3463) 0x4b2a74 ADD (%RSI),%RAX |
(3463) 0x4b2a77 MOV %RAX,(%RSI) |
(3463) 0x4b2a7a LEA (%R10,%RDX,8),%RSI |
(3463) 0x4b2a7e ADD (%RSI),%RCX |
(3463) 0x4b2a81 MOV %RCX,(%RSI) |
(3463) 0x4b2a84 INC %RDX |
(3463) 0x4b2a87 CMP %RDX,%RDI |
(3463) 0x4b2a8a JNE 4b2a70 |
0x4b2a8c MOV -0x8(%R11,%RDI,8),%RDX |
0x4b2a91 MOV -0x8(%R10,%RDI,8),%RCX |
0x4b2a96 MOV %RCX,-0x60(%RBP) |
0x4b2a9a MOV -0x128(%RBP),%RBX |
0x4b2aa1 MOV -0xa8(%RBP),%RAX |
0x4b2aa8 MOV %RDX,(%RAX,%RBX,8) |
0x4b2aac MOV -0xb0(%RBP),%RAX |
0x4b2ab3 MOV %RCX,(%RAX,%RBX,8) |
0x4b2ab7 MOV %RBX,%RDI |
0x4b2aba MOV %RBX,%RSI |
0x4b2abd CALL 4ca550 <hypre_CSRMatrixCreate> |
0x4b2ac2 MOV -0x138(%RBP),%R14 |
0x4b2ac9 MOV %RAX,(%R14) |
0x4b2acc MOV -0x90(%RBP),%RAX |
0x4b2ad3 MOV (%RAX),%RSI |
0x4b2ad6 MOV %RBX,%RDI |
0x4b2ad9 MOV -0x60(%RBP),%RDX |
0x4b2add CALL 4ca550 <hypre_CSRMatrixCreate> |
0x4b2ae2 MOV -0x130(%RBP),%RBX |
0x4b2ae9 MOV %RAX,(%RBX) |
0x4b2aec MOV (%R14),%RDI |
0x4b2aef MOV -0xa8(%RBP),%RAX |
0x4b2af6 MOV %RAX,(%RDI) |
0x4b2af9 CALL 4ca630 <hypre_CSRMatrixInitialize> |
0x4b2afe MOV (%R14),%RAX |
0x4b2b01 MOV 0x8(%RAX),%RCX |
0x4b2b05 MOV -0xf0(%RBP),%RDX |
0x4b2b0c MOV %RCX,(%RDX) |
0x4b2b0f MOV 0x30(%RAX),%RAX |
0x4b2b13 MOV -0xa0(%RBP),%RCX |
0x4b2b1a MOV %RAX,(%RCX) |
0x4b2b1d MOV (%RBX),%RDI |
0x4b2b20 MOV -0xb0(%RBP),%RAX |
0x4b2b27 MOV %RAX,(%RDI) |
0x4b2b2a CALL 4ca630 <hypre_CSRMatrixInitialize> |
0x4b2b2f MOV (%RBX),%RAX |
0x4b2b32 MOV 0x8(%RAX),%RCX |
0x4b2b36 MOV -0xf8(%RBP),%RDX |
0x4b2b3d MOV %RCX,(%RDX) |
0x4b2b40 MOV 0x30(%RAX),%RAX |
0x4b2b44 MOV -0x98(%RBP),%RCX |
0x4b2b4b MOV %RAX,(%RCX) |
0x4b2b4e MOV -0x100(%RBP),%RBX |
0x4b2b55 MOV (%RBX),%ESI |
0x4b2b57 MOV $0x7192d0,%EDI |
0x4b2b5c CALL 40fef0 <__kmpc_barrier@plt> |
0x4b2b61 MOV -0x140(%RBP),%RDX |
0x4b2b68 TEST %RDX,%RDX |
0x4b2b6b JLE 4b2b7e |
0x4b2b6d SAL $0x3,%RDX |
0x4b2b71 MOV %R13,%RDI |
0x4b2b74 MOV $0xff,%ESI |
0x4b2b79 CALL 4e0070 <__intel_avx_rep_memset> |
0x4b2b7e MOV -0x90(%RBP),%RCX |
0x4b2b85 CMPQ $0,(%RCX) |
0x4b2b89 MOV -0xd8(%RBP),%RSI |
0x4b2b90 JLE 4b2bb0 |
0x4b2b92 XOR %EAX,%EAX |
0x4b2b94 NOPW %CS:(%RAX,%RAX,1) |
(3460) 0x4b2ba0 MOVQ $-0x1,(%R15,%RAX,8) |
(3460) 0x4b2ba8 INC %RAX |
(3460) 0x4b2bab CMP (%RCX),%RAX |
(3460) 0x4b2bae JL 4b2ba0 |
0x4b2bb0 TEST %RSI,%RSI |
0x4b2bb3 MOV -0x78(%RBP),%R11 |
0x4b2bb7 MOV -0x58(%RBP),%R10 |
0x4b2bbb MOV -0x80(%RBP),%RDX |
0x4b2bbf JE 4b2bdb |
0x4b2bc1 MOV -0xc8(%RBP),%RAX |
0x4b2bc8 MOV -0x8(%RAX,%RSI,8),%RAX |
0x4b2bcd MOV -0xd0(%RBP),%RCX |
0x4b2bd4 MOV -0x8(%RCX,%RSI,8),%RCX |
0x4b2bd9 JMP 4b2bdf |
0x4b2bdb XOR %EAX,%EAX |
0x4b2bdd XOR %ECX,%ECX |
0x4b2bdf MOV -0x48(%RBP),%RSI |
0x4b2be3 CMP %RDX,%RSI |
0x4b2be6 JL 4b2c28 |
0x4b2be8 MOV %R13,%RDI |
0x4b2beb VZEROUPPER |
0x4b2bee CALL 4d5200 <hypre_Free> |
0x4b2bf3 MOV %R15,%RDI |
0x4b2bf6 ADD $0x118,%RSP |
0x4b2bfd POP %RBX |
0x4b2bfe POP %R12 |
0x4b2c00 POP %R13 |
0x4b2c02 POP %R14 |
0x4b2c04 POP %R15 |
0x4b2c06 POP %RBP |
0x4b2c07 JMP 4d5200 |
0x4b2c0c NOPL (%RAX) |
(3451) 0x4b2c10 MOV -0x58(%RBP),%R10 |
(3451) 0x4b2c14 MOV -0x80(%RBP),%RDX |
(3451) 0x4b2c18 MOV -0x48(%RBP),%RSI |
(3451) 0x4b2c1c CMP %RDX,%RSI |
(3451) 0x4b2c1f MOV -0x88(%RBP),%R12 |
(3451) 0x4b2c26 JGE 4b2be8 |
(3451) 0x4b2c28 MOV %RSI,%RDX |
(3451) 0x4b2c2b MOV -0xa8(%RBP),%RSI |
(3451) 0x4b2c32 MOV %RAX,(%RSI,%RDX,8) |
(3451) 0x4b2c36 MOV -0xb0(%RBP),%RSI |
(3451) 0x4b2c3d MOV %RCX,(%RSI,%RDX,8) |
(3451) 0x4b2c41 MOV (%R12,%RDX,8),%RSI |
(3451) 0x4b2c45 LEA 0x1(%RDX),%RDI |
(3451) 0x4b2c49 MOV %RDI,-0x48(%RBP) |
(3451) 0x4b2c4d CMP 0x8(%R12,%RDX,8),%RSI |
(3451) 0x4b2c52 JGE 4b2cb0 |
(3451) 0x4b2c54 MOV -0xf0(%RBP),%RDI |
(3451) 0x4b2c5b MOV (%RDI),%RDI |
(3451) 0x4b2c5e MOV -0xa0(%RBP),%R8 |
(3451) 0x4b2c65 MOV (%R8),%R8 |
(3451) 0x4b2c68 MOV -0x50(%RBP),%R12 |
(3451) 0x4b2c6c MOV -0x88(%RBP),%R13 |
(3451) 0x4b2c73 MOV -0x30(%RBP),%RBX |
(3451) 0x4b2c77 MOV -0x48(%RBP),%R14 |
(3451) 0x4b2c7b NOPL (%RAX,%RAX,1) |
(3459) 0x4b2c80 MOV (%R12,%RSI,8),%R9 |
(3459) 0x4b2c84 MOV %R9,(%RDI,%RAX,8) |
(3459) 0x4b2c88 VMOVQ (%R10,%RSI,8),%XMM0 |
(3459) 0x4b2c8e VMOVQ %XMM0,(%R8,%RAX,8) |
(3459) 0x4b2c94 MOV %RAX,(%RBX,%R9,8) |
(3459) 0x4b2c98 INC %RAX |
(3459) 0x4b2c9b INC %RSI |
(3459) 0x4b2c9e CMP (%R13,%R14,8),%RSI |
(3459) 0x4b2ca3 JL 4b2c80 |
(3451) 0x4b2ca5 JMP 4b2cb4 |
0x4b2ca7 NOPW (%RAX,%RAX,1) |
(3451) 0x4b2cb0 MOV -0x48(%RBP),%R14 |
(3451) 0x4b2cb4 MOV -0xe8(%RBP),%RDI |
(3451) 0x4b2cbb MOV (%RDI,%RDX,8),%RSI |
(3451) 0x4b2cbf CMP (%RDI,%R14,8),%RSI |
(3451) 0x4b2cc3 JGE 4b2d20 |
(3451) 0x4b2cc5 MOV -0xf8(%RBP),%RDI |
(3451) 0x4b2ccc MOV (%RDI),%RDI |
(3451) 0x4b2ccf MOV -0x98(%RBP),%R8 |
(3451) 0x4b2cd6 MOV (%R8),%R8 |
(3451) 0x4b2cd9 MOV -0x108(%RBP),%R10 |
(3451) 0x4b2ce0 MOV -0x70(%RBP),%R12 |
(3451) 0x4b2ce4 MOV -0x30(%RBP),%R13 |
(3451) 0x4b2ce8 MOV -0x38(%RBP),%RBX |
(3451) 0x4b2cec MOV -0x48(%RBP),%R14 |
(3458) 0x4b2cf0 MOV (%R10,%RSI,8),%R9 |
(3458) 0x4b2cf4 MOV %R9,(%RDI,%RCX,8) |
(3458) 0x4b2cf8 VMOVQ (%R11,%RSI,8),%XMM0 |
(3458) 0x4b2cfe VMOVQ %XMM0,(%R8,%RCX,8) |
(3458) 0x4b2d04 MOV %RCX,(%R15,%R9,8) |
(3458) 0x4b2d08 INC %RCX |
(3458) 0x4b2d0b INC %RSI |
(3458) 0x4b2d0e MOV -0xe8(%RBP),%R9 |
(3458) 0x4b2d15 CMP (%R9,%R14,8),%RSI |
(3458) 0x4b2d19 JL 4b2cf0 |
(3451) 0x4b2d1b JMP 4b2d2c |
0x4b2d1d NOPL (%RAX) |
(3451) 0x4b2d20 MOV -0x70(%RBP),%R12 |
(3451) 0x4b2d24 MOV -0x30(%RBP),%R13 |
(3451) 0x4b2d28 MOV -0x38(%RBP),%RBX |
(3451) 0x4b2d2c TEST %RBX,%RBX |
(3451) 0x4b2d2f MOV -0x40(%RBP),%R14 |
(3451) 0x4b2d33 JLE 4b2c10 |
(3451) 0x4b2d39 VPBROADCASTQ %RDX,%YMM0 |
(3451) 0x4b2d3f XOR %ESI,%ESI |
(3451) 0x4b2d41 JMP 4b2d60 |
0x4b2d43 NOPW %CS:(%RAX,%RAX,1) |
(3452) 0x4b2d50 MOV -0x58(%RBP),%R10 |
(3452) 0x4b2d54 INC %RSI |
(3452) 0x4b2d57 CMP %RBX,%RSI |
(3452) 0x4b2d5a JE 4b2c14 |
(3452) 0x4b2d60 MOV (%R14,%RSI,8),%R9 |
(3452) 0x4b2d64 MOV 0x8(%R14,%RSI,8),%R8 |
(3452) 0x4b2d69 MOV %R8,%R10 |
(3452) 0x4b2d6c SUB %R9,%R10 |
(3452) 0x4b2d6f JLE 4b2d50 |
(3452) 0x4b2d71 MOV -0x68(%RBP),%RDI |
(3452) 0x4b2d75 LEA (%RDI,%R9,8),%EDI |
(3452) 0x4b2d79 AND $0x7f,%EDI |
(3452) 0x4b2d7c MOV $0x80,%EBX |
(3452) 0x4b2d81 SUB %EDI,%EBX |
(3452) 0x4b2d83 SHR $0x3,%EBX |
(3452) 0x4b2d86 CMP %RBX,%R10 |
(3452) 0x4b2d89 MOV %RBX,%R11 |
(3452) 0x4b2d8c CMOVB %R10,%R11 |
(3452) 0x4b2d90 TEST %R11,%R11 |
(3452) 0x4b2d93 JE 4b2db3 |
(3452) 0x4b2d95 MOV %R9,%RDI |
(3452) 0x4b2d98 MOV %R11,%R14 |
(3452) 0x4b2d9b MOV -0x68(%RBP),%R13 |
(3452) 0x4b2d9f NOP |
(3457) 0x4b2da0 CMP %RDX,(%R13,%RDI,8) |
(3457) 0x4b2da5 JE 4b2e55 |
(3457) 0x4b2dab INC %RDI |
(3457) 0x4b2dae DEC %R14 |
(3457) 0x4b2db1 JNE 4b2da0 |
(3452) 0x4b2db3 CMP %R10,%RBX |
(3452) 0x4b2db6 JAE 4b2e3c |
(3452) 0x4b2dbc SUB %R11,%R10 |
(3452) 0x4b2dbf MOV %R10,%RBX |
(3452) 0x4b2dc2 AND $-0x10,%RBX |
(3452) 0x4b2dc6 JE 4b2e1a |
(3452) 0x4b2dc8 LEA -0x1(%RBX),%R13 |
(3452) 0x4b2dcc LEA (%R9,%R11,1),%RDI |
(3452) 0x4b2dd0 MOV -0x68(%RBP),%R14 |
(3452) 0x4b2dd4 LEA (%R14,%RDI,8),%R14 |
(3452) 0x4b2dd8 XOR %R12D,%R12D |
(3452) 0x4b2ddb NOPL (%RAX,%RAX,1) |
(3456) 0x4b2de0 VPCMPEQQ 0x20(%R14,%R12,8),%YMM0,%K0 |
(3456) 0x4b2de8 VPCMPEQQ (%R14,%R12,8),%YMM0,%K1 |
(3456) 0x4b2def VPCMPEQQ 0x60(%R14,%R12,8),%YMM0,%K2 |
(3456) 0x4b2df7 VPCMPEQQ 0x40(%R14,%R12,8),%YMM0,%K3 |
(3456) 0x4b2dff KORB %K0,%K1,%K4 |
(3456) 0x4b2e03 KORB %K2,%K3,%K5 |
(3456) 0x4b2e07 KORTESTB %K5,%K4 |
(3456) 0x4b2e0b JNE 4b2ea7 |
(3456) 0x4b2e11 ADD $0x10,%R12 |
(3456) 0x4b2e15 CMP %R13,%R12 |
(3456) 0x4b2e18 JBE 4b2de0 |
(3452) 0x4b2e1a CMP %R10,%RBX |
(3452) 0x4b2e1d JNE 4b2e5e |
(3452) 0x4b2e1f MOV -0x38(%RBP),%RBX |
(3452) 0x4b2e23 MOV -0x40(%RBP),%R14 |
(3452) 0x4b2e27 MOV -0x78(%RBP),%R11 |
(3452) 0x4b2e2b MOV -0x58(%RBP),%R10 |
(3452) 0x4b2e2f MOV -0x70(%RBP),%R12 |
(3452) 0x4b2e33 MOV -0x30(%RBP),%R13 |
(3452) 0x4b2e37 JMP 4b2d54 |
(3452) 0x4b2e3c MOV -0x40(%RBP),%R14 |
(3452) 0x4b2e40 MOV -0x78(%RBP),%R11 |
(3452) 0x4b2e44 MOV -0x58(%RBP),%R10 |
(3452) 0x4b2e48 MOV -0x30(%RBP),%R13 |
(3452) 0x4b2e4c MOV -0x38(%RBP),%RBX |
(3452) 0x4b2e50 JMP 4b2d54 |
(3452) 0x4b2e55 MOV -0xe0(%RBP),%R13 |
(3452) 0x4b2e5c JMP 4b2ed9 |
(3452) 0x4b2e5e ADD %R11,%R9 |
(3452) 0x4b2e61 ADD %RBX,%R9 |
(3452) 0x4b2e64 MOV %R9,%RDI |
(3452) 0x4b2e67 MOV -0x38(%RBP),%RBX |
(3452) 0x4b2e6b MOV -0x40(%RBP),%R14 |
(3452) 0x4b2e6f MOV -0x78(%RBP),%R11 |
(3452) 0x4b2e73 MOV -0x58(%RBP),%R10 |
(3452) 0x4b2e77 MOV -0xe0(%RBP),%R13 |
(3452) 0x4b2e7e MOV -0x70(%RBP),%R12 |
(3452) 0x4b2e82 MOV -0x68(%RBP),%R9 |
(3452) 0x4b2e86 NOPW %CS:(%RAX,%RAX,1) |
(3455) 0x4b2e90 CMP %RDX,(%R9,%RDI,8) |
(3455) 0x4b2e94 JE 4b2ed9 |
(3455) 0x4b2e96 INC %RDI |
(3455) 0x4b2e99 CMP %RDI,%R8 |
(3455) 0x4b2e9c JNE 4b2e90 |
(3452) 0x4b2e9e MOV -0x30(%RBP),%R13 |
(3452) 0x4b2ea2 JMP 4b2d54 |
(3452) 0x4b2ea7 KSHIFTLB $0x4,%K0,%K0 |
(3452) 0x4b2ead KORB %K0,%K1,%K0 |
(3452) 0x4b2eb1 KSHIFTLB $0x4,%K2,%K1 |
(3452) 0x4b2eb7 KORB %K1,%K3,%K1 |
(3452) 0x4b2ebb KUNPCKBW %K0,%K1,%K0 |
(3452) 0x4b2ebf KMOVD %K0,%R8D |
(3452) 0x4b2ec3 TZCNT %R8D,%R8D |
(3452) 0x4b2ec8 ADD %R12,%RDI |
(3452) 0x4b2ecb ADD %R8,%RDI |
(3452) 0x4b2ece MOV -0xe0(%RBP),%R13 |
(3452) 0x4b2ed5 MOV -0x70(%RBP),%R12 |
(3452) 0x4b2ed9 MOV -0xb8(%RBP),%R9 |
(3452) 0x4b2ee0 MOV (%R9,%RDI,8),%R8 |
(3452) 0x4b2ee4 MOV 0x8(%R9,%RDI,8),%R9 |
(3452) 0x4b2ee9 CMP %R9,%R8 |
(3452) 0x4b2eec JGE 4b2f80 |
(3452) 0x4b2ef2 MOV -0x30(%RBP),%R14 |
(3452) 0x4b2ef6 MOV -0xa8(%RBP),%RBX |
(3452) 0x4b2efd JMP 4b2f2f |
0x4b2eff NOP |
(3454) 0x4b2f00 MOV -0xa0(%RBP),%R10 |
(3454) 0x4b2f07 MOV (%R10),%R10 |
(3454) 0x4b2f0a VMOVSD (%R10,%R11,8),%XMM1 |
(3454) 0x4b2f10 MOV -0x110(%RBP),%R12 |
(3454) 0x4b2f17 VADDSD (%R12,%R8,8),%XMM1,%XMM1 |
(3454) 0x4b2f1d MOV -0x70(%RBP),%R12 |
(3454) 0x4b2f21 VMOVSD %XMM1,(%R10,%R11,8) |
(3454) 0x4b2f27 INC %R8 |
(3454) 0x4b2f2a CMP %R9,%R8 |
(3454) 0x4b2f2d JGE 4b2f80 |
(3454) 0x4b2f2f MOV (%R12,%R8,8),%R10 |
(3454) 0x4b2f33 MOV (%R14,%R10,8),%R11 |
(3454) 0x4b2f37 CMP (%RBX,%RDX,8),%R11 |
(3454) 0x4b2f3b JGE 4b2f00 |
(3454) 0x4b2f3d MOV -0xf0(%RBP),%R9 |
(3454) 0x4b2f44 MOV (%R9),%R9 |
(3454) 0x4b2f47 MOV %R10,(%R9,%RAX,8) |
(3454) 0x4b2f4b MOV -0x110(%RBP),%R9 |
(3454) 0x4b2f52 VMOVSD (%R9,%R8,8),%XMM1 |
(3454) 0x4b2f58 MOV -0xa0(%RBP),%R9 |
(3454) 0x4b2f5f MOV (%R9),%R9 |
(3454) 0x4b2f62 VMOVSD %XMM1,(%R9,%RAX,8) |
(3454) 0x4b2f68 MOV %RAX,(%R14,%R10,8) |
(3454) 0x4b2f6c INC %RAX |
(3454) 0x4b2f6f MOV -0xb8(%RBP),%R9 |
(3454) 0x4b2f76 MOV 0x8(%R9,%RDI,8),%R9 |
(3454) 0x4b2f7b JMP 4b2f27 |
0x4b2f7d NOPL (%RAX) |
(3452) 0x4b2f80 MOV -0xc0(%RBP),%R9 |
(3452) 0x4b2f87 MOV (%R9,%RDI,8),%R8 |
(3452) 0x4b2f8b MOV 0x8(%R9,%RDI,8),%R9 |
(3452) 0x4b2f90 CMP %R9,%R8 |
(3452) 0x4b2f93 JGE 4b3028 |
(3452) 0x4b2f99 MOV -0x40(%RBP),%R14 |
(3452) 0x4b2f9d MOV -0xb0(%RBP),%RBX |
(3452) 0x4b2fa4 JMP 4b2fd9 |
0x4b2fa6 NOPW %CS:(%RAX,%RAX,1) |
(3453) 0x4b2fb0 MOV -0x98(%RBP),%R10 |
(3453) 0x4b2fb7 MOV (%R10),%R10 |
(3453) 0x4b2fba VMOVSD (%R10,%R11,8),%XMM1 |
(3453) 0x4b2fc0 VADDSD (%R13,%R8,8),%XMM1,%XMM1 |
(3453) 0x4b2fc7 VMOVSD %XMM1,(%R10,%R11,8) |
(3453) 0x4b2fcd INC %R8 |
(3453) 0x4b2fd0 CMP %R9,%R8 |
(3453) 0x4b2fd3 JGE 4b2e40 |
(3453) 0x4b2fd9 MOV -0x118(%RBP),%R10 |
(3453) 0x4b2fe0 MOV (%R10,%R8,8),%R10 |
(3453) 0x4b2fe4 MOV (%R15,%R10,8),%R11 |
(3453) 0x4b2fe8 CMP (%RBX,%RDX,8),%R11 |
(3453) 0x4b2fec JGE 4b2fb0 |
(3453) 0x4b2fee MOV -0xf8(%RBP),%R9 |
(3453) 0x4b2ff5 MOV (%R9),%R9 |
(3453) 0x4b2ff8 MOV %R10,(%R9,%RCX,8) |
(3453) 0x4b2ffc VMOVSD (%R13,%R8,8),%XMM1 |
(3453) 0x4b3003 MOV -0x98(%RBP),%R9 |
(3453) 0x4b300a MOV (%R9),%R9 |
(3453) 0x4b300d VMOVSD %XMM1,(%R9,%RCX,8) |
(3453) 0x4b3013 MOV %RCX,(%R15,%R10,8) |
(3453) 0x4b3017 INC %RCX |
(3453) 0x4b301a MOV -0xc0(%RBP),%R9 |
(3453) 0x4b3021 MOV 0x8(%R9,%RDI,8),%R9 |
(3453) 0x4b3026 JMP 4b2fcd |
(3452) 0x4b3028 MOV -0x78(%RBP),%R11 |
(3452) 0x4b302c MOV -0x58(%RBP),%R10 |
(3452) 0x4b3030 MOV -0x30(%RBP),%R13 |
(3452) 0x4b3034 MOV -0x38(%RBP),%RBX |
(3452) 0x4b3038 MOV -0x40(%RBP),%R14 |
(3452) 0x4b303c JMP 4b2d54 |
0x4b3041 NOPW %CS:(%RAX,%RAX,1) |
0x4b304b NOPL (%RAX,%RAX,1) |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►99.59+ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Path / |
Source file and lines | par_csr_matop.c:3454-3640 |
Module | exec |
nb instructions | 282 |
nb uops | 304 |
loop length | 1261 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 59 |
micro-operation queue | 50.67 cycles |
front end | 50.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 12.50 | 12.40 | 30.33 | 30.33 | 32.50 | 12.40 | 12.30 | 32.50 | 32.50 | 32.50 | 12.40 | 30.33 |
cycles | 12.50 | 16.20 | 30.33 | 30.33 | 32.50 | 12.40 | 12.30 | 32.50 | 32.50 | 32.50 | 12.40 | 30.33 |
Cycles executing div or sqrt instructions | 16.00 |
FE+BE cycles | 47.85-47.90 |
Stall cycles | 0.00 |
Front-end | 50.67 |
Dispatch | 32.50 |
DIV/SQRT | 16.00 |
Overall L1 | 50.67 |
all | 2% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 8% |
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 13% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x118,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x138(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0xc8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xb8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xb0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x98(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xf8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x90(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x88(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x80(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x78(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x108(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x70(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xe8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x68(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x60(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x58(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x118(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x110(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x130(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x18(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 4d6de0 <hypre_NumActiveThreads> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %RCX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R14,-0x128(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x120(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 4b2527 <hypre_ParTMatmul.extracted+0x167> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %RCX | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 4b2534 <hypre_ParTMatmul.extracted+0x174> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %R14D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %ECX | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV %EDX,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %EAX,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4d6df0 <hypre_GetThreadNum> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x1(%RAX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,-0xd8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,-0x100(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4b2561 <hypre_ParTMatmul.extracted+0x1a1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INC %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
IMUL %R14,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JMP 4b2573 <hypre_ParTMatmul.extracted+0x1b3> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
IMUL %R14,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %R15,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
IMUL %R14,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %R15,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4d5130 <hypre_CAlloc> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x90(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4d5130 <hypre_CAlloc> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
TEST %RBX,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV -0x40(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4b25bc <hypre_ParTMatmul.extracted+0x1fc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (,%RBX,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4e0070 <__intel_avx_rep_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RBX,-0x140(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x90(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMPQ $0,(%RDX) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV -0x80(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4b25f0 <hypre_ParTMatmul.extracted+0x230> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RCX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x38(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x50(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x30(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JGE 4b2902 <hypre_ParTMatmul.extracted+0x542> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x48(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4b264a <hypre_ParTMatmul.extracted+0x28a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x100(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x7192b0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 40fef0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
CMPQ $0,-0xd8(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JNE 4b2b55 <hypre_ParTMatmul.extracted+0x795> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x120(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x1,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0xd0(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xc8(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4b2a8c <hypre_ParTMatmul.extracted+0x6cc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RDI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R11,%RAX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R10,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4b29b1 <hypre_ParTMatmul.extracted+0x5f1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R10,%RAX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R11,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4b29b1 <hypre_ParTMatmul.extracted+0x5f1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R10,%RDI,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R11,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JBE 4b2a5e <hypre_ParTMatmul.extracted+0x69e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R11,%RDI,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R10,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JBE 4b2a5e <hypre_ParTMatmul.extracted+0x69e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x1,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4b2a8c <hypre_ParTMatmul.extracted+0x6cc> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP $0x5,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4b2a1d <hypre_ParTMatmul.extracted+0x65d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x2,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV (%R11),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x20,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JE 4b2a8c <hypre_ParTMatmul.extracted+0x6cc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R11,%RCX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10,%RCX,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
INC %RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4b2a8c <hypre_ParTMatmul.extracted+0x6cc> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV (%R11),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x8(%R11,%RDI,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%R10,%RDI,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x128(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xa8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,(%RAX,%RBX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xb0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,(%RAX,%RBX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RBX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4ca550 <hypre_CSRMatrixCreate> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x138(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%R14) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x90(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x60(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 4ca550 <hypre_CSRMatrixCreate> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x130(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RBX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%R14),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xa8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RDI) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 4ca630 <hypre_CSRMatrixInitialize> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%R14),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xf0(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,(%RDX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xa0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RBX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xb0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RDI) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 4ca630 <hypre_CSRMatrixInitialize> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%RBX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xf8(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,(%RDX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x98(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x100(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x7192d0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 40fef0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x140(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4b2b7e <hypre_ParTMatmul.extracted+0x7be> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4e0070 <__intel_avx_rep_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x90(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMPQ $0,(%RCX) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV -0xd8(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4b2bb0 <hypre_ParTMatmul.extracted+0x7f0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %RSI,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV -0x78(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x58(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x80(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JE 4b2bdb <hypre_ParTMatmul.extracted+0x81b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xc8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%RAX,%RSI,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xd0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%RCX,%RSI,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4b2bdf <hypre_ParTMatmul.extracted+0x81f> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x48(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 4b2c28 <hypre_ParTMatmul.extracted+0x868> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4d5200 <hypre_Free> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R15,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
ADD $0x118,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
JMP 4d5200 <hypre_Free> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | par_csr_matop.c:3454-3640 |
Module | exec |
nb instructions | 282 |
nb uops | 304 |
loop length | 1261 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 59 |
micro-operation queue | 50.67 cycles |
front end | 50.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 12.50 | 12.40 | 30.33 | 30.33 | 32.50 | 12.40 | 12.30 | 32.50 | 32.50 | 32.50 | 12.40 | 30.33 |
cycles | 12.50 | 16.20 | 30.33 | 30.33 | 32.50 | 12.40 | 12.30 | 32.50 | 32.50 | 32.50 | 12.40 | 30.33 |
Cycles executing div or sqrt instructions | 16.00 |
FE+BE cycles | 47.85-47.90 |
Stall cycles | 0.00 |
Front-end | 50.67 |
Dispatch | 32.50 |
DIV/SQRT | 16.00 |
Overall L1 | 50.67 |
all | 2% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 8% |
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 13% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x118,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x138(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0xc8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xb8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xb0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x98(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xf8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x90(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x88(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x80(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x78(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x108(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x70(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xe8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x68(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x60(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x58(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x118(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x110(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x130(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x18(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 4d6de0 <hypre_NumActiveThreads> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %RCX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R14,-0x128(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x120(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 4b2527 <hypre_ParTMatmul.extracted+0x167> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %RCX | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 4b2534 <hypre_ParTMatmul.extracted+0x174> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %R14D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %ECX | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV %EDX,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %EAX,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4d6df0 <hypre_GetThreadNum> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x1(%RAX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,-0xd8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,-0x100(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4b2561 <hypre_ParTMatmul.extracted+0x1a1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INC %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
IMUL %R14,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JMP 4b2573 <hypre_ParTMatmul.extracted+0x1b3> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
IMUL %R14,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %R15,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
IMUL %R14,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %R15,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4d5130 <hypre_CAlloc> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x90(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4d5130 <hypre_CAlloc> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
TEST %RBX,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV -0x40(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4b25bc <hypre_ParTMatmul.extracted+0x1fc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (,%RBX,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4e0070 <__intel_avx_rep_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RBX,-0x140(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x90(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMPQ $0,(%RDX) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV -0x80(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4b25f0 <hypre_ParTMatmul.extracted+0x230> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RCX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x38(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x50(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x30(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JGE 4b2902 <hypre_ParTMatmul.extracted+0x542> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x48(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4b264a <hypre_ParTMatmul.extracted+0x28a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x100(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x7192b0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 40fef0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
CMPQ $0,-0xd8(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JNE 4b2b55 <hypre_ParTMatmul.extracted+0x795> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x120(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x1,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0xd0(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xc8(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4b2a8c <hypre_ParTMatmul.extracted+0x6cc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RDI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R11,%RAX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R10,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4b29b1 <hypre_ParTMatmul.extracted+0x5f1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R10,%RAX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R11,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4b29b1 <hypre_ParTMatmul.extracted+0x5f1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R10,%RDI,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R11,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JBE 4b2a5e <hypre_ParTMatmul.extracted+0x69e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R11,%RDI,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R10,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JBE 4b2a5e <hypre_ParTMatmul.extracted+0x69e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x1,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4b2a8c <hypre_ParTMatmul.extracted+0x6cc> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP $0x5,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4b2a1d <hypre_ParTMatmul.extracted+0x65d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x2,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV (%R11),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x20,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JE 4b2a8c <hypre_ParTMatmul.extracted+0x6cc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R11,%RCX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10,%RCX,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
INC %RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4b2a8c <hypre_ParTMatmul.extracted+0x6cc> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV (%R11),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x8(%R11,%RDI,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%R10,%RDI,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x128(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xa8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,(%RAX,%RBX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xb0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,(%RAX,%RBX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RBX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4ca550 <hypre_CSRMatrixCreate> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x138(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%R14) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x90(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x60(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 4ca550 <hypre_CSRMatrixCreate> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x130(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RBX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%R14),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xa8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RDI) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 4ca630 <hypre_CSRMatrixInitialize> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%R14),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xf0(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,(%RDX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xa0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RBX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xb0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RDI) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 4ca630 <hypre_CSRMatrixInitialize> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%RBX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xf8(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,(%RDX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x98(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x100(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x7192d0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 40fef0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x140(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4b2b7e <hypre_ParTMatmul.extracted+0x7be> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4e0070 <__intel_avx_rep_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x90(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMPQ $0,(%RCX) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV -0xd8(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4b2bb0 <hypre_ParTMatmul.extracted+0x7f0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %RSI,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV -0x78(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x58(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x80(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JE 4b2bdb <hypre_ParTMatmul.extracted+0x81b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xc8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%RAX,%RSI,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xd0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%RCX,%RSI,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4b2bdf <hypre_ParTMatmul.extracted+0x81f> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x48(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 4b2c28 <hypre_ParTMatmul.extracted+0x868> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4d5200 <hypre_Free> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R15,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
ADD $0x118,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
JMP 4d5200 <hypre_Free> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_ParTMatmul.extracted– | 0.09 | 0.01 |
○Loop 3460 - par_csr_matop.c:3571-3572 - exec | 0 | 0 |
○Loop 3464 - par_csr_matop.c:3537-3540 - exec | 0 | 0 |
○Loop 3463 - par_csr_matop.c:3537-3540 - exec | 0 | 0 |
▼Loop 3465 - par_csr_matop.c:3467-3528 - exec– | 0 | 0 |
○Loop 3473 - par_csr_matop.c:3491-3495 - exec | 0.01 | 0.01 |
▼Loop 3466 - par_csr_matop.c:3467-3522 - exec– | 0 | 0 |
○Loop 3470 - par_csr_matop.c:3504-3505 - exec | 0.04 | 0.01 |
○Loop 3469 - par_csr_matop.c:3504-3505 - exec | 0 | 0 |
○Loop 3468 - par_csr_matop.c:3507-3513 - exec | 0 | 0 |
○Loop 3471 - par_csr_matop.c:3504-3505 - exec | 0 | 0 |
○Loop 3467 - par_csr_matop.c:3516-3522 - exec | 0 | 0 |
○Loop 3472 - par_csr_matop.c:3497-3501 - exec | 0 | 0 |
○Loop 3462 - par_csr_matop.c:3537-3540 - exec | 0 | 0 |
○Loop 3461 - par_csr_matop.c:3537-3540 - exec | 0 | 0 |
▼Loop 3451 - par_csr_matop.c:3467-3640 - exec– | 0 | 0 |
○Loop 3459 - par_csr_matop.c:3590-3596 - exec | 0.01 | 0.01 |
○Loop 3458 - par_csr_matop.c:3598-3604 - exec | 0 | 0 |
▼Loop 3452 - par_csr_matop.c:3467-3634 - exec– | 0 | 0 |
○Loop 3456 - par_csr_matop.c:3505-3608 - exec | 0.03 | 0.01 |
○Loop 3457 - par_csr_matop.c:3607-3608 - exec | 0 | 0 |
○Loop 3454 - par_csr_matop.c:3610-3621 - exec | 0 | 0 |
○Loop 3455 - par_csr_matop.c:3607-3608 - exec | 0 | 0 |
○Loop 3453 - par_csr_matop.c:3623-3634 - exec | 0 | 0 |
○Loop 3474 - par_csr_matop.c:3484-3485 - exec | 0 | 0 |