Function: hypre_CSRMatrixTranspose.extracted | Module: exec | Source: csr_matop.c:380-560 [...] | Coverage: 0.17% |
---|
Function: hypre_CSRMatrixTranspose.extracted | Module: exec | Source: csr_matop.c:380-560 [...] | Coverage: 0.17% |
---|
/scratch_na/users/xoserete/qaas_runs/171-415-3661/intel/AMG/build/AMG/AMG/seq_mv/csr_matop.c: 380 - 560 |
-------------------------------------------------------------------------------- |
380: return idx%dim1*dim2 + idx/dim1; |
[...] |
463: #pragma omp parallel |
464: #endif |
465: { |
466: HYPRE_Int num_threads = hypre_NumActiveThreads(); |
467: HYPRE_Int my_thread_num = hypre_GetThreadNum(); |
468: |
469: HYPRE_Int iBegin = hypre_CSRMatrixGetLoadBalancedPartitionBegin(A); |
470: HYPRE_Int iEnd = hypre_CSRMatrixGetLoadBalancedPartitionEnd(A); |
471: hypre_assert(iBegin <= iEnd); |
472: hypre_assert(iBegin >= 0 && iBegin <= num_rowsA); |
473: hypre_assert(iEnd >= 0 && iEnd <= num_rowsA); |
474: |
475: HYPRE_Int i, j; |
476: memset(bucket + my_thread_num*num_colsA, 0, sizeof(HYPRE_Int)*num_colsA); |
[...] |
483: for (j = A_i[iBegin]; j < A_i[iEnd]; ++j) { |
484: HYPRE_Int idx = A_j[j]; |
485: bucket[my_thread_num*num_colsA + idx]++; |
[...] |
496: for (i = my_thread_num*num_colsA + 1; i < (my_thread_num + 1)*num_colsA; ++i) { |
497: HYPRE_Int transpose_i = transpose_idx(i, num_threads, num_colsA); |
498: HYPRE_Int transpose_i_minus_1 = transpose_idx(i - 1, num_threads, num_colsA); |
499: |
500: bucket[transpose_i] += bucket[transpose_i_minus_1]; |
501: } |
502: |
503: #ifdef HYPRE_USING_OPENMP |
504: #pragma omp barrier |
505: #pragma omp master |
506: #endif |
507: { |
508: for (i = 1; i < num_threads; ++i) { |
509: HYPRE_Int j0 = num_colsA*i - 1, j1 = num_colsA*(i + 1) - 1; |
510: HYPRE_Int transpose_j0 = transpose_idx(j0, num_threads, num_colsA); |
511: HYPRE_Int transpose_j1 = transpose_idx(j1, num_threads, num_colsA); |
512: |
513: bucket[transpose_j1] += bucket[transpose_j0]; |
[...] |
520: if (my_thread_num > 0) { |
521: HYPRE_Int transpose_i0 = transpose_idx(num_colsA*my_thread_num - 1, num_threads, num_colsA); |
522: HYPRE_Int offset = bucket[transpose_i0]; |
523: |
524: for (i = my_thread_num*num_colsA; i < (my_thread_num + 1)*num_colsA - 1; ++i) { |
525: HYPRE_Int transpose_i = transpose_idx(i, num_threads, num_colsA); |
526: |
527: bucket[transpose_i] += offset; |
[...] |
539: if (data) { |
540: for (i = iEnd - 1; i >= iBegin; --i) { |
541: for (j = A_i[i + 1] - 1; j >= A_i[i]; --j) { |
542: HYPRE_Int idx = A_j[j]; |
543: --bucket[my_thread_num*num_colsA + idx]; |
544: |
545: HYPRE_Int offset = bucket[my_thread_num*num_colsA + idx]; |
546: |
547: AT_data[offset] = A_data[j]; |
548: AT_j[offset] = i; |
549: } |
550: } |
551: } |
552: else { |
553: for (i = iEnd - 1; i >= iBegin; --i) { |
554: for (j = A_i[i + 1] - 1; j >= A_i[i]; --j) { |
555: HYPRE_Int idx = A_j[j]; |
556: --bucket[my_thread_num*num_colsA + idx]; |
557: |
558: HYPRE_Int offset = bucket[my_thread_num*num_colsA + idx]; |
559: |
560: AT_j[offset] = i; |
0x4c9a60 PUSH %RBP |
0x4c9a61 MOV %RSP,%RBP |
0x4c9a64 PUSH %R15 |
0x4c9a66 PUSH %R14 |
0x4c9a68 PUSH %R13 |
0x4c9a6a PUSH %R12 |
0x4c9a6c PUSH %RBX |
0x4c9a6d SUB $0x48,%RSP |
0x4c9a71 MOV %R9,%RBX |
0x4c9a74 MOV %R8,-0x50(%RBP) |
0x4c9a78 MOV %RCX,-0x68(%RBP) |
0x4c9a7c MOV %RDX,%R13 |
0x4c9a7f MOV %RDI,-0x30(%RBP) |
0x4c9a83 CALL 4d6de0 <hypre_NumActiveThreads> |
0x4c9a88 MOV %RAX,%R15 |
0x4c9a8b CALL 4d6df0 <hypre_GetThreadNum> |
0x4c9a90 MOV %RAX,%R14 |
0x4c9a93 MOV %R13,%RDI |
0x4c9a96 CALL 4cb940 <hypre_CSRMatrixGetLoadBalancedPartitionBegin> |
0x4c9a9b MOV %RAX,%R12 |
0x4c9a9e MOV %R13,%RDI |
0x4c9aa1 CALL 4cb9c0 <hypre_CSRMatrixGetLoadBalancedPartitionEnd> |
0x4c9aa6 MOV %RAX,%RCX |
0x4c9aa9 CMP %R12,%RAX |
0x4c9aac MOV %R12,%RAX |
0x4c9aaf MOV %R12,-0x40(%RBP) |
0x4c9ab3 MOV %RCX,-0x38(%RBP) |
0x4c9ab7 JGE 4c9aef |
0x4c9ab9 MOV 0x251140(%RIP),%RDI |
0x4c9ac0 MOV $0x4f4345,%ESI |
0x4c9ac5 MOV $0x4f635b,%EDX |
0x4c9aca XOR %EAX,%EAX |
0x4c9acc CALL 4d53b0 <hypre_fprintf> |
0x4c9ad1 MOV $0x4f62d4,%EDI |
0x4c9ad6 MOV $0x1d7,%ESI |
0x4c9adb MOV $0x1,%EDX |
0x4c9ae0 XOR %ECX,%ECX |
0x4c9ae2 CALL 4d7ce0 <hypre_error_handler> |
0x4c9ae7 MOV -0x38(%RBP),%RCX |
0x4c9aeb MOV -0x40(%RBP),%R12 |
0x4c9aef MOV 0x18(%RBP),%RAX |
0x4c9af3 TEST %R12,%R12 |
0x4c9af6 JS 4c9afd |
0x4c9af8 CMP %RAX,%R12 |
0x4c9afb JLE 4c9b35 |
0x4c9afd MOV 0x2510fc(%RIP),%RDI |
0x4c9b04 MOV $0x4f4345,%ESI |
0x4c9b09 MOV $0x4f636a,%EDX |
0x4c9b0e MOV %RAX,%R12 |
0x4c9b11 XOR %EAX,%EAX |
0x4c9b13 CALL 4d53b0 <hypre_fprintf> |
0x4c9b18 MOV $0x4f62d4,%EDI |
0x4c9b1d MOV $0x1d8,%ESI |
0x4c9b22 MOV $0x1,%EDX |
0x4c9b27 XOR %ECX,%ECX |
0x4c9b29 CALL 4d7ce0 <hypre_error_handler> |
0x4c9b2e MOV %R12,%RAX |
0x4c9b31 MOV -0x38(%RBP),%RCX |
0x4c9b35 MOV 0x38(%RBP),%R13 |
0x4c9b39 MOV 0x20(%RBP),%R12 |
0x4c9b3d TEST %RCX,%RCX |
0x4c9b40 JS 4c9b47 |
0x4c9b42 CMP %RAX,%RCX |
0x4c9b45 JLE 4c9b75 |
0x4c9b47 MOV 0x2510b2(%RIP),%RDI |
0x4c9b4e MOV $0x4f4345,%ESI |
0x4c9b53 MOV $0x4f638d,%EDX |
0x4c9b58 XOR %EAX,%EAX |
0x4c9b5a CALL 4d53b0 <hypre_fprintf> |
0x4c9b5f MOV $0x4f62d4,%EDI |
0x4c9b64 MOV $0x1d9,%ESI |
0x4c9b69 MOV $0x1,%EDX |
0x4c9b6e XOR %ECX,%ECX |
0x4c9b70 CALL 4d7ce0 <hypre_error_handler> |
0x4c9b75 MOV (%R12),%RDX |
0x4c9b79 MOV %RDX,%RAX |
0x4c9b7c IMUL %R14,%RAX |
0x4c9b80 LEA (%R13,%RAX,8),%RDI |
0x4c9b85 SAL $0x3,%RDX |
0x4c9b89 XOR %ESI,%ESI |
0x4c9b8b CALL 4e0070 <__intel_avx_rep_memset> |
0x4c9b90 MOV -0x38(%RBP),%RSI |
0x4c9b94 MOV 0x10(%RBP),%RDX |
0x4c9b98 MOV -0x40(%RBP),%RAX |
0x4c9b9c MOV (%RBX,%RAX,8),%RAX |
0x4c9ba0 CMP (%RBX,%RSI,8),%RAX |
0x4c9ba4 JGE 4c9bcd |
0x4c9ba6 NOPW %CS:(%RAX,%RAX,1) |
(3952) 0x4c9bb0 MOV (%R12),%RCX |
(3952) 0x4c9bb4 IMUL %R14,%RCX |
(3952) 0x4c9bb8 ADD (%RDX,%RAX,8),%RCX |
(3952) 0x4c9bbc LEA (%R13,%RCX,8),%RCX |
(3952) 0x4c9bc1 INCQ (%RCX) |
(3952) 0x4c9bc4 INC %RAX |
(3952) 0x4c9bc7 CMP (%RBX,%RSI,8),%RAX |
(3952) 0x4c9bcb JL 4c9bb0 |
0x4c9bcd MOV -0x30(%RBP),%RAX |
0x4c9bd1 MOV (%RAX),%ESI |
0x4c9bd3 MOV $0x719ab0,%EDI |
0x4c9bd8 CALL 40fef0 <__kmpc_barrier@plt> |
0x4c9bdd MOV (%R12),%R9 |
0x4c9be1 MOV %R9,%RCX |
0x4c9be4 IMUL %R14,%RCX |
0x4c9be8 LEA 0x1(%R14),%R11 |
0x4c9bec LEA 0x1(%RCX),%RAX |
0x4c9bf0 MOV %R9,%RDX |
0x4c9bf3 IMUL %R11,%RDX |
0x4c9bf7 CMP %RDX,%RAX |
0x4c9bfa JL 4c9cfb |
0x4c9c00 MOV %R11,-0x60(%RBP) |
0x4c9c04 MOV %R15,-0x58(%RBP) |
0x4c9c08 MOV -0x30(%RBP),%R15 |
0x4c9c0c MOV (%R15),%ESI |
0x4c9c0f MOV $0x719ad0,%EDI |
0x4c9c14 CALL 40fef0 <__kmpc_barrier@plt> |
0x4c9c19 MOV (%R15),%ESI |
0x4c9c1c MOV -0x58(%RBP),%R15 |
0x4c9c20 MOV $0x719af0,%EDI |
0x4c9c25 XOR %EDX,%EDX |
0x4c9c27 CALL 410060 <__kmpc_masked@plt> |
0x4c9c2c CMP $0x1,%EAX |
0x4c9c2f JNE 4c9c72 |
0x4c9c31 CMP $0x1,%R15 |
0x4c9c35 MOV -0x30(%RBP),%R9 |
0x4c9c39 JLE 4c9c65 |
0x4c9c3b LEA -0x1(%R15),%RAX |
0x4c9c3f MOV %RAX,-0x48(%RBP) |
0x4c9c43 CMP $0x4,%RAX |
0x4c9c47 JAE 4ca09a |
0x4c9c4d MOV -0x48(%RBP),%RAX |
0x4c9c51 MOV %RAX,%R8 |
0x4c9c54 AND $-0x4,%R8 |
0x4c9c58 CMP %RAX,%R8 |
0x4c9c5b MOV -0x30(%RBP),%R9 |
0x4c9c5f JNE 4ca2cc |
0x4c9c65 MOV (%R9),%ESI |
0x4c9c68 MOV $0x719b10,%EDI |
0x4c9c6d CALL 40fe80 <__kmpc_end_masked@plt> |
0x4c9c72 MOV -0x30(%RBP),%RAX |
0x4c9c76 MOV (%RAX),%ESI |
0x4c9c78 MOV $0x719b30,%EDI |
0x4c9c7d CALL 40fef0 <__kmpc_barrier@plt> |
0x4c9c82 TEST %R14,%R14 |
0x4c9c85 MOV -0x60(%RBP),%R8 |
0x4c9c89 JLE 4c9f92 |
0x4c9c8f MOV (%R12),%RDI |
0x4c9c93 MOV %R14,%RCX |
0x4c9c96 IMUL %RDI,%RCX |
0x4c9c9a LEA -0x1(%RCX),%RAX |
0x4c9c9e MOV %RAX,%RDX |
0x4c9ca1 OR %R15,%RDX |
0x4c9ca4 SHR $0x20,%RDX |
0x4c9ca8 JE 4c9e46 |
0x4c9cae CQTO |
0x4c9cb0 IDIV %R15 |
0x4c9cb3 JMP 4c9e4b |
0x4c9cb8 NOPL (%RAX,%RAX,1) |
(3951) 0x4c9cc0 MOV %R8,%RAX |
(3951) 0x4c9cc3 CQTO |
(3951) 0x4c9cc5 IDIV %R15 |
(3951) 0x4c9cc8 IMUL %R9,%RSI |
(3951) 0x4c9ccc ADD %RSI,%RDI |
(3951) 0x4c9ccf MOV (%R13,%RDI,8),%RSI |
(3951) 0x4c9cd4 IMUL %R9,%RDX |
(3951) 0x4c9cd8 ADD %RAX,%RDX |
(3951) 0x4c9cdb ADD %RSI,(%R13,%RDX,8) |
(3951) 0x4c9ce0 MOV (%R12),%R9 |
(3951) 0x4c9ce4 MOV %R11,%RAX |
(3951) 0x4c9ce7 IMUL %R9,%RAX |
(3951) 0x4c9ceb ADD $0x5,%RCX |
(3951) 0x4c9cef CMP %RAX,%RCX |
(3951) 0x4c9cf2 MOV %R8,%RCX |
(3951) 0x4c9cf5 JGE 4c9c00 |
(3951) 0x4c9cfb LEA 0x1(%RCX),%RAX |
(3951) 0x4c9cff MOV %RAX,%RDX |
(3951) 0x4c9d02 OR %R15,%RDX |
(3951) 0x4c9d05 SHR $0x20,%RDX |
(3951) 0x4c9d09 JE 4c9d20 |
(3951) 0x4c9d0b CQTO |
(3951) 0x4c9d0d IDIV %R15 |
(3951) 0x4c9d10 MOV %RDX,%RSI |
(3951) 0x4c9d13 MOV %RAX,%RDI |
(3951) 0x4c9d16 JMP 4c9d29 |
0x4c9d18 NOPL (%RAX,%RAX,1) |
(3951) 0x4c9d20 XOR %EDX,%EDX |
(3951) 0x4c9d22 DIV %R15D |
(3951) 0x4c9d25 MOV %EDX,%ESI |
(3951) 0x4c9d27 MOV %EAX,%EDI |
(3951) 0x4c9d29 MOV %RCX,%RAX |
(3951) 0x4c9d2c OR %R15,%RAX |
(3951) 0x4c9d2f SHR $0x20,%RAX |
(3951) 0x4c9d33 JE 4c9d40 |
(3951) 0x4c9d35 MOV %RCX,%RAX |
(3951) 0x4c9d38 CQTO |
(3951) 0x4c9d3a IDIV %R15 |
(3951) 0x4c9d3d JMP 4c9d47 |
0x4c9d3f NOP |
(3951) 0x4c9d40 MOV %ECX,%EAX |
(3951) 0x4c9d42 XOR %EDX,%EDX |
(3951) 0x4c9d44 DIV %R15D |
(3951) 0x4c9d47 IMUL %R9,%RDX |
(3951) 0x4c9d4b ADD %RAX,%RDX |
(3951) 0x4c9d4e MOV (%R13,%RDX,8),%RAX |
(3951) 0x4c9d53 IMUL %RSI,%R9 |
(3951) 0x4c9d57 ADD %RDI,%R9 |
(3951) 0x4c9d5a ADD %RAX,(%R13,%R9,8) |
(3951) 0x4c9d5f MOV (%R12),%R10 |
(3951) 0x4c9d63 LEA 0x2(%RCX),%RAX |
(3951) 0x4c9d67 MOV %R11,%RDX |
(3951) 0x4c9d6a IMUL %R10,%RDX |
(3951) 0x4c9d6e CMP %RDX,%RAX |
(3951) 0x4c9d71 JGE 4c9c00 |
(3951) 0x4c9d77 MOV %RAX,%RDX |
(3951) 0x4c9d7a OR %R15,%RDX |
(3951) 0x4c9d7d SHR $0x20,%RDX |
(3951) 0x4c9d81 JE 4c9d90 |
(3951) 0x4c9d83 CQTO |
(3951) 0x4c9d85 IDIV %R15 |
(3951) 0x4c9d88 MOV %RDX,%R8 |
(3951) 0x4c9d8b MOV %RAX,%R9 |
(3951) 0x4c9d8e JMP 4c9d9b |
(3951) 0x4c9d90 XOR %EDX,%EDX |
(3951) 0x4c9d92 DIV %R15D |
(3951) 0x4c9d95 MOV %EDX,%R8D |
(3951) 0x4c9d98 MOV %EAX,%R9D |
(3951) 0x4c9d9b IMUL %R10,%RSI |
(3951) 0x4c9d9f ADD %RSI,%RDI |
(3951) 0x4c9da2 MOV (%R13,%RDI,8),%RAX |
(3951) 0x4c9da7 IMUL %R8,%R10 |
(3951) 0x4c9dab ADD %R9,%R10 |
(3951) 0x4c9dae ADD %RAX,(%R13,%R10,8) |
(3951) 0x4c9db3 MOV (%R12),%R10 |
(3951) 0x4c9db7 LEA 0x3(%RCX),%RAX |
(3951) 0x4c9dbb MOV %R11,%RDX |
(3951) 0x4c9dbe IMUL %R10,%RDX |
(3951) 0x4c9dc2 CMP %RDX,%RAX |
(3951) 0x4c9dc5 JGE 4c9c00 |
(3951) 0x4c9dcb MOV %RAX,%RDX |
(3951) 0x4c9dce OR %R15,%RDX |
(3951) 0x4c9dd1 SHR $0x20,%RDX |
(3951) 0x4c9dd5 JE 4c9df0 |
(3951) 0x4c9dd7 CQTO |
(3951) 0x4c9dd9 IDIV %R15 |
(3951) 0x4c9ddc MOV %RDX,%RSI |
(3951) 0x4c9ddf MOV %RAX,%RDI |
(3951) 0x4c9de2 JMP 4c9df9 |
0x4c9de4 NOPW %CS:(%RAX,%RAX,1) |
(3951) 0x4c9df0 XOR %EDX,%EDX |
(3951) 0x4c9df2 DIV %R15D |
(3951) 0x4c9df5 MOV %EDX,%ESI |
(3951) 0x4c9df7 MOV %EAX,%EDI |
(3951) 0x4c9df9 IMUL %R10,%R8 |
(3951) 0x4c9dfd ADD %R8,%R9 |
(3951) 0x4c9e00 MOV (%R13,%R9,8),%RAX |
(3951) 0x4c9e05 IMUL %RSI,%R10 |
(3951) 0x4c9e09 ADD %RDI,%R10 |
(3951) 0x4c9e0c ADD %RAX,(%R13,%R10,8) |
(3951) 0x4c9e11 MOV (%R12),%R9 |
(3951) 0x4c9e15 LEA 0x4(%RCX),%R8 |
(3951) 0x4c9e19 MOV %R11,%RAX |
(3951) 0x4c9e1c IMUL %R9,%RAX |
(3951) 0x4c9e20 CMP %RAX,%R8 |
(3951) 0x4c9e23 JGE 4c9c00 |
(3951) 0x4c9e29 MOV %R8,%RAX |
(3951) 0x4c9e2c OR %R15,%RAX |
(3951) 0x4c9e2f SHR $0x20,%RAX |
(3951) 0x4c9e33 JNE 4c9cc0 |
(3951) 0x4c9e39 MOV %R8D,%EAX |
(3951) 0x4c9e3c XOR %EDX,%EDX |
(3951) 0x4c9e3e DIV %R15D |
(3951) 0x4c9e41 JMP 4c9cc8 |
0x4c9e46 XOR %EDX,%EDX |
0x4c9e48 DIV %R15D |
0x4c9e4b MOV %RDI,%RSI |
0x4c9e4e IMUL %R8,%RSI |
0x4c9e52 DEC %RSI |
0x4c9e55 CMP %RSI,%RCX |
0x4c9e58 JGE 4c9f92 |
0x4c9e5e IMUL %RDI,%RDX |
0x4c9e62 ADD %RAX,%RDX |
0x4c9e65 MOV (%R13,%RDX,8),%RSI |
0x4c9e6a JMP 4c9e9c |
0x4c9e6c NOPL (%RAX) |
(3948) 0x4c9e70 XOR %EDX,%EDX |
(3948) 0x4c9e72 DIV %R15D |
(3948) 0x4c9e75 IMUL %RDX,%RDI |
(3948) 0x4c9e79 ADD %RAX,%RDI |
(3948) 0x4c9e7c ADD %RSI,(%R13,%RDI,8) |
(3948) 0x4c9e81 MOV (%R12),%RDI |
(3948) 0x4c9e85 MOV %R8,%RAX |
(3948) 0x4c9e88 IMUL %RDI,%RAX |
(3948) 0x4c9e8c DEC %RAX |
(3948) 0x4c9e8f ADD $0x4,%RCX |
(3948) 0x4c9e93 CMP %RAX,%RCX |
(3948) 0x4c9e96 JGE 4c9f92 |
(3948) 0x4c9e9c MOV %RCX,%RAX |
(3948) 0x4c9e9f OR %R15,%RAX |
(3948) 0x4c9ea2 SHR $0x20,%RAX |
(3948) 0x4c9ea6 JE 4c9ec0 |
(3948) 0x4c9ea8 MOV %RCX,%RAX |
(3948) 0x4c9eab CQTO |
(3948) 0x4c9ead IDIV %R15 |
(3948) 0x4c9eb0 JMP 4c9ec7 |
0x4c9eb2 NOPW %CS:(%RAX,%RAX,1) |
(3948) 0x4c9ec0 MOV %ECX,%EAX |
(3948) 0x4c9ec2 XOR %EDX,%EDX |
(3948) 0x4c9ec4 DIV %R15D |
(3948) 0x4c9ec7 IMUL %RDX,%RDI |
(3948) 0x4c9ecb ADD %RAX,%RDI |
(3948) 0x4c9ece ADD %RSI,(%R13,%RDI,8) |
(3948) 0x4c9ed3 MOV (%R12),%RDI |
(3948) 0x4c9ed7 LEA 0x1(%RCX),%RAX |
(3948) 0x4c9edb MOV %R8,%RDX |
(3948) 0x4c9ede IMUL %RDI,%RDX |
(3948) 0x4c9ee2 DEC %RDX |
(3948) 0x4c9ee5 CMP %RDX,%RAX |
(3948) 0x4c9ee8 JGE 4c9f92 |
(3948) 0x4c9eee MOV %RAX,%RDX |
(3948) 0x4c9ef1 OR %R15,%RDX |
(3948) 0x4c9ef4 SHR $0x20,%RDX |
(3948) 0x4c9ef8 JE 4c9f10 |
(3948) 0x4c9efa CQTO |
(3948) 0x4c9efc IDIV %R15 |
(3948) 0x4c9eff JMP 4c9f15 |
0x4c9f01 NOPW %CS:(%RAX,%RAX,1) |
(3948) 0x4c9f10 XOR %EDX,%EDX |
(3948) 0x4c9f12 DIV %R15D |
(3948) 0x4c9f15 IMUL %RDX,%RDI |
(3948) 0x4c9f19 ADD %RAX,%RDI |
(3948) 0x4c9f1c ADD %RSI,(%R13,%RDI,8) |
(3948) 0x4c9f21 MOV (%R12),%RDI |
(3948) 0x4c9f25 LEA 0x2(%RCX),%RAX |
(3948) 0x4c9f29 MOV %R8,%RDX |
(3948) 0x4c9f2c IMUL %RDI,%RDX |
(3948) 0x4c9f30 DEC %RDX |
(3948) 0x4c9f33 CMP %RDX,%RAX |
(3948) 0x4c9f36 JGE 4c9f92 |
(3948) 0x4c9f38 MOV %RAX,%RDX |
(3948) 0x4c9f3b OR %R15,%RDX |
(3948) 0x4c9f3e SHR $0x20,%RDX |
(3948) 0x4c9f42 JE 4c9f50 |
(3948) 0x4c9f44 CQTO |
(3948) 0x4c9f46 IDIV %R15 |
(3948) 0x4c9f49 JMP 4c9f55 |
0x4c9f4b NOPL (%RAX,%RAX,1) |
(3948) 0x4c9f50 XOR %EDX,%EDX |
(3948) 0x4c9f52 DIV %R15D |
(3948) 0x4c9f55 IMUL %RDX,%RDI |
(3948) 0x4c9f59 ADD %RAX,%RDI |
(3948) 0x4c9f5c ADD %RSI,(%R13,%RDI,8) |
(3948) 0x4c9f61 MOV (%R12),%RDI |
(3948) 0x4c9f65 LEA 0x3(%RCX),%RAX |
(3948) 0x4c9f69 MOV %R8,%RDX |
(3948) 0x4c9f6c IMUL %RDI,%RDX |
(3948) 0x4c9f70 DEC %RDX |
(3948) 0x4c9f73 CMP %RDX,%RAX |
(3948) 0x4c9f76 JGE 4c9f92 |
(3948) 0x4c9f78 MOV %RAX,%RDX |
(3948) 0x4c9f7b OR %R15,%RDX |
(3948) 0x4c9f7e SHR $0x20,%RDX |
(3948) 0x4c9f82 JE 4c9e70 |
(3948) 0x4c9f88 CQTO |
(3948) 0x4c9f8a IDIV %R15 |
(3948) 0x4c9f8d JMP 4c9e75 |
0x4c9f92 MOV 0x30(%RBP),%R15 |
0x4c9f96 MOV -0x30(%RBP),%RAX |
0x4c9f9a MOV (%RAX),%ESI |
0x4c9f9c MOV $0x719b50,%EDI |
0x4c9fa1 CALL 40fef0 <__kmpc_barrier@plt> |
0x4c9fa6 CMPQ $0,-0x68(%RBP) |
0x4c9fab JE 4c9fed |
0x4c9fad MOV -0x40(%RBP),%R9 |
0x4c9fb1 MOV -0x38(%RBP),%RSI |
0x4c9fb5 CMP %R9,%RSI |
0x4c9fb8 MOV 0x10(%RBP),%R10 |
0x4c9fbc MOV -0x50(%RBP),%R11 |
0x4c9fc0 JLE 4ca469 |
0x4c9fc6 MOV 0x28(%RBP),%RAX |
0x4c9fca MOV (%RBX,%RSI,8),%RDX |
0x4c9fce MOV %ESI,%ECX |
0x4c9fd0 SUB %R9D,%ECX |
0x4c9fd3 LEA 0x1(%R9),%R8 |
0x4c9fd7 TEST $0x1,%CL |
0x4c9fda JNE 4ca020 |
0x4c9fdc MOV %RSI,%RCX |
0x4c9fdf CMP %R8,%RSI |
0x4c9fe2 JNE 4ca485 |
0x4c9fe8 JMP 4ca469 |
0x4c9fed MOV -0x40(%RBP),%R8 |
0x4c9ff1 MOV -0x38(%RBP),%R10 |
0x4c9ff5 CMP %R8,%R10 |
0x4c9ff8 MOV 0x10(%RBP),%R9 |
0x4c9ffc JLE 4ca469 |
0x4ca002 MOV (%RBX,%R10,8),%RCX |
0x4ca006 MOV %R10D,%EAX |
0x4ca009 SUB %R8D,%EAX |
0x4ca00c LEA 0x1(%R8),%RDX |
0x4ca010 TEST $0x1,%AL |
0x4ca012 JNE 4ca359 |
0x4ca018 MOV %R10,%RAX |
0x4ca01b JMP 4ca39e |
0x4ca020 LEA -0x1(%RSI),%RCX |
0x4ca024 MOV -0x8(%RBX,%RSI,8),%RDI |
0x4ca029 CMP %RDI,%RDX |
0x4ca02c JLE 4ca45d |
0x4ca032 MOV %R8,-0x30(%RBP) |
0x4ca036 MOV -0x38(%RBP),%RSI |
0x4ca03a NOPW (%RAX,%RAX,1) |
(3947) 0x4ca040 MOV -0x8(%R10,%RDX,8),%RDI |
(3947) 0x4ca045 MOV (%R12),%R8 |
(3947) 0x4ca049 IMUL %R14,%R8 |
(3947) 0x4ca04d ADD %RDI,%R8 |
(3947) 0x4ca050 LEA (%R13,%R8,8),%R8 |
(3947) 0x4ca055 DECQ (%R8) |
(3947) 0x4ca058 MOV (%R12),%R8 |
(3947) 0x4ca05c IMUL %R14,%R8 |
(3947) 0x4ca060 ADD %RDI,%R8 |
(3947) 0x4ca063 VMOVSD -0x8(%R11,%RDX,8),%XMM0 |
(3947) 0x4ca06a DEC %RDX |
(3947) 0x4ca06d MOV (%R13,%R8,8),%RDI |
(3947) 0x4ca072 VMOVSD %XMM0,(%RAX,%RDI,8) |
(3947) 0x4ca077 MOV %RCX,(%R15,%RDI,8) |
(3947) 0x4ca07b MOV -0x8(%RBX,%RSI,8),%RDI |
(3947) 0x4ca080 CMP %RDI,%RDX |
(3947) 0x4ca083 JG 4ca040 |
0x4ca085 MOV %RDI,%RDX |
0x4ca088 MOV -0x30(%RBP),%R8 |
0x4ca08c CMP %R8,%RSI |
0x4ca08f JNE 4ca485 |
0x4ca095 JMP 4ca469 |
0x4ca09a MOV -0x48(%RBP),%R8 |
0x4ca09e SHR $0x2,%R8 |
0x4ca0a2 XOR %R9D,%R9D |
0x4ca0a5 JMP 4ca0d9 |
0x4ca0a7 NOPW (%RAX,%RAX,1) |
(3950) 0x4ca0b0 CQTO |
(3950) 0x4ca0b2 IDIV %R15 |
(3950) 0x4ca0b5 IMUL %R10,%RCX |
(3950) 0x4ca0b9 ADD %RSI,%RCX |
(3950) 0x4ca0bc MOV (%R13,%RCX,8),%RCX |
(3950) 0x4ca0c1 IMUL %R10,%RDX |
(3950) 0x4ca0c5 ADD %RAX,%RDX |
(3950) 0x4ca0c8 ADD %RCX,(%R13,%RDX,8) |
(3950) 0x4ca0cd INC %R9 |
(3950) 0x4ca0d0 CMP %R9,%R8 |
(3950) 0x4ca0d3 JE 4c9c4d |
(3950) 0x4ca0d9 MOV (%R12),%R10 |
(3950) 0x4ca0dd MOV %R10,%R11 |
(3950) 0x4ca0e0 IMUL %R9,%R11 |
(3950) 0x4ca0e4 LEA -0x1(%R10,%R11,4),%RAX |
(3950) 0x4ca0e9 MOV %RAX,%RCX |
(3950) 0x4ca0ec OR %R15,%RCX |
(3950) 0x4ca0ef SHR $0x20,%RCX |
(3950) 0x4ca0f3 JE 4ca110 |
(3950) 0x4ca0f5 CQTO |
(3950) 0x4ca0f7 IDIV %R15 |
(3950) 0x4ca0fa MOV %RDX,%RCX |
(3950) 0x4ca0fd MOV %RAX,%RSI |
(3950) 0x4ca100 JMP 4ca119 |
0x4ca102 NOPW %CS:(%RAX,%RAX,1) |
(3950) 0x4ca110 XOR %EDX,%EDX |
(3950) 0x4ca112 DIV %R15D |
(3950) 0x4ca115 MOV %EDX,%ECX |
(3950) 0x4ca117 MOV %EAX,%ESI |
(3950) 0x4ca119 SAL $0x2,%R11 |
(3950) 0x4ca11d LEA -0x1(%R11,%R10,2),%RAX |
(3950) 0x4ca122 MOV %RAX,%RDX |
(3950) 0x4ca125 OR %R15,%RDX |
(3950) 0x4ca128 SHR $0x20,%RDX |
(3950) 0x4ca12c JE 4ca140 |
(3950) 0x4ca12e CQTO |
(3950) 0x4ca130 IDIV %R15 |
(3950) 0x4ca133 JMP 4ca145 |
0x4ca135 NOPW %CS:(%RAX,%RAX,1) |
(3950) 0x4ca140 XOR %EDX,%EDX |
(3950) 0x4ca142 DIV %R15D |
(3950) 0x4ca145 IMUL %R10,%RCX |
(3950) 0x4ca149 ADD %RSI,%RCX |
(3950) 0x4ca14c MOV (%R13,%RCX,8),%RCX |
(3950) 0x4ca151 IMUL %R10,%RDX |
(3950) 0x4ca155 ADD %RAX,%RDX |
(3950) 0x4ca158 ADD %RCX,(%R13,%RDX,8) |
(3950) 0x4ca15d MOV (%R12),%R10 |
(3950) 0x4ca161 MOV %R10,%R11 |
(3950) 0x4ca164 IMUL %R9,%R11 |
(3950) 0x4ca168 SAL $0x2,%R11 |
(3950) 0x4ca16c LEA -0x1(%R11,%R10,2),%RAX |
(3950) 0x4ca171 MOV %RAX,%RCX |
(3950) 0x4ca174 OR %R15,%RCX |
(3950) 0x4ca177 SHR $0x20,%RCX |
(3950) 0x4ca17b JE 4ca190 |
(3950) 0x4ca17d CQTO |
(3950) 0x4ca17f IDIV %R15 |
(3950) 0x4ca182 MOV %RDX,%RCX |
(3950) 0x4ca185 MOV %RAX,%RSI |
(3950) 0x4ca188 JMP 4ca199 |
0x4ca18a NOPW (%RAX,%RAX,1) |
(3950) 0x4ca190 XOR %EDX,%EDX |
(3950) 0x4ca192 DIV %R15D |
(3950) 0x4ca195 MOV %EDX,%ECX |
(3950) 0x4ca197 MOV %EAX,%ESI |
(3950) 0x4ca199 LEA (%R10,%R10,2),%RAX |
(3950) 0x4ca19d LEA -0x1(%R11,%RAX,1),%RAX |
(3950) 0x4ca1a2 MOV %RAX,%RDX |
(3950) 0x4ca1a5 OR %R15,%RDX |
(3950) 0x4ca1a8 SHR $0x20,%RDX |
(3950) 0x4ca1ac JE 4ca1c0 |
(3950) 0x4ca1ae CQTO |
(3950) 0x4ca1b0 IDIV %R15 |
(3950) 0x4ca1b3 JMP 4ca1c5 |
0x4ca1b5 NOPW %CS:(%RAX,%RAX,1) |
(3950) 0x4ca1c0 XOR %EDX,%EDX |
(3950) 0x4ca1c2 DIV %R15D |
(3950) 0x4ca1c5 IMUL %R10,%RCX |
(3950) 0x4ca1c9 ADD %RSI,%RCX |
(3950) 0x4ca1cc MOV (%R13,%RCX,8),%RCX |
(3950) 0x4ca1d1 IMUL %R10,%RDX |
(3950) 0x4ca1d5 ADD %RAX,%RDX |
(3950) 0x4ca1d8 ADD %RCX,(%R13,%RDX,8) |
(3950) 0x4ca1dd MOV (%R12),%R10 |
(3950) 0x4ca1e1 LEA (%R10,%R10,2),%RAX |
(3950) 0x4ca1e5 LEA (,%R10,4),%RDI |
(3950) 0x4ca1ed MOV %RDI,%R11 |
(3950) 0x4ca1f0 IMUL %R9,%R11 |
(3950) 0x4ca1f4 LEA -0x1(%R11,%RAX,1),%RAX |
(3950) 0x4ca1f9 MOV %RAX,%RCX |
(3950) 0x4ca1fc OR %R15,%RCX |
(3950) 0x4ca1ff SHR $0x20,%RCX |
(3950) 0x4ca203 JE 4ca220 |
(3950) 0x4ca205 CQTO |
(3950) 0x4ca207 IDIV %R15 |
(3950) 0x4ca20a MOV %RDX,%RCX |
(3950) 0x4ca20d MOV %RAX,%RSI |
(3950) 0x4ca210 JMP 4ca229 |
0x4ca212 NOPW %CS:(%RAX,%RAX,1) |
(3950) 0x4ca220 XOR %EDX,%EDX |
(3950) 0x4ca222 DIV %R15D |
(3950) 0x4ca225 MOV %EDX,%ECX |
(3950) 0x4ca227 MOV %EAX,%ESI |
(3950) 0x4ca229 LEA -0x1(%RDI,%R11,1),%RAX |
(3950) 0x4ca22e MOV %RAX,%RDX |
(3950) 0x4ca231 OR %R15,%RDX |
(3950) 0x4ca234 SHR $0x20,%RDX |
(3950) 0x4ca238 JE 4ca250 |
(3950) 0x4ca23a CQTO |
(3950) 0x4ca23c IDIV %R15 |
(3950) 0x4ca23f JMP 4ca255 |
0x4ca241 NOPW %CS:(%RAX,%RAX,1) |
(3950) 0x4ca250 XOR %EDX,%EDX |
(3950) 0x4ca252 DIV %R15D |
(3950) 0x4ca255 IMUL %R10,%RCX |
(3950) 0x4ca259 ADD %RSI,%RCX |
(3950) 0x4ca25c MOV (%R13,%RCX,8),%RCX |
(3950) 0x4ca261 IMUL %R10,%RDX |
(3950) 0x4ca265 ADD %RAX,%RDX |
(3950) 0x4ca268 ADD %RCX,(%R13,%RDX,8) |
(3950) 0x4ca26d MOV (%R12),%R10 |
(3950) 0x4ca271 LEA (,%R10,4),%R11 |
(3950) 0x4ca279 IMUL %R9,%R11 |
(3950) 0x4ca27d LEA -0x1(%R11,%R10,4),%RAX |
(3950) 0x4ca282 MOV %RAX,%RCX |
(3950) 0x4ca285 OR %R15,%RCX |
(3950) 0x4ca288 SHR $0x20,%RCX |
(3950) 0x4ca28c JE 4ca2a0 |
(3950) 0x4ca28e CQTO |
(3950) 0x4ca290 IDIV %R15 |
(3950) 0x4ca293 MOV %RDX,%RCX |
(3950) 0x4ca296 MOV %RAX,%RSI |
(3950) 0x4ca299 JMP 4ca2a9 |
0x4ca29b NOPL (%RAX,%RAX,1) |
(3950) 0x4ca2a0 XOR %EDX,%EDX |
(3950) 0x4ca2a2 DIV %R15D |
(3950) 0x4ca2a5 MOV %EDX,%ECX |
(3950) 0x4ca2a7 MOV %EAX,%ESI |
(3950) 0x4ca2a9 LEA (%R10,%R10,4),%RAX |
(3950) 0x4ca2ad LEA -0x1(%R11,%RAX,1),%RAX |
(3950) 0x4ca2b2 MOV %RAX,%RDX |
(3950) 0x4ca2b5 OR %R15,%RDX |
(3950) 0x4ca2b8 SHR $0x20,%RDX |
(3950) 0x4ca2bc JNE 4ca0b0 |
(3950) 0x4ca2c2 XOR %EDX,%EDX |
(3950) 0x4ca2c4 DIV %R15D |
(3950) 0x4ca2c7 JMP 4ca0b5 |
0x4ca2cc INC %R8 |
0x4ca2cf JMP 4ca306 |
0x4ca2d1 NOPW %CS:(%RAX,%RAX,1) |
(3949) 0x4ca2e0 CQTO |
(3949) 0x4ca2e2 IDIV %R15 |
(3949) 0x4ca2e5 IMUL %RDI,%RCX |
(3949) 0x4ca2e9 ADD %RSI,%RCX |
(3949) 0x4ca2ec MOV (%R13,%RCX,8),%RCX |
(3949) 0x4ca2f1 IMUL %RDI,%RDX |
(3949) 0x4ca2f5 ADD %RAX,%RDX |
(3949) 0x4ca2f8 ADD %RCX,(%R13,%RDX,8) |
(3949) 0x4ca2fd CMP %R8,%R15 |
(3949) 0x4ca300 JE 4c9c65 |
(3949) 0x4ca306 MOV (%R12),%RDI |
(3949) 0x4ca30a MOV %RDI,%RAX |
(3949) 0x4ca30d IMUL %R8,%RAX |
(3949) 0x4ca311 DEC %RAX |
(3949) 0x4ca314 MOV %RAX,%RCX |
(3949) 0x4ca317 OR %R15,%RCX |
(3949) 0x4ca31a SHR $0x20,%RCX |
(3949) 0x4ca31e JE 4ca330 |
(3949) 0x4ca320 CQTO |
(3949) 0x4ca322 IDIV %R15 |
(3949) 0x4ca325 MOV %RDX,%RCX |
(3949) 0x4ca328 MOV %RAX,%RSI |
(3949) 0x4ca32b JMP 4ca339 |
0x4ca32d NOPL (%RAX) |
(3949) 0x4ca330 XOR %EDX,%EDX |
(3949) 0x4ca332 DIV %R15D |
(3949) 0x4ca335 MOV %EDX,%ECX |
(3949) 0x4ca337 MOV %EAX,%ESI |
(3949) 0x4ca339 INC %R8 |
(3949) 0x4ca33c MOV %RDI,%RAX |
(3949) 0x4ca33f IMUL %R8,%RAX |
(3949) 0x4ca343 DEC %RAX |
(3949) 0x4ca346 MOV %RAX,%RDX |
(3949) 0x4ca349 OR %R15,%RDX |
(3949) 0x4ca34c SHR $0x20,%RDX |
(3949) 0x4ca350 JNE 4ca2e0 |
(3949) 0x4ca352 XOR %EDX,%EDX |
(3949) 0x4ca354 DIV %R15D |
(3949) 0x4ca357 JMP 4ca2e5 |
0x4ca359 LEA -0x1(%R10),%RAX |
0x4ca35d NOPL (%RAX) |
(3943) 0x4ca360 MOV -0x8(%RBX,%R10,8),%RSI |
(3943) 0x4ca365 CMP %RSI,%RCX |
(3943) 0x4ca368 JLE 4ca39b |
(3943) 0x4ca36a MOV -0x8(%R9,%RCX,8),%RSI |
(3943) 0x4ca36f DEC %RCX |
(3943) 0x4ca372 MOV (%R12),%RDI |
(3943) 0x4ca376 IMUL %R14,%RDI |
(3943) 0x4ca37a ADD %RSI,%RDI |
(3943) 0x4ca37d LEA (%R13,%RDI,8),%RDI |
(3943) 0x4ca382 DECQ (%RDI) |
(3943) 0x4ca385 MOV (%R12),%RDI |
(3943) 0x4ca389 IMUL %R14,%RDI |
(3943) 0x4ca38d ADD %RSI,%RDI |
(3943) 0x4ca390 MOV (%R13,%RDI,8),%RSI |
(3943) 0x4ca395 MOV %RAX,(%R15,%RSI,8) |
(3943) 0x4ca399 JMP 4ca360 |
0x4ca39b MOV %RSI,%RCX |
0x4ca39e CMP %RDX,%R10 |
0x4ca3a1 JNE 4ca3b9 |
0x4ca3a3 JMP 4ca469 |
0x4ca3a8 NOPL (%RAX,%RAX,1) |
(3940) 0x4ca3b0 CMP %R8,%RAX |
(3940) 0x4ca3b3 JLE 4ca469 |
(3940) 0x4ca3b9 MOV -0x8(%RBX,%RAX,8),%RDX |
(3940) 0x4ca3be CMP %RDX,%RCX |
(3940) 0x4ca3c1 JLE 4ca409 |
(3940) 0x4ca3c3 LEA -0x1(%RAX),%RSI |
(3940) 0x4ca3c7 NOPW (%RAX,%RAX,1) |
(3942) 0x4ca3d0 MOV -0x8(%R9,%RCX,8),%RDX |
(3942) 0x4ca3d5 DEC %RCX |
(3942) 0x4ca3d8 MOV (%R12),%RDI |
(3942) 0x4ca3dc IMUL %R14,%RDI |
(3942) 0x4ca3e0 ADD %RDX,%RDI |
(3942) 0x4ca3e3 LEA (%R13,%RDI,8),%RDI |
(3942) 0x4ca3e8 DECQ (%RDI) |
(3942) 0x4ca3eb MOV (%R12),%RDI |
(3942) 0x4ca3ef IMUL %R14,%RDI |
(3942) 0x4ca3f3 ADD %RDX,%RDI |
(3942) 0x4ca3f6 MOV (%R13,%RDI,8),%RDX |
(3942) 0x4ca3fb MOV %RSI,(%R15,%RDX,8) |
(3942) 0x4ca3ff MOV -0x8(%RBX,%RAX,8),%RDX |
(3942) 0x4ca404 CMP %RDX,%RCX |
(3942) 0x4ca407 JG 4ca3d0 |
(3940) 0x4ca409 MOV -0x10(%RBX,%RAX,8),%RCX |
(3940) 0x4ca40e ADD $-0x2,%RAX |
(3940) 0x4ca412 CMP %RCX,%RDX |
(3940) 0x4ca415 JLE 4ca3b0 |
(3940) 0x4ca417 NOPW (%RAX,%RAX,1) |
(3941) 0x4ca420 MOV -0x8(%R9,%RDX,8),%RCX |
(3941) 0x4ca425 DEC %RDX |
(3941) 0x4ca428 MOV (%R12),%RSI |
(3941) 0x4ca42c IMUL %R14,%RSI |
(3941) 0x4ca430 ADD %RCX,%RSI |
(3941) 0x4ca433 LEA (%R13,%RSI,8),%RSI |
(3941) 0x4ca438 DECQ (%RSI) |
(3941) 0x4ca43b MOV (%R12),%RSI |
(3941) 0x4ca43f IMUL %R14,%RSI |
(3941) 0x4ca443 ADD %RCX,%RSI |
(3941) 0x4ca446 MOV (%R13,%RSI,8),%RCX |
(3941) 0x4ca44b MOV %RAX,(%R15,%RCX,8) |
(3941) 0x4ca44f MOV (%RBX,%RAX,8),%RCX |
(3941) 0x4ca453 CMP %RCX,%RDX |
(3941) 0x4ca456 JG 4ca420 |
(3940) 0x4ca458 JMP 4ca3b0 |
0x4ca45d MOV %RDI,%RDX |
0x4ca460 MOV -0x38(%RBP),%RSI |
0x4ca464 CMP %R8,%RSI |
0x4ca467 JNE 4ca485 |
0x4ca469 ADD $0x48,%RSP |
0x4ca46d POP %RBX |
0x4ca46e POP %R12 |
0x4ca470 POP %R13 |
0x4ca472 POP %R14 |
0x4ca474 POP %R15 |
0x4ca476 POP %RBP |
0x4ca477 RET |
0x4ca478 NOPL (%RAX,%RAX,1) |
(3944) 0x4ca480 CMP %R9,%RCX |
(3944) 0x4ca483 JLE 4ca469 |
(3944) 0x4ca485 MOV -0x8(%RBX,%RCX,8),%RSI |
(3944) 0x4ca48a CMP %RSI,%RDX |
(3944) 0x4ca48d JLE 4ca4e5 |
(3944) 0x4ca48f LEA -0x1(%RCX),%RDI |
(3944) 0x4ca493 NOPW %CS:(%RAX,%RAX,1) |
(3946) 0x4ca4a0 MOV -0x8(%R10,%RDX,8),%RSI |
(3946) 0x4ca4a5 MOV (%R12),%R8 |
(3946) 0x4ca4a9 IMUL %R14,%R8 |
(3946) 0x4ca4ad ADD %RSI,%R8 |
(3946) 0x4ca4b0 LEA (%R13,%R8,8),%R8 |
(3946) 0x4ca4b5 DECQ (%R8) |
(3946) 0x4ca4b8 MOV (%R12),%R8 |
(3946) 0x4ca4bc IMUL %R14,%R8 |
(3946) 0x4ca4c0 ADD %RSI,%R8 |
(3946) 0x4ca4c3 VMOVSD -0x8(%R11,%RDX,8),%XMM0 |
(3946) 0x4ca4ca DEC %RDX |
(3946) 0x4ca4cd MOV (%R13,%R8,8),%RSI |
(3946) 0x4ca4d2 VMOVSD %XMM0,(%RAX,%RSI,8) |
(3946) 0x4ca4d7 MOV %RDI,(%R15,%RSI,8) |
(3946) 0x4ca4db MOV -0x8(%RBX,%RCX,8),%RSI |
(3946) 0x4ca4e0 CMP %RSI,%RDX |
(3946) 0x4ca4e3 JG 4ca4a0 |
(3944) 0x4ca4e5 MOV -0x10(%RBX,%RCX,8),%RDX |
(3944) 0x4ca4ea ADD $-0x2,%RCX |
(3944) 0x4ca4ee CMP %RDX,%RSI |
(3944) 0x4ca4f1 JLE 4ca480 |
(3944) 0x4ca4f3 NOPW %CS:(%RAX,%RAX,1) |
(3945) 0x4ca500 MOV -0x8(%R10,%RSI,8),%RDX |
(3945) 0x4ca505 MOV (%R12),%RDI |
(3945) 0x4ca509 IMUL %R14,%RDI |
(3945) 0x4ca50d ADD %RDX,%RDI |
(3945) 0x4ca510 LEA (%R13,%RDI,8),%RDI |
(3945) 0x4ca515 DECQ (%RDI) |
(3945) 0x4ca518 MOV (%R12),%RDI |
(3945) 0x4ca51c IMUL %R14,%RDI |
(3945) 0x4ca520 ADD %RDX,%RDI |
(3945) 0x4ca523 VMOVSD -0x8(%R11,%RSI,8),%XMM0 |
(3945) 0x4ca52a DEC %RSI |
(3945) 0x4ca52d MOV (%R13,%RDI,8),%RDX |
(3945) 0x4ca532 VMOVSD %XMM0,(%RAX,%RDX,8) |
(3945) 0x4ca537 MOV %RCX,(%R15,%RDX,8) |
(3945) 0x4ca53b MOV (%RBX,%RCX,8),%RDX |
(3945) 0x4ca53f CMP %RDX,%RSI |
(3945) 0x4ca542 JG 4ca500 |
(3944) 0x4ca544 JMP 4ca480 |
0x4ca549 NOPL (%RAX) |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►100.00+ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Path / |
Source file and lines | csr_matop.c:380-560 |
Module | exec |
nb instructions | 253 |
nb uops | 277 |
loop length | 1062 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 14 |
micro-operation queue | 46.33 cycles |
front end | 46.33 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 18.10 | 18.00 | 19.00 | 19.00 | 16.00 | 18.00 | 17.90 | 16.00 | 16.00 | 16.00 | 18.00 | 19.00 |
cycles | 18.10 | 21.80 | 19.00 | 19.00 | 16.00 | 18.00 | 17.90 | 16.00 | 16.00 | 16.00 | 18.00 | 19.00 |
Cycles executing div or sqrt instructions | 16.00 |
FE+BE cycles | 43.20-43.25 |
Stall cycles | 0.00 |
Front-end | 46.33 |
Dispatch | 21.80 |
DIV/SQRT | 16.00 |
Overall L1 | 46.33 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 0% |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 10% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x48,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R8,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 4d6de0 <hypre_NumActiveThreads> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4d6df0 <hypre_GetThreadNum> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4cb940 <hypre_CSRMatrixGetLoadBalancedPartitionBegin> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4cb9c0 <hypre_CSRMatrixGetLoadBalancedPartitionEnd> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R12,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4c9aef <hypre_CSRMatrixTranspose.extracted+0x8f> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x251140(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4f4345,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4f635b,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d53b0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4f62d4,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1d7,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d7ce0 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x38(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x40(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4c9afd <hypre_CSRMatrixTranspose.extracted+0x9d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RAX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4c9b35 <hypre_CSRMatrixTranspose.extracted+0xd5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x2510fc(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4f4345,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4f636a,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d53b0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4f62d4,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1d8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d7ce0 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x38(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RCX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4c9b47 <hypre_CSRMatrixTranspose.extracted+0xe7> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4c9b75 <hypre_CSRMatrixTranspose.extracted+0x115> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x2510b2(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4f4345,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4f638d,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d53b0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4f62d4,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1d9,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d7ce0 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%R12),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%R13,%RAX,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4e0070 <__intel_avx_rep_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x38(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX,%RAX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP (%RBX,%RSI,8),%RAX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JGE 4c9bcd <hypre_CSRMatrixTranspose.extracted+0x16d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x719ab0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 40fef0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%R12),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA 0x1(%R14),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x1(%RCX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R9,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R11,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 4c9cfb <hypre_CSRMatrixTranspose.extracted+0x29b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R11,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x30(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R15),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x719ad0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 40fef0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%R15),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x58(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x719af0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 410060 <__kmpc_masked@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
CMP $0x1,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4c9c72 <hypre_CSRMatrixTranspose.extracted+0x212> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP $0x1,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x30(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4c9c65 <hypre_CSRMatrixTranspose.extracted+0x205> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%R15),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP $0x4,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 4ca09a <hypre_CSRMatrixTranspose.extracted+0x63a> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RAX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x30(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 4ca2cc <hypre_CSRMatrixTranspose.extracted+0x86c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R9),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x719b10,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 40fe80 <__kmpc_end_masked@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x719b30,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 40fef0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV -0x60(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4c9f92 <hypre_CSRMatrixTranspose.extracted+0x532> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %RDI,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA -0x1(%RCX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %R15,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE 4c9e46 <hypre_CSRMatrixTranspose.extracted+0x3e6> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %R15 | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
JMP 4c9e4b <hypre_CSRMatrixTranspose.extracted+0x3eb> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %R15D | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV %RDI,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R8,%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
DEC %RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RSI,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c9f92 <hypre_CSRMatrixTranspose.extracted+0x532> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
IMUL %RDI,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RAX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV (%R13,%RDX,8),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4c9e9c <hypre_CSRMatrixTranspose.extracted+0x43c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x30(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x719b50,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 40fef0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
CMPQ $0,-0x68(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 4c9fed <hypre_CSRMatrixTranspose.extracted+0x58d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x40(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R9,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x10(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x50(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4ca469 <hypre_CSRMatrixTranspose.extracted+0xa09> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x28(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX,%RSI,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %ESI,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R9D,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA 0x1(%R9),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST $0x1,%CL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 4ca020 <hypre_CSRMatrixTranspose.extracted+0x5c0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RSI,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %R8,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4ca485 <hypre_CSRMatrixTranspose.extracted+0xa25> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4ca469 <hypre_CSRMatrixTranspose.extracted+0xa09> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x40(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R8,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x10(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4ca469 <hypre_CSRMatrixTranspose.extracted+0xa09> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%RBX,%R10,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R10D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R8D,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA 0x1(%R8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST $0x1,%AL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 4ca359 <hypre_CSRMatrixTranspose.extracted+0x8f9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R10,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 4ca39e <hypre_CSRMatrixTranspose.extracted+0x93e> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
LEA -0x1(%RSI),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x8(%RBX,%RSI,8),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDI,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4ca45d <hypre_CSRMatrixTranspose.extracted+0x9fd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R8,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x38(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x30(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R8,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4ca485 <hypre_CSRMatrixTranspose.extracted+0xa25> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4ca469 <hypre_CSRMatrixTranspose.extracted+0xa09> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x48(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SHR $0x2,%R8 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4ca0d9 <hypre_CSRMatrixTranspose.extracted+0x679> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
INC %R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 4ca306 <hypre_CSRMatrixTranspose.extracted+0x8a6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x1(%R10),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RDX,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4ca3b9 <hypre_CSRMatrixTranspose.extracted+0x959> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4ca469 <hypre_CSRMatrixTranspose.extracted+0xa09> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x38(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R8,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4ca485 <hypre_CSRMatrixTranspose.extracted+0xa25> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x48,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | csr_matop.c:380-560 |
Module | exec |
nb instructions | 253 |
nb uops | 277 |
loop length | 1062 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 14 |
micro-operation queue | 46.33 cycles |
front end | 46.33 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 18.10 | 18.00 | 19.00 | 19.00 | 16.00 | 18.00 | 17.90 | 16.00 | 16.00 | 16.00 | 18.00 | 19.00 |
cycles | 18.10 | 21.80 | 19.00 | 19.00 | 16.00 | 18.00 | 17.90 | 16.00 | 16.00 | 16.00 | 18.00 | 19.00 |
Cycles executing div or sqrt instructions | 16.00 |
FE+BE cycles | 43.20-43.25 |
Stall cycles | 0.00 |
Front-end | 46.33 |
Dispatch | 21.80 |
DIV/SQRT | 16.00 |
Overall L1 | 46.33 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 0% |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 10% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x48,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R8,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 4d6de0 <hypre_NumActiveThreads> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4d6df0 <hypre_GetThreadNum> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4cb940 <hypre_CSRMatrixGetLoadBalancedPartitionBegin> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4cb9c0 <hypre_CSRMatrixGetLoadBalancedPartitionEnd> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R12,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4c9aef <hypre_CSRMatrixTranspose.extracted+0x8f> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x251140(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4f4345,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4f635b,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d53b0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4f62d4,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1d7,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d7ce0 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x38(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x40(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4c9afd <hypre_CSRMatrixTranspose.extracted+0x9d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RAX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4c9b35 <hypre_CSRMatrixTranspose.extracted+0xd5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x2510fc(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4f4345,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4f636a,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d53b0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4f62d4,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1d8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d7ce0 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x38(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RCX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4c9b47 <hypre_CSRMatrixTranspose.extracted+0xe7> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4c9b75 <hypre_CSRMatrixTranspose.extracted+0x115> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x2510b2(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4f4345,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4f638d,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d53b0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4f62d4,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1d9,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d7ce0 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%R12),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%R13,%RAX,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4e0070 <__intel_avx_rep_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x38(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX,%RAX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP (%RBX,%RSI,8),%RAX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JGE 4c9bcd <hypre_CSRMatrixTranspose.extracted+0x16d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x719ab0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 40fef0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%R12),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA 0x1(%R14),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x1(%RCX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R9,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R11,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 4c9cfb <hypre_CSRMatrixTranspose.extracted+0x29b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R11,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x30(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R15),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x719ad0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 40fef0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%R15),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x58(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x719af0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 410060 <__kmpc_masked@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
CMP $0x1,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4c9c72 <hypre_CSRMatrixTranspose.extracted+0x212> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP $0x1,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x30(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4c9c65 <hypre_CSRMatrixTranspose.extracted+0x205> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%R15),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP $0x4,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 4ca09a <hypre_CSRMatrixTranspose.extracted+0x63a> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RAX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x30(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 4ca2cc <hypre_CSRMatrixTranspose.extracted+0x86c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R9),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x719b10,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 40fe80 <__kmpc_end_masked@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x719b30,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 40fef0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV -0x60(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4c9f92 <hypre_CSRMatrixTranspose.extracted+0x532> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %RDI,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA -0x1(%RCX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %R15,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE 4c9e46 <hypre_CSRMatrixTranspose.extracted+0x3e6> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %R15 | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
JMP 4c9e4b <hypre_CSRMatrixTranspose.extracted+0x3eb> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %R15D | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV %RDI,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R8,%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
DEC %RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RSI,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c9f92 <hypre_CSRMatrixTranspose.extracted+0x532> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
IMUL %RDI,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RAX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV (%R13,%RDX,8),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4c9e9c <hypre_CSRMatrixTranspose.extracted+0x43c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x30(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x719b50,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 40fef0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
CMPQ $0,-0x68(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 4c9fed <hypre_CSRMatrixTranspose.extracted+0x58d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x40(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R9,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x10(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x50(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4ca469 <hypre_CSRMatrixTranspose.extracted+0xa09> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x28(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX,%RSI,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %ESI,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R9D,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA 0x1(%R9),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST $0x1,%CL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 4ca020 <hypre_CSRMatrixTranspose.extracted+0x5c0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RSI,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %R8,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4ca485 <hypre_CSRMatrixTranspose.extracted+0xa25> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4ca469 <hypre_CSRMatrixTranspose.extracted+0xa09> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x40(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R8,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x10(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4ca469 <hypre_CSRMatrixTranspose.extracted+0xa09> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%RBX,%R10,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R10D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R8D,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA 0x1(%R8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST $0x1,%AL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 4ca359 <hypre_CSRMatrixTranspose.extracted+0x8f9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R10,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 4ca39e <hypre_CSRMatrixTranspose.extracted+0x93e> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
LEA -0x1(%RSI),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x8(%RBX,%RSI,8),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDI,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4ca45d <hypre_CSRMatrixTranspose.extracted+0x9fd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R8,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x38(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x30(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R8,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4ca485 <hypre_CSRMatrixTranspose.extracted+0xa25> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4ca469 <hypre_CSRMatrixTranspose.extracted+0xa09> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x48(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SHR $0x2,%R8 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4ca0d9 <hypre_CSRMatrixTranspose.extracted+0x679> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
INC %R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 4ca306 <hypre_CSRMatrixTranspose.extracted+0x8a6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x1(%R10),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RDX,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4ca3b9 <hypre_CSRMatrixTranspose.extracted+0x959> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4ca469 <hypre_CSRMatrixTranspose.extracted+0xa09> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x38(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R8,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4ca485 <hypre_CSRMatrixTranspose.extracted+0xa25> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x48,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_CSRMatrixTranspose.extracted– | 0.17 | 0.03 |
▼Loop 3944 - csr_matop.c:540-548 - exec– | 0.04 | 0.01 |
○Loop 3946 - csr_matop.c:541-548 - exec | 0.04 | 0.01 |
○Loop 3945 - csr_matop.c:541-548 - exec | 0.04 | 0.01 |
○Loop 3951 - csr_matop.c:380-500 - exec | 0.02 | 0.01 |
○Loop 3952 - csr_matop.c:483-485 - exec | 0.01 | 0 |
○Loop 3948 - csr_matop.c:380-527 - exec | 0.01 | 0.01 |
○Loop 3943 - csr_matop.c:554-560 - exec | 0 | 0 |
○Loop 3947 - csr_matop.c:541-548 - exec | 0 | 0 |
○Loop 3949 - csr_matop.c:380-513 - exec | 0 | 0 |
▼Loop 3940 - csr_matop.c:553-560 - exec– | 0 | 0 |
○Loop 3942 - csr_matop.c:554-560 - exec | 0 | 0 |
○Loop 3941 - csr_matop.c:554-560 - exec | 0 | 0 |
○Loop 3950 - csr_matop.c:380-513 - exec | 0 | 0 |