Function: hypre_CSRMatrixMatvecOutOfPlace.extracted.19 | Module: exec | Source: csr_matvec.c:178-206 [...] | Coverage: 0.01% |
---|
Function: hypre_CSRMatrixMatvecOutOfPlace.extracted.19 | Module: exec | Source: csr_matvec.c:178-206 [...] | Coverage: 0.01% |
---|
/scratch_na/users/xoserete/qaas_runs/171-415-3661/intel/AMG/build/AMG/AMG/seq_mv/csr_matvec.c: 178 - 206 |
-------------------------------------------------------------------------------- |
178: #pragma omp parallel for private(i,j,jj,m,tempx) HYPRE_SMP_SCHEDULE |
179: #endif |
180: |
181: for (i = 0; i < num_rownnz; i++) |
182: { |
183: m = A_rownnz[i]; |
[...] |
191: if ( num_vectors==1 ) |
192: { |
193: tempx = 0; |
194: for (jj = A_i[m]; jj < A_i[m+1]; jj++) |
195: tempx += A_data[jj] * x_data[A_j[jj]]; |
196: y_data[m] += tempx; |
197: } |
198: else |
199: for ( j=0; j<num_vectors; ++j ) |
200: { |
201: tempx = 0; |
202: for (jj = A_i[m]; jj < A_i[m+1]; jj++) |
203: tempx += A_data[jj] * x_data[ j*vecstride_x + A_j[jj]*idxstride_x ]; |
204: y_data[ j*vecstride_y + m*idxstride_y] += tempx; |
205: } |
206: } |
0x4ce140 PUSH %RBP |
0x4ce141 MOV %RSP,%RBP |
0x4ce144 PUSH %R15 |
0x4ce146 PUSH %R14 |
0x4ce148 PUSH %R13 |
0x4ce14a PUSH %R12 |
0x4ce14c PUSH %RBX |
0x4ce14d SUB $0x98,%RSP |
0x4ce154 MOV 0x40(%RBP),%RAX |
0x4ce158 MOV %RAX,-0x68(%RBP) |
0x4ce15c MOV 0x38(%RBP),%R12 |
0x4ce160 MOV 0x30(%RBP),%RAX |
0x4ce164 MOV %RAX,-0xb8(%RBP) |
0x4ce16b MOV 0x28(%RBP),%RAX |
0x4ce16f MOV %RAX,-0x78(%RBP) |
0x4ce173 MOV 0x20(%RBP),%RAX |
0x4ce177 MOV %RAX,-0x48(%RBP) |
0x4ce17b MOV 0x18(%RBP),%RAX |
0x4ce17f MOV %RAX,-0x40(%RBP) |
0x4ce183 MOV 0x10(%RBP),%RAX |
0x4ce187 MOV %RAX,-0x60(%RBP) |
0x4ce18b MOVL $0,-0x30(%RBP) |
0x4ce192 MOV %R9,-0x90(%RBP) |
0x4ce199 MOV %R8,-0x58(%RBP) |
0x4ce19d MOV %RCX,-0x38(%RBP) |
0x4ce1a1 MOV %RDX,-0x50(%RBP) |
0x4ce1a5 MOV (%RDI),%ESI |
0x4ce1a7 MOVQ $0,-0x70(%RBP) |
0x4ce1af MOVQ $0x1,-0xc0(%RBP) |
0x4ce1ba SUB $0x8,%RSP |
0x4ce1be LEA -0xc0(%RBP),%RAX |
0x4ce1c5 LEA -0x30(%RBP),%RCX |
0x4ce1c9 LEA -0x70(%RBP),%R8 |
0x4ce1cd LEA 0x50(%RBP),%R9 |
0x4ce1d1 MOV $0x719db0,%EDI |
0x4ce1d6 MOV %ESI,-0x2c(%RBP) |
0x4ce1d9 MOV $0x22,%EDX |
0x4ce1de PUSH $0x1 |
0x4ce1e0 PUSH $0x1 |
0x4ce1e2 PUSH %RAX |
0x4ce1e3 CALL 40fdb0 <__kmpc_for_static_init_8@plt> |
0x4ce1e8 ADD $0x20,%RSP |
0x4ce1ec MOV -0x70(%RBP),%RAX |
0x4ce1f0 MOV 0x50(%RBP),%RCX |
0x4ce1f4 MOV %RAX,-0x88(%RBP) |
0x4ce1fb SUB %RAX,%RCX |
0x4ce1fe MOV %RCX,-0x80(%RBP) |
0x4ce202 JAE 4ce225 |
0x4ce204 MOV $0x719dd0,%EDI |
0x4ce209 MOV -0x2c(%RBP),%ESI |
0x4ce20c ADD $0x98,%RSP |
0x4ce213 POP %RBX |
0x4ce214 POP %R12 |
0x4ce216 POP %R13 |
0x4ce218 POP %R14 |
0x4ce21a POP %R15 |
0x4ce21c POP %RBP |
0x4ce21d VZEROUPPER |
0x4ce220 JMP 40faf0 |
0x4ce225 MOV -0x48(%RBP),%RAX |
0x4ce229 DEC %RAX |
0x4ce22c MOV %RAX,-0xb0(%RBP) |
0x4ce233 VPBROADCASTQ %R12,%YMM0 |
0x4ce239 XOR %ECX,%ECX |
0x4ce23b JMP 4ce265 |
0x4ce23d NOPL (%RAX) |
(4061) 0x4ce240 MOV -0x40(%RBP),%RAX |
(4061) 0x4ce244 MOV (%RAX),%RAX |
(4061) 0x4ce247 VADDSD (%RAX,%RDI,8),%XMM1,%XMM1 |
(4061) 0x4ce24c VMOVSD %XMM1,(%RAX,%RDI,8) |
(4061) 0x4ce251 MOV -0x98(%RBP),%RCX |
(4061) 0x4ce258 LEA 0x1(%RCX),%RAX |
(4061) 0x4ce25c CMP -0x80(%RBP),%RCX |
(4061) 0x4ce260 MOV %RAX,%RCX |
(4061) 0x4ce263 JE 4ce204 |
(4061) 0x4ce265 MOV -0x88(%RBP),%RAX |
(4061) 0x4ce26c MOV %RCX,-0x98(%RBP) |
(4061) 0x4ce273 ADD %RCX,%RAX |
(4061) 0x4ce276 MOV -0x90(%RBP),%RCX |
(4061) 0x4ce27d MOV (%RCX,%RAX,8),%RDI |
(4061) 0x4ce281 CMPQ $0x1,-0x48(%RBP) |
(4061) 0x4ce286 JNE 4ce330 |
(4061) 0x4ce28c MOV -0x38(%RBP),%RAX |
(4061) 0x4ce290 MOV (%RAX),%RAX |
(4061) 0x4ce293 MOV (%RAX,%RDI,8),%R10 |
(4061) 0x4ce297 MOV 0x8(%RAX,%RDI,8),%RAX |
(4061) 0x4ce29c VXORPD %XMM1,%XMM1,%XMM1 |
(4061) 0x4ce2a0 MOV %RAX,%R11 |
(4061) 0x4ce2a3 SUB %R10,%R11 |
(4061) 0x4ce2a6 JLE 4ce240 |
(4061) 0x4ce2a8 MOV -0x50(%RBP),%RCX |
(4061) 0x4ce2ac MOV (%RCX),%RCX |
(4061) 0x4ce2af MOV -0x60(%RBP),%RDX |
(4061) 0x4ce2b3 MOV (%RDX),%RSI |
(4061) 0x4ce2b6 MOV -0x58(%RBP),%RDX |
(4061) 0x4ce2ba MOV (%RDX),%R8 |
(4061) 0x4ce2bd MOV %R11,%R9 |
(4061) 0x4ce2c0 AND $-0x4,%R9 |
(4061) 0x4ce2c4 JE 4ce494 |
(4061) 0x4ce2ca LEA -0x1(%R9),%RDX |
(4061) 0x4ce2ce LEA (%RCX,%R10,8),%RBX |
(4061) 0x4ce2d2 LEA (%R8,%R10,8),%R14 |
(4061) 0x4ce2d6 VXORPD %XMM1,%XMM1,%XMM1 |
(4061) 0x4ce2da XOR %R15D,%R15D |
(4061) 0x4ce2dd NOPL (%RAX) |
(4066) 0x4ce2e0 VMOVUPD (%R14,%R15,8),%YMM2 |
(4066) 0x4ce2e6 KXNORW %K0,%K0,%K1 |
(4066) 0x4ce2ea VXORPD %XMM3,%XMM3,%XMM3 |
(4066) 0x4ce2ee VGATHERQPD (%RSI,%YMM2,8),%YMM3{%K1} |
(4066) 0x4ce2f5 VFMADD231PD (%RBX,%R15,8),%YMM3,%YMM1 |
(4066) 0x4ce2fb ADD $0x4,%R15 |
(4066) 0x4ce2ff CMP %RDX,%R15 |
(4066) 0x4ce302 JBE 4ce2e0 |
(4061) 0x4ce304 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(4061) 0x4ce30a VADDPD %XMM2,%XMM1,%XMM1 |
(4061) 0x4ce30e VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(4061) 0x4ce313 VADDSD %XMM2,%XMM1,%XMM1 |
(4061) 0x4ce317 CMP %R9,%R11 |
(4061) 0x4ce31a JE 4ce240 |
(4061) 0x4ce320 JMP 4ce497 |
0x4ce325 NOPW %CS:(%RAX,%RAX,1) |
(4061) 0x4ce330 JL 4ce251 |
(4061) 0x4ce336 MOV -0x38(%RBP),%RAX |
(4061) 0x4ce33a MOV (%RAX),%RAX |
(4061) 0x4ce33d MOV (%RAX,%RDI,8),%R8 |
(4061) 0x4ce341 MOV 0x8(%RAX,%RDI,8),%R9 |
(4061) 0x4ce346 MOV -0x40(%RBP),%RAX |
(4061) 0x4ce34a MOV (%RAX),%R10 |
(4061) 0x4ce34d MOV %R9,%RBX |
(4061) 0x4ce350 SUB %R8,%RBX |
(4061) 0x4ce353 IMUL -0x78(%RBP),%RDI |
(4061) 0x4ce358 MOV %RBX,-0xa8(%RBP) |
(4061) 0x4ce35f AND $-0x4,%RBX |
(4061) 0x4ce363 LEA -0x1(%RBX),%RCX |
(4061) 0x4ce367 LEA (,%R8,8),%RAX |
(4061) 0x4ce36f MOV %RAX,-0xa0(%RBP) |
(4061) 0x4ce376 XOR %EDX,%EDX |
(4061) 0x4ce378 JMP 4ce3ae |
0x4ce37a NOPW (%RAX,%RAX,1) |
(4062) 0x4ce380 MOV %RDX,%RAX |
(4062) 0x4ce383 IMUL -0xb8(%RBP),%RAX |
(4062) 0x4ce38b ADD %RDI,%RAX |
(4062) 0x4ce38e VADDSD (%R10,%RAX,8),%XMM1,%XMM1 |
(4062) 0x4ce394 VMOVSD %XMM1,(%R10,%RAX,8) |
(4062) 0x4ce39a LEA 0x1(%RDX),%RAX |
(4062) 0x4ce39e CMP -0xb0(%RBP),%RDX |
(4062) 0x4ce3a5 MOV %RAX,%RDX |
(4062) 0x4ce3a8 JE 4ce251 |
(4062) 0x4ce3ae VXORPD %XMM1,%XMM1,%XMM1 |
(4062) 0x4ce3b2 CMP %R8,%R9 |
(4062) 0x4ce3b5 JLE 4ce380 |
(4062) 0x4ce3b7 MOV -0x50(%RBP),%RAX |
(4062) 0x4ce3bb MOV (%RAX),%R15 |
(4062) 0x4ce3be MOV -0x60(%RBP),%RAX |
(4062) 0x4ce3c2 MOV (%RAX),%RSI |
(4062) 0x4ce3c5 MOV -0x58(%RBP),%RAX |
(4062) 0x4ce3c9 MOV (%RAX),%RAX |
(4062) 0x4ce3cc TEST %RBX,%RBX |
(4062) 0x4ce3cf JE 4ce453 |
(4062) 0x4ce3d5 MOV %RDX,%R11 |
(4062) 0x4ce3d8 IMUL -0x68(%RBP),%R11 |
(4062) 0x4ce3dd VPBROADCASTQ %R11,%YMM2 |
(4062) 0x4ce3e3 MOV -0xa0(%RBP),%R14 |
(4062) 0x4ce3ea LEA (%R15,%R14,1),%R11 |
(4062) 0x4ce3ee LEA (%RAX,%R14,1),%R13 |
(4062) 0x4ce3f2 VXORPD %XMM1,%XMM1,%XMM1 |
(4062) 0x4ce3f6 XOR %R14D,%R14D |
(4062) 0x4ce3f9 NOPL (%RAX) |
(4064) 0x4ce400 VXORPS %XMM3,%XMM3,%XMM3 |
(4064) 0x4ce404 VPMULLQ (%R13,%R14,8),%YMM0,%YMM3 |
(4064) 0x4ce40c VPADDQ %YMM2,%YMM3,%YMM3 |
(4064) 0x4ce410 VXORPD %XMM4,%XMM4,%XMM4 |
(4064) 0x4ce414 KXNORW %K0,%K0,%K1 |
(4064) 0x4ce418 VGATHERQPD (%RSI,%YMM3,8),%YMM4{%K1} |
(4064) 0x4ce41f VFMADD231PD (%R11,%R14,8),%YMM4,%YMM1 |
(4064) 0x4ce425 ADD $0x4,%R14 |
(4064) 0x4ce429 CMP %RCX,%R14 |
(4064) 0x4ce42c JBE 4ce400 |
(4062) 0x4ce42e VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(4062) 0x4ce434 VADDPD %XMM2,%XMM1,%XMM1 |
(4062) 0x4ce438 VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(4062) 0x4ce43d VADDSD %XMM2,%XMM1,%XMM1 |
(4062) 0x4ce441 MOV %RBX,%R11 |
(4062) 0x4ce444 CMP %RBX,-0xa8(%RBP) |
(4062) 0x4ce44b JE 4ce380 |
(4062) 0x4ce451 JMP 4ce456 |
(4062) 0x4ce453 XOR %R11D,%R11D |
(4062) 0x4ce456 MOV %RDX,%R13 |
(4062) 0x4ce459 IMUL -0x68(%RBP),%R13 |
(4062) 0x4ce45e ADD %R8,%R11 |
(4062) 0x4ce461 NOPW %CS:(%RAX,%RAX,1) |
(4063) 0x4ce470 MOV (%RAX,%R11,8),%R14 |
(4063) 0x4ce474 IMUL %R12,%R14 |
(4063) 0x4ce478 ADD %R13,%R14 |
(4063) 0x4ce47b VMOVSD (%RSI,%R14,8),%XMM2 |
(4063) 0x4ce481 VFMADD231SD (%R15,%R11,8),%XMM2,%XMM1 |
(4063) 0x4ce487 INC %R11 |
(4063) 0x4ce48a CMP %R11,%R9 |
(4063) 0x4ce48d JNE 4ce470 |
(4062) 0x4ce48f JMP 4ce380 |
(4061) 0x4ce494 XOR %R9D,%R9D |
(4061) 0x4ce497 ADD %R10,%R9 |
(4061) 0x4ce49a NOPW (%RAX,%RAX,1) |
(4065) 0x4ce4a0 MOV (%R8,%R9,8),%RDX |
(4065) 0x4ce4a4 VMOVSD (%RSI,%RDX,8),%XMM2 |
(4065) 0x4ce4a9 VFMADD231SD (%RCX,%R9,8),%XMM2,%XMM1 |
(4065) 0x4ce4af INC %R9 |
(4065) 0x4ce4b2 CMP %R9,%RAX |
(4065) 0x4ce4b5 JNE 4ce4a0 |
(4061) 0x4ce4b7 JMP 4ce240 |
0x4ce4bc NOPL (%RAX) |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►97.22+ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so | |
○2.78 | __kmp_invoke_task_func | libiomp5.so |
Path / |
Source file and lines | csr_matvec.c:178-206 |
Module | exec |
nb instructions | 69 |
nb uops | 71 |
loop length | 277 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 1 |
used zmm registers | 0 |
nb stack references | 25 |
micro-operation queue | 11.83 cycles |
front end | 11.83 cycles |
Port | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 1.70 | 1.60 | 6.00 | 6.00 | 13.50 | 1.60 | 1.50 | 13.50 | 13.50 | 13.50 | 1.60 | 6.00 |
cycles | 1.70 | 1.60 | 6.00 | 6.00 | 13.50 | 1.60 | 1.50 | 13.50 | 13.50 | 13.50 | 1.60 | 6.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 13.59 |
Stall cycles | 1.64-1.64 |
RS full (events) | 5.17-4.80 |
Front-end | 11.83 |
Dispatch | 13.50 |
Overall L1 | 13.50 |
Vectorization ratios |
all | 3% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 25% |
Vector efficiency ratios |
all | 11% |
load | 9% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x98,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x38(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x18(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVL $0,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVQ $0x1,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0xc0(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x30(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x70(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x50(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x719db0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,-0x2c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x22,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
CALL 40fdb0 <__kmpc_for_static_init_8@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x20,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x70(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x50(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JAE 4ce225 <hypre_CSRMatrixMatvecOutOfPlace.extracted.19+0xe5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x719dd0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x2c(%RBP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD $0x98,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JMP 40faf0 <__kmpc_for_static_fini@plt> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
DEC %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ %R12,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4ce265 <hypre_CSRMatrixMatvecOutOfPlace.extracted.19+0x125> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | csr_matvec.c:178-206 |
Module | exec |
nb instructions | 69 |
nb uops | 71 |
loop length | 277 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 1 |
used zmm registers | 0 |
nb stack references | 25 |
micro-operation queue | 11.83 cycles |
front end | 11.83 cycles |
Port | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 1.70 | 1.60 | 6.00 | 6.00 | 13.50 | 1.60 | 1.50 | 13.50 | 13.50 | 13.50 | 1.60 | 6.00 |
cycles | 1.70 | 1.60 | 6.00 | 6.00 | 13.50 | 1.60 | 1.50 | 13.50 | 13.50 | 13.50 | 1.60 | 6.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 13.59 |
Stall cycles | 1.64-1.64 |
RS full (events) | 5.17-4.80 |
Front-end | 11.83 |
Dispatch | 13.50 |
Overall L1 | 13.50 |
Vectorization ratios |
all | 3% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 25% |
Vector efficiency ratios |
all | 11% |
load | 9% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x98,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x38(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x18(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVL $0,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVQ $0x1,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0xc0(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x30(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x70(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x50(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x719db0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,-0x2c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x22,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
CALL 40fdb0 <__kmpc_for_static_init_8@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x20,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x70(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x50(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JAE 4ce225 <hypre_CSRMatrixMatvecOutOfPlace.extracted.19+0xe5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x719dd0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x2c(%RBP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD $0x98,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JMP 40faf0 <__kmpc_for_static_fini@plt> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
DEC %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ %R12,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4ce265 <hypre_CSRMatrixMatvecOutOfPlace.extracted.19+0x125> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_CSRMatrixMatvecOutOfPlace.extracted.19– | 0.01 | 0 |
▼Loop 4061 - csr_matvec.c:181-206 - exec– | 0.01 | 0 |
○Loop 4066 - csr_matvec.c:194-195 - exec | 0.01 | 0 |
▼Loop 4062 - csr_matvec.c:199-204 - exec– | 0 | 0 |
○Loop 4064 - csr_matvec.c:202-203 - exec | 0 | 0 |
○Loop 4063 - csr_matvec.c:202-203 - exec | 0 | 0 |
○Loop 4065 - csr_matvec.c:194-195 - exec | 0 | 0 |