Function: hypre_CSRMatrixMatvecOutOfPlace.extracted | Module: exec | Source: csr_matvec.c:243-404 [...] | Coverage: 12.09% |
---|
Function: hypre_CSRMatrixMatvecOutOfPlace.extracted | Module: exec | Source: csr_matvec.c:243-404 [...] | Coverage: 12.09% |
---|
/scratch_na/users/xoserete/qaas_runs/171-415-3661/intel/AMG/build/AMG/AMG/seq_mv/csr_matvec.c: 243 - 404 |
-------------------------------------------------------------------------------- |
243: #pragma omp parallel private(i,jj,tempx) |
244: #endif |
245: { |
246: HYPRE_Int iBegin = hypre_CSRMatrixGetLoadBalancedPartitionBegin(A); |
247: HYPRE_Int iEnd = hypre_CSRMatrixGetLoadBalancedPartitionEnd(A); |
248: hypre_assert(iBegin <= iEnd); |
249: hypre_assert(iBegin >= 0 && iBegin <= num_rows); |
250: hypre_assert(iEnd >= 0 && iEnd <= num_rows); |
251: |
252: if (0 == temp) |
253: { |
254: if (1 == alpha) // JSP: a common path |
255: { |
256: for (i = iBegin; i < iEnd; i++) |
257: { |
258: tempx = 0.0; |
259: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
260: { |
261: tempx += A_data[jj] * x_data[A_j[jj]]; |
262: } |
263: y_data[i] = tempx; |
264: } |
265: } // y = A*x |
266: else if (-1 == alpha) |
267: { |
268: for (i = iBegin; i < iEnd; i++) |
269: { |
270: tempx = 0.0; |
271: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
272: { |
273: tempx -= A_data[jj] * x_data[A_j[jj]]; |
274: } |
275: y_data[i] = tempx; |
276: } |
277: } // y = -A*x |
278: else |
279: { |
280: for (i = iBegin; i < iEnd; i++) |
281: { |
282: tempx = 0.0; |
283: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
284: { |
285: tempx += A_data[jj] * x_data[A_j[jj]]; |
286: } |
287: y_data[i] = alpha*tempx; |
288: } |
289: } // y = alpha*A*x |
290: } // temp == 0 |
291: else if (-1 == temp) // beta == -alpha |
292: { |
293: if (1 == alpha) // JSP: a common path |
294: { |
295: for (i = iBegin; i < iEnd; i++) |
296: { |
297: tempx = -b_data[i]; |
298: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
299: { |
300: tempx += A_data[jj] * x_data[A_j[jj]]; |
301: } |
302: y_data[i] = tempx; |
303: } |
304: } // y = A*x - y |
305: else if (-1 == alpha) // JSP: a common path |
306: { |
307: for (i = iBegin; i < iEnd; i++) |
308: { |
309: tempx = b_data[i]; |
310: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
311: { |
312: tempx -= A_data[jj] * x_data[A_j[jj]]; |
313: } |
314: y_data[i] = tempx; |
315: } |
316: } // y = -A*x + y |
317: else |
318: { |
319: for (i = iBegin; i < iEnd; i++) |
320: { |
321: tempx = -b_data[i]; |
322: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
323: { |
324: tempx += A_data[jj] * x_data[A_j[jj]]; |
325: } |
326: y_data[i] = alpha*tempx; |
327: } |
328: } // y = alpha*(A*x - y) |
329: } // temp == -1 |
330: else if (1 == temp) |
331: { |
332: if (1 == alpha) // JSP: a common path |
333: { |
334: for (i = iBegin; i < iEnd; i++) |
335: { |
336: tempx = b_data[i]; |
337: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
338: { |
339: tempx += A_data[jj] * x_data[A_j[jj]]; |
340: } |
341: y_data[i] = tempx; |
342: } |
343: } // y = A*x + y |
344: else if (-1 == alpha) |
345: { |
346: for (i = iBegin; i < iEnd; i++) |
347: { |
348: tempx = -b_data[i]; |
349: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
350: { |
351: tempx -= A_data[jj] * x_data[A_j[jj]]; |
352: } |
353: y_data[i] = tempx; |
354: } |
355: } // y = -A*x - y |
356: else |
357: { |
358: for (i = iBegin; i < iEnd; i++) |
359: { |
360: tempx = b_data[i]; |
361: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
362: { |
363: tempx += A_data[jj] * x_data[A_j[jj]]; |
364: } |
365: y_data[i] = alpha*tempx; |
[...] |
371: if (1 == alpha) // JSP: a common path |
372: { |
373: for (i = iBegin; i < iEnd; i++) |
374: { |
375: tempx = b_data[i]*temp; |
376: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
377: { |
378: tempx += A_data[jj] * x_data[A_j[jj]]; |
379: } |
380: y_data[i] = tempx; |
381: } |
382: } // y = A*x + temp*y |
383: else if (-1 == alpha) |
384: { |
385: for (i = iBegin; i < iEnd; i++) |
386: { |
387: tempx = -b_data[i]*temp; |
388: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
389: { |
390: tempx -= A_data[jj] * x_data[A_j[jj]]; |
391: } |
392: y_data[i] = tempx; |
393: } |
394: } // y = -A*x - temp*y |
395: else |
396: { |
397: for (i = iBegin; i < iEnd; i++) |
398: { |
399: tempx = b_data[i]*temp; |
400: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
401: { |
402: tempx += A_data[jj] * x_data[A_j[jj]]; |
403: } |
404: y_data[i] = alpha*tempx; |
0x4ccec0 PUSH %RBP |
0x4ccec1 MOV %RSP,%RBP |
0x4ccec4 PUSH %R15 |
0x4ccec6 PUSH %R14 |
0x4ccec8 PUSH %R13 |
0x4cceca PUSH %R12 |
0x4ccecc PUSH %RBX |
0x4ccecd SUB $0x28,%RSP |
0x4cced1 MOV %R9,%R12 |
0x4cced4 MOV %R8,-0x48(%RBP) |
0x4cced8 MOV %RCX,%R15 |
0x4ccedb MOV %RDX,%R13 |
0x4ccede MOV %RCX,%RDI |
0x4ccee1 CALL 4cb940 <hypre_CSRMatrixGetLoadBalancedPartitionBegin> |
0x4ccee6 MOV %RAX,%R14 |
0x4ccee9 MOV %R15,%RDI |
0x4cceec CALL 4cb9c0 <hypre_CSRMatrixGetLoadBalancedPartitionEnd> |
0x4ccef1 MOV %RAX,%R15 |
0x4ccef4 CMP %RAX,%R14 |
0x4ccef7 JLE 4ccf27 |
0x4ccef9 MOV 0x24dd00(%RIP),%RDI |
0x4ccf00 MOV $0x4f4345,%ESI |
0x4ccf05 MOV $0x4f635b,%EDX |
0x4ccf0a XOR %EAX,%EAX |
0x4ccf0c CALL 4d53b0 <hypre_fprintf> |
0x4ccf11 MOV $0x4f6d01,%EDI |
0x4ccf16 MOV $0xf8,%ESI |
0x4ccf1b MOV $0x1,%EDX |
0x4ccf20 XOR %ECX,%ECX |
0x4ccf22 CALL 4d7ce0 <hypre_error_handler> |
0x4ccf27 MOV 0x18(%RBP),%RBX |
0x4ccf2b TEST %R14,%R14 |
0x4ccf2e JS 4ccf35 |
0x4ccf30 CMP %RBX,%R14 |
0x4ccf33 JLE 4ccf63 |
0x4ccf35 MOV 0x24dcc4(%RIP),%RDI |
0x4ccf3c MOV $0x4f4345,%ESI |
0x4ccf41 MOV $0x4f6d88,%EDX |
0x4ccf46 XOR %EAX,%EAX |
0x4ccf48 CALL 4d53b0 <hypre_fprintf> |
0x4ccf4d MOV $0x4f6d01,%EDI |
0x4ccf52 MOV $0xf9,%ESI |
0x4ccf57 MOV $0x1,%EDX |
0x4ccf5c XOR %ECX,%ECX |
0x4ccf5e CALL 4d7ce0 <hypre_error_handler> |
0x4ccf63 VMOVSD 0x38(%RBP),%XMM5 |
0x4ccf68 TEST %R15,%R15 |
0x4ccf6b JS 4ccf72 |
0x4ccf6d CMP %RBX,%R15 |
0x4ccf70 JLE 4ccfa5 |
0x4ccf72 MOV 0x24dc87(%RIP),%RDI |
0x4ccf79 MOV $0x4f4345,%ESI |
0x4ccf7e MOV $0x4f6daa,%EDX |
0x4ccf83 XOR %EAX,%EAX |
0x4ccf85 CALL 4d53b0 <hypre_fprintf> |
0x4ccf8a MOV $0x4f6d01,%EDI |
0x4ccf8f MOV $0xfa,%ESI |
0x4ccf94 MOV $0x1,%EDX |
0x4ccf99 XOR %ECX,%ECX |
0x4ccf9b CALL 4d7ce0 <hypre_error_handler> |
0x4ccfa0 VMOVSD 0x38(%RBP),%XMM5 |
0x4ccfa5 MOV 0x30(%RBP),%RSI |
0x4ccfa9 VMOVQ %R13,%XMM0 |
0x4ccfae VXORPD %XMM1,%XMM1,%XMM1 |
0x4ccfb2 VUCOMISD %XMM1,%XMM5 |
0x4ccfb6 MOV %R14,-0x40(%RBP) |
0x4ccfba JNE 4cd0dd |
0x4ccfc0 VUCOMISD 0x14ea8(%RIP),%XMM0 |
0x4ccfc8 JNE 4cd21e |
0x4ccfce CMP %R15,%R14 |
0x4ccfd1 JGE 4cdd7e |
0x4ccfd7 MOV (%R12),%RDX |
0x4ccfdb MOV (%RSI),%RBX |
0x4ccfde MOV %R14,%RAX |
0x4ccfe1 NOT %RAX |
0x4ccfe4 ADD %RAX,%R15 |
0x4ccfe7 XOR %EDI,%EDI |
0x4ccfe9 MOV %R15,-0x38(%RBP) |
0x4ccfed MOV %RBX,-0x30(%RBP) |
0x4ccff1 JMP 4cd016 |
0x4ccff3 NOPW %CS:(%RAX,%RAX,1) |
(4052) 0x4cd000 VMOVSD %XMM0,(%RBX,%R8,8) |
(4052) 0x4cd006 LEA 0x1(%RDI),%RAX |
(4052) 0x4cd00a CMP %R15,%RDI |
(4052) 0x4cd00d MOV %RAX,%RDI |
(4052) 0x4cd010 JE 4cdd7e |
(4052) 0x4cd016 LEA (%R14,%RDI,1),%R8 |
(4052) 0x4cd01a MOV (%RDX,%R8,8),%RAX |
(4052) 0x4cd01e MOV 0x8(%RDX,%R8,8),%R9 |
(4052) 0x4cd023 VXORPD %XMM0,%XMM0,%XMM0 |
(4052) 0x4cd027 MOV %R9,%RCX |
(4052) 0x4cd02a SUB %RAX,%RCX |
(4052) 0x4cd02d JLE 4cd000 |
(4052) 0x4cd02f MOV -0x48(%RBP),%RSI |
(4052) 0x4cd033 MOV (%RSI),%R10 |
(4052) 0x4cd036 MOV 0x20(%RBP),%RSI |
(4052) 0x4cd03a MOV (%RSI),%R11 |
(4052) 0x4cd03d MOV 0x10(%RBP),%RSI |
(4052) 0x4cd041 MOV (%RSI),%R12 |
(4052) 0x4cd044 MOV %RCX,%R13 |
(4052) 0x4cd047 AND $-0x4,%R13 |
(4052) 0x4cd04b JE 4cd0ae |
(4052) 0x4cd04d LEA -0x1(%R13),%RBX |
(4052) 0x4cd051 LEA (%R10,%RAX,8),%R14 |
(4052) 0x4cd055 LEA (%R12,%RAX,8),%R15 |
(4052) 0x4cd059 VXORPD %XMM0,%XMM0,%XMM0 |
(4052) 0x4cd05d XOR %ESI,%ESI |
(4052) 0x4cd05f NOP |
(4054) 0x4cd060 VMOVUPD (%R15,%RSI,8),%YMM1 |
(4054) 0x4cd066 KXNORW %K0,%K0,%K1 |
(4054) 0x4cd06a VXORPD %XMM2,%XMM2,%XMM2 |
(4054) 0x4cd06e VGATHERQPD (%R11,%YMM1,8),%YMM2{%K1} |
(4054) 0x4cd075 VFMADD231PD (%R14,%RSI,8),%YMM2,%YMM0 |
(4054) 0x4cd07b ADD $0x4,%RSI |
(4054) 0x4cd07f CMP %RBX,%RSI |
(4054) 0x4cd082 JBE 4cd060 |
(4052) 0x4cd084 VEXTRACTF128 $0x1,%YMM0,%XMM1 |
(4052) 0x4cd08a VADDPD %XMM1,%XMM0,%XMM0 |
(4052) 0x4cd08e VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(4052) 0x4cd093 VADDSD %XMM1,%XMM0,%XMM0 |
(4052) 0x4cd097 CMP %R13,%RCX |
(4052) 0x4cd09a MOV -0x40(%RBP),%R14 |
(4052) 0x4cd09e MOV -0x38(%RBP),%R15 |
(4052) 0x4cd0a2 MOV -0x30(%RBP),%RBX |
(4052) 0x4cd0a6 JE 4cd000 |
(4052) 0x4cd0ac JMP 4cd0b1 |
(4052) 0x4cd0ae XOR %R13D,%R13D |
(4052) 0x4cd0b1 ADD %RAX,%R13 |
(4052) 0x4cd0b4 NOPW %CS:(%RAX,%RAX,1) |
(4053) 0x4cd0c0 MOV (%R12,%R13,8),%RAX |
(4053) 0x4cd0c4 VMOVSD (%R11,%RAX,8),%XMM1 |
(4053) 0x4cd0ca VFMADD231SD (%R10,%R13,8),%XMM1,%XMM0 |
(4053) 0x4cd0d0 INC %R13 |
(4053) 0x4cd0d3 CMP %R13,%R9 |
(4053) 0x4cd0d6 JNE 4cd0c0 |
(4052) 0x4cd0d8 JMP 4cd000 |
0x4cd0dd MOV 0x28(%RBP),%RBX |
0x4cd0e1 VUCOMISD 0x15c87(%RIP),%XMM5 |
0x4cd0e9 JNE 4cd33d |
0x4cd0ef VUCOMISD 0x14d79(%RIP),%XMM0 |
0x4cd0f7 JNE 4cd46e |
0x4cd0fd CMP %R15,%R14 |
0x4cd100 JGE 4cdd7e |
0x4cd106 MOV (%R12),%RDI |
0x4cd10a MOV (%RSI),%RSI |
0x4cd10d MOV %R14,%RAX |
0x4cd110 NOT %RAX |
0x4cd113 ADD %RAX,%R15 |
0x4cd116 XOR %R8D,%R8D |
0x4cd119 VMOVDDUP 0x159ff(%RIP),%XMM0 |
0x4cd121 MOV %R15,-0x38(%RBP) |
0x4cd125 MOV %RSI,-0x30(%RBP) |
0x4cd129 JMP 4cd146 |
0x4cd12b NOPL (%RAX,%RAX,1) |
(4043) 0x4cd130 VMOVSD %XMM1,(%RSI,%R9,8) |
(4043) 0x4cd136 LEA 0x1(%R8),%RAX |
(4043) 0x4cd13a CMP %R15,%R8 |
(4043) 0x4cd13d MOV %RAX,%R8 |
(4043) 0x4cd140 JE 4cdd7e |
(4043) 0x4cd146 LEA (%R14,%R8,1),%R9 |
(4043) 0x4cd14a VMOVSD (%RBX,%R9,8),%XMM1 |
(4043) 0x4cd150 VXORPD %XMM0,%XMM1,%XMM1 |
(4043) 0x4cd154 MOV (%RDI,%R9,8),%RAX |
(4043) 0x4cd158 MOV 0x8(%RDI,%R9,8),%R10 |
(4043) 0x4cd15d MOV %R10,%RCX |
(4043) 0x4cd160 SUB %RAX,%RCX |
(4043) 0x4cd163 JLE 4cd130 |
(4043) 0x4cd165 MOV -0x48(%RBP),%RDX |
(4043) 0x4cd169 MOV (%RDX),%R11 |
(4043) 0x4cd16c MOV 0x20(%RBP),%RDX |
(4043) 0x4cd170 MOV (%RDX),%R12 |
(4043) 0x4cd173 MOV 0x10(%RBP),%RDX |
(4043) 0x4cd177 MOV (%RDX),%R13 |
(4043) 0x4cd17a MOV %RCX,%RDX |
(4043) 0x4cd17d AND $-0x4,%RDX |
(4043) 0x4cd181 JE 4cd1f6 |
(4043) 0x4cd183 LEA -0x1(%RDX),%RBX |
(4043) 0x4cd187 LEA (%R11,%RAX,8),%R14 |
(4043) 0x4cd18b LEA (%R13,%RAX,8),%R15 |
(4043) 0x4cd190 VXORPD %XMM2,%XMM2,%XMM2 |
(4043) 0x4cd194 XOR %ESI,%ESI |
(4043) 0x4cd196 NOPW %CS:(%RAX,%RAX,1) |
(4045) 0x4cd1a0 VMOVUPD (%R15,%RSI,8),%YMM3 |
(4045) 0x4cd1a6 KXNORW %K0,%K0,%K1 |
(4045) 0x4cd1aa VXORPD %XMM4,%XMM4,%XMM4 |
(4045) 0x4cd1ae VGATHERQPD (%R12,%YMM3,8),%YMM4{%K1} |
(4045) 0x4cd1b5 VFMADD231PD (%R14,%RSI,8),%YMM4,%YMM2 |
(4045) 0x4cd1bb ADD $0x4,%RSI |
(4045) 0x4cd1bf CMP %RBX,%RSI |
(4045) 0x4cd1c2 JBE 4cd1a0 |
(4043) 0x4cd1c4 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(4043) 0x4cd1ca VADDPD %XMM3,%XMM2,%XMM2 |
(4043) 0x4cd1ce VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(4043) 0x4cd1d3 VADDSD %XMM3,%XMM2,%XMM2 |
(4043) 0x4cd1d7 VADDSD %XMM2,%XMM1,%XMM1 |
(4043) 0x4cd1db CMP %RDX,%RCX |
(4043) 0x4cd1de MOV -0x40(%RBP),%R14 |
(4043) 0x4cd1e2 MOV -0x38(%RBP),%R15 |
(4043) 0x4cd1e6 MOV 0x28(%RBP),%RBX |
(4043) 0x4cd1ea MOV -0x30(%RBP),%RSI |
(4043) 0x4cd1ee JE 4cd130 |
(4043) 0x4cd1f4 JMP 4cd1f8 |
(4043) 0x4cd1f6 XOR %EDX,%EDX |
(4043) 0x4cd1f8 ADD %RAX,%RDX |
(4043) 0x4cd1fb NOPL (%RAX,%RAX,1) |
(4044) 0x4cd200 MOV (%R13,%RDX,8),%RAX |
(4044) 0x4cd205 VMOVSD (%R12,%RAX,8),%XMM2 |
(4044) 0x4cd20b VFMADD231SD (%R11,%RDX,8),%XMM2,%XMM1 |
(4044) 0x4cd211 INC %RDX |
(4044) 0x4cd214 CMP %RDX,%R10 |
(4044) 0x4cd217 JNE 4cd200 |
(4043) 0x4cd219 JMP 4cd130 |
0x4cd21e VUCOMISD 0x15b4a(%RIP),%XMM0 |
0x4cd226 JNE 4cd59e |
0x4cd22c CMP %R15,%R14 |
0x4cd22f JGE 4cdd7e |
0x4cd235 MOV (%R12),%RDX |
0x4cd239 MOV (%RSI),%RBX |
0x4cd23c MOV %R14,%RAX |
0x4cd23f NOT %RAX |
0x4cd242 ADD %RAX,%R15 |
0x4cd245 XOR %EDI,%EDI |
0x4cd247 MOV %R15,-0x38(%RBP) |
0x4cd24b MOV %RBX,-0x30(%RBP) |
0x4cd24f JMP 4cd276 |
0x4cd251 NOPW %CS:(%RAX,%RAX,1) |
(4049) 0x4cd260 VMOVSD %XMM0,(%RBX,%R8,8) |
(4049) 0x4cd266 LEA 0x1(%RDI),%RAX |
(4049) 0x4cd26a CMP %R15,%RDI |
(4049) 0x4cd26d MOV %RAX,%RDI |
(4049) 0x4cd270 JE 4cdd7e |
(4049) 0x4cd276 LEA (%R14,%RDI,1),%R8 |
(4049) 0x4cd27a MOV (%RDX,%R8,8),%RAX |
(4049) 0x4cd27e MOV 0x8(%RDX,%R8,8),%R9 |
(4049) 0x4cd283 VXORPD %XMM0,%XMM0,%XMM0 |
(4049) 0x4cd287 MOV %R9,%RCX |
(4049) 0x4cd28a SUB %RAX,%RCX |
(4049) 0x4cd28d JLE 4cd260 |
(4049) 0x4cd28f MOV -0x48(%RBP),%RSI |
(4049) 0x4cd293 MOV (%RSI),%R10 |
(4049) 0x4cd296 MOV 0x20(%RBP),%RSI |
(4049) 0x4cd29a MOV (%RSI),%R11 |
(4049) 0x4cd29d MOV 0x10(%RBP),%RSI |
(4049) 0x4cd2a1 MOV (%RSI),%R12 |
(4049) 0x4cd2a4 MOV %RCX,%R13 |
(4049) 0x4cd2a7 AND $-0x4,%R13 |
(4049) 0x4cd2ab JE 4cd30e |
(4049) 0x4cd2ad LEA -0x1(%R13),%RBX |
(4049) 0x4cd2b1 LEA (%R10,%RAX,8),%R14 |
(4049) 0x4cd2b5 LEA (%R12,%RAX,8),%R15 |
(4049) 0x4cd2b9 VXORPD %XMM0,%XMM0,%XMM0 |
(4049) 0x4cd2bd XOR %ESI,%ESI |
(4049) 0x4cd2bf NOP |
(4051) 0x4cd2c0 VMOVUPD (%R15,%RSI,8),%YMM1 |
(4051) 0x4cd2c6 KXNORW %K0,%K0,%K1 |
(4051) 0x4cd2ca VXORPD %XMM2,%XMM2,%XMM2 |
(4051) 0x4cd2ce VGATHERQPD (%R11,%YMM1,8),%YMM2{%K1} |
(4051) 0x4cd2d5 VFNMADD231PD (%R14,%RSI,8),%YMM2,%YMM0 |
(4051) 0x4cd2db ADD $0x4,%RSI |
(4051) 0x4cd2df CMP %RBX,%RSI |
(4051) 0x4cd2e2 JBE 4cd2c0 |
(4049) 0x4cd2e4 VEXTRACTF128 $0x1,%YMM0,%XMM1 |
(4049) 0x4cd2ea VADDPD %XMM1,%XMM0,%XMM0 |
(4049) 0x4cd2ee VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(4049) 0x4cd2f3 VADDSD %XMM1,%XMM0,%XMM0 |
(4049) 0x4cd2f7 CMP %R13,%RCX |
(4049) 0x4cd2fa MOV -0x40(%RBP),%R14 |
(4049) 0x4cd2fe MOV -0x38(%RBP),%R15 |
(4049) 0x4cd302 MOV -0x30(%RBP),%RBX |
(4049) 0x4cd306 JE 4cd260 |
(4049) 0x4cd30c JMP 4cd311 |
(4049) 0x4cd30e XOR %R13D,%R13D |
(4049) 0x4cd311 ADD %RAX,%R13 |
(4049) 0x4cd314 NOPW %CS:(%RAX,%RAX,1) |
(4050) 0x4cd320 MOV (%R12,%R13,8),%RAX |
(4050) 0x4cd324 VMOVSD (%R11,%RAX,8),%XMM1 |
(4050) 0x4cd32a VFNMADD231SD (%R10,%R13,8),%XMM1,%XMM0 |
(4050) 0x4cd330 INC %R13 |
(4050) 0x4cd333 CMP %R13,%R9 |
(4050) 0x4cd336 JNE 4cd320 |
(4049) 0x4cd338 JMP 4cd260 |
0x4cd33d VUCOMISD 0x14b2b(%RIP),%XMM5 |
0x4cd345 JNE 4cd6bd |
0x4cd34b VUCOMISD 0x14b1d(%RIP),%XMM0 |
0x4cd353 JNE 4cd7ee |
0x4cd359 CMP %R15,%R14 |
0x4cd35c JGE 4cdd7e |
0x4cd362 MOV (%R12),%RDI |
0x4cd366 MOV (%RSI),%RSI |
0x4cd369 MOV %R14,%RAX |
0x4cd36c NOT %RAX |
0x4cd36f ADD %RAX,%R15 |
0x4cd372 XOR %R8D,%R8D |
0x4cd375 MOV %R15,-0x38(%RBP) |
0x4cd379 MOV %RSI,-0x30(%RBP) |
0x4cd37d JMP 4cd396 |
0x4cd37f NOP |
(4034) 0x4cd380 VMOVSD %XMM0,(%RSI,%R9,8) |
(4034) 0x4cd386 LEA 0x1(%R8),%RAX |
(4034) 0x4cd38a CMP %R15,%R8 |
(4034) 0x4cd38d MOV %RAX,%R8 |
(4034) 0x4cd390 JE 4cdd7e |
(4034) 0x4cd396 LEA (%R14,%R8,1),%R9 |
(4034) 0x4cd39a VMOVSD (%RBX,%R9,8),%XMM0 |
(4034) 0x4cd3a0 MOV (%RDI,%R9,8),%RAX |
(4034) 0x4cd3a4 MOV 0x8(%RDI,%R9,8),%R10 |
(4034) 0x4cd3a9 MOV %R10,%RCX |
(4034) 0x4cd3ac SUB %RAX,%RCX |
(4034) 0x4cd3af JLE 4cd380 |
(4034) 0x4cd3b1 MOV -0x48(%RBP),%RDX |
(4034) 0x4cd3b5 MOV (%RDX),%R11 |
(4034) 0x4cd3b8 MOV 0x20(%RBP),%RDX |
(4034) 0x4cd3bc MOV (%RDX),%R12 |
(4034) 0x4cd3bf MOV 0x10(%RBP),%RDX |
(4034) 0x4cd3c3 MOV (%RDX),%R13 |
(4034) 0x4cd3c6 MOV %RCX,%RDX |
(4034) 0x4cd3c9 AND $-0x4,%RDX |
(4034) 0x4cd3cd JE 4cd446 |
(4034) 0x4cd3cf LEA -0x1(%RDX),%RBX |
(4034) 0x4cd3d3 LEA (%R11,%RAX,8),%RSI |
(4034) 0x4cd3d7 LEA (%R13,%RAX,8),%R14 |
(4034) 0x4cd3dc VXORPD %XMM1,%XMM1,%XMM1 |
(4034) 0x4cd3e0 XOR %R15D,%R15D |
(4034) 0x4cd3e3 NOPW %CS:(%RAX,%RAX,1) |
(4036) 0x4cd3f0 VMOVUPD (%R14,%R15,8),%YMM2 |
(4036) 0x4cd3f6 KXNORW %K0,%K0,%K1 |
(4036) 0x4cd3fa VXORPD %XMM3,%XMM3,%XMM3 |
(4036) 0x4cd3fe VGATHERQPD (%R12,%YMM2,8),%YMM3{%K1} |
(4036) 0x4cd405 VFMADD231PD (%RSI,%R15,8),%YMM3,%YMM1 |
(4036) 0x4cd40b ADD $0x4,%R15 |
(4036) 0x4cd40f CMP %RBX,%R15 |
(4036) 0x4cd412 JBE 4cd3f0 |
(4034) 0x4cd414 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(4034) 0x4cd41a VADDPD %XMM2,%XMM1,%XMM1 |
(4034) 0x4cd41e VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(4034) 0x4cd423 VADDSD %XMM2,%XMM1,%XMM1 |
(4034) 0x4cd427 VADDSD %XMM1,%XMM0,%XMM0 |
(4034) 0x4cd42b CMP %RDX,%RCX |
(4034) 0x4cd42e MOV -0x40(%RBP),%R14 |
(4034) 0x4cd432 MOV -0x38(%RBP),%R15 |
(4034) 0x4cd436 MOV 0x28(%RBP),%RBX |
(4034) 0x4cd43a MOV -0x30(%RBP),%RSI |
(4034) 0x4cd43e JE 4cd380 |
(4034) 0x4cd444 JMP 4cd448 |
(4034) 0x4cd446 XOR %EDX,%EDX |
(4034) 0x4cd448 ADD %RAX,%RDX |
(4034) 0x4cd44b NOPL (%RAX,%RAX,1) |
(4035) 0x4cd450 MOV (%R13,%RDX,8),%RAX |
(4035) 0x4cd455 VMOVSD (%R12,%RAX,8),%XMM1 |
(4035) 0x4cd45b VFMADD231SD (%R11,%RDX,8),%XMM1,%XMM0 |
(4035) 0x4cd461 INC %RDX |
(4035) 0x4cd464 CMP %RDX,%R10 |
(4035) 0x4cd467 JNE 4cd450 |
(4034) 0x4cd469 JMP 4cd380 |
0x4cd46e VUCOMISD 0x158fa(%RIP),%XMM0 |
0x4cd476 JNE 4cd91e |
0x4cd47c CMP %R15,%R14 |
0x4cd47f JGE 4cdd7e |
0x4cd485 MOV (%R12),%RDI |
0x4cd489 MOV (%RSI),%RSI |
0x4cd48c MOV %R14,%RAX |
0x4cd48f NOT %RAX |
0x4cd492 ADD %RAX,%R15 |
0x4cd495 XOR %R8D,%R8D |
0x4cd498 MOV %R15,-0x38(%RBP) |
0x4cd49c MOV %RSI,-0x30(%RBP) |
0x4cd4a0 JMP 4cd4c6 |
0x4cd4a2 NOPW %CS:(%RAX,%RAX,1) |
(4040) 0x4cd4b0 VMOVSD %XMM0,(%RSI,%R9,8) |
(4040) 0x4cd4b6 LEA 0x1(%R8),%RAX |
(4040) 0x4cd4ba CMP %R15,%R8 |
(4040) 0x4cd4bd MOV %RAX,%R8 |
(4040) 0x4cd4c0 JE 4cdd7e |
(4040) 0x4cd4c6 LEA (%R14,%R8,1),%R9 |
(4040) 0x4cd4ca VMOVSD (%RBX,%R9,8),%XMM0 |
(4040) 0x4cd4d0 MOV (%RDI,%R9,8),%RAX |
(4040) 0x4cd4d4 MOV 0x8(%RDI,%R9,8),%R10 |
(4040) 0x4cd4d9 MOV %R10,%RCX |
(4040) 0x4cd4dc SUB %RAX,%RCX |
(4040) 0x4cd4df JLE 4cd4b0 |
(4040) 0x4cd4e1 MOV -0x48(%RBP),%RDX |
(4040) 0x4cd4e5 MOV (%RDX),%R11 |
(4040) 0x4cd4e8 MOV 0x20(%RBP),%RDX |
(4040) 0x4cd4ec MOV (%RDX),%R12 |
(4040) 0x4cd4ef MOV 0x10(%RBP),%RDX |
(4040) 0x4cd4f3 MOV (%RDX),%R13 |
(4040) 0x4cd4f6 MOV %RCX,%RDX |
(4040) 0x4cd4f9 AND $-0x4,%RDX |
(4040) 0x4cd4fd JE 4cd576 |
(4040) 0x4cd4ff LEA -0x1(%RDX),%RBX |
(4040) 0x4cd503 LEA (%R11,%RAX,8),%RSI |
(4040) 0x4cd507 LEA (%R13,%RAX,8),%R14 |
(4040) 0x4cd50c VXORPD %XMM1,%XMM1,%XMM1 |
(4040) 0x4cd510 XOR %R15D,%R15D |
(4040) 0x4cd513 NOPW %CS:(%RAX,%RAX,1) |
(4042) 0x4cd520 VMOVUPD (%R14,%R15,8),%YMM2 |
(4042) 0x4cd526 KXNORW %K0,%K0,%K1 |
(4042) 0x4cd52a VXORPD %XMM3,%XMM3,%XMM3 |
(4042) 0x4cd52e VGATHERQPD (%R12,%YMM2,8),%YMM3{%K1} |
(4042) 0x4cd535 VFNMADD231PD (%RSI,%R15,8),%YMM3,%YMM1 |
(4042) 0x4cd53b ADD $0x4,%R15 |
(4042) 0x4cd53f CMP %RBX,%R15 |
(4042) 0x4cd542 JBE 4cd520 |
(4040) 0x4cd544 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(4040) 0x4cd54a VADDPD %XMM2,%XMM1,%XMM1 |
(4040) 0x4cd54e VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(4040) 0x4cd553 VADDSD %XMM2,%XMM1,%XMM1 |
(4040) 0x4cd557 VADDSD %XMM1,%XMM0,%XMM0 |
(4040) 0x4cd55b CMP %RDX,%RCX |
(4040) 0x4cd55e MOV -0x40(%RBP),%R14 |
(4040) 0x4cd562 MOV -0x38(%RBP),%R15 |
(4040) 0x4cd566 MOV 0x28(%RBP),%RBX |
(4040) 0x4cd56a MOV -0x30(%RBP),%RSI |
(4040) 0x4cd56e JE 4cd4b0 |
(4040) 0x4cd574 JMP 4cd578 |
(4040) 0x4cd576 XOR %EDX,%EDX |
(4040) 0x4cd578 ADD %RAX,%RDX |
(4040) 0x4cd57b NOPL (%RAX,%RAX,1) |
(4041) 0x4cd580 MOV (%R13,%RDX,8),%RAX |
(4041) 0x4cd585 VMOVSD (%R12,%RAX,8),%XMM1 |
(4041) 0x4cd58b VFNMADD231SD (%R11,%RDX,8),%XMM1,%XMM0 |
(4041) 0x4cd591 INC %RDX |
(4041) 0x4cd594 CMP %RDX,%R10 |
(4041) 0x4cd597 JNE 4cd580 |
(4040) 0x4cd599 JMP 4cd4b0 |
0x4cd59e CMP %R15,%R14 |
0x4cd5a1 JGE 4cdd7e |
0x4cd5a7 MOV (%R12),%RDX |
0x4cd5ab MOV (%RSI),%RBX |
0x4cd5ae MOV %R14,%RAX |
0x4cd5b1 NOT %RAX |
0x4cd5b4 ADD %RAX,%R15 |
0x4cd5b7 XOR %EDI,%EDI |
0x4cd5b9 MOV %R15,-0x38(%RBP) |
0x4cd5bd MOV %RBX,-0x30(%RBP) |
0x4cd5c1 JMP 4cd5ea |
0x4cd5c3 NOPW %CS:(%RAX,%RAX,1) |
(4046) 0x4cd5d0 VMULSD %XMM0,%XMM1,%XMM1 |
(4046) 0x4cd5d4 VMOVSD %XMM1,(%RBX,%R8,8) |
(4046) 0x4cd5da LEA 0x1(%RDI),%RAX |
(4046) 0x4cd5de CMP %R15,%RDI |
(4046) 0x4cd5e1 MOV %RAX,%RDI |
(4046) 0x4cd5e4 JE 4cdd7e |
(4046) 0x4cd5ea LEA (%R14,%RDI,1),%R8 |
(4046) 0x4cd5ee MOV (%RDX,%R8,8),%RAX |
(4046) 0x4cd5f2 MOV 0x8(%RDX,%R8,8),%R9 |
(4046) 0x4cd5f7 VXORPD %XMM1,%XMM1,%XMM1 |
(4046) 0x4cd5fb MOV %R9,%RCX |
(4046) 0x4cd5fe SUB %RAX,%RCX |
(4046) 0x4cd601 JLE 4cd5d0 |
(4046) 0x4cd603 MOV -0x48(%RBP),%RSI |
(4046) 0x4cd607 MOV (%RSI),%R10 |
(4046) 0x4cd60a MOV 0x20(%RBP),%RSI |
(4046) 0x4cd60e MOV (%RSI),%R11 |
(4046) 0x4cd611 MOV 0x10(%RBP),%RSI |
(4046) 0x4cd615 MOV (%RSI),%R12 |
(4046) 0x4cd618 MOV %RCX,%R13 |
(4046) 0x4cd61b AND $-0x4,%R13 |
(4046) 0x4cd61f JE 4cd68e |
(4046) 0x4cd621 LEA -0x1(%R13),%RBX |
(4046) 0x4cd625 LEA (%R10,%RAX,8),%R14 |
(4046) 0x4cd629 LEA (%R12,%RAX,8),%R15 |
(4046) 0x4cd62d VXORPD %XMM1,%XMM1,%XMM1 |
(4046) 0x4cd631 XOR %ESI,%ESI |
(4046) 0x4cd633 NOPW %CS:(%RAX,%RAX,1) |
(4048) 0x4cd640 VMOVUPD (%R15,%RSI,8),%YMM2 |
(4048) 0x4cd646 VXORPD %XMM3,%XMM3,%XMM3 |
(4048) 0x4cd64a KXNORW %K0,%K0,%K1 |
(4048) 0x4cd64e VGATHERQPD (%R11,%YMM2,8),%YMM3{%K1} |
(4048) 0x4cd655 VFMADD231PD (%R14,%RSI,8),%YMM3,%YMM1 |
(4048) 0x4cd65b ADD $0x4,%RSI |
(4048) 0x4cd65f CMP %RBX,%RSI |
(4048) 0x4cd662 JBE 4cd640 |
(4046) 0x4cd664 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(4046) 0x4cd66a VADDPD %XMM2,%XMM1,%XMM1 |
(4046) 0x4cd66e VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(4046) 0x4cd673 VADDSD %XMM2,%XMM1,%XMM1 |
(4046) 0x4cd677 CMP %R13,%RCX |
(4046) 0x4cd67a MOV -0x40(%RBP),%R14 |
(4046) 0x4cd67e MOV -0x38(%RBP),%R15 |
(4046) 0x4cd682 MOV -0x30(%RBP),%RBX |
(4046) 0x4cd686 JE 4cd5d0 |
(4046) 0x4cd68c JMP 4cd691 |
(4046) 0x4cd68e XOR %R13D,%R13D |
(4046) 0x4cd691 ADD %RAX,%R13 |
(4046) 0x4cd694 NOPW %CS:(%RAX,%RAX,1) |
(4047) 0x4cd6a0 MOV (%R12,%R13,8),%RAX |
(4047) 0x4cd6a4 VMOVSD (%R11,%RAX,8),%XMM2 |
(4047) 0x4cd6aa VFMADD231SD (%R10,%R13,8),%XMM2,%XMM1 |
(4047) 0x4cd6b0 INC %R13 |
(4047) 0x4cd6b3 CMP %R13,%R9 |
(4047) 0x4cd6b6 JNE 4cd6a0 |
(4046) 0x4cd6b8 JMP 4cd5d0 |
0x4cd6bd VUCOMISD 0x147ab(%RIP),%XMM0 |
0x4cd6c5 JNE 4cda3e |
0x4cd6cb CMP %R15,%R14 |
0x4cd6ce JGE 4cdd7e |
0x4cd6d4 MOV (%R12),%RDI |
0x4cd6d8 MOV (%RSI),%RSI |
0x4cd6db MOV %R14,%RAX |
0x4cd6de NOT %RAX |
0x4cd6e1 ADD %RAX,%R15 |
0x4cd6e4 XOR %R8D,%R8D |
0x4cd6e7 MOV %R15,-0x38(%RBP) |
0x4cd6eb MOV %RSI,-0x30(%RBP) |
0x4cd6ef JMP 4cd716 |
0x4cd6f1 NOPW %CS:(%RAX,%RAX,1) |
(4025) 0x4cd700 VMOVSD %XMM0,(%RSI,%R9,8) |
(4025) 0x4cd706 LEA 0x1(%R8),%RAX |
(4025) 0x4cd70a CMP %R15,%R8 |
(4025) 0x4cd70d MOV %RAX,%R8 |
(4025) 0x4cd710 JE 4cdd7e |
(4025) 0x4cd716 LEA (%R14,%R8,1),%R9 |
(4025) 0x4cd71a VMULSD (%RBX,%R9,8),%XMM5,%XMM0 |
(4025) 0x4cd720 MOV (%RDI,%R9,8),%RAX |
(4025) 0x4cd724 MOV 0x8(%RDI,%R9,8),%R10 |
(4025) 0x4cd729 MOV %R10,%RCX |
(4025) 0x4cd72c SUB %RAX,%RCX |
(4025) 0x4cd72f JLE 4cd700 |
(4025) 0x4cd731 MOV -0x48(%RBP),%RDX |
(4025) 0x4cd735 MOV (%RDX),%R11 |
(4025) 0x4cd738 MOV 0x20(%RBP),%RDX |
(4025) 0x4cd73c MOV (%RDX),%R12 |
(4025) 0x4cd73f MOV 0x10(%RBP),%RDX |
(4025) 0x4cd743 MOV (%RDX),%R13 |
(4025) 0x4cd746 MOV %RCX,%RDX |
(4025) 0x4cd749 AND $-0x4,%RDX |
(4025) 0x4cd74d JE 4cd7c6 |
(4025) 0x4cd74f LEA -0x1(%RDX),%RBX |
(4025) 0x4cd753 LEA (%R11,%RAX,8),%RSI |
(4025) 0x4cd757 LEA (%R13,%RAX,8),%R14 |
(4025) 0x4cd75c VXORPD %XMM1,%XMM1,%XMM1 |
(4025) 0x4cd760 XOR %R15D,%R15D |
(4025) 0x4cd763 NOPW %CS:(%RAX,%RAX,1) |
(4027) 0x4cd770 VMOVUPD (%R14,%R15,8),%YMM2 |
(4027) 0x4cd776 VXORPD %XMM3,%XMM3,%XMM3 |
(4027) 0x4cd77a KXNORW %K0,%K0,%K1 |
(4027) 0x4cd77e VGATHERQPD (%R12,%YMM2,8),%YMM3{%K1} |
(4027) 0x4cd785 VFMADD231PD (%RSI,%R15,8),%YMM3,%YMM1 |
(4027) 0x4cd78b ADD $0x4,%R15 |
(4027) 0x4cd78f CMP %RBX,%R15 |
(4027) 0x4cd792 JBE 4cd770 |
(4025) 0x4cd794 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(4025) 0x4cd79a VADDPD %XMM2,%XMM1,%XMM1 |
(4025) 0x4cd79e VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(4025) 0x4cd7a3 VADDSD %XMM2,%XMM1,%XMM1 |
(4025) 0x4cd7a7 VADDSD %XMM1,%XMM0,%XMM0 |
(4025) 0x4cd7ab CMP %RDX,%RCX |
(4025) 0x4cd7ae MOV -0x40(%RBP),%R14 |
(4025) 0x4cd7b2 MOV -0x38(%RBP),%R15 |
(4025) 0x4cd7b6 MOV 0x28(%RBP),%RBX |
(4025) 0x4cd7ba MOV -0x30(%RBP),%RSI |
(4025) 0x4cd7be JE 4cd700 |
(4025) 0x4cd7c4 JMP 4cd7c8 |
(4025) 0x4cd7c6 XOR %EDX,%EDX |
(4025) 0x4cd7c8 ADD %RAX,%RDX |
(4025) 0x4cd7cb NOPL (%RAX,%RAX,1) |
(4026) 0x4cd7d0 MOV (%R13,%RDX,8),%RAX |
(4026) 0x4cd7d5 VMOVSD (%R12,%RAX,8),%XMM1 |
(4026) 0x4cd7db VFMADD231SD (%R11,%RDX,8),%XMM1,%XMM0 |
(4026) 0x4cd7e1 INC %RDX |
(4026) 0x4cd7e4 CMP %RDX,%R10 |
(4026) 0x4cd7e7 JNE 4cd7d0 |
(4025) 0x4cd7e9 JMP 4cd700 |
0x4cd7ee VUCOMISD 0x1557a(%RIP),%XMM0 |
0x4cd7f6 JNE 4cdb5e |
0x4cd7fc CMP %R15,%R14 |
0x4cd7ff JGE 4cdd7e |
0x4cd805 MOV (%R12),%RDI |
0x4cd809 MOV (%RSI),%RSI |
0x4cd80c MOV %R14,%RAX |
0x4cd80f NOT %RAX |
0x4cd812 ADD %RAX,%R15 |
0x4cd815 XOR %R8D,%R8D |
0x4cd818 VMOVDDUP 0x15300(%RIP),%XMM0 |
0x4cd820 MOV %R15,-0x38(%RBP) |
0x4cd824 MOV %RSI,-0x30(%RBP) |
0x4cd828 JMP 4cd846 |
0x4cd82a NOPW (%RAX,%RAX,1) |
(4031) 0x4cd830 VMOVSD %XMM1,(%RSI,%R9,8) |
(4031) 0x4cd836 LEA 0x1(%R8),%RAX |
(4031) 0x4cd83a CMP %R15,%R8 |
(4031) 0x4cd83d MOV %RAX,%R8 |
(4031) 0x4cd840 JE 4cdd7e |
(4031) 0x4cd846 LEA (%R14,%R8,1),%R9 |
(4031) 0x4cd84a VMOVSD (%RBX,%R9,8),%XMM1 |
(4031) 0x4cd850 VXORPD %XMM0,%XMM1,%XMM1 |
(4031) 0x4cd854 MOV (%RDI,%R9,8),%RAX |
(4031) 0x4cd858 MOV 0x8(%RDI,%R9,8),%R10 |
(4031) 0x4cd85d MOV %R10,%RCX |
(4031) 0x4cd860 SUB %RAX,%RCX |
(4031) 0x4cd863 JLE 4cd830 |
(4031) 0x4cd865 MOV -0x48(%RBP),%RDX |
(4031) 0x4cd869 MOV (%RDX),%R11 |
(4031) 0x4cd86c MOV 0x20(%RBP),%RDX |
(4031) 0x4cd870 MOV (%RDX),%R12 |
(4031) 0x4cd873 MOV 0x10(%RBP),%RDX |
(4031) 0x4cd877 MOV (%RDX),%R13 |
(4031) 0x4cd87a MOV %RCX,%RDX |
(4031) 0x4cd87d AND $-0x4,%RDX |
(4031) 0x4cd881 JE 4cd8f6 |
(4031) 0x4cd883 LEA -0x1(%RDX),%RBX |
(4031) 0x4cd887 LEA (%R11,%RAX,8),%RSI |
(4031) 0x4cd88b LEA (%R13,%RAX,8),%R14 |
(4031) 0x4cd890 VXORPD %XMM2,%XMM2,%XMM2 |
(4031) 0x4cd894 XOR %R15D,%R15D |
(4031) 0x4cd897 NOPW (%RAX,%RAX,1) |
(4033) 0x4cd8a0 VMOVUPD (%R14,%R15,8),%YMM3 |
(4033) 0x4cd8a6 KXNORW %K0,%K0,%K1 |
(4033) 0x4cd8aa VXORPD %XMM4,%XMM4,%XMM4 |
(4033) 0x4cd8ae VGATHERQPD (%R12,%YMM3,8),%YMM4{%K1} |
(4033) 0x4cd8b5 VFNMADD231PD (%RSI,%R15,8),%YMM4,%YMM2 |
(4033) 0x4cd8bb ADD $0x4,%R15 |
(4033) 0x4cd8bf CMP %RBX,%R15 |
(4033) 0x4cd8c2 JBE 4cd8a0 |
(4031) 0x4cd8c4 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(4031) 0x4cd8ca VADDPD %XMM3,%XMM2,%XMM2 |
(4031) 0x4cd8ce VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(4031) 0x4cd8d3 VADDSD %XMM3,%XMM2,%XMM2 |
(4031) 0x4cd8d7 VADDSD %XMM2,%XMM1,%XMM1 |
(4031) 0x4cd8db CMP %RDX,%RCX |
(4031) 0x4cd8de MOV -0x40(%RBP),%R14 |
(4031) 0x4cd8e2 MOV -0x38(%RBP),%R15 |
(4031) 0x4cd8e6 MOV 0x28(%RBP),%RBX |
(4031) 0x4cd8ea MOV -0x30(%RBP),%RSI |
(4031) 0x4cd8ee JE 4cd830 |
(4031) 0x4cd8f4 JMP 4cd8f8 |
(4031) 0x4cd8f6 XOR %EDX,%EDX |
(4031) 0x4cd8f8 ADD %RAX,%RDX |
(4031) 0x4cd8fb NOPL (%RAX,%RAX,1) |
(4032) 0x4cd900 MOV (%R13,%RDX,8),%RAX |
(4032) 0x4cd905 VMOVSD (%R12,%RAX,8),%XMM2 |
(4032) 0x4cd90b VFNMADD231SD (%R11,%RDX,8),%XMM2,%XMM1 |
(4032) 0x4cd911 INC %RDX |
(4032) 0x4cd914 CMP %RDX,%R10 |
(4032) 0x4cd917 JNE 4cd900 |
(4031) 0x4cd919 JMP 4cd830 |
0x4cd91e CMP %R15,%R14 |
0x4cd921 JGE 4cdd7e |
0x4cd927 MOV (%R12),%RDI |
0x4cd92b MOV (%RSI),%RSI |
0x4cd92e MOV %R14,%RAX |
0x4cd931 NOT %RAX |
0x4cd934 ADD %RAX,%R15 |
0x4cd937 XOR %R8D,%R8D |
0x4cd93a VMOVDDUP 0x151de(%RIP),%XMM1 |
0x4cd942 MOV %R15,-0x38(%RBP) |
0x4cd946 MOV %RSI,-0x30(%RBP) |
0x4cd94a JMP 4cd96a |
0x4cd94c NOPL (%RAX) |
(4037) 0x4cd950 VMULSD %XMM0,%XMM2,%XMM2 |
(4037) 0x4cd954 VMOVSD %XMM2,(%RSI,%R9,8) |
(4037) 0x4cd95a LEA 0x1(%R8),%RAX |
(4037) 0x4cd95e CMP %R15,%R8 |
(4037) 0x4cd961 MOV %RAX,%R8 |
(4037) 0x4cd964 JE 4cdd7e |
(4037) 0x4cd96a LEA (%R14,%R8,1),%R9 |
(4037) 0x4cd96e VMOVSD (%RBX,%R9,8),%XMM2 |
(4037) 0x4cd974 VXORPD %XMM1,%XMM2,%XMM2 |
(4037) 0x4cd978 MOV (%RDI,%R9,8),%RAX |
(4037) 0x4cd97c MOV 0x8(%RDI,%R9,8),%R10 |
(4037) 0x4cd981 MOV %R10,%RCX |
(4037) 0x4cd984 SUB %RAX,%RCX |
(4037) 0x4cd987 JLE 4cd950 |
(4037) 0x4cd989 MOV -0x48(%RBP),%RDX |
(4037) 0x4cd98d MOV (%RDX),%R11 |
(4037) 0x4cd990 MOV 0x20(%RBP),%RDX |
(4037) 0x4cd994 MOV (%RDX),%R12 |
(4037) 0x4cd997 MOV 0x10(%RBP),%RDX |
(4037) 0x4cd99b MOV (%RDX),%R13 |
(4037) 0x4cd99e MOV %RCX,%RDX |
(4037) 0x4cd9a1 AND $-0x4,%RDX |
(4037) 0x4cd9a5 JE 4cda16 |
(4037) 0x4cd9a7 LEA -0x1(%RDX),%RBX |
(4037) 0x4cd9ab LEA (%R11,%RAX,8),%RSI |
(4037) 0x4cd9af LEA (%R13,%RAX,8),%R14 |
(4037) 0x4cd9b4 VXORPD %XMM3,%XMM3,%XMM3 |
(4037) 0x4cd9b8 XOR %R15D,%R15D |
(4037) 0x4cd9bb NOPL (%RAX,%RAX,1) |
(4039) 0x4cd9c0 VMOVUPD (%R14,%R15,8),%YMM4 |
(4039) 0x4cd9c6 KXNORW %K0,%K0,%K1 |
(4039) 0x4cd9ca VXORPD %XMM5,%XMM5,%XMM5 |
(4039) 0x4cd9ce VGATHERQPD (%R12,%YMM4,8),%YMM5{%K1} |
(4039) 0x4cd9d5 VFMADD231PD (%RSI,%R15,8),%YMM5,%YMM3 |
(4039) 0x4cd9db ADD $0x4,%R15 |
(4039) 0x4cd9df CMP %RBX,%R15 |
(4039) 0x4cd9e2 JBE 4cd9c0 |
(4037) 0x4cd9e4 VEXTRACTF128 $0x1,%YMM3,%XMM4 |
(4037) 0x4cd9ea VADDPD %XMM4,%XMM3,%XMM3 |
(4037) 0x4cd9ee VSHUFPD $0x1,%XMM3,%XMM3,%XMM4 |
(4037) 0x4cd9f3 VADDSD %XMM4,%XMM3,%XMM3 |
(4037) 0x4cd9f7 VADDSD %XMM3,%XMM2,%XMM2 |
(4037) 0x4cd9fb CMP %RDX,%RCX |
(4037) 0x4cd9fe MOV -0x40(%RBP),%R14 |
(4037) 0x4cda02 MOV -0x38(%RBP),%R15 |
(4037) 0x4cda06 MOV 0x28(%RBP),%RBX |
(4037) 0x4cda0a MOV -0x30(%RBP),%RSI |
(4037) 0x4cda0e JE 4cd950 |
(4037) 0x4cda14 JMP 4cda18 |
(4037) 0x4cda16 XOR %EDX,%EDX |
(4037) 0x4cda18 ADD %RAX,%RDX |
(4037) 0x4cda1b NOPL (%RAX,%RAX,1) |
(4038) 0x4cda20 MOV (%R13,%RDX,8),%RAX |
(4038) 0x4cda25 VMOVSD (%R12,%RAX,8),%XMM3 |
(4038) 0x4cda2b VFMADD231SD (%R11,%RDX,8),%XMM3,%XMM2 |
(4038) 0x4cda31 INC %RDX |
(4038) 0x4cda34 CMP %RDX,%R10 |
(4038) 0x4cda37 JNE 4cda20 |
(4037) 0x4cda39 JMP 4cd950 |
0x4cda3e VUCOMISD 0x1532a(%RIP),%XMM0 |
0x4cda46 JNE 4cdc6e |
0x4cda4c CMP %R15,%R14 |
0x4cda4f JGE 4cdd7e |
0x4cda55 VXORPD 0x150c1(%RIP){1to2},%XMM5,%XMM0 |
0x4cda5f MOV (%R12),%RDI |
0x4cda63 MOV (%RSI),%RDX |
0x4cda66 MOV %R14,%RAX |
0x4cda69 NOT %RAX |
0x4cda6c ADD %RAX,%R15 |
0x4cda6f XOR %R8D,%R8D |
0x4cda72 MOV %R15,-0x38(%RBP) |
0x4cda76 MOV %RDX,-0x30(%RBP) |
0x4cda7a JMP 4cda92 |
(4022) 0x4cda7c VMOVSD %XMM1,(%RDX,%R9,8) |
(4022) 0x4cda82 LEA 0x1(%R8),%RAX |
(4022) 0x4cda86 CMP %R15,%R8 |
(4022) 0x4cda89 MOV %RAX,%R8 |
(4022) 0x4cda8c JE 4cdd7e |
(4022) 0x4cda92 LEA (%R14,%R8,1),%R9 |
(4022) 0x4cda96 VMULSD (%RBX,%R9,8),%XMM0,%XMM1 |
(4022) 0x4cda9c MOV (%RDI,%R9,8),%RAX |
(4022) 0x4cdaa0 MOV 0x8(%RDI,%R9,8),%R10 |
(4022) 0x4cdaa5 MOV %R10,%RCX |
(4022) 0x4cdaa8 SUB %RAX,%RCX |
(4022) 0x4cdaab JLE 4cda7c |
(4022) 0x4cdaad MOV -0x48(%RBP),%RDX |
(4022) 0x4cdab1 MOV (%RDX),%R11 |
(4022) 0x4cdab4 MOV 0x20(%RBP),%RDX |
(4022) 0x4cdab8 MOV (%RDX),%R12 |
(4022) 0x4cdabb MOV 0x10(%RBP),%RDX |
(4022) 0x4cdabf MOV (%RDX),%R13 |
(4022) 0x4cdac2 MOV %RCX,%RSI |
(4022) 0x4cdac5 AND $-0x4,%RSI |
(4022) 0x4cdac9 JE 4cdb36 |
(4022) 0x4cdacb LEA -0x1(%RSI),%RDX |
(4022) 0x4cdacf LEA (%R11,%RAX,8),%RBX |
(4022) 0x4cdad3 LEA (%R13,%RAX,8),%R14 |
(4022) 0x4cdad8 VXORPD %XMM2,%XMM2,%XMM2 |
(4022) 0x4cdadc XOR %R15D,%R15D |
(4022) 0x4cdadf NOP |
(4024) 0x4cdae0 VMOVUPD (%R14,%R15,8),%YMM3 |
(4024) 0x4cdae6 KXNORW %K0,%K0,%K1 |
(4024) 0x4cdaea VXORPD %XMM4,%XMM4,%XMM4 |
(4024) 0x4cdaee VGATHERQPD (%R12,%YMM3,8),%YMM4{%K1} |
(4024) 0x4cdaf5 VFNMADD231PD (%RBX,%R15,8),%YMM4,%YMM2 |
(4024) 0x4cdafb ADD $0x4,%R15 |
(4024) 0x4cdaff CMP %RDX,%R15 |
(4024) 0x4cdb02 JBE 4cdae0 |
(4022) 0x4cdb04 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(4022) 0x4cdb0a VADDPD %XMM3,%XMM2,%XMM2 |
(4022) 0x4cdb0e VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(4022) 0x4cdb13 VADDSD %XMM3,%XMM2,%XMM2 |
(4022) 0x4cdb17 VADDSD %XMM2,%XMM1,%XMM1 |
(4022) 0x4cdb1b CMP %RSI,%RCX |
(4022) 0x4cdb1e MOV -0x40(%RBP),%R14 |
(4022) 0x4cdb22 MOV -0x38(%RBP),%R15 |
(4022) 0x4cdb26 MOV 0x28(%RBP),%RBX |
(4022) 0x4cdb2a MOV -0x30(%RBP),%RDX |
(4022) 0x4cdb2e JE 4cda7c |
(4022) 0x4cdb34 JMP 4cdb3c |
(4022) 0x4cdb36 XOR %ESI,%ESI |
(4022) 0x4cdb38 MOV -0x30(%RBP),%RDX |
(4022) 0x4cdb3c ADD %RAX,%RSI |
(4022) 0x4cdb3f NOP |
(4023) 0x4cdb40 MOV (%R13,%RSI,8),%RAX |
(4023) 0x4cdb45 VMOVSD (%R12,%RAX,8),%XMM2 |
(4023) 0x4cdb4b VFNMADD231SD (%R11,%RSI,8),%XMM2,%XMM1 |
(4023) 0x4cdb51 INC %RSI |
(4023) 0x4cdb54 CMP %RSI,%R10 |
(4023) 0x4cdb57 JNE 4cdb40 |
(4022) 0x4cdb59 JMP 4cda7c |
0x4cdb5e CMP %R15,%R14 |
0x4cdb61 JGE 4cdd7e |
0x4cdb67 MOV (%R12),%RDI |
0x4cdb6b MOV (%RSI),%RSI |
0x4cdb6e MOV %R14,%RAX |
0x4cdb71 NOT %RAX |
0x4cdb74 ADD %RAX,%R15 |
0x4cdb77 XOR %R8D,%R8D |
0x4cdb7a MOV %R15,-0x38(%RBP) |
0x4cdb7e MOV %RSI,-0x30(%RBP) |
0x4cdb82 JMP 4cdb9e |
(4028) 0x4cdb84 VMULSD %XMM0,%XMM1,%XMM1 |
(4028) 0x4cdb88 VMOVSD %XMM1,(%RSI,%R9,8) |
(4028) 0x4cdb8e LEA 0x1(%R8),%RAX |
(4028) 0x4cdb92 CMP %R15,%R8 |
(4028) 0x4cdb95 MOV %RAX,%R8 |
(4028) 0x4cdb98 JE 4cdd7e |
(4028) 0x4cdb9e LEA (%R14,%R8,1),%R9 |
(4028) 0x4cdba2 VMOVSD (%RBX,%R9,8),%XMM1 |
(4028) 0x4cdba8 MOV (%RDI,%R9,8),%RAX |
(4028) 0x4cdbac MOV 0x8(%RDI,%R9,8),%R10 |
(4028) 0x4cdbb1 MOV %R10,%RCX |
(4028) 0x4cdbb4 SUB %RAX,%RCX |
(4028) 0x4cdbb7 JLE 4cdb84 |
(4028) 0x4cdbb9 MOV -0x48(%RBP),%RDX |
(4028) 0x4cdbbd MOV (%RDX),%R11 |
(4028) 0x4cdbc0 MOV 0x20(%RBP),%RDX |
(4028) 0x4cdbc4 MOV (%RDX),%R12 |
(4028) 0x4cdbc7 MOV 0x10(%RBP),%RDX |
(4028) 0x4cdbcb MOV (%RDX),%R13 |
(4028) 0x4cdbce MOV %RCX,%RDX |
(4028) 0x4cdbd1 AND $-0x4,%RDX |
(4028) 0x4cdbd5 JE 4cdc46 |
(4028) 0x4cdbd7 LEA -0x1(%RDX),%RBX |
(4028) 0x4cdbdb LEA (%R11,%RAX,8),%RSI |
(4028) 0x4cdbdf LEA (%R13,%RAX,8),%R14 |
(4028) 0x4cdbe4 VXORPD %XMM2,%XMM2,%XMM2 |
(4028) 0x4cdbe8 XOR %R15D,%R15D |
(4028) 0x4cdbeb NOPL (%RAX,%RAX,1) |
(4030) 0x4cdbf0 VMOVUPD (%R14,%R15,8),%YMM3 |
(4030) 0x4cdbf6 KXNORW %K0,%K0,%K1 |
(4030) 0x4cdbfa VXORPD %XMM4,%XMM4,%XMM4 |
(4030) 0x4cdbfe VGATHERQPD (%R12,%YMM3,8),%YMM4{%K1} |
(4030) 0x4cdc05 VFMADD231PD (%RSI,%R15,8),%YMM4,%YMM2 |
(4030) 0x4cdc0b ADD $0x4,%R15 |
(4030) 0x4cdc0f CMP %RBX,%R15 |
(4030) 0x4cdc12 JBE 4cdbf0 |
(4028) 0x4cdc14 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(4028) 0x4cdc1a VADDPD %XMM3,%XMM2,%XMM2 |
(4028) 0x4cdc1e VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(4028) 0x4cdc23 VADDSD %XMM3,%XMM2,%XMM2 |
(4028) 0x4cdc27 VADDSD %XMM2,%XMM1,%XMM1 |
(4028) 0x4cdc2b CMP %RDX,%RCX |
(4028) 0x4cdc2e MOV -0x40(%RBP),%R14 |
(4028) 0x4cdc32 MOV -0x38(%RBP),%R15 |
(4028) 0x4cdc36 MOV 0x28(%RBP),%RBX |
(4028) 0x4cdc3a MOV -0x30(%RBP),%RSI |
(4028) 0x4cdc3e JE 4cdb84 |
(4028) 0x4cdc44 JMP 4cdc48 |
(4028) 0x4cdc46 XOR %EDX,%EDX |
(4028) 0x4cdc48 ADD %RAX,%RDX |
(4028) 0x4cdc4b NOPL (%RAX,%RAX,1) |
(4029) 0x4cdc50 MOV (%R13,%RDX,8),%RAX |
(4029) 0x4cdc55 VMOVSD (%R12,%RAX,8),%XMM2 |
(4029) 0x4cdc5b VFMADD231SD (%R11,%RDX,8),%XMM2,%XMM1 |
(4029) 0x4cdc61 INC %RDX |
(4029) 0x4cdc64 CMP %RDX,%R10 |
(4029) 0x4cdc67 JNE 4cdc50 |
(4028) 0x4cdc69 JMP 4cdb84 |
0x4cdc6e CMP %R15,%R14 |
0x4cdc71 JGE 4cdd7e |
0x4cdc77 MOV (%R12),%RDI |
0x4cdc7b MOV (%RSI),%RDX |
0x4cdc7e MOV %R14,%RAX |
0x4cdc81 NOT %RAX |
0x4cdc84 ADD %RAX,%R15 |
0x4cdc87 XOR %R8D,%R8D |
0x4cdc8a MOV %R15,-0x38(%RBP) |
0x4cdc8e MOV %RDX,-0x30(%RBP) |
0x4cdc92 JMP 4cdcae |
(4019) 0x4cdc94 VMULSD %XMM0,%XMM1,%XMM1 |
(4019) 0x4cdc98 VMOVSD %XMM1,(%RDX,%R9,8) |
(4019) 0x4cdc9e LEA 0x1(%R8),%RAX |
(4019) 0x4cdca2 CMP %R15,%R8 |
(4019) 0x4cdca5 MOV %RAX,%R8 |
(4019) 0x4cdca8 JE 4cdd7e |
(4019) 0x4cdcae LEA (%R14,%R8,1),%R9 |
(4019) 0x4cdcb2 VMULSD (%RBX,%R9,8),%XMM5,%XMM1 |
(4019) 0x4cdcb8 MOV (%RDI,%R9,8),%RAX |
(4019) 0x4cdcbc MOV 0x8(%RDI,%R9,8),%R10 |
(4019) 0x4cdcc1 MOV %R10,%RCX |
(4019) 0x4cdcc4 SUB %RAX,%RCX |
(4019) 0x4cdcc7 JLE 4cdc94 |
(4019) 0x4cdcc9 MOV -0x48(%RBP),%RDX |
(4019) 0x4cdccd MOV (%RDX),%R11 |
(4019) 0x4cdcd0 MOV 0x20(%RBP),%RDX |
(4019) 0x4cdcd4 MOV (%RDX),%R12 |
(4019) 0x4cdcd7 MOV 0x10(%RBP),%RDX |
(4019) 0x4cdcdb MOV (%RDX),%R13 |
(4019) 0x4cdcde MOV %RCX,%RSI |
(4019) 0x4cdce1 AND $-0x4,%RSI |
(4019) 0x4cdce5 JE 4cdd56 |
(4019) 0x4cdce7 LEA -0x1(%RSI),%RDX |
(4019) 0x4cdceb LEA (%R11,%RAX,8),%RBX |
(4019) 0x4cdcef LEA (%R13,%RAX,8),%R14 |
(4019) 0x4cdcf4 VXORPD %XMM2,%XMM2,%XMM2 |
(4019) 0x4cdcf8 XOR %R15D,%R15D |
(4019) 0x4cdcfb NOPL (%RAX,%RAX,1) |
(4021) 0x4cdd00 VMOVUPD (%R14,%R15,8),%YMM3 |
(4021) 0x4cdd06 KXNORW %K0,%K0,%K1 |
(4021) 0x4cdd0a VXORPD %XMM4,%XMM4,%XMM4 |
(4021) 0x4cdd0e VGATHERQPD (%R12,%YMM3,8),%YMM4{%K1} |
(4021) 0x4cdd15 VFMADD231PD (%RBX,%R15,8),%YMM4,%YMM2 |
(4021) 0x4cdd1b ADD $0x4,%R15 |
(4021) 0x4cdd1f CMP %RDX,%R15 |
(4021) 0x4cdd22 JBE 4cdd00 |
(4019) 0x4cdd24 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(4019) 0x4cdd2a VADDPD %XMM3,%XMM2,%XMM2 |
(4019) 0x4cdd2e VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(4019) 0x4cdd33 VADDSD %XMM3,%XMM2,%XMM2 |
(4019) 0x4cdd37 VADDSD %XMM2,%XMM1,%XMM1 |
(4019) 0x4cdd3b CMP %RSI,%RCX |
(4019) 0x4cdd3e MOV -0x40(%RBP),%R14 |
(4019) 0x4cdd42 MOV -0x38(%RBP),%R15 |
(4019) 0x4cdd46 MOV 0x28(%RBP),%RBX |
(4019) 0x4cdd4a MOV -0x30(%RBP),%RDX |
(4019) 0x4cdd4e JE 4cdc94 |
(4019) 0x4cdd54 JMP 4cdd5c |
(4019) 0x4cdd56 XOR %ESI,%ESI |
(4019) 0x4cdd58 MOV -0x30(%RBP),%RDX |
(4019) 0x4cdd5c ADD %RAX,%RSI |
(4019) 0x4cdd5f NOP |
(4020) 0x4cdd60 MOV (%R13,%RSI,8),%RAX |
(4020) 0x4cdd65 VMOVSD (%R12,%RAX,8),%XMM2 |
(4020) 0x4cdd6b VFMADD231SD (%R11,%RSI,8),%XMM2,%XMM1 |
(4020) 0x4cdd71 INC %RSI |
(4020) 0x4cdd74 CMP %RSI,%R10 |
(4020) 0x4cdd77 JNE 4cdd60 |
(4019) 0x4cdd79 JMP 4cdc94 |
0x4cdd7e ADD $0x28,%RSP |
0x4cdd82 POP %RBX |
0x4cdd83 POP %R12 |
0x4cdd85 POP %R13 |
0x4cdd87 POP %R14 |
0x4cdd89 POP %R15 |
0x4cdd8b POP %RBP |
0x4cdd8c VZEROUPPER |
0x4cdd8f RET |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►99.99+ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Path / |
Source file and lines | csr_matvec.c:243-404 |
Module | exec |
nb instructions | 242 |
nb uops | 261 |
loop length | 991 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 8 |
micro-operation queue | 43.50 cycles |
front end | 43.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 20.00 | 19.40 | 17.67 | 17.67 | 20.00 | 19.40 | 20.00 | 20.00 | 20.00 | 20.00 | 19.20 | 17.67 |
cycles | 20.00 | 19.40 | 17.67 | 17.67 | 20.00 | 19.40 | 20.00 | 20.00 | 20.00 | 20.00 | 19.20 | 17.67 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 42.22 |
Stall cycles | 0.00 |
Front-end | 43.50 |
Dispatch | 20.00 |
Overall L1 | 43.50 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 2% |
all | 11% |
load | 6% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
all | 2% |
load | 2% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 4% |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 9% |
all | 13% |
load | 13% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 10% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x28,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R8,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4cb940 <hypre_CSRMatrixGetLoadBalancedPartitionBegin> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R15,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4cb9c0 <hypre_CSRMatrixGetLoadBalancedPartitionEnd> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RAX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4ccf27 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x67> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x24dd00(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4f4345,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4f635b,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d53b0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4f6d01,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xf8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d7ce0 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x18(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4ccf35 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x75> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RBX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4ccf63 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa3> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x24dcc4(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4f4345,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4f6d88,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d53b0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4f6d01,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xf9,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d7ce0 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R15,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4ccf72 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb2> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RBX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4ccfa5 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xe5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x24dc87(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4f4345,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4f6daa,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d53b0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4f6d01,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xfa,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d7ce0 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVQ %R13,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD %XMM1,%XMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R14,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JNE 4cd0dd <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x21d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x14ea8(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cd21e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x35e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4cdd7e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cd016 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x156> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x28(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VUCOMISD 0x15c87(%RIP),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cd33d <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x47d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x14d79(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cd46e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x5ae> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4cdd7e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x159ff(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cd146 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x286> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x15b4a(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cd59e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x6de> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4cdd7e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cd276 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x3b6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x14b2b(%RIP),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cd6bd <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x7fd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x14b1d(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cd7ee <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x92e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4cdd7e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cd396 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x4d6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x158fa(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cd91e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa5e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4cdd7e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cd4c6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x606> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4cdd7e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cd5ea <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x72a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x147ab(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cda3e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb7e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4cdd7e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cd716 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x856> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x1557a(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cdb5e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xc9e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4cdd7e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x15300(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cd846 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x986> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4cdd7e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x151de(%RIP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cd96a <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xaaa> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x1532a(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cdc6e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xdae> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4cdd7e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VXORPD 0x150c1(%RIP){1to2},%XMM5,%XMM0 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cda92 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xbd2> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4cdd7e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cdb9e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xcde> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4cdd7e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cdcae <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xdee> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD $0x28,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
Source file and lines | csr_matvec.c:243-404 |
Module | exec |
nb instructions | 242 |
nb uops | 261 |
loop length | 991 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 8 |
micro-operation queue | 43.50 cycles |
front end | 43.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 20.00 | 19.40 | 17.67 | 17.67 | 20.00 | 19.40 | 20.00 | 20.00 | 20.00 | 20.00 | 19.20 | 17.67 |
cycles | 20.00 | 19.40 | 17.67 | 17.67 | 20.00 | 19.40 | 20.00 | 20.00 | 20.00 | 20.00 | 19.20 | 17.67 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 42.22 |
Stall cycles | 0.00 |
Front-end | 43.50 |
Dispatch | 20.00 |
Overall L1 | 43.50 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 2% |
all | 11% |
load | 6% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
all | 2% |
load | 2% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 4% |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 9% |
all | 13% |
load | 13% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 10% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x28,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R8,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4cb940 <hypre_CSRMatrixGetLoadBalancedPartitionBegin> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R15,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4cb9c0 <hypre_CSRMatrixGetLoadBalancedPartitionEnd> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RAX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4ccf27 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x67> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x24dd00(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4f4345,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4f635b,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d53b0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4f6d01,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xf8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d7ce0 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x18(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4ccf35 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x75> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RBX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4ccf63 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa3> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x24dcc4(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4f4345,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4f6d88,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d53b0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4f6d01,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xf9,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d7ce0 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R15,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4ccf72 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb2> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RBX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4ccfa5 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xe5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x24dc87(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4f4345,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4f6daa,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d53b0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4f6d01,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xfa,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d7ce0 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVQ %R13,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD %XMM1,%XMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R14,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JNE 4cd0dd <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x21d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x14ea8(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cd21e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x35e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4cdd7e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cd016 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x156> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x28(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VUCOMISD 0x15c87(%RIP),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cd33d <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x47d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x14d79(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cd46e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x5ae> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4cdd7e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x159ff(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cd146 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x286> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x15b4a(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cd59e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x6de> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4cdd7e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cd276 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x3b6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x14b2b(%RIP),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cd6bd <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x7fd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x14b1d(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cd7ee <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x92e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4cdd7e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cd396 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x4d6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x158fa(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cd91e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa5e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4cdd7e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cd4c6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x606> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4cdd7e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cd5ea <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x72a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x147ab(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cda3e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb7e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4cdd7e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cd716 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x856> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x1557a(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cdb5e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xc9e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4cdd7e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x15300(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cd846 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x986> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4cdd7e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x151de(%RIP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cd96a <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xaaa> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x1532a(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cdc6e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xdae> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4cdd7e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VXORPD 0x150c1(%RIP){1to2},%XMM5,%XMM0 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cda92 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xbd2> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4cdd7e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cdb9e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xcde> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4cdd7e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cdcae <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xdee> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD $0x28,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_CSRMatrixMatvecOutOfPlace.extracted– | 12.09 | 1.82 |
▼Loop 4034 - csr_matvec.c:248-341 - exec– | 0.97 | 0.12 |
○Loop 4035 - csr_matvec.c:337-339 - exec | 0.45 | 0.06 |
○Loop 4036 - csr_matvec.c:337-339 - exec | 0.13 | 0.02 |
▼Loop 4040 - csr_matvec.c:248-314 - exec– | 0.64 | 0.08 |
○Loop 4042 - csr_matvec.c:310-312 - exec | 4.26 | 0.53 |
○Loop 4041 - csr_matvec.c:310-312 - exec | 0.7 | 0.09 |
▼Loop 4052 - csr_matvec.c:248-263 - exec– | 0.52 | 0.06 |
○Loop 4054 - csr_matvec.c:259-261 - exec | 3.76 | 0.47 |
○Loop 4053 - csr_matvec.c:259-261 - exec | 0.65 | 0.08 |
▼Loop 4049 - csr_matvec.c:248-275 - exec– | 0 | 0 |
○Loop 4051 - csr_matvec.c:271-273 - exec | 0 | 0 |
○Loop 4050 - csr_matvec.c:271-273 - exec | 0 | 0 |
▼Loop 4037 - csr_matvec.c:248-326 - exec– | 0 | 0 |
○Loop 4039 - csr_matvec.c:322-324 - exec | 0 | 0 |
○Loop 4038 - csr_matvec.c:322-324 - exec | 0 | 0 |
▼Loop 4025 - csr_matvec.c:248-380 - exec– | 0 | 0 |
○Loop 4027 - csr_matvec.c:376-378 - exec | 0 | 0 |
○Loop 4026 - csr_matvec.c:376-378 - exec | 0 | 0 |
▼Loop 4019 - csr_matvec.c:248-404 - exec– | 0 | 0 |
○Loop 4021 - csr_matvec.c:400-402 - exec | 0 | 0 |
○Loop 4020 - csr_matvec.c:400-402 - exec | 0 | 0 |
▼Loop 4046 - csr_matvec.c:248-287 - exec– | 0 | 0 |
○Loop 4048 - csr_matvec.c:283-285 - exec | 0 | 0 |
○Loop 4047 - csr_matvec.c:283-285 - exec | 0 | 0 |
▼Loop 4028 - csr_matvec.c:248-365 - exec– | 0 | 0 |
○Loop 4029 - csr_matvec.c:361-363 - exec | 0 | 0 |
○Loop 4030 - csr_matvec.c:361-363 - exec | 0 | 0 |
▼Loop 4022 - csr_matvec.c:248-392 - exec– | 0 | 0 |
○Loop 4023 - csr_matvec.c:388-390 - exec | 0 | 0 |
○Loop 4024 - csr_matvec.c:388-390 - exec | 0 | 0 |
▼Loop 4031 - csr_matvec.c:248-353 - exec– | 0 | 0 |
○Loop 4033 - csr_matvec.c:349-351 - exec | 0 | 0 |
○Loop 4032 - csr_matvec.c:349-351 - exec | 0 | 0 |
▼Loop 4043 - csr_matvec.c:248-302 - exec– | 0 | 0 |
○Loop 4044 - csr_matvec.c:298-300 - exec | 0 | 0 |
○Loop 4045 - csr_matvec.c:298-300 - exec | 0 | 0 |