Function: hypre_CSRMatrixMatvecOutOfPlace.extracted | Module: libseq_mv.so | Source: csr_matvec.c:243-404 [...] | Coverage: 18.69% |
---|
Function: hypre_CSRMatrixMatvecOutOfPlace.extracted | Module: libseq_mv.so | Source: csr_matvec.c:243-404 [...] | Coverage: 18.69% |
---|
/scratch_na/users/xoserete/qaas_runs/171-587-0005/intel/AMG/build/AMG/AMG/seq_mv/csr_matrix.c: 645 - 674 |
-------------------------------------------------------------------------------- |
645: HYPRE_Int num_nonzerosA = hypre_CSRMatrixNumNonzeros(A); |
646: HYPRE_Int num_rowsA = hypre_CSRMatrixNumRows(A); |
647: HYPRE_Int *A_i = hypre_CSRMatrixI(A); |
648: |
649: HYPRE_Int num_threads = hypre_NumActiveThreads(); |
650: |
651: HYPRE_Int nonzeros_per_thread = (num_nonzerosA + num_threads - 1)/num_threads; |
652: |
653: if (idx <= 0) |
654: { |
655: return 0; |
656: } |
657: else if (idx >= num_threads) |
[...] |
663: return (HYPRE_Int)(hypre_LowerBound(A_i, A_i + num_rowsA, nonzeros_per_thread*idx) - A_i); |
[...] |
669: return hypre_CSRMatrixGetLoadBalancedPartitionBoundary(A, hypre_GetThreadNum()); |
670: } |
671: |
672: HYPRE_Int hypre_CSRMatrixGetLoadBalancedPartitionEnd(hypre_CSRMatrix *A) |
673: { |
674: return hypre_CSRMatrixGetLoadBalancedPartitionBoundary(A, hypre_GetThreadNum() + 1); |
/scratch_na/users/xoserete/qaas_runs/171-587-0005/intel/AMG/build/AMG/AMG/seq_mv/csr_matvec.c: 243 - 404 |
-------------------------------------------------------------------------------- |
243: #pragma omp parallel private(i,jj,tempx) |
244: #endif |
245: { |
246: HYPRE_Int iBegin = hypre_CSRMatrixGetLoadBalancedPartitionBegin(A); |
247: HYPRE_Int iEnd = hypre_CSRMatrixGetLoadBalancedPartitionEnd(A); |
248: hypre_assert(iBegin <= iEnd); |
249: hypre_assert(iBegin >= 0 && iBegin <= num_rows); |
250: hypre_assert(iEnd >= 0 && iEnd <= num_rows); |
251: |
252: if (0 == temp) |
253: { |
254: if (1 == alpha) // JSP: a common path |
255: { |
256: for (i = iBegin; i < iEnd; i++) |
257: { |
258: tempx = 0.0; |
259: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
260: { |
261: tempx += A_data[jj] * x_data[A_j[jj]]; |
262: } |
263: y_data[i] = tempx; |
264: } |
265: } // y = A*x |
266: else if (-1 == alpha) |
267: { |
268: for (i = iBegin; i < iEnd; i++) |
269: { |
270: tempx = 0.0; |
271: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
272: { |
273: tempx -= A_data[jj] * x_data[A_j[jj]]; |
274: } |
275: y_data[i] = tempx; |
276: } |
277: } // y = -A*x |
278: else |
279: { |
280: for (i = iBegin; i < iEnd; i++) |
281: { |
282: tempx = 0.0; |
283: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
284: { |
285: tempx += A_data[jj] * x_data[A_j[jj]]; |
286: } |
287: y_data[i] = alpha*tempx; |
288: } |
289: } // y = alpha*A*x |
290: } // temp == 0 |
291: else if (-1 == temp) // beta == -alpha |
292: { |
293: if (1 == alpha) // JSP: a common path |
294: { |
295: for (i = iBegin; i < iEnd; i++) |
296: { |
297: tempx = -b_data[i]; |
298: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
299: { |
300: tempx += A_data[jj] * x_data[A_j[jj]]; |
301: } |
302: y_data[i] = tempx; |
303: } |
304: } // y = A*x - y |
305: else if (-1 == alpha) // JSP: a common path |
306: { |
307: for (i = iBegin; i < iEnd; i++) |
308: { |
309: tempx = b_data[i]; |
310: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
311: { |
312: tempx -= A_data[jj] * x_data[A_j[jj]]; |
313: } |
314: y_data[i] = tempx; |
315: } |
316: } // y = -A*x + y |
317: else |
318: { |
319: for (i = iBegin; i < iEnd; i++) |
320: { |
321: tempx = -b_data[i]; |
322: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
323: { |
324: tempx += A_data[jj] * x_data[A_j[jj]]; |
325: } |
326: y_data[i] = alpha*tempx; |
327: } |
328: } // y = alpha*(A*x - y) |
329: } // temp == -1 |
330: else if (1 == temp) |
331: { |
332: if (1 == alpha) // JSP: a common path |
333: { |
334: for (i = iBegin; i < iEnd; i++) |
335: { |
336: tempx = b_data[i]; |
337: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
338: { |
339: tempx += A_data[jj] * x_data[A_j[jj]]; |
340: } |
341: y_data[i] = tempx; |
342: } |
343: } // y = A*x + y |
344: else if (-1 == alpha) |
345: { |
346: for (i = iBegin; i < iEnd; i++) |
347: { |
348: tempx = -b_data[i]; |
349: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
350: { |
351: tempx -= A_data[jj] * x_data[A_j[jj]]; |
352: } |
353: y_data[i] = tempx; |
354: } |
355: } // y = -A*x - y |
356: else |
357: { |
358: for (i = iBegin; i < iEnd; i++) |
359: { |
360: tempx = b_data[i]; |
361: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
362: { |
363: tempx += A_data[jj] * x_data[A_j[jj]]; |
364: } |
365: y_data[i] = alpha*tempx; |
[...] |
371: if (1 == alpha) // JSP: a common path |
372: { |
373: for (i = iBegin; i < iEnd; i++) |
374: { |
375: tempx = b_data[i]*temp; |
376: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
377: { |
378: tempx += A_data[jj] * x_data[A_j[jj]]; |
379: } |
380: y_data[i] = tempx; |
381: } |
382: } // y = A*x + temp*y |
383: else if (-1 == alpha) |
384: { |
385: for (i = iBegin; i < iEnd; i++) |
386: { |
387: tempx = -b_data[i]*temp; |
388: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
389: { |
390: tempx -= A_data[jj] * x_data[A_j[jj]]; |
391: } |
392: y_data[i] = tempx; |
393: } |
394: } // y = -A*x - temp*y |
395: else |
396: { |
397: for (i = iBegin; i < iEnd; i++) |
398: { |
399: tempx = b_data[i]*temp; |
400: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
401: { |
402: tempx += A_data[jj] * x_data[A_j[jj]]; |
403: } |
404: y_data[i] = alpha*tempx; |
0x6aa0 PUSH %RBP |
0x6aa1 MOV %RSP,%RBP |
0x6aa4 PUSH %R15 |
0x6aa6 PUSH %R14 |
0x6aa8 PUSH %R13 |
0x6aaa PUSH %R12 |
0x6aac PUSH %RBX |
0x6aad SUB $0x38,%RSP |
0x6ab1 MOV %R9,-0x30(%RBP) |
0x6ab5 MOV %R8,-0x58(%RBP) |
0x6ab9 MOV %RCX,%R15 |
0x6abc MOV %RDX,%R13 |
0x6abf CALL 2220 <hypre_GetThreadNum@plt> |
0x6ac4 MOV %RAX,%RBX |
0x6ac7 MOV 0x20(%R15),%R14 |
0x6acb MOV (%R15),%R12 |
0x6ace MOV 0x10(%R15),%RAX |
0x6ad2 MOV %RAX,-0x50(%RBP) |
0x6ad6 CALL 2310 <hypre_NumActiveThreads@plt> |
0x6adb MOV %RAX,%RCX |
0x6ade ADD %R14,%RAX |
0x6ae1 DEC %RAX |
0x6ae4 MOV %RAX,%RDX |
0x6ae7 OR %RCX,%RDX |
0x6aea SHR $0x20,%RDX |
0x6aee JE 6b23 |
0x6af0 CQTO |
0x6af2 IDIV %RCX |
0x6af5 TEST %RBX,%RBX |
0x6af8 JLE 6b2c |
0x6afa CMP %RBX,%RCX |
0x6afd JLE 6b34 |
0x6aff MOV -0x50(%RBP),%RCX |
0x6b03 LEA (%R12,%RCX,8),%RSI |
0x6b07 IMUL %RBX,%RAX |
0x6b0b MOV %R12,%RDI |
0x6b0e MOV %RAX,%RDX |
0x6b11 CALL 22d0 <hypre_LowerBound@plt> |
0x6b16 SUB %R12,%RAX |
0x6b19 SAR $0x3,%RAX |
0x6b1d MOV %RAX,-0x50(%RBP) |
0x6b21 JMP 6b34 |
0x6b23 XOR %EDX,%EDX |
0x6b25 DIV %ECX |
0x6b27 TEST %RBX,%RBX |
0x6b2a JG 6afa |
0x6b2c MOVQ $0,-0x50(%RBP) |
0x6b34 CALL 2220 <hypre_GetThreadNum@plt> |
0x6b39 MOV %RAX,%RBX |
0x6b3c MOV 0x20(%R15),%R14 |
0x6b40 MOV (%R15),%R12 |
0x6b43 MOV 0x10(%R15),%R15 |
0x6b47 CALL 2310 <hypre_NumActiveThreads@plt> |
0x6b4c MOV %RAX,%RCX |
0x6b4f ADD %R14,%RAX |
0x6b52 DEC %RAX |
0x6b55 MOV %RAX,%RDX |
0x6b58 OR %RCX,%RDX |
0x6b5b SHR $0x20,%RDX |
0x6b5f JE 6b68 |
0x6b61 CQTO |
0x6b63 IDIV %RCX |
0x6b66 JMP 6b6c |
0x6b68 XOR %EDX,%EDX |
0x6b6a DIV %ECX |
0x6b6c MOV -0x50(%RBP),%R14 |
0x6b70 TEST %RBX,%RBX |
0x6b73 JS 6dad |
0x6b79 INC %RBX |
0x6b7c CMP %RBX,%RCX |
0x6b7f JLE 6b9e |
0x6b81 LEA (%R12,%R15,8),%RSI |
0x6b85 IMUL %RBX,%RAX |
0x6b89 MOV %R12,%RDI |
0x6b8c MOV %RAX,%RDX |
0x6b8f CALL 22d0 <hypre_LowerBound@plt> |
0x6b94 MOV %RAX,%R15 |
0x6b97 SUB %R12,%R15 |
0x6b9a SAR $0x3,%R15 |
0x6b9e CMP %R15,%R14 |
0x6ba1 JLE 6bda |
0x6ba3 MOV 0x208436(%RIP),%RAX |
0x6baa MOV (%RAX),%RDI |
0x6bad LEA 0x4345(%RIP),%RSI |
0x6bb4 LEA 0x42e6(%RIP),%RDX |
0x6bbb XOR %EAX,%EAX |
0x6bbd CALL 2370 <hypre_fprintf@plt> |
0x6bc2 LEA 0x4251(%RIP),%RDI |
0x6bc9 MOV $0xf8,%ESI |
0x6bce MOV $0x1,%EDX |
0x6bd3 XOR %ECX,%ECX |
0x6bd5 CALL 23b0 <hypre_error_handler@plt> |
0x6bda MOV 0x18(%RBP),%RBX |
0x6bde TEST %R14,%R14 |
0x6be1 JS 6be8 |
0x6be3 CMP %RBX,%R14 |
0x6be6 JLE 6c1f |
0x6be8 MOV 0x2083f1(%RIP),%RAX |
0x6bef MOV (%RAX),%RDI |
0x6bf2 LEA 0x4300(%RIP),%RSI |
0x6bf9 LEA 0x42b0(%RIP),%RDX |
0x6c00 XOR %EAX,%EAX |
0x6c02 CALL 2370 <hypre_fprintf@plt> |
0x6c07 LEA 0x420c(%RIP),%RDI |
0x6c0e MOV $0xf9,%ESI |
0x6c13 MOV $0x1,%EDX |
0x6c18 XOR %ECX,%ECX |
0x6c1a CALL 23b0 <hypre_error_handler@plt> |
0x6c1f VMOVSD 0x38(%RBP),%XMM4 |
0x6c24 TEST %R15,%R15 |
0x6c27 JS 6c2e |
0x6c29 CMP %RBX,%R15 |
0x6c2c JLE 6c6a |
0x6c2e MOV 0x2083ab(%RIP),%RAX |
0x6c35 MOV (%RAX),%RDI |
0x6c38 LEA 0x42ba(%RIP),%RSI |
0x6c3f LEA 0x428c(%RIP),%RDX |
0x6c46 XOR %EAX,%EAX |
0x6c48 CALL 2370 <hypre_fprintf@plt> |
0x6c4d LEA 0x41c6(%RIP),%RDI |
0x6c54 MOV $0xfa,%ESI |
0x6c59 MOV $0x1,%EDX |
0x6c5e XOR %ECX,%ECX |
0x6c60 CALL 23b0 <hypre_error_handler@plt> |
0x6c65 VMOVSD 0x38(%RBP),%XMM4 |
0x6c6a MOV 0x30(%RBP),%RSI |
0x6c6e VMOVQ %R13,%XMM0 |
0x6c73 VXORPD %XMM1,%XMM1,%XMM1 |
0x6c77 VUCOMISD %XMM1,%XMM4 |
0x6c7b JNE 6dbe |
0x6c81 VUCOMISD 0x3ee7(%RIP),%XMM0 |
0x6c89 JNE 6f0c |
0x6c8f CMP %R15,%R14 |
0x6c92 JGE 7adc |
0x6c98 MOV -0x30(%RBP),%RAX |
0x6c9c MOV (%RAX),%RDX |
0x6c9f MOV (%RSI),%RSI |
0x6ca2 MOV %R14,%RAX |
0x6ca5 NOT %RAX |
0x6ca8 ADD %RAX,%R15 |
0x6cab XOR %EDI,%EDI |
0x6cad MOV %R15,-0x30(%RBP) |
0x6cb1 MOV %RDX,-0x48(%RBP) |
0x6cb5 MOV %RSI,-0x40(%RBP) |
0x6cb9 JMP 6cd6 |
0x6cbb NOPL (%RAX,%RAX,1) |
(147) 0x6cc0 VMOVSD %XMM0,(%RSI,%R8,8) |
(147) 0x6cc6 LEA 0x1(%RDI),%RAX |
(147) 0x6cca CMP %R15,%RDI |
(147) 0x6ccd MOV %RAX,%RDI |
(147) 0x6cd0 JE 7adc |
(147) 0x6cd6 LEA (%R14,%RDI,1),%R8 |
(147) 0x6cda MOV (%RDX,%R8,8),%R13 |
(147) 0x6cde MOV 0x8(%RDX,%R8,8),%R9 |
(147) 0x6ce3 VXORPD %XMM0,%XMM0,%XMM0 |
(147) 0x6ce7 MOV %R9,%RAX |
(147) 0x6cea SUB %R13,%RAX |
(147) 0x6ced JLE 6cc0 |
(147) 0x6cef MOV -0x58(%RBP),%RCX |
(147) 0x6cf3 MOV (%RCX),%R10 |
(147) 0x6cf6 MOV 0x20(%RBP),%RCX |
(147) 0x6cfa MOV (%RCX),%R11 |
(147) 0x6cfd MOV 0x10(%RBP),%RCX |
(147) 0x6d01 MOV (%RCX),%RBX |
(147) 0x6d04 MOV %RAX,%R12 |
(147) 0x6d07 AND $-0x2,%R12 |
(147) 0x6d0b JE 6d7c |
(147) 0x6d0d LEA -0x1(%R12),%RCX |
(147) 0x6d12 LEA (%R10,%R13,8),%R14 |
(147) 0x6d16 MOV %R13,-0x38(%RBP) |
(147) 0x6d1a LEA (%RBX,%R13,8),%R15 |
(147) 0x6d1e VXORPD %XMM0,%XMM0,%XMM0 |
(147) 0x6d22 XOR %ESI,%ESI |
(147) 0x6d24 NOPW %CS:(%RAX,%RAX,1) |
(149) 0x6d30 MOV (%R15,%RSI,8),%RDX |
(149) 0x6d34 MOV 0x8(%R15,%RSI,8),%R13 |
(149) 0x6d39 VMOVSD (%R11,%RDX,8),%XMM1 |
(149) 0x6d3f VMOVHPD (%R11,%R13,8),%XMM1,%XMM1 |
(149) 0x6d45 VFMADD231PD (%R14,%RSI,8),%XMM1,%XMM0 |
(149) 0x6d4b ADD $0x2,%RSI |
(149) 0x6d4f CMP %RCX,%RSI |
(149) 0x6d52 JBE 6d30 |
(147) 0x6d54 VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(147) 0x6d59 VADDSD %XMM1,%XMM0,%XMM0 |
(147) 0x6d5d CMP %R12,%RAX |
(147) 0x6d60 MOV -0x50(%RBP),%R14 |
(147) 0x6d64 MOV -0x30(%RBP),%R15 |
(147) 0x6d68 MOV -0x48(%RBP),%RDX |
(147) 0x6d6c MOV -0x40(%RBP),%RSI |
(147) 0x6d70 MOV -0x38(%RBP),%R13 |
(147) 0x6d74 JE 6cc0 |
(147) 0x6d7a JMP 6d7f |
(147) 0x6d7c XOR %R12D,%R12D |
(147) 0x6d7f ADD %R13,%R12 |
(147) 0x6d82 NOPW %CS:(%RAX,%RAX,1) |
(148) 0x6d90 MOV (%RBX,%R12,8),%RAX |
(148) 0x6d94 VMOVSD (%R11,%RAX,8),%XMM1 |
(148) 0x6d9a VFMADD231SD (%R10,%R12,8),%XMM1,%XMM0 |
(148) 0x6da0 INC %R12 |
(148) 0x6da3 CMP %R12,%R9 |
(148) 0x6da6 JNE 6d90 |
(147) 0x6da8 JMP 6cc0 |
0x6dad XOR %R15D,%R15D |
0x6db0 CMP %R15,%R14 |
0x6db3 JG 6ba3 |
0x6db9 JMP 6bda |
0x6dbe MOV 0x28(%RBP),%RDX |
0x6dc2 VUCOMISD 0x3dae(%RIP),%XMM4 |
0x6dca JNE 703d |
0x6dd0 VUCOMISD 0x3d98(%RIP),%XMM0 |
0x6dd8 JNE 717c |
0x6dde CMP %R15,%R14 |
0x6de1 JGE 7adc |
0x6de7 MOV -0x30(%RBP),%RAX |
0x6deb MOV (%RAX),%RDI |
0x6dee MOV (%RSI),%RSI |
0x6df1 MOV %R14,%RAX |
0x6df4 NOT %RAX |
0x6df7 ADD %RAX,%R15 |
0x6dfa XOR %R8D,%R8D |
0x6dfd VMOVDDUP 0x3d7b(%RIP),%XMM0 |
0x6e05 MOV %R15,-0x30(%RBP) |
0x6e09 MOV %RDI,-0x48(%RBP) |
0x6e0d MOV %RSI,-0x40(%RBP) |
0x6e11 JMP 6e36 |
0x6e13 NOPW %CS:(%RAX,%RAX,1) |
(138) 0x6e20 VMOVSD %XMM1,(%RSI,%R9,8) |
(138) 0x6e26 LEA 0x1(%R8),%RAX |
(138) 0x6e2a CMP %R15,%R8 |
(138) 0x6e2d MOV %RAX,%R8 |
(138) 0x6e30 JE 7adc |
(138) 0x6e36 LEA (%R14,%R8,1),%R9 |
(138) 0x6e3a VMOVSD (%RDX,%R9,8),%XMM1 |
(138) 0x6e40 VXORPD %XMM0,%XMM1,%XMM1 |
(138) 0x6e44 MOV (%RDI,%R9,8),%RCX |
(138) 0x6e48 MOV 0x8(%RDI,%R9,8),%R10 |
(138) 0x6e4d MOV %R10,%RAX |
(138) 0x6e50 SUB %RCX,%RAX |
(138) 0x6e53 JLE 6e20 |
(138) 0x6e55 MOV %RCX,-0x38(%RBP) |
(138) 0x6e59 MOV -0x58(%RBP),%RCX |
(138) 0x6e5d MOV (%RCX),%R11 |
(138) 0x6e60 MOV 0x20(%RBP),%RCX |
(138) 0x6e64 MOV (%RCX),%RBX |
(138) 0x6e67 MOV 0x10(%RBP),%RCX |
(138) 0x6e6b MOV (%RCX),%R12 |
(138) 0x6e6e MOV %RAX,%R13 |
(138) 0x6e71 AND $-0x2,%R13 |
(138) 0x6e75 JE 6ede |
(138) 0x6e77 LEA -0x1(%R13),%RCX |
(138) 0x6e7b MOV -0x38(%RBP),%RDX |
(138) 0x6e7f LEA (%R11,%RDX,8),%R14 |
(138) 0x6e83 LEA (%R12,%RDX,8),%R15 |
(138) 0x6e87 VXORPD %XMM2,%XMM2,%XMM2 |
(138) 0x6e8b XOR %ESI,%ESI |
(138) 0x6e8d NOPL (%RAX) |
(140) 0x6e90 MOV (%R15,%RSI,8),%RDI |
(140) 0x6e94 MOV 0x8(%R15,%RSI,8),%RDX |
(140) 0x6e99 VMOVSD (%RBX,%RDI,8),%XMM3 |
(140) 0x6e9e VMOVHPD (%RBX,%RDX,8),%XMM3,%XMM3 |
(140) 0x6ea3 VFMADD231PD (%R14,%RSI,8),%XMM3,%XMM2 |
(140) 0x6ea9 ADD $0x2,%RSI |
(140) 0x6ead CMP %RCX,%RSI |
(140) 0x6eb0 JBE 6e90 |
(138) 0x6eb2 VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(138) 0x6eb7 VADDSD %XMM3,%XMM2,%XMM2 |
(138) 0x6ebb VADDSD %XMM2,%XMM1,%XMM1 |
(138) 0x6ebf CMP %R13,%RAX |
(138) 0x6ec2 MOV -0x50(%RBP),%R14 |
(138) 0x6ec6 MOV -0x30(%RBP),%R15 |
(138) 0x6eca MOV 0x28(%RBP),%RDX |
(138) 0x6ece MOV -0x48(%RBP),%RDI |
(138) 0x6ed2 MOV -0x40(%RBP),%RSI |
(138) 0x6ed6 JE 6e20 |
(138) 0x6edc JMP 6ee1 |
(138) 0x6ede XOR %R13D,%R13D |
(138) 0x6ee1 ADD -0x38(%RBP),%R13 |
(138) 0x6ee5 NOPW %CS:(%RAX,%RAX,1) |
(139) 0x6ef0 MOV (%R12,%R13,8),%RAX |
(139) 0x6ef4 VMOVSD (%RBX,%RAX,8),%XMM2 |
(139) 0x6ef9 VFMADD231SD (%R11,%R13,8),%XMM2,%XMM1 |
(139) 0x6eff INC %R13 |
(139) 0x6f02 CMP %R13,%R10 |
(139) 0x6f05 JNE 6ef0 |
(138) 0x6f07 JMP 6e20 |
0x6f0c VUCOMISD 0x3c64(%RIP),%XMM0 |
0x6f14 JNE 72ac |
0x6f1a CMP %R15,%R14 |
0x6f1d JGE 7adc |
0x6f23 MOV -0x30(%RBP),%RAX |
0x6f27 MOV (%RAX),%RDX |
0x6f2a MOV (%RSI),%RSI |
0x6f2d MOV %R14,%RAX |
0x6f30 NOT %RAX |
0x6f33 ADD %RAX,%R15 |
0x6f36 XOR %EDI,%EDI |
0x6f38 MOV %R15,-0x30(%RBP) |
0x6f3c MOV %RDX,-0x48(%RBP) |
0x6f40 MOV %RSI,-0x40(%RBP) |
0x6f44 JMP 6f66 |
0x6f46 NOPW %CS:(%RAX,%RAX,1) |
(144) 0x6f50 VMOVSD %XMM0,(%RSI,%R8,8) |
(144) 0x6f56 LEA 0x1(%RDI),%RAX |
(144) 0x6f5a CMP %R15,%RDI |
(144) 0x6f5d MOV %RAX,%RDI |
(144) 0x6f60 JE 7adc |
(144) 0x6f66 LEA (%R14,%RDI,1),%R8 |
(144) 0x6f6a MOV (%RDX,%R8,8),%R13 |
(144) 0x6f6e MOV 0x8(%RDX,%R8,8),%R9 |
(144) 0x6f73 VXORPD %XMM0,%XMM0,%XMM0 |
(144) 0x6f77 MOV %R9,%RAX |
(144) 0x6f7a SUB %R13,%RAX |
(144) 0x6f7d JLE 6f50 |
(144) 0x6f7f MOV -0x58(%RBP),%RCX |
(144) 0x6f83 MOV (%RCX),%R10 |
(144) 0x6f86 MOV 0x20(%RBP),%RCX |
(144) 0x6f8a MOV (%RCX),%R11 |
(144) 0x6f8d MOV 0x10(%RBP),%RCX |
(144) 0x6f91 MOV (%RCX),%RBX |
(144) 0x6f94 MOV %RAX,%R12 |
(144) 0x6f97 AND $-0x2,%R12 |
(144) 0x6f9b JE 700c |
(144) 0x6f9d LEA -0x1(%R12),%RCX |
(144) 0x6fa2 LEA (%R10,%R13,8),%R14 |
(144) 0x6fa6 MOV %R13,-0x38(%RBP) |
(144) 0x6faa LEA (%RBX,%R13,8),%R15 |
(144) 0x6fae VXORPD %XMM0,%XMM0,%XMM0 |
(144) 0x6fb2 XOR %ESI,%ESI |
(144) 0x6fb4 NOPW %CS:(%RAX,%RAX,1) |
(146) 0x6fc0 MOV (%R15,%RSI,8),%RDX |
(146) 0x6fc4 MOV 0x8(%R15,%RSI,8),%R13 |
(146) 0x6fc9 VMOVSD (%R11,%RDX,8),%XMM1 |
(146) 0x6fcf VMOVHPD (%R11,%R13,8),%XMM1,%XMM1 |
(146) 0x6fd5 VFNMADD231PD (%R14,%RSI,8),%XMM1,%XMM0 |
(146) 0x6fdb ADD $0x2,%RSI |
(146) 0x6fdf CMP %RCX,%RSI |
(146) 0x6fe2 JBE 6fc0 |
(144) 0x6fe4 VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(144) 0x6fe9 VADDSD %XMM1,%XMM0,%XMM0 |
(144) 0x6fed CMP %R12,%RAX |
(144) 0x6ff0 MOV -0x50(%RBP),%R14 |
(144) 0x6ff4 MOV -0x30(%RBP),%R15 |
(144) 0x6ff8 MOV -0x48(%RBP),%RDX |
(144) 0x6ffc MOV -0x40(%RBP),%RSI |
(144) 0x7000 MOV -0x38(%RBP),%R13 |
(144) 0x7004 JE 6f50 |
(144) 0x700a JMP 700f |
(144) 0x700c XOR %R12D,%R12D |
(144) 0x700f ADD %R13,%R12 |
(144) 0x7012 NOPW %CS:(%RAX,%RAX,1) |
(145) 0x7020 MOV (%RBX,%R12,8),%RAX |
(145) 0x7024 VMOVSD (%R11,%RAX,8),%XMM1 |
(145) 0x702a VFNMADD231SD (%R10,%R12,8),%XMM1,%XMM0 |
(145) 0x7030 INC %R12 |
(145) 0x7033 CMP %R12,%R9 |
(145) 0x7036 JNE 7020 |
(144) 0x7038 JMP 6f50 |
0x703d VUCOMISD 0x3b2b(%RIP),%XMM4 |
0x7045 JNE 73cd |
0x704b VUCOMISD 0x3b1d(%RIP),%XMM0 |
0x7053 JNE 74fc |
0x7059 CMP %R15,%R14 |
0x705c JGE 7adc |
0x7062 MOV -0x30(%RBP),%RAX |
0x7066 MOV (%RAX),%RDI |
0x7069 MOV (%RSI),%RSI |
0x706c MOV %R14,%RAX |
0x706f NOT %RAX |
0x7072 ADD %RAX,%R15 |
0x7075 XOR %R8D,%R8D |
0x7078 MOV %R15,-0x30(%RBP) |
0x707c MOV %RDI,-0x48(%RBP) |
0x7080 MOV %RSI,-0x40(%RBP) |
0x7084 JMP 70a6 |
0x7086 NOPW %CS:(%RAX,%RAX,1) |
(129) 0x7090 VMOVSD %XMM0,(%RSI,%R9,8) |
(129) 0x7096 LEA 0x1(%R8),%RAX |
(129) 0x709a CMP %R15,%R8 |
(129) 0x709d MOV %RAX,%R8 |
(129) 0x70a0 JE 7adc |
(129) 0x70a6 LEA (%R14,%R8,1),%R9 |
(129) 0x70aa VMOVSD (%RDX,%R9,8),%XMM0 |
(129) 0x70b0 MOV (%RDI,%R9,8),%RCX |
(129) 0x70b4 MOV 0x8(%RDI,%R9,8),%R10 |
(129) 0x70b9 MOV %R10,%RAX |
(129) 0x70bc SUB %RCX,%RAX |
(129) 0x70bf JLE 7090 |
(129) 0x70c1 MOV %RCX,-0x38(%RBP) |
(129) 0x70c5 MOV -0x58(%RBP),%RCX |
(129) 0x70c9 MOV (%RCX),%R11 |
(129) 0x70cc MOV 0x20(%RBP),%RCX |
(129) 0x70d0 MOV (%RCX),%RBX |
(129) 0x70d3 MOV 0x10(%RBP),%RCX |
(129) 0x70d7 MOV (%RCX),%R12 |
(129) 0x70da MOV %RAX,%R13 |
(129) 0x70dd AND $-0x2,%R13 |
(129) 0x70e1 JE 714e |
(129) 0x70e3 LEA -0x1(%R13),%RCX |
(129) 0x70e7 MOV -0x38(%RBP),%RDX |
(129) 0x70eb LEA (%R11,%RDX,8),%RSI |
(129) 0x70ef LEA (%R12,%RDX,8),%R14 |
(129) 0x70f3 VXORPD %XMM1,%XMM1,%XMM1 |
(129) 0x70f7 XOR %R15D,%R15D |
(129) 0x70fa NOPW (%RAX,%RAX,1) |
(131) 0x7100 MOV (%R14,%R15,8),%RDI |
(131) 0x7104 MOV 0x8(%R14,%R15,8),%RDX |
(131) 0x7109 VMOVSD (%RBX,%RDI,8),%XMM2 |
(131) 0x710e VMOVHPD (%RBX,%RDX,8),%XMM2,%XMM2 |
(131) 0x7113 VFMADD231PD (%RSI,%R15,8),%XMM2,%XMM1 |
(131) 0x7119 ADD $0x2,%R15 |
(131) 0x711d CMP %RCX,%R15 |
(131) 0x7120 JBE 7100 |
(129) 0x7122 VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(129) 0x7127 VADDSD %XMM2,%XMM1,%XMM1 |
(129) 0x712b VADDSD %XMM1,%XMM0,%XMM0 |
(129) 0x712f CMP %R13,%RAX |
(129) 0x7132 MOV -0x50(%RBP),%R14 |
(129) 0x7136 MOV -0x30(%RBP),%R15 |
(129) 0x713a MOV 0x28(%RBP),%RDX |
(129) 0x713e MOV -0x48(%RBP),%RDI |
(129) 0x7142 MOV -0x40(%RBP),%RSI |
(129) 0x7146 JE 7090 |
(129) 0x714c JMP 7151 |
(129) 0x714e XOR %R13D,%R13D |
(129) 0x7151 ADD -0x38(%RBP),%R13 |
(129) 0x7155 NOPW %CS:(%RAX,%RAX,1) |
(130) 0x7160 MOV (%R12,%R13,8),%RAX |
(130) 0x7164 VMOVSD (%RBX,%RAX,8),%XMM1 |
(130) 0x7169 VFMADD231SD (%R11,%R13,8),%XMM1,%XMM0 |
(130) 0x716f INC %R13 |
(130) 0x7172 CMP %R13,%R10 |
(130) 0x7175 JNE 7160 |
(129) 0x7177 JMP 7090 |
0x717c VUCOMISD 0x39f4(%RIP),%XMM0 |
0x7184 JNE 762c |
0x718a CMP %R15,%R14 |
0x718d JGE 7adc |
0x7193 MOV -0x30(%RBP),%RAX |
0x7197 MOV (%RAX),%RDI |
0x719a MOV (%RSI),%RSI |
0x719d MOV %R14,%RAX |
0x71a0 NOT %RAX |
0x71a3 ADD %RAX,%R15 |
0x71a6 XOR %R8D,%R8D |
0x71a9 MOV %R15,-0x30(%RBP) |
0x71ad MOV %RDI,-0x48(%RBP) |
0x71b1 MOV %RSI,-0x40(%RBP) |
0x71b5 JMP 71d6 |
0x71b7 NOPW (%RAX,%RAX,1) |
(135) 0x71c0 VMOVSD %XMM0,(%RSI,%R9,8) |
(135) 0x71c6 LEA 0x1(%R8),%RAX |
(135) 0x71ca CMP %R15,%R8 |
(135) 0x71cd MOV %RAX,%R8 |
(135) 0x71d0 JE 7adc |
(135) 0x71d6 LEA (%R14,%R8,1),%R9 |
(135) 0x71da VMOVSD (%RDX,%R9,8),%XMM0 |
(135) 0x71e0 MOV (%RDI,%R9,8),%RCX |
(135) 0x71e4 MOV 0x8(%RDI,%R9,8),%R10 |
(135) 0x71e9 MOV %R10,%RAX |
(135) 0x71ec SUB %RCX,%RAX |
(135) 0x71ef JLE 71c0 |
(135) 0x71f1 MOV %RCX,-0x38(%RBP) |
(135) 0x71f5 MOV -0x58(%RBP),%RCX |
(135) 0x71f9 MOV (%RCX),%R11 |
(135) 0x71fc MOV 0x20(%RBP),%RCX |
(135) 0x7200 MOV (%RCX),%RBX |
(135) 0x7203 MOV 0x10(%RBP),%RCX |
(135) 0x7207 MOV (%RCX),%R12 |
(135) 0x720a MOV %RAX,%R13 |
(135) 0x720d AND $-0x2,%R13 |
(135) 0x7211 JE 727e |
(135) 0x7213 LEA -0x1(%R13),%RCX |
(135) 0x7217 MOV -0x38(%RBP),%RDX |
(135) 0x721b LEA (%R11,%RDX,8),%RSI |
(135) 0x721f LEA (%R12,%RDX,8),%R14 |
(135) 0x7223 VXORPD %XMM1,%XMM1,%XMM1 |
(135) 0x7227 XOR %R15D,%R15D |
(135) 0x722a NOPW (%RAX,%RAX,1) |
(137) 0x7230 MOV (%R14,%R15,8),%RDI |
(137) 0x7234 MOV 0x8(%R14,%R15,8),%RDX |
(137) 0x7239 VMOVSD (%RBX,%RDI,8),%XMM2 |
(137) 0x723e VMOVHPD (%RBX,%RDX,8),%XMM2,%XMM2 |
(137) 0x7243 VFNMADD231PD (%RSI,%R15,8),%XMM2,%XMM1 |
(137) 0x7249 ADD $0x2,%R15 |
(137) 0x724d CMP %RCX,%R15 |
(137) 0x7250 JBE 7230 |
(135) 0x7252 VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(135) 0x7257 VADDSD %XMM2,%XMM1,%XMM1 |
(135) 0x725b VADDSD %XMM1,%XMM0,%XMM0 |
(135) 0x725f CMP %R13,%RAX |
(135) 0x7262 MOV -0x50(%RBP),%R14 |
(135) 0x7266 MOV -0x30(%RBP),%R15 |
(135) 0x726a MOV 0x28(%RBP),%RDX |
(135) 0x726e MOV -0x48(%RBP),%RDI |
(135) 0x7272 MOV -0x40(%RBP),%RSI |
(135) 0x7276 JE 71c0 |
(135) 0x727c JMP 7281 |
(135) 0x727e XOR %R13D,%R13D |
(135) 0x7281 ADD -0x38(%RBP),%R13 |
(135) 0x7285 NOPW %CS:(%RAX,%RAX,1) |
(136) 0x7290 MOV (%R12,%R13,8),%RAX |
(136) 0x7294 VMOVSD (%RBX,%RAX,8),%XMM1 |
(136) 0x7299 VFNMADD231SD (%R11,%R13,8),%XMM1,%XMM0 |
(136) 0x729f INC %R13 |
(136) 0x72a2 CMP %R13,%R10 |
(136) 0x72a5 JNE 7290 |
(135) 0x72a7 JMP 71c0 |
0x72ac CMP %R15,%R14 |
0x72af JGE 7adc |
0x72b5 MOV -0x30(%RBP),%RAX |
0x72b9 MOV (%RAX),%RDX |
0x72bc MOV (%RSI),%RSI |
0x72bf MOV %R14,%RAX |
0x72c2 NOT %RAX |
0x72c5 ADD %RAX,%R15 |
0x72c8 XOR %EDI,%EDI |
0x72ca MOV %R15,-0x30(%RBP) |
0x72ce MOV %RDX,-0x48(%RBP) |
0x72d2 MOV %RSI,-0x40(%RBP) |
0x72d6 JMP 72fa |
0x72d8 NOPL (%RAX,%RAX,1) |
(141) 0x72e0 VMULSD %XMM0,%XMM1,%XMM1 |
(141) 0x72e4 VMOVSD %XMM1,(%RSI,%R8,8) |
(141) 0x72ea LEA 0x1(%RDI),%RAX |
(141) 0x72ee CMP %R15,%RDI |
(141) 0x72f1 MOV %RAX,%RDI |
(141) 0x72f4 JE 7adc |
(141) 0x72fa LEA (%R14,%RDI,1),%R8 |
(141) 0x72fe MOV (%RDX,%R8,8),%R13 |
(141) 0x7302 MOV 0x8(%RDX,%R8,8),%R9 |
(141) 0x7307 VXORPD %XMM1,%XMM1,%XMM1 |
(141) 0x730b MOV %R9,%RAX |
(141) 0x730e SUB %R13,%RAX |
(141) 0x7311 JLE 72e0 |
(141) 0x7313 MOV -0x58(%RBP),%RCX |
(141) 0x7317 MOV (%RCX),%R10 |
(141) 0x731a MOV 0x20(%RBP),%RCX |
(141) 0x731e MOV (%RCX),%R11 |
(141) 0x7321 MOV 0x10(%RBP),%RCX |
(141) 0x7325 MOV (%RCX),%RBX |
(141) 0x7328 MOV %RAX,%R12 |
(141) 0x732b AND $-0x2,%R12 |
(141) 0x732f JE 739c |
(141) 0x7331 LEA -0x1(%R12),%RCX |
(141) 0x7336 LEA (%R10,%R13,8),%R14 |
(141) 0x733a MOV %R13,-0x38(%RBP) |
(141) 0x733e LEA (%RBX,%R13,8),%R15 |
(141) 0x7342 VXORPD %XMM1,%XMM1,%XMM1 |
(141) 0x7346 XOR %ESI,%ESI |
(141) 0x7348 NOPL (%RAX,%RAX,1) |
(143) 0x7350 MOV (%R15,%RSI,8),%RDX |
(143) 0x7354 MOV 0x8(%R15,%RSI,8),%R13 |
(143) 0x7359 VMOVSD (%R11,%RDX,8),%XMM2 |
(143) 0x735f VMOVHPD (%R11,%R13,8),%XMM2,%XMM2 |
(143) 0x7365 VFMADD231PD (%R14,%RSI,8),%XMM2,%XMM1 |
(143) 0x736b ADD $0x2,%RSI |
(143) 0x736f CMP %RCX,%RSI |
(143) 0x7372 JBE 7350 |
(141) 0x7374 VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(141) 0x7379 VADDSD %XMM2,%XMM1,%XMM1 |
(141) 0x737d CMP %R12,%RAX |
(141) 0x7380 MOV -0x50(%RBP),%R14 |
(141) 0x7384 MOV -0x30(%RBP),%R15 |
(141) 0x7388 MOV -0x48(%RBP),%RDX |
(141) 0x738c MOV -0x40(%RBP),%RSI |
(141) 0x7390 MOV -0x38(%RBP),%R13 |
(141) 0x7394 JE 72e0 |
(141) 0x739a JMP 739f |
(141) 0x739c XOR %R12D,%R12D |
(141) 0x739f ADD %R13,%R12 |
(141) 0x73a2 NOPW %CS:(%RAX,%RAX,1) |
(142) 0x73b0 MOV (%RBX,%R12,8),%RAX |
(142) 0x73b4 VMOVSD (%R11,%RAX,8),%XMM2 |
(142) 0x73ba VFMADD231SD (%R10,%R12,8),%XMM2,%XMM1 |
(142) 0x73c0 INC %R12 |
(142) 0x73c3 CMP %R12,%R9 |
(142) 0x73c6 JNE 73b0 |
(141) 0x73c8 JMP 72e0 |
0x73cd VUCOMISD 0x379b(%RIP),%XMM0 |
0x73d5 JNE 776c |
0x73db CMP %R15,%R14 |
0x73de JGE 7adc |
0x73e4 MOV -0x30(%RBP),%RAX |
0x73e8 MOV (%RAX),%RDI |
0x73eb MOV (%RSI),%RSI |
0x73ee MOV %R14,%RAX |
0x73f1 NOT %RAX |
0x73f4 ADD %RAX,%R15 |
0x73f7 XOR %R8D,%R8D |
0x73fa MOV %R15,-0x30(%RBP) |
0x73fe MOV %RDI,-0x48(%RBP) |
0x7402 MOV %RSI,-0x40(%RBP) |
0x7406 JMP 7426 |
0x7408 NOPL (%RAX,%RAX,1) |
(120) 0x7410 VMOVSD %XMM0,(%RSI,%R9,8) |
(120) 0x7416 LEA 0x1(%R8),%RAX |
(120) 0x741a CMP %R15,%R8 |
(120) 0x741d MOV %RAX,%R8 |
(120) 0x7420 JE 7adc |
(120) 0x7426 LEA (%R14,%R8,1),%R9 |
(120) 0x742a VMULSD (%RDX,%R9,8),%XMM4,%XMM0 |
(120) 0x7430 MOV (%RDI,%R9,8),%RCX |
(120) 0x7434 MOV 0x8(%RDI,%R9,8),%R10 |
(120) 0x7439 MOV %R10,%RAX |
(120) 0x743c SUB %RCX,%RAX |
(120) 0x743f JLE 7410 |
(120) 0x7441 MOV %RCX,-0x38(%RBP) |
(120) 0x7445 MOV -0x58(%RBP),%RCX |
(120) 0x7449 MOV (%RCX),%R11 |
(120) 0x744c MOV 0x20(%RBP),%RCX |
(120) 0x7450 MOV (%RCX),%RBX |
(120) 0x7453 MOV 0x10(%RBP),%RCX |
(120) 0x7457 MOV (%RCX),%R12 |
(120) 0x745a MOV %RAX,%R13 |
(120) 0x745d AND $-0x2,%R13 |
(120) 0x7461 JE 74ce |
(120) 0x7463 LEA -0x1(%R13),%RCX |
(120) 0x7467 MOV -0x38(%RBP),%RDX |
(120) 0x746b LEA (%R11,%RDX,8),%RSI |
(120) 0x746f LEA (%R12,%RDX,8),%R14 |
(120) 0x7473 VXORPD %XMM1,%XMM1,%XMM1 |
(120) 0x7477 XOR %R15D,%R15D |
(120) 0x747a NOPW (%RAX,%RAX,1) |
(122) 0x7480 MOV (%R14,%R15,8),%RDI |
(122) 0x7484 MOV 0x8(%R14,%R15,8),%RDX |
(122) 0x7489 VMOVSD (%RBX,%RDI,8),%XMM2 |
(122) 0x748e VMOVHPD (%RBX,%RDX,8),%XMM2,%XMM2 |
(122) 0x7493 VFMADD231PD (%RSI,%R15,8),%XMM2,%XMM1 |
(122) 0x7499 ADD $0x2,%R15 |
(122) 0x749d CMP %RCX,%R15 |
(122) 0x74a0 JBE 7480 |
(120) 0x74a2 VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(120) 0x74a7 VADDSD %XMM2,%XMM1,%XMM1 |
(120) 0x74ab VADDSD %XMM1,%XMM0,%XMM0 |
(120) 0x74af CMP %R13,%RAX |
(120) 0x74b2 MOV -0x50(%RBP),%R14 |
(120) 0x74b6 MOV -0x30(%RBP),%R15 |
(120) 0x74ba MOV 0x28(%RBP),%RDX |
(120) 0x74be MOV -0x48(%RBP),%RDI |
(120) 0x74c2 MOV -0x40(%RBP),%RSI |
(120) 0x74c6 JE 7410 |
(120) 0x74cc JMP 74d1 |
(120) 0x74ce XOR %R13D,%R13D |
(120) 0x74d1 ADD -0x38(%RBP),%R13 |
(120) 0x74d5 NOPW %CS:(%RAX,%RAX,1) |
(121) 0x74e0 MOV (%R12,%R13,8),%RAX |
(121) 0x74e4 VMOVSD (%RBX,%RAX,8),%XMM1 |
(121) 0x74e9 VFMADD231SD (%R11,%R13,8),%XMM1,%XMM0 |
(121) 0x74ef INC %R13 |
(121) 0x74f2 CMP %R13,%R10 |
(121) 0x74f5 JNE 74e0 |
(120) 0x74f7 JMP 7410 |
0x74fc VUCOMISD 0x3674(%RIP),%XMM0 |
0x7504 JNE 789c |
0x750a CMP %R15,%R14 |
0x750d JGE 7adc |
0x7513 MOV -0x30(%RBP),%RAX |
0x7517 MOV (%RAX),%RDI |
0x751a MOV (%RSI),%RSI |
0x751d MOV %R14,%RAX |
0x7520 NOT %RAX |
0x7523 ADD %RAX,%R15 |
0x7526 XOR %R8D,%R8D |
0x7529 VMOVDDUP 0x364f(%RIP),%XMM0 |
0x7531 MOV %R15,-0x30(%RBP) |
0x7535 MOV %RDI,-0x48(%RBP) |
0x7539 MOV %RSI,-0x40(%RBP) |
0x753d JMP 7556 |
0x753f NOP |
(126) 0x7540 VMOVSD %XMM1,(%RSI,%R9,8) |
(126) 0x7546 LEA 0x1(%R8),%RAX |
(126) 0x754a CMP %R15,%R8 |
(126) 0x754d MOV %RAX,%R8 |
(126) 0x7550 JE 7adc |
(126) 0x7556 LEA (%R14,%R8,1),%R9 |
(126) 0x755a VMOVSD (%RDX,%R9,8),%XMM1 |
(126) 0x7560 VXORPD %XMM0,%XMM1,%XMM1 |
(126) 0x7564 MOV (%RDI,%R9,8),%RCX |
(126) 0x7568 MOV 0x8(%RDI,%R9,8),%R10 |
(126) 0x756d MOV %R10,%RAX |
(126) 0x7570 SUB %RCX,%RAX |
(126) 0x7573 JLE 7540 |
(126) 0x7575 MOV %RCX,-0x38(%RBP) |
(126) 0x7579 MOV -0x58(%RBP),%RCX |
(126) 0x757d MOV (%RCX),%R11 |
(126) 0x7580 MOV 0x20(%RBP),%RCX |
(126) 0x7584 MOV (%RCX),%RBX |
(126) 0x7587 MOV 0x10(%RBP),%RCX |
(126) 0x758b MOV (%RCX),%R12 |
(126) 0x758e MOV %RAX,%R13 |
(126) 0x7591 AND $-0x2,%R13 |
(126) 0x7595 JE 75fe |
(126) 0x7597 LEA -0x1(%R13),%RCX |
(126) 0x759b MOV -0x38(%RBP),%RDX |
(126) 0x759f LEA (%R11,%RDX,8),%RSI |
(126) 0x75a3 LEA (%R12,%RDX,8),%R14 |
(126) 0x75a7 VXORPD %XMM2,%XMM2,%XMM2 |
(126) 0x75ab XOR %R15D,%R15D |
(126) 0x75ae XCHG %AX,%AX |
(128) 0x75b0 MOV (%R14,%R15,8),%RDI |
(128) 0x75b4 MOV 0x8(%R14,%R15,8),%RDX |
(128) 0x75b9 VMOVSD (%RBX,%RDI,8),%XMM3 |
(128) 0x75be VMOVHPD (%RBX,%RDX,8),%XMM3,%XMM3 |
(128) 0x75c3 VFNMADD231PD (%RSI,%R15,8),%XMM3,%XMM2 |
(128) 0x75c9 ADD $0x2,%R15 |
(128) 0x75cd CMP %RCX,%R15 |
(128) 0x75d0 JBE 75b0 |
(126) 0x75d2 VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(126) 0x75d7 VADDSD %XMM3,%XMM2,%XMM2 |
(126) 0x75db VADDSD %XMM2,%XMM1,%XMM1 |
(126) 0x75df CMP %R13,%RAX |
(126) 0x75e2 MOV -0x50(%RBP),%R14 |
(126) 0x75e6 MOV -0x30(%RBP),%R15 |
(126) 0x75ea MOV 0x28(%RBP),%RDX |
(126) 0x75ee MOV -0x48(%RBP),%RDI |
(126) 0x75f2 MOV -0x40(%RBP),%RSI |
(126) 0x75f6 JE 7540 |
(126) 0x75fc JMP 7601 |
(126) 0x75fe XOR %R13D,%R13D |
(126) 0x7601 ADD -0x38(%RBP),%R13 |
(126) 0x7605 NOPW %CS:(%RAX,%RAX,1) |
(127) 0x7610 MOV (%R12,%R13,8),%RAX |
(127) 0x7614 VMOVSD (%RBX,%RAX,8),%XMM2 |
(127) 0x7619 VFNMADD231SD (%R11,%R13,8),%XMM2,%XMM1 |
(127) 0x761f INC %R13 |
(127) 0x7622 CMP %R13,%R10 |
(127) 0x7625 JNE 7610 |
(126) 0x7627 JMP 7540 |
0x762c CMP %R15,%R14 |
0x762f JGE 7adc |
0x7635 MOV -0x30(%RBP),%RAX |
0x7639 MOV (%RAX),%RDI |
0x763c MOV (%RSI),%RSI |
0x763f MOV %R14,%RAX |
0x7642 NOT %RAX |
0x7645 ADD %RAX,%R15 |
0x7648 XOR %R8D,%R8D |
0x764b VMOVDDUP 0x352d(%RIP),%XMM1 |
0x7653 MOV %R15,-0x30(%RBP) |
0x7657 MOV %RDI,-0x48(%RBP) |
0x765b MOV %RSI,-0x40(%RBP) |
0x765f JMP 768a |
0x7661 NOPW %CS:(%RAX,%RAX,1) |
(132) 0x7670 VMULSD %XMM0,%XMM2,%XMM2 |
(132) 0x7674 VMOVSD %XMM2,(%RSI,%R9,8) |
(132) 0x767a LEA 0x1(%R8),%RAX |
(132) 0x767e CMP %R15,%R8 |
(132) 0x7681 MOV %RAX,%R8 |
(132) 0x7684 JE 7adc |
(132) 0x768a LEA (%R14,%R8,1),%R9 |
(132) 0x768e VMOVSD (%RDX,%R9,8),%XMM2 |
(132) 0x7694 VXORPD %XMM1,%XMM2,%XMM2 |
(132) 0x7698 MOV (%RDI,%R9,8),%RCX |
(132) 0x769c MOV 0x8(%RDI,%R9,8),%R10 |
(132) 0x76a1 MOV %R10,%RAX |
(132) 0x76a4 SUB %RCX,%RAX |
(132) 0x76a7 JLE 7670 |
(132) 0x76a9 MOV %RCX,-0x38(%RBP) |
(132) 0x76ad MOV -0x58(%RBP),%RCX |
(132) 0x76b1 MOV (%RCX),%R11 |
(132) 0x76b4 MOV 0x20(%RBP),%RCX |
(132) 0x76b8 MOV (%RCX),%RBX |
(132) 0x76bb MOV 0x10(%RBP),%RCX |
(132) 0x76bf MOV (%RCX),%R12 |
(132) 0x76c2 MOV %RAX,%R13 |
(132) 0x76c5 AND $-0x2,%R13 |
(132) 0x76c9 JE 773e |
(132) 0x76cb LEA -0x1(%R13),%RCX |
(132) 0x76cf MOV -0x38(%RBP),%RDX |
(132) 0x76d3 LEA (%R11,%RDX,8),%RSI |
(132) 0x76d7 LEA (%R12,%RDX,8),%R14 |
(132) 0x76db VXORPD %XMM3,%XMM3,%XMM3 |
(132) 0x76df XOR %R15D,%R15D |
(132) 0x76e2 NOPW %CS:(%RAX,%RAX,1) |
(134) 0x76f0 MOV (%R14,%R15,8),%RDI |
(134) 0x76f4 MOV 0x8(%R14,%R15,8),%RDX |
(134) 0x76f9 VMOVSD (%RBX,%RDI,8),%XMM4 |
(134) 0x76fe VMOVHPD (%RBX,%RDX,8),%XMM4,%XMM4 |
(134) 0x7703 VFMADD231PD (%RSI,%R15,8),%XMM4,%XMM3 |
(134) 0x7709 ADD $0x2,%R15 |
(134) 0x770d CMP %RCX,%R15 |
(134) 0x7710 JBE 76f0 |
(132) 0x7712 VSHUFPD $0x1,%XMM3,%XMM3,%XMM4 |
(132) 0x7717 VADDSD %XMM4,%XMM3,%XMM3 |
(132) 0x771b VADDSD %XMM3,%XMM2,%XMM2 |
(132) 0x771f CMP %R13,%RAX |
(132) 0x7722 MOV -0x50(%RBP),%R14 |
(132) 0x7726 MOV -0x30(%RBP),%R15 |
(132) 0x772a MOV 0x28(%RBP),%RDX |
(132) 0x772e MOV -0x48(%RBP),%RDI |
(132) 0x7732 MOV -0x40(%RBP),%RSI |
(132) 0x7736 JE 7670 |
(132) 0x773c JMP 7741 |
(132) 0x773e XOR %R13D,%R13D |
(132) 0x7741 ADD -0x38(%RBP),%R13 |
(132) 0x7745 NOPW %CS:(%RAX,%RAX,1) |
(133) 0x7750 MOV (%R12,%R13,8),%RAX |
(133) 0x7754 VMOVSD (%RBX,%RAX,8),%XMM3 |
(133) 0x7759 VFMADD231SD (%R11,%R13,8),%XMM3,%XMM2 |
(133) 0x775f INC %R13 |
(133) 0x7762 CMP %R13,%R10 |
(133) 0x7765 JNE 7750 |
(132) 0x7767 JMP 7670 |
0x776c VUCOMISD 0x3404(%RIP),%XMM0 |
0x7774 JNE 79bc |
0x777a CMP %R15,%R14 |
0x777d JGE 7adc |
0x7783 VXORPD 0x3415(%RIP),%XMM4,%XMM0 |
0x778b MOV -0x30(%RBP),%RAX |
0x778f MOV (%RAX),%RDI |
0x7792 MOV (%RSI),%RSI |
0x7795 MOV %R14,%RAX |
0x7798 NOT %RAX |
0x779b ADD %RAX,%R15 |
0x779e XOR %R8D,%R8D |
0x77a1 MOV %R15,-0x30(%RBP) |
0x77a5 MOV %RDI,-0x48(%RBP) |
0x77a9 MOV %RSI,-0x40(%RBP) |
0x77ad JMP 77c5 |
(117) 0x77af VMOVSD %XMM1,(%RSI,%R9,8) |
(117) 0x77b5 LEA 0x1(%R8),%RAX |
(117) 0x77b9 CMP %R15,%R8 |
(117) 0x77bc MOV %RAX,%R8 |
(117) 0x77bf JE 7adc |
(117) 0x77c5 LEA (%R14,%R8,1),%R9 |
(117) 0x77c9 VMULSD (%RDX,%R9,8),%XMM0,%XMM1 |
(117) 0x77cf MOV (%RDI,%R9,8),%RCX |
(117) 0x77d3 MOV 0x8(%RDI,%R9,8),%R10 |
(117) 0x77d8 MOV %R10,%RAX |
(117) 0x77db SUB %RCX,%RAX |
(117) 0x77de JLE 77af |
(117) 0x77e0 MOV %RCX,-0x38(%RBP) |
(117) 0x77e4 MOV -0x58(%RBP),%RCX |
(117) 0x77e8 MOV (%RCX),%R11 |
(117) 0x77eb MOV 0x20(%RBP),%RCX |
(117) 0x77ef MOV (%RCX),%RBX |
(117) 0x77f2 MOV 0x10(%RBP),%RCX |
(117) 0x77f6 MOV (%RCX),%R12 |
(117) 0x77f9 MOV %RAX,%R13 |
(117) 0x77fc AND $-0x2,%R13 |
(117) 0x7800 JE 786e |
(117) 0x7802 LEA -0x1(%R13),%RDX |
(117) 0x7806 MOV -0x38(%RBP),%RSI |
(117) 0x780a LEA (%R11,%RSI,8),%RCX |
(117) 0x780e LEA (%R12,%RSI,8),%R14 |
(117) 0x7812 VXORPD %XMM2,%XMM2,%XMM2 |
(117) 0x7816 XOR %R15D,%R15D |
(117) 0x7819 NOPL (%RAX) |
(119) 0x7820 MOV (%R14,%R15,8),%RDI |
(119) 0x7824 MOV 0x8(%R14,%R15,8),%RSI |
(119) 0x7829 VMOVSD (%RBX,%RDI,8),%XMM3 |
(119) 0x782e VMOVHPD (%RBX,%RSI,8),%XMM3,%XMM3 |
(119) 0x7833 VFNMADD231PD (%RCX,%R15,8),%XMM3,%XMM2 |
(119) 0x7839 ADD $0x2,%R15 |
(119) 0x783d CMP %RDX,%R15 |
(119) 0x7840 JBE 7820 |
(117) 0x7842 VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(117) 0x7847 VADDSD %XMM3,%XMM2,%XMM2 |
(117) 0x784b VADDSD %XMM2,%XMM1,%XMM1 |
(117) 0x784f CMP %R13,%RAX |
(117) 0x7852 MOV -0x50(%RBP),%R14 |
(117) 0x7856 MOV -0x30(%RBP),%R15 |
(117) 0x785a MOV 0x28(%RBP),%RDX |
(117) 0x785e MOV -0x48(%RBP),%RDI |
(117) 0x7862 MOV -0x40(%RBP),%RSI |
(117) 0x7866 JE 77af |
(117) 0x786c JMP 7871 |
(117) 0x786e XOR %R13D,%R13D |
(117) 0x7871 ADD -0x38(%RBP),%R13 |
(117) 0x7875 NOPW %CS:(%RAX,%RAX,1) |
(118) 0x7880 MOV (%R12,%R13,8),%RAX |
(118) 0x7884 VMOVSD (%RBX,%RAX,8),%XMM2 |
(118) 0x7889 VFNMADD231SD (%R11,%R13,8),%XMM2,%XMM1 |
(118) 0x788f INC %R13 |
(118) 0x7892 CMP %R13,%R10 |
(118) 0x7895 JNE 7880 |
(117) 0x7897 JMP 77af |
0x789c CMP %R15,%R14 |
0x789f JGE 7adc |
0x78a5 MOV -0x30(%RBP),%RAX |
0x78a9 MOV (%RAX),%RDI |
0x78ac MOV (%RSI),%RSI |
0x78af MOV %R14,%RAX |
0x78b2 NOT %RAX |
0x78b5 ADD %RAX,%R15 |
0x78b8 XOR %R8D,%R8D |
0x78bb MOV %R15,-0x30(%RBP) |
0x78bf MOV %RDI,-0x48(%RBP) |
0x78c3 MOV %RSI,-0x40(%RBP) |
0x78c7 JMP 78e3 |
(123) 0x78c9 VMULSD %XMM0,%XMM1,%XMM1 |
(123) 0x78cd VMOVSD %XMM1,(%RSI,%R9,8) |
(123) 0x78d3 LEA 0x1(%R8),%RAX |
(123) 0x78d7 CMP %R15,%R8 |
(123) 0x78da MOV %RAX,%R8 |
(123) 0x78dd JE 7adc |
(123) 0x78e3 LEA (%R14,%R8,1),%R9 |
(123) 0x78e7 VMOVSD (%RDX,%R9,8),%XMM1 |
(123) 0x78ed MOV (%RDI,%R9,8),%RCX |
(123) 0x78f1 MOV 0x8(%RDI,%R9,8),%R10 |
(123) 0x78f6 MOV %R10,%RAX |
(123) 0x78f9 SUB %RCX,%RAX |
(123) 0x78fc JLE 78c9 |
(123) 0x78fe MOV %RCX,-0x38(%RBP) |
(123) 0x7902 MOV -0x58(%RBP),%RCX |
(123) 0x7906 MOV (%RCX),%R11 |
(123) 0x7909 MOV 0x20(%RBP),%RCX |
(123) 0x790d MOV (%RCX),%RBX |
(123) 0x7910 MOV 0x10(%RBP),%RCX |
(123) 0x7914 MOV (%RCX),%R12 |
(123) 0x7917 MOV %RAX,%R13 |
(123) 0x791a AND $-0x2,%R13 |
(123) 0x791e JE 798e |
(123) 0x7920 LEA -0x1(%R13),%RCX |
(123) 0x7924 MOV -0x38(%RBP),%RDX |
(123) 0x7928 LEA (%R11,%RDX,8),%RSI |
(123) 0x792c LEA (%R12,%RDX,8),%R14 |
(123) 0x7930 VXORPD %XMM2,%XMM2,%XMM2 |
(123) 0x7934 XOR %R15D,%R15D |
(123) 0x7937 NOPW (%RAX,%RAX,1) |
(125) 0x7940 MOV (%R14,%R15,8),%RDI |
(125) 0x7944 MOV 0x8(%R14,%R15,8),%RDX |
(125) 0x7949 VMOVSD (%RBX,%RDI,8),%XMM3 |
(125) 0x794e VMOVHPD (%RBX,%RDX,8),%XMM3,%XMM3 |
(125) 0x7953 VFMADD231PD (%RSI,%R15,8),%XMM3,%XMM2 |
(125) 0x7959 ADD $0x2,%R15 |
(125) 0x795d CMP %RCX,%R15 |
(125) 0x7960 JBE 7940 |
(123) 0x7962 VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(123) 0x7967 VADDSD %XMM3,%XMM2,%XMM2 |
(123) 0x796b VADDSD %XMM2,%XMM1,%XMM1 |
(123) 0x796f CMP %R13,%RAX |
(123) 0x7972 MOV -0x50(%RBP),%R14 |
(123) 0x7976 MOV -0x30(%RBP),%R15 |
(123) 0x797a MOV 0x28(%RBP),%RDX |
(123) 0x797e MOV -0x48(%RBP),%RDI |
(123) 0x7982 MOV -0x40(%RBP),%RSI |
(123) 0x7986 JE 78c9 |
(123) 0x798c JMP 7991 |
(123) 0x798e XOR %R13D,%R13D |
(123) 0x7991 ADD -0x38(%RBP),%R13 |
(123) 0x7995 NOPW %CS:(%RAX,%RAX,1) |
(124) 0x79a0 MOV (%R12,%R13,8),%RAX |
(124) 0x79a4 VMOVSD (%RBX,%RAX,8),%XMM2 |
(124) 0x79a9 VFMADD231SD (%R11,%R13,8),%XMM2,%XMM1 |
(124) 0x79af INC %R13 |
(124) 0x79b2 CMP %R13,%R10 |
(124) 0x79b5 JNE 79a0 |
(123) 0x79b7 JMP 78c9 |
0x79bc CMP %R15,%R14 |
0x79bf JGE 7adc |
0x79c5 MOV -0x30(%RBP),%RAX |
0x79c9 MOV (%RAX),%RDI |
0x79cc MOV (%RSI),%RSI |
0x79cf MOV %R14,%RAX |
0x79d2 NOT %RAX |
0x79d5 ADD %RAX,%R15 |
0x79d8 XOR %R8D,%R8D |
0x79db MOV %R15,-0x30(%RBP) |
0x79df MOV %RDI,-0x48(%RBP) |
0x79e3 MOV %RSI,-0x40(%RBP) |
0x79e7 JMP 7a03 |
(114) 0x79e9 VMULSD %XMM0,%XMM1,%XMM1 |
(114) 0x79ed VMOVSD %XMM1,(%RSI,%R9,8) |
(114) 0x79f3 LEA 0x1(%R8),%RAX |
(114) 0x79f7 CMP %R15,%R8 |
(114) 0x79fa MOV %RAX,%R8 |
(114) 0x79fd JE 7adc |
(114) 0x7a03 LEA (%R14,%R8,1),%R9 |
(114) 0x7a07 VMULSD (%RDX,%R9,8),%XMM4,%XMM1 |
(114) 0x7a0d MOV (%RDI,%R9,8),%RCX |
(114) 0x7a11 MOV 0x8(%RDI,%R9,8),%R10 |
(114) 0x7a16 MOV %R10,%RAX |
(114) 0x7a19 SUB %RCX,%RAX |
(114) 0x7a1c JLE 79e9 |
(114) 0x7a1e MOV %RCX,-0x38(%RBP) |
(114) 0x7a22 MOV -0x58(%RBP),%RCX |
(114) 0x7a26 MOV (%RCX),%R11 |
(114) 0x7a29 MOV 0x20(%RBP),%RCX |
(114) 0x7a2d MOV (%RCX),%RBX |
(114) 0x7a30 MOV 0x10(%RBP),%RCX |
(114) 0x7a34 MOV (%RCX),%R12 |
(114) 0x7a37 MOV %RAX,%R13 |
(114) 0x7a3a AND $-0x2,%R13 |
(114) 0x7a3e JE 7aae |
(114) 0x7a40 LEA -0x1(%R13),%RDX |
(114) 0x7a44 MOV -0x38(%RBP),%RSI |
(114) 0x7a48 LEA (%R11,%RSI,8),%RCX |
(114) 0x7a4c LEA (%R12,%RSI,8),%R14 |
(114) 0x7a50 VXORPD %XMM2,%XMM2,%XMM2 |
(114) 0x7a54 XOR %R15D,%R15D |
(114) 0x7a57 NOPW (%RAX,%RAX,1) |
(116) 0x7a60 MOV (%R14,%R15,8),%RDI |
(116) 0x7a64 MOV 0x8(%R14,%R15,8),%RSI |
(116) 0x7a69 VMOVSD (%RBX,%RDI,8),%XMM3 |
(116) 0x7a6e VMOVHPD (%RBX,%RSI,8),%XMM3,%XMM3 |
(116) 0x7a73 VFMADD231PD (%RCX,%R15,8),%XMM3,%XMM2 |
(116) 0x7a79 ADD $0x2,%R15 |
(116) 0x7a7d CMP %RDX,%R15 |
(116) 0x7a80 JBE 7a60 |
(114) 0x7a82 VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(114) 0x7a87 VADDSD %XMM3,%XMM2,%XMM2 |
(114) 0x7a8b VADDSD %XMM2,%XMM1,%XMM1 |
(114) 0x7a8f CMP %R13,%RAX |
(114) 0x7a92 MOV -0x50(%RBP),%R14 |
(114) 0x7a96 MOV -0x30(%RBP),%R15 |
(114) 0x7a9a MOV 0x28(%RBP),%RDX |
(114) 0x7a9e MOV -0x48(%RBP),%RDI |
(114) 0x7aa2 MOV -0x40(%RBP),%RSI |
(114) 0x7aa6 JE 79e9 |
(114) 0x7aac JMP 7ab1 |
(114) 0x7aae XOR %R13D,%R13D |
(114) 0x7ab1 ADD -0x38(%RBP),%R13 |
(114) 0x7ab5 NOPW %CS:(%RAX,%RAX,1) |
(115) 0x7ac0 MOV (%R12,%R13,8),%RAX |
(115) 0x7ac4 VMOVSD (%RBX,%RAX,8),%XMM2 |
(115) 0x7ac9 VFMADD231SD (%R11,%R13,8),%XMM2,%XMM1 |
(115) 0x7acf INC %R13 |
(115) 0x7ad2 CMP %R13,%R10 |
(115) 0x7ad5 JNE 7ac0 |
(114) 0x7ad7 JMP 79e9 |
0x7adc ADD $0x38,%RSP |
0x7ae0 POP %RBX |
0x7ae1 POP %R12 |
0x7ae3 POP %R13 |
0x7ae5 POP %R14 |
0x7ae7 POP %R15 |
0x7ae9 POP %RBP |
0x7aea RET |
0x7aeb NOPL (%RAX,%RAX,1) |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►100.00+ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Path / |
Source file and lines | csr_matvec.c:243-404 |
Module | libseq_mv.so |
nb instructions | 333 |
nb uops | 369 |
loop length | 1310 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 9 |
micro-operation queue | 61.50 cycles |
front end | 61.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 27.00 | 25.00 | 25.33 | 25.33 | 29.50 | 25.00 | 27.00 | 29.50 | 29.50 | 29.50 | 25.00 | 25.33 |
cycles | 27.00 | 25.80 | 25.33 | 25.33 | 29.50 | 25.00 | 27.00 | 29.50 | 29.50 | 29.50 | 25.00 | 25.33 |
Cycles executing div or sqrt instructions | 32.00 |
FE+BE cycles | 58.87 |
Stall cycles | 0.00 |
Front-end | 61.50 |
Dispatch | 29.50 |
DIV/SQRT | 32.00 |
Overall L1 | 61.50 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 0% |
all | 11% |
load | 6% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
all | 1% |
load | 2% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 2% |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 10% |
all | 13% |
load | 13% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 11% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x38,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 2220 <hypre_GetThreadNum@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x20(%R15),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R15),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 2310 <hypre_NumActiveThreads@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
ADD %R14,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
DEC %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %RCX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE 6b23 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x83> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %RCX | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
TEST %RBX,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 6b2c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x8c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RBX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 6b34 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x94> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x50(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R12,%RCX,8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
IMUL %RBX,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 22d0 <hypre_LowerBound@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
SUB %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SAR $0x3,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RAX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 6b34 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x94> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %ECX | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
TEST %RBX,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JG 6afa <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x5a> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVQ $0,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 2220 <hypre_GetThreadNum@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x20(%R15),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R15),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%R15),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 2310 <hypre_NumActiveThreads@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
ADD %R14,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
DEC %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %RCX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE 6b68 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xc8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %RCX | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
JMP 6b6c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xcc> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %ECX | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV -0x50(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RBX,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 6dad <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x30d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INC %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RBX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 6b9e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R12,%R15,8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
IMUL %RBX,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 22d0 <hypre_LowerBound@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R12,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SAR $0x3,%R15 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 6bda <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x13a> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x208436(%RIP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x4345(%RIP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x42e6(%RIP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 2370 <hypre_fprintf@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x4251(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0xf8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 23b0 <hypre_error_handler@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x18(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 6be8 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x148> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RBX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 6c1f <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x17f> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x2083f1(%RIP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x4300(%RIP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x42b0(%RIP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 2370 <hypre_fprintf@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x420c(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0xf9,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 23b0 <hypre_error_handler@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R15,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 6c2e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x18e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RBX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 6c6a <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1ca> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x2083ab(%RIP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x42ba(%RIP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x428c(%RIP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 2370 <hypre_fprintf@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x41c6(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0xfa,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 23b0 <hypre_error_handler@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVQ %R13,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD %XMM1,%XMM4 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JNE 6dbe <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x31e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x3ee7(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 6f0c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x46c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7adc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x103c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 6cd6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x236> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R15D,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JG 6ba3 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x103> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 6bda <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x13a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV 0x28(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VUCOMISD 0x3dae(%RIP),%XMM4 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 703d <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x59d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x3d98(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 717c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x6dc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7adc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x103c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x3d7b(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 6e36 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x396> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x3c64(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 72ac <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x80c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7adc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x103c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 6f66 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x4c6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x3b2b(%RIP),%XMM4 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 73cd <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x92d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x3b1d(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 74fc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa5c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7adc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x103c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 70a6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x606> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x39f4(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 762c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb8c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7adc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x103c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 71d6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x736> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7adc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x103c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 72fa <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x85a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x379b(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 776c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xccc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7adc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x103c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 7426 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x986> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x3674(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 789c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xdfc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7adc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x103c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x364f(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 7556 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xab6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7adc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x103c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x352d(%RIP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 768a <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xbea> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x3404(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 79bc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xf1c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7adc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x103c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VXORPD 0x3415(%RIP),%XMM4,%XMM0 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 77c5 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd25> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7adc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x103c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 78e3 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xe43> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7adc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x103c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 7a03 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xf63> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD $0x38,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | csr_matvec.c:243-404 |
Module | libseq_mv.so |
nb instructions | 333 |
nb uops | 369 |
loop length | 1310 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 9 |
micro-operation queue | 61.50 cycles |
front end | 61.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 27.00 | 25.00 | 25.33 | 25.33 | 29.50 | 25.00 | 27.00 | 29.50 | 29.50 | 29.50 | 25.00 | 25.33 |
cycles | 27.00 | 25.80 | 25.33 | 25.33 | 29.50 | 25.00 | 27.00 | 29.50 | 29.50 | 29.50 | 25.00 | 25.33 |
Cycles executing div or sqrt instructions | 32.00 |
FE+BE cycles | 58.87 |
Stall cycles | 0.00 |
Front-end | 61.50 |
Dispatch | 29.50 |
DIV/SQRT | 32.00 |
Overall L1 | 61.50 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 0% |
all | 11% |
load | 6% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
all | 1% |
load | 2% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 2% |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 10% |
all | 13% |
load | 13% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 11% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x38,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 2220 <hypre_GetThreadNum@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x20(%R15),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R15),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 2310 <hypre_NumActiveThreads@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
ADD %R14,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
DEC %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %RCX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE 6b23 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x83> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %RCX | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
TEST %RBX,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 6b2c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x8c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RBX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 6b34 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x94> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x50(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R12,%RCX,8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
IMUL %RBX,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 22d0 <hypre_LowerBound@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
SUB %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SAR $0x3,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RAX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 6b34 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x94> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %ECX | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
TEST %RBX,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JG 6afa <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x5a> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVQ $0,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 2220 <hypre_GetThreadNum@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x20(%R15),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R15),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%R15),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 2310 <hypre_NumActiveThreads@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
ADD %R14,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
DEC %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %RCX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE 6b68 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xc8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %RCX | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
JMP 6b6c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xcc> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %ECX | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV -0x50(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RBX,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 6dad <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x30d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INC %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RBX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 6b9e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R12,%R15,8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
IMUL %RBX,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 22d0 <hypre_LowerBound@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R12,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SAR $0x3,%R15 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 6bda <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x13a> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x208436(%RIP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x4345(%RIP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x42e6(%RIP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 2370 <hypre_fprintf@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x4251(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0xf8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 23b0 <hypre_error_handler@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x18(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 6be8 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x148> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RBX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 6c1f <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x17f> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x2083f1(%RIP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x4300(%RIP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x42b0(%RIP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 2370 <hypre_fprintf@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x420c(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0xf9,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 23b0 <hypre_error_handler@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R15,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 6c2e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x18e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RBX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 6c6a <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1ca> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x2083ab(%RIP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x42ba(%RIP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x428c(%RIP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 2370 <hypre_fprintf@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x41c6(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0xfa,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 23b0 <hypre_error_handler@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVQ %R13,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD %XMM1,%XMM4 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JNE 6dbe <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x31e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x3ee7(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 6f0c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x46c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7adc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x103c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 6cd6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x236> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R15D,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JG 6ba3 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x103> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 6bda <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x13a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV 0x28(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VUCOMISD 0x3dae(%RIP),%XMM4 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 703d <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x59d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x3d98(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 717c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x6dc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7adc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x103c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x3d7b(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 6e36 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x396> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x3c64(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 72ac <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x80c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7adc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x103c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 6f66 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x4c6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x3b2b(%RIP),%XMM4 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 73cd <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x92d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x3b1d(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 74fc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa5c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7adc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x103c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 70a6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x606> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x39f4(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 762c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb8c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7adc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x103c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 71d6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x736> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7adc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x103c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 72fa <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x85a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x379b(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 776c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xccc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7adc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x103c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 7426 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x986> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x3674(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 789c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xdfc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7adc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x103c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x364f(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 7556 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xab6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7adc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x103c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x352d(%RIP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 768a <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xbea> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x3404(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 79bc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xf1c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7adc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x103c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VXORPD 0x3415(%RIP),%XMM4,%XMM0 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 77c5 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd25> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7adc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x103c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 78e3 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xe43> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7adc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x103c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 7a03 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xf63> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD $0x38,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_CSRMatrixMatvecOutOfPlace.extracted– | 18.69 | 7.57 |
▼Loop 129 - csr_matvec.c:334-341 - libseq_mv.so– | 1.1 | 0.38 |
○Loop 130 - csr_matvec.c:337-339 - libseq_mv.so | 0.22 | 0.08 |
○Loop 131 - csr_matvec.c:337-339 - libseq_mv.so | 0 | 0 |
▼Loop 135 - csr_matvec.c:307-314 - libseq_mv.so– | 0.33 | 0.11 |
○Loop 137 - csr_matvec.c:310-312 - libseq_mv.so | 8.54 | 2.92 |
○Loop 136 - csr_matvec.c:310-312 - libseq_mv.so | 0.17 | 0.06 |
▼Loop 147 - csr_matvec.c:256-263 - libseq_mv.so– | 0.25 | 0.09 |
○Loop 149 - csr_matvec.c:259-261 - libseq_mv.so | 7.61 | 2.61 |
○Loop 148 - csr_matvec.c:259-261 - libseq_mv.so | 0.16 | 0.06 |
▼Loop 144 - csr_matvec.c:268-275 - libseq_mv.so– | 0 | 0 |
○Loop 146 - csr_matvec.c:271-273 - libseq_mv.so | 0 | 0 |
○Loop 145 - csr_matvec.c:271-273 - libseq_mv.so | 0 | 0 |
▼Loop 132 - csr_matvec.c:319-326 - libseq_mv.so– | 0 | 0 |
○Loop 133 - csr_matvec.c:322-324 - libseq_mv.so | 0 | 0 |
○Loop 134 - csr_matvec.c:322-324 - libseq_mv.so | 0 | 0 |
▼Loop 123 - csr_matvec.c:358-365 - libseq_mv.so– | 0 | 0 |
○Loop 125 - csr_matvec.c:361-363 - libseq_mv.so | 0 | 0 |
○Loop 124 - csr_matvec.c:361-363 - libseq_mv.so | 0 | 0 |
▼Loop 114 - csr_matvec.c:397-404 - libseq_mv.so– | 0 | 0 |
○Loop 115 - csr_matvec.c:400-402 - libseq_mv.so | 0 | 0 |
○Loop 116 - csr_matvec.c:400-402 - libseq_mv.so | 0 | 0 |
▼Loop 138 - csr_matvec.c:295-302 - libseq_mv.so– | 0 | 0 |
○Loop 140 - csr_matvec.c:298-300 - libseq_mv.so | 0 | 0 |
○Loop 139 - csr_matvec.c:298-300 - libseq_mv.so | 0 | 0 |
▼Loop 120 - csr_matvec.c:373-380 - libseq_mv.so– | 0 | 0 |
○Loop 121 - csr_matvec.c:376-378 - libseq_mv.so | 0 | 0 |
○Loop 122 - csr_matvec.c:376-378 - libseq_mv.so | 0 | 0 |
▼Loop 126 - csr_matvec.c:346-353 - libseq_mv.so– | 0 | 0 |
○Loop 128 - csr_matvec.c:349-351 - libseq_mv.so | 0 | 0 |
○Loop 127 - csr_matvec.c:349-351 - libseq_mv.so | 0 | 0 |
▼Loop 141 - csr_matvec.c:280-287 - libseq_mv.so– | 0 | 0 |
○Loop 142 - csr_matvec.c:283-285 - libseq_mv.so | 0 | 0 |
○Loop 143 - csr_matvec.c:283-285 - libseq_mv.so | 0 | 0 |
▼Loop 117 - csr_matvec.c:385-392 - libseq_mv.so– | 0 | 0 |
○Loop 118 - csr_matvec.c:388-390 - libseq_mv.so | 0 | 0 |
○Loop 119 - csr_matvec.c:388-390 - libseq_mv.so | 0 | 0 |