Function: hypre_CSRMatrixMatvecOutOfPlace.extracted | Module: libseq_mv.so | Source: csr_matvec.c:243-404 [...] | Coverage: 17.05% |
---|
Function: hypre_CSRMatrixMatvecOutOfPlace.extracted | Module: libseq_mv.so | Source: csr_matvec.c:243-404 [...] | Coverage: 17.05% |
---|
/scratch_na/users/xoserete/qaas_runs/171-415-3872/intel/AMG/build/AMG/AMG/seq_mv/csr_matvec.c: 243 - 404 |
-------------------------------------------------------------------------------- |
243: #pragma omp parallel private(i,jj,tempx) |
244: #endif |
245: { |
246: HYPRE_Int iBegin = hypre_CSRMatrixGetLoadBalancedPartitionBegin(A); |
247: HYPRE_Int iEnd = hypre_CSRMatrixGetLoadBalancedPartitionEnd(A); |
248: hypre_assert(iBegin <= iEnd); |
249: hypre_assert(iBegin >= 0 && iBegin <= num_rows); |
250: hypre_assert(iEnd >= 0 && iEnd <= num_rows); |
251: |
252: if (0 == temp) |
253: { |
254: if (1 == alpha) // JSP: a common path |
255: { |
256: for (i = iBegin; i < iEnd; i++) |
257: { |
258: tempx = 0.0; |
259: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
260: { |
261: tempx += A_data[jj] * x_data[A_j[jj]]; |
262: } |
263: y_data[i] = tempx; |
264: } |
265: } // y = A*x |
266: else if (-1 == alpha) |
267: { |
268: for (i = iBegin; i < iEnd; i++) |
269: { |
270: tempx = 0.0; |
271: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
272: { |
273: tempx -= A_data[jj] * x_data[A_j[jj]]; |
274: } |
275: y_data[i] = tempx; |
276: } |
277: } // y = -A*x |
278: else |
279: { |
280: for (i = iBegin; i < iEnd; i++) |
281: { |
282: tempx = 0.0; |
283: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
284: { |
285: tempx += A_data[jj] * x_data[A_j[jj]]; |
286: } |
287: y_data[i] = alpha*tempx; |
288: } |
289: } // y = alpha*A*x |
290: } // temp == 0 |
291: else if (-1 == temp) // beta == -alpha |
292: { |
293: if (1 == alpha) // JSP: a common path |
294: { |
295: for (i = iBegin; i < iEnd; i++) |
296: { |
297: tempx = -b_data[i]; |
298: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
299: { |
300: tempx += A_data[jj] * x_data[A_j[jj]]; |
301: } |
302: y_data[i] = tempx; |
303: } |
304: } // y = A*x - y |
305: else if (-1 == alpha) // JSP: a common path |
306: { |
307: for (i = iBegin; i < iEnd; i++) |
308: { |
309: tempx = b_data[i]; |
310: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
311: { |
312: tempx -= A_data[jj] * x_data[A_j[jj]]; |
313: } |
314: y_data[i] = tempx; |
315: } |
316: } // y = -A*x + y |
317: else |
318: { |
319: for (i = iBegin; i < iEnd; i++) |
320: { |
321: tempx = -b_data[i]; |
322: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
323: { |
324: tempx += A_data[jj] * x_data[A_j[jj]]; |
325: } |
326: y_data[i] = alpha*tempx; |
327: } |
328: } // y = alpha*(A*x - y) |
329: } // temp == -1 |
330: else if (1 == temp) |
331: { |
332: if (1 == alpha) // JSP: a common path |
333: { |
334: for (i = iBegin; i < iEnd; i++) |
335: { |
336: tempx = b_data[i]; |
337: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
338: { |
339: tempx += A_data[jj] * x_data[A_j[jj]]; |
340: } |
341: y_data[i] = tempx; |
342: } |
343: } // y = A*x + y |
344: else if (-1 == alpha) |
345: { |
346: for (i = iBegin; i < iEnd; i++) |
347: { |
348: tempx = -b_data[i]; |
349: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
350: { |
351: tempx -= A_data[jj] * x_data[A_j[jj]]; |
352: } |
353: y_data[i] = tempx; |
354: } |
355: } // y = -A*x - y |
356: else |
357: { |
358: for (i = iBegin; i < iEnd; i++) |
359: { |
360: tempx = b_data[i]; |
361: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
362: { |
363: tempx += A_data[jj] * x_data[A_j[jj]]; |
364: } |
365: y_data[i] = alpha*tempx; |
[...] |
371: if (1 == alpha) // JSP: a common path |
372: { |
373: for (i = iBegin; i < iEnd; i++) |
374: { |
375: tempx = b_data[i]*temp; |
376: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
377: { |
378: tempx += A_data[jj] * x_data[A_j[jj]]; |
379: } |
380: y_data[i] = tempx; |
381: } |
382: } // y = A*x + temp*y |
383: else if (-1 == alpha) |
384: { |
385: for (i = iBegin; i < iEnd; i++) |
386: { |
387: tempx = -b_data[i]*temp; |
388: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
389: { |
390: tempx -= A_data[jj] * x_data[A_j[jj]]; |
391: } |
392: y_data[i] = tempx; |
393: } |
394: } // y = -A*x - temp*y |
395: else |
396: { |
397: for (i = iBegin; i < iEnd; i++) |
398: { |
399: tempx = b_data[i]*temp; |
400: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
401: { |
402: tempx += A_data[jj] * x_data[A_j[jj]]; |
403: } |
404: y_data[i] = alpha*tempx; |
/scratch_na/users/xoserete/qaas_runs/171-415-3872/intel/AMG/build/AMG/AMG/seq_mv/csr_matrix.c: 645 - 674 |
-------------------------------------------------------------------------------- |
645: HYPRE_Int num_nonzerosA = hypre_CSRMatrixNumNonzeros(A); |
646: HYPRE_Int num_rowsA = hypre_CSRMatrixNumRows(A); |
647: HYPRE_Int *A_i = hypre_CSRMatrixI(A); |
648: |
649: HYPRE_Int num_threads = hypre_NumActiveThreads(); |
650: |
651: HYPRE_Int nonzeros_per_thread = (num_nonzerosA + num_threads - 1)/num_threads; |
652: |
653: if (idx <= 0) |
654: { |
655: return 0; |
656: } |
657: else if (idx >= num_threads) |
[...] |
663: return (HYPRE_Int)(hypre_LowerBound(A_i, A_i + num_rowsA, nonzeros_per_thread*idx) - A_i); |
[...] |
669: return hypre_CSRMatrixGetLoadBalancedPartitionBoundary(A, hypre_GetThreadNum()); |
670: } |
671: |
672: HYPRE_Int hypre_CSRMatrixGetLoadBalancedPartitionEnd(hypre_CSRMatrix *A) |
673: { |
674: return hypre_CSRMatrixGetLoadBalancedPartitionBoundary(A, hypre_GetThreadNum() + 1); |
0x6d60 PUSH %RBP |
0x6d61 MOV %RSP,%RBP |
0x6d64 PUSH %R15 |
0x6d66 PUSH %R14 |
0x6d68 PUSH %R13 |
0x6d6a PUSH %R12 |
0x6d6c PUSH %RBX |
0x6d6d SUB $0x28,%RSP |
0x6d71 MOV %R9,-0x30(%RBP) |
0x6d75 MOV %R8,-0x48(%RBP) |
0x6d79 MOV %RCX,%R15 |
0x6d7c MOV %RDX,%R13 |
0x6d7f CALL 2220 <hypre_GetThreadNum@plt> |
0x6d84 MOV %RAX,%RBX |
0x6d87 MOV 0x20(%R15),%R14 |
0x6d8b MOV (%R15),%R12 |
0x6d8e MOV 0x10(%R15),%RAX |
0x6d92 MOV %RAX,-0x40(%RBP) |
0x6d96 CALL 2310 <hypre_NumActiveThreads@plt> |
0x6d9b MOV %RAX,%RCX |
0x6d9e LEA -0x1(%R14,%RAX,1),%RAX |
0x6da3 MOV %RAX,%RDX |
0x6da6 OR %RCX,%RDX |
0x6da9 SHR $0x20,%RDX |
0x6dad JE 6de2 |
0x6daf CQTO |
0x6db1 IDIV %RCX |
0x6db4 TEST %RBX,%RBX |
0x6db7 JLE 6deb |
0x6db9 CMP %RBX,%RCX |
0x6dbc JLE 6df3 |
0x6dbe MOV -0x40(%RBP),%RCX |
0x6dc2 LEA (%R12,%RCX,8),%RSI |
0x6dc6 IMUL %RBX,%RAX |
0x6dca MOV %R12,%RDI |
0x6dcd MOV %RAX,%RDX |
0x6dd0 CALL 22e0 <hypre_LowerBound@plt> |
0x6dd5 SUB %R12,%RAX |
0x6dd8 SAR $0x3,%RAX |
0x6ddc MOV %RAX,-0x40(%RBP) |
0x6de0 JMP 6df3 |
0x6de2 XOR %EDX,%EDX |
0x6de4 DIV %ECX |
0x6de6 TEST %RBX,%RBX |
0x6de9 JG 6db9 |
0x6deb MOVQ $0,-0x40(%RBP) |
0x6df3 CALL 2220 <hypre_GetThreadNum@plt> |
0x6df8 MOV %RAX,%RBX |
0x6dfb MOV 0x20(%R15),%R14 |
0x6dff MOV (%R15),%R12 |
0x6e02 MOV 0x10(%R15),%R15 |
0x6e06 CALL 2310 <hypre_NumActiveThreads@plt> |
0x6e0b MOV %RAX,%RCX |
0x6e0e LEA -0x1(%R14,%RAX,1),%RAX |
0x6e13 MOV %RAX,%RDX |
0x6e16 OR %RCX,%RDX |
0x6e19 SHR $0x20,%RDX |
0x6e1d JE 6e26 |
0x6e1f CQTO |
0x6e21 IDIV %RCX |
0x6e24 JMP 6e2a |
0x6e26 XOR %EDX,%EDX |
0x6e28 DIV %ECX |
0x6e2a MOV -0x40(%RBP),%R14 |
0x6e2e TEST %RBX,%RBX |
0x6e31 JS 705d |
0x6e37 INC %RBX |
0x6e3a CMP %RBX,%RCX |
0x6e3d JLE 6e5c |
0x6e3f LEA (%R12,%R15,8),%RSI |
0x6e43 IMUL %RBX,%RAX |
0x6e47 MOV %R12,%RDI |
0x6e4a MOV %RAX,%RDX |
0x6e4d CALL 22e0 <hypre_LowerBound@plt> |
0x6e52 MOV %RAX,%R15 |
0x6e55 SUB %R12,%R15 |
0x6e58 SAR $0x3,%R15 |
0x6e5c CMP %R15,%R14 |
0x6e5f JLE 6e98 |
0x6e61 MOV 0x208178(%RIP),%RAX |
0x6e68 MOV (%RAX),%RDI |
0x6e6b LEA 0x41a7(%RIP),%RSI |
0x6e72 LEA 0x4148(%RIP),%RDX |
0x6e79 XOR %EAX,%EAX |
0x6e7b CALL 2380 <hypre_fprintf@plt> |
0x6e80 LEA 0x40b3(%RIP),%RDI |
0x6e87 MOV $0xf8,%ESI |
0x6e8c MOV $0x1,%EDX |
0x6e91 XOR %ECX,%ECX |
0x6e93 CALL 23c0 <hypre_error_handler@plt> |
0x6e98 MOV 0x18(%RBP),%RBX |
0x6e9c TEST %R14,%R14 |
0x6e9f JS 6ea6 |
0x6ea1 CMP %RBX,%R14 |
0x6ea4 JLE 6edd |
0x6ea6 MOV 0x208133(%RIP),%RAX |
0x6ead MOV (%RAX),%RDI |
0x6eb0 LEA 0x4162(%RIP),%RSI |
0x6eb7 LEA 0x4112(%RIP),%RDX |
0x6ebe XOR %EAX,%EAX |
0x6ec0 CALL 2380 <hypre_fprintf@plt> |
0x6ec5 LEA 0x406e(%RIP),%RDI |
0x6ecc MOV $0xf9,%ESI |
0x6ed1 MOV $0x1,%EDX |
0x6ed6 XOR %ECX,%ECX |
0x6ed8 CALL 23c0 <hypre_error_handler@plt> |
0x6edd VMOVSD 0x38(%RBP),%XMM5 |
0x6ee2 TEST %R15,%R15 |
0x6ee5 JS 6eec |
0x6ee7 CMP %RBX,%R15 |
0x6eea JLE 6f28 |
0x6eec MOV 0x2080ed(%RIP),%RAX |
0x6ef3 MOV (%RAX),%RDI |
0x6ef6 LEA 0x411c(%RIP),%RSI |
0x6efd LEA 0x40ee(%RIP),%RDX |
0x6f04 XOR %EAX,%EAX |
0x6f06 CALL 2380 <hypre_fprintf@plt> |
0x6f0b LEA 0x4028(%RIP),%RDI |
0x6f12 MOV $0xfa,%ESI |
0x6f17 MOV $0x1,%EDX |
0x6f1c XOR %ECX,%ECX |
0x6f1e CALL 23c0 <hypre_error_handler@plt> |
0x6f23 VMOVSD 0x38(%RBP),%XMM5 |
0x6f28 MOV 0x30(%RBP),%RSI |
0x6f2c VMOVQ %R13,%XMM0 |
0x6f31 VXORPD %XMM1,%XMM1,%XMM1 |
0x6f35 VUCOMISD %XMM1,%XMM5 |
0x6f39 JNE 706e |
0x6f3f VUCOMISD 0x3d69(%RIP),%XMM0 |
0x6f47 JNE 71ac |
0x6f4d CMP %R15,%R14 |
0x6f50 JGE 7d1c |
0x6f56 MOV -0x30(%RBP),%RAX |
0x6f5a MOV (%RAX),%RDX |
0x6f5d MOV (%RSI),%RSI |
0x6f60 MOV %R14,%RAX |
0x6f63 NOT %RAX |
0x6f66 ADD %RAX,%R15 |
0x6f69 XOR %EDI,%EDI |
0x6f6b MOV %R15,-0x30(%RBP) |
0x6f6f MOV %RSI,-0x38(%RBP) |
0x6f73 JMP 6f96 |
0x6f75 NOPW %CS:(%RAX,%RAX,1) |
(159) 0x6f80 VMOVSD %XMM0,(%RSI,%R8,8) |
(159) 0x6f86 LEA 0x1(%RDI),%RAX |
(159) 0x6f8a CMP %R15,%RDI |
(159) 0x6f8d MOV %RAX,%RDI |
(159) 0x6f90 JE 7d1c |
(159) 0x6f96 LEA (%R14,%RDI,1),%R8 |
(159) 0x6f9a MOV (%RDX,%R8,8),%R13 |
(159) 0x6f9e MOV 0x8(%RDX,%R8,8),%R9 |
(159) 0x6fa3 VXORPD %XMM0,%XMM0,%XMM0 |
(159) 0x6fa7 MOV %R9,%RAX |
(159) 0x6faa SUB %R13,%RAX |
(159) 0x6fad JLE 6f80 |
(159) 0x6faf MOV -0x48(%RBP),%RCX |
(159) 0x6fb3 MOV (%RCX),%R10 |
(159) 0x6fb6 MOV 0x20(%RBP),%RCX |
(159) 0x6fba MOV (%RCX),%R11 |
(159) 0x6fbd MOV 0x10(%RBP),%RCX |
(159) 0x6fc1 MOV (%RCX),%RBX |
(159) 0x6fc4 MOV %RAX,%R12 |
(159) 0x6fc7 AND $-0x4,%R12 |
(159) 0x6fcb JE 702e |
(159) 0x6fcd LEA -0x1(%R12),%RCX |
(159) 0x6fd2 LEA (%R10,%R13,8),%R14 |
(159) 0x6fd6 LEA (%RBX,%R13,8),%R15 |
(159) 0x6fda VXORPD %XMM0,%XMM0,%XMM0 |
(159) 0x6fde XOR %ESI,%ESI |
(161) 0x6fe0 VMOVUPD (%R15,%RSI,8),%YMM1 |
(161) 0x6fe6 KXNORW %K0,%K0,%K1 |
(161) 0x6fea VXORPD %XMM2,%XMM2,%XMM2 |
(161) 0x6fee VGATHERQPD (%R11,%YMM1,8),%YMM2{%K1} |
(161) 0x6ff5 VFMADD231PD (%R14,%RSI,8),%YMM2,%YMM0 |
(161) 0x6ffb ADD $0x4,%RSI |
(161) 0x6fff CMP %RCX,%RSI |
(161) 0x7002 JBE 6fe0 |
(159) 0x7004 VEXTRACTF128 $0x1,%YMM0,%XMM1 |
(159) 0x700a VADDPD %XMM1,%XMM0,%XMM0 |
(159) 0x700e VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(159) 0x7013 VADDSD %XMM1,%XMM0,%XMM0 |
(159) 0x7017 CMP %R12,%RAX |
(159) 0x701a MOV -0x40(%RBP),%R14 |
(159) 0x701e MOV -0x30(%RBP),%R15 |
(159) 0x7022 MOV -0x38(%RBP),%RSI |
(159) 0x7026 JE 6f80 |
(159) 0x702c JMP 7031 |
(159) 0x702e XOR %R12D,%R12D |
(159) 0x7031 ADD %R13,%R12 |
(159) 0x7034 NOPW %CS:(%RAX,%RAX,1) |
(160) 0x7040 MOV (%RBX,%R12,8),%RAX |
(160) 0x7044 VMOVSD (%R11,%RAX,8),%XMM1 |
(160) 0x704a VFMADD231SD (%R10,%R12,8),%XMM1,%XMM0 |
(160) 0x7050 INC %R12 |
(160) 0x7053 CMP %R12,%R9 |
(160) 0x7056 JNE 7040 |
(159) 0x7058 JMP 6f80 |
0x705d XOR %R15D,%R15D |
0x7060 CMP %R15,%R14 |
0x7063 JG 6e61 |
0x7069 JMP 6e98 |
0x706e MOV 0x28(%RBP),%RCX |
0x7072 VUCOMISD 0x3c3e(%RIP),%XMM5 |
0x707a JNE 72cd |
0x7080 VUCOMISD 0x3c28(%RIP),%XMM0 |
0x7088 JNE 740c |
0x708e CMP %R15,%R14 |
0x7091 JGE 7d1c |
0x7097 MOV -0x30(%RBP),%RAX |
0x709b MOV (%RAX),%RDI |
0x709e MOV (%RSI),%RSI |
0x70a1 MOV %R14,%RAX |
0x70a4 NOT %RAX |
0x70a7 ADD %RAX,%R15 |
0x70aa XOR %R8D,%R8D |
0x70ad VMOVDDUP 0x3c0b(%RIP),%XMM0 |
0x70b5 MOV %R15,-0x30(%RBP) |
0x70b9 MOV %RSI,-0x38(%RBP) |
0x70bd JMP 70d6 |
0x70bf NOP |
(150) 0x70c0 VMOVSD %XMM1,(%RSI,%R9,8) |
(150) 0x70c6 LEA 0x1(%R8),%RAX |
(150) 0x70ca CMP %R15,%R8 |
(150) 0x70cd MOV %RAX,%R8 |
(150) 0x70d0 JE 7d1c |
(150) 0x70d6 LEA (%R14,%R8,1),%R9 |
(150) 0x70da VMOVSD (%RCX,%R9,8),%XMM1 |
(150) 0x70e0 VXORPD %XMM0,%XMM1,%XMM1 |
(150) 0x70e4 MOV (%RDI,%R9,8),%RDX |
(150) 0x70e8 MOV 0x8(%RDI,%R9,8),%R10 |
(150) 0x70ed MOV %R10,%RAX |
(150) 0x70f0 SUB %RDX,%RAX |
(150) 0x70f3 JLE 70c0 |
(150) 0x70f5 MOV -0x48(%RBP),%RCX |
(150) 0x70f9 MOV (%RCX),%R11 |
(150) 0x70fc MOV 0x20(%RBP),%RCX |
(150) 0x7100 MOV (%RCX),%RBX |
(150) 0x7103 MOV 0x10(%RBP),%RCX |
(150) 0x7107 MOV (%RCX),%R12 |
(150) 0x710a MOV %RAX,%R13 |
(150) 0x710d AND $-0x4,%R13 |
(150) 0x7111 JE 7186 |
(150) 0x7113 LEA -0x1(%R13),%RCX |
(150) 0x7117 LEA (%R11,%RDX,8),%R14 |
(150) 0x711b LEA (%R12,%RDX,8),%R15 |
(150) 0x711f VXORPD %XMM2,%XMM2,%XMM2 |
(150) 0x7123 XOR %ESI,%ESI |
(150) 0x7125 NOPW %CS:(%RAX,%RAX,1) |
(152) 0x7130 VMOVUPD (%R15,%RSI,8),%YMM3 |
(152) 0x7136 KXNORW %K0,%K0,%K1 |
(152) 0x713a VXORPD %XMM4,%XMM4,%XMM4 |
(152) 0x713e VGATHERQPD (%RBX,%YMM3,8),%YMM4{%K1} |
(152) 0x7145 VFMADD231PD (%R14,%RSI,8),%YMM4,%YMM2 |
(152) 0x714b ADD $0x4,%RSI |
(152) 0x714f CMP %RCX,%RSI |
(152) 0x7152 JBE 7130 |
(150) 0x7154 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(150) 0x715a VADDPD %XMM3,%XMM2,%XMM2 |
(150) 0x715e VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(150) 0x7163 VADDSD %XMM3,%XMM2,%XMM2 |
(150) 0x7167 VADDSD %XMM2,%XMM1,%XMM1 |
(150) 0x716b CMP %R13,%RAX |
(150) 0x716e MOV -0x40(%RBP),%R14 |
(150) 0x7172 MOV -0x30(%RBP),%R15 |
(150) 0x7176 MOV 0x28(%RBP),%RCX |
(150) 0x717a MOV -0x38(%RBP),%RSI |
(150) 0x717e JE 70c0 |
(150) 0x7184 JMP 718d |
(150) 0x7186 XOR %R13D,%R13D |
(150) 0x7189 MOV 0x28(%RBP),%RCX |
(150) 0x718d ADD %RDX,%R13 |
(151) 0x7190 MOV (%R12,%R13,8),%RAX |
(151) 0x7194 VMOVSD (%RBX,%RAX,8),%XMM2 |
(151) 0x7199 VFMADD231SD (%R11,%R13,8),%XMM2,%XMM1 |
(151) 0x719f INC %R13 |
(151) 0x71a2 CMP %R13,%R10 |
(151) 0x71a5 JNE 7190 |
(150) 0x71a7 JMP 70c0 |
0x71ac VUCOMISD 0x3b04(%RIP),%XMM0 |
0x71b4 JNE 753c |
0x71ba CMP %R15,%R14 |
0x71bd JGE 7d1c |
0x71c3 MOV -0x30(%RBP),%RAX |
0x71c7 MOV (%RAX),%RDX |
0x71ca MOV (%RSI),%RSI |
0x71cd MOV %R14,%RAX |
0x71d0 NOT %RAX |
0x71d3 ADD %RAX,%R15 |
0x71d6 XOR %EDI,%EDI |
0x71d8 MOV %R15,-0x30(%RBP) |
0x71dc MOV %RSI,-0x38(%RBP) |
0x71e0 JMP 7206 |
0x71e2 NOPW %CS:(%RAX,%RAX,1) |
(156) 0x71f0 VMOVSD %XMM0,(%RSI,%R8,8) |
(156) 0x71f6 LEA 0x1(%RDI),%RAX |
(156) 0x71fa CMP %R15,%RDI |
(156) 0x71fd MOV %RAX,%RDI |
(156) 0x7200 JE 7d1c |
(156) 0x7206 LEA (%R14,%RDI,1),%R8 |
(156) 0x720a MOV (%RDX,%R8,8),%R13 |
(156) 0x720e MOV 0x8(%RDX,%R8,8),%R9 |
(156) 0x7213 VXORPD %XMM0,%XMM0,%XMM0 |
(156) 0x7217 MOV %R9,%RAX |
(156) 0x721a SUB %R13,%RAX |
(156) 0x721d JLE 71f0 |
(156) 0x721f MOV -0x48(%RBP),%RCX |
(156) 0x7223 MOV (%RCX),%R10 |
(156) 0x7226 MOV 0x20(%RBP),%RCX |
(156) 0x722a MOV (%RCX),%R11 |
(156) 0x722d MOV 0x10(%RBP),%RCX |
(156) 0x7231 MOV (%RCX),%RBX |
(156) 0x7234 MOV %RAX,%R12 |
(156) 0x7237 AND $-0x4,%R12 |
(156) 0x723b JE 729e |
(156) 0x723d LEA -0x1(%R12),%RCX |
(156) 0x7242 LEA (%R10,%R13,8),%R14 |
(156) 0x7246 LEA (%RBX,%R13,8),%R15 |
(156) 0x724a VXORPD %XMM0,%XMM0,%XMM0 |
(156) 0x724e XOR %ESI,%ESI |
(158) 0x7250 VMOVUPD (%R15,%RSI,8),%YMM1 |
(158) 0x7256 KXNORW %K0,%K0,%K1 |
(158) 0x725a VXORPD %XMM2,%XMM2,%XMM2 |
(158) 0x725e VGATHERQPD (%R11,%YMM1,8),%YMM2{%K1} |
(158) 0x7265 VFNMADD231PD (%R14,%RSI,8),%YMM2,%YMM0 |
(158) 0x726b ADD $0x4,%RSI |
(158) 0x726f CMP %RCX,%RSI |
(158) 0x7272 JBE 7250 |
(156) 0x7274 VEXTRACTF128 $0x1,%YMM0,%XMM1 |
(156) 0x727a VADDPD %XMM1,%XMM0,%XMM0 |
(156) 0x727e VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(156) 0x7283 VADDSD %XMM1,%XMM0,%XMM0 |
(156) 0x7287 CMP %R12,%RAX |
(156) 0x728a MOV -0x40(%RBP),%R14 |
(156) 0x728e MOV -0x30(%RBP),%R15 |
(156) 0x7292 MOV -0x38(%RBP),%RSI |
(156) 0x7296 JE 71f0 |
(156) 0x729c JMP 72a1 |
(156) 0x729e XOR %R12D,%R12D |
(156) 0x72a1 ADD %R13,%R12 |
(156) 0x72a4 NOPW %CS:(%RAX,%RAX,1) |
(157) 0x72b0 MOV (%RBX,%R12,8),%RAX |
(157) 0x72b4 VMOVSD (%R11,%RAX,8),%XMM1 |
(157) 0x72ba VFNMADD231SD (%R10,%R12,8),%XMM1,%XMM0 |
(157) 0x72c0 INC %R12 |
(157) 0x72c3 CMP %R12,%R9 |
(157) 0x72c6 JNE 72b0 |
(156) 0x72c8 JMP 71f0 |
0x72cd VUCOMISD 0x39db(%RIP),%XMM5 |
0x72d5 JNE 765d |
0x72db VUCOMISD 0x39cd(%RIP),%XMM0 |
0x72e3 JNE 778c |
0x72e9 CMP %R15,%R14 |
0x72ec JGE 7d1c |
0x72f2 MOV -0x30(%RBP),%RAX |
0x72f6 MOV (%RAX),%RDI |
0x72f9 MOV (%RSI),%RSI |
0x72fc MOV %R14,%RAX |
0x72ff NOT %RAX |
0x7302 ADD %RAX,%R15 |
0x7305 XOR %R8D,%R8D |
0x7308 MOV %R15,-0x30(%RBP) |
0x730c MOV %RSI,-0x38(%RBP) |
0x7310 JMP 7336 |
0x7312 NOPW %CS:(%RAX,%RAX,1) |
(141) 0x7320 VMOVSD %XMM0,(%RSI,%R9,8) |
(141) 0x7326 LEA 0x1(%R8),%RAX |
(141) 0x732a CMP %R15,%R8 |
(141) 0x732d MOV %RAX,%R8 |
(141) 0x7330 JE 7d1c |
(141) 0x7336 LEA (%R14,%R8,1),%R9 |
(141) 0x733a VMOVSD (%RCX,%R9,8),%XMM0 |
(141) 0x7340 MOV (%RDI,%R9,8),%RDX |
(141) 0x7344 MOV 0x8(%RDI,%R9,8),%R10 |
(141) 0x7349 MOV %R10,%RAX |
(141) 0x734c SUB %RDX,%RAX |
(141) 0x734f JLE 7320 |
(141) 0x7351 MOV -0x48(%RBP),%RCX |
(141) 0x7355 MOV (%RCX),%R11 |
(141) 0x7358 MOV 0x20(%RBP),%RCX |
(141) 0x735c MOV (%RCX),%RBX |
(141) 0x735f MOV 0x10(%RBP),%RCX |
(141) 0x7363 MOV (%RCX),%R12 |
(141) 0x7366 MOV %RAX,%R13 |
(141) 0x7369 AND $-0x4,%R13 |
(141) 0x736d JE 73e6 |
(141) 0x736f LEA -0x1(%R13),%RCX |
(141) 0x7373 LEA (%R11,%RDX,8),%RSI |
(141) 0x7377 LEA (%R12,%RDX,8),%R14 |
(141) 0x737b VXORPD %XMM1,%XMM1,%XMM1 |
(141) 0x737f XOR %R15D,%R15D |
(141) 0x7382 NOPW %CS:(%RAX,%RAX,1) |
(143) 0x7390 VMOVUPD (%R14,%R15,8),%YMM2 |
(143) 0x7396 KXNORW %K0,%K0,%K1 |
(143) 0x739a VXORPD %XMM3,%XMM3,%XMM3 |
(143) 0x739e VGATHERQPD (%RBX,%YMM2,8),%YMM3{%K1} |
(143) 0x73a5 VFMADD231PD (%RSI,%R15,8),%YMM3,%YMM1 |
(143) 0x73ab ADD $0x4,%R15 |
(143) 0x73af CMP %RCX,%R15 |
(143) 0x73b2 JBE 7390 |
(141) 0x73b4 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(141) 0x73ba VADDPD %XMM2,%XMM1,%XMM1 |
(141) 0x73be VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(141) 0x73c3 VADDSD %XMM2,%XMM1,%XMM1 |
(141) 0x73c7 VADDSD %XMM1,%XMM0,%XMM0 |
(141) 0x73cb CMP %R13,%RAX |
(141) 0x73ce MOV -0x40(%RBP),%R14 |
(141) 0x73d2 MOV -0x30(%RBP),%R15 |
(141) 0x73d6 MOV 0x28(%RBP),%RCX |
(141) 0x73da MOV -0x38(%RBP),%RSI |
(141) 0x73de JE 7320 |
(141) 0x73e4 JMP 73ed |
(141) 0x73e6 XOR %R13D,%R13D |
(141) 0x73e9 MOV 0x28(%RBP),%RCX |
(141) 0x73ed ADD %RDX,%R13 |
(142) 0x73f0 MOV (%R12,%R13,8),%RAX |
(142) 0x73f4 VMOVSD (%RBX,%RAX,8),%XMM1 |
(142) 0x73f9 VFMADD231SD (%R11,%R13,8),%XMM1,%XMM0 |
(142) 0x73ff INC %R13 |
(142) 0x7402 CMP %R13,%R10 |
(142) 0x7405 JNE 73f0 |
(141) 0x7407 JMP 7320 |
0x740c VUCOMISD 0x38a4(%RIP),%XMM0 |
0x7414 JNE 78bc |
0x741a CMP %R15,%R14 |
0x741d JGE 7d1c |
0x7423 MOV -0x30(%RBP),%RAX |
0x7427 MOV (%RAX),%RDI |
0x742a MOV (%RSI),%RSI |
0x742d MOV %R14,%RAX |
0x7430 NOT %RAX |
0x7433 ADD %RAX,%R15 |
0x7436 XOR %R8D,%R8D |
0x7439 MOV %R15,-0x30(%RBP) |
0x743d MOV %RSI,-0x38(%RBP) |
0x7441 JMP 7466 |
0x7443 NOPW %CS:(%RAX,%RAX,1) |
(147) 0x7450 VMOVSD %XMM0,(%RSI,%R9,8) |
(147) 0x7456 LEA 0x1(%R8),%RAX |
(147) 0x745a CMP %R15,%R8 |
(147) 0x745d MOV %RAX,%R8 |
(147) 0x7460 JE 7d1c |
(147) 0x7466 LEA (%R14,%R8,1),%R9 |
(147) 0x746a VMOVSD (%RCX,%R9,8),%XMM0 |
(147) 0x7470 MOV (%RDI,%R9,8),%RDX |
(147) 0x7474 MOV 0x8(%RDI,%R9,8),%R10 |
(147) 0x7479 MOV %R10,%RAX |
(147) 0x747c SUB %RDX,%RAX |
(147) 0x747f JLE 7450 |
(147) 0x7481 MOV -0x48(%RBP),%RCX |
(147) 0x7485 MOV (%RCX),%R11 |
(147) 0x7488 MOV 0x20(%RBP),%RCX |
(147) 0x748c MOV (%RCX),%RBX |
(147) 0x748f MOV 0x10(%RBP),%RCX |
(147) 0x7493 MOV (%RCX),%R12 |
(147) 0x7496 MOV %RAX,%R13 |
(147) 0x7499 AND $-0x4,%R13 |
(147) 0x749d JE 7516 |
(147) 0x749f LEA -0x1(%R13),%RCX |
(147) 0x74a3 LEA (%R11,%RDX,8),%RSI |
(147) 0x74a7 LEA (%R12,%RDX,8),%R14 |
(147) 0x74ab VXORPD %XMM1,%XMM1,%XMM1 |
(147) 0x74af XOR %R15D,%R15D |
(147) 0x74b2 NOPW %CS:(%RAX,%RAX,1) |
(149) 0x74c0 VMOVUPD (%R14,%R15,8),%YMM2 |
(149) 0x74c6 KXNORW %K0,%K0,%K1 |
(149) 0x74ca VXORPD %XMM3,%XMM3,%XMM3 |
(149) 0x74ce VGATHERQPD (%RBX,%YMM2,8),%YMM3{%K1} |
(149) 0x74d5 VFNMADD231PD (%RSI,%R15,8),%YMM3,%YMM1 |
(149) 0x74db ADD $0x4,%R15 |
(149) 0x74df CMP %RCX,%R15 |
(149) 0x74e2 JBE 74c0 |
(147) 0x74e4 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(147) 0x74ea VADDPD %XMM2,%XMM1,%XMM1 |
(147) 0x74ee VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(147) 0x74f3 VADDSD %XMM2,%XMM1,%XMM1 |
(147) 0x74f7 VADDSD %XMM1,%XMM0,%XMM0 |
(147) 0x74fb CMP %R13,%RAX |
(147) 0x74fe MOV -0x40(%RBP),%R14 |
(147) 0x7502 MOV -0x30(%RBP),%R15 |
(147) 0x7506 MOV 0x28(%RBP),%RCX |
(147) 0x750a MOV -0x38(%RBP),%RSI |
(147) 0x750e JE 7450 |
(147) 0x7514 JMP 751d |
(147) 0x7516 XOR %R13D,%R13D |
(147) 0x7519 MOV 0x28(%RBP),%RCX |
(147) 0x751d ADD %RDX,%R13 |
(148) 0x7520 MOV (%R12,%R13,8),%RAX |
(148) 0x7524 VMOVSD (%RBX,%RAX,8),%XMM1 |
(148) 0x7529 VFNMADD231SD (%R11,%R13,8),%XMM1,%XMM0 |
(148) 0x752f INC %R13 |
(148) 0x7532 CMP %R13,%R10 |
(148) 0x7535 JNE 7520 |
(147) 0x7537 JMP 7450 |
0x753c CMP %R15,%R14 |
0x753f JGE 7d1c |
0x7545 MOV -0x30(%RBP),%RAX |
0x7549 MOV (%RAX),%RDX |
0x754c MOV (%RSI),%RSI |
0x754f MOV %R14,%RAX |
0x7552 NOT %RAX |
0x7555 ADD %RAX,%R15 |
0x7558 XOR %EDI,%EDI |
0x755a MOV %R15,-0x30(%RBP) |
0x755e MOV %RSI,-0x38(%RBP) |
0x7562 JMP 758a |
0x7564 NOPW %CS:(%RAX,%RAX,1) |
(153) 0x7570 VMULSD %XMM0,%XMM1,%XMM1 |
(153) 0x7574 VMOVSD %XMM1,(%RSI,%R8,8) |
(153) 0x757a LEA 0x1(%RDI),%RAX |
(153) 0x757e CMP %R15,%RDI |
(153) 0x7581 MOV %RAX,%RDI |
(153) 0x7584 JE 7d1c |
(153) 0x758a LEA (%R14,%RDI,1),%R8 |
(153) 0x758e MOV (%RDX,%R8,8),%R13 |
(153) 0x7592 MOV 0x8(%RDX,%R8,8),%R9 |
(153) 0x7597 VXORPD %XMM1,%XMM1,%XMM1 |
(153) 0x759b MOV %R9,%RAX |
(153) 0x759e SUB %R13,%RAX |
(153) 0x75a1 JLE 7570 |
(153) 0x75a3 MOV -0x48(%RBP),%RCX |
(153) 0x75a7 MOV (%RCX),%R10 |
(153) 0x75aa MOV 0x20(%RBP),%RCX |
(153) 0x75ae MOV (%RCX),%R11 |
(153) 0x75b1 MOV 0x10(%RBP),%RCX |
(153) 0x75b5 MOV (%RCX),%RBX |
(153) 0x75b8 MOV %RAX,%R12 |
(153) 0x75bb AND $-0x4,%R12 |
(153) 0x75bf JE 762e |
(153) 0x75c1 LEA -0x1(%R12),%RCX |
(153) 0x75c6 LEA (%R10,%R13,8),%R14 |
(153) 0x75ca LEA (%RBX,%R13,8),%R15 |
(153) 0x75ce VXORPD %XMM1,%XMM1,%XMM1 |
(153) 0x75d2 XOR %ESI,%ESI |
(153) 0x75d4 NOPW %CS:(%RAX,%RAX,1) |
(155) 0x75e0 VMOVUPD (%R15,%RSI,8),%YMM2 |
(155) 0x75e6 KXNORW %K0,%K0,%K1 |
(155) 0x75ea VXORPD %XMM3,%XMM3,%XMM3 |
(155) 0x75ee VGATHERQPD (%R11,%YMM2,8),%YMM3{%K1} |
(155) 0x75f5 VFMADD231PD (%R14,%RSI,8),%YMM3,%YMM1 |
(155) 0x75fb ADD $0x4,%RSI |
(155) 0x75ff CMP %RCX,%RSI |
(155) 0x7602 JBE 75e0 |
(153) 0x7604 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(153) 0x760a VADDPD %XMM2,%XMM1,%XMM1 |
(153) 0x760e VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(153) 0x7613 VADDSD %XMM2,%XMM1,%XMM1 |
(153) 0x7617 CMP %R12,%RAX |
(153) 0x761a MOV -0x40(%RBP),%R14 |
(153) 0x761e MOV -0x30(%RBP),%R15 |
(153) 0x7622 MOV -0x38(%RBP),%RSI |
(153) 0x7626 JE 7570 |
(153) 0x762c JMP 7631 |
(153) 0x762e XOR %R12D,%R12D |
(153) 0x7631 ADD %R13,%R12 |
(153) 0x7634 NOPW %CS:(%RAX,%RAX,1) |
(154) 0x7640 MOV (%RBX,%R12,8),%RAX |
(154) 0x7644 VMOVSD (%R11,%RAX,8),%XMM2 |
(154) 0x764a VFMADD231SD (%R10,%R12,8),%XMM2,%XMM1 |
(154) 0x7650 INC %R12 |
(154) 0x7653 CMP %R12,%R9 |
(154) 0x7656 JNE 7640 |
(153) 0x7658 JMP 7570 |
0x765d VUCOMISD 0x364b(%RIP),%XMM0 |
0x7665 JNE 79dc |
0x766b CMP %R15,%R14 |
0x766e JGE 7d1c |
0x7674 MOV -0x30(%RBP),%RAX |
0x7678 MOV (%RAX),%RDI |
0x767b MOV (%RSI),%RSI |
0x767e MOV %R14,%RAX |
0x7681 NOT %RAX |
0x7684 ADD %RAX,%R15 |
0x7687 XOR %R8D,%R8D |
0x768a MOV %R15,-0x30(%RBP) |
0x768e MOV %RSI,-0x38(%RBP) |
0x7692 JMP 76b6 |
0x7694 NOPW %CS:(%RAX,%RAX,1) |
(132) 0x76a0 VMOVSD %XMM0,(%RSI,%R9,8) |
(132) 0x76a6 LEA 0x1(%R8),%RAX |
(132) 0x76aa CMP %R15,%R8 |
(132) 0x76ad MOV %RAX,%R8 |
(132) 0x76b0 JE 7d1c |
(132) 0x76b6 LEA (%R14,%R8,1),%R9 |
(132) 0x76ba VMULSD (%RCX,%R9,8),%XMM5,%XMM0 |
(132) 0x76c0 MOV (%RDI,%R9,8),%RDX |
(132) 0x76c4 MOV 0x8(%RDI,%R9,8),%R10 |
(132) 0x76c9 MOV %R10,%RAX |
(132) 0x76cc SUB %RDX,%RAX |
(132) 0x76cf JLE 76a0 |
(132) 0x76d1 MOV -0x48(%RBP),%RCX |
(132) 0x76d5 MOV (%RCX),%R11 |
(132) 0x76d8 MOV 0x20(%RBP),%RCX |
(132) 0x76dc MOV (%RCX),%RBX |
(132) 0x76df MOV 0x10(%RBP),%RCX |
(132) 0x76e3 MOV (%RCX),%R12 |
(132) 0x76e6 MOV %RAX,%R13 |
(132) 0x76e9 AND $-0x4,%R13 |
(132) 0x76ed JE 7766 |
(132) 0x76ef LEA -0x1(%R13),%RCX |
(132) 0x76f3 LEA (%R11,%RDX,8),%RSI |
(132) 0x76f7 LEA (%R12,%RDX,8),%R14 |
(132) 0x76fb VXORPD %XMM1,%XMM1,%XMM1 |
(132) 0x76ff XOR %R15D,%R15D |
(132) 0x7702 NOPW %CS:(%RAX,%RAX,1) |
(134) 0x7710 VMOVUPD (%R14,%R15,8),%YMM2 |
(134) 0x7716 KXNORW %K0,%K0,%K1 |
(134) 0x771a VXORPD %XMM3,%XMM3,%XMM3 |
(134) 0x771e VGATHERQPD (%RBX,%YMM2,8),%YMM3{%K1} |
(134) 0x7725 VFMADD231PD (%RSI,%R15,8),%YMM3,%YMM1 |
(134) 0x772b ADD $0x4,%R15 |
(134) 0x772f CMP %RCX,%R15 |
(134) 0x7732 JBE 7710 |
(132) 0x7734 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(132) 0x773a VADDPD %XMM2,%XMM1,%XMM1 |
(132) 0x773e VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(132) 0x7743 VADDSD %XMM2,%XMM1,%XMM1 |
(132) 0x7747 VADDSD %XMM1,%XMM0,%XMM0 |
(132) 0x774b CMP %R13,%RAX |
(132) 0x774e MOV -0x40(%RBP),%R14 |
(132) 0x7752 MOV -0x30(%RBP),%R15 |
(132) 0x7756 MOV 0x28(%RBP),%RCX |
(132) 0x775a MOV -0x38(%RBP),%RSI |
(132) 0x775e JE 76a0 |
(132) 0x7764 JMP 776d |
(132) 0x7766 XOR %R13D,%R13D |
(132) 0x7769 MOV 0x28(%RBP),%RCX |
(132) 0x776d ADD %RDX,%R13 |
(133) 0x7770 MOV (%R12,%R13,8),%RAX |
(133) 0x7774 VMOVSD (%RBX,%RAX,8),%XMM1 |
(133) 0x7779 VFMADD231SD (%R11,%R13,8),%XMM1,%XMM0 |
(133) 0x777f INC %R13 |
(133) 0x7782 CMP %R13,%R10 |
(133) 0x7785 JNE 7770 |
(132) 0x7787 JMP 76a0 |
0x778c VUCOMISD 0x3524(%RIP),%XMM0 |
0x7794 JNE 7afc |
0x779a CMP %R15,%R14 |
0x779d JGE 7d1c |
0x77a3 MOV -0x30(%RBP),%RAX |
0x77a7 MOV (%RAX),%RDI |
0x77aa MOV (%RSI),%RSI |
0x77ad MOV %R14,%RAX |
0x77b0 NOT %RAX |
0x77b3 ADD %RAX,%R15 |
0x77b6 XOR %R8D,%R8D |
0x77b9 VMOVDDUP 0x34ff(%RIP),%XMM0 |
0x77c1 MOV %R15,-0x30(%RBP) |
0x77c5 MOV %RSI,-0x38(%RBP) |
0x77c9 JMP 77e6 |
0x77cb NOPL (%RAX,%RAX,1) |
(138) 0x77d0 VMOVSD %XMM1,(%RSI,%R9,8) |
(138) 0x77d6 LEA 0x1(%R8),%RAX |
(138) 0x77da CMP %R15,%R8 |
(138) 0x77dd MOV %RAX,%R8 |
(138) 0x77e0 JE 7d1c |
(138) 0x77e6 LEA (%R14,%R8,1),%R9 |
(138) 0x77ea VMOVSD (%RCX,%R9,8),%XMM1 |
(138) 0x77f0 VXORPD %XMM0,%XMM1,%XMM1 |
(138) 0x77f4 MOV (%RDI,%R9,8),%RDX |
(138) 0x77f8 MOV 0x8(%RDI,%R9,8),%R10 |
(138) 0x77fd MOV %R10,%RAX |
(138) 0x7800 SUB %RDX,%RAX |
(138) 0x7803 JLE 77d0 |
(138) 0x7805 MOV -0x48(%RBP),%RCX |
(138) 0x7809 MOV (%RCX),%R11 |
(138) 0x780c MOV 0x20(%RBP),%RCX |
(138) 0x7810 MOV (%RCX),%RBX |
(138) 0x7813 MOV 0x10(%RBP),%RCX |
(138) 0x7817 MOV (%RCX),%R12 |
(138) 0x781a MOV %RAX,%R13 |
(138) 0x781d AND $-0x4,%R13 |
(138) 0x7821 JE 7896 |
(138) 0x7823 LEA -0x1(%R13),%RCX |
(138) 0x7827 LEA (%R11,%RDX,8),%RSI |
(138) 0x782b LEA (%R12,%RDX,8),%R14 |
(138) 0x782f VXORPD %XMM2,%XMM2,%XMM2 |
(138) 0x7833 XOR %R15D,%R15D |
(138) 0x7836 NOPW %CS:(%RAX,%RAX,1) |
(140) 0x7840 VMOVUPD (%R14,%R15,8),%YMM3 |
(140) 0x7846 VXORPD %XMM4,%XMM4,%XMM4 |
(140) 0x784a KXNORW %K0,%K0,%K1 |
(140) 0x784e VGATHERQPD (%RBX,%YMM3,8),%YMM4{%K1} |
(140) 0x7855 VFNMADD231PD (%RSI,%R15,8),%YMM4,%YMM2 |
(140) 0x785b ADD $0x4,%R15 |
(140) 0x785f CMP %RCX,%R15 |
(140) 0x7862 JBE 7840 |
(138) 0x7864 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(138) 0x786a VADDPD %XMM3,%XMM2,%XMM2 |
(138) 0x786e VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(138) 0x7873 VADDSD %XMM3,%XMM2,%XMM2 |
(138) 0x7877 VADDSD %XMM2,%XMM1,%XMM1 |
(138) 0x787b CMP %R13,%RAX |
(138) 0x787e MOV -0x40(%RBP),%R14 |
(138) 0x7882 MOV -0x30(%RBP),%R15 |
(138) 0x7886 MOV 0x28(%RBP),%RCX |
(138) 0x788a MOV -0x38(%RBP),%RSI |
(138) 0x788e JE 77d0 |
(138) 0x7894 JMP 789d |
(138) 0x7896 XOR %R13D,%R13D |
(138) 0x7899 MOV 0x28(%RBP),%RCX |
(138) 0x789d ADD %RDX,%R13 |
(139) 0x78a0 MOV (%R12,%R13,8),%RAX |
(139) 0x78a4 VMOVSD (%RBX,%RAX,8),%XMM2 |
(139) 0x78a9 VFNMADD231SD (%R11,%R13,8),%XMM2,%XMM1 |
(139) 0x78af INC %R13 |
(139) 0x78b2 CMP %R13,%R10 |
(139) 0x78b5 JNE 78a0 |
(138) 0x78b7 JMP 77d0 |
0x78bc CMP %R15,%R14 |
0x78bf JGE 7d1c |
0x78c5 MOV -0x30(%RBP),%RAX |
0x78c9 MOV (%RAX),%RDI |
0x78cc MOV (%RSI),%RSI |
0x78cf MOV %R14,%RAX |
0x78d2 NOT %RAX |
0x78d5 ADD %RAX,%R15 |
0x78d8 XOR %R8D,%R8D |
0x78db VMOVDDUP 0x33dd(%RIP),%XMM1 |
0x78e3 MOV %R15,-0x30(%RBP) |
0x78e7 MOV %RSI,-0x38(%RBP) |
0x78eb JMP 790a |
0x78ed NOPL (%RAX) |
(144) 0x78f0 VMULSD %XMM0,%XMM2,%XMM2 |
(144) 0x78f4 VMOVSD %XMM2,(%RSI,%R9,8) |
(144) 0x78fa LEA 0x1(%R8),%RAX |
(144) 0x78fe CMP %R15,%R8 |
(144) 0x7901 MOV %RAX,%R8 |
(144) 0x7904 JE 7d1c |
(144) 0x790a LEA (%R14,%R8,1),%R9 |
(144) 0x790e VMOVSD (%RCX,%R9,8),%XMM2 |
(144) 0x7914 VXORPD %XMM1,%XMM2,%XMM2 |
(144) 0x7918 MOV (%RDI,%R9,8),%RDX |
(144) 0x791c MOV 0x8(%RDI,%R9,8),%R10 |
(144) 0x7921 MOV %R10,%RAX |
(144) 0x7924 SUB %RDX,%RAX |
(144) 0x7927 JLE 78f0 |
(144) 0x7929 MOV -0x48(%RBP),%RCX |
(144) 0x792d MOV (%RCX),%R11 |
(144) 0x7930 MOV 0x20(%RBP),%RCX |
(144) 0x7934 MOV (%RCX),%RBX |
(144) 0x7937 MOV 0x10(%RBP),%RCX |
(144) 0x793b MOV (%RCX),%R12 |
(144) 0x793e MOV %RAX,%R13 |
(144) 0x7941 AND $-0x4,%R13 |
(144) 0x7945 JE 79b6 |
(144) 0x7947 LEA -0x1(%R13),%RCX |
(144) 0x794b LEA (%R11,%RDX,8),%RSI |
(144) 0x794f LEA (%R12,%RDX,8),%R14 |
(144) 0x7953 VXORPD %XMM3,%XMM3,%XMM3 |
(144) 0x7957 XOR %R15D,%R15D |
(144) 0x795a NOPW (%RAX,%RAX,1) |
(146) 0x7960 VMOVUPD (%R14,%R15,8),%YMM4 |
(146) 0x7966 KXNORW %K0,%K0,%K1 |
(146) 0x796a VXORPD %XMM5,%XMM5,%XMM5 |
(146) 0x796e VGATHERQPD (%RBX,%YMM4,8),%YMM5{%K1} |
(146) 0x7975 VFMADD231PD (%RSI,%R15,8),%YMM5,%YMM3 |
(146) 0x797b ADD $0x4,%R15 |
(146) 0x797f CMP %RCX,%R15 |
(146) 0x7982 JBE 7960 |
(144) 0x7984 VEXTRACTF128 $0x1,%YMM3,%XMM4 |
(144) 0x798a VADDPD %XMM4,%XMM3,%XMM3 |
(144) 0x798e VSHUFPD $0x1,%XMM3,%XMM3,%XMM4 |
(144) 0x7993 VADDSD %XMM4,%XMM3,%XMM3 |
(144) 0x7997 VADDSD %XMM3,%XMM2,%XMM2 |
(144) 0x799b CMP %R13,%RAX |
(144) 0x799e MOV -0x40(%RBP),%R14 |
(144) 0x79a2 MOV -0x30(%RBP),%R15 |
(144) 0x79a6 MOV 0x28(%RBP),%RCX |
(144) 0x79aa MOV -0x38(%RBP),%RSI |
(144) 0x79ae JE 78f0 |
(144) 0x79b4 JMP 79bd |
(144) 0x79b6 XOR %R13D,%R13D |
(144) 0x79b9 MOV 0x28(%RBP),%RCX |
(144) 0x79bd ADD %RDX,%R13 |
(145) 0x79c0 MOV (%R12,%R13,8),%RAX |
(145) 0x79c4 VMOVSD (%RBX,%RAX,8),%XMM3 |
(145) 0x79c9 VFMADD231SD (%R11,%R13,8),%XMM3,%XMM2 |
(145) 0x79cf INC %R13 |
(145) 0x79d2 CMP %R13,%R10 |
(145) 0x79d5 JNE 79c0 |
(144) 0x79d7 JMP 78f0 |
0x79dc VUCOMISD 0x32d4(%RIP),%XMM0 |
0x79e4 JNE 7c0c |
0x79ea CMP %R15,%R14 |
0x79ed JGE 7d1c |
0x79f3 VXORPD 0x32c3(%RIP){1to2},%XMM5,%XMM0 |
0x79fd MOV -0x30(%RBP),%RAX |
0x7a01 MOV (%RAX),%RDI |
0x7a04 MOV (%RSI),%RDX |
0x7a07 MOV %R14,%RAX |
0x7a0a NOT %RAX |
0x7a0d ADD %RAX,%R15 |
0x7a10 XOR %R8D,%R8D |
0x7a13 MOV %R15,-0x30(%RBP) |
0x7a17 MOV %RDX,-0x38(%RBP) |
0x7a1b JMP 7a33 |
(129) 0x7a1d VMOVSD %XMM1,(%RDX,%R9,8) |
(129) 0x7a23 LEA 0x1(%R8),%RAX |
(129) 0x7a27 CMP %R15,%R8 |
(129) 0x7a2a MOV %RAX,%R8 |
(129) 0x7a2d JE 7d1c |
(129) 0x7a33 LEA (%R14,%R8,1),%R9 |
(129) 0x7a37 VMULSD (%RCX,%R9,8),%XMM0,%XMM1 |
(129) 0x7a3d MOV (%RDI,%R9,8),%RSI |
(129) 0x7a41 MOV 0x8(%RDI,%R9,8),%R10 |
(129) 0x7a46 MOV %R10,%RAX |
(129) 0x7a49 SUB %RSI,%RAX |
(129) 0x7a4c JLE 7a1d |
(129) 0x7a4e MOV -0x48(%RBP),%RCX |
(129) 0x7a52 MOV (%RCX),%R11 |
(129) 0x7a55 MOV 0x20(%RBP),%RCX |
(129) 0x7a59 MOV (%RCX),%RBX |
(129) 0x7a5c MOV 0x10(%RBP),%RCX |
(129) 0x7a60 MOV (%RCX),%R12 |
(129) 0x7a63 MOV %RAX,%R13 |
(129) 0x7a66 AND $-0x4,%R13 |
(129) 0x7a6a JE 7ad6 |
(129) 0x7a6c LEA -0x1(%R13),%RDX |
(129) 0x7a70 LEA (%R11,%RSI,8),%RCX |
(129) 0x7a74 LEA (%R12,%RSI,8),%R14 |
(129) 0x7a78 VXORPD %XMM2,%XMM2,%XMM2 |
(129) 0x7a7c XOR %R15D,%R15D |
(129) 0x7a7f NOP |
(131) 0x7a80 VMOVUPD (%R14,%R15,8),%YMM3 |
(131) 0x7a86 KXNORW %K0,%K0,%K1 |
(131) 0x7a8a VXORPD %XMM4,%XMM4,%XMM4 |
(131) 0x7a8e VGATHERQPD (%RBX,%YMM3,8),%YMM4{%K1} |
(131) 0x7a95 VFNMADD231PD (%RCX,%R15,8),%YMM4,%YMM2 |
(131) 0x7a9b ADD $0x4,%R15 |
(131) 0x7a9f CMP %RDX,%R15 |
(131) 0x7aa2 JBE 7a80 |
(129) 0x7aa4 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(129) 0x7aaa VADDPD %XMM3,%XMM2,%XMM2 |
(129) 0x7aae VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(129) 0x7ab3 VADDSD %XMM3,%XMM2,%XMM2 |
(129) 0x7ab7 VADDSD %XMM2,%XMM1,%XMM1 |
(129) 0x7abb CMP %R13,%RAX |
(129) 0x7abe MOV -0x40(%RBP),%R14 |
(129) 0x7ac2 MOV -0x30(%RBP),%R15 |
(129) 0x7ac6 MOV 0x28(%RBP),%RCX |
(129) 0x7aca MOV -0x38(%RBP),%RDX |
(129) 0x7ace JE 7a1d |
(129) 0x7ad4 JMP 7add |
(129) 0x7ad6 XOR %R13D,%R13D |
(129) 0x7ad9 MOV 0x28(%RBP),%RCX |
(129) 0x7add ADD %RSI,%R13 |
(130) 0x7ae0 MOV (%R12,%R13,8),%RAX |
(130) 0x7ae4 VMOVSD (%RBX,%RAX,8),%XMM2 |
(130) 0x7ae9 VFNMADD231SD (%R11,%R13,8),%XMM2,%XMM1 |
(130) 0x7aef INC %R13 |
(130) 0x7af2 CMP %R13,%R10 |
(130) 0x7af5 JNE 7ae0 |
(129) 0x7af7 JMP 7a1d |
0x7afc CMP %R15,%R14 |
0x7aff JGE 7d1c |
0x7b05 MOV -0x30(%RBP),%RAX |
0x7b09 MOV (%RAX),%RDI |
0x7b0c MOV (%RSI),%RSI |
0x7b0f MOV %R14,%RAX |
0x7b12 NOT %RAX |
0x7b15 ADD %RAX,%R15 |
0x7b18 XOR %R8D,%R8D |
0x7b1b MOV %R15,-0x30(%RBP) |
0x7b1f MOV %RSI,-0x38(%RBP) |
0x7b23 JMP 7b3f |
(135) 0x7b25 VMULSD %XMM0,%XMM1,%XMM1 |
(135) 0x7b29 VMOVSD %XMM1,(%RSI,%R9,8) |
(135) 0x7b2f LEA 0x1(%R8),%RAX |
(135) 0x7b33 CMP %R15,%R8 |
(135) 0x7b36 MOV %RAX,%R8 |
(135) 0x7b39 JE 7d1c |
(135) 0x7b3f LEA (%R14,%R8,1),%R9 |
(135) 0x7b43 VMOVSD (%RCX,%R9,8),%XMM1 |
(135) 0x7b49 MOV (%RDI,%R9,8),%RDX |
(135) 0x7b4d MOV 0x8(%RDI,%R9,8),%R10 |
(135) 0x7b52 MOV %R10,%RAX |
(135) 0x7b55 SUB %RDX,%RAX |
(135) 0x7b58 JLE 7b25 |
(135) 0x7b5a MOV -0x48(%RBP),%RCX |
(135) 0x7b5e MOV (%RCX),%R11 |
(135) 0x7b61 MOV 0x20(%RBP),%RCX |
(135) 0x7b65 MOV (%RCX),%RBX |
(135) 0x7b68 MOV 0x10(%RBP),%RCX |
(135) 0x7b6c MOV (%RCX),%R12 |
(135) 0x7b6f MOV %RAX,%R13 |
(135) 0x7b72 AND $-0x4,%R13 |
(135) 0x7b76 JE 7be6 |
(135) 0x7b78 LEA -0x1(%R13),%RCX |
(135) 0x7b7c LEA (%R11,%RDX,8),%RSI |
(135) 0x7b80 LEA (%R12,%RDX,8),%R14 |
(135) 0x7b84 VXORPD %XMM2,%XMM2,%XMM2 |
(135) 0x7b88 XOR %R15D,%R15D |
(135) 0x7b8b NOPL (%RAX,%RAX,1) |
(137) 0x7b90 VMOVUPD (%R14,%R15,8),%YMM3 |
(137) 0x7b96 KXNORW %K0,%K0,%K1 |
(137) 0x7b9a VXORPD %XMM4,%XMM4,%XMM4 |
(137) 0x7b9e VGATHERQPD (%RBX,%YMM3,8),%YMM4{%K1} |
(137) 0x7ba5 VFMADD231PD (%RSI,%R15,8),%YMM4,%YMM2 |
(137) 0x7bab ADD $0x4,%R15 |
(137) 0x7baf CMP %RCX,%R15 |
(137) 0x7bb2 JBE 7b90 |
(135) 0x7bb4 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(135) 0x7bba VADDPD %XMM3,%XMM2,%XMM2 |
(135) 0x7bbe VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(135) 0x7bc3 VADDSD %XMM3,%XMM2,%XMM2 |
(135) 0x7bc7 VADDSD %XMM2,%XMM1,%XMM1 |
(135) 0x7bcb CMP %R13,%RAX |
(135) 0x7bce MOV -0x40(%RBP),%R14 |
(135) 0x7bd2 MOV -0x30(%RBP),%R15 |
(135) 0x7bd6 MOV 0x28(%RBP),%RCX |
(135) 0x7bda MOV -0x38(%RBP),%RSI |
(135) 0x7bde JE 7b25 |
(135) 0x7be4 JMP 7bed |
(135) 0x7be6 XOR %R13D,%R13D |
(135) 0x7be9 MOV 0x28(%RBP),%RCX |
(135) 0x7bed ADD %RDX,%R13 |
(136) 0x7bf0 MOV (%R12,%R13,8),%RAX |
(136) 0x7bf4 VMOVSD (%RBX,%RAX,8),%XMM2 |
(136) 0x7bf9 VFMADD231SD (%R11,%R13,8),%XMM2,%XMM1 |
(136) 0x7bff INC %R13 |
(136) 0x7c02 CMP %R13,%R10 |
(136) 0x7c05 JNE 7bf0 |
(135) 0x7c07 JMP 7b25 |
0x7c0c CMP %R15,%R14 |
0x7c0f JGE 7d1c |
0x7c15 MOV -0x30(%RBP),%RAX |
0x7c19 MOV (%RAX),%RDI |
0x7c1c MOV (%RSI),%RDX |
0x7c1f MOV %R14,%RAX |
0x7c22 NOT %RAX |
0x7c25 ADD %RAX,%R15 |
0x7c28 XOR %R8D,%R8D |
0x7c2b MOV %R15,-0x30(%RBP) |
0x7c2f MOV %RDX,-0x38(%RBP) |
0x7c33 JMP 7c4f |
(126) 0x7c35 VMULSD %XMM0,%XMM1,%XMM1 |
(126) 0x7c39 VMOVSD %XMM1,(%RDX,%R9,8) |
(126) 0x7c3f LEA 0x1(%R8),%RAX |
(126) 0x7c43 CMP %R15,%R8 |
(126) 0x7c46 MOV %RAX,%R8 |
(126) 0x7c49 JE 7d1c |
(126) 0x7c4f LEA (%R14,%R8,1),%R9 |
(126) 0x7c53 VMULSD (%RCX,%R9,8),%XMM5,%XMM1 |
(126) 0x7c59 MOV (%RDI,%R9,8),%RSI |
(126) 0x7c5d MOV 0x8(%RDI,%R9,8),%R10 |
(126) 0x7c62 MOV %R10,%RAX |
(126) 0x7c65 SUB %RSI,%RAX |
(126) 0x7c68 JLE 7c35 |
(126) 0x7c6a MOV -0x48(%RBP),%RCX |
(126) 0x7c6e MOV (%RCX),%R11 |
(126) 0x7c71 MOV 0x20(%RBP),%RCX |
(126) 0x7c75 MOV (%RCX),%RBX |
(126) 0x7c78 MOV 0x10(%RBP),%RCX |
(126) 0x7c7c MOV (%RCX),%R12 |
(126) 0x7c7f MOV %RAX,%R13 |
(126) 0x7c82 AND $-0x4,%R13 |
(126) 0x7c86 JE 7cf6 |
(126) 0x7c88 LEA -0x1(%R13),%RDX |
(126) 0x7c8c LEA (%R11,%RSI,8),%RCX |
(126) 0x7c90 LEA (%R12,%RSI,8),%R14 |
(126) 0x7c94 VXORPD %XMM2,%XMM2,%XMM2 |
(126) 0x7c98 XOR %R15D,%R15D |
(126) 0x7c9b NOPL (%RAX,%RAX,1) |
(128) 0x7ca0 VMOVUPD (%R14,%R15,8),%YMM3 |
(128) 0x7ca6 VXORPD %XMM4,%XMM4,%XMM4 |
(128) 0x7caa KXNORW %K0,%K0,%K1 |
(128) 0x7cae VGATHERQPD (%RBX,%YMM3,8),%YMM4{%K1} |
(128) 0x7cb5 VFMADD231PD (%RCX,%R15,8),%YMM4,%YMM2 |
(128) 0x7cbb ADD $0x4,%R15 |
(128) 0x7cbf CMP %RDX,%R15 |
(128) 0x7cc2 JBE 7ca0 |
(126) 0x7cc4 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(126) 0x7cca VADDPD %XMM3,%XMM2,%XMM2 |
(126) 0x7cce VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(126) 0x7cd3 VADDSD %XMM3,%XMM2,%XMM2 |
(126) 0x7cd7 VADDSD %XMM2,%XMM1,%XMM1 |
(126) 0x7cdb CMP %R13,%RAX |
(126) 0x7cde MOV -0x40(%RBP),%R14 |
(126) 0x7ce2 MOV -0x30(%RBP),%R15 |
(126) 0x7ce6 MOV 0x28(%RBP),%RCX |
(126) 0x7cea MOV -0x38(%RBP),%RDX |
(126) 0x7cee JE 7c35 |
(126) 0x7cf4 JMP 7cfd |
(126) 0x7cf6 XOR %R13D,%R13D |
(126) 0x7cf9 MOV 0x28(%RBP),%RCX |
(126) 0x7cfd ADD %RSI,%R13 |
(127) 0x7d00 MOV (%R12,%R13,8),%RAX |
(127) 0x7d04 VMOVSD (%RBX,%RAX,8),%XMM2 |
(127) 0x7d09 VFMADD231SD (%R11,%R13,8),%XMM2,%XMM1 |
(127) 0x7d0f INC %R13 |
(127) 0x7d12 CMP %R13,%R10 |
(127) 0x7d15 JNE 7d00 |
(126) 0x7d17 JMP 7c35 |
0x7d1c ADD $0x28,%RSP |
0x7d20 POP %RBX |
0x7d21 POP %R12 |
0x7d23 POP %R13 |
0x7d25 POP %R14 |
0x7d27 POP %R15 |
0x7d29 POP %RBP |
0x7d2a VZEROUPPER |
0x7d2d RET |
0x7d2e XCHG %AX,%AX |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►100.00+ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Path / |
Source file and lines | csr_matvec.c:243-404 |
Module | libseq_mv.so |
nb instructions | 320 |
nb uops | 357 |
loop length | 1268 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 8 |
micro-operation queue | 59.50 cycles |
front end | 59.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 27.00 | 25.00 | 25.33 | 25.33 | 23.50 | 25.00 | 27.00 | 23.50 | 23.50 | 23.50 | 25.00 | 25.33 |
cycles | 27.00 | 27.40 | 25.33 | 25.33 | 23.50 | 25.00 | 27.00 | 23.50 | 23.50 | 23.50 | 25.00 | 25.33 |
Cycles executing div or sqrt instructions | 32.00 |
FE+BE cycles | 56.66 |
Stall cycles | 0.00 |
Front-end | 59.50 |
Dispatch | 27.40 |
DIV/SQRT | 32.00 |
Overall L1 | 59.50 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 1% |
all | 11% |
load | 6% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
all | 2% |
load | 2% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 4% |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 10% |
all | 13% |
load | 13% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 11% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x28,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 2220 <hypre_GetThreadNum@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x20(%R15),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R15),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 2310 <hypre_NumActiveThreads@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x1(%R14,%RAX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %RCX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE 6de2 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x82> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %RCX | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
TEST %RBX,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 6deb <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x8b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RBX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 6df3 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x93> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x40(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R12,%RCX,8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
IMUL %RBX,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 22e0 <hypre_LowerBound@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
SUB %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SAR $0x3,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RAX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 6df3 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x93> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %ECX | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
TEST %RBX,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JG 6db9 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x59> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVQ $0,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 2220 <hypre_GetThreadNum@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x20(%R15),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R15),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%R15),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 2310 <hypre_NumActiveThreads@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x1(%R14,%RAX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %RCX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE 6e26 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xc6> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %RCX | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
JMP 6e2a <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xca> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %ECX | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV -0x40(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RBX,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 705d <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x2fd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INC %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RBX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 6e5c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R12,%R15,8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
IMUL %RBX,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 22e0 <hypre_LowerBound@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R12,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SAR $0x3,%R15 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 6e98 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x138> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x208178(%RIP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x41a7(%RIP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x4148(%RIP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 2380 <hypre_fprintf@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x40b3(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0xf8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 23c0 <hypre_error_handler@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x18(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 6ea6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x146> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RBX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 6edd <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x17d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x208133(%RIP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x4162(%RIP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x4112(%RIP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 2380 <hypre_fprintf@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x406e(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0xf9,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 23c0 <hypre_error_handler@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R15,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 6eec <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x18c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RBX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 6f28 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1c8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x2080ed(%RIP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x411c(%RIP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x40ee(%RIP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 2380 <hypre_fprintf@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x4028(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0xfa,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 23c0 <hypre_error_handler@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVQ %R13,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD %XMM1,%XMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JNE 706e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x30e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x3d69(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 71ac <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x44c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7d1c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 6f96 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x236> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R15D,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JG 6e61 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x101> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 6e98 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x138> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV 0x28(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VUCOMISD 0x3c3e(%RIP),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 72cd <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x56d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x3c28(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 740c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x6ac> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7d1c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x3c0b(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 70d6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x376> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x3b04(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 753c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x7dc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7d1c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 7206 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x4a6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x39db(%RIP),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 765d <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x8fd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x39cd(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 778c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa2c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7d1c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 7336 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x5d6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x38a4(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 78bc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb5c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7d1c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 7466 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x706> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7d1c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 758a <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x82a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x364b(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 79dc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xc7c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7d1c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 76b6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x956> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x3524(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 7afc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd9c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7d1c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x34ff(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 77e6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa86> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7d1c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x33dd(%RIP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 790a <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xbaa> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x32d4(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 7c0c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xeac> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7d1c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VXORPD 0x32c3(%RIP){1to2},%XMM5,%XMM0 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 7a33 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xcd3> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7d1c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 7b3f <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xddf> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7d1c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 7c4f <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xeef> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD $0x28,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | csr_matvec.c:243-404 |
Module | libseq_mv.so |
nb instructions | 320 |
nb uops | 357 |
loop length | 1268 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 8 |
micro-operation queue | 59.50 cycles |
front end | 59.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 27.00 | 25.00 | 25.33 | 25.33 | 23.50 | 25.00 | 27.00 | 23.50 | 23.50 | 23.50 | 25.00 | 25.33 |
cycles | 27.00 | 27.40 | 25.33 | 25.33 | 23.50 | 25.00 | 27.00 | 23.50 | 23.50 | 23.50 | 25.00 | 25.33 |
Cycles executing div or sqrt instructions | 32.00 |
FE+BE cycles | 56.66 |
Stall cycles | 0.00 |
Front-end | 59.50 |
Dispatch | 27.40 |
DIV/SQRT | 32.00 |
Overall L1 | 59.50 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 1% |
all | 11% |
load | 6% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
all | 2% |
load | 2% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 4% |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 10% |
all | 13% |
load | 13% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 11% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x28,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 2220 <hypre_GetThreadNum@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x20(%R15),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R15),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 2310 <hypre_NumActiveThreads@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x1(%R14,%RAX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %RCX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE 6de2 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x82> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %RCX | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
TEST %RBX,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 6deb <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x8b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RBX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 6df3 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x93> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x40(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R12,%RCX,8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
IMUL %RBX,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 22e0 <hypre_LowerBound@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
SUB %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SAR $0x3,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RAX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 6df3 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x93> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %ECX | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
TEST %RBX,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JG 6db9 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x59> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVQ $0,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 2220 <hypre_GetThreadNum@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x20(%R15),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R15),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%R15),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 2310 <hypre_NumActiveThreads@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x1(%R14,%RAX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %RCX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE 6e26 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xc6> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %RCX | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
JMP 6e2a <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xca> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %ECX | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV -0x40(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RBX,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 705d <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x2fd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INC %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RBX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 6e5c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R12,%R15,8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
IMUL %RBX,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 22e0 <hypre_LowerBound@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R12,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SAR $0x3,%R15 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 6e98 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x138> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x208178(%RIP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x41a7(%RIP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x4148(%RIP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 2380 <hypre_fprintf@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x40b3(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0xf8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 23c0 <hypre_error_handler@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x18(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 6ea6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x146> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RBX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 6edd <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x17d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x208133(%RIP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x4162(%RIP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x4112(%RIP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 2380 <hypre_fprintf@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x406e(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0xf9,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 23c0 <hypre_error_handler@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R15,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 6eec <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x18c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RBX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 6f28 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1c8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x2080ed(%RIP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x411c(%RIP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x40ee(%RIP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 2380 <hypre_fprintf@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x4028(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0xfa,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 23c0 <hypre_error_handler@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVQ %R13,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD %XMM1,%XMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JNE 706e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x30e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x3d69(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 71ac <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x44c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7d1c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 6f96 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x236> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R15D,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JG 6e61 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x101> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 6e98 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x138> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV 0x28(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VUCOMISD 0x3c3e(%RIP),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 72cd <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x56d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x3c28(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 740c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x6ac> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7d1c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x3c0b(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 70d6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x376> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x3b04(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 753c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x7dc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7d1c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 7206 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x4a6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x39db(%RIP),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 765d <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x8fd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x39cd(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 778c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa2c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7d1c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 7336 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x5d6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x38a4(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 78bc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb5c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7d1c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 7466 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x706> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7d1c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 758a <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x82a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x364b(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 79dc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xc7c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7d1c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 76b6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x956> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x3524(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 7afc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd9c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7d1c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x34ff(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 77e6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa86> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7d1c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x33dd(%RIP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 790a <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xbaa> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x32d4(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 7c0c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xeac> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7d1c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VXORPD 0x32c3(%RIP){1to2},%XMM5,%XMM0 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 7a33 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xcd3> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7d1c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 7b3f <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xddf> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 7d1c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 7c4f <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xeef> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD $0x28,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_CSRMatrixMatvecOutOfPlace.extracted– | 17.05 | 3.6 |
▼Loop 141 - csr_matvec.c:334-341 - libseq_mv.so– | 0.91 | 0.17 |
○Loop 142 - csr_matvec.c:337-339 - libseq_mv.so | 0.44 | 0.08 |
○Loop 143 - csr_matvec.c:337-339 - libseq_mv.so | 0.12 | 0.02 |
▼Loop 147 - csr_matvec.c:307-314 - libseq_mv.so– | 0.34 | 0.06 |
○Loop 149 - csr_matvec.c:310-312 - libseq_mv.so | 6.9 | 1.31 |
○Loop 148 - csr_matvec.c:310-312 - libseq_mv.so | 0.96 | 0.18 |
▼Loop 159 - csr_matvec.c:256-263 - libseq_mv.so– | 0.26 | 0.05 |
○Loop 161 - csr_matvec.c:259-261 - libseq_mv.so | 6.23 | 1.18 |
○Loop 160 - csr_matvec.c:259-261 - libseq_mv.so | 0.87 | 0.17 |
▼Loop 153 - csr_matvec.c:280-287 - libseq_mv.so– | 0 | 0 |
○Loop 154 - csr_matvec.c:283-285 - libseq_mv.so | 0 | 0 |
○Loop 155 - csr_matvec.c:283-285 - libseq_mv.so | 0 | 0 |
▼Loop 129 - csr_matvec.c:385-392 - libseq_mv.so– | 0 | 0 |
○Loop 130 - csr_matvec.c:388-390 - libseq_mv.so | 0 | 0 |
○Loop 131 - csr_matvec.c:388-390 - libseq_mv.so | 0 | 0 |
▼Loop 144 - csr_matvec.c:319-326 - libseq_mv.so– | 0 | 0 |
○Loop 146 - csr_matvec.c:322-324 - libseq_mv.so | 0 | 0 |
○Loop 145 - csr_matvec.c:322-324 - libseq_mv.so | 0 | 0 |
▼Loop 150 - csr_matvec.c:295-302 - libseq_mv.so– | 0 | 0 |
○Loop 152 - csr_matvec.c:298-300 - libseq_mv.so | 0 | 0 |
○Loop 151 - csr_matvec.c:298-300 - libseq_mv.so | 0 | 0 |
▼Loop 138 - csr_matvec.c:346-353 - libseq_mv.so– | 0 | 0 |
○Loop 140 - csr_matvec.c:349-351 - libseq_mv.so | 0 | 0 |
○Loop 139 - csr_matvec.c:349-351 - libseq_mv.so | 0 | 0 |
▼Loop 156 - csr_matvec.c:268-275 - libseq_mv.so– | 0 | 0 |
○Loop 158 - csr_matvec.c:271-273 - libseq_mv.so | 0 | 0 |
○Loop 157 - csr_matvec.c:271-273 - libseq_mv.so | 0 | 0 |
▼Loop 132 - csr_matvec.c:373-380 - libseq_mv.so– | 0 | 0 |
○Loop 133 - csr_matvec.c:376-378 - libseq_mv.so | 0 | 0 |
○Loop 134 - csr_matvec.c:376-378 - libseq_mv.so | 0 | 0 |
▼Loop 126 - csr_matvec.c:397-404 - libseq_mv.so– | 0 | 0 |
○Loop 128 - csr_matvec.c:400-402 - libseq_mv.so | 0 | 0 |
○Loop 127 - csr_matvec.c:400-402 - libseq_mv.so | 0 | 0 |
▼Loop 135 - csr_matvec.c:358-365 - libseq_mv.so– | 0 | 0 |
○Loop 137 - csr_matvec.c:361-363 - libseq_mv.so | 0 | 0 |
○Loop 136 - csr_matvec.c:361-363 - libseq_mv.so | 0 | 0 |