Function: hypre_CSRMatrixMatvecOutOfPlace.extracted | Module: exec | Source: csr_matvec.c:243-404 [...] | Coverage: 16.95% |
---|
Function: hypre_CSRMatrixMatvecOutOfPlace.extracted | Module: exec | Source: csr_matvec.c:243-404 [...] | Coverage: 16.95% |
---|
/scratch_na/users/xoserete/qaas_runs/171-415-3872/intel/AMG/build/AMG/AMG/seq_mv/csr_matvec.c: 243 - 404 |
-------------------------------------------------------------------------------- |
243: #pragma omp parallel private(i,jj,tempx) |
244: #endif |
245: { |
246: HYPRE_Int iBegin = hypre_CSRMatrixGetLoadBalancedPartitionBegin(A); |
247: HYPRE_Int iEnd = hypre_CSRMatrixGetLoadBalancedPartitionEnd(A); |
248: hypre_assert(iBegin <= iEnd); |
249: hypre_assert(iBegin >= 0 && iBegin <= num_rows); |
250: hypre_assert(iEnd >= 0 && iEnd <= num_rows); |
251: |
252: if (0 == temp) |
253: { |
254: if (1 == alpha) // JSP: a common path |
255: { |
256: for (i = iBegin; i < iEnd; i++) |
257: { |
258: tempx = 0.0; |
259: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
260: { |
261: tempx += A_data[jj] * x_data[A_j[jj]]; |
262: } |
263: y_data[i] = tempx; |
264: } |
265: } // y = A*x |
266: else if (-1 == alpha) |
267: { |
268: for (i = iBegin; i < iEnd; i++) |
269: { |
270: tempx = 0.0; |
271: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
272: { |
273: tempx -= A_data[jj] * x_data[A_j[jj]]; |
274: } |
275: y_data[i] = tempx; |
276: } |
277: } // y = -A*x |
278: else |
279: { |
280: for (i = iBegin; i < iEnd; i++) |
281: { |
282: tempx = 0.0; |
283: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
284: { |
285: tempx += A_data[jj] * x_data[A_j[jj]]; |
286: } |
287: y_data[i] = alpha*tempx; |
288: } |
289: } // y = alpha*A*x |
290: } // temp == 0 |
291: else if (-1 == temp) // beta == -alpha |
292: { |
293: if (1 == alpha) // JSP: a common path |
294: { |
295: for (i = iBegin; i < iEnd; i++) |
296: { |
297: tempx = -b_data[i]; |
298: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
299: { |
300: tempx += A_data[jj] * x_data[A_j[jj]]; |
301: } |
302: y_data[i] = tempx; |
303: } |
304: } // y = A*x - y |
305: else if (-1 == alpha) // JSP: a common path |
306: { |
307: for (i = iBegin; i < iEnd; i++) |
308: { |
309: tempx = b_data[i]; |
310: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
311: { |
312: tempx -= A_data[jj] * x_data[A_j[jj]]; |
313: } |
314: y_data[i] = tempx; |
315: } |
316: } // y = -A*x + y |
317: else |
318: { |
319: for (i = iBegin; i < iEnd; i++) |
320: { |
321: tempx = -b_data[i]; |
322: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
323: { |
324: tempx += A_data[jj] * x_data[A_j[jj]]; |
325: } |
326: y_data[i] = alpha*tempx; |
327: } |
328: } // y = alpha*(A*x - y) |
329: } // temp == -1 |
330: else if (1 == temp) |
331: { |
332: if (1 == alpha) // JSP: a common path |
333: { |
334: for (i = iBegin; i < iEnd; i++) |
335: { |
336: tempx = b_data[i]; |
337: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
338: { |
339: tempx += A_data[jj] * x_data[A_j[jj]]; |
340: } |
341: y_data[i] = tempx; |
342: } |
343: } // y = A*x + y |
344: else if (-1 == alpha) |
345: { |
346: for (i = iBegin; i < iEnd; i++) |
347: { |
348: tempx = -b_data[i]; |
349: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
350: { |
351: tempx -= A_data[jj] * x_data[A_j[jj]]; |
352: } |
353: y_data[i] = tempx; |
354: } |
355: } // y = -A*x - y |
356: else |
357: { |
358: for (i = iBegin; i < iEnd; i++) |
359: { |
360: tempx = b_data[i]; |
361: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
362: { |
363: tempx += A_data[jj] * x_data[A_j[jj]]; |
364: } |
365: y_data[i] = alpha*tempx; |
[...] |
371: if (1 == alpha) // JSP: a common path |
372: { |
373: for (i = iBegin; i < iEnd; i++) |
374: { |
375: tempx = b_data[i]*temp; |
376: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
377: { |
378: tempx += A_data[jj] * x_data[A_j[jj]]; |
379: } |
380: y_data[i] = tempx; |
381: } |
382: } // y = A*x + temp*y |
383: else if (-1 == alpha) |
384: { |
385: for (i = iBegin; i < iEnd; i++) |
386: { |
387: tempx = -b_data[i]*temp; |
388: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
389: { |
390: tempx -= A_data[jj] * x_data[A_j[jj]]; |
391: } |
392: y_data[i] = tempx; |
393: } |
394: } // y = -A*x - temp*y |
395: else |
396: { |
397: for (i = iBegin; i < iEnd; i++) |
398: { |
399: tempx = b_data[i]*temp; |
400: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
401: { |
402: tempx += A_data[jj] * x_data[A_j[jj]]; |
403: } |
404: y_data[i] = alpha*tempx; |
0x4dd830 PUSH %RBP |
0x4dd831 MOV %RSP,%RBP |
0x4dd834 PUSH %R15 |
0x4dd836 PUSH %R14 |
0x4dd838 PUSH %R13 |
0x4dd83a PUSH %R12 |
0x4dd83c PUSH %RBX |
0x4dd83d SUB $0x18,%RSP |
0x4dd841 MOV %R9,%RBX |
0x4dd844 MOV %R8,%R14 |
0x4dd847 MOV %RCX,%R12 |
0x4dd84a MOV %RDX,-0x38(%RBP) |
0x4dd84e MOV %RCX,%RDI |
0x4dd851 CALL 4dc2d0 <hypre_CSRMatrixGetLoadBalancedPartitionBegin> |
0x4dd856 MOV %R12,%RDI |
0x4dd859 MOV %RAX,%R12 |
0x4dd85c CALL 4dc350 <hypre_CSRMatrixGetLoadBalancedPartitionEnd> |
0x4dd861 MOV %RAX,%R15 |
0x4dd864 CMP %RAX,%R12 |
0x4dd867 JLE 4dd897 |
0x4dd869 MOV 0x25a350(%RIP),%RDI |
0x4dd870 MOV $0x510905,%ESI |
0x4dd875 MOV $0x51292b,%EDX |
0x4dd87a XOR %EAX,%EAX |
0x4dd87c CALL 4e6c10 <hypre_fprintf> |
0x4dd881 MOV $0x5132d1,%EDI |
0x4dd886 MOV $0xf8,%ESI |
0x4dd88b MOV $0x1,%EDX |
0x4dd890 XOR %ECX,%ECX |
0x4dd892 CALL 4e9300 <hypre_error_handler> |
0x4dd897 MOV 0x18(%RBP),%R13 |
0x4dd89b TEST %R12,%R12 |
0x4dd89e JS 4dd8a5 |
0x4dd8a0 CMP %R13,%R12 |
0x4dd8a3 JLE 4dd8d3 |
0x4dd8a5 MOV 0x25a314(%RIP),%RDI |
0x4dd8ac MOV $0x510905,%ESI |
0x4dd8b1 MOV $0x513358,%EDX |
0x4dd8b6 XOR %EAX,%EAX |
0x4dd8b8 CALL 4e6c10 <hypre_fprintf> |
0x4dd8bd MOV $0x5132d1,%EDI |
0x4dd8c2 MOV $0xf9,%ESI |
0x4dd8c7 MOV $0x1,%EDX |
0x4dd8cc XOR %ECX,%ECX |
0x4dd8ce CALL 4e9300 <hypre_error_handler> |
0x4dd8d3 VMOVSD 0x38(%RBP),%XMM5 |
0x4dd8d8 TEST %R15,%R15 |
0x4dd8db JS 4dd8e2 |
0x4dd8dd CMP %R13,%R15 |
0x4dd8e0 JLE 4dd915 |
0x4dd8e2 MOV 0x25a2d7(%RIP),%RDI |
0x4dd8e9 MOV $0x510905,%ESI |
0x4dd8ee MOV $0x51337a,%EDX |
0x4dd8f3 XOR %EAX,%EAX |
0x4dd8f5 CALL 4e6c10 <hypre_fprintf> |
0x4dd8fa MOV $0x5132d1,%EDI |
0x4dd8ff MOV $0xfa,%ESI |
0x4dd904 MOV $0x1,%EDX |
0x4dd909 XOR %ECX,%ECX |
0x4dd90b CALL 4e9300 <hypre_error_handler> |
0x4dd910 VMOVSD 0x38(%RBP),%XMM5 |
0x4dd915 MOV 0x20(%RBP),%RCX |
0x4dd919 MOV 0x10(%RBP),%RDX |
0x4dd91d VMOVSD -0x38(%RBP),%XMM0 |
0x4dd922 VXORPD %XMM1,%XMM1,%XMM1 |
0x4dd926 VUCOMISD %XMM1,%XMM5 |
0x4dd92a MOV %R12,-0x38(%RBP) |
0x4dd92e MOV %RBX,-0x30(%RBP) |
0x4dd932 JNE 4dda3c |
0x4dd938 VUCOMISD 0x20b30(%RIP),%XMM0 |
0x4dd940 JNE 4ddb5c |
0x4dd946 CMP %R15,%R12 |
0x4dd949 JGE 4de59c |
0x4dd94f MOV %R12,%RAX |
0x4dd952 NOT %RAX |
0x4dd955 ADD %RAX,%R15 |
0x4dd958 XOR %ESI,%ESI |
0x4dd95a JMP 4dd979 |
0x4dd95c NOPL (%RAX) |
(4319) 0x4dd960 MOV 0x30(%RBP),%RAX |
(4319) 0x4dd964 VMOVSD %XMM0,(%RAX,%RDI,8) |
(4319) 0x4dd969 LEA 0x1(%RSI),%RAX |
(4319) 0x4dd96d CMP %R15,%RSI |
(4319) 0x4dd970 MOV %RAX,%RSI |
(4319) 0x4dd973 JE 4de59c |
(4319) 0x4dd979 LEA (%R12,%RSI,1),%RDI |
(4319) 0x4dd97d MOV (%RBX,%RDI,8),%R10 |
(4319) 0x4dd981 MOV 0x8(%RBX,%RDI,8),%R8 |
(4319) 0x4dd986 VXORPD %XMM0,%XMM0,%XMM0 |
(4319) 0x4dd98a MOV %R8,%R11 |
(4319) 0x4dd98d SUB %R10,%R11 |
(4319) 0x4dd990 JLE 4dd960 |
(4319) 0x4dd992 MOV %R11,%R9 |
(4319) 0x4dd995 AND $-0x4,%R9 |
(4319) 0x4dd999 JE 4dda0e |
(4319) 0x4dd99b MOV %R15,%RBX |
(4319) 0x4dd99e LEA -0x1(%R9),%R15 |
(4319) 0x4dd9a2 LEA (%R14,%R10,8),%R13 |
(4319) 0x4dd9a6 LEA (%RDX,%R10,8),%RAX |
(4319) 0x4dd9aa VXORPD %XMM0,%XMM0,%XMM0 |
(4319) 0x4dd9ae XOR %R12D,%R12D |
(4319) 0x4dd9b1 NOPW %CS:(%RAX,%RAX,1) |
(4321) 0x4dd9c0 VMOVUPD (%RAX,%R12,8),%YMM1 |
(4321) 0x4dd9c6 KXNORW %K0,%K0,%K1 |
(4321) 0x4dd9ca VXORPD %XMM2,%XMM2,%XMM2 |
(4321) 0x4dd9ce VGATHERQPD (%RCX,%YMM1,8),%YMM2{%K1} |
(4321) 0x4dd9d5 VFMADD231PD (%R13,%R12,8),%YMM2,%YMM0 |
(4321) 0x4dd9dc ADD $0x4,%R12 |
(4321) 0x4dd9e0 CMP %R15,%R12 |
(4321) 0x4dd9e3 JBE 4dd9c0 |
(4319) 0x4dd9e5 VEXTRACTF128 $0x1,%YMM0,%XMM1 |
(4319) 0x4dd9eb VADDPD %XMM1,%XMM0,%XMM0 |
(4319) 0x4dd9ef VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(4319) 0x4dd9f4 VADDSD %XMM1,%XMM0,%XMM0 |
(4319) 0x4dd9f8 CMP %R9,%R11 |
(4319) 0x4dd9fb MOV -0x38(%RBP),%R12 |
(4319) 0x4dd9ff MOV %RBX,%R15 |
(4319) 0x4dda02 MOV -0x30(%RBP),%RBX |
(4319) 0x4dda06 JE 4dd960 |
(4319) 0x4dda0c JMP 4dda11 |
(4319) 0x4dda0e XOR %R9D,%R9D |
(4319) 0x4dda11 ADD %R10,%R9 |
(4319) 0x4dda14 NOPW %CS:(%RAX,%RAX,1) |
(4320) 0x4dda20 MOV (%RDX,%R9,8),%RAX |
(4320) 0x4dda24 VMOVSD (%RCX,%RAX,8),%XMM1 |
(4320) 0x4dda29 VFMADD231SD (%R14,%R9,8),%XMM1,%XMM0 |
(4320) 0x4dda2f INC %R9 |
(4320) 0x4dda32 CMP %R9,%R8 |
(4320) 0x4dda35 JNE 4dda20 |
(4319) 0x4dda37 JMP 4dd960 |
0x4dda3c VUCOMISD 0x218ec(%RIP),%XMM5 |
0x4dda44 MOV %R15,%RSI |
0x4dda47 JNE 4ddc5c |
0x4dda4d VUCOMISD 0x20a1b(%RIP),%XMM0 |
0x4dda55 JNE 4ddd7c |
0x4dda5b CMP %RSI,%R12 |
0x4dda5e MOV 0x28(%RBP),%R15 |
0x4dda62 JGE 4de59c |
0x4dda68 MOV %R12,%RAX |
0x4dda6b NOT %RAX |
0x4dda6e ADD %RAX,%RSI |
0x4dda71 XOR %EDI,%EDI |
0x4dda73 VMOVDDUP 0x21665(%RIP),%XMM0 |
0x4dda7b JMP 4dda9a |
0x4dda7d NOPL (%RAX) |
(4310) 0x4dda80 MOV 0x30(%RBP),%RAX |
(4310) 0x4dda84 VMOVSD %XMM1,(%RAX,%R8,8) |
(4310) 0x4dda8a LEA 0x1(%RDI),%RAX |
(4310) 0x4dda8e CMP %RSI,%RDI |
(4310) 0x4dda91 MOV %RAX,%RDI |
(4310) 0x4dda94 JE 4de59c |
(4310) 0x4dda9a LEA (%R12,%RDI,1),%R8 |
(4310) 0x4dda9e VMOVSD (%R15,%R8,8),%XMM1 |
(4310) 0x4ddaa4 VXORPD %XMM0,%XMM1,%XMM1 |
(4310) 0x4ddaa8 MOV (%RBX,%R8,8),%R11 |
(4310) 0x4ddaac MOV 0x8(%RBX,%R8,8),%R9 |
(4310) 0x4ddab1 MOV %R9,%R13 |
(4310) 0x4ddab4 SUB %R11,%R13 |
(4310) 0x4ddab7 JLE 4dda80 |
(4310) 0x4ddab9 MOV %R13,%R10 |
(4310) 0x4ddabc AND $-0x4,%R10 |
(4310) 0x4ddac0 JE 4ddb35 |
(4310) 0x4ddac2 MOV %RSI,%RBX |
(4310) 0x4ddac5 LEA -0x1(%R10),%R15 |
(4310) 0x4ddac9 LEA (%R14,%R11,8),%RSI |
(4310) 0x4ddacd LEA (%RDX,%R11,8),%RAX |
(4310) 0x4ddad1 VXORPD %XMM2,%XMM2,%XMM2 |
(4310) 0x4ddad5 XOR %R12D,%R12D |
(4310) 0x4ddad8 NOPL (%RAX,%RAX,1) |
(4312) 0x4ddae0 VMOVUPD (%RAX,%R12,8),%YMM3 |
(4312) 0x4ddae6 KXNORW %K0,%K0,%K1 |
(4312) 0x4ddaea VXORPD %XMM4,%XMM4,%XMM4 |
(4312) 0x4ddaee VGATHERQPD (%RCX,%YMM3,8),%YMM4{%K1} |
(4312) 0x4ddaf5 VFMADD231PD (%RSI,%R12,8),%YMM4,%YMM2 |
(4312) 0x4ddafb ADD $0x4,%R12 |
(4312) 0x4ddaff CMP %R15,%R12 |
(4312) 0x4ddb02 JBE 4ddae0 |
(4310) 0x4ddb04 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(4310) 0x4ddb0a VADDPD %XMM3,%XMM2,%XMM2 |
(4310) 0x4ddb0e VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(4310) 0x4ddb13 VADDSD %XMM3,%XMM2,%XMM2 |
(4310) 0x4ddb17 VADDSD %XMM2,%XMM1,%XMM1 |
(4310) 0x4ddb1b CMP %R10,%R13 |
(4310) 0x4ddb1e MOV -0x38(%RBP),%R12 |
(4310) 0x4ddb22 MOV %RBX,%RSI |
(4310) 0x4ddb25 MOV -0x30(%RBP),%RBX |
(4310) 0x4ddb29 MOV 0x28(%RBP),%R15 |
(4310) 0x4ddb2d JE 4dda80 |
(4310) 0x4ddb33 JMP 4ddb38 |
(4310) 0x4ddb35 XOR %R10D,%R10D |
(4310) 0x4ddb38 ADD %R11,%R10 |
(4310) 0x4ddb3b NOPL (%RAX,%RAX,1) |
(4311) 0x4ddb40 MOV (%RDX,%R10,8),%RAX |
(4311) 0x4ddb44 VMOVSD (%RCX,%RAX,8),%XMM2 |
(4311) 0x4ddb49 VFMADD231SD (%R14,%R10,8),%XMM2,%XMM1 |
(4311) 0x4ddb4f INC %R10 |
(4311) 0x4ddb52 CMP %R10,%R9 |
(4311) 0x4ddb55 JNE 4ddb40 |
(4310) 0x4ddb57 JMP 4dda80 |
0x4ddb5c VUCOMISD 0x217cc(%RIP),%XMM0 |
0x4ddb64 JNE 4dde8c |
0x4ddb6a CMP %R15,%R12 |
0x4ddb6d JGE 4de59c |
0x4ddb73 MOV %R12,%RAX |
0x4ddb76 NOT %RAX |
0x4ddb79 ADD %RAX,%R15 |
0x4ddb7c XOR %ESI,%ESI |
0x4ddb7e JMP 4ddb99 |
(4316) 0x4ddb80 MOV 0x30(%RBP),%RAX |
(4316) 0x4ddb84 VMOVSD %XMM0,(%RAX,%RDI,8) |
(4316) 0x4ddb89 LEA 0x1(%RSI),%RAX |
(4316) 0x4ddb8d CMP %R15,%RSI |
(4316) 0x4ddb90 MOV %RAX,%RSI |
(4316) 0x4ddb93 JE 4de59c |
(4316) 0x4ddb99 LEA (%R12,%RSI,1),%RDI |
(4316) 0x4ddb9d MOV (%RBX,%RDI,8),%R10 |
(4316) 0x4ddba1 MOV 0x8(%RBX,%RDI,8),%R8 |
(4316) 0x4ddba6 VXORPD %XMM0,%XMM0,%XMM0 |
(4316) 0x4ddbaa MOV %R8,%R11 |
(4316) 0x4ddbad SUB %R10,%R11 |
(4316) 0x4ddbb0 JLE 4ddb80 |
(4316) 0x4ddbb2 MOV %R11,%R9 |
(4316) 0x4ddbb5 AND $-0x4,%R9 |
(4316) 0x4ddbb9 JE 4ddc2e |
(4316) 0x4ddbbb MOV %R15,%RBX |
(4316) 0x4ddbbe LEA -0x1(%R9),%R15 |
(4316) 0x4ddbc2 LEA (%R14,%R10,8),%R13 |
(4316) 0x4ddbc6 LEA (%RDX,%R10,8),%RAX |
(4316) 0x4ddbca VXORPD %XMM0,%XMM0,%XMM0 |
(4316) 0x4ddbce XOR %R12D,%R12D |
(4316) 0x4ddbd1 NOPW %CS:(%RAX,%RAX,1) |
(4318) 0x4ddbe0 VMOVUPD (%RAX,%R12,8),%YMM1 |
(4318) 0x4ddbe6 KXNORW %K0,%K0,%K1 |
(4318) 0x4ddbea VXORPD %XMM2,%XMM2,%XMM2 |
(4318) 0x4ddbee VGATHERQPD (%RCX,%YMM1,8),%YMM2{%K1} |
(4318) 0x4ddbf5 VFNMADD231PD (%R13,%R12,8),%YMM2,%YMM0 |
(4318) 0x4ddbfc ADD $0x4,%R12 |
(4318) 0x4ddc00 CMP %R15,%R12 |
(4318) 0x4ddc03 JBE 4ddbe0 |
(4316) 0x4ddc05 VEXTRACTF128 $0x1,%YMM0,%XMM1 |
(4316) 0x4ddc0b VADDPD %XMM1,%XMM0,%XMM0 |
(4316) 0x4ddc0f VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(4316) 0x4ddc14 VADDSD %XMM1,%XMM0,%XMM0 |
(4316) 0x4ddc18 CMP %R9,%R11 |
(4316) 0x4ddc1b MOV -0x38(%RBP),%R12 |
(4316) 0x4ddc1f MOV %RBX,%R15 |
(4316) 0x4ddc22 MOV -0x30(%RBP),%RBX |
(4316) 0x4ddc26 JE 4ddb80 |
(4316) 0x4ddc2c JMP 4ddc31 |
(4316) 0x4ddc2e XOR %R9D,%R9D |
(4316) 0x4ddc31 ADD %R10,%R9 |
(4316) 0x4ddc34 NOPW %CS:(%RAX,%RAX,1) |
(4317) 0x4ddc40 MOV (%RDX,%R9,8),%RAX |
(4317) 0x4ddc44 VMOVSD (%RCX,%RAX,8),%XMM1 |
(4317) 0x4ddc49 VFNMADD231SD (%R14,%R9,8),%XMM1,%XMM0 |
(4317) 0x4ddc4f INC %R9 |
(4317) 0x4ddc52 CMP %R9,%R8 |
(4317) 0x4ddc55 JNE 4ddc40 |
(4316) 0x4ddc57 JMP 4ddb80 |
0x4ddc5c VUCOMISD 0x2080c(%RIP),%XMM5 |
0x4ddc64 JNE 4ddf8c |
0x4ddc6a VUCOMISD 0x207fe(%RIP),%XMM0 |
0x4ddc72 MOV 0x28(%RBP),%R15 |
0x4ddc76 JNE 4de09c |
0x4ddc7c CMP %RSI,%R12 |
0x4ddc7f JGE 4de59c |
0x4ddc85 MOV %R12,%RAX |
0x4ddc88 NOT %RAX |
0x4ddc8b ADD %RAX,%RSI |
0x4ddc8e XOR %EDI,%EDI |
0x4ddc90 MOV %RSI,-0x30(%RBP) |
0x4ddc94 JMP 4ddcba |
0x4ddc96 NOPW %CS:(%RAX,%RAX,1) |
(4301) 0x4ddca0 MOV 0x30(%RBP),%RAX |
(4301) 0x4ddca4 VMOVSD %XMM0,(%RAX,%R8,8) |
(4301) 0x4ddcaa LEA 0x1(%RDI),%RAX |
(4301) 0x4ddcae CMP %RSI,%RDI |
(4301) 0x4ddcb1 MOV %RAX,%RDI |
(4301) 0x4ddcb4 JE 4de59c |
(4301) 0x4ddcba LEA (%R12,%RDI,1),%R8 |
(4301) 0x4ddcbe VMOVSD (%R15,%R8,8),%XMM0 |
(4301) 0x4ddcc4 MOV (%RBX,%R8,8),%R11 |
(4301) 0x4ddcc8 MOV 0x8(%RBX,%R8,8),%R9 |
(4301) 0x4ddccd MOV %R9,%R13 |
(4301) 0x4ddcd0 SUB %R11,%R13 |
(4301) 0x4ddcd3 JLE 4ddca0 |
(4301) 0x4ddcd5 MOV %R13,%R10 |
(4301) 0x4ddcd8 AND $-0x4,%R10 |
(4301) 0x4ddcdc JE 4ddd52 |
(4301) 0x4ddcde LEA -0x1(%R10),%R15 |
(4301) 0x4ddce2 LEA (%R14,%R11,8),%RSI |
(4301) 0x4ddce6 LEA (%RDX,%R11,8),%RAX |
(4301) 0x4ddcea VXORPD %XMM1,%XMM1,%XMM1 |
(4301) 0x4ddcee XOR %R12D,%R12D |
(4301) 0x4ddcf1 NOPW %CS:(%RAX,%RAX,1) |
(4303) 0x4ddd00 VMOVUPD (%RAX,%R12,8),%YMM2 |
(4303) 0x4ddd06 KXNORW %K0,%K0,%K1 |
(4303) 0x4ddd0a VXORPD %XMM3,%XMM3,%XMM3 |
(4303) 0x4ddd0e VGATHERQPD (%RCX,%YMM2,8),%YMM3{%K1} |
(4303) 0x4ddd15 VFMADD231PD (%RSI,%R12,8),%YMM3,%YMM1 |
(4303) 0x4ddd1b ADD $0x4,%R12 |
(4303) 0x4ddd1f CMP %R15,%R12 |
(4303) 0x4ddd22 JBE 4ddd00 |
(4301) 0x4ddd24 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(4301) 0x4ddd2a VADDPD %XMM2,%XMM1,%XMM1 |
(4301) 0x4ddd2e VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(4301) 0x4ddd33 VADDSD %XMM2,%XMM1,%XMM1 |
(4301) 0x4ddd37 VADDSD %XMM1,%XMM0,%XMM0 |
(4301) 0x4ddd3b CMP %R10,%R13 |
(4301) 0x4ddd3e MOV -0x38(%RBP),%R12 |
(4301) 0x4ddd42 MOV -0x30(%RBP),%RSI |
(4301) 0x4ddd46 MOV 0x28(%RBP),%R15 |
(4301) 0x4ddd4a JE 4ddca0 |
(4301) 0x4ddd50 JMP 4ddd55 |
(4301) 0x4ddd52 XOR %R10D,%R10D |
(4301) 0x4ddd55 ADD %R11,%R10 |
(4301) 0x4ddd58 NOPL (%RAX,%RAX,1) |
(4302) 0x4ddd60 MOV (%RDX,%R10,8),%RAX |
(4302) 0x4ddd64 VMOVSD (%RCX,%RAX,8),%XMM1 |
(4302) 0x4ddd69 VFMADD231SD (%R14,%R10,8),%XMM1,%XMM0 |
(4302) 0x4ddd6f INC %R10 |
(4302) 0x4ddd72 CMP %R10,%R9 |
(4302) 0x4ddd75 JNE 4ddd60 |
(4301) 0x4ddd77 JMP 4ddca0 |
0x4ddd7c VUCOMISD 0x215ac(%RIP),%XMM0 |
0x4ddd84 MOV 0x28(%RBP),%R15 |
0x4ddd88 JNE 4de1ac |
0x4ddd8e CMP %RSI,%R12 |
0x4ddd91 JGE 4de59c |
0x4ddd97 MOV %R12,%RAX |
0x4ddd9a NOT %RAX |
0x4ddd9d ADD %RAX,%RSI |
0x4ddda0 XOR %EDI,%EDI |
0x4ddda2 MOV %RSI,-0x30(%RBP) |
0x4ddda6 JMP 4dddca |
0x4ddda8 NOPL (%RAX,%RAX,1) |
(4307) 0x4dddb0 MOV 0x30(%RBP),%RAX |
(4307) 0x4dddb4 VMOVSD %XMM0,(%RAX,%R8,8) |
(4307) 0x4dddba LEA 0x1(%RDI),%RAX |
(4307) 0x4dddbe CMP %RSI,%RDI |
(4307) 0x4dddc1 MOV %RAX,%RDI |
(4307) 0x4dddc4 JE 4de59c |
(4307) 0x4dddca LEA (%R12,%RDI,1),%R8 |
(4307) 0x4dddce VMOVSD (%R15,%R8,8),%XMM0 |
(4307) 0x4dddd4 MOV (%RBX,%R8,8),%R11 |
(4307) 0x4dddd8 MOV 0x8(%RBX,%R8,8),%R9 |
(4307) 0x4ddddd MOV %R9,%R13 |
(4307) 0x4ddde0 SUB %R11,%R13 |
(4307) 0x4ddde3 JLE 4dddb0 |
(4307) 0x4ddde5 MOV %R13,%R10 |
(4307) 0x4ddde8 AND $-0x4,%R10 |
(4307) 0x4dddec JE 4dde62 |
(4307) 0x4dddee LEA -0x1(%R10),%R15 |
(4307) 0x4dddf2 LEA (%R14,%R11,8),%RSI |
(4307) 0x4dddf6 LEA (%RDX,%R11,8),%RAX |
(4307) 0x4dddfa VXORPD %XMM1,%XMM1,%XMM1 |
(4307) 0x4dddfe XOR %R12D,%R12D |
(4307) 0x4dde01 NOPW %CS:(%RAX,%RAX,1) |
(4309) 0x4dde10 VMOVUPD (%RAX,%R12,8),%YMM2 |
(4309) 0x4dde16 KXNORW %K0,%K0,%K1 |
(4309) 0x4dde1a VXORPD %XMM3,%XMM3,%XMM3 |
(4309) 0x4dde1e VGATHERQPD (%RCX,%YMM2,8),%YMM3{%K1} |
(4309) 0x4dde25 VFNMADD231PD (%RSI,%R12,8),%YMM3,%YMM1 |
(4309) 0x4dde2b ADD $0x4,%R12 |
(4309) 0x4dde2f CMP %R15,%R12 |
(4309) 0x4dde32 JBE 4dde10 |
(4307) 0x4dde34 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(4307) 0x4dde3a VADDPD %XMM2,%XMM1,%XMM1 |
(4307) 0x4dde3e VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(4307) 0x4dde43 VADDSD %XMM2,%XMM1,%XMM1 |
(4307) 0x4dde47 VADDSD %XMM1,%XMM0,%XMM0 |
(4307) 0x4dde4b CMP %R10,%R13 |
(4307) 0x4dde4e MOV -0x38(%RBP),%R12 |
(4307) 0x4dde52 MOV -0x30(%RBP),%RSI |
(4307) 0x4dde56 MOV 0x28(%RBP),%R15 |
(4307) 0x4dde5a JE 4dddb0 |
(4307) 0x4dde60 JMP 4dde65 |
(4307) 0x4dde62 XOR %R10D,%R10D |
(4307) 0x4dde65 ADD %R11,%R10 |
(4307) 0x4dde68 NOPL (%RAX,%RAX,1) |
(4308) 0x4dde70 MOV (%RDX,%R10,8),%RAX |
(4308) 0x4dde74 VMOVSD (%RCX,%RAX,8),%XMM1 |
(4308) 0x4dde79 VFNMADD231SD (%R14,%R10,8),%XMM1,%XMM0 |
(4308) 0x4dde7f INC %R10 |
(4308) 0x4dde82 CMP %R10,%R9 |
(4308) 0x4dde85 JNE 4dde70 |
(4307) 0x4dde87 JMP 4dddb0 |
0x4dde8c CMP %R15,%R12 |
0x4dde8f JGE 4de59c |
0x4dde95 MOV %R12,%RAX |
0x4dde98 NOT %RAX |
0x4dde9b ADD %RAX,%R15 |
0x4dde9e XOR %ESI,%ESI |
0x4ddea0 JMP 4ddecd |
0x4ddea2 NOPW %CS:(%RAX,%RAX,1) |
(4313) 0x4ddeb0 VMULSD %XMM0,%XMM1,%XMM1 |
(4313) 0x4ddeb4 MOV 0x30(%RBP),%RAX |
(4313) 0x4ddeb8 VMOVSD %XMM1,(%RAX,%RDI,8) |
(4313) 0x4ddebd LEA 0x1(%RSI),%RAX |
(4313) 0x4ddec1 CMP %R15,%RSI |
(4313) 0x4ddec4 MOV %RAX,%RSI |
(4313) 0x4ddec7 JE 4de59c |
(4313) 0x4ddecd LEA (%R12,%RSI,1),%RDI |
(4313) 0x4dded1 MOV (%RBX,%RDI,8),%R10 |
(4313) 0x4dded5 MOV 0x8(%RBX,%RDI,8),%R8 |
(4313) 0x4ddeda VXORPD %XMM1,%XMM1,%XMM1 |
(4313) 0x4ddede MOV %R8,%R11 |
(4313) 0x4ddee1 SUB %R10,%R11 |
(4313) 0x4ddee4 JLE 4ddeb0 |
(4313) 0x4ddee6 MOV %R11,%R9 |
(4313) 0x4ddee9 AND $-0x4,%R9 |
(4313) 0x4ddeed JE 4ddf5e |
(4313) 0x4ddeef MOV %R15,%RBX |
(4313) 0x4ddef2 LEA -0x1(%R9),%R15 |
(4313) 0x4ddef6 LEA (%R14,%R10,8),%R13 |
(4313) 0x4ddefa LEA (%RDX,%R10,8),%RAX |
(4313) 0x4ddefe VXORPD %XMM1,%XMM1,%XMM1 |
(4313) 0x4ddf02 XOR %R12D,%R12D |
(4313) 0x4ddf05 NOPW %CS:(%RAX,%RAX,1) |
(4315) 0x4ddf10 VMOVUPD (%RAX,%R12,8),%YMM2 |
(4315) 0x4ddf16 VXORPD %XMM3,%XMM3,%XMM3 |
(4315) 0x4ddf1a KXNORW %K0,%K0,%K1 |
(4315) 0x4ddf1e VGATHERQPD (%RCX,%YMM2,8),%YMM3{%K1} |
(4315) 0x4ddf25 VFMADD231PD (%R13,%R12,8),%YMM3,%YMM1 |
(4315) 0x4ddf2c ADD $0x4,%R12 |
(4315) 0x4ddf30 CMP %R15,%R12 |
(4315) 0x4ddf33 JBE 4ddf10 |
(4313) 0x4ddf35 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(4313) 0x4ddf3b VADDPD %XMM2,%XMM1,%XMM1 |
(4313) 0x4ddf3f VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(4313) 0x4ddf44 VADDSD %XMM2,%XMM1,%XMM1 |
(4313) 0x4ddf48 CMP %R9,%R11 |
(4313) 0x4ddf4b MOV -0x38(%RBP),%R12 |
(4313) 0x4ddf4f MOV %RBX,%R15 |
(4313) 0x4ddf52 MOV -0x30(%RBP),%RBX |
(4313) 0x4ddf56 JE 4ddeb0 |
(4313) 0x4ddf5c JMP 4ddf61 |
(4313) 0x4ddf5e XOR %R9D,%R9D |
(4313) 0x4ddf61 ADD %R10,%R9 |
(4313) 0x4ddf64 NOPW %CS:(%RAX,%RAX,1) |
(4314) 0x4ddf70 MOV (%RDX,%R9,8),%RAX |
(4314) 0x4ddf74 VMOVSD (%RCX,%RAX,8),%XMM2 |
(4314) 0x4ddf79 VFMADD231SD (%R14,%R9,8),%XMM2,%XMM1 |
(4314) 0x4ddf7f INC %R9 |
(4314) 0x4ddf82 CMP %R9,%R8 |
(4314) 0x4ddf85 JNE 4ddf70 |
(4313) 0x4ddf87 JMP 4ddeb0 |
0x4ddf8c VUCOMISD 0x204dc(%RIP),%XMM0 |
0x4ddf94 MOV 0x28(%RBP),%R15 |
0x4ddf98 JNE 4de2ac |
0x4ddf9e CMP %RSI,%R12 |
0x4ddfa1 JGE 4de59c |
0x4ddfa7 MOV %R12,%RAX |
0x4ddfaa NOT %RAX |
0x4ddfad ADD %RAX,%RSI |
0x4ddfb0 XOR %EDI,%EDI |
0x4ddfb2 MOV %RSI,-0x30(%RBP) |
0x4ddfb6 JMP 4ddfda |
0x4ddfb8 NOPL (%RAX,%RAX,1) |
(4292) 0x4ddfc0 MOV 0x30(%RBP),%RAX |
(4292) 0x4ddfc4 VMOVSD %XMM0,(%RAX,%R8,8) |
(4292) 0x4ddfca LEA 0x1(%RDI),%RAX |
(4292) 0x4ddfce CMP %RSI,%RDI |
(4292) 0x4ddfd1 MOV %RAX,%RDI |
(4292) 0x4ddfd4 JE 4de59c |
(4292) 0x4ddfda LEA (%R12,%RDI,1),%R8 |
(4292) 0x4ddfde VMULSD (%R15,%R8,8),%XMM5,%XMM0 |
(4292) 0x4ddfe4 MOV (%RBX,%R8,8),%R11 |
(4292) 0x4ddfe8 MOV 0x8(%RBX,%R8,8),%R9 |
(4292) 0x4ddfed MOV %R9,%R13 |
(4292) 0x4ddff0 SUB %R11,%R13 |
(4292) 0x4ddff3 JLE 4ddfc0 |
(4292) 0x4ddff5 MOV %R13,%R10 |
(4292) 0x4ddff8 AND $-0x4,%R10 |
(4292) 0x4ddffc JE 4de072 |
(4292) 0x4ddffe LEA -0x1(%R10),%R15 |
(4292) 0x4de002 LEA (%R14,%R11,8),%RSI |
(4292) 0x4de006 LEA (%RDX,%R11,8),%RAX |
(4292) 0x4de00a VXORPD %XMM1,%XMM1,%XMM1 |
(4292) 0x4de00e XOR %R12D,%R12D |
(4292) 0x4de011 NOPW %CS:(%RAX,%RAX,1) |
(4294) 0x4de020 VMOVUPD (%RAX,%R12,8),%YMM2 |
(4294) 0x4de026 VXORPD %XMM3,%XMM3,%XMM3 |
(4294) 0x4de02a KXNORW %K0,%K0,%K1 |
(4294) 0x4de02e VGATHERQPD (%RCX,%YMM2,8),%YMM3{%K1} |
(4294) 0x4de035 VFMADD231PD (%RSI,%R12,8),%YMM3,%YMM1 |
(4294) 0x4de03b ADD $0x4,%R12 |
(4294) 0x4de03f CMP %R15,%R12 |
(4294) 0x4de042 JBE 4de020 |
(4292) 0x4de044 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(4292) 0x4de04a VADDPD %XMM2,%XMM1,%XMM1 |
(4292) 0x4de04e VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(4292) 0x4de053 VADDSD %XMM2,%XMM1,%XMM1 |
(4292) 0x4de057 VADDSD %XMM1,%XMM0,%XMM0 |
(4292) 0x4de05b CMP %R10,%R13 |
(4292) 0x4de05e MOV -0x38(%RBP),%R12 |
(4292) 0x4de062 MOV -0x30(%RBP),%RSI |
(4292) 0x4de066 MOV 0x28(%RBP),%R15 |
(4292) 0x4de06a JE 4ddfc0 |
(4292) 0x4de070 JMP 4de075 |
(4292) 0x4de072 XOR %R10D,%R10D |
(4292) 0x4de075 ADD %R11,%R10 |
(4292) 0x4de078 NOPL (%RAX,%RAX,1) |
(4293) 0x4de080 MOV (%RDX,%R10,8),%RAX |
(4293) 0x4de084 VMOVSD (%RCX,%RAX,8),%XMM1 |
(4293) 0x4de089 VFMADD231SD (%R14,%R10,8),%XMM1,%XMM0 |
(4293) 0x4de08f INC %R10 |
(4293) 0x4de092 CMP %R10,%R9 |
(4293) 0x4de095 JNE 4de080 |
(4292) 0x4de097 JMP 4ddfc0 |
0x4de09c VUCOMISD 0x2128c(%RIP),%XMM0 |
0x4de0a4 JNE 4de3bc |
0x4de0aa CMP %RSI,%R12 |
0x4de0ad JGE 4de59c |
0x4de0b3 MOV %R12,%RAX |
0x4de0b6 NOT %RAX |
0x4de0b9 ADD %RAX,%RSI |
0x4de0bc XOR %EDI,%EDI |
0x4de0be VMOVDDUP 0x2101a(%RIP),%XMM0 |
0x4de0c6 MOV %RSI,-0x30(%RBP) |
0x4de0ca JMP 4de0ea |
0x4de0cc NOPL (%RAX) |
(4298) 0x4de0d0 MOV 0x30(%RBP),%RAX |
(4298) 0x4de0d4 VMOVSD %XMM1,(%RAX,%R8,8) |
(4298) 0x4de0da LEA 0x1(%RDI),%RAX |
(4298) 0x4de0de CMP %RSI,%RDI |
(4298) 0x4de0e1 MOV %RAX,%RDI |
(4298) 0x4de0e4 JE 4de59c |
(4298) 0x4de0ea LEA (%R12,%RDI,1),%R8 |
(4298) 0x4de0ee VMOVSD (%R15,%R8,8),%XMM1 |
(4298) 0x4de0f4 VXORPD %XMM0,%XMM1,%XMM1 |
(4298) 0x4de0f8 MOV (%RBX,%R8,8),%R11 |
(4298) 0x4de0fc MOV 0x8(%RBX,%R8,8),%R9 |
(4298) 0x4de101 MOV %R9,%R13 |
(4298) 0x4de104 SUB %R11,%R13 |
(4298) 0x4de107 JLE 4de0d0 |
(4298) 0x4de109 MOV %R13,%R10 |
(4298) 0x4de10c AND $-0x4,%R10 |
(4298) 0x4de110 JE 4de182 |
(4298) 0x4de112 LEA -0x1(%R10),%R15 |
(4298) 0x4de116 LEA (%R14,%R11,8),%RSI |
(4298) 0x4de11a LEA (%RDX,%R11,8),%RAX |
(4298) 0x4de11e VXORPD %XMM2,%XMM2,%XMM2 |
(4298) 0x4de122 XOR %R12D,%R12D |
(4298) 0x4de125 NOPW %CS:(%RAX,%RAX,1) |
(4300) 0x4de130 VMOVUPD (%RAX,%R12,8),%YMM3 |
(4300) 0x4de136 KXNORW %K0,%K0,%K1 |
(4300) 0x4de13a VXORPD %XMM4,%XMM4,%XMM4 |
(4300) 0x4de13e VGATHERQPD (%RCX,%YMM3,8),%YMM4{%K1} |
(4300) 0x4de145 VFNMADD231PD (%RSI,%R12,8),%YMM4,%YMM2 |
(4300) 0x4de14b ADD $0x4,%R12 |
(4300) 0x4de14f CMP %R15,%R12 |
(4300) 0x4de152 JBE 4de130 |
(4298) 0x4de154 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(4298) 0x4de15a VADDPD %XMM3,%XMM2,%XMM2 |
(4298) 0x4de15e VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(4298) 0x4de163 VADDSD %XMM3,%XMM2,%XMM2 |
(4298) 0x4de167 VADDSD %XMM2,%XMM1,%XMM1 |
(4298) 0x4de16b CMP %R10,%R13 |
(4298) 0x4de16e MOV -0x38(%RBP),%R12 |
(4298) 0x4de172 MOV -0x30(%RBP),%RSI |
(4298) 0x4de176 MOV 0x28(%RBP),%R15 |
(4298) 0x4de17a JE 4de0d0 |
(4298) 0x4de180 JMP 4de185 |
(4298) 0x4de182 XOR %R10D,%R10D |
(4298) 0x4de185 ADD %R11,%R10 |
(4298) 0x4de188 NOPL (%RAX,%RAX,1) |
(4299) 0x4de190 MOV (%RDX,%R10,8),%RAX |
(4299) 0x4de194 VMOVSD (%RCX,%RAX,8),%XMM2 |
(4299) 0x4de199 VFNMADD231SD (%R14,%R10,8),%XMM2,%XMM1 |
(4299) 0x4de19f INC %R10 |
(4299) 0x4de1a2 CMP %R10,%R9 |
(4299) 0x4de1a5 JNE 4de190 |
(4298) 0x4de1a7 JMP 4de0d0 |
0x4de1ac CMP %RSI,%R12 |
0x4de1af JGE 4de59c |
0x4de1b5 MOV %R12,%RAX |
0x4de1b8 NOT %RAX |
0x4de1bb ADD %RAX,%RSI |
0x4de1be XOR %EDI,%EDI |
0x4de1c0 VMOVDDUP 0x20f18(%RIP),%XMM1 |
0x4de1c8 MOV %RSI,-0x30(%RBP) |
0x4de1cc JMP 4de1ee |
0x4de1ce XCHG %AX,%AX |
(4304) 0x4de1d0 VMULSD %XMM0,%XMM2,%XMM2 |
(4304) 0x4de1d4 MOV 0x30(%RBP),%RAX |
(4304) 0x4de1d8 VMOVSD %XMM2,(%RAX,%R8,8) |
(4304) 0x4de1de LEA 0x1(%RDI),%RAX |
(4304) 0x4de1e2 CMP %RSI,%RDI |
(4304) 0x4de1e5 MOV %RAX,%RDI |
(4304) 0x4de1e8 JE 4de59c |
(4304) 0x4de1ee LEA (%R12,%RDI,1),%R8 |
(4304) 0x4de1f2 VMOVSD (%R15,%R8,8),%XMM2 |
(4304) 0x4de1f8 VXORPD %XMM1,%XMM2,%XMM2 |
(4304) 0x4de1fc MOV (%RBX,%R8,8),%R11 |
(4304) 0x4de200 MOV 0x8(%RBX,%R8,8),%R9 |
(4304) 0x4de205 MOV %R9,%R13 |
(4304) 0x4de208 SUB %R11,%R13 |
(4304) 0x4de20b JLE 4de1d0 |
(4304) 0x4de20d MOV %R13,%R10 |
(4304) 0x4de210 AND $-0x4,%R10 |
(4304) 0x4de214 JE 4de282 |
(4304) 0x4de216 LEA -0x1(%R10),%R15 |
(4304) 0x4de21a LEA (%R14,%R11,8),%RSI |
(4304) 0x4de21e LEA (%RDX,%R11,8),%RAX |
(4304) 0x4de222 VXORPD %XMM3,%XMM3,%XMM3 |
(4304) 0x4de226 XOR %R12D,%R12D |
(4304) 0x4de229 NOPL (%RAX) |
(4306) 0x4de230 VMOVUPD (%RAX,%R12,8),%YMM4 |
(4306) 0x4de236 KXNORW %K0,%K0,%K1 |
(4306) 0x4de23a VXORPD %XMM5,%XMM5,%XMM5 |
(4306) 0x4de23e VGATHERQPD (%RCX,%YMM4,8),%YMM5{%K1} |
(4306) 0x4de245 VFMADD231PD (%RSI,%R12,8),%YMM5,%YMM3 |
(4306) 0x4de24b ADD $0x4,%R12 |
(4306) 0x4de24f CMP %R15,%R12 |
(4306) 0x4de252 JBE 4de230 |
(4304) 0x4de254 VEXTRACTF128 $0x1,%YMM3,%XMM4 |
(4304) 0x4de25a VADDPD %XMM4,%XMM3,%XMM3 |
(4304) 0x4de25e VSHUFPD $0x1,%XMM3,%XMM3,%XMM4 |
(4304) 0x4de263 VADDSD %XMM4,%XMM3,%XMM3 |
(4304) 0x4de267 VADDSD %XMM3,%XMM2,%XMM2 |
(4304) 0x4de26b CMP %R10,%R13 |
(4304) 0x4de26e MOV -0x38(%RBP),%R12 |
(4304) 0x4de272 MOV -0x30(%RBP),%RSI |
(4304) 0x4de276 MOV 0x28(%RBP),%R15 |
(4304) 0x4de27a JE 4de1d0 |
(4304) 0x4de280 JMP 4de285 |
(4304) 0x4de282 XOR %R10D,%R10D |
(4304) 0x4de285 ADD %R11,%R10 |
(4304) 0x4de288 NOPL (%RAX,%RAX,1) |
(4305) 0x4de290 MOV (%RDX,%R10,8),%RAX |
(4305) 0x4de294 VMOVSD (%RCX,%RAX,8),%XMM3 |
(4305) 0x4de299 VFMADD231SD (%R14,%R10,8),%XMM3,%XMM2 |
(4305) 0x4de29f INC %R10 |
(4305) 0x4de2a2 CMP %R10,%R9 |
(4305) 0x4de2a5 JNE 4de290 |
(4304) 0x4de2a7 JMP 4de1d0 |
0x4de2ac VUCOMISD 0x2107c(%RIP),%XMM0 |
0x4de2b4 JNE 4de4ac |
0x4de2ba CMP %RSI,%R12 |
0x4de2bd JGE 4de59c |
0x4de2c3 VXORPD 0x20e13(%RIP){1to2},%XMM5,%XMM0 |
0x4de2cd MOV %R12,%RAX |
0x4de2d0 NOT %RAX |
0x4de2d3 ADD %RAX,%RSI |
0x4de2d6 XOR %EDI,%EDI |
0x4de2d8 JMP 4de2f4 |
(4289) 0x4de2da MOV 0x30(%RBP),%RAX |
(4289) 0x4de2de VMOVSD %XMM1,(%RAX,%R8,8) |
(4289) 0x4de2e4 LEA 0x1(%RDI),%RAX |
(4289) 0x4de2e8 CMP %RSI,%RDI |
(4289) 0x4de2eb MOV %RAX,%RDI |
(4289) 0x4de2ee JE 4de59c |
(4289) 0x4de2f4 LEA (%R12,%RDI,1),%R8 |
(4289) 0x4de2f8 VMULSD (%R15,%R8,8),%XMM0,%XMM1 |
(4289) 0x4de2fe MOV (%RBX,%R8,8),%RAX |
(4289) 0x4de302 MOV 0x8(%RBX,%R8,8),%R9 |
(4289) 0x4de307 MOV %R9,%R13 |
(4289) 0x4de30a SUB %RAX,%R13 |
(4289) 0x4de30d JLE 4de2da |
(4289) 0x4de30f MOV %R13,%R10 |
(4289) 0x4de312 AND $-0x4,%R10 |
(4289) 0x4de316 JE 4de395 |
(4289) 0x4de318 MOV %RSI,%RBX |
(4289) 0x4de31b LEA -0x1(%R10),%R15 |
(4289) 0x4de31f LEA (%R14,%RAX,8),%RSI |
(4289) 0x4de323 MOV %RAX,-0x38(%RBP) |
(4289) 0x4de327 LEA (%RDX,%RAX,8),%RAX |
(4289) 0x4de32b VXORPD %XMM2,%XMM2,%XMM2 |
(4289) 0x4de32f XOR %R11D,%R11D |
(4289) 0x4de332 NOPW %CS:(%RAX,%RAX,1) |
(4291) 0x4de340 VMOVUPD (%RAX,%R11,8),%YMM3 |
(4291) 0x4de346 KXNORW %K0,%K0,%K1 |
(4291) 0x4de34a VXORPD %XMM4,%XMM4,%XMM4 |
(4291) 0x4de34e VGATHERQPD (%RCX,%YMM3,8),%YMM4{%K1} |
(4291) 0x4de355 VFNMADD231PD (%RSI,%R11,8),%YMM4,%YMM2 |
(4291) 0x4de35b ADD $0x4,%R11 |
(4291) 0x4de35f CMP %R15,%R11 |
(4291) 0x4de362 JBE 4de340 |
(4289) 0x4de364 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(4289) 0x4de36a VADDPD %XMM3,%XMM2,%XMM2 |
(4289) 0x4de36e VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(4289) 0x4de373 VADDSD %XMM3,%XMM2,%XMM2 |
(4289) 0x4de377 VADDSD %XMM2,%XMM1,%XMM1 |
(4289) 0x4de37b CMP %R10,%R13 |
(4289) 0x4de37e MOV %RBX,%RSI |
(4289) 0x4de381 MOV -0x30(%RBP),%RBX |
(4289) 0x4de385 MOV 0x28(%RBP),%R15 |
(4289) 0x4de389 MOV -0x38(%RBP),%RAX |
(4289) 0x4de38d JE 4de2da |
(4289) 0x4de393 JMP 4de398 |
(4289) 0x4de395 XOR %R10D,%R10D |
(4289) 0x4de398 ADD %RAX,%R10 |
(4289) 0x4de39b NOPL (%RAX,%RAX,1) |
(4290) 0x4de3a0 MOV (%RDX,%R10,8),%RAX |
(4290) 0x4de3a4 VMOVSD (%RCX,%RAX,8),%XMM2 |
(4290) 0x4de3a9 VFNMADD231SD (%R14,%R10,8),%XMM2,%XMM1 |
(4290) 0x4de3af INC %R10 |
(4290) 0x4de3b2 CMP %R10,%R9 |
(4290) 0x4de3b5 JNE 4de3a0 |
(4289) 0x4de3b7 JMP 4de2da |
0x4de3bc CMP %RSI,%R12 |
0x4de3bf JGE 4de59c |
0x4de3c5 MOV %R12,%RAX |
0x4de3c8 NOT %RAX |
0x4de3cb ADD %RAX,%RSI |
0x4de3ce XOR %EDI,%EDI |
0x4de3d0 MOV %RSI,-0x30(%RBP) |
0x4de3d4 JMP 4de3f4 |
(4295) 0x4de3d6 VMULSD %XMM0,%XMM1,%XMM1 |
(4295) 0x4de3da MOV 0x30(%RBP),%RAX |
(4295) 0x4de3de VMOVSD %XMM1,(%RAX,%R8,8) |
(4295) 0x4de3e4 LEA 0x1(%RDI),%RAX |
(4295) 0x4de3e8 CMP %RSI,%RDI |
(4295) 0x4de3eb MOV %RAX,%RDI |
(4295) 0x4de3ee JE 4de59c |
(4295) 0x4de3f4 LEA (%R12,%RDI,1),%R8 |
(4295) 0x4de3f8 VMOVSD (%R15,%R8,8),%XMM1 |
(4295) 0x4de3fe MOV (%RBX,%R8,8),%R11 |
(4295) 0x4de402 MOV 0x8(%RBX,%R8,8),%R9 |
(4295) 0x4de407 MOV %R9,%R13 |
(4295) 0x4de40a SUB %R11,%R13 |
(4295) 0x4de40d JLE 4de3d6 |
(4295) 0x4de40f MOV %R13,%R10 |
(4295) 0x4de412 AND $-0x4,%R10 |
(4295) 0x4de416 JE 4de482 |
(4295) 0x4de418 LEA -0x1(%R10),%R15 |
(4295) 0x4de41c LEA (%R14,%R11,8),%RSI |
(4295) 0x4de420 LEA (%RDX,%R11,8),%RAX |
(4295) 0x4de424 VXORPD %XMM2,%XMM2,%XMM2 |
(4295) 0x4de428 XOR %R12D,%R12D |
(4295) 0x4de42b NOPL (%RAX,%RAX,1) |
(4297) 0x4de430 VMOVUPD (%RAX,%R12,8),%YMM3 |
(4297) 0x4de436 KXNORW %K0,%K0,%K1 |
(4297) 0x4de43a VXORPD %XMM4,%XMM4,%XMM4 |
(4297) 0x4de43e VGATHERQPD (%RCX,%YMM3,8),%YMM4{%K1} |
(4297) 0x4de445 VFMADD231PD (%RSI,%R12,8),%YMM4,%YMM2 |
(4297) 0x4de44b ADD $0x4,%R12 |
(4297) 0x4de44f CMP %R15,%R12 |
(4297) 0x4de452 JBE 4de430 |
(4295) 0x4de454 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(4295) 0x4de45a VADDPD %XMM3,%XMM2,%XMM2 |
(4295) 0x4de45e VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(4295) 0x4de463 VADDSD %XMM3,%XMM2,%XMM2 |
(4295) 0x4de467 VADDSD %XMM2,%XMM1,%XMM1 |
(4295) 0x4de46b CMP %R10,%R13 |
(4295) 0x4de46e MOV -0x38(%RBP),%R12 |
(4295) 0x4de472 MOV -0x30(%RBP),%RSI |
(4295) 0x4de476 MOV 0x28(%RBP),%R15 |
(4295) 0x4de47a JE 4de3d6 |
(4295) 0x4de480 JMP 4de485 |
(4295) 0x4de482 XOR %R10D,%R10D |
(4295) 0x4de485 ADD %R11,%R10 |
(4295) 0x4de488 NOPL (%RAX,%RAX,1) |
(4296) 0x4de490 MOV (%RDX,%R10,8),%RAX |
(4296) 0x4de494 VMOVSD (%RCX,%RAX,8),%XMM2 |
(4296) 0x4de499 VFMADD231SD (%R14,%R10,8),%XMM2,%XMM1 |
(4296) 0x4de49f INC %R10 |
(4296) 0x4de4a2 CMP %R10,%R9 |
(4296) 0x4de4a5 JNE 4de490 |
(4295) 0x4de4a7 JMP 4de3d6 |
0x4de4ac CMP %RSI,%R12 |
0x4de4af JGE 4de59c |
0x4de4b5 MOV %R12,%RAX |
0x4de4b8 NOT %RAX |
0x4de4bb ADD %RAX,%RSI |
0x4de4be XOR %EDI,%EDI |
0x4de4c0 JMP 4de4e0 |
(4286) 0x4de4c2 VMULSD %XMM0,%XMM1,%XMM1 |
(4286) 0x4de4c6 MOV 0x30(%RBP),%RAX |
(4286) 0x4de4ca VMOVSD %XMM1,(%RAX,%R8,8) |
(4286) 0x4de4d0 LEA 0x1(%RDI),%RAX |
(4286) 0x4de4d4 CMP %RSI,%RDI |
(4286) 0x4de4d7 MOV %RAX,%RDI |
(4286) 0x4de4da JE 4de59c |
(4286) 0x4de4e0 LEA (%R12,%RDI,1),%R8 |
(4286) 0x4de4e4 VMULSD (%R15,%R8,8),%XMM5,%XMM1 |
(4286) 0x4de4ea MOV (%RBX,%R8,8),%RAX |
(4286) 0x4de4ee MOV 0x8(%RBX,%R8,8),%R9 |
(4286) 0x4de4f3 MOV %R9,%R13 |
(4286) 0x4de4f6 SUB %RAX,%R13 |
(4286) 0x4de4f9 JLE 4de4c2 |
(4286) 0x4de4fb MOV %R13,%R10 |
(4286) 0x4de4fe AND $-0x4,%R10 |
(4286) 0x4de502 JE 4de575 |
(4286) 0x4de504 MOV %RSI,%RBX |
(4286) 0x4de507 LEA -0x1(%R10),%R15 |
(4286) 0x4de50b LEA (%R14,%RAX,8),%RSI |
(4286) 0x4de50f MOV %RAX,-0x38(%RBP) |
(4286) 0x4de513 LEA (%RDX,%RAX,8),%R11 |
(4286) 0x4de517 VXORPD %XMM2,%XMM2,%XMM2 |
(4286) 0x4de51b XOR %EAX,%EAX |
(4286) 0x4de51d NOPL (%RAX) |
(4288) 0x4de520 VMOVUPD (%R11,%RAX,8),%YMM3 |
(4288) 0x4de526 KXNORW %K0,%K0,%K1 |
(4288) 0x4de52a VXORPD %XMM4,%XMM4,%XMM4 |
(4288) 0x4de52e VGATHERQPD (%RCX,%YMM3,8),%YMM4{%K1} |
(4288) 0x4de535 VFMADD231PD (%RSI,%RAX,8),%YMM4,%YMM2 |
(4288) 0x4de53b ADD $0x4,%RAX |
(4288) 0x4de53f CMP %R15,%RAX |
(4288) 0x4de542 JBE 4de520 |
(4286) 0x4de544 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(4286) 0x4de54a VADDPD %XMM3,%XMM2,%XMM2 |
(4286) 0x4de54e VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(4286) 0x4de553 VADDSD %XMM3,%XMM2,%XMM2 |
(4286) 0x4de557 VADDSD %XMM2,%XMM1,%XMM1 |
(4286) 0x4de55b CMP %R10,%R13 |
(4286) 0x4de55e MOV %RBX,%RSI |
(4286) 0x4de561 MOV -0x30(%RBP),%RBX |
(4286) 0x4de565 MOV 0x28(%RBP),%R15 |
(4286) 0x4de569 MOV -0x38(%RBP),%RAX |
(4286) 0x4de56d JE 4de4c2 |
(4286) 0x4de573 JMP 4de578 |
(4286) 0x4de575 XOR %R10D,%R10D |
(4286) 0x4de578 ADD %RAX,%R10 |
(4286) 0x4de57b NOPL (%RAX,%RAX,1) |
(4287) 0x4de580 MOV (%RDX,%R10,8),%RAX |
(4287) 0x4de584 VMOVSD (%RCX,%RAX,8),%XMM2 |
(4287) 0x4de589 VFMADD231SD (%R14,%R10,8),%XMM2,%XMM1 |
(4287) 0x4de58f INC %R10 |
(4287) 0x4de592 CMP %R10,%R9 |
(4287) 0x4de595 JNE 4de580 |
(4286) 0x4de597 JMP 4de4c2 |
0x4de59c ADD $0x18,%RSP |
0x4de5a0 POP %RBX |
0x4de5a1 POP %R12 |
0x4de5a3 POP %R13 |
0x4de5a5 POP %R14 |
0x4de5a7 POP %R15 |
0x4de5a9 POP %RBP |
0x4de5aa VZEROUPPER |
0x4de5ad RET |
0x4de5ae XCHG %AX,%AX |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►100.00+ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Path / |
Source file and lines | csr_matvec.c:243-404 |
Module | exec |
nb instructions | 206 |
nb uops | 225 |
loop length | 818 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 7 |
micro-operation queue | 37.50 cycles |
front end | 37.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 20.00 | 19.07 | 11.33 | 11.33 | 11.50 | 18.93 | 20.00 | 11.50 | 11.50 | 11.50 | 19.00 | 11.33 |
cycles | 20.00 | 19.07 | 11.33 | 11.33 | 11.50 | 18.93 | 20.00 | 11.50 | 11.50 | 11.50 | 19.00 | 11.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 36.11 |
Stall cycles | 0.00 |
Front-end | 37.50 |
Dispatch | 20.00 |
Overall L1 | 37.50 |
all | 1% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 1% |
all | 10% |
load | 5% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
all | 2% |
load | 3% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 4% |
all | 10% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 9% |
all | 13% |
load | 13% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 10% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x18,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R8,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4dc2d0 <hypre_CSRMatrixGetLoadBalancedPartitionBegin> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4dc350 <hypre_CSRMatrixGetLoadBalancedPartitionEnd> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RAX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4dd897 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x67> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x25a350(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x510905,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x51292b,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4e6c10 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x5132d1,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xf8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4e9300 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x18(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4dd8a5 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x75> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4dd8d3 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa3> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x25a314(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x510905,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x513358,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4e6c10 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x5132d1,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xf9,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4e9300 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R15,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4dd8e2 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb2> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R13,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4dd915 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xe5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x25a2d7(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x510905,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x51337a,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4e6c10 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x5132d1,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xfa,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4e9300 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD -0x38(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD %XMM1,%XMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R12,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JNE 4dda3c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x20c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x20b30(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4ddb5c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x32c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de59c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4dd979 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x149> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x218ec(%RIP),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R15,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JNE 4ddc5c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x42c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x20a1b(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4ddd7c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x54c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x28(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JGE 4de59c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x21665(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4dda9a <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x26a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x217cc(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4dde8c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x65c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de59c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4ddb99 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x369> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
VUCOMISD 0x2080c(%RIP),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4ddf8c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x75c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x207fe(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x28(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 4de09c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x86c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de59c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4ddcba <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x48a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x215ac(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x28(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 4de1ac <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x97c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de59c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4dddca <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x59a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de59c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4ddecd <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x69d> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x204dc(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x28(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 4de2ac <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa7c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de59c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4ddfda <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x7aa> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x2128c(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4de3bc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb8c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de59c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x2101a(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4de0ea <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x8ba> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de59c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x20f18(%RIP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4de1ee <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x9be> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x2107c(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4de4ac <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xc7c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de59c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VXORPD 0x20e13(%RIP){1to2},%XMM5,%XMM0 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4de2f4 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xac4> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de59c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4de3f4 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xbc4> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de59c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4de4e0 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xcb0> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD $0x18,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | csr_matvec.c:243-404 |
Module | exec |
nb instructions | 206 |
nb uops | 225 |
loop length | 818 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 7 |
micro-operation queue | 37.50 cycles |
front end | 37.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 20.00 | 19.07 | 11.33 | 11.33 | 11.50 | 18.93 | 20.00 | 11.50 | 11.50 | 11.50 | 19.00 | 11.33 |
cycles | 20.00 | 19.07 | 11.33 | 11.33 | 11.50 | 18.93 | 20.00 | 11.50 | 11.50 | 11.50 | 19.00 | 11.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 36.11 |
Stall cycles | 0.00 |
Front-end | 37.50 |
Dispatch | 20.00 |
Overall L1 | 37.50 |
all | 1% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 1% |
all | 10% |
load | 5% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
all | 2% |
load | 3% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 4% |
all | 10% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 9% |
all | 13% |
load | 13% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 10% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x18,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R8,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4dc2d0 <hypre_CSRMatrixGetLoadBalancedPartitionBegin> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4dc350 <hypre_CSRMatrixGetLoadBalancedPartitionEnd> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RAX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4dd897 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x67> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x25a350(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x510905,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x51292b,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4e6c10 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x5132d1,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xf8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4e9300 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x18(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4dd8a5 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x75> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4dd8d3 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa3> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x25a314(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x510905,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x513358,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4e6c10 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x5132d1,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xf9,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4e9300 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R15,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4dd8e2 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb2> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R13,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4dd915 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xe5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x25a2d7(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x510905,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x51337a,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4e6c10 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x5132d1,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xfa,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4e9300 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD -0x38(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD %XMM1,%XMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R12,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JNE 4dda3c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x20c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x20b30(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4ddb5c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x32c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de59c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4dd979 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x149> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x218ec(%RIP),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R15,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JNE 4ddc5c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x42c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x20a1b(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4ddd7c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x54c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x28(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JGE 4de59c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x21665(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4dda9a <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x26a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x217cc(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4dde8c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x65c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de59c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4ddb99 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x369> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
VUCOMISD 0x2080c(%RIP),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4ddf8c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x75c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x207fe(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x28(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 4de09c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x86c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de59c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4ddcba <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x48a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x215ac(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x28(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 4de1ac <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x97c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de59c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4dddca <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x59a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de59c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4ddecd <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x69d> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x204dc(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x28(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 4de2ac <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa7c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de59c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4ddfda <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x7aa> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x2128c(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4de3bc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb8c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de59c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x2101a(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4de0ea <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x8ba> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de59c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x20f18(%RIP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4de1ee <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x9be> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x2107c(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4de4ac <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xc7c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de59c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VXORPD 0x20e13(%RIP){1to2},%XMM5,%XMM0 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4de2f4 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xac4> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de59c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4de3f4 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xbc4> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de59c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4de4e0 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xcb0> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD $0x18,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_CSRMatrixMatvecOutOfPlace.extracted– | 16.95 | 3.38 |
▼Loop 4301 - csr_matvec.c:248-341 - exec– | 0.89 | 0.17 |
○Loop 4302 - csr_matvec.c:337-339 - exec | 0.44 | 0.08 |
○Loop 4303 - csr_matvec.c:337-339 - exec | 0.11 | 0.02 |
▼Loop 4307 - csr_matvec.c:248-314 - exec– | 0.31 | 0.06 |
○Loop 4309 - csr_matvec.c:310-312 - exec | 6.89 | 1.31 |
○Loop 4308 - csr_matvec.c:310-312 - exec | 0.96 | 0.18 |
▼Loop 4319 - csr_matvec.c:248-263 - exec– | 0.25 | 0.05 |
○Loop 4321 - csr_matvec.c:259-261 - exec | 6.26 | 1.19 |
○Loop 4320 - csr_matvec.c:259-261 - exec | 0.83 | 0.16 |
▼Loop 4316 - csr_matvec.c:248-275 - exec– | 0 | 0 |
○Loop 4318 - csr_matvec.c:271-273 - exec | 0 | 0 |
○Loop 4317 - csr_matvec.c:271-273 - exec | 0 | 0 |
▼Loop 4310 - csr_matvec.c:248-302 - exec– | 0 | 0 |
○Loop 4312 - csr_matvec.c:298-300 - exec | 0 | 0 |
○Loop 4311 - csr_matvec.c:298-300 - exec | 0 | 0 |
▼Loop 4286 - csr_matvec.c:248-404 - exec– | 0 | 0 |
○Loop 4287 - csr_matvec.c:400-402 - exec | 0 | 0 |
○Loop 4288 - csr_matvec.c:400-402 - exec | 0 | 0 |
▼Loop 4289 - csr_matvec.c:248-392 - exec– | 0 | 0 |
○Loop 4290 - csr_matvec.c:388-390 - exec | 0 | 0 |
○Loop 4291 - csr_matvec.c:388-390 - exec | 0 | 0 |
▼Loop 4292 - csr_matvec.c:248-380 - exec– | 0 | 0 |
○Loop 4294 - csr_matvec.c:376-378 - exec | 0 | 0 |
○Loop 4293 - csr_matvec.c:376-378 - exec | 0 | 0 |
▼Loop 4313 - csr_matvec.c:248-287 - exec– | 0 | 0 |
○Loop 4314 - csr_matvec.c:283-285 - exec | 0 | 0 |
○Loop 4315 - csr_matvec.c:283-285 - exec | 0 | 0 |
▼Loop 4298 - csr_matvec.c:248-353 - exec– | 0 | 0 |
○Loop 4299 - csr_matvec.c:349-351 - exec | 0 | 0 |
○Loop 4300 - csr_matvec.c:349-351 - exec | 0 | 0 |
▼Loop 4295 - csr_matvec.c:248-365 - exec– | 0 | 0 |
○Loop 4296 - csr_matvec.c:361-363 - exec | 0 | 0 |
○Loop 4297 - csr_matvec.c:361-363 - exec | 0 | 0 |
▼Loop 4304 - csr_matvec.c:248-326 - exec– | 0 | 0 |
○Loop 4306 - csr_matvec.c:322-324 - exec | 0 | 0 |
○Loop 4305 - csr_matvec.c:322-324 - exec | 0 | 0 |