Function: hypre_CSRMatrixMatvecT | Module: exec | Source: csr_matvec.c:445-648 [...] | Coverage: 2.32% |
---|
Function: hypre_CSRMatrixMatvecT | Module: exec | Source: csr_matvec.c:445-648 [...] | Coverage: 2.32% |
---|
/home/kcamus/qaas_runs/169-443-9681/intel/AMG/build/AMG/AMG/seq_mv/csr_matvec.c: 445 - 648 |
-------------------------------------------------------------------------------- |
445: { |
446: HYPRE_Complex *A_data = hypre_CSRMatrixData(A); |
447: HYPRE_Int *A_i = hypre_CSRMatrixI(A); |
448: HYPRE_Int *A_j = hypre_CSRMatrixJ(A); |
449: HYPRE_Int num_rows = hypre_CSRMatrixNumRows(A); |
450: HYPRE_Int num_cols = hypre_CSRMatrixNumCols(A); |
451: |
452: HYPRE_Complex *x_data = hypre_VectorData(x); |
453: HYPRE_Complex *y_data = hypre_VectorData(y); |
454: HYPRE_Int x_size = hypre_VectorSize(x); |
455: HYPRE_Int y_size = hypre_VectorSize(y); |
456: HYPRE_Int num_vectors = hypre_VectorNumVectors(x); |
457: HYPRE_Int idxstride_y = hypre_VectorIndexStride(y); |
458: HYPRE_Int vecstride_y = hypre_VectorVectorStride(y); |
459: HYPRE_Int idxstride_x = hypre_VectorIndexStride(x); |
460: HYPRE_Int vecstride_x = hypre_VectorVectorStride(x); |
[...] |
485: hypre_assert( num_vectors == hypre_VectorNumVectors(y) ); |
486: |
487: if (num_rows != x_size) |
488: ierr = 1; |
489: |
490: if (num_cols != y_size) |
491: ierr = 2; |
492: |
493: if (num_rows != x_size && num_cols != y_size) |
[...] |
499: if (alpha == 0.0) |
500: { |
501: #ifdef HYPRE_USING_OPENMP |
502: #pragma omp parallel for private(i) HYPRE_SMP_SCHEDULE |
503: #endif |
504: for (i = 0; i < num_cols*num_vectors; i++) |
[...] |
510: if (x == y) |
511: { |
512: x_tmp = hypre_SeqVectorCloneDeep(x); |
513: x_data = hypre_VectorData(x_tmp); |
[...] |
520: temp = beta / alpha; |
521: |
522: if (temp != 1.0) |
523: { |
524: if (temp == 0.0) |
525: { |
526: #ifdef HYPRE_USING_OPENMP |
527: #pragma omp parallel for private(i) HYPRE_SMP_SCHEDULE |
528: #endif |
529: for (i = 0; i < num_cols*num_vectors; i++) |
[...] |
535: #pragma omp parallel for private(i) HYPRE_SMP_SCHEDULE |
536: #endif |
537: for (i = 0; i < num_cols*num_vectors; i++) |
[...] |
545: num_threads = hypre_NumThreads(); |
546: if (num_threads > 1) |
547: { |
548: y_data_expand = hypre_CTAlloc(HYPRE_Complex, num_threads*y_size); |
549: |
550: if ( num_vectors==1 ) |
551: { |
552: |
553: #ifdef HYPRE_USING_OPENMP |
554: #pragma omp parallel private(i,jj,j,my_thread_num,offset) |
[...] |
589: for (i = 0; i < num_rows; i++) |
590: { |
591: for ( jv=0; jv<num_vectors; ++jv ) |
592: { |
593: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
594: { |
595: j = A_j[jj]; |
596: y_data[ j*idxstride_y + jv*vecstride_y ] += |
597: A_data[jj] * x_data[ i*idxstride_x + jv*vecstride_x]; |
[...] |
603: hypre_TFree(y_data_expand); |
604: |
605: } |
606: else |
607: { |
608: for (i = 0; i < num_rows; i++) |
609: { |
610: if ( num_vectors==1 ) |
611: { |
612: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
613: { |
614: j = A_j[jj]; |
615: y_data[j] += A_data[jj] * x_data[i]; |
616: } |
617: } |
618: else |
619: { |
620: for ( jv=0; jv<num_vectors; ++jv ) |
621: { |
622: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
623: { |
624: j = A_j[jj]; |
625: y_data[ j*idxstride_y + jv*vecstride_y ] += |
626: A_data[jj] * x_data[ i*idxstride_x + jv*vecstride_x ]; |
[...] |
636: if (alpha != 1.0) |
637: { |
638: #ifdef HYPRE_USING_OPENMP |
639: #pragma omp parallel for private(i) HYPRE_SMP_SCHEDULE |
640: #endif |
641: for (i = 0; i < num_cols*num_vectors; i++) |
642: y_data[i] *= alpha; |
643: } |
644: |
645: if (x == y) hypre_SeqVectorDestroy(x_tmp); |
646: |
647: return ierr; |
648: } |
0x4e9130 PUSH %RBP |
0x4e9131 MOV %RSP,%RBP |
0x4e9134 PUSH %R15 |
0x4e9136 PUSH %R14 |
0x4e9138 PUSH %R13 |
0x4e913a PUSH %R12 |
0x4e913c PUSH %RBX |
0x4e913d SUB $0xb8,%RSP |
0x4e9144 MOV %RSI,%RCX |
0x4e9147 MOV 0x30(%RDI),%R12 |
0x4e914b MOV (%RDI),%RAX |
0x4e914e MOV %RAX,-0x48(%RBP) |
0x4e9152 MOV 0x8(%RDI),%R13 |
0x4e9156 MOV 0x10(%RDI),%RAX |
0x4e915a MOV %RAX,-0x40(%RBP) |
0x4e915e MOV 0x18(%RDI),%RAX |
0x4e9162 MOV %RAX,-0x90(%RBP) |
0x4e9169 MOV (%RSI),%R15 |
0x4e916c MOV 0x8(%RSI),%RAX |
0x4e9170 MOV %RAX,-0xc8(%RBP) |
0x4e9177 MOV (%RDX),%RBX |
0x4e917a MOV 0x8(%RDX),%RAX |
0x4e917e MOV %RAX,-0x60(%RBP) |
0x4e9182 MOV 0x18(%RSI),%RAX |
0x4e9186 MOV 0x30(%RDX),%R14 |
0x4e918a MOV 0x28(%RDX),%RSI |
0x4e918e MOV %RSI,-0x80(%RBP) |
0x4e9192 MOV 0x30(%RCX),%RSI |
0x4e9196 MOV %RSI,-0xd0(%RBP) |
0x4e919d MOV 0x28(%RCX),%RSI |
0x4e91a1 MOV %RSI,-0x78(%RBP) |
0x4e91a5 MOV %RAX,-0x38(%RBP) |
0x4e91a9 MOV %RDX,-0xc0(%RBP) |
0x4e91b0 CMP 0x18(%RDX),%RAX |
0x4e91b4 JE 4e9206 |
0x4e91b6 MOV 0x4da03(%RIP),%RDI |
0x4e91bd MOV $0x510df9,%ESI |
0x4e91c2 MOV $0x5134d8,%EDX |
0x4e91c7 XOR %EAX,%EAX |
0x4e91c9 MOV %RCX,-0x88(%RBP) |
0x4e91d0 VMOVSD %XMM0,-0x58(%RBP) |
0x4e91d5 VMOVSD %XMM1,-0x30(%RBP) |
0x4e91da CALL 4f40b0 <hypre_fprintf> |
0x4e91df MOV $0x513501,%EDI |
0x4e91e4 MOV $0x1e5,%ESI |
0x4e91e9 MOV $0x1,%EDX |
0x4e91ee XOR %ECX,%ECX |
0x4e91f0 CALL 4f6200 <hypre_error_handler> |
0x4e91f5 VMOVSD -0x30(%RBP),%XMM1 |
0x4e91fa VMOVSD -0x58(%RBP),%XMM0 |
0x4e91ff MOV -0x88(%RBP),%RCX |
0x4e9206 VXORPD %XMM2,%XMM2,%XMM2 |
0x4e920a VUCOMISD %XMM2,%XMM0 |
0x4e920e JNE 4e9280 |
0x4e9210 MOV -0x90(%RBP),%R15 |
0x4e9217 MOV -0x38(%RBP),%R10 |
0x4e921b IMUL %R15,%R10 |
0x4e921f TEST %R10,%R10 |
0x4e9222 MOV -0xc8(%RBP),%R14 |
0x4e9229 MOV -0x60(%RBP),%R12 |
0x4e922d JLE 4e9a58 |
0x4e9233 DEC %R10 |
0x4e9236 VMOVQ %XMM1,%RCX |
0x4e923b SUB $0x8,%RSP |
0x4e923f MOV $0x536130,%EDI |
0x4e9244 MOV $0x4ebef0,%EDX |
0x4e9249 MOV $0x4,%ESI |
0x4e924e MOV %RBX,%R8 |
0x4e9251 XOR %R9D,%R9D |
0x4e9254 XOR %EAX,%EAX |
0x4e9256 PUSH %R10 |
0x4e9258 CALL 4103a0 <__kmpc_fork_call@plt> |
0x4e925d ADD $0x10,%RSP |
0x4e9261 JMP 4e9a58 |
0x4e9266 NOPW %CS:(%RAX,%RAX,1) |
0x4e9275 NOPW %CS:(%RAX,%RAX,1) |
0x4e9280 CMP -0xc0(%RBP),%RCX |
0x4e9287 MOV %RCX,-0x88(%RBP) |
0x4e928e VMOVSD %XMM0,-0x58(%RBP) |
0x4e9293 JE 4e92c0 |
0x4e9295 MOVQ $0,-0xb8(%RBP) |
0x4e92a0 VDIVSD %XMM0,%XMM1,%XMM0 |
0x4e92a4 VUCOMISD 0x16d5c(%RIP),%XMM0 |
0x4e92ac JNE 4e92f6 |
0x4e92ae JMP 4e9373 |
0x4e92b3 NOPW %CS:(%RAX,%RAX,1) |
0x4e92c0 MOV %RCX,%RDI |
0x4e92c3 VMOVSD %XMM1,-0x30(%RBP) |
0x4e92c8 CALL 4ed2f0 <hypre_SeqVectorCloneDeep> |
0x4e92cd VMOVSD -0x30(%RBP),%XMM1 |
0x4e92d2 VMOVSD -0x58(%RBP),%XMM0 |
0x4e92d7 MOV %RAX,%RCX |
0x4e92da MOV %RAX,-0xb8(%RBP) |
0x4e92e1 MOV (%RAX),%R15 |
0x4e92e4 VDIVSD %XMM0,%XMM1,%XMM0 |
0x4e92e8 VUCOMISD 0x16d18(%RIP),%XMM0 |
0x4e92f0 JE 4e9373 |
0x4e92f6 MOV -0x38(%RBP),%R10 |
0x4e92fa IMUL -0x90(%RBP),%R10 |
0x4e9302 VXORPD %XMM1,%XMM1,%XMM1 |
0x4e9306 VUCOMISD %XMM1,%XMM0 |
0x4e930a JNE 4e9340 |
0x4e930c TEST %R10,%R10 |
0x4e930f JLE 4e9373 |
0x4e9311 DEC %R10 |
0x4e9314 MOV $0x5360d0,%EDI |
0x4e9319 MOV $0x4ebe60,%EDX |
0x4e931e MOV $0x3,%ESI |
0x4e9323 MOV %RBX,%RCX |
0x4e9326 XOR %R8D,%R8D |
0x4e9329 MOV %R10,%R9 |
0x4e932c XOR %EAX,%EAX |
0x4e932e CALL 4103a0 <__kmpc_fork_call@plt> |
0x4e9333 JMP 4e9373 |
0x4e9335 NOPW %CS:(%RAX,%RAX,1) |
0x4e9340 TEST %R10,%R10 |
0x4e9343 JLE 4e9373 |
0x4e9345 DEC %R10 |
0x4e9348 VMOVQ %XMM0,%R8 |
0x4e934d SUB $0x8,%RSP |
0x4e9351 MOV $0x536070,%EDI |
0x4e9356 MOV $0x4ebd60,%EDX |
0x4e935b MOV $0x4,%ESI |
0x4e9360 MOV %RBX,%RCX |
0x4e9363 XOR %R9D,%R9D |
0x4e9366 XOR %EAX,%EAX |
0x4e9368 PUSH %R10 |
0x4e936a CALL 4103a0 <__kmpc_fork_call@plt> |
0x4e936f ADD $0x10,%RSP |
0x4e9373 CALL 4f60e0 <hypre_NumThreads> |
0x4e9378 CMP $0x1,%RAX |
0x4e937c JLE 4e9400 |
0x4e9382 MOV %RAX,-0x30(%RBP) |
0x4e9386 MOV %RAX,%RDI |
0x4e9389 IMUL -0x60(%RBP),%RDI |
0x4e938e MOV $0x8,%ESI |
0x4e9393 CALL 4f3da0 <hypre_CAlloc> |
0x4e9398 MOV %RAX,%R10 |
0x4e939b CMPQ $0x1,-0x38(%RBP) |
0x4e93a0 MOV %RAX,-0x70(%RBP) |
0x4e93a4 JNE 4e95a0 |
0x4e93aa MOV $0x536010,%EDI |
0x4e93af MOV $0x4eb840,%EDX |
0x4e93b4 MOV $0x9,%ESI |
0x4e93b9 MOV %R12,%RCX |
0x4e93bc MOV -0x48(%RBP),%R8 |
0x4e93c0 MOV %R13,%R9 |
0x4e93c3 XOR %EAX,%EAX |
0x4e93c5 PUSHQ -0x30(%RBP) |
0x4e93c8 PUSH %R10 |
0x4e93ca PUSHQ -0x60(%RBP) |
0x4e93cd PUSH %RBX |
0x4e93ce PUSH %R15 |
0x4e93d0 PUSHQ -0x40(%RBP) |
0x4e93d3 CALL 4103a0 <__kmpc_fork_call@plt> |
0x4e93d8 MOV -0x70(%RBP),%R10 |
0x4e93dc ADD $0x30,%RSP |
0x4e93e0 MOV %R10,%RDI |
0x4e93e3 CALL 4f3eb0 <hypre_Free> |
0x4e93e8 JMP 4e99e0 |
0x4e93ed NOPW %CS:(%RAX,%RAX,1) |
0x4e93fc NOPL (%RAX) |
0x4e9400 CMPQ $0,-0x40(%RBP) |
0x4e9405 JLE 4e99e0 |
0x4e940b CMPQ $0x1,-0x38(%RBP) |
0x4e9410 JNE 4e97e0 |
0x4e9416 MOV -0x40(%RBP),%RAX |
0x4e941a LEA -0x1(%RAX),%R8 |
0x4e941e MOV -0x48(%RBP),%RAX |
0x4e9422 MOV (%RAX),%R11 |
0x4e9425 XOR %EDX,%EDX |
0x4e9427 JMP 4e944d |
0x4e9429 NOPW %CS:(%RAX,%RAX,1) |
0x4e9438 NOPL (%RAX,%RAX,1) |
(3964) 0x4e9440 CMP %R8,%RDX |
(3964) 0x4e9443 LEA 0x1(%RDX),%RDX |
(3964) 0x4e9447 JE 4e99e0 |
(3964) 0x4e944d MOV %R11,%RSI |
(3964) 0x4e9450 MOV -0x48(%RBP),%RAX |
(3964) 0x4e9454 MOV 0x8(%RAX,%RDX,8),%R11 |
(3964) 0x4e9459 MOV %R11,%R10 |
(3964) 0x4e945c SUB %RSI,%R10 |
(3964) 0x4e945f JLE 4e9440 |
(3964) 0x4e9461 MOV %R10,%R9 |
(3964) 0x4e9464 AND $-0x4,%R9 |
(3964) 0x4e9468 JE 4e94a0 |
(3964) 0x4e946a LEA -0x1(%R9),%RAX |
(3964) 0x4e946e XOR %EDI,%EDI |
(3968) 0x4e9470 ADD $0x4,%RDI |
(3968) 0x4e9474 CMP %RAX,%RDI |
(3968) 0x4e9477 JBE 4e9470 |
(3964) 0x4e9479 MOV %R9,%RDI |
(3964) 0x4e947c CMP %R9,%R10 |
(3964) 0x4e947f JNE 4e94a2 |
(3964) 0x4e9481 JMP 4e94b5 |
0x4e9483 NOPW %CS:(%RAX,%RAX,1) |
0x4e9492 NOPW %CS:(%RAX,%RAX,1) |
(3964) 0x4e94a0 XOR %EDI,%EDI |
(3964) 0x4e94a2 MOV %R11,%RAX |
(3964) 0x4e94a5 SUB %RDI,%RAX |
(3964) 0x4e94a8 SUB %RSI,%RAX |
(3964) 0x4e94ab NOPL (%RAX,%RAX,1) |
(3965) 0x4e94b0 DEC %RAX |
(3965) 0x4e94b3 JNE 4e94b0 |
(3964) 0x4e94b5 CMP $0x4,%R10 |
(3964) 0x4e94b9 JB 4e954c |
(3964) 0x4e94bf MOV %R10,%RDI |
(3964) 0x4e94c2 SHR $0x2,%RDI |
(3964) 0x4e94c6 LEA 0x18(,%RSI,8),%RAX |
(3964) 0x4e94ce XCHG %AX,%AX |
(3967) 0x4e94d0 VMOVSD (%R15,%RDX,8),%XMM0 |
(3967) 0x4e94d6 VMOVSD -0x18(%R12,%RAX,1),%XMM1 |
(3967) 0x4e94dd MOV -0x18(%R13,%RAX,1),%RCX |
(3967) 0x4e94e2 VFMADD213SD (%RBX,%RCX,8),%XMM0,%XMM1 |
(3967) 0x4e94e8 VMOVSD %XMM1,(%RBX,%RCX,8) |
(3967) 0x4e94ed MOV -0x10(%R13,%RAX,1),%RCX |
(3967) 0x4e94f2 VMOVSD (%R15,%RDX,8),%XMM0 |
(3967) 0x4e94f8 VMOVSD -0x10(%R12,%RAX,1),%XMM1 |
(3967) 0x4e94ff VFMADD213SD (%RBX,%RCX,8),%XMM0,%XMM1 |
(3967) 0x4e9505 VMOVSD %XMM1,(%RBX,%RCX,8) |
(3967) 0x4e950a MOV -0x8(%R13,%RAX,1),%RCX |
(3967) 0x4e950f VMOVSD (%R15,%RDX,8),%XMM0 |
(3967) 0x4e9515 VMOVSD -0x8(%R12,%RAX,1),%XMM1 |
(3967) 0x4e951c VFMADD213SD (%RBX,%RCX,8),%XMM0,%XMM1 |
(3967) 0x4e9522 VMOVSD %XMM1,(%RBX,%RCX,8) |
(3967) 0x4e9527 MOV (%R13,%RAX,1),%RCX |
(3967) 0x4e952c VMOVSD (%R15,%RDX,8),%XMM0 |
(3967) 0x4e9532 VMOVSD (%R12,%RAX,1),%XMM1 |
(3967) 0x4e9538 VFMADD213SD (%RBX,%RCX,8),%XMM0,%XMM1 |
(3967) 0x4e953e VMOVSD %XMM1,(%RBX,%RCX,8) |
(3967) 0x4e9543 ADD $0x20,%RAX |
(3967) 0x4e9547 DEC %RDI |
(3967) 0x4e954a JNE 4e94d0 |
(3964) 0x4e954c CMP %R10,%R9 |
(3964) 0x4e954f JAE 4e9440 |
(3964) 0x4e9555 ADD %R9,%RSI |
(3964) 0x4e9558 NOPL (%RAX,%RAX,1) |
(3966) 0x4e9560 MOV (%R13,%RSI,8),%RAX |
(3966) 0x4e9565 VMOVSD (%R15,%RDX,8),%XMM0 |
(3966) 0x4e956b VMOVSD (%R12,%RSI,8),%XMM1 |
(3966) 0x4e9571 VFMADD213SD (%RBX,%RAX,8),%XMM0,%XMM1 |
(3966) 0x4e9577 VMOVSD %XMM1,(%RBX,%RAX,8) |
(3966) 0x4e957c INC %RSI |
(3966) 0x4e957f CMP %RSI,%R11 |
(3966) 0x4e9582 JNE 4e9560 |
(3964) 0x4e9584 JMP 4e9440 |
0x4e9589 NOPW %CS:(%RAX,%RAX,1) |
0x4e9598 NOPL (%RAX,%RAX,1) |
0x4e95a0 CMPQ $0,-0x40(%RBP) |
0x4e95a5 JLE 4e93e0 |
0x4e95ab CMPQ $0,-0x38(%RBP) |
0x4e95b0 JLE 4e93e0 |
0x4e95b6 MOV -0x40(%RBP),%RAX |
0x4e95ba DEC %RAX |
0x4e95bd MOV %RAX,-0xd8(%RBP) |
0x4e95c4 MOV -0x48(%RBP),%RAX |
0x4e95c8 MOV (%RAX),%R11 |
0x4e95cb MOV -0x38(%RBP),%RAX |
0x4e95cf LEA -0x1(%RAX),%R8 |
0x4e95d3 XOR %ECX,%ECX |
0x4e95d5 JMP 4e95fe |
0x4e95d7 NOPW (%RAX,%RAX,1) |
(3969) 0x4e95e0 MOV %RDX,%R11 |
(3969) 0x4e95e3 MOV -0x98(%RBP),%RAX |
(3969) 0x4e95ea CMP -0xd8(%RBP),%RAX |
(3969) 0x4e95f1 MOV -0xe0(%RBP),%RCX |
(3969) 0x4e95f8 JE 4e93e0 |
(3969) 0x4e95fe LEA 0x1(%RCX),%RAX |
(3969) 0x4e9602 MOV %RAX,-0xe0(%RBP) |
(3969) 0x4e9609 MOV -0x48(%RBP),%RAX |
(3969) 0x4e960d MOV 0x8(%RAX,%RCX,8),%RDX |
(3969) 0x4e9612 MOV %RDX,%RAX |
(3969) 0x4e9615 SUB %R11,%RAX |
(3969) 0x4e9618 MOV %RAX,%RSI |
(3969) 0x4e961b SHR $0x2,%RSI |
(3969) 0x4e961f MOV %RSI,-0xa8(%RBP) |
(3969) 0x4e9626 MOV -0xd0(%RBP),%RSI |
(3969) 0x4e962d MOV %RCX,-0x98(%RBP) |
(3969) 0x4e9634 IMUL %RCX,%RSI |
(3969) 0x4e9638 MOV %RSI,-0x50(%RBP) |
(3969) 0x4e963c MOV %RAX,-0x30(%RBP) |
(3969) 0x4e9640 AND $-0x4,%RAX |
(3969) 0x4e9644 LEA 0x18(,%R11,8),%RCX |
(3969) 0x4e964c MOV %RCX,-0xa0(%RBP) |
(3969) 0x4e9653 MOV %RAX,-0xb0(%RBP) |
(3969) 0x4e965a ADD %R11,%RAX |
(3969) 0x4e965d MOV %RAX,-0x68(%RBP) |
(3969) 0x4e9661 XOR %R9D,%R9D |
(3969) 0x4e9664 JMP 4e968d |
0x4e9666 NOPW %CS:(%RAX,%RAX,1) |
0x4e9675 NOPW %CS:(%RAX,%RAX,1) |
(3970) 0x4e9680 CMP %R8,%R9 |
(3970) 0x4e9683 LEA 0x1(%R9),%R9 |
(3970) 0x4e9687 JE 4e95e0 |
(3970) 0x4e968d CMP %R11,%RDX |
(3970) 0x4e9690 JLE 4e9680 |
(3970) 0x4e9692 MOV %R11,%RDI |
(3970) 0x4e9695 MOV %R8,%RCX |
(3970) 0x4e9698 CMPQ $0x4,-0x30(%RBP) |
(3970) 0x4e969d JB 4e976c |
(3970) 0x4e96a3 MOV -0x78(%RBP),%R10 |
(3970) 0x4e96a7 IMUL %R9,%R10 |
(3970) 0x4e96ab ADD -0x50(%RBP),%R10 |
(3970) 0x4e96af MOV -0x80(%RBP),%R11 |
(3970) 0x4e96b3 IMUL %R9,%R11 |
(3970) 0x4e96b7 MOV -0xa8(%RBP),%RSI |
(3970) 0x4e96be MOV -0xa0(%RBP),%R8 |
(3970) 0x4e96c5 NOPW %CS:(%RAX,%RAX,1) |
(3972) 0x4e96d0 VMOVSD (%R15,%R10,8),%XMM0 |
(3972) 0x4e96d6 VMOVSD -0x18(%R12,%R8,1),%XMM1 |
(3972) 0x4e96dd MOV -0x18(%R13,%R8,1),%RAX |
(3972) 0x4e96e2 IMUL %R14,%RAX |
(3972) 0x4e96e6 ADD %R11,%RAX |
(3972) 0x4e96e9 VFMADD213SD (%RBX,%RAX,8),%XMM0,%XMM1 |
(3972) 0x4e96ef VMOVSD %XMM1,(%RBX,%RAX,8) |
(3972) 0x4e96f4 VMOVSD (%R15,%R10,8),%XMM0 |
(3972) 0x4e96fa VMOVSD -0x10(%R12,%R8,1),%XMM1 |
(3972) 0x4e9701 MOV -0x10(%R13,%R8,1),%RAX |
(3972) 0x4e9706 IMUL %R14,%RAX |
(3972) 0x4e970a ADD %R11,%RAX |
(3972) 0x4e970d VFMADD213SD (%RBX,%RAX,8),%XMM0,%XMM1 |
(3972) 0x4e9713 VMOVSD %XMM1,(%RBX,%RAX,8) |
(3972) 0x4e9718 VMOVSD (%R15,%R10,8),%XMM0 |
(3972) 0x4e971e VMOVSD -0x8(%R12,%R8,1),%XMM1 |
(3972) 0x4e9725 MOV -0x8(%R13,%R8,1),%RAX |
(3972) 0x4e972a IMUL %R14,%RAX |
(3972) 0x4e972e ADD %R11,%RAX |
(3972) 0x4e9731 VFMADD213SD (%RBX,%RAX,8),%XMM0,%XMM1 |
(3972) 0x4e9737 VMOVSD %XMM1,(%RBX,%RAX,8) |
(3972) 0x4e973c VMOVSD (%R15,%R10,8),%XMM0 |
(3972) 0x4e9742 VMOVSD (%R12,%R8,1),%XMM1 |
(3972) 0x4e9748 MOV (%R13,%R8,1),%RAX |
(3972) 0x4e974d IMUL %R14,%RAX |
(3972) 0x4e9751 ADD %R11,%RAX |
(3972) 0x4e9754 VFMADD213SD (%RBX,%RAX,8),%XMM0,%XMM1 |
(3972) 0x4e975a VMOVSD %XMM1,(%RBX,%RAX,8) |
(3972) 0x4e975f ADD $0x20,%R8 |
(3972) 0x4e9763 DEC %RSI |
(3972) 0x4e9766 JNE 4e96d0 |
(3970) 0x4e976c MOV -0xb0(%RBP),%RAX |
(3970) 0x4e9773 CMP -0x30(%RBP),%RAX |
(3970) 0x4e9777 MOV -0x70(%RBP),%R10 |
(3970) 0x4e977b MOV %RCX,%R8 |
(3970) 0x4e977e MOV %RDI,%R11 |
(3970) 0x4e9781 JAE 4e9680 |
(3970) 0x4e9787 MOV -0x78(%RBP),%RSI |
(3970) 0x4e978b IMUL %R9,%RSI |
(3970) 0x4e978f ADD -0x50(%RBP),%RSI |
(3970) 0x4e9793 MOV -0x80(%RBP),%RCX |
(3970) 0x4e9797 IMUL %R9,%RCX |
(3970) 0x4e979b MOV -0x68(%RBP),%RAX |
(3970) 0x4e979f NOP |
(3971) 0x4e97a0 VMOVSD (%R15,%RSI,8),%XMM0 |
(3971) 0x4e97a6 VMOVSD (%R12,%RAX,8),%XMM1 |
(3971) 0x4e97ac MOV (%R13,%RAX,8),%RDI |
(3971) 0x4e97b1 IMUL %R14,%RDI |
(3971) 0x4e97b5 ADD %RCX,%RDI |
(3971) 0x4e97b8 VFMADD213SD (%RBX,%RDI,8),%XMM0,%XMM1 |
(3971) 0x4e97be VMOVSD %XMM1,(%RBX,%RDI,8) |
(3971) 0x4e97c3 INC %RAX |
(3971) 0x4e97c6 CMP %RAX,%RDX |
(3971) 0x4e97c9 JNE 4e97a0 |
(3970) 0x4e97cb JMP 4e9680 |
0x4e97d0 NOPW %CS:(%RAX,%RAX,1) |
0x4e97df NOP |
0x4e97e0 JL 4e99e0 |
0x4e97e6 MOV -0x40(%RBP),%RAX |
0x4e97ea DEC %RAX |
0x4e97ed MOV %RAX,-0x98(%RBP) |
0x4e97f4 MOV -0x48(%RBP),%RAX |
0x4e97f8 MOV (%RAX),%RDX |
0x4e97fb MOV -0x38(%RBP),%RAX |
0x4e97ff DEC %RAX |
0x4e9802 MOV %RAX,-0xb0(%RBP) |
0x4e9809 XOR %ECX,%ECX |
0x4e980b JMP 4e9838 |
0x4e980d NOPW %CS:(%RAX,%RAX,1) |
0x4e981c NOPL (%RAX) |
(3960) 0x4e9820 MOV %RDI,%RDX |
(3960) 0x4e9823 MOV -0x68(%RBP),%RCX |
(3960) 0x4e9827 CMP -0x98(%RBP),%RCX |
(3960) 0x4e982e LEA 0x1(%RCX),%RCX |
(3960) 0x4e9832 JE 4e99e0 |
(3960) 0x4e9838 MOV -0x48(%RBP),%RAX |
(3960) 0x4e983c MOV %RCX,-0x68(%RBP) |
(3960) 0x4e9840 MOV 0x8(%RAX,%RCX,8),%RDI |
(3960) 0x4e9845 MOV %RDI,%RSI |
(3960) 0x4e9848 SUB %RDX,%RSI |
(3960) 0x4e984b JLE 4e9820 |
(3960) 0x4e984d MOV %RDX,%RAX |
(3960) 0x4e9850 MOV %RSI,%RCX |
(3960) 0x4e9853 SHR $0x2,%RCX |
(3960) 0x4e9857 MOV %RCX,-0xa8(%RBP) |
(3960) 0x4e985e MOV -0xd0(%RBP),%RCX |
(3960) 0x4e9865 IMUL -0x68(%RBP),%RCX |
(3960) 0x4e986a MOV %RCX,-0x50(%RBP) |
(3960) 0x4e986e MOV %RSI,%RCX |
(3960) 0x4e9871 AND $-0x4,%RCX |
(3960) 0x4e9875 LEA 0x18(,%RDX,8),%RDX |
(3960) 0x4e987d MOV %RDX,-0xa0(%RBP) |
(3960) 0x4e9884 MOV %RCX,-0x30(%RBP) |
(3960) 0x4e9888 ADD %RCX,%RAX |
(3960) 0x4e988b MOV %RAX,-0x70(%RBP) |
(3960) 0x4e988f XOR %R9D,%R9D |
(3960) 0x4e9892 JMP 4e98b4 |
0x4e9894 NOPW %CS:(%RAX,%RAX,1) |
(3961) 0x4e98a0 CMP -0xb0(%RBP),%R9 |
(3961) 0x4e98a7 LEA 0x1(%R9),%R9 |
(3961) 0x4e98ab MOV %R8,%RSI |
(3961) 0x4e98ae JE 4e9820 |
(3961) 0x4e98b4 CMP $0x4,%RSI |
(3961) 0x4e98b8 JB 4e997c |
(3961) 0x4e98be MOV -0x78(%RBP),%R8 |
(3961) 0x4e98c2 IMUL %R9,%R8 |
(3961) 0x4e98c6 ADD -0x50(%RBP),%R8 |
(3961) 0x4e98ca MOV -0x80(%RBP),%R10 |
(3961) 0x4e98ce IMUL %R9,%R10 |
(3961) 0x4e98d2 MOV -0xa8(%RBP),%R11 |
(3961) 0x4e98d9 MOV -0xa0(%RBP),%RCX |
(3963) 0x4e98e0 VMOVSD (%R15,%R8,8),%XMM0 |
(3963) 0x4e98e6 VMOVSD -0x18(%R12,%RCX,1),%XMM1 |
(3963) 0x4e98ed MOV -0x18(%R13,%RCX,1),%RDX |
(3963) 0x4e98f2 IMUL %R14,%RDX |
(3963) 0x4e98f6 ADD %R10,%RDX |
(3963) 0x4e98f9 VFMADD213SD (%RBX,%RDX,8),%XMM0,%XMM1 |
(3963) 0x4e98ff VMOVSD %XMM1,(%RBX,%RDX,8) |
(3963) 0x4e9904 VMOVSD (%R15,%R8,8),%XMM0 |
(3963) 0x4e990a VMOVSD -0x10(%R12,%RCX,1),%XMM1 |
(3963) 0x4e9911 MOV -0x10(%R13,%RCX,1),%RDX |
(3963) 0x4e9916 IMUL %R14,%RDX |
(3963) 0x4e991a ADD %R10,%RDX |
(3963) 0x4e991d VFMADD213SD (%RBX,%RDX,8),%XMM0,%XMM1 |
(3963) 0x4e9923 VMOVSD %XMM1,(%RBX,%RDX,8) |
(3963) 0x4e9928 VMOVSD (%R15,%R8,8),%XMM0 |
(3963) 0x4e992e VMOVSD -0x8(%R12,%RCX,1),%XMM1 |
(3963) 0x4e9935 MOV -0x8(%R13,%RCX,1),%RDX |
(3963) 0x4e993a IMUL %R14,%RDX |
(3963) 0x4e993e ADD %R10,%RDX |
(3963) 0x4e9941 VFMADD213SD (%RBX,%RDX,8),%XMM0,%XMM1 |
(3963) 0x4e9947 VMOVSD %XMM1,(%RBX,%RDX,8) |
(3963) 0x4e994c VMOVSD (%R15,%R8,8),%XMM0 |
(3963) 0x4e9952 VMOVSD (%R12,%RCX,1),%XMM1 |
(3963) 0x4e9958 MOV (%R13,%RCX,1),%RDX |
(3963) 0x4e995d IMUL %R14,%RDX |
(3963) 0x4e9961 ADD %R10,%RDX |
(3963) 0x4e9964 VFMADD213SD (%RBX,%RDX,8),%XMM0,%XMM1 |
(3963) 0x4e996a VMOVSD %XMM1,(%RBX,%RDX,8) |
(3963) 0x4e996f ADD $0x20,%RCX |
(3963) 0x4e9973 DEC %R11 |
(3963) 0x4e9976 JNE 4e98e0 |
(3961) 0x4e997c MOV %RSI,%R8 |
(3961) 0x4e997f CMP %RSI,-0x30(%RBP) |
(3961) 0x4e9983 JAE 4e98a0 |
(3961) 0x4e9989 MOV -0x78(%RBP),%RCX |
(3961) 0x4e998d IMUL %R9,%RCX |
(3961) 0x4e9991 ADD -0x50(%RBP),%RCX |
(3961) 0x4e9995 MOV -0x80(%RBP),%RDX |
(3961) 0x4e9999 IMUL %R9,%RDX |
(3961) 0x4e999d MOV -0x70(%RBP),%RSI |
(3961) 0x4e99a1 NOPW %CS:(%RAX,%RAX,1) |
(3962) 0x4e99b0 VMOVSD (%R15,%RCX,8),%XMM0 |
(3962) 0x4e99b6 VMOVSD (%R12,%RSI,8),%XMM1 |
(3962) 0x4e99bc MOV (%R13,%RSI,8),%RAX |
(3962) 0x4e99c1 IMUL %R14,%RAX |
(3962) 0x4e99c5 ADD %RDX,%RAX |
(3962) 0x4e99c8 VFMADD213SD (%RBX,%RAX,8),%XMM0,%XMM1 |
(3962) 0x4e99ce VMOVSD %XMM1,(%RBX,%RAX,8) |
(3962) 0x4e99d3 INC %RSI |
(3962) 0x4e99d6 CMP %RSI,%RDI |
(3962) 0x4e99d9 JNE 4e99b0 |
(3961) 0x4e99db JMP 4e98a0 |
0x4e99e0 VMOVSD -0x58(%RBP),%XMM0 |
0x4e99e5 VUCOMISD 0x1661b(%RIP),%XMM0 |
0x4e99ed MOV -0x90(%RBP),%R15 |
0x4e99f4 MOV -0x38(%RBP),%R10 |
0x4e99f8 JE 4e9a31 |
0x4e99fa IMUL %R15,%R10 |
0x4e99fe TEST %R10,%R10 |
0x4e9a01 JLE 4e9a31 |
0x4e9a03 DEC %R10 |
0x4e9a06 VMOVQ %XMM0,%RCX |
0x4e9a0b SUB $0x8,%RSP |
0x4e9a0f MOV $0x535f30,%EDI |
0x4e9a14 MOV $0x4eb740,%EDX |
0x4e9a19 MOV $0x4,%ESI |
0x4e9a1e MOV %RBX,%R8 |
0x4e9a21 XOR %R9D,%R9D |
0x4e9a24 XOR %EAX,%EAX |
0x4e9a26 PUSH %R10 |
0x4e9a28 CALL 4103a0 <__kmpc_fork_call@plt> |
0x4e9a2d ADD $0x10,%RSP |
0x4e9a31 MOV -0x88(%RBP),%RAX |
0x4e9a38 CMP -0xc0(%RBP),%RAX |
0x4e9a3f MOV -0xc8(%RBP),%R14 |
0x4e9a46 MOV -0x60(%RBP),%R12 |
0x4e9a4a JNE 4e9a58 |
0x4e9a4c MOV -0xb8(%RBP),%RDI |
0x4e9a53 CALL 4eca70 <hypre_SeqVectorDestroy> |
0x4e9a58 XOR %EAX,%EAX |
0x4e9a5a MOV -0x40(%RBP),%RDX |
0x4e9a5e CMP %R14,%RDX |
0x4e9a61 SETNE %AL |
0x4e9a64 CMP %R12,%R15 |
0x4e9a67 MOV $0x2,%ECX |
0x4e9a6c CMOVE %RAX,%RCX |
0x4e9a70 MOV $0x3,%EAX |
0x4e9a75 CMOVE %RCX,%RAX |
0x4e9a79 CMP %R14,%RDX |
0x4e9a7c CMOVE %RCX,%RAX |
0x4e9a80 ADD $0xb8,%RSP |
0x4e9a87 POP %RBX |
0x4e9a88 POP %R12 |
0x4e9a8a POP %R13 |
0x4e9a8c POP %R14 |
0x4e9a8e POP %R15 |
0x4e9a90 POP %RBP |
0x4e9a91 RET |
0x4e9a92 NOPW %CS:(%RAX,%RAX,1) |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►96.02+ | hypre_ParCSRMatrixMatvecT | par_csr_matvec.c:432 | exec |
○ | hypre_BoomerAMGCycle | par_cycle.c:431 | exec |
○ | hypre_BoomerAMGSolve | par_amg_solve.c:272 | exec |
○ | hypre_PCGSolve | pcg.c:545 | exec |
○ | main | amg.c:419 | exec |
○ | __libc_init_first | libc.so.6 | |
►3.98+ | hypre_ParCSRMatrixMatvecT | par_csr_matvec.c:432 | exec |
○ | hypre_BoomerAMGCycle | par_cycle.c:431 | exec |
○ | hypre_BoomerAMGSolve | par_amg_solve.c:272 | exec |
○ | hypre_PCGSolve | pcg.c:424 | exec |
○ | main | amg.c:419 | exec |
○ | __libc_init_first | libc.so.6 |
Path / |
Source file and lines | csr_matvec.c:445-648 |
Module | exec |
nb instructions | 257 |
nb uops | 275 |
loop length | 1210 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 18 |
micro-operation queue | 68.75 cycles |
front end | 68.75 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | |
---|---|---|---|---|---|---|---|---|
uops | 28.50 | 28.50 | 40.17 | 39.83 | 50.00 | 28.50 | 28.50 | 40.00 |
cycles | 28.50 | 28.50 | 40.17 | 39.83 | 50.00 | 28.50 | 28.50 | 40.00 |
Cycles executing div or sqrt instructions | 8.00 |
FE+BE cycles | 65.99-66.00 |
Stall cycles | 0.00 |
Front-end | 68.75 |
Dispatch | 50.00 |
DIV/SQRT | 8.00 |
Overall L1 | 68.75 |
all | 0% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 0% |
all | 11% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 28% |
all | 2% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 5% |
all | 12% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 13% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 12% |
other | 16% |
all | 12% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 12% |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSH %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
SUB $0xb8,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RSI,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV 0x30(%RDI),%R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV (%RDI),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x8(%RDI),%R13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x10(%RDI),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RAX,-0x40(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x18(%RDI),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RAX,-0x90(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV (%RSI),%R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x8(%RSI),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RAX,-0xc8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV (%RDX),%RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x8(%RDX),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RAX,-0x60(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x18(%RSI),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x30(%RDX),%R14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x28(%RDX),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RSI,-0x80(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x30(%RCX),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RSI,-0xd0(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x28(%RCX),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RSI,-0x78(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RAX,-0x38(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RDX,-0xc0(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CMP 0x18(%RDX),%RAX | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
JE 4e9206 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV 0x4da03(%RIP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV $0x510df9,%ESI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x5134d8,%EDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RCX,-0x88(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD %XMM0,-0x58(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD %XMM1,-0x30(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CALL 4f40b0 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV $0x513501,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x1e5,%ESI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x1,%EDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 4f6200 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
VMOVSD -0x30(%RBP),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD -0x58(%RBP),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x88(%RBP),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VXORPD %XMM2,%XMM2,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VUCOMISD %XMM2,%XMM0 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JNE 4e9280 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV -0x90(%RBP),%R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x38(%RBP),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
IMUL %R15,%R10 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
TEST %R10,%R10 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV -0xc8(%RBP),%R14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x60(%RBP),%R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
JLE 4e9a58 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
DEC %R10 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVQ %XMM1,%RCX | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x536130,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x4ebef0,%EDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x4,%ESI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RBX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSH %R10 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CALL 4103a0 <__kmpc_fork_call@plt> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
ADD $0x10,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JMP 4e9a58 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CMP -0xc0(%RBP),%RCX | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
MOV %RCX,-0x88(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD %XMM0,-0x58(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
JE 4e92c0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOVQ $0,-0xb8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 2 | 1 |
VDIVSD %XMM0,%XMM1,%XMM0 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 13-14 | 4 |
VUCOMISD 0x16d5c(%RIP),%XMM0 | 2 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 1 |
JNE 4e92f6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
JMP 4e9373 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RCX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVSD %XMM1,-0x30(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CALL 4ed2f0 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
VMOVSD -0x30(%RBP),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD -0x58(%RBP),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RAX,-0xb8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV (%RAX),%R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VDIVSD %XMM0,%XMM1,%XMM0 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 13-14 | 4 |
VUCOMISD 0x16d18(%RIP),%XMM0 | 2 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 1 |
JE 4e9373 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV -0x38(%RBP),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
IMUL -0x90(%RBP),%R10 | 1 | 0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 1 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VUCOMISD %XMM1,%XMM0 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JNE 4e9340 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
TEST %R10,%R10 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JLE 4e9373 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
DEC %R10 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x5360d0,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x4ebe60,%EDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x3,%ESI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RBX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R10,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 4103a0 <__kmpc_fork_call@plt> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
JMP 4e9373 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
TEST %R10,%R10 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JLE 4e9373 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
DEC %R10 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVQ %XMM0,%R8 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x536070,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x4ebd60,%EDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x4,%ESI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RBX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSH %R10 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CALL 4103a0 <__kmpc_fork_call@plt> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
ADD $0x10,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CALL 4f60e0 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
CMP $0x1,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JLE 4e9400 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV %RAX,-0x30(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
IMUL -0x60(%RBP),%RDI | 1 | 0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV $0x8,%ESI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CALL 4f3da0 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV %RAX,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CMPQ $0x1,-0x38(%RBP) | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
MOV %RAX,-0x70(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4e95a0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV $0x536010,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x4eb840,%EDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x9,%ESI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %R12,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV -0x48(%RBP),%R8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %R13,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSHQ -0x30(%RBP) | 2 | 0 | 0 | 0.83 | 0.83 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R10 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSHQ -0x60(%RBP) | 2 | 0 | 0 | 0.83 | 0.83 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSHQ -0x40(%RBP) | 2 | 0 | 0 | 0.83 | 0.83 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CALL 4103a0 <__kmpc_fork_call@plt> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV -0x70(%RBP),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD $0x30,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %R10,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 4f3eb0 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
JMP 4e99e0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CMPQ $0,-0x40(%RBP) | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
JLE 4e99e0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMPQ $0x1,-0x38(%RBP) | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
JNE 4e97e0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA -0x1(%RAX),%R8 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV (%RAX),%R11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
JMP 4e944d | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CMPQ $0,-0x40(%RBP) | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
JLE 4e93e0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMPQ $0,-0x38(%RBP) | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
JLE 4e93e0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
DEC %RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RAX,-0xd8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV (%RAX),%R11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA -0x1(%RAX),%R8 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
JMP 4e95fe | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
JL 4e99e0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
DEC %RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RAX,-0x98(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
DEC %RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RAX,-0xb0(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
JMP 4e9838 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVSD -0x58(%RBP),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VUCOMISD 0x1661b(%RIP),%XMM0 | 2 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV -0x90(%RBP),%R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x38(%RBP),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
JE 4e9a31 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
IMUL %R15,%R10 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
TEST %R10,%R10 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JLE 4e9a31 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
DEC %R10 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVQ %XMM0,%RCX | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x535f30,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x4eb740,%EDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x4,%ESI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RBX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSH %R10 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CALL 4103a0 <__kmpc_fork_call@plt> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
ADD $0x10,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV -0x88(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
CMP -0xc0(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
MOV -0xc8(%RBP),%R14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x60(%RBP),%R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
JNE 4e9a58 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV -0xb8(%RBP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
CALL 4eca70 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV -0x40(%RBP),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
CMP %R14,%RDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETNE %AL | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
CMP %R12,%R15 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x2,%ECX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMOVE %RAX,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
MOV $0x3,%EAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMOVE %RCX,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
CMP %R14,%RDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMOVE %RCX,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
ADD $0xb8,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %RBP | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
RET | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 | 0 | 1 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
Source file and lines | csr_matvec.c:445-648 |
Module | exec |
nb instructions | 257 |
nb uops | 275 |
loop length | 1210 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 18 |
micro-operation queue | 68.75 cycles |
front end | 68.75 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | |
---|---|---|---|---|---|---|---|---|
uops | 28.50 | 28.50 | 40.17 | 39.83 | 50.00 | 28.50 | 28.50 | 40.00 |
cycles | 28.50 | 28.50 | 40.17 | 39.83 | 50.00 | 28.50 | 28.50 | 40.00 |
Cycles executing div or sqrt instructions | 8.00 |
FE+BE cycles | 65.99-66.00 |
Stall cycles | 0.00 |
Front-end | 68.75 |
Dispatch | 50.00 |
DIV/SQRT | 8.00 |
Overall L1 | 68.75 |
all | 0% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 0% |
all | 11% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 28% |
all | 2% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 5% |
all | 12% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 13% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 12% |
other | 16% |
all | 12% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 12% |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSH %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
SUB $0xb8,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RSI,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV 0x30(%RDI),%R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV (%RDI),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x8(%RDI),%R13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x10(%RDI),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RAX,-0x40(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x18(%RDI),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RAX,-0x90(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV (%RSI),%R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x8(%RSI),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RAX,-0xc8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV (%RDX),%RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x8(%RDX),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RAX,-0x60(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x18(%RSI),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x30(%RDX),%R14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x28(%RDX),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RSI,-0x80(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x30(%RCX),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RSI,-0xd0(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x28(%RCX),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RSI,-0x78(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RAX,-0x38(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RDX,-0xc0(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CMP 0x18(%RDX),%RAX | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
JE 4e9206 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV 0x4da03(%RIP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV $0x510df9,%ESI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x5134d8,%EDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RCX,-0x88(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD %XMM0,-0x58(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD %XMM1,-0x30(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CALL 4f40b0 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV $0x513501,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x1e5,%ESI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x1,%EDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 4f6200 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
VMOVSD -0x30(%RBP),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD -0x58(%RBP),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x88(%RBP),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VXORPD %XMM2,%XMM2,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VUCOMISD %XMM2,%XMM0 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JNE 4e9280 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV -0x90(%RBP),%R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x38(%RBP),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
IMUL %R15,%R10 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
TEST %R10,%R10 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV -0xc8(%RBP),%R14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x60(%RBP),%R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
JLE 4e9a58 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
DEC %R10 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVQ %XMM1,%RCX | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x536130,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x4ebef0,%EDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x4,%ESI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RBX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSH %R10 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CALL 4103a0 <__kmpc_fork_call@plt> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
ADD $0x10,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JMP 4e9a58 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CMP -0xc0(%RBP),%RCX | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
MOV %RCX,-0x88(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
VMOVSD %XMM0,-0x58(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
JE 4e92c0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOVQ $0,-0xb8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 2 | 1 |
VDIVSD %XMM0,%XMM1,%XMM0 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 13-14 | 4 |
VUCOMISD 0x16d5c(%RIP),%XMM0 | 2 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 1 |
JNE 4e92f6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
JMP 4e9373 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RCX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVSD %XMM1,-0x30(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CALL 4ed2f0 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
VMOVSD -0x30(%RBP),%XMM1 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VMOVSD -0x58(%RBP),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RAX,-0xb8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV (%RAX),%R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VDIVSD %XMM0,%XMM1,%XMM0 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 13-14 | 4 |
VUCOMISD 0x16d18(%RIP),%XMM0 | 2 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 1 |
JE 4e9373 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV -0x38(%RBP),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
IMUL -0x90(%RBP),%R10 | 1 | 0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 1 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VUCOMISD %XMM1,%XMM0 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JNE 4e9340 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
TEST %R10,%R10 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JLE 4e9373 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
DEC %R10 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x5360d0,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x4ebe60,%EDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x3,%ESI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RBX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R10,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 4103a0 <__kmpc_fork_call@plt> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
JMP 4e9373 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
TEST %R10,%R10 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JLE 4e9373 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
DEC %R10 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVQ %XMM0,%R8 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x536070,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x4ebd60,%EDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x4,%ESI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RBX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSH %R10 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CALL 4103a0 <__kmpc_fork_call@plt> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
ADD $0x10,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CALL 4f60e0 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
CMP $0x1,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JLE 4e9400 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV %RAX,-0x30(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
IMUL -0x60(%RBP),%RDI | 1 | 0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV $0x8,%ESI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CALL 4f3da0 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV %RAX,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CMPQ $0x1,-0x38(%RBP) | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
MOV %RAX,-0x70(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4e95a0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV $0x536010,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x4eb840,%EDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x9,%ESI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %R12,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV -0x48(%RBP),%R8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %R13,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSHQ -0x30(%RBP) | 2 | 0 | 0 | 0.83 | 0.83 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R10 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSHQ -0x60(%RBP) | 2 | 0 | 0 | 0.83 | 0.83 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSHQ -0x40(%RBP) | 2 | 0 | 0 | 0.83 | 0.83 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CALL 4103a0 <__kmpc_fork_call@plt> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV -0x70(%RBP),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
ADD $0x30,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %R10,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 4f3eb0 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
JMP 4e99e0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CMPQ $0,-0x40(%RBP) | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
JLE 4e99e0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMPQ $0x1,-0x38(%RBP) | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
JNE 4e97e0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA -0x1(%RAX),%R8 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV (%RAX),%R11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
JMP 4e944d | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CMPQ $0,-0x40(%RBP) | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
JLE 4e93e0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMPQ $0,-0x38(%RBP) | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
JLE 4e93e0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
DEC %RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RAX,-0xd8(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV (%RAX),%R11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA -0x1(%RAX),%R8 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
JMP 4e95fe | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
JL 4e99e0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
DEC %RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RAX,-0x98(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
DEC %RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RAX,-0xb0(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
JMP 4e9838 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
VMOVSD -0x58(%RBP),%XMM0 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
VUCOMISD 0x1661b(%RIP),%XMM0 | 2 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV -0x90(%RBP),%R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x38(%RBP),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
JE 4e9a31 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
IMUL %R15,%R10 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
TEST %R10,%R10 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JLE 4e9a31 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
DEC %R10 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
VMOVQ %XMM0,%RCX | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x535f30,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x4eb740,%EDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x4,%ESI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %RBX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSH %R10 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CALL 4103a0 <__kmpc_fork_call@plt> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
ADD $0x10,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV -0x88(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
CMP -0xc0(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
MOV -0xc8(%RBP),%R14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x60(%RBP),%R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
JNE 4e9a58 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV -0xb8(%RBP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
CALL 4eca70 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV -0x40(%RBP),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
CMP %R14,%RDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SETNE %AL | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
CMP %R12,%R15 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x2,%ECX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMOVE %RAX,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
MOV $0x3,%EAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMOVE %RCX,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
CMP %R14,%RDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMOVE %RCX,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
ADD $0xb8,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %RBP | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
RET | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 | 0 | 1 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_CSRMatrixMatvecT– | 2.32 | 0.88 |
▼Loop 3964 - csr_matvec.c:485-615 - exec– | 0.91 | 0.34 |
○Loop 3966 - csr_matvec.c:612-615 - exec | 1.12 | 0.42 |
○Loop 3967 - csr_matvec.c:612-615 - exec | 0.18 | 0.07 |
○Loop 3965 - csr_matvec.c:612-612 - exec | 0.11 | 0.04 |
○Loop 3968 - csr_matvec.c:612-612 - exec | 0 | 0 |
▼Loop 3960 - csr_matvec.c:485-626 - exec– | 0 | 0 |
▼Loop 3961 - csr_matvec.c:620-626 - exec– | 0 | 0 |
○Loop 3963 - csr_matvec.c:622-626 - exec | 0 | 0 |
○Loop 3962 - csr_matvec.c:622-626 - exec | 0 | 0 |
▼Loop 3969 - csr_matvec.c:485-597 - exec– | 0 | 0 |
▼Loop 3970 - csr_matvec.c:591-597 - exec– | 0 | 0 |
○Loop 3972 - csr_matvec.c:593-597 - exec | 0 | 0 |
○Loop 3971 - csr_matvec.c:593-597 - exec | 0 | 0 |