Function: hypre_ParTMatmul.extracted | Module: exec | Source: par_csr_matop.c:3454-3640 [...] | Coverage: 0.05% |
---|
Function: hypre_ParTMatmul.extracted | Module: exec | Source: par_csr_matop.c:3454-3640 [...] | Coverage: 0.05% |
---|
/scratch_na/users/xoserete/qaas_runs/171-415-3872/intel/AMG/build/AMG/AMG/parcsr_mv/par_csr_matop.c: 3454 - 3640 |
-------------------------------------------------------------------------------- |
3454: #pragma omp parallel |
[...] |
3462: HYPRE_Int num_threads = hypre_NumActiveThreads(); |
3463: |
3464: size = num_cols_diag_A/num_threads; |
3465: rest = num_cols_diag_A - size*num_threads; |
3466: ii = hypre_GetThreadNum(); |
3467: if (ii < rest) |
3468: { |
3469: ns = ii*size+ii; |
3470: ne = (ii+1)*size+ii+1; |
3471: } |
3472: else |
3473: { |
3474: ns = ii*size+rest; |
3475: ne = (ii+1)*size+rest; |
3476: } |
3477: |
3478: B_marker = hypre_CTAlloc(HYPRE_Int, num_cols_diag_B); |
3479: B_marker_offd = hypre_CTAlloc(HYPRE_Int, num_cols_offd_C); |
3480: |
3481: for (ik = 0; ik < num_cols_diag_B; ik++) |
3482: B_marker[ik] = -1; |
3483: |
3484: for (ik = 0; ik < num_cols_offd_C; ik++) |
3485: B_marker_offd[ik] = -1; |
3486: |
3487: nnz_d = 0; |
3488: nnz_o = 0; |
3489: for (ik = ns; ik < ne; ik++) |
3490: { |
3491: for (jk = C_tmp_diag_i[ik]; jk < C_tmp_diag_i[ik+1]; jk++) |
3492: { |
3493: jcol = C_tmp_diag_j[jk]; |
3494: B_marker[jcol] = ik; |
3495: nnz_d++; |
3496: } |
3497: for (jk = C_tmp_offd_i[ik]; jk < C_tmp_offd_i[ik+1]; jk++) |
3498: { |
3499: jcol = C_tmp_offd_j[jk]; |
3500: B_marker_offd[jcol] = ik; |
3501: nnz_o++; |
3502: } |
3503: for (jk = 0; jk < num_sends_A; jk++) |
3504: for (j1 = send_map_starts_A[jk]; j1 < send_map_starts_A[jk+1]; j1++) |
3505: if (send_map_elmts_A[j1] == ik) |
3506: { |
3507: for (j2 = C_ext_diag_i[j1]; j2 < C_ext_diag_i[j1+1]; j2++) |
3508: { |
3509: jcol = C_ext_diag_j[j2]; |
3510: if (B_marker[jcol] < ik) |
3511: { |
3512: B_marker[jcol] = ik; |
3513: nnz_d++; |
3514: } |
3515: } |
3516: for (j2 = C_ext_offd_i[j1]; j2 < C_ext_offd_i[j1+1]; j2++) |
3517: { |
3518: jcol = C_ext_offd_j[j2]; |
3519: if (B_marker_offd[jcol] < ik) |
3520: { |
3521: B_marker_offd[jcol] = ik; |
3522: nnz_o++; |
3523: } |
3524: } |
3525: break; |
3526: } |
3527: C_diag_array[ii] = nnz_d; |
3528: C_offd_array[ii] = nnz_o; |
3529: } |
3530: #ifdef HYPRE_USING_OPENMP |
3531: #pragma omp barrier |
3532: #endif |
3533: if (ii == 0) |
3534: { |
3535: nnz_d = 0; |
3536: nnz_o = 0; |
3537: for (ik = 0; ik < num_threads-1; ik++) |
3538: { |
3539: C_diag_array[ik+1] += C_diag_array[ik]; |
3540: C_offd_array[ik+1] += C_offd_array[ik]; |
3541: } |
3542: nnz_d = C_diag_array[num_threads-1]; |
3543: nnz_o = C_offd_array[num_threads-1]; |
3544: C_diag_i[num_cols_diag_A] = nnz_d; |
3545: C_offd_i[num_cols_diag_A] = nnz_o; |
3546: |
3547: C_diag = hypre_CSRMatrixCreate(num_cols_diag_A, num_cols_diag_A, nnz_d); |
3548: C_offd = hypre_CSRMatrixCreate(num_cols_diag_A, num_cols_offd_C, nnz_o); |
3549: hypre_CSRMatrixI(C_diag) = C_diag_i; |
3550: hypre_CSRMatrixInitialize(C_diag); |
3551: C_diag_j = hypre_CSRMatrixJ(C_diag); |
3552: C_diag_data = hypre_CSRMatrixData(C_diag); |
3553: hypre_CSRMatrixI(C_offd) = C_offd_i; |
3554: hypre_CSRMatrixInitialize(C_offd); |
3555: C_offd_j = hypre_CSRMatrixJ(C_offd); |
3556: C_offd_data = hypre_CSRMatrixData(C_offd); |
[...] |
3568: for (ik = 0; ik < num_cols_diag_B; ik++) |
3569: B_marker[ik] = -1; |
3570: |
3571: for (ik = 0; ik < num_cols_offd_C; ik++) |
3572: B_marker_offd[ik] = -1; |
[...] |
3581: if (ii) |
3582: { |
3583: nnz_d = C_diag_array[ii-1]; |
3584: nnz_o = C_offd_array[ii-1]; |
3585: } |
3586: for (ik = ns; ik < ne; ik++) |
3587: { |
3588: C_diag_i[ik] = nnz_d; |
3589: C_offd_i[ik] = nnz_o; |
3590: for (jk = C_tmp_diag_i[ik]; jk < C_tmp_diag_i[ik+1]; jk++) |
3591: { |
3592: jcol = C_tmp_diag_j[jk]; |
3593: C_diag_j[nnz_d] = jcol; |
3594: C_diag_data[nnz_d] = C_tmp_diag_data[jk]; |
3595: B_marker[jcol] = nnz_d; |
3596: nnz_d++; |
3597: } |
3598: for (jk = C_tmp_offd_i[ik]; jk < C_tmp_offd_i[ik+1]; jk++) |
3599: { |
3600: jcol = C_tmp_offd_j[jk]; |
3601: C_offd_j[nnz_o] = jcol; |
3602: C_offd_data[nnz_o] = C_tmp_offd_data[jk]; |
3603: B_marker_offd[jcol] = nnz_o; |
3604: nnz_o++; |
3605: } |
3606: for (jk = 0; jk < num_sends_A; jk++) |
3607: for (j1 = send_map_starts_A[jk]; j1 < send_map_starts_A[jk+1]; j1++) |
3608: if (send_map_elmts_A[j1] == ik) |
3609: { |
3610: for (j2 = C_ext_diag_i[j1]; j2 < C_ext_diag_i[j1+1]; j2++) |
3611: { |
3612: jcol = C_ext_diag_j[j2]; |
3613: if (B_marker[jcol] < C_diag_i[ik]) |
3614: { |
3615: C_diag_j[nnz_d] = jcol; |
3616: C_diag_data[nnz_d] = C_ext_diag_data[j2]; |
3617: B_marker[jcol] = nnz_d; |
3618: nnz_d++; |
3619: } |
3620: else |
3621: C_diag_data[B_marker[jcol]] += C_ext_diag_data[j2]; |
3622: } |
3623: for (j2 = C_ext_offd_i[j1]; j2 < C_ext_offd_i[j1+1]; j2++) |
3624: { |
3625: jcol = C_ext_offd_j[j2]; |
3626: if (B_marker_offd[jcol] < C_offd_i[ik]) |
3627: { |
3628: C_offd_j[nnz_o] = jcol; |
3629: C_offd_data[nnz_o] = C_ext_offd_data[j2]; |
3630: B_marker_offd[jcol] = nnz_o; |
3631: nnz_o++; |
3632: } |
3633: else |
3634: C_offd_data[B_marker_offd[jcol]] += C_ext_offd_data[j2]; |
3635: } |
3636: break; |
3637: } |
3638: } |
3639: hypre_TFree(B_marker); |
3640: hypre_TFree(B_marker_offd); |
0x4c0180 PUSH %RBP |
0x4c0181 MOV %RSP,%RBP |
0x4c0184 PUSH %R15 |
0x4c0186 PUSH %R14 |
0x4c0188 PUSH %R13 |
0x4c018a PUSH %R12 |
0x4c018c PUSH %RBX |
0x4c018d SUB $0x128,%RSP |
0x4c0194 MOV %R9,-0xe0(%RBP) |
0x4c019b MOV %R8,-0x128(%RBP) |
0x4c01a2 MOV %RCX,-0xf8(%RBP) |
0x4c01a9 MOV %RDX,%R15 |
0x4c01ac MOV %RDI,-0xb8(%RBP) |
0x4c01b3 MOV 0xc8(%RBP),%RAX |
0x4c01ba MOV %RAX,-0xc8(%RBP) |
0x4c01c1 MOV 0xc0(%RBP),%RAX |
0x4c01c8 MOV %RAX,-0xc0(%RBP) |
0x4c01cf MOV 0xb8(%RBP),%RAX |
0x4c01d6 MOV %RAX,-0x70(%RBP) |
0x4c01da MOV 0xb0(%RBP),%RBX |
0x4c01e1 MOV 0xa8(%RBP),%RAX |
0x4c01e8 MOV %RAX,-0x50(%RBP) |
0x4c01ec MOV 0xa0(%RBP),%RAX |
0x4c01f3 MOV %RAX,-0x38(%RBP) |
0x4c01f7 MOV 0x98(%RBP),%RAX |
0x4c01fe MOV %RAX,-0xf0(%RBP) |
0x4c0205 MOV 0x90(%RBP),%RAX |
0x4c020c MOV %RAX,-0xa0(%RBP) |
0x4c0213 MOV 0x88(%RBP),%RAX |
0x4c021a MOV %RAX,-0xd8(%RBP) |
0x4c0221 MOV 0x80(%RBP),%R13 |
0x4c0228 MOV 0x78(%RBP),%RAX |
0x4c022c MOV %RAX,-0x58(%RBP) |
0x4c0230 MOV 0x70(%RBP),%RAX |
0x4c0234 MOV %RAX,-0x88(%RBP) |
0x4c023b MOV 0x68(%RBP),%R12 |
0x4c023f MOV 0x60(%RBP),%RAX |
0x4c0243 MOV %RAX,-0x100(%RBP) |
0x4c024a MOV 0x58(%RBP),%RAX |
0x4c024e MOV %RAX,-0x78(%RBP) |
0x4c0252 MOV 0x50(%RBP),%RAX |
0x4c0256 MOV %RAX,-0x148(%RBP) |
0x4c025d MOV 0x48(%RBP),%RAX |
0x4c0261 MOV %RAX,-0x110(%RBP) |
0x4c0268 MOV 0x40(%RBP),%RAX |
0x4c026c MOV %RAX,-0xb0(%RBP) |
0x4c0273 MOV 0x38(%RBP),%RAX |
0x4c0277 MOV %RAX,-0x140(%RBP) |
0x4c027e MOV 0x30(%RBP),%RAX |
0x4c0282 MOV %RAX,-0x108(%RBP) |
0x4c0289 MOV 0x28(%RBP),%RAX |
0x4c028d MOV %RAX,-0xa8(%RBP) |
0x4c0294 MOV 0x20(%RBP),%RAX |
0x4c0298 MOV %RAX,-0x120(%RBP) |
0x4c029f MOV 0x18(%RBP),%RAX |
0x4c02a3 MOV %RAX,-0xe8(%RBP) |
0x4c02aa MOV 0x10(%RBP),%RAX |
0x4c02ae MOV %RAX,-0x98(%RBP) |
0x4c02b5 CALL 4e86b0 <hypre_NumActiveThreads> |
0x4c02ba MOV %RAX,%RCX |
0x4c02bd MOV %R15,%RAX |
0x4c02c0 OR %RCX,%RAX |
0x4c02c3 SHR $0x20,%RAX |
0x4c02c7 MOV %R15,-0x130(%RBP) |
0x4c02ce MOV %RCX,-0x118(%RBP) |
0x4c02d5 JE 4c02e7 |
0x4c02d7 MOV %R15,%RAX |
0x4c02da CQTO |
0x4c02dc IDIV %RCX |
0x4c02df MOV %RDX,%R15 |
0x4c02e2 MOV %RAX,%R14 |
0x4c02e5 JMP 4c02f4 |
0x4c02e7 MOV %R15D,%EAX |
0x4c02ea XOR %EDX,%EDX |
0x4c02ec DIV %ECX |
0x4c02ee MOV %EDX,%R15D |
0x4c02f1 MOV %EAX,%R14D |
0x4c02f4 CALL 4e86c0 <hypre_GetThreadNum> |
0x4c02f9 LEA 0x1(%RAX),%RCX |
0x4c02fd MOV %RCX,%RDX |
0x4c0300 IMUL %R14,%RDX |
0x4c0304 CMP %R15,%RAX |
0x4c0307 MOV %R12,-0x138(%RBP) |
0x4c030e MOV %RAX,-0xd0(%RBP) |
0x4c0315 JGE 4c032b |
0x4c0317 INC %R14 |
0x4c031a IMUL %RAX,%R14 |
0x4c031e MOV %R14,-0x40(%RBP) |
0x4c0322 ADD %RDX,%RCX |
0x4c0325 MOV %RCX,-0x60(%RBP) |
0x4c0329 JMP 4c033d |
0x4c032b IMUL %RAX,%R14 |
0x4c032f ADD %R15,%R14 |
0x4c0332 MOV %R14,-0x40(%RBP) |
0x4c0336 ADD %R15,%RDX |
0x4c0339 MOV %RDX,-0x60(%RBP) |
0x4c033d MOV -0x50(%RBP),%R15 |
0x4c0341 MOV $0x8,%ESI |
0x4c0346 MOV -0xf8(%RBP),%R12 |
0x4c034d MOV %R12,%RDI |
0x4c0350 CALL 4e6980 <hypre_CAlloc> |
0x4c0355 MOV %RAX,%R14 |
0x4c0358 MOV $0x8,%ESI |
0x4c035d MOV -0x70(%RBP),%RDI |
0x4c0361 CALL 4e6980 <hypre_CAlloc> |
0x4c0366 MOV %R12,%RCX |
0x4c0369 MOV %RAX,%R12 |
0x4c036c TEST %RCX,%RCX |
0x4c036f JLE 4c0386 |
0x4c0371 LEA (,%RCX,8),%RDX |
0x4c0379 MOV %R14,%RDI |
0x4c037c MOV $0xff,%ESI |
0x4c0381 CALL 4efbb0 <_intel_fast_memset> |
0x4c0386 MOV -0x70(%RBP),%RAX |
0x4c038a TEST %RAX,%RAX |
0x4c038d JLE 4c03a4 |
0x4c038f LEA (,%RAX,8),%RDX |
0x4c0397 MOV %R12,%RDI |
0x4c039a MOV $0xff,%ESI |
0x4c039f CALL 4efbb0 <_intel_fast_memset> |
0x4c03a4 MOV -0x40(%RBP),%RAX |
0x4c03a8 CMP -0x60(%RBP),%RAX |
0x4c03ac MOV %RBX,-0x48(%RBP) |
0x4c03b0 MOV -0x38(%RBP),%R11 |
0x4c03b4 MOV %R13,-0x80(%RBP) |
0x4c03b8 MOV %R14,-0x30(%RBP) |
0x4c03bc JGE 4c06de |
0x4c03c2 XOR %EAX,%EAX |
0x4c03c4 MOV -0x40(%RBP),%RDX |
0x4c03c8 XOR %ECX,%ECX |
0x4c03ca JMP 4c03fe |
0x4c03cc NOPL (%RAX) |
(3674) 0x4c03d0 MOV -0xc0(%RBP),%RDX |
(3674) 0x4c03d7 MOV -0xd0(%RBP),%RSI |
(3674) 0x4c03de MOV %RCX,(%RDX,%RSI,8) |
(3674) 0x4c03e2 MOV -0xc8(%RBP),%RDX |
(3674) 0x4c03e9 MOV %RAX,(%RDX,%RSI,8) |
(3674) 0x4c03ed MOV -0x68(%RBP),%RSI |
(3674) 0x4c03f1 MOV %RSI,%RDX |
(3674) 0x4c03f4 CMP -0x60(%RBP),%RSI |
(3674) 0x4c03f8 JGE 4c06de |
(3674) 0x4c03fe MOV -0x78(%RBP),%RDI |
(3674) 0x4c0402 MOV (%RDI,%RDX,8),%RSI |
(3674) 0x4c0406 LEA 0x1(%RDX),%R8 |
(3674) 0x4c040a MOV %R8,-0x68(%RBP) |
(3674) 0x4c040e CMP 0x8(%RDI,%RDX,8),%RSI |
(3674) 0x4c0413 MOV -0x58(%RBP),%R8 |
(3674) 0x4c0417 JGE 4c06c0 |
(3674) 0x4c041d MOV -0x100(%RBP),%R9 |
(3674) 0x4c0424 MOV -0x78(%RBP),%R10 |
(3674) 0x4c0428 MOV -0x68(%RBP),%RBX |
(3674) 0x4c042c NOPL (%RAX) |
(3681) 0x4c0430 MOV (%R9,%RSI,8),%RDI |
(3681) 0x4c0434 MOV %RDX,(%R14,%RDI,8) |
(3681) 0x4c0438 INC %RCX |
(3681) 0x4c043b INC %RSI |
(3681) 0x4c043e CMP (%R10,%RBX,8),%RSI |
(3681) 0x4c0442 JL 4c0430 |
(3674) 0x4c0444 MOV -0x88(%RBP),%RDI |
(3674) 0x4c044b MOV (%RDI,%RDX,8),%RSI |
(3674) 0x4c044f CMP (%RDI,%RBX,8),%RSI |
(3674) 0x4c0453 JGE 4c047b |
(3674) 0x4c0455 NOPW %CS:(%RAX,%RAX,1) |
(3673) 0x4c0460 MOV (%R8,%RSI,8),%RDI |
(3673) 0x4c0464 MOV %RDX,(%R12,%RDI,8) |
(3673) 0x4c0468 INC %RAX |
(3673) 0x4c046b INC %RSI |
(3673) 0x4c046e MOV -0x88(%RBP),%RDI |
(3673) 0x4c0475 CMP (%RDI,%RBX,8),%RSI |
(3673) 0x4c0479 JL 4c0460 |
(3674) 0x4c047b MOV -0x48(%RBP),%RBX |
(3674) 0x4c047f TEST %RBX,%RBX |
(3674) 0x4c0482 JLE 4c03d0 |
(3674) 0x4c0488 VPBROADCASTQ %RDX,%YMM0 |
(3674) 0x4c048e XOR %EDI,%EDI |
(3674) 0x4c0490 JMP 4c04af |
0x4c0492 NOPW %CS:(%RAX,%RAX,1) |
(3675) 0x4c04a0 MOV %RSI,%R11 |
(3675) 0x4c04a3 INC %RDI |
(3675) 0x4c04a6 CMP %RBX,%RDI |
(3675) 0x4c04a9 JE 4c03d0 |
(3675) 0x4c04af MOV (%R11,%RDI,8),%R10 |
(3675) 0x4c04b3 MOV %R11,%RSI |
(3675) 0x4c04b6 MOV 0x8(%R11,%RDI,8),%R9 |
(3675) 0x4c04bb MOV %R9,%R11 |
(3675) 0x4c04be SUB %R10,%R11 |
(3675) 0x4c04c1 JLE 4c04a0 |
(3675) 0x4c04c3 LEA (%R15,%R10,8),%ESI |
(3675) 0x4c04c7 AND $0x7f,%ESI |
(3675) 0x4c04ca MOV $0x80,%EBX |
(3675) 0x4c04cf SUB %ESI,%EBX |
(3675) 0x4c04d1 SHR $0x3,%EBX |
(3675) 0x4c04d4 CMP %RBX,%R11 |
(3675) 0x4c04d7 MOV %RBX,%RSI |
(3675) 0x4c04da CMOVB %R11,%RSI |
(3675) 0x4c04de TEST %RSI,%RSI |
(3675) 0x4c04e1 JE 4c0502 |
(3675) 0x4c04e3 MOV %R10,%R8 |
(3675) 0x4c04e6 MOV %RSI,%R14 |
(3675) 0x4c04e9 NOPL (%RAX) |
(3680) 0x4c04f0 CMP %RDX,(%R15,%R8,8) |
(3680) 0x4c04f4 JE 4c0599 |
(3680) 0x4c04fa INC %R8 |
(3680) 0x4c04fd DEC %R14 |
(3680) 0x4c0500 JNE 4c04f0 |
(3675) 0x4c0502 CMP %R11,%RBX |
(3675) 0x4c0505 JAE 4c0588 |
(3675) 0x4c050b SUB %RSI,%R11 |
(3675) 0x4c050e MOV %R11,%RBX |
(3675) 0x4c0511 AND $-0x10,%RBX |
(3675) 0x4c0515 JE 4c056a |
(3675) 0x4c0517 LEA -0x1(%RBX),%R13 |
(3675) 0x4c051b LEA (%R10,%RSI,1),%R8 |
(3675) 0x4c051f MOV -0x50(%RBP),%R14 |
(3675) 0x4c0523 LEA (%R14,%R8,8),%R15 |
(3675) 0x4c0527 XOR %R14D,%R14D |
(3675) 0x4c052a NOPW (%RAX,%RAX,1) |
(3679) 0x4c0530 VPCMPEQQ 0x20(%R15,%R14,8),%YMM0,%K0 |
(3679) 0x4c0538 VPCMPEQQ (%R15,%R14,8),%YMM0,%K1 |
(3679) 0x4c053f VPCMPEQQ 0x60(%R15,%R14,8),%YMM0,%K2 |
(3679) 0x4c0547 VPCMPEQQ 0x40(%R15,%R14,8),%YMM0,%K3 |
(3679) 0x4c054f KORB %K0,%K1,%K4 |
(3679) 0x4c0553 KORB %K2,%K3,%K5 |
(3679) 0x4c0557 KORTESTB %K5,%K4 |
(3679) 0x4c055b JNE 4c05e3 |
(3679) 0x4c0561 ADD $0x10,%R14 |
(3679) 0x4c0565 CMP %R13,%R14 |
(3679) 0x4c0568 JBE 4c0530 |
(3675) 0x4c056a CMP %R11,%RBX |
(3675) 0x4c056d JNE 4c05a7 |
(3675) 0x4c056f MOV -0x48(%RBP),%RBX |
(3675) 0x4c0573 MOV -0x50(%RBP),%R15 |
(3675) 0x4c0577 MOV -0x38(%RBP),%R11 |
(3675) 0x4c057b MOV -0x80(%RBP),%R13 |
(3675) 0x4c057f MOV -0x30(%RBP),%R14 |
(3675) 0x4c0583 JMP 4c04a3 |
(3675) 0x4c0588 MOV -0x38(%RBP),%R11 |
(3675) 0x4c058c MOV -0x30(%RBP),%R14 |
(3675) 0x4c0590 MOV -0x48(%RBP),%RBX |
(3675) 0x4c0594 JMP 4c04a3 |
(3675) 0x4c0599 MOV -0x38(%RBP),%R11 |
(3675) 0x4c059d MOV -0x30(%RBP),%R14 |
(3675) 0x4c05a1 MOV -0x48(%RBP),%RBX |
(3675) 0x4c05a5 JMP 4c061d |
(3675) 0x4c05a7 ADD %RSI,%R10 |
(3675) 0x4c05aa ADD %RBX,%R10 |
(3675) 0x4c05ad MOV %R10,%R8 |
(3675) 0x4c05b0 MOV -0x48(%RBP),%RBX |
(3675) 0x4c05b4 MOV -0x50(%RBP),%R15 |
(3675) 0x4c05b8 MOV -0x38(%RBP),%R11 |
(3675) 0x4c05bc MOV -0x80(%RBP),%R13 |
(3675) 0x4c05c0 MOV -0x40(%RBP),%RSI |
(3675) 0x4c05c4 MOV -0x30(%RBP),%R14 |
(3675) 0x4c05c8 MOV %RSI,-0x40(%RBP) |
(3675) 0x4c05cc NOPL (%RAX) |
(3678) 0x4c05d0 CMP %RDX,(%R15,%R8,8) |
(3678) 0x4c05d4 JE 4c061d |
(3678) 0x4c05d6 INC %R8 |
(3678) 0x4c05d9 CMP %R8,%R9 |
(3678) 0x4c05dc JNE 4c05d0 |
(3675) 0x4c05de JMP 4c04a3 |
(3675) 0x4c05e3 KSHIFTLB $0x4,%K0,%K0 |
(3675) 0x4c05e9 KORB %K0,%K1,%K0 |
(3675) 0x4c05ed KSHIFTLB $0x4,%K2,%K1 |
(3675) 0x4c05f3 KORB %K1,%K3,%K1 |
(3675) 0x4c05f7 KUNPCKBW %K0,%K1,%K0 |
(3675) 0x4c05fb KMOVD %K0,%ESI |
(3675) 0x4c05ff TZCNT %ESI,%ESI |
(3675) 0x4c0603 ADD %R14,%R8 |
(3675) 0x4c0606 ADD %RSI,%R8 |
(3675) 0x4c0609 MOV -0x48(%RBP),%RBX |
(3675) 0x4c060d MOV -0x50(%RBP),%R15 |
(3675) 0x4c0611 MOV -0x38(%RBP),%R11 |
(3675) 0x4c0615 MOV -0x80(%RBP),%R13 |
(3675) 0x4c0619 MOV -0x30(%RBP),%R14 |
(3675) 0x4c061d MOV -0xa8(%RBP),%R9 |
(3675) 0x4c0624 MOV (%R9,%R8,8),%RSI |
(3675) 0x4c0628 MOV 0x8(%R9,%R8,8),%R9 |
(3675) 0x4c062d JMP 4c0633 |
0x4c062f NOP |
(3677) 0x4c0630 INC %RSI |
(3677) 0x4c0633 CMP %R9,%RSI |
(3677) 0x4c0636 JGE 4c0660 |
(3677) 0x4c0638 MOV -0x108(%RBP),%R10 |
(3677) 0x4c063f MOV (%R10,%RSI,8),%R10 |
(3677) 0x4c0643 CMP %RDX,(%R14,%R10,8) |
(3677) 0x4c0647 JGE 4c0630 |
(3677) 0x4c0649 MOV %RDX,(%R14,%R10,8) |
(3677) 0x4c064d INC %RCX |
(3677) 0x4c0650 MOV -0xa8(%RBP),%R9 |
(3677) 0x4c0657 MOV 0x8(%R9,%R8,8),%R9 |
(3677) 0x4c065c JMP 4c0630 |
0x4c065e XCHG %AX,%AX |
(3675) 0x4c0660 MOV -0xb0(%RBP),%R9 |
(3675) 0x4c0667 MOV (%R9,%R8,8),%RSI |
(3675) 0x4c066b MOV 0x8(%R9,%R8,8),%R9 |
(3675) 0x4c0670 JMP 4c0683 |
0x4c0672 NOPW %CS:(%RAX,%RAX,1) |
(3676) 0x4c0680 INC %RSI |
(3676) 0x4c0683 CMP %R9,%RSI |
(3676) 0x4c0686 JGE 4c04a3 |
(3676) 0x4c068c MOV -0x110(%RBP),%R10 |
(3676) 0x4c0693 MOV (%R10,%RSI,8),%R10 |
(3676) 0x4c0697 CMP %RDX,(%R12,%R10,8) |
(3676) 0x4c069b JGE 4c0680 |
(3676) 0x4c069d MOV %RDX,(%R12,%R10,8) |
(3676) 0x4c06a1 INC %RAX |
(3676) 0x4c06a4 MOV -0xb0(%RBP),%R9 |
(3676) 0x4c06ab MOV 0x8(%R9,%R8,8),%R9 |
(3676) 0x4c06b0 JMP 4c0680 |
0x4c06b2 NOPW %CS:(%RAX,%RAX,1) |
(3674) 0x4c06c0 MOV -0x68(%RBP),%RBX |
(3674) 0x4c06c4 MOV -0x88(%RBP),%RDI |
(3674) 0x4c06cb MOV (%RDI,%RDX,8),%RSI |
(3674) 0x4c06cf CMP (%RDI,%RBX,8),%RSI |
(3674) 0x4c06d3 JL 4c0460 |
(3674) 0x4c06d9 JMP 4c047b |
0x4c06de MOV -0xb8(%RBP),%RAX |
0x4c06e5 MOV (%RAX),%ESI |
0x4c06e7 MOV $0x736270,%EDI |
0x4c06ec VZEROUPPER |
0x4c06ef CALL 410030 <__kmpc_barrier@plt> |
0x4c06f4 MOV -0xb8(%RBP),%RAX |
0x4c06fb CMPQ $0,-0xd0(%RBP) |
0x4c0703 JNE 4c0930 |
0x4c0709 MOV -0x118(%RBP),%RDI |
0x4c0710 CMP $0x1,%RDI |
0x4c0714 MOV -0xc8(%RBP),%R10 |
0x4c071b MOV -0xc0(%RBP),%R11 |
0x4c0722 JLE 4c086c |
0x4c0728 LEA -0x1(%RDI),%RAX |
0x4c072c LEA (%R11,%RAX,8),%RCX |
0x4c0730 CMP %R10,%RCX |
0x4c0733 JB 4c0791 |
0x4c0735 LEA (%R10,%RAX,8),%RCX |
0x4c0739 CMP %R11,%RCX |
0x4c073c JB 4c0791 |
0x4c073e LEA (%R10,%RDI,8),%RAX |
0x4c0742 CMP %R11,%RAX |
0x4c0745 JBE 4c083e |
0x4c074b LEA (%R11,%RDI,8),%RAX |
0x4c074f CMP %R10,%RAX |
0x4c0752 JBE 4c083e |
0x4c0758 MOV $0x1,%EAX |
0x4c075d NOPL (%RAX) |
(3672) 0x4c0760 MOV -0x8(%R11,%RAX,8),%RCX |
(3672) 0x4c0765 LEA (%R11,%RAX,8),%RDX |
(3672) 0x4c0769 MOV (%RDX),%RSI |
(3672) 0x4c076c ADD %RCX,%RSI |
(3672) 0x4c076f MOV %RSI,(%RDX) |
(3672) 0x4c0772 MOV -0x8(%R10,%RAX,8),%RCX |
(3672) 0x4c0777 LEA (%R10,%RAX,8),%RDX |
(3672) 0x4c077b MOV (%RDX),%RSI |
(3672) 0x4c077e ADD %RCX,%RSI |
(3672) 0x4c0781 MOV %RSI,(%RDX) |
(3672) 0x4c0784 INC %RAX |
(3672) 0x4c0787 CMP %RAX,%RDI |
(3672) 0x4c078a JNE 4c0760 |
0x4c078c JMP 4c086c |
0x4c0791 MOV %RDI,%RBX |
0x4c0794 CMP $0x5,%RDI |
0x4c0798 JB 4c07fd |
0x4c079a MOV %RAX,%RCX |
0x4c079d SHR $0x2,%RCX |
0x4c07a1 MOV (%R11),%RDX |
0x4c07a4 MOV (%R10),%RSI |
0x4c07a7 MOV $0x20,%EDI |
0x4c07ac NOPL (%RAX) |
(3670) 0x4c07b0 LEA (%R11,%RDI,1),%R8 |
(3670) 0x4c07b4 ADD -0x18(%R8),%RDX |
(3670) 0x4c07b8 MOV %RDX,-0x18(%R8) |
(3670) 0x4c07bc LEA (%R10,%RDI,1),%R9 |
(3670) 0x4c07c0 ADD -0x18(%R9),%RSI |
(3670) 0x4c07c4 MOV %RSI,-0x18(%R9) |
(3670) 0x4c07c8 ADD -0x10(%R8),%RDX |
(3670) 0x4c07cc MOV %RDX,-0x10(%R8) |
(3670) 0x4c07d0 ADD -0x10(%R9),%RSI |
(3670) 0x4c07d4 MOV %RSI,-0x10(%R9) |
(3670) 0x4c07d8 ADD -0x8(%R8),%RDX |
(3670) 0x4c07dc MOV %RDX,-0x8(%R8) |
(3670) 0x4c07e0 ADD -0x8(%R9),%RSI |
(3670) 0x4c07e4 MOV %RSI,-0x8(%R9) |
(3670) 0x4c07e8 ADD (%R8),%RDX |
(3670) 0x4c07eb MOV %RDX,(%R8) |
(3670) 0x4c07ee ADD (%R9),%RSI |
(3670) 0x4c07f1 MOV %RSI,(%R9) |
(3670) 0x4c07f4 ADD $0x20,%RDI |
(3670) 0x4c07f8 DEC %RCX |
(3670) 0x4c07fb JNE 4c07b0 |
0x4c07fd MOV %RAX,%RCX |
0x4c0800 AND $-0x4,%RCX |
0x4c0804 CMP %RAX,%RCX |
0x4c0807 MOV %RBX,%RDI |
0x4c080a JE 4c086c |
0x4c080c MOV (%R11,%RCX,8),%RAX |
0x4c0810 MOV (%R10,%RCX,8),%RDX |
0x4c0814 INC %RCX |
0x4c0817 NOPW (%RAX,%RAX,1) |
(3669) 0x4c0820 LEA (%R11,%RCX,8),%RSI |
(3669) 0x4c0824 ADD (%RSI),%RAX |
(3669) 0x4c0827 MOV %RAX,(%RSI) |
(3669) 0x4c082a LEA (%R10,%RCX,8),%RSI |
(3669) 0x4c082e ADD (%RSI),%RDX |
(3669) 0x4c0831 MOV %RDX,(%RSI) |
(3669) 0x4c0834 INC %RCX |
(3669) 0x4c0837 CMP %RCX,%RDI |
(3669) 0x4c083a JNE 4c0820 |
0x4c083c JMP 4c086c |
0x4c083e MOV (%R11),%RAX |
0x4c0841 MOV (%R10),%RCX |
0x4c0844 MOV $0x1,%EDX |
0x4c0849 NOPL (%RAX) |
(3671) 0x4c0850 LEA (%R11,%RDX,8),%RSI |
(3671) 0x4c0854 ADD (%RSI),%RAX |
(3671) 0x4c0857 MOV %RAX,(%RSI) |
(3671) 0x4c085a LEA (%R10,%RDX,8),%RSI |
(3671) 0x4c085e ADD (%RSI),%RCX |
(3671) 0x4c0861 MOV %RCX,(%RSI) |
(3671) 0x4c0864 INC %RDX |
(3671) 0x4c0867 CMP %RDX,%RDI |
(3671) 0x4c086a JNE 4c0850 |
0x4c086c MOV -0x8(%R11,%RDI,8),%RDX |
0x4c0871 MOV -0x8(%R10,%RDI,8),%RCX |
0x4c0876 MOV %RCX,-0x68(%RBP) |
0x4c087a MOV -0x130(%RBP),%RBX |
0x4c0881 MOV -0x98(%RBP),%RAX |
0x4c0888 MOV %RDX,(%RAX,%RBX,8) |
0x4c088c MOV -0xa0(%RBP),%RAX |
0x4c0893 MOV %RCX,(%RAX,%RBX,8) |
0x4c0897 MOV %RBX,%RDI |
0x4c089a MOV %RBX,%RSI |
0x4c089d CALL 4da400 <hypre_CSRMatrixCreate> |
0x4c08a2 MOV %RAX,%R13 |
0x4c08a5 MOV -0x128(%RBP),%RAX |
0x4c08ac MOV %R13,(%RAX) |
0x4c08af MOV %RBX,%RDI |
0x4c08b2 MOV -0x70(%RBP),%RSI |
0x4c08b6 MOV -0x68(%RBP),%RDX |
0x4c08ba CALL 4da400 <hypre_CSRMatrixCreate> |
0x4c08bf MOV %RAX,%RBX |
0x4c08c2 MOV -0x120(%RBP),%RAX |
0x4c08c9 MOV %RBX,(%RAX) |
0x4c08cc MOV -0x98(%RBP),%RAX |
0x4c08d3 MOV %RAX,(%R13) |
0x4c08d7 MOV %R13,%RDI |
0x4c08da CALL 4da4e0 <hypre_CSRMatrixInitialize> |
0x4c08df MOV 0x8(%R13),%RAX |
0x4c08e3 MOV -0xe8(%RBP),%RCX |
0x4c08ea MOV %RAX,(%RCX) |
0x4c08ed MOV 0x30(%R13),%RAX |
0x4c08f1 MOV -0xe0(%RBP),%RCX |
0x4c08f8 MOV %RAX,(%RCX) |
0x4c08fb MOV -0xa0(%RBP),%RAX |
0x4c0902 MOV %RAX,(%RBX) |
0x4c0905 MOV %RBX,%RDI |
0x4c0908 CALL 4da4e0 <hypre_CSRMatrixInitialize> |
0x4c090d MOV 0x8(%RBX),%RAX |
0x4c0911 MOV -0xf0(%RBP),%RCX |
0x4c0918 MOV %RAX,(%RCX) |
0x4c091b MOV 0x30(%RBX),%RAX |
0x4c091f MOV -0xd8(%RBP),%RCX |
0x4c0926 MOV %RAX,(%RCX) |
0x4c0929 MOV -0xb8(%RBP),%RAX |
0x4c0930 MOV (%RAX),%ESI |
0x4c0932 MOV $0x736290,%EDI |
0x4c0937 CALL 410030 <__kmpc_barrier@plt> |
0x4c093c MOV -0xf8(%RBP),%RDX |
0x4c0943 TEST %RDX,%RDX |
0x4c0946 JLE 4c0959 |
0x4c0948 SAL $0x3,%RDX |
0x4c094c MOV %R14,%RDI |
0x4c094f MOV $0xff,%ESI |
0x4c0954 CALL 4efbb0 <_intel_fast_memset> |
0x4c0959 MOV -0x70(%RBP),%RDX |
0x4c095d TEST %RDX,%RDX |
0x4c0960 JLE 4c0973 |
0x4c0962 SAL $0x3,%RDX |
0x4c0966 MOV %R12,%RDI |
0x4c0969 MOV $0xff,%ESI |
0x4c096e CALL 4efbb0 <_intel_fast_memset> |
0x4c0973 MOV -0xd0(%RBP),%RDX |
0x4c097a TEST %RDX,%RDX |
0x4c097d JE 4c09a9 |
0x4c097f MOV -0xc0(%RBP),%RAX |
0x4c0986 MOV -0x8(%RAX,%RDX,8),%RAX |
0x4c098b MOV -0xc8(%RBP),%RCX |
0x4c0992 MOV -0x8(%RCX,%RDX,8),%RCX |
0x4c0997 MOV -0x60(%RBP),%RDX |
0x4c099b MOV -0x40(%RBP),%RSI |
0x4c099f CMP %RDX,%RSI |
0x4c09a2 JL 4c09be |
0x4c09a4 JMP 4c0def |
0x4c09a9 XOR %EAX,%EAX |
0x4c09ab XOR %ECX,%ECX |
0x4c09ad MOV -0x60(%RBP),%RDX |
0x4c09b1 MOV -0x40(%RBP),%RSI |
0x4c09b5 CMP %RDX,%RSI |
0x4c09b8 JGE 4c0def |
0x4c09be MOV %R12,-0x90(%RBP) |
0x4c09c5 JMP 4c09e8 |
0x4c09c7 NOPW (%RAX,%RAX,1) |
(3661) 0x4c09d0 MOV -0x90(%RBP),%R12 |
(3661) 0x4c09d7 MOV -0x60(%RBP),%RDX |
(3661) 0x4c09db MOV -0x40(%RBP),%RSI |
(3661) 0x4c09df CMP %RDX,%RSI |
(3661) 0x4c09e2 JGE 4c0def |
(3661) 0x4c09e8 MOV %RSI,%RDX |
(3661) 0x4c09eb MOV -0x98(%RBP),%RSI |
(3661) 0x4c09f2 MOV %RAX,(%RSI,%RDX,8) |
(3661) 0x4c09f6 MOV -0xa0(%RBP),%RSI |
(3661) 0x4c09fd MOV %RCX,(%RSI,%RDX,8) |
(3661) 0x4c0a01 MOV -0x78(%RBP),%R8 |
(3661) 0x4c0a05 MOV (%R8,%RDX,8),%RSI |
(3661) 0x4c0a09 LEA 0x1(%RDX),%RDI |
(3661) 0x4c0a0d MOV %RDI,-0x40(%RBP) |
(3661) 0x4c0a11 CMP 0x8(%R8,%RDX,8),%RSI |
(3661) 0x4c0a16 JGE 4c0b00 |
(3661) 0x4c0a1c MOV -0xe8(%RBP),%RDI |
(3661) 0x4c0a23 MOV (%RDI),%RDI |
(3661) 0x4c0a26 MOV -0xe0(%RBP),%R8 |
(3661) 0x4c0a2d MOV (%R8),%R8 |
(3661) 0x4c0a30 MOV -0x138(%RBP),%R10 |
(3661) 0x4c0a37 MOV -0x100(%RBP),%R14 |
(3661) 0x4c0a3e MOV -0x78(%RBP),%RBX |
(3661) 0x4c0a42 MOV -0x40(%RBP),%R13 |
(3661) 0x4c0a46 MOV -0x30(%RBP),%R11 |
(3661) 0x4c0a4a NOPW (%RAX,%RAX,1) |
(3668) 0x4c0a50 MOV (%R14,%RSI,8),%R9 |
(3668) 0x4c0a54 MOV %R9,(%RDI,%RAX,8) |
(3668) 0x4c0a58 VMOVQ (%R10,%RSI,8),%XMM0 |
(3668) 0x4c0a5e VMOVQ %XMM0,(%R8,%RAX,8) |
(3668) 0x4c0a64 MOV %RAX,(%R11,%R9,8) |
(3668) 0x4c0a68 INC %RAX |
(3668) 0x4c0a6b INC %RSI |
(3668) 0x4c0a6e CMP (%RBX,%R13,8),%RSI |
(3668) 0x4c0a72 JL 4c0a50 |
(3661) 0x4c0a74 MOV -0x88(%RBP),%RDI |
(3661) 0x4c0a7b MOV (%RDI,%RDX,8),%RSI |
(3661) 0x4c0a7f CMP (%RDI,%R13,8),%RSI |
(3661) 0x4c0a83 JGE 4c0b19 |
(3661) 0x4c0a89 MOV -0xf0(%RBP),%RDI |
(3661) 0x4c0a90 MOV (%RDI),%RDI |
(3661) 0x4c0a93 MOV -0xd8(%RBP),%R8 |
(3661) 0x4c0a9a MOV (%R8),%R8 |
(3661) 0x4c0a9d MOV -0x30(%RBP),%R14 |
(3661) 0x4c0aa1 MOV -0x80(%RBP),%R13 |
(3661) 0x4c0aa5 MOV -0x38(%RBP),%R11 |
(3661) 0x4c0aa9 MOV -0x40(%RBP),%R10 |
(3661) 0x4c0aad MOV -0x88(%RBP),%RBX |
(3661) 0x4c0ab4 MOV -0x58(%RBP),%R12 |
(3661) 0x4c0ab8 MOV -0x90(%RBP),%R15 |
(3661) 0x4c0abf NOP |
(3660) 0x4c0ac0 MOV (%R12,%RSI,8),%R9 |
(3660) 0x4c0ac4 MOV %R9,(%RDI,%RCX,8) |
(3660) 0x4c0ac8 VMOVQ (%R13,%RSI,8),%XMM0 |
(3660) 0x4c0acf VMOVQ %XMM0,(%R8,%RCX,8) |
(3660) 0x4c0ad5 MOV %RCX,(%R15,%R9,8) |
(3660) 0x4c0ad9 INC %RCX |
(3660) 0x4c0adc INC %RSI |
(3660) 0x4c0adf CMP (%RBX,%R10,8),%RSI |
(3660) 0x4c0ae3 JL 4c0ac0 |
(3661) 0x4c0ae5 MOV -0x48(%RBP),%RBX |
(3661) 0x4c0ae9 TEST %RBX,%RBX |
(3661) 0x4c0aec JG 4c0b2e |
(3661) 0x4c0aee JMP 4c09d0 |
0x4c0af3 NOPW %CS:(%RAX,%RAX,1) |
(3661) 0x4c0b00 MOV -0x40(%RBP),%R13 |
(3661) 0x4c0b04 MOV -0x88(%RBP),%RDI |
(3661) 0x4c0b0b MOV (%RDI,%RDX,8),%RSI |
(3661) 0x4c0b0f CMP (%RDI,%R13,8),%RSI |
(3661) 0x4c0b13 JL 4c0a89 |
(3661) 0x4c0b19 MOV -0x30(%RBP),%R14 |
(3661) 0x4c0b1d MOV -0x38(%RBP),%R11 |
(3661) 0x4c0b21 MOV -0x48(%RBP),%RBX |
(3661) 0x4c0b25 TEST %RBX,%RBX |
(3661) 0x4c0b28 JLE 4c09d0 |
(3661) 0x4c0b2e VPBROADCASTQ %RDX,%YMM0 |
(3661) 0x4c0b34 XOR %ESI,%ESI |
(3661) 0x4c0b36 MOV -0x58(%RBP),%R10 |
(3661) 0x4c0b3a MOV -0x50(%RBP),%R15 |
(3661) 0x4c0b3e JMP 4c0b56 |
(3662) 0x4c0b40 MOV %R12,%R10 |
(3662) 0x4c0b43 MOV -0x90(%RBP),%R12 |
(3662) 0x4c0b4a INC %RSI |
(3662) 0x4c0b4d CMP %RBX,%RSI |
(3662) 0x4c0b50 JE 4c09d7 |
(3662) 0x4c0b56 MOV %R10,%R12 |
(3662) 0x4c0b59 MOV (%R11,%RSI,8),%R9 |
(3662) 0x4c0b5d MOV 0x8(%R11,%RSI,8),%R8 |
(3662) 0x4c0b62 MOV %R8,%R10 |
(3662) 0x4c0b65 SUB %R9,%R10 |
(3662) 0x4c0b68 JLE 4c0b40 |
(3662) 0x4c0b6a LEA (%R15,%R9,8),%EDI |
(3662) 0x4c0b6e AND $0x7f,%EDI |
(3662) 0x4c0b71 MOV $0x80,%EBX |
(3662) 0x4c0b76 SUB %EDI,%EBX |
(3662) 0x4c0b78 SHR $0x3,%EBX |
(3662) 0x4c0b7b CMP %RBX,%R10 |
(3662) 0x4c0b7e MOV %RBX,%R11 |
(3662) 0x4c0b81 CMOVB %R10,%R11 |
(3662) 0x4c0b85 TEST %R11,%R11 |
(3662) 0x4c0b88 MOV -0x90(%RBP),%R12 |
(3662) 0x4c0b8f JE 4c0bb2 |
(3662) 0x4c0b91 MOV %R9,%RDI |
(3662) 0x4c0b94 MOV %R11,%R14 |
(3662) 0x4c0b97 NOPW (%RAX,%RAX,1) |
(3667) 0x4c0ba0 CMP %RDX,(%R15,%RDI,8) |
(3667) 0x4c0ba4 JE 4c0cae |
(3667) 0x4c0baa INC %RDI |
(3667) 0x4c0bad DEC %R14 |
(3667) 0x4c0bb0 JNE 4c0ba0 |
(3662) 0x4c0bb2 CMP %R10,%RBX |
(3662) 0x4c0bb5 JAE 4c0c34 |
(3662) 0x4c0bb7 SUB %R11,%R10 |
(3662) 0x4c0bba MOV %R10,%RBX |
(3662) 0x4c0bbd AND $-0x10,%RBX |
(3662) 0x4c0bc1 JE 4c0c16 |
(3662) 0x4c0bc3 LEA -0x1(%RBX),%R13 |
(3662) 0x4c0bc7 LEA (%R9,%R11,1),%RDI |
(3662) 0x4c0bcb MOV -0x50(%RBP),%R14 |
(3662) 0x4c0bcf LEA (%R14,%RDI,8),%R15 |
(3662) 0x4c0bd3 XOR %R14D,%R14D |
(3662) 0x4c0bd6 NOPW %CS:(%RAX,%RAX,1) |
(3666) 0x4c0be0 VPCMPEQQ 0x20(%R15,%R14,8),%YMM0,%K0 |
(3666) 0x4c0be8 VPCMPEQQ (%R15,%R14,8),%YMM0,%K1 |
(3666) 0x4c0bef VPCMPEQQ 0x60(%R15,%R14,8),%YMM0,%K2 |
(3666) 0x4c0bf7 VPCMPEQQ 0x40(%R15,%R14,8),%YMM0,%K3 |
(3666) 0x4c0bff KORB %K0,%K1,%K4 |
(3666) 0x4c0c03 KORB %K2,%K3,%K5 |
(3666) 0x4c0c07 KORTESTB %K5,%K4 |
(3666) 0x4c0c0b JNE 4c0c83 |
(3666) 0x4c0c0d ADD $0x10,%R14 |
(3666) 0x4c0c11 CMP %R13,%R14 |
(3666) 0x4c0c14 JBE 4c0be0 |
(3662) 0x4c0c16 CMP %R10,%RBX |
(3662) 0x4c0c19 JNE 4c0c49 |
(3662) 0x4c0c1b MOV -0x48(%RBP),%RBX |
(3662) 0x4c0c1f MOV -0x50(%RBP),%R15 |
(3662) 0x4c0c23 MOV -0x38(%RBP),%R11 |
(3662) 0x4c0c27 MOV -0x58(%RBP),%R10 |
(3662) 0x4c0c2b MOV -0x30(%RBP),%R14 |
(3662) 0x4c0c2f JMP 4c0b4a |
(3662) 0x4c0c34 MOV -0x38(%RBP),%R11 |
(3662) 0x4c0c38 MOV -0x58(%RBP),%R10 |
(3662) 0x4c0c3c MOV -0x30(%RBP),%R14 |
(3662) 0x4c0c40 MOV -0x48(%RBP),%RBX |
(3662) 0x4c0c44 JMP 4c0b4a |
(3662) 0x4c0c49 ADD %R11,%R9 |
(3662) 0x4c0c4c ADD %RBX,%R9 |
(3662) 0x4c0c4f MOV %R9,%RDI |
(3662) 0x4c0c52 MOV -0x48(%RBP),%RBX |
(3662) 0x4c0c56 MOV -0x50(%RBP),%R15 |
(3662) 0x4c0c5a MOV -0x38(%RBP),%R11 |
(3662) 0x4c0c5e MOV -0x58(%RBP),%R10 |
(3662) 0x4c0c62 MOV -0x30(%RBP),%R14 |
(3662) 0x4c0c66 NOPW %CS:(%RAX,%RAX,1) |
(3665) 0x4c0c70 CMP %RDX,(%R15,%RDI,8) |
(3665) 0x4c0c74 JE 4c0cb2 |
(3665) 0x4c0c76 INC %RDI |
(3665) 0x4c0c79 CMP %RDI,%R8 |
(3665) 0x4c0c7c JNE 4c0c70 |
(3662) 0x4c0c7e JMP 4c0b4a |
(3662) 0x4c0c83 KSHIFTLB $0x4,%K0,%K0 |
(3662) 0x4c0c89 KORB %K0,%K1,%K0 |
(3662) 0x4c0c8d KSHIFTLB $0x4,%K2,%K1 |
(3662) 0x4c0c93 KORB %K1,%K3,%K1 |
(3662) 0x4c0c97 KUNPCKBW %K0,%K1,%K0 |
(3662) 0x4c0c9b KMOVD %K0,%R8D |
(3662) 0x4c0c9f TZCNT %R8D,%R8D |
(3662) 0x4c0ca4 ADD %R14,%RDI |
(3662) 0x4c0ca7 ADD %R8,%RDI |
(3662) 0x4c0caa MOV -0x50(%RBP),%R15 |
(3662) 0x4c0cae MOV -0x30(%RBP),%R14 |
(3662) 0x4c0cb2 MOV -0xa8(%RBP),%R9 |
(3662) 0x4c0cb9 MOV (%R9,%RDI,8),%R8 |
(3662) 0x4c0cbd MOV 0x8(%R9,%RDI,8),%R10 |
(3662) 0x4c0cc2 CMP %R10,%R8 |
(3662) 0x4c0cc5 JGE 4c0d4e |
(3662) 0x4c0ccb MOV -0xe0(%RBP),%R9 |
(3662) 0x4c0cd2 MOV (%R9),%R9 |
(3662) 0x4c0cd5 JMP 4c0cf4 |
0x4c0cd7 NOPW (%RAX,%RAX,1) |
(3664) 0x4c0ce0 VADDSD (%R9,%RBX,8),%XMM1,%XMM1 |
(3664) 0x4c0ce6 VMOVSD %XMM1,(%R9,%RBX,8) |
(3664) 0x4c0cec INC %R8 |
(3664) 0x4c0cef CMP %R10,%R8 |
(3664) 0x4c0cf2 JGE 4c0d4e |
(3664) 0x4c0cf4 MOV -0x108(%RBP),%R11 |
(3664) 0x4c0cfb MOV (%R11,%R8,8),%R11 |
(3664) 0x4c0cff MOV (%R14,%R11,8),%RBX |
(3664) 0x4c0d03 MOV -0x140(%RBP),%R13 |
(3664) 0x4c0d0a VMOVSD (%R13,%R8,8),%XMM1 |
(3664) 0x4c0d11 MOV -0x98(%RBP),%R13 |
(3664) 0x4c0d18 CMP (%R13,%RDX,8),%RBX |
(3664) 0x4c0d1d JGE 4c0ce0 |
(3664) 0x4c0d1f MOV -0xe8(%RBP),%R10 |
(3664) 0x4c0d26 MOV (%R10),%R10 |
(3664) 0x4c0d29 MOV %R11,(%R10,%RAX,8) |
(3664) 0x4c0d2d VMOVSD %XMM1,(%R9,%RAX,8) |
(3664) 0x4c0d33 MOV %RAX,(%R14,%R11,8) |
(3664) 0x4c0d37 INC %RAX |
(3664) 0x4c0d3a MOV -0xa8(%RBP),%R10 |
(3664) 0x4c0d41 MOV 0x8(%R10,%RDI,8),%R10 |
(3664) 0x4c0d46 INC %R8 |
(3664) 0x4c0d49 CMP %R10,%R8 |
(3664) 0x4c0d4c JL 4c0cf4 |
(3662) 0x4c0d4e MOV -0xb0(%RBP),%R9 |
(3662) 0x4c0d55 MOV (%R9,%RDI,8),%R8 |
(3662) 0x4c0d59 MOV 0x8(%R9,%RDI,8),%R10 |
(3662) 0x4c0d5e CMP %R10,%R8 |
(3662) 0x4c0d61 JGE 4c0dde |
(3662) 0x4c0d63 MOV -0xd8(%RBP),%R9 |
(3662) 0x4c0d6a MOV (%R9),%R9 |
(3662) 0x4c0d6d JMP 4c0d84 |
0x4c0d6f NOP |
(3663) 0x4c0d70 VADDSD (%R9,%RBX,8),%XMM1,%XMM1 |
(3663) 0x4c0d76 VMOVSD %XMM1,(%R9,%RBX,8) |
(3663) 0x4c0d7c INC %R8 |
(3663) 0x4c0d7f CMP %R10,%R8 |
(3663) 0x4c0d82 JGE 4c0dde |
(3663) 0x4c0d84 MOV -0x110(%RBP),%R11 |
(3663) 0x4c0d8b MOV (%R11,%R8,8),%R11 |
(3663) 0x4c0d8f MOV (%R12,%R11,8),%RBX |
(3663) 0x4c0d93 MOV -0x148(%RBP),%R13 |
(3663) 0x4c0d9a VMOVSD (%R13,%R8,8),%XMM1 |
(3663) 0x4c0da1 MOV -0xa0(%RBP),%R13 |
(3663) 0x4c0da8 CMP (%R13,%RDX,8),%RBX |
(3663) 0x4c0dad JGE 4c0d70 |
(3663) 0x4c0daf MOV -0xf0(%RBP),%R10 |
(3663) 0x4c0db6 MOV (%R10),%R10 |
(3663) 0x4c0db9 MOV %R11,(%R10,%RCX,8) |
(3663) 0x4c0dbd VMOVSD %XMM1,(%R9,%RCX,8) |
(3663) 0x4c0dc3 MOV %RCX,(%R12,%R11,8) |
(3663) 0x4c0dc7 INC %RCX |
(3663) 0x4c0dca MOV -0xb0(%RBP),%R10 |
(3663) 0x4c0dd1 MOV 0x8(%R10,%RDI,8),%R10 |
(3663) 0x4c0dd6 INC %R8 |
(3663) 0x4c0dd9 CMP %R10,%R8 |
(3663) 0x4c0ddc JL 4c0d84 |
(3662) 0x4c0dde MOV -0x58(%RBP),%R10 |
(3662) 0x4c0de2 MOV -0x48(%RBP),%RBX |
(3662) 0x4c0de6 MOV -0x38(%RBP),%R11 |
(3662) 0x4c0dea JMP 4c0b4a |
0x4c0def MOV %R14,%RDI |
0x4c0df2 VZEROUPPER |
0x4c0df5 CALL 4e6a60 <hypre_Free> |
0x4c0dfa MOV %R12,%RDI |
0x4c0dfd ADD $0x128,%RSP |
0x4c0e04 POP %RBX |
0x4c0e05 POP %R12 |
0x4c0e07 POP %R13 |
0x4c0e09 POP %R14 |
0x4c0e0b POP %R15 |
0x4c0e0d POP %RBP |
0x4c0e0e JMP 4e6a60 |
0x4c0e13 NOPW %CS:(%RAX,%RAX,1) |
0x4c0e1d NOPL (%RAX) |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►100.00+ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Path / |
Source file and lines | par_csr_matop.c:3454-3640 |
Module | exec |
nb instructions | 286 |
nb uops | 310 |
loop length | 1286 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 60 |
micro-operation queue | 51.67 cycles |
front end | 51.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 13.50 | 13.40 | 27.67 | 27.67 | 34.50 | 13.40 | 13.30 | 34.50 | 34.50 | 34.50 | 13.40 | 27.67 |
cycles | 13.50 | 16.00 | 27.67 | 27.67 | 34.50 | 13.40 | 13.30 | 34.50 | 34.50 | 34.50 | 13.40 | 27.67 |
Cycles executing div or sqrt instructions | 16.00 |
FE+BE cycles | 48.51-48.56 |
Stall cycles | 0.00 |
Front-end | 51.67 |
Dispatch | 34.50 |
DIV/SQRT | 16.00 |
Overall L1 | 51.67 |
all | 2% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 5% |
all | 12% |
load | 11% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 11% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x128,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x128(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0xf8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xb8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xb0(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x98(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x90(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x88(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xd8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x80(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x78(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x70(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x68(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x60(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x100(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x148(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x110(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x140(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x108(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x120(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x18(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xe8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 4e86b0 <hypre_NumActiveThreads> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %RCX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R15,-0x130(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x118(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 4c02e7 <hypre_ParTMatmul.extracted+0x167> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %RCX | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 4c02f4 <hypre_ParTMatmul.extracted+0x174> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %R15D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %ECX | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV %EDX,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %EAX,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4e86c0 <hypre_GetThreadNum> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x1(%RAX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RCX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %R15,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R12,-0x138(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4c032b <hypre_ParTMatmul.extracted+0x1ab> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INC %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %RAX,%R14 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R14,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RDX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c033d <hypre_ParTMatmul.extracted+0x1bd> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
IMUL %RAX,%R14 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R14,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %R15,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x50(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0xf8(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4e6980 <hypre_CAlloc> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x70(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 4e6980 <hypre_CAlloc> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R12,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
TEST %RCX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4c0386 <hypre_ParTMatmul.extracted+0x206> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (,%RCX,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4efbb0 <_intel_fast_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x70(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4c03a4 <hypre_ParTMatmul.extracted+0x224> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (,%RAX,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4efbb0 <_intel_fast_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP -0x60(%RBP),%RAX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV %RBX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x38(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4c06de <hypre_ParTMatmul.extracted+0x55e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x40(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4c03fe <hypre_ParTMatmul.extracted+0x27e> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0xb8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x736270,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 410030 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0xb8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMPQ $0,-0xd0(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JNE 4c0930 <hypre_ParTMatmul.extracted+0x7b0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x118(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x1,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0xc8(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xc0(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4c086c <hypre_ParTMatmul.extracted+0x6ec> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RDI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R11,%RAX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R10,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4c0791 <hypre_ParTMatmul.extracted+0x611> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R10,%RAX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R11,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4c0791 <hypre_ParTMatmul.extracted+0x611> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R10,%RDI,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R11,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JBE 4c083e <hypre_ParTMatmul.extracted+0x6be> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R11,%RDI,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R10,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JBE 4c083e <hypre_ParTMatmul.extracted+0x6be> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x1,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4c086c <hypre_ParTMatmul.extracted+0x6ec> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP $0x5,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4c07fd <hypre_ParTMatmul.extracted+0x67d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x2,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV (%R11),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x20,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JE 4c086c <hypre_ParTMatmul.extracted+0x6ec> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R11,%RCX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10,%RCX,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
INC %RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4c086c <hypre_ParTMatmul.extracted+0x6ec> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV (%R11),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x8(%R11,%RDI,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%R10,%RDI,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x130(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x98(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,(%RAX,%RBX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,(%RAX,%RBX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RBX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4da400 <hypre_CSRMatrixCreate> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x128(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,(%RAX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x70(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x68(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 4da400 <hypre_CSRMatrixCreate> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x120(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,(%RAX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x98(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%R13) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4da4e0 <hypre_CSRMatrixInitialize> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x8(%R13),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xe8(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%R13),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xe0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RBX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4da4e0 <hypre_CSRMatrixInitialize> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x8(%RBX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xf0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RBX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xd8(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xb8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x736290,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 410030 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0xf8(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4c0959 <hypre_ParTMatmul.extracted+0x7d9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4efbb0 <_intel_fast_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x70(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4c0973 <hypre_ParTMatmul.extracted+0x7f3> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4efbb0 <_intel_fast_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0xd0(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 4c09a9 <hypre_ParTMatmul.extracted+0x829> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xc0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%RAX,%RDX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xc8(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%RCX,%RDX,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x60(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x40(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 4c09be <hypre_ParTMatmul.extracted+0x83e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4c0def <hypre_ParTMatmul.extracted+0xc6f> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x60(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x40(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c0def <hypre_ParTMatmul.extracted+0xc6f> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c09e8 <hypre_ParTMatmul.extracted+0x868> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4e6a60 <hypre_Free> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
ADD $0x128,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
JMP 4e6a60 <hypre_Free> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | par_csr_matop.c:3454-3640 |
Module | exec |
nb instructions | 286 |
nb uops | 310 |
loop length | 1286 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 60 |
micro-operation queue | 51.67 cycles |
front end | 51.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 13.50 | 13.40 | 27.67 | 27.67 | 34.50 | 13.40 | 13.30 | 34.50 | 34.50 | 34.50 | 13.40 | 27.67 |
cycles | 13.50 | 16.00 | 27.67 | 27.67 | 34.50 | 13.40 | 13.30 | 34.50 | 34.50 | 34.50 | 13.40 | 27.67 |
Cycles executing div or sqrt instructions | 16.00 |
FE+BE cycles | 48.51-48.56 |
Stall cycles | 0.00 |
Front-end | 51.67 |
Dispatch | 34.50 |
DIV/SQRT | 16.00 |
Overall L1 | 51.67 |
all | 2% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 5% |
all | 12% |
load | 11% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 11% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x128,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x128(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0xf8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xb8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xb0(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x98(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x90(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x88(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xd8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x80(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x78(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x70(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x68(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x60(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x100(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x148(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x110(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x140(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x108(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x120(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x18(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xe8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 4e86b0 <hypre_NumActiveThreads> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %RCX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R15,-0x130(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x118(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 4c02e7 <hypre_ParTMatmul.extracted+0x167> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %RCX | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 4c02f4 <hypre_ParTMatmul.extracted+0x174> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %R15D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %ECX | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV %EDX,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %EAX,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4e86c0 <hypre_GetThreadNum> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x1(%RAX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RCX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %R15,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R12,-0x138(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4c032b <hypre_ParTMatmul.extracted+0x1ab> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INC %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %RAX,%R14 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R14,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RDX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c033d <hypre_ParTMatmul.extracted+0x1bd> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
IMUL %RAX,%R14 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R14,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %R15,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x50(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0xf8(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4e6980 <hypre_CAlloc> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x70(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 4e6980 <hypre_CAlloc> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R12,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
TEST %RCX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4c0386 <hypre_ParTMatmul.extracted+0x206> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (,%RCX,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4efbb0 <_intel_fast_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x70(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4c03a4 <hypre_ParTMatmul.extracted+0x224> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (,%RAX,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4efbb0 <_intel_fast_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP -0x60(%RBP),%RAX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV %RBX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x38(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4c06de <hypre_ParTMatmul.extracted+0x55e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x40(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4c03fe <hypre_ParTMatmul.extracted+0x27e> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0xb8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x736270,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 410030 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0xb8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMPQ $0,-0xd0(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JNE 4c0930 <hypre_ParTMatmul.extracted+0x7b0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x118(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x1,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0xc8(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xc0(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4c086c <hypre_ParTMatmul.extracted+0x6ec> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RDI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R11,%RAX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R10,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4c0791 <hypre_ParTMatmul.extracted+0x611> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R10,%RAX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R11,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4c0791 <hypre_ParTMatmul.extracted+0x611> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R10,%RDI,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R11,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JBE 4c083e <hypre_ParTMatmul.extracted+0x6be> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R11,%RDI,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R10,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JBE 4c083e <hypre_ParTMatmul.extracted+0x6be> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x1,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4c086c <hypre_ParTMatmul.extracted+0x6ec> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP $0x5,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4c07fd <hypre_ParTMatmul.extracted+0x67d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x2,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV (%R11),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x20,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JE 4c086c <hypre_ParTMatmul.extracted+0x6ec> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R11,%RCX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10,%RCX,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
INC %RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4c086c <hypre_ParTMatmul.extracted+0x6ec> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV (%R11),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x8(%R11,%RDI,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%R10,%RDI,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x130(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x98(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,(%RAX,%RBX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,(%RAX,%RBX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RBX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4da400 <hypre_CSRMatrixCreate> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x128(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,(%RAX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x70(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x68(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 4da400 <hypre_CSRMatrixCreate> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x120(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,(%RAX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x98(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%R13) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4da4e0 <hypre_CSRMatrixInitialize> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x8(%R13),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xe8(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%R13),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xe0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RBX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4da4e0 <hypre_CSRMatrixInitialize> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x8(%RBX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xf0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RBX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xd8(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xb8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x736290,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 410030 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0xf8(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4c0959 <hypre_ParTMatmul.extracted+0x7d9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4efbb0 <_intel_fast_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x70(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4c0973 <hypre_ParTMatmul.extracted+0x7f3> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4efbb0 <_intel_fast_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0xd0(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 4c09a9 <hypre_ParTMatmul.extracted+0x829> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xc0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%RAX,%RDX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xc8(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%RCX,%RDX,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x60(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x40(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 4c09be <hypre_ParTMatmul.extracted+0x83e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4c0def <hypre_ParTMatmul.extracted+0xc6f> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x60(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x40(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c0def <hypre_ParTMatmul.extracted+0xc6f> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c09e8 <hypre_ParTMatmul.extracted+0x868> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4e6a60 <hypre_Free> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
ADD $0x128,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
JMP 4e6a60 <hypre_Free> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_ParTMatmul.extracted– | 0.05 | 0.01 |
○Loop 3670 - par_csr_matop.c:3537-3540 - exec | 0 | 0 |
○Loop 3672 - par_csr_matop.c:3537-3540 - exec | 0 | 0 |
○Loop 3671 - par_csr_matop.c:3537-3540 - exec | 0 | 0 |
○Loop 3669 - par_csr_matop.c:3537-3540 - exec | 0 | 0 |
▼Loop 3661 - par_csr_matop.c:3467-3634 - exec– | 0 | 0.01 |
○Loop 3668 - par_csr_matop.c:3590-3596 - exec | 0.01 | 0.01 |
▼Loop 3662 - par_csr_matop.c:3467-3634 - exec– | 0 | 0 |
○Loop 3666 - par_csr_matop.c:3505-3608 - exec | 0.01 | 0.01 |
○Loop 3665 - par_csr_matop.c:3607-3608 - exec | 0 | 0 |
○Loop 3663 - par_csr_matop.c:3623-3634 - exec | 0 | 0 |
○Loop 3667 - par_csr_matop.c:3607-3608 - exec | 0 | 0 |
○Loop 3664 - par_csr_matop.c:3610-3621 - exec | 0 | 0 |
○Loop 3660 - par_csr_matop.c:3598-3604 - exec | 0 | 0 |
▼Loop 3674 - par_csr_matop.c:3467-3528 - exec– | 0 | 0 |
○Loop 3681 - par_csr_matop.c:3491-3495 - exec | 0.01 | 0.01 |
▼Loop 3675 - par_csr_matop.c:3467-3522 - exec– | 0 | 0 |
○Loop 3679 - par_csr_matop.c:3504-3505 - exec | 0.02 | 0.01 |
○Loop 3678 - par_csr_matop.c:3504-3505 - exec | 0 | 0 |
○Loop 3676 - par_csr_matop.c:3516-3522 - exec | 0 | 0 |
○Loop 3680 - par_csr_matop.c:3504-3505 - exec | 0 | 0 |
○Loop 3677 - par_csr_matop.c:3507-3513 - exec | 0 | 0 |
○Loop 3673 - par_csr_matop.c:3497-3501 - exec | 0 | 0 |