Function: hypre_IJMatrixSetValuesOMPParCSR.extracted.28 | Module: libIJ_mv.so | Source: IJMatrix_parcsr.c:3240-3484 [...] | Coverage: 1.21% |
---|
Function: hypre_IJMatrixSetValuesOMPParCSR.extracted.28 | Module: libIJ_mv.so | Source: IJMatrix_parcsr.c:3240-3484 [...] | Coverage: 1.21% |
---|
/home/eoseret/qaas_runs_CPU_9468/172-019-1763/intel/AMG/build/AMG/AMG/IJ_mv/IJMatrix_parcsr.c: 3240 - 3484 |
-------------------------------------------------------------------------------- |
3240: #pragma omp parallel |
[...] |
3256: num_threads = hypre_NumActiveThreads(); |
3257: my_thread_num = hypre_GetThreadNum(); |
3258: |
3259: len = nrows/num_threads; |
3260: rest = nrows - len*num_threads; |
3261: |
3262: if (my_thread_num < rest) |
3263: { |
3264: ns = my_thread_num*(len+1); |
3265: ne = (my_thread_num+1)*(len+1); |
3266: } |
3267: else |
3268: { |
3269: ns = my_thread_num*len+rest; |
3270: ne = (my_thread_num+1)*len+rest; |
3271: } |
3272: |
3273: value_start[my_thread_num] = 0; |
3274: for (ii=ns; ii < ne; ii++) |
3275: value_start[my_thread_num] += ncols[ii]; |
3276: |
3277: #ifdef HYPRE_USING_OPENMP |
3278: #pragma omp barrier |
3279: #endif |
3280: if (my_thread_num == 0) |
3281: { |
3282: for (i=0; i < max_num_threads; i++) |
3283: value_start[i+1] += value_start[i]; |
[...] |
3289: if (my_thread_num) |
3290: indx = value_start[my_thread_num-1]; |
3291: for (ii=ns; ii < ne; ii++) |
3292: { |
3293: row = rows[ii]; |
3294: n = ncols[ii]; |
3295: /* processor owns the row */ |
3296: if (row >= row_partitioning[pstart] && row < row_partitioning[pstart+1]) |
3297: { |
3298: row_local = row - row_partitioning[pstart]; |
3299: /* compute local row number */ |
3300: if (need_aux) |
3301: { |
3302: local_j = aux_j[row_local]; |
3303: local_data = aux_data[row_local]; |
3304: space = row_space[row_local]; |
3305: old_size = row_length[row_local]; |
3306: size = space - old_size; |
3307: if (size < n) |
3308: { |
3309: size = n - size; |
3310: tmp_j = hypre_CTAlloc(HYPRE_Int,size); |
3311: tmp_data = hypre_CTAlloc(HYPRE_Complex,size); |
3312: } |
3313: tmp_indx = 0; |
3314: not_found = 1; |
3315: size = old_size; |
3316: for (i=0; i < n; i++) |
3317: { |
3318: for (j=0; j < old_size; j++) |
3319: { |
3320: if (local_j[j] == cols[indx]) |
3321: { |
3322: local_data[j] = values[indx]; |
[...] |
3329: if (size < space) |
3330: { |
3331: local_j[size] = cols[indx]; |
3332: local_data[size++] = values[indx]; |
3333: } |
3334: else |
3335: { |
3336: tmp_j[tmp_indx] = cols[indx]; |
3337: tmp_data[tmp_indx++] = values[indx]; |
3338: } |
3339: } |
3340: not_found = 1; |
3341: indx++; |
3342: } |
3343: |
3344: row_length[row_local] = size+tmp_indx; |
3345: |
3346: if (tmp_indx) |
3347: { |
3348: aux_j[row_local] = hypre_TReAlloc(aux_j[row_local],HYPRE_Int, |
3349: size+tmp_indx); |
3350: aux_data[row_local] = hypre_TReAlloc(aux_data[row_local], |
3351: HYPRE_Complex,size+tmp_indx); |
3352: row_space[row_local] = size+tmp_indx; |
3353: local_j = aux_j[row_local]; |
[...] |
3359: for (i=0; i < tmp_indx; i++) |
3360: { |
3361: local_j[cnt] = tmp_j[i]; |
3362: local_data[cnt++] = tmp_data[i]; |
3363: } |
3364: |
3365: if (tmp_j) |
3366: { |
3367: hypre_TFree(tmp_j); |
3368: hypre_TFree(tmp_data); |
[...] |
3376: offd_indx = hypre_AuxParCSRMatrixIndxOffd(aux_matrix)[row_local]; |
3377: diag_indx = hypre_AuxParCSRMatrixIndxDiag(aux_matrix)[row_local]; |
3378: cnt_diag = diag_indx; |
3379: cnt_offd = offd_indx; |
3380: diag_space = diag_i[row_local+1]; |
3381: offd_space = offd_i[row_local+1]; |
3382: not_found = 1; |
3383: for (i=0; i < n; i++) |
3384: { |
3385: if (cols[indx] < col_0 || cols[indx] > col_n) |
3386: /* insert into offd */ |
3387: { |
3388: for (j=offd_i[row_local]; j < offd_indx; j++) |
3389: { |
3390: if (offd_j[j] == cols[indx]) |
3391: { |
3392: offd_data[j] = values[indx]; |
[...] |
3399: if (cnt_offd < offd_space) |
3400: { |
3401: offd_j[cnt_offd] = cols[indx]; |
3402: offd_data[cnt_offd++] = values[indx]; |
3403: } |
3404: else |
3405: { |
3406: hypre_error(HYPRE_ERROR_GENERIC); |
3407: #ifdef HYPRE_USING_OPENMP |
3408: #pragma omp atomic |
3409: #endif |
3410: error_flag++; |
3411: if (print_level) |
3412: hypre_printf("Error in row %d ! Too many elements!\n", |
[...] |
3422: for (j=diag_i[row_local]; j < diag_indx; j++) |
3423: { |
3424: if (diag_j[j] == cols[indx]) |
3425: { |
3426: diag_data[j] = values[indx]; |
[...] |
3433: if (cnt_diag < diag_space) |
3434: { |
3435: diag_j[cnt_diag] = cols[indx]; |
3436: diag_data[cnt_diag++] = values[indx]; |
3437: } |
3438: else |
3439: { |
3440: hypre_error(HYPRE_ERROR_GENERIC); |
3441: #ifdef HYPRE_USING_OPENMP |
3442: #pragma omp atomic |
3443: #endif |
3444: error_flag++; |
3445: if (print_level) |
3446: hypre_printf("Error in row %d ! Too many elements !\n", |
[...] |
3454: indx++; |
3455: } |
3456: |
3457: hypre_AuxParCSRMatrixIndxDiag(aux_matrix)[row_local] = cnt_diag; |
3458: hypre_AuxParCSRMatrixIndxOffd(aux_matrix)[row_local] = cnt_offd; |
[...] |
3466: indx += n; |
3467: if (aux_matrix) |
3468: { |
3469: col_indx = 0; |
3470: for (i=0; i < off_proc_i_indx; i=i+2) |
3471: { |
3472: row_len = off_proc_i[i+1]; |
3473: if (off_proc_i[i] == row) |
3474: { |
3475: for (j=0; j < n; j++) |
3476: { |
3477: cnt1 = col_indx; |
3478: for (k=0; k < row_len; k++) |
3479: { |
3480: if (off_proc_j[cnt1] == cols[j]) |
3481: { |
3482: off_proc_j[cnt1++] = -1; |
3483: /*cancel_indx++;*/ |
3484: offproc_cnt[my_thread_num]++; |
0xf440 PUSH %RBP |
0xf441 MOV %RSP,%RBP |
0xf444 PUSH %R15 |
0xf446 PUSH %R14 |
0xf448 PUSH %R13 |
0xf44a PUSH %R12 |
0xf44c PUSH %RBX |
0xf44d SUB $0x68,%RSP |
0xf451 MOV %R9,%RBX |
0xf454 MOV %R8,-0x88(%RBP) |
0xf45b MOV %RCX,-0x58(%RBP) |
0xf45f MOV %RDX,%R14 |
0xf462 MOV %RDI,%R13 |
0xf465 CALL 5440 <hypre_NumActiveThreads@plt> |
0xf46a MOV %RAX,%R15 |
0xf46d CALL 5160 <hypre_GetThreadNum@plt> |
0xf472 MOV %RAX,%R12 |
0xf475 MOV %R15,%RAX |
0xf478 OR %R14,%RAX |
0xf47b SHR $0x20,%RAX |
0xf47f JE f48b |
0xf481 MOV %R14,%RAX |
0xf484 CQTO |
0xf486 IDIV %R15 |
0xf489 JMP f493 |
0xf48b MOV %R14D,%EAX |
0xf48e XOR %EDX,%EDX |
0xf490 DIV %R15D |
0xf493 MOV 0xb8(%RBP),%R14 |
0xf49a LEA 0x1(%R12),%RCX |
0xf49f CMP %RDX,%R12 |
0xf4a2 MOV -0x58(%RBP),%R9 |
0xf4a6 JGE f4b9 |
0xf4a8 LEA 0x1(%RAX),%RSI |
0xf4ac MOV %RSI,%RDI |
0xf4af IMUL %R12,%RDI |
0xf4b3 IMUL %RCX,%RSI |
0xf4b7 JMP f4cd |
0xf4b9 MOV %RAX,%RDI |
0xf4bc IMUL %R12,%RDI |
0xf4c0 ADD %RDX,%RDI |
0xf4c3 IMUL %RAX,%RCX |
0xf4c7 ADD %RDX,%RCX |
0xf4ca MOV %RCX,%RSI |
0xf4cd MOVQ $0,(%R14,%R12,8) |
0xf4d5 CMP %RSI,%RDI |
0xf4d8 MOV %RDI,%R15 |
0xf4db MOV %RSI,-0x50(%RBP) |
0xf4df JGE f5b2 |
0xf4e5 CMP %RDX,%R12 |
0xf4e8 CMOVL %R12,%RDX |
0xf4ec IMUL %R12,%RAX |
0xf4f0 ADD %RDX,%RAX |
0xf4f3 MOV %RSI,%RDX |
0xf4f6 SUB %RAX,%RDX |
0xf4f9 CMP $0x8,%RDX |
0xf4fd JAE f503 |
0xf4ff XOR %ECX,%ECX |
0xf501 JMP f549 |
0xf503 MOV %RDX,%RSI |
0xf506 SHR $0x3,%RSI |
0xf50a LEA (%R9,%RDI,8),%RDI |
0xf50e XOR %ECX,%ECX |
(160) 0xf510 MOVDQU (%RDI),%XMM0 |
(160) 0xf514 MOVDQU 0x10(%RDI),%XMM1 |
(160) 0xf519 MOVDQU 0x20(%RDI),%XMM2 |
(160) 0xf51e PADDQ %XMM0,%XMM2 |
(160) 0xf522 MOVDQU 0x30(%RDI),%XMM0 |
(160) 0xf527 PADDQ %XMM1,%XMM0 |
(160) 0xf52b PADDQ %XMM2,%XMM0 |
(160) 0xf52f PSHUFD $-0x12,%XMM0,%XMM1 |
(160) 0xf534 PADDQ %XMM0,%XMM1 |
(160) 0xf538 MOVQ %XMM1,%R8 |
(160) 0xf53d ADD %R8,%RCX |
(160) 0xf540 ADD $0x40,%RDI |
(160) 0xf544 DEC %RSI |
(160) 0xf547 JNE f510 |
0xf549 MOV %EDX,%ESI |
0xf54b AND $0x7,%ESI |
0xf54e DEC %RSI |
0xf551 CMP $0x6,%RSI |
0xf555 JA f5ae |
0xf557 AND $-0x8,%RDX |
0xf55b LEA 0x11bb6(%RIP),%RDI |
0xf562 MOVSXD (%RDI,%RSI,4),%RSI |
0xf566 ADD %RDI,%RSI |
0xf569 JMP %RSI |
0xf56b ADD %RDX,%RAX |
0xf56e JMP f5aa |
0xf570 ADD %RDX,%RAX |
0xf573 JMP f5a5 |
0xf575 ADD %RDX,%RAX |
0xf578 JMP f5a0 |
0xf57a ADD %RDX,%RAX |
0xf57d JMP f59b |
0xf57f ADD %RDX,%RAX |
0xf582 JMP f596 |
0xf584 ADD %RDX,%RAX |
0xf587 JMP f591 |
0xf589 ADD %RDX,%RAX |
0xf58c ADD 0x30(%R9,%RAX,8),%RCX |
0xf591 ADD 0x28(%R9,%RAX,8),%RCX |
0xf596 ADD 0x20(%R9,%RAX,8),%RCX |
0xf59b ADD 0x18(%R9,%RAX,8),%RCX |
0xf5a0 ADD 0x10(%R9,%RAX,8),%RCX |
0xf5a5 ADD 0x8(%R9,%RAX,8),%RCX |
0xf5aa ADD (%R9,%RAX,8),%RCX |
0xf5ae MOV %RCX,(%R14,%R12,8) |
0xf5b2 MOV (%R13),%ESI |
0xf5b6 LEA 0x17dd3(%RIP),%RDI |
0xf5bd CALL 5500 <__kmpc_barrier@plt> |
0xf5c2 TEST %R12,%R12 |
0xf5c5 JNE f666 |
0xf5cb MOV 0xc8(%RBP),%RAX |
0xf5d2 TEST %RAX,%RAX |
0xf5d5 JLE f666 |
0xf5db MOV (%R14),%RCX |
0xf5de CMP $0x8,%RAX |
0xf5e2 JB f637 |
0xf5e4 MOV %RAX,%RDX |
0xf5e7 SHR $0x3,%RDX |
0xf5eb LEA 0x40(%R14),%RSI |
0xf5ef NOP |
(159) 0xf5f0 ADD -0x38(%RSI),%RCX |
(159) 0xf5f4 MOV %RCX,-0x38(%RSI) |
(159) 0xf5f8 ADD -0x30(%RSI),%RCX |
(159) 0xf5fc MOV %RCX,-0x30(%RSI) |
(159) 0xf600 ADD -0x28(%RSI),%RCX |
(159) 0xf604 MOV %RCX,-0x28(%RSI) |
(159) 0xf608 ADD -0x20(%RSI),%RCX |
(159) 0xf60c MOV %RCX,-0x20(%RSI) |
(159) 0xf610 ADD -0x18(%RSI),%RCX |
(159) 0xf614 MOV %RCX,-0x18(%RSI) |
(159) 0xf618 ADD -0x10(%RSI),%RCX |
(159) 0xf61c MOV %RCX,-0x10(%RSI) |
(159) 0xf620 ADD -0x8(%RSI),%RCX |
(159) 0xf624 MOV %RCX,-0x8(%RSI) |
(159) 0xf628 ADD (%RSI),%RCX |
(159) 0xf62b MOV %RCX,(%RSI) |
(159) 0xf62e ADD $0x40,%RSI |
(159) 0xf632 DEC %RDX |
(159) 0xf635 JNE f5f0 |
0xf637 MOV %RAX,%RDX |
0xf63a AND $-0x8,%RDX |
0xf63e CMP %RAX,%RDX |
0xf641 JAE f666 |
0xf643 NOPW %CS:(%RAX,%RAX,1) |
(158) 0xf650 ADD 0x8(%R14,%RDX,8),%RCX |
(158) 0xf655 MOV %RCX,0x8(%R14,%RDX,8) |
(158) 0xf65a LEA 0x1(%RDX),%RSI |
(158) 0xf65e MOV %RSI,%RDX |
(158) 0xf661 CMP %RSI,%RAX |
(158) 0xf664 JNE f650 |
0xf666 MOV (%R13),%ESI |
0xf66a LEA 0x17d3f(%RIP),%RDI |
0xf671 CALL 5500 <__kmpc_barrier@plt> |
0xf676 TEST %R12,%R12 |
0xf679 JE f682 |
0xf67b MOV -0x8(%R14,%R12,8),%RAX |
0xf680 JMP f684 |
0xf682 XOR %EAX,%EAX |
0xf684 MOV %RAX,-0x68(%RBP) |
0xf688 MOV -0x58(%RBP),%R11 |
0xf68c MOV %R15,%RDX |
0xf68f MOV -0x50(%RBP),%RSI |
0xf693 CMP %RSI,%R15 |
0xf696 JGE fe08 |
0xf69c MOV 0xb0(%RBP),%RAX |
0xf6a3 MOV 0xa8(%RBP),%RCX |
0xf6aa CMPQ $0,0x18(%RBP) |
0xf6af LEA (%RAX,%R12,8),%R13 |
0xf6b3 SETNE %AL |
0xf6b6 CMPQ $0,0x98(%RBP) |
0xf6be SETG %DIL |
0xf6c2 AND %AL,%DIL |
0xf6c5 MOV %DIL,-0x29(%RBP) |
0xf6c9 MOV 0x20(%RBP),%R15 |
0xf6cd LEA 0x18(%RCX),%RAX |
0xf6d1 MOV %RAX,-0x90(%RBP) |
0xf6d8 XOR %EAX,%EAX |
0xf6da MOV %RAX,-0x78(%RBP) |
0xf6de JMP f6fc |
(144) 0xf6e0 MOV -0x58(%RBP),%R11 |
(144) 0xf6e4 MOV -0x60(%RBP),%RDX |
(144) 0xf6e8 MOV -0x50(%RBP),%RSI |
(144) 0xf6ec MOV 0x20(%RBP),%R15 |
(144) 0xf6f0 INC %RDX |
(144) 0xf6f3 CMP %RSI,%RDX |
(144) 0xf6f6 JGE fe08 |
(144) 0xf6fc MOV -0x88(%RBP),%RAX |
(144) 0xf703 MOV (%RAX,%RDX,8),%RDI |
(144) 0xf707 MOV (%R11,%RDX,8),%R14 |
(144) 0xf70b MOV %RDI,-0x70(%RBP) |
(144) 0xf70f SUB (%R15),%RDI |
(144) 0xf712 JL f7c0 |
(144) 0xf718 MOV -0x70(%RBP),%RAX |
(144) 0xf71c CMP 0x8(%R15),%RAX |
(144) 0xf720 JGE f7c0 |
(144) 0xf726 CMPQ $0,0x58(%RBP) |
(144) 0xf72b JE f98a |
(144) 0xf731 MOV 0x38(%RBP),%R8 |
(144) 0xf735 MOV (%R8,%RDI,8),%R15 |
(144) 0xf739 MOV 0x40(%RBP),%RAX |
(144) 0xf73d MOV (%RAX,%RDI,8),%RAX |
(144) 0xf741 MOV %RAX,-0x40(%RBP) |
(144) 0xf745 MOV 0x50(%RBP),%RAX |
(144) 0xf749 MOV (%RAX,%RDI,8),%RCX |
(144) 0xf74d MOV 0x48(%RBP),%RAX |
(144) 0xf751 MOV %RDI,-0x38(%RBP) |
(144) 0xf755 MOV (%RAX,%RDI,8),%R12 |
(144) 0xf759 MOV %RCX,-0x70(%RBP) |
(144) 0xf75d MOV %RCX,%RAX |
(144) 0xf760 SUB %R12,%RAX |
(144) 0xf763 MOV %R14,%RCX |
(144) 0xf766 SUB %RAX,%RCX |
(144) 0xf769 MOV %RDX,-0x60(%RBP) |
(144) 0xf76d JLE faf6 |
(144) 0xf773 MOV $0x8,%ESI |
(144) 0xf778 MOV %RCX,%RDI |
(144) 0xf77b MOV %RCX,-0x80(%RBP) |
(144) 0xf77f CALL 54d0 <hypre_CAlloc@plt> |
(144) 0xf784 MOV %RAX,-0x48(%RBP) |
(144) 0xf788 MOV $0x8,%ESI |
(144) 0xf78d MOV -0x80(%RBP),%RDI |
(144) 0xf791 CALL 54d0 <hypre_CAlloc@plt> |
(144) 0xf796 MOV -0x48(%RBP),%R10 |
(144) 0xf79a MOV 0x10(%RBP),%RDI |
(144) 0xf79e TEST %R14,%R14 |
(144) 0xf7a1 MOV %RAX,%RCX |
(144) 0xf7a4 MOV %RAX,-0x78(%RBP) |
(144) 0xf7a8 JG fb11 |
(144) 0xf7ae MOV 0x48(%RBP),%RAX |
(144) 0xf7b2 MOV -0x38(%RBP),%RCX |
(144) 0xf7b6 MOV %R12,(%RAX,%RCX,8) |
(144) 0xf7ba JMP fcc3 |
0xf7bf NOP |
(144) 0xf7c0 ADD %R14,-0x68(%RBP) |
(144) 0xf7c4 TEST %R14,%R14 |
(144) 0xf7c7 SETG %AL |
(144) 0xf7ca TEST %AL,-0x29(%RBP) |
(144) 0xf7cd JE f6f0 |
(144) 0xf7d3 MOV %RDX,-0x60(%RBP) |
(144) 0xf7d7 MOV 0x98(%RBP),%RAX |
(144) 0xf7de DEC %RAX |
(144) 0xf7e1 SHR $0x1,%RAX |
(144) 0xf7e4 MOV %RAX,-0x40(%RBP) |
(144) 0xf7e8 DEC %R14 |
(144) 0xf7eb XOR %EDX,%EDX |
(144) 0xf7ed XOR %ECX,%ECX |
(144) 0xf7ef JMP f811 |
0xf7f1 NOPW %CS:(%RAX,%RAX,1) |
(145) 0xf800 LEA 0x1(%RCX),%RAX |
(145) 0xf804 CMP -0x40(%RBP),%RCX |
(145) 0xf808 MOV %RAX,%RCX |
(145) 0xf80b JE f6e0 |
(145) 0xf811 MOV %RDX,%RAX |
(145) 0xf814 MOV %RCX,%RDI |
(145) 0xf817 SAL $0x4,%RDI |
(145) 0xf81b MOV 0xa0(%RBP),%R8 |
(145) 0xf822 MOV 0x8(%R8,%RDI,1),%RSI |
(145) 0xf827 ADD %RSI,%RDX |
(145) 0xf82a MOV -0x70(%RBP),%R9 |
(145) 0xf82e CMP %R9,(%R8,%RDI,1) |
(145) 0xf832 JNE f800 |
(145) 0xf834 TEST %RSI,%RSI |
(145) 0xf837 JLE f800 |
(145) 0xf839 MOV 0xa8(%RBP),%RDI |
(145) 0xf840 LEA (%RDI,%RDX,8),%R8 |
(145) 0xf844 ADD $-0x8,%R8 |
(145) 0xf848 LEA (%RDI,%RAX,8),%RDI |
(145) 0xf84c CMP %R13,%R8 |
(145) 0xf84f JB f8a0 |
(145) 0xf851 CMP %RDI,%R13 |
(145) 0xf854 JB f8a0 |
(145) 0xf856 XOR %EAX,%EAX |
(145) 0xf858 JMP f86c |
0xf85a NOPW (%RAX,%RAX,1) |
(149) 0xf860 LEA 0x1(%RAX),%R8 |
(149) 0xf864 CMP %R14,%RAX |
(149) 0xf867 MOV %R8,%RAX |
(149) 0xf86a JE f800 |
(149) 0xf86c MOV (%RBX,%RAX,8),%R8 |
(149) 0xf870 XOR %R9D,%R9D |
(149) 0xf873 JMP f888 |
0xf875 NOPW %CS:(%RAX,%RAX,1) |
(150) 0xf880 INC %R9 |
(150) 0xf883 CMP %R9,%RSI |
(150) 0xf886 JE f860 |
(150) 0xf888 CMP %R8,(%RDI,%R9,8) |
(150) 0xf88c JNE f880 |
(150) 0xf88e MOVQ $-0x1,(%RDI,%R9,8) |
(150) 0xf896 INCQ (%R13) |
(150) 0xf89a JMP f880 |
0xf89c NOPL (%RAX) |
(145) 0xf8a0 MOV -0x90(%RBP),%R8 |
(145) 0xf8a7 LEA (%R8,%RAX,8),%RAX |
(145) 0xf8ab MOV %RSI,%R12 |
(145) 0xf8ae SHR $0x2,%R12 |
(145) 0xf8b2 MOV %RSI,%R10 |
(145) 0xf8b5 AND $-0x4,%R10 |
(145) 0xf8b9 XOR %R11D,%R11D |
(145) 0xf8bc JMP f8d0 |
0xf8be XCHG %AX,%AX |
(146) 0xf8c0 LEA 0x1(%R11),%R8 |
(146) 0xf8c4 CMP %R14,%R11 |
(146) 0xf8c7 MOV %R8,%R11 |
(146) 0xf8ca JE f800 |
(146) 0xf8d0 MOV (%RBX,%R11,8),%R15 |
(146) 0xf8d4 CMP $0x4,%RSI |
(146) 0xf8d8 JAE f910 |
(146) 0xf8da CMP %RSI,%R10 |
(146) 0xf8dd JAE f8c0 |
(146) 0xf8df MOV %R10,%R8 |
(146) 0xf8e2 JMP f8f8 |
0xf8e4 NOPW %CS:(%RAX,%RAX,1) |
(147) 0xf8f0 INC %R8 |
(147) 0xf8f3 CMP %R8,%RSI |
(147) 0xf8f6 JE f8c0 |
(147) 0xf8f8 CMP %R15,(%RDI,%R8,8) |
(147) 0xf8fc JNE f8f0 |
(147) 0xf8fe MOVQ $-0x1,(%RDI,%R8,8) |
(147) 0xf906 INCQ (%R13) |
(147) 0xf90a JMP f8f0 |
0xf90c NOPL (%RAX) |
(146) 0xf910 MOV %R12,%R9 |
(146) 0xf913 MOV %RAX,%R8 |
(146) 0xf916 JMP f929 |
0xf918 NOPL (%RAX,%RAX,1) |
(148) 0xf920 ADD $0x20,%R8 |
(148) 0xf924 DEC %R9 |
(148) 0xf927 JE f8da |
(148) 0xf929 CMP %R15,-0x18(%R8) |
(148) 0xf92d JNE f960 |
(148) 0xf92f MOVQ $-0x1,-0x18(%R8) |
(148) 0xf937 INCQ (%R13) |
(148) 0xf93b CMP %R15,-0x10(%R8) |
(148) 0xf93f JE f966 |
(148) 0xf941 CMP %R15,-0x8(%R8) |
(148) 0xf945 JNE f978 |
(148) 0xf947 MOVQ $-0x1,-0x8(%R8) |
(148) 0xf94f INCQ (%R13) |
(148) 0xf953 CMP %R15,(%R8) |
(148) 0xf956 JNE f920 |
(148) 0xf958 JMP f97d |
0xf95a NOPW (%RAX,%RAX,1) |
(148) 0xf960 CMP %R15,-0x10(%R8) |
(148) 0xf964 JNE f941 |
(148) 0xf966 MOVQ $-0x1,-0x10(%R8) |
(148) 0xf96e INCQ (%R13) |
(148) 0xf972 CMP %R15,-0x8(%R8) |
(148) 0xf976 JE f947 |
(148) 0xf978 CMP %R15,(%R8) |
(148) 0xf97b JNE f920 |
(148) 0xf97d MOVQ $-0x1,(%R8) |
(148) 0xf984 INCQ (%R13) |
(148) 0xf988 JMP f920 |
(144) 0xf98a MOV 0x18(%RBP),%RAX |
(144) 0xf98e MOV 0x38(%RAX),%RCX |
(144) 0xf992 MOV 0x40(%RAX),%RAX |
(144) 0xf996 MOV (%RAX,%RDI,8),%RAX |
(144) 0xf99a MOV (%RCX,%RDI,8),%RCX |
(144) 0xf99e TEST %R14,%R14 |
(144) 0xf9a1 JLE fcab |
(144) 0xf9a7 MOV %RDX,-0x60(%RBP) |
(144) 0xf9ab MOV 0x60(%RBP),%RDX |
(144) 0xf9af MOV 0x8(%RDX,%RDI,8),%RDX |
(144) 0xf9b4 MOV 0x78(%RBP),%RSI |
(144) 0xf9b8 MOV %RDI,-0x38(%RBP) |
(144) 0xf9bc MOV 0x8(%RSI,%RDI,8),%RDI |
(144) 0xf9c1 MOV -0x68(%RBP),%R12 |
(144) 0xf9c5 LEA (%R14,%R12,1),%RSI |
(144) 0xf9c9 XOR %R8D,%R8D |
(144) 0xf9cc MOV %RAX,-0x40(%RBP) |
(144) 0xf9d0 MOV %RCX,-0x48(%RBP) |
(144) 0xf9d4 JMP f9f9 |
(151) 0xf9d6 MOV 0x10(%RBP),%R9 |
(151) 0xf9da MOVQ (%R9,%R12,8),%XMM0 |
(151) 0xf9e0 MOV 0x70(%RBP),%R9 |
(151) 0xf9e4 MOVQ %XMM0,(%R9,%R10,8) |
(151) 0xf9ea INC %R12 |
(151) 0xf9ed INC %R8 |
(151) 0xf9f0 CMP %R14,%R8 |
(151) 0xf9f3 JE fcb6 |
(151) 0xf9f9 MOV (%RBX,%R12,8),%R9 |
(151) 0xf9fd CMP 0x28(%RBP),%R9 |
(151) 0xfa01 JL fa70 |
(151) 0xfa03 CMP 0x30(%RBP),%R9 |
(151) 0xfa07 JG fa70 |
(151) 0xfa09 MOV 0x60(%RBP),%R10 |
(151) 0xfa0d MOV -0x38(%RBP),%R15 |
(151) 0xfa11 MOV (%R10,%R15,8),%R10 |
(151) 0xfa15 CMP %RCX,%R10 |
(151) 0xfa18 JGE fa32 |
(151) 0xfa1a NOPW (%RAX,%RAX,1) |
(153) 0xfa20 MOV 0x68(%RBP),%R15 |
(153) 0xfa24 CMP %R9,(%R15,%R10,8) |
(153) 0xfa28 JE f9d6 |
(153) 0xfa2a INC %R10 |
(153) 0xfa2d CMP %R10,%RCX |
(153) 0xfa30 JNE fa20 |
(151) 0xfa32 MOV -0x48(%RBP),%R15 |
(151) 0xfa36 CMP %RDX,%R15 |
(151) 0xfa39 JGE fd01 |
(151) 0xfa3f MOV 0x68(%RBP),%R10 |
(151) 0xfa43 MOV %R9,(%R10,%R15,8) |
(151) 0xfa47 MOV 0x10(%RBP),%R9 |
(151) 0xfa4b MOVQ (%R9,%R12,8),%XMM0 |
(151) 0xfa51 MOV 0x70(%RBP),%R9 |
(151) 0xfa55 MOVQ %XMM0,(%R9,%R15,8) |
(151) 0xfa5b INC %R15 |
(151) 0xfa5e MOV %R15,-0x48(%RBP) |
(151) 0xfa62 JMP f9ea |
0xfa64 NOPW %CS:(%RAX,%RAX,1) |
(151) 0xfa70 MOV 0x78(%RBP),%R10 |
(151) 0xfa74 MOV -0x38(%RBP),%R15 |
(151) 0xfa78 MOV (%R10,%R15,8),%R10 |
(151) 0xfa7c CMP %RAX,%R10 |
(151) 0xfa7f JGE faa5 |
(151) 0xfa81 NOPW %CS:(%RAX,%RAX,1) |
(152) 0xfa90 MOV 0x80(%RBP),%R15 |
(152) 0xfa97 CMP %R9,(%R15,%R10,8) |
(152) 0xfa9b JE fae0 |
(152) 0xfa9d INC %R10 |
(152) 0xfaa0 CMP %R10,%RAX |
(152) 0xfaa3 JNE fa90 |
(151) 0xfaa5 MOV -0x40(%RBP),%R15 |
(151) 0xfaa9 CMP %RDI,%R15 |
(151) 0xfaac JGE fd3b |
(151) 0xfab2 MOV 0x80(%RBP),%R10 |
(151) 0xfab9 MOV %R9,(%R10,%R15,8) |
(151) 0xfabd MOV 0x10(%RBP),%R9 |
(151) 0xfac1 MOVQ (%R9,%R12,8),%XMM0 |
(151) 0xfac7 MOV 0x88(%RBP),%R9 |
(151) 0xface MOVQ %XMM0,(%R9,%R15,8) |
(151) 0xfad4 INC %R15 |
(151) 0xfad7 MOV %R15,-0x40(%RBP) |
(151) 0xfadb JMP f9ea |
(151) 0xfae0 MOV 0x10(%RBP),%R9 |
(151) 0xfae4 MOVQ (%R9,%R12,8),%XMM0 |
(151) 0xfaea MOV 0x88(%RBP),%R9 |
(151) 0xfaf1 JMP f9e4 |
(144) 0xfaf6 XOR %R10D,%R10D |
(144) 0xfaf9 MOV 0x10(%RBP),%RDI |
(144) 0xfafd MOV -0x78(%RBP),%RAX |
(144) 0xfb01 TEST %R14,%R14 |
(144) 0xfb04 MOV %RAX,%RCX |
(144) 0xfb07 MOV %RAX,-0x78(%RBP) |
(144) 0xfb0b JLE f7ae |
(144) 0xfb11 XOR %R9D,%R9D |
(144) 0xfb14 MOV %R12,%R8 |
(144) 0xfb17 MOV -0x68(%RBP),%RCX |
(144) 0xfb1b XOR %R11D,%R11D |
(144) 0xfb1e JMP fb38 |
(156) 0xfb20 MOV %RDX,(%R10,%R11,8) |
(156) 0xfb24 MOVQ %XMM0,(%RAX,%R11,8) |
(156) 0xfb2a INC %R11 |
(156) 0xfb2d INC %RCX |
(156) 0xfb30 INC %R9 |
(156) 0xfb33 CMP %R14,%R9 |
(156) 0xfb36 JE fb90 |
(156) 0xfb38 MOV (%RBX,%RCX,8),%RDX |
(156) 0xfb3c TEST %R12,%R12 |
(156) 0xfb3f JLE fb5e |
(156) 0xfb41 XOR %ESI,%ESI |
(156) 0xfb43 NOPW %CS:(%RAX,%RAX,1) |
(157) 0xfb50 CMP %RDX,(%R15,%RSI,8) |
(157) 0xfb54 JE fb80 |
(157) 0xfb56 INC %RSI |
(157) 0xfb59 CMP %RSI,%R12 |
(157) 0xfb5c JNE fb50 |
(156) 0xfb5e MOVQ (%RDI,%RCX,8),%XMM0 |
(156) 0xfb63 CMP -0x70(%RBP),%R8 |
(156) 0xfb67 JGE fb20 |
(156) 0xfb69 MOV %RDX,(%R15,%R8,8) |
(156) 0xfb6d MOV -0x40(%RBP),%RDX |
(156) 0xfb71 MOVQ %XMM0,(%RDX,%R8,8) |
(156) 0xfb77 INC %R8 |
(156) 0xfb7a JMP fb2d |
0xfb7c NOPL (%RAX) |
(156) 0xfb80 MOVQ (%RDI,%RCX,8),%XMM0 |
(156) 0xfb85 MOV -0x40(%RBP),%RDX |
(156) 0xfb89 MOVQ %XMM0,(%RDX,%RSI,8) |
(156) 0xfb8e JMP fb2d |
(144) 0xfb90 MOV -0x68(%RBP),%R12 |
(144) 0xfb94 ADD %R14,%R12 |
(144) 0xfb97 LEA (%R8,%R11,1),%R15 |
(144) 0xfb9b MOV 0x48(%RBP),%RAX |
(144) 0xfb9f MOV -0x38(%RBP),%RCX |
(144) 0xfba3 MOV %R15,(%RAX,%RCX,8) |
(144) 0xfba7 TEST %R11,%R11 |
(144) 0xfbaa MOV %R12,-0x68(%RBP) |
(144) 0xfbae JE fcc3 |
(144) 0xfbb4 MOV %R8,-0x40(%RBP) |
(144) 0xfbb8 MOV %R10,-0x48(%RBP) |
(144) 0xfbbc MOV -0x38(%RBP),%RAX |
(144) 0xfbc0 MOV 0x38(%RBP),%RCX |
(144) 0xfbc4 MOV (%RCX,%RAX,8),%RDI |
(144) 0xfbc8 LEA (,%R15,8),%R14 |
(144) 0xfbd0 MOV %R14,%RSI |
(144) 0xfbd3 MOV %R11,-0x70(%RBP) |
(144) 0xfbd7 CALL 51a0 <hypre_ReAlloc@plt> |
(144) 0xfbdc MOV -0x38(%RBP),%RCX |
(144) 0xfbe0 MOV 0x38(%RBP),%RDX |
(144) 0xfbe4 MOV %RAX,(%RDX,%RCX,8) |
(144) 0xfbe8 MOV 0x40(%RBP),%RCX |
(144) 0xfbec MOV -0x38(%RBP),%RAX |
(144) 0xfbf0 MOV (%RCX,%RAX,8),%RDI |
(144) 0xfbf4 MOV %R14,%RSI |
(144) 0xfbf7 CALL 51a0 <hypre_ReAlloc@plt> |
(144) 0xfbfc MOV -0x70(%RBP),%RDX |
(144) 0xfc00 MOV -0x38(%RBP),%RSI |
(144) 0xfc04 MOV 0x40(%RBP),%RCX |
(144) 0xfc08 MOV %RAX,(%RCX,%RSI,8) |
(144) 0xfc0c MOV 0x50(%RBP),%RCX |
(144) 0xfc10 MOV %R15,(%RCX,%RSI,8) |
(144) 0xfc14 TEST %RDX,%RDX |
(144) 0xfc17 JLE fcbf |
(144) 0xfc1d MOV 0x38(%RBP),%RCX |
(144) 0xfc21 MOV (%RCX,%RSI,8),%RCX |
(144) 0xfc25 MOV -0x48(%RBP),%R10 |
(144) 0xfc29 LEA (%R10,%RDX,8),%RSI |
(144) 0xfc2d ADD $-0x8,%RSI |
(144) 0xfc31 MOV -0x40(%RBP),%R11 |
(144) 0xfc35 LEA (%RCX,%R11,8),%RDI |
(144) 0xfc39 CMP %RDI,%RSI |
(144) 0xfc3c SETAE %R9B |
(144) 0xfc40 LEA (%RDX,%R11,1),%RSI |
(144) 0xfc44 DEC %RSI |
(144) 0xfc47 LEA (%RCX,%RSI,8),%RCX |
(144) 0xfc4b CMP %R10,%RCX |
(144) 0xfc4e SETAE %R8B |
(144) 0xfc52 MOV -0x78(%RBP),%R15 |
(144) 0xfc56 LEA (%R15,%RDX,8),%RCX |
(144) 0xfc5a ADD $-0x8,%RCX |
(144) 0xfc5e LEA (%RAX,%R11,8),%R14 |
(144) 0xfc62 CMP %R14,%RCX |
(144) 0xfc65 SETB %CL |
(144) 0xfc68 LEA (%RAX,%RSI,8),%RAX |
(144) 0xfc6c CMP %R15,%RAX |
(144) 0xfc6f SETB %AL |
(144) 0xfc72 TEST %R8B,%R9B |
(144) 0xfc75 JNE fcd5 |
(144) 0xfc77 OR %AL,%CL |
(144) 0xfc79 JE fcd5 |
(144) 0xfc7b CMP $0xc,%RDX |
(144) 0xfc7f JBE fdb3 |
(144) 0xfc85 SAL $0x3,%RDX |
(144) 0xfc89 MOV %R10,%RSI |
(144) 0xfc8c MOV %RDX,%R12 |
(144) 0xfc8f CALL 50a0 <_intel_fast_memcpy@plt> |
(144) 0xfc94 MOV %R14,%RDI |
(144) 0xfc97 MOV %R15,%RSI |
(144) 0xfc9a MOV %R12,%RDX |
(144) 0xfc9d CALL 50a0 <_intel_fast_memcpy@plt> |
(144) 0xfca2 MOV -0x48(%RBP),%R10 |
(144) 0xfca6 JMP fddc |
(144) 0xfcab MOV %RCX,%R9 |
(144) 0xfcae MOV %RAX,%R8 |
(144) 0xfcb1 JMP fd9a |
(144) 0xfcb6 MOV %RSI,-0x68(%RBP) |
(144) 0xfcba JMP fd82 |
(144) 0xfcbf MOV -0x48(%RBP),%R10 |
(144) 0xfcc3 TEST %R10,%R10 |
(144) 0xfcc6 MOV 0x20(%RBP),%R15 |
(144) 0xfcca JNE fde0 |
(144) 0xfcd0 JMP fdf7 |
(144) 0xfcd5 XOR %EAX,%EAX |
(144) 0xfcd7 NOPW (%RAX,%RAX,1) |
(154) 0xfce0 MOV (%R10,%RAX,8),%RCX |
(154) 0xfce4 MOV %RCX,(%RDI,%RAX,8) |
(154) 0xfce8 MOVQ (%R15,%RAX,8),%XMM0 |
(154) 0xfcee MOVQ %XMM0,(%R14,%RAX,8) |
(154) 0xfcf4 INC %RAX |
(154) 0xfcf7 CMP %RAX,%RDX |
(154) 0xfcfa JNE fce0 |
(144) 0xfcfc JMP fddc |
(144) 0xfd01 MOV %R12,-0x68(%RBP) |
(144) 0xfd05 MOV $0xd70,%ESI |
(144) 0xfd0a MOV $0x1,%EDX |
(144) 0xfd0f LEA 0x1170d(%RIP),%RDI |
(144) 0xfd16 XOR %ECX,%ECX |
(144) 0xfd18 CALL 55d0 <hypre_error_handler@plt> |
(144) 0xfd1d MOV 0xd0(%RBP),%RAX |
(144) 0xfd24 LOCK INCQ (%RAX) |
(144) 0xfd28 CMPQ $0,0xc0(%RBP) |
(144) 0xfd30 JE fd7e |
(144) 0xfd32 LEA 0x11868(%RIP),%RDI |
(144) 0xfd39 JMP fd73 |
(144) 0xfd3b MOV %R12,-0x68(%RBP) |
(144) 0xfd3f MOV $0xd4e,%ESI |
(144) 0xfd44 MOV $0x1,%EDX |
(144) 0xfd49 LEA 0x116d3(%RIP),%RDI |
(144) 0xfd50 XOR %ECX,%ECX |
(144) 0xfd52 CALL 55d0 <hypre_error_handler@plt> |
(144) 0xfd57 MOV 0xd0(%RBP),%RAX |
(144) 0xfd5e LOCK INCQ (%RAX) |
(144) 0xfd62 CMPQ $0,0xc0(%RBP) |
(144) 0xfd6a JE fd7e |
(144) 0xfd6c LEA 0x11808(%RIP),%RDI |
(144) 0xfd73 MOV -0x70(%RBP),%RSI |
(144) 0xfd77 XOR %EAX,%EAX |
(144) 0xfd79 CALL 55a0 <hypre_printf@plt> |
(144) 0xfd7e MOV -0x58(%RBP),%R11 |
(144) 0xfd82 MOV -0x60(%RBP),%RDX |
(144) 0xfd86 MOV -0x50(%RBP),%RSI |
(144) 0xfd8a MOV 0x20(%RBP),%R15 |
(144) 0xfd8e MOV -0x38(%RBP),%RDI |
(144) 0xfd92 MOV -0x40(%RBP),%R8 |
(144) 0xfd96 MOV -0x48(%RBP),%R9 |
(144) 0xfd9a MOV 0x18(%RBP),%RCX |
(144) 0xfd9e MOV 0x38(%RCX),%RAX |
(144) 0xfda2 MOV %R9,(%RAX,%RDI,8) |
(144) 0xfda6 MOV 0x40(%RCX),%RAX |
(144) 0xfdaa MOV %R8,(%RAX,%RDI,8) |
(144) 0xfdae JMP f6f0 |
(144) 0xfdb3 XOR %EAX,%EAX |
(144) 0xfdb5 NOPW %CS:(%RAX,%RAX,1) |
(155) 0xfdc0 MOV (%R10,%RAX,8),%RCX |
(155) 0xfdc4 MOV %RCX,(%RDI,%RAX,8) |
(155) 0xfdc8 MOVQ (%R15,%RAX,8),%XMM0 |
(155) 0xfdce MOVQ %XMM0,(%R14,%RAX,8) |
(155) 0xfdd4 INC %RAX |
(155) 0xfdd7 CMP %RAX,%RDX |
(155) 0xfdda JNE fdc0 |
(144) 0xfddc MOV 0x20(%RBP),%R15 |
(144) 0xfde0 MOV %R10,%RDI |
(144) 0xfde3 CALL 5260 <hypre_Free@plt> |
(144) 0xfde8 MOV -0x78(%RBP),%RDI |
(144) 0xfdec CALL 5260 <hypre_Free@plt> |
(144) 0xfdf1 XOR %EAX,%EAX |
(144) 0xfdf3 MOV %RAX,-0x78(%RBP) |
(144) 0xfdf7 MOV -0x58(%RBP),%R11 |
(144) 0xfdfb MOV -0x60(%RBP),%RDX |
(144) 0xfdff MOV -0x50(%RBP),%RSI |
(144) 0xfe03 JMP f6f0 |
0xfe08 ADD $0x68,%RSP |
0xfe0c POP %RBX |
0xfe0d POP %R12 |
0xfe0f POP %R13 |
0xfe11 POP %R14 |
0xfe13 POP %R15 |
0xfe15 POP %RBP |
0xfe16 RET |
0xfe17 NOPW (%RAX,%RAX,1) |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►100.00+ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Path / |
Source file and lines | IJMatrix_parcsr.c:3240-3484 |
Module | libIJ_mv.so |
nb instructions | 164 |
nb uops | 154 |
loop length | 631 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 14 |
micro-operation queue | 25.67 cycles |
front end | 25.67 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 19.25 | 19.25 | 19.25 | 19.25 | 16.00 | 11.67 | 11.67 | 11.67 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
cycles | 19.25 | 19.25 | 19.25 | 19.25 | 16.00 | 11.67 | 11.67 | 11.67 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | 13.00-18.00 |
Front-end | 25.67 |
Dispatch | 19.25 |
DIV/SQRT | 13.00-18.00 |
Overall L1 | 25.67 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 0% |
all | 12% |
load | 12% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 12% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput | Vectorization |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
SUB $0x68,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %R8,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %RCX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %RDX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
MOV %RDI,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
CALL 5440 <hypre_NumActiveThreads@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
CALL 5160 <hypre_GetThreadNum@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
OR %R14,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
SHR $0x20,%RAX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
JE f48b <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x4b> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
CQTO | | | | | | | | | | | | | | | | | | scal (12.5%) |
IDIV %R15 | 2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 9-19 | 7-12 | scal (12.5%) |
JMP f493 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x53> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
MOV %R14D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | scal (6.3%) |
DIV %R15D | 2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 10-17 | 6 | scal (6.3%) |
MOV 0xb8(%RBP),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
LEA 0x1(%R12),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CMP %RDX,%R12 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
MOV -0x58(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
JGE f4b9 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x79> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
LEA 0x1(%RAX),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RSI,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
IMUL %R12,%RDI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | N/A |
IMUL %RCX,%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | N/A |
JMP f4cd <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x8d> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
IMUL %R12,%RDI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | N/A |
ADD %RDX,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
IMUL %RAX,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | N/A |
ADD %RDX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RCX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
MOVQ $0,(%R14,%R12,8) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
CMP %RSI,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
MOV %RDI,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %RSI,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
JGE f5b2 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x172> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
CMP %RDX,%R12 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
CMOVL %R12,%RDX | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (12.5%) |
IMUL %R12,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | N/A |
ADD %RDX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RSI,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
SUB %RAX,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
CMP $0x8,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JAE f503 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xc3> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | N/A |
JMP f549 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x109> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
MOV %RDX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
SHR $0x3,%RSI | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
LEA (%R9,%RDI,8),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | N/A |
MOV %EDX,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
AND $0x7,%ESI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
DEC %RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CMP $0x6,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JA f5ae <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x16e> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
AND $-0x8,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
LEA 0x11bb6(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOVSXD (%RDI,%RSI,4),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
ADD %RDI,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
JMP %RSI | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
ADD %RDX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
JMP f5aa <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x16a> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
ADD %RDX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
JMP f5a5 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x165> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
ADD %RDX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
JMP f5a0 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x160> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
ADD %RDX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
JMP f59b <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x15b> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
ADD %RDX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
JMP f596 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x156> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
ADD %RDX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
JMP f591 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x151> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
ADD %RDX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
ADD 0x30(%R9,%RAX,8),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
ADD 0x28(%R9,%RAX,8),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
ADD 0x20(%R9,%RAX,8),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
ADD 0x18(%R9,%RAX,8),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
ADD 0x10(%R9,%RAX,8),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
ADD 0x8(%R9,%RAX,8),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
ADD (%R9,%RAX,8),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
MOV %RCX,(%R14,%R12,8) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV (%R13),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
LEA 0x17dd3(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CALL 5500 <__kmpc_barrier@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
TEST %R12,%R12 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JNE f666 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x226> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV 0xc8(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
TEST %RAX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JLE f666 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x226> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV (%R14),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
CMP $0x8,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JB f637 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x1f7> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
SHR $0x3,%RDX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (12.5%) |
LEA 0x40(%R14),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
AND $-0x8,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
CMP %RAX,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JAE f666 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x226> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
MOV (%R13),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
LEA 0x17d3f(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CALL 5500 <__kmpc_barrier@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
TEST %R12,%R12 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JE f682 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x242> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV -0x8(%R14,%R12,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
JMP f684 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x244> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | N/A |
MOV %RAX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV -0x58(%RBP),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
MOV %R15,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV -0x50(%RBP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
CMP %RSI,%R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JGE fe08 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x9c8> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV 0xb0(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV 0xa8(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
CMPQ $0,0x18(%RBP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (12.5%) |
LEA (%RAX,%R12,8),%R13 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
SETNE %AL | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
CMPQ $0,0x98(%RBP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (12.5%) |
SETG %DIL | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
AND %AL,%DIL | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %DIL,-0x29(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | N/A |
MOV 0x20(%RBP),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
LEA 0x18(%RCX),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RAX,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | N/A |
MOV %RAX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
JMP f6fc <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x2bc> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
ADD $0x68,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
Source file and lines | IJMatrix_parcsr.c:3240-3484 |
Module | libIJ_mv.so |
nb instructions | 164 |
nb uops | 154 |
loop length | 631 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 14 |
micro-operation queue | 25.67 cycles |
front end | 25.67 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 19.25 | 19.25 | 19.25 | 19.25 | 16.00 | 11.67 | 11.67 | 11.67 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
cycles | 19.25 | 19.25 | 19.25 | 19.25 | 16.00 | 11.67 | 11.67 | 11.67 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | 13.00-18.00 |
Front-end | 25.67 |
Dispatch | 19.25 |
DIV/SQRT | 13.00-18.00 |
Overall L1 | 25.67 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 0% |
all | 12% |
load | 12% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 12% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput | Vectorization |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
SUB $0x68,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %R8,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %RCX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %RDX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
MOV %RDI,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
CALL 5440 <hypre_NumActiveThreads@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
CALL 5160 <hypre_GetThreadNum@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
OR %R14,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
SHR $0x20,%RAX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
JE f48b <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x4b> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
CQTO | scal (12.5%) | |||||||||||||||||
IDIV %R15 | 2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 9-19 | 7-12 | scal (12.5%) |
JMP f493 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x53> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
MOV %R14D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | scal (6.3%) |
DIV %R15D | 2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 10-17 | 6 | scal (6.3%) |
MOV 0xb8(%RBP),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
LEA 0x1(%R12),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CMP %RDX,%R12 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
MOV -0x58(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
JGE f4b9 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x79> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
LEA 0x1(%RAX),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RSI,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
IMUL %R12,%RDI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | N/A |
IMUL %RCX,%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | N/A |
JMP f4cd <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x8d> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
IMUL %R12,%RDI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | N/A |
ADD %RDX,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
IMUL %RAX,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | N/A |
ADD %RDX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RCX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
MOVQ $0,(%R14,%R12,8) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
CMP %RSI,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
MOV %RDI,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %RSI,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
JGE f5b2 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x172> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
CMP %RDX,%R12 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
CMOVL %R12,%RDX | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (12.5%) |
IMUL %R12,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | N/A |
ADD %RDX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RSI,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
SUB %RAX,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
CMP $0x8,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JAE f503 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xc3> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | N/A |
JMP f549 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x109> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
MOV %RDX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
SHR $0x3,%RSI | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
LEA (%R9,%RDI,8),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | N/A |
MOV %EDX,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
AND $0x7,%ESI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
DEC %RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CMP $0x6,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JA f5ae <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x16e> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
AND $-0x8,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
LEA 0x11bb6(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOVSXD (%RDI,%RSI,4),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
ADD %RDI,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
JMP %RSI | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
ADD %RDX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
JMP f5aa <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x16a> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
ADD %RDX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
JMP f5a5 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x165> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
ADD %RDX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
JMP f5a0 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x160> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
ADD %RDX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
JMP f59b <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x15b> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
ADD %RDX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
JMP f596 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x156> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
ADD %RDX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
JMP f591 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x151> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
ADD %RDX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
ADD 0x30(%R9,%RAX,8),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
ADD 0x28(%R9,%RAX,8),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
ADD 0x20(%R9,%RAX,8),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
ADD 0x18(%R9,%RAX,8),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
ADD 0x10(%R9,%RAX,8),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
ADD 0x8(%R9,%RAX,8),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
ADD (%R9,%RAX,8),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
MOV %RCX,(%R14,%R12,8) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV (%R13),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
LEA 0x17dd3(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CALL 5500 <__kmpc_barrier@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
TEST %R12,%R12 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JNE f666 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x226> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV 0xc8(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
TEST %RAX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JLE f666 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x226> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV (%R14),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
CMP $0x8,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JB f637 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x1f7> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
SHR $0x3,%RDX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (12.5%) |
LEA 0x40(%R14),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
AND $-0x8,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
CMP %RAX,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JAE f666 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x226> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
MOV (%R13),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
LEA 0x17d3f(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CALL 5500 <__kmpc_barrier@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
TEST %R12,%R12 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JE f682 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x242> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV -0x8(%R14,%R12,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
JMP f684 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x244> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | N/A |
MOV %RAX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV -0x58(%RBP),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
MOV %R15,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV -0x50(%RBP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
CMP %RSI,%R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JGE fe08 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x9c8> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV 0xb0(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV 0xa8(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
CMPQ $0,0x18(%RBP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (12.5%) |
LEA (%RAX,%R12,8),%R13 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
SETNE %AL | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
CMPQ $0,0x98(%RBP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (12.5%) |
SETG %DIL | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
AND %AL,%DIL | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %DIL,-0x29(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | N/A |
MOV 0x20(%RBP),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
LEA 0x18(%RCX),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RAX,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | N/A |
MOV %RAX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
JMP f6fc <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x2bc> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
ADD $0x68,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_IJMatrixSetValuesOMPParCSR.extracted.28– | 1.21 | 0.89 |
▼Loop 144 - IJMatrix_parcsr.c:3262-3484 - libIJ_mv.so– | 0.15 | 0.11 |
▼Loop 156 - IJMatrix_parcsr.c:3316-3341 - libIJ_mv.so– | 0.00 | 0.00 |
○Loop 157 - IJMatrix_parcsr.c:3318-3320 - libIJ_mv.so | 0.00 | 0.00 |
○Loop 155 - IJMatrix_parcsr.c:3359-3362 - libIJ_mv.so | 0.00 | 0.00 |
▼Loop 151 - IJMatrix_parcsr.c:3383-3454 - libIJ_mv.so– | 0.00 | 0.00 |
○Loop 153 - IJMatrix_parcsr.c:3422-3424 - libIJ_mv.so | 0.00 | 0.00 |
○Loop 152 - IJMatrix_parcsr.c:3388-3390 - libIJ_mv.so | 0.00 | 0.00 |
○Loop 154 - IJMatrix_parcsr.c:3359-3362 - libIJ_mv.so | 0.00 | 0.00 |
▼Loop 145 - IJMatrix_parcsr.c:3262-3484 - libIJ_mv.so– | 0.00 | 0.00 |
▼Loop 146 - IJMatrix_parcsr.c:3473-3484 - libIJ_mv.so– | 0.38 | 0.26 |
○Loop 148 - IJMatrix_parcsr.c:3478-3484 - libIJ_mv.so | 0.20 | 0.14 |
○Loop 147 - IJMatrix_parcsr.c:3478-3484 - libIJ_mv.so | 0.00 | 0.00 |
▼Loop 149 - IJMatrix_parcsr.c:3475-3484 - libIJ_mv.so– | 0.00 | 0.00 |
○Loop 150 - IJMatrix_parcsr.c:3478-3484 - libIJ_mv.so | 0.00 | 0.00 |
○Loop 160 - IJMatrix_parcsr.c:3274-3275 - libIJ_mv.so | 0.01 | 0.01 |
○Loop 158 - IJMatrix_parcsr.c:3282-3283 - libIJ_mv.so | 0.00 | 0.00 |
○Loop 159 - IJMatrix_parcsr.c:3282-3283 - libIJ_mv.so | 0.00 | 0.00 |