Function: hypre_IJMatrixAssembleParCSR.extracted.25 | Module: exec | Source: IJMatrix_parcsr.c:2798-2812 | Coverage: 0.57% |
---|
Function: hypre_IJMatrixAssembleParCSR.extracted.25 | Module: exec | Source: IJMatrix_parcsr.c:2798-2812 | Coverage: 0.57% |
---|
/home/eoseret/qaas_runs_CPU_9468/172-019-1763/intel/AMG/build/AMG/AMG/IJ_mv/IJMatrix_parcsr.c: 2798 - 2812 |
-------------------------------------------------------------------------------- |
2798: #pragma omp parallel for private (i,j,j0,temp) |
2799: #endif |
2800: for (i=0; i < num_rows; i++) |
2801: { |
2802: j0 = diag_i[i]; |
2803: for (j=j0; j < diag_i[i+1]; j++) |
2804: { |
2805: diag_j[j] -= col_0; |
2806: if (diag_j[j] == i) |
2807: { |
2808: temp = diag_data[j0]; |
2809: diag_data[j0] = diag_data[j]; |
2810: diag_data[j] = temp; |
2811: diag_j[j] = diag_j[j0]; |
2812: diag_j[j0] = i; |
0x55a990 PUSH %RBP |
0x55a991 MOV %RSP,%RBP |
0x55a994 PUSH %R15 |
0x55a996 PUSH %R14 |
0x55a998 PUSH %R13 |
0x55a99a PUSH %R12 |
0x55a99c PUSH %RBX |
0x55a99d SUB $0x18,%RSP |
0x55a9a1 MOVL $0,-0x2c(%RBP) |
0x55a9a8 MOV %R9,%RBX |
0x55a9ab MOV %R8,%R14 |
0x55a9ae MOV %RCX,%R15 |
0x55a9b1 MOV %RDX,%R13 |
0x55a9b4 MOV (%RDI),%R12D |
0x55a9b7 MOVQ $0,-0x38(%RBP) |
0x55a9bf MOVQ $0x1,-0x40(%RBP) |
0x55a9c7 SUB $0x8,%RSP |
0x55a9cb LEA -0x40(%RBP),%RAX |
0x55a9cf MOV $0x5d9770,%EDI |
0x55a9d4 MOV %R12D,%ESI |
0x55a9d7 LEA -0x2c(%RBP),%RCX |
0x55a9db LEA -0x38(%RBP),%R8 |
0x55a9df LEA 0x18(%RBP),%R9 |
0x55a9e3 MOV $0x22,%EDX |
0x55a9e8 PUSH $0x1 |
0x55a9ea PUSH $0x1 |
0x55a9ec PUSH %RAX |
0x55a9ed CALL 410420 <__kmpc_for_static_init_8@plt> |
0x55a9f2 ADD $0x20,%RSP |
0x55a9f6 MOV 0x18(%RBP),%RAX |
0x55a9fa MOV -0x38(%RBP),%RDI |
0x55a9fe MOV %RAX,%RSI |
0x55aa01 SUB %RDI,%RSI |
0x55aa04 JB 55aaaf |
0x55aa0a MOV (%R13,%RDI,8),%R9 |
0x55aa0f MOV %EAX,%R8D |
0x55aa12 SUB %EDI,%R8D |
0x55aa15 INC %R8D |
0x55aa18 AND $0x7,%R8 |
0x55aa1c JE 55aaa3 |
0x55aa22 XOR %R10D,%R10D |
0x55aa25 JMP 55aa3e |
0x55aa27 NOPW (%RAX,%RAX,1) |
(5766) 0x55aa30 INC %R10 |
(5766) 0x55aa33 MOV %RDX,%R9 |
(5766) 0x55aa36 MOV %RCX,%RDI |
(5766) 0x55aa39 CMP %R8,%R10 |
(5766) 0x55aa3c JE 55aaa9 |
(5766) 0x55aa3e MOV 0x8(%R13,%RDI,8),%RDX |
(5766) 0x55aa43 LEA 0x1(%RDI),%RCX |
(5766) 0x55aa47 CMP %RDX,%R9 |
(5766) 0x55aa4a JGE 55aa30 |
(5766) 0x55aa4c MOV %R9,%R11 |
(5766) 0x55aa4f JMP 55aa6d |
0x55aa51 NOPW %CS:(%RAX,%RAX,1) |
(5767) 0x55aa60 MOV (%R13,%RCX,8),%RDX |
(5767) 0x55aa65 INC %R11 |
(5767) 0x55aa68 CMP %RDX,%R11 |
(5767) 0x55aa6b JGE 55aa30 |
(5767) 0x55aa6d MOV (%R15,%R11,8),%RDX |
(5767) 0x55aa71 SUB %RBX,%RDX |
(5767) 0x55aa74 MOV %RDX,(%R15,%R11,8) |
(5767) 0x55aa78 CMP %RDI,%RDX |
(5767) 0x55aa7b JNE 55aa60 |
(5767) 0x55aa7d VMOVSD (%R14,%R9,8),%XMM0 |
(5767) 0x55aa83 VMOVSD (%R14,%R11,8),%XMM1 |
(5767) 0x55aa89 VMOVSD %XMM1,(%R14,%R9,8) |
(5767) 0x55aa8f VMOVSD %XMM0,(%R14,%R11,8) |
(5767) 0x55aa95 MOV (%R15,%R9,8),%RDX |
(5767) 0x55aa99 MOV %RDX,(%R15,%R11,8) |
(5767) 0x55aa9d MOV %RDI,(%R15,%R9,8) |
(5767) 0x55aaa1 JMP 55aa60 |
0x55aaa3 MOV %R9,%RDX |
0x55aaa6 MOV %RDI,%RCX |
0x55aaa9 CMP $0x7,%RSI |
0x55aaad JAE 55aad5 |
0x55aaaf MOV $0x5d9790,%EDI |
0x55aab4 MOV %R12D,%ESI |
0x55aab7 ADD $0x18,%RSP |
0x55aabb POP %RBX |
0x55aabc POP %R12 |
0x55aabe POP %R13 |
0x55aac0 POP %R14 |
0x55aac2 POP %R15 |
0x55aac4 POP %RBP |
0x55aac5 JMP 410170 |
0x55aaca NOPW (%RAX,%RAX,1) |
(5757) 0x55aad0 CMP %RAX,%RDI |
(5757) 0x55aad3 JE 55aaaf |
(5757) 0x55aad5 MOV 0x8(%R13,%RCX,8),%RSI |
(5757) 0x55aada CMP %RSI,%RDX |
(5757) 0x55aadd JGE 55ab40 |
(5757) 0x55aadf MOV %RDX,%RDI |
(5757) 0x55aae2 JMP 55aafd |
0x55aae4 NOPW %CS:(%RAX,%RAX,1) |
(5765) 0x55aaf0 MOV 0x8(%R13,%RCX,8),%RSI |
(5765) 0x55aaf5 INC %RDI |
(5765) 0x55aaf8 CMP %RSI,%RDI |
(5765) 0x55aafb JGE 55ab40 |
(5765) 0x55aafd MOV (%R15,%RDI,8),%RSI |
(5765) 0x55ab01 SUB %RBX,%RSI |
(5765) 0x55ab04 MOV %RSI,(%R15,%RDI,8) |
(5765) 0x55ab08 CMP %RCX,%RSI |
(5765) 0x55ab0b JNE 55aaf0 |
(5765) 0x55ab0d VMOVSD (%R14,%RDX,8),%XMM0 |
(5765) 0x55ab13 VMOVSD (%R14,%RDI,8),%XMM1 |
(5765) 0x55ab19 VMOVSD %XMM1,(%R14,%RDX,8) |
(5765) 0x55ab1f VMOVSD %XMM0,(%R14,%RDI,8) |
(5765) 0x55ab25 MOV (%R15,%RDX,8),%RSI |
(5765) 0x55ab29 MOV %RSI,(%R15,%RDI,8) |
(5765) 0x55ab2d MOV %RCX,(%R15,%RDX,8) |
(5765) 0x55ab31 JMP 55aaf0 |
0x55ab33 NOPW %CS:(%RAX,%RAX,1) |
(5757) 0x55ab40 MOV 0x10(%R13,%RCX,8),%RDX |
(5757) 0x55ab45 CMP %RDX,%RSI |
(5757) 0x55ab48 JGE 55abb0 |
(5757) 0x55ab4a LEA 0x1(%RCX),%RDI |
(5757) 0x55ab4e MOV %RSI,%R8 |
(5757) 0x55ab51 JMP 55ab6d |
0x55ab53 NOPW %CS:(%RAX,%RAX,1) |
(5764) 0x55ab60 MOV 0x10(%R13,%RCX,8),%RDX |
(5764) 0x55ab65 INC %R8 |
(5764) 0x55ab68 CMP %RDX,%R8 |
(5764) 0x55ab6b JGE 55abb0 |
(5764) 0x55ab6d MOV (%R15,%R8,8),%RDX |
(5764) 0x55ab71 SUB %RBX,%RDX |
(5764) 0x55ab74 MOV %RDX,(%R15,%R8,8) |
(5764) 0x55ab78 CMP %RDI,%RDX |
(5764) 0x55ab7b JNE 55ab60 |
(5764) 0x55ab7d VMOVSD (%R14,%RSI,8),%XMM0 |
(5764) 0x55ab83 VMOVSD (%R14,%R8,8),%XMM1 |
(5764) 0x55ab89 VMOVSD %XMM1,(%R14,%RSI,8) |
(5764) 0x55ab8f VMOVSD %XMM0,(%R14,%R8,8) |
(5764) 0x55ab95 MOV (%R15,%RSI,8),%RDX |
(5764) 0x55ab99 MOV %RDX,(%R15,%R8,8) |
(5764) 0x55ab9d MOV %RDI,(%R15,%RSI,8) |
(5764) 0x55aba1 JMP 55ab60 |
0x55aba3 NOPW %CS:(%RAX,%RAX,1) |
(5757) 0x55abb0 MOV 0x18(%R13,%RCX,8),%RSI |
(5757) 0x55abb5 CMP %RSI,%RDX |
(5757) 0x55abb8 JGE 55ac20 |
(5757) 0x55abba LEA 0x2(%RCX),%RDI |
(5757) 0x55abbe MOV %RDX,%R8 |
(5757) 0x55abc1 JMP 55abdd |
0x55abc3 NOPW %CS:(%RAX,%RAX,1) |
(5763) 0x55abd0 MOV 0x18(%R13,%RCX,8),%RSI |
(5763) 0x55abd5 INC %R8 |
(5763) 0x55abd8 CMP %RSI,%R8 |
(5763) 0x55abdb JGE 55ac20 |
(5763) 0x55abdd MOV (%R15,%R8,8),%RSI |
(5763) 0x55abe1 SUB %RBX,%RSI |
(5763) 0x55abe4 MOV %RSI,(%R15,%R8,8) |
(5763) 0x55abe8 CMP %RDI,%RSI |
(5763) 0x55abeb JNE 55abd0 |
(5763) 0x55abed VMOVSD (%R14,%RDX,8),%XMM0 |
(5763) 0x55abf3 VMOVSD (%R14,%R8,8),%XMM1 |
(5763) 0x55abf9 VMOVSD %XMM1,(%R14,%RDX,8) |
(5763) 0x55abff VMOVSD %XMM0,(%R14,%R8,8) |
(5763) 0x55ac05 MOV (%R15,%RDX,8),%RSI |
(5763) 0x55ac09 MOV %RSI,(%R15,%R8,8) |
(5763) 0x55ac0d MOV %RDI,(%R15,%RDX,8) |
(5763) 0x55ac11 JMP 55abd0 |
0x55ac13 NOPW %CS:(%RAX,%RAX,1) |
(5757) 0x55ac20 MOV 0x20(%R13,%RCX,8),%RDX |
(5757) 0x55ac25 CMP %RDX,%RSI |
(5757) 0x55ac28 JGE 55ac90 |
(5757) 0x55ac2a LEA 0x3(%RCX),%RDI |
(5757) 0x55ac2e MOV %RSI,%R8 |
(5757) 0x55ac31 JMP 55ac4d |
0x55ac33 NOPW %CS:(%RAX,%RAX,1) |
(5762) 0x55ac40 MOV 0x20(%R13,%RCX,8),%RDX |
(5762) 0x55ac45 INC %R8 |
(5762) 0x55ac48 CMP %RDX,%R8 |
(5762) 0x55ac4b JGE 55ac90 |
(5762) 0x55ac4d MOV (%R15,%R8,8),%RDX |
(5762) 0x55ac51 SUB %RBX,%RDX |
(5762) 0x55ac54 MOV %RDX,(%R15,%R8,8) |
(5762) 0x55ac58 CMP %RDI,%RDX |
(5762) 0x55ac5b JNE 55ac40 |
(5762) 0x55ac5d VMOVSD (%R14,%RSI,8),%XMM0 |
(5762) 0x55ac63 VMOVSD (%R14,%R8,8),%XMM1 |
(5762) 0x55ac69 VMOVSD %XMM1,(%R14,%RSI,8) |
(5762) 0x55ac6f VMOVSD %XMM0,(%R14,%R8,8) |
(5762) 0x55ac75 MOV (%R15,%RSI,8),%RDX |
(5762) 0x55ac79 MOV %RDX,(%R15,%R8,8) |
(5762) 0x55ac7d MOV %RDI,(%R15,%RSI,8) |
(5762) 0x55ac81 JMP 55ac40 |
0x55ac83 NOPW %CS:(%RAX,%RAX,1) |
(5757) 0x55ac90 MOV 0x28(%R13,%RCX,8),%RSI |
(5757) 0x55ac95 CMP %RSI,%RDX |
(5757) 0x55ac98 JGE 55ad00 |
(5757) 0x55ac9a LEA 0x4(%RCX),%RDI |
(5757) 0x55ac9e MOV %RDX,%R8 |
(5757) 0x55aca1 JMP 55acbd |
0x55aca3 NOPW %CS:(%RAX,%RAX,1) |
(5761) 0x55acb0 MOV 0x28(%R13,%RCX,8),%RSI |
(5761) 0x55acb5 INC %R8 |
(5761) 0x55acb8 CMP %RSI,%R8 |
(5761) 0x55acbb JGE 55ad00 |
(5761) 0x55acbd MOV (%R15,%R8,8),%RSI |
(5761) 0x55acc1 SUB %RBX,%RSI |
(5761) 0x55acc4 MOV %RSI,(%R15,%R8,8) |
(5761) 0x55acc8 CMP %RDI,%RSI |
(5761) 0x55accb JNE 55acb0 |
(5761) 0x55accd VMOVSD (%R14,%RDX,8),%XMM0 |
(5761) 0x55acd3 VMOVSD (%R14,%R8,8),%XMM1 |
(5761) 0x55acd9 VMOVSD %XMM1,(%R14,%RDX,8) |
(5761) 0x55acdf VMOVSD %XMM0,(%R14,%R8,8) |
(5761) 0x55ace5 MOV (%R15,%RDX,8),%RSI |
(5761) 0x55ace9 MOV %RSI,(%R15,%R8,8) |
(5761) 0x55aced MOV %RDI,(%R15,%RDX,8) |
(5761) 0x55acf1 JMP 55acb0 |
0x55acf3 NOPW %CS:(%RAX,%RAX,1) |
(5757) 0x55ad00 MOV 0x30(%R13,%RCX,8),%RDX |
(5757) 0x55ad05 CMP %RDX,%RSI |
(5757) 0x55ad08 JGE 55ad70 |
(5757) 0x55ad0a LEA 0x5(%RCX),%RDI |
(5757) 0x55ad0e MOV %RSI,%R8 |
(5757) 0x55ad11 JMP 55ad2d |
0x55ad13 NOPW %CS:(%RAX,%RAX,1) |
(5760) 0x55ad20 MOV 0x30(%R13,%RCX,8),%RDX |
(5760) 0x55ad25 INC %R8 |
(5760) 0x55ad28 CMP %RDX,%R8 |
(5760) 0x55ad2b JGE 55ad70 |
(5760) 0x55ad2d MOV (%R15,%R8,8),%RDX |
(5760) 0x55ad31 SUB %RBX,%RDX |
(5760) 0x55ad34 MOV %RDX,(%R15,%R8,8) |
(5760) 0x55ad38 CMP %RDI,%RDX |
(5760) 0x55ad3b JNE 55ad20 |
(5760) 0x55ad3d VMOVSD (%R14,%RSI,8),%XMM0 |
(5760) 0x55ad43 VMOVSD (%R14,%R8,8),%XMM1 |
(5760) 0x55ad49 VMOVSD %XMM1,(%R14,%RSI,8) |
(5760) 0x55ad4f VMOVSD %XMM0,(%R14,%R8,8) |
(5760) 0x55ad55 MOV (%R15,%RSI,8),%RDX |
(5760) 0x55ad59 MOV %RDX,(%R15,%R8,8) |
(5760) 0x55ad5d MOV %RDI,(%R15,%RSI,8) |
(5760) 0x55ad61 JMP 55ad20 |
0x55ad63 NOPW %CS:(%RAX,%RAX,1) |
(5757) 0x55ad70 MOV 0x38(%R13,%RCX,8),%RSI |
(5757) 0x55ad75 CMP %RSI,%RDX |
(5757) 0x55ad78 JGE 55ade0 |
(5757) 0x55ad7a LEA 0x6(%RCX),%RDI |
(5757) 0x55ad7e MOV %RDX,%R8 |
(5757) 0x55ad81 JMP 55ad9d |
0x55ad83 NOPW %CS:(%RAX,%RAX,1) |
(5759) 0x55ad90 MOV 0x38(%R13,%RCX,8),%RSI |
(5759) 0x55ad95 INC %R8 |
(5759) 0x55ad98 CMP %RSI,%R8 |
(5759) 0x55ad9b JGE 55ade0 |
(5759) 0x55ad9d MOV (%R15,%R8,8),%RSI |
(5759) 0x55ada1 SUB %RBX,%RSI |
(5759) 0x55ada4 MOV %RSI,(%R15,%R8,8) |
(5759) 0x55ada8 CMP %RDI,%RSI |
(5759) 0x55adab JNE 55ad90 |
(5759) 0x55adad VMOVSD (%R14,%RDX,8),%XMM0 |
(5759) 0x55adb3 VMOVSD (%R14,%R8,8),%XMM1 |
(5759) 0x55adb9 VMOVSD %XMM1,(%R14,%RDX,8) |
(5759) 0x55adbf VMOVSD %XMM0,(%R14,%R8,8) |
(5759) 0x55adc5 MOV (%R15,%RDX,8),%RSI |
(5759) 0x55adc9 MOV %RSI,(%R15,%R8,8) |
(5759) 0x55adcd MOV %RDI,(%R15,%RDX,8) |
(5759) 0x55add1 JMP 55ad90 |
0x55add3 NOPW %CS:(%RAX,%RAX,1) |
(5757) 0x55ade0 MOV 0x40(%R13,%RCX,8),%RDX |
(5757) 0x55ade5 LEA 0x7(%RCX),%RDI |
(5757) 0x55ade9 ADD $0x8,%RCX |
(5757) 0x55aded CMP %RDX,%RSI |
(5757) 0x55adf0 JGE 55aad0 |
(5757) 0x55adf6 MOV %RSI,%R8 |
(5757) 0x55adf9 JMP 55ae11 |
0x55adfb NOPL (%RAX,%RAX,1) |
(5758) 0x55ae00 MOV (%R13,%RCX,8),%RDX |
(5758) 0x55ae05 INC %R8 |
(5758) 0x55ae08 CMP %RDX,%R8 |
(5758) 0x55ae0b JGE 55aad0 |
(5758) 0x55ae11 MOV (%R15,%R8,8),%RDX |
(5758) 0x55ae15 SUB %RBX,%RDX |
(5758) 0x55ae18 MOV %RDX,(%R15,%R8,8) |
(5758) 0x55ae1c CMP %RDI,%RDX |
(5758) 0x55ae1f JNE 55ae00 |
(5758) 0x55ae21 VMOVSD (%R14,%RSI,8),%XMM0 |
(5758) 0x55ae27 VMOVSD (%R14,%R8,8),%XMM1 |
(5758) 0x55ae2d VMOVSD %XMM1,(%R14,%RSI,8) |
(5758) 0x55ae33 VMOVSD %XMM0,(%R14,%R8,8) |
(5758) 0x55ae39 MOV (%R15,%RSI,8),%RDX |
(5758) 0x55ae3d MOV %RDX,(%R15,%R8,8) |
(5758) 0x55ae41 MOV %RDI,(%R15,%RSI,8) |
(5758) 0x55ae45 JMP 55ae00 |
0x55ae47 NOPW (%RAX,%RAX,1) |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►100.00+ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Path / |
Source file and lines | IJMatrix_parcsr.c:2798-2812 |
Module | exec |
nb instructions | 75 |
nb uops | 57 |
loop length | 415 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 4 |
micro-operation queue | 9.50 cycles |
front end | 9.50 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 4.75 | 4.75 | 4.75 | 4.75 | 3.00 | 2.67 | 2.67 | 2.67 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
cycles | 4.75 | 4.75 | 4.75 | 4.75 | 3.00 | 2.67 | 2.67 | 2.67 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 9.50 |
Dispatch | 4.75 |
Overall L1 | 9.50 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 9% |
load | 9% |
store | 6% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 8% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 10% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput | Vectorization |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
SUB $0x18,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOVL $0,-0x2c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %R8,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %RCX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
MOV (%RDI),%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (6.3%) |
MOVQ $0,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOVQ $0x1,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x40(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV $0x5d9770,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %R12D,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (6.3%) |
LEA -0x2c(%RBP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x38(%RBP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA 0x18(%RBP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
CALL 410420 <__kmpc_for_static_init_8@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV 0x18(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV -0x38(%RBP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
SUB %RDI,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JB 55aaaf <hypre_IJMatrixAssembleParCSR.extracted.25+0x11f> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV (%R13,%RDI,8),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
MOV %EAX,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (6.3%) |
SUB %EDI,%R8D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
INC %R8D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
AND $0x7,%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JE 55aaa3 <hypre_IJMatrixAssembleParCSR.extracted.25+0x113> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
XOR %R10D,%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | scal (6.3%) |
JMP 55aa3e <hypre_IJMatrixAssembleParCSR.extracted.25+0xae> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
MOV %R9,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %RDI,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
CMP $0x7,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JAE 55aad5 <hypre_IJMatrixAssembleParCSR.extracted.25+0x145> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV $0x5d9790,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %R12D,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (6.3%) |
ADD $0x18,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
JMP 410170 <__kmpc_for_static_fini@plt> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
Source file and lines | IJMatrix_parcsr.c:2798-2812 |
Module | exec |
nb instructions | 75 |
nb uops | 57 |
loop length | 415 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 4 |
micro-operation queue | 9.50 cycles |
front end | 9.50 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 4.75 | 4.75 | 4.75 | 4.75 | 3.00 | 2.67 | 2.67 | 2.67 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
cycles | 4.75 | 4.75 | 4.75 | 4.75 | 3.00 | 2.67 | 2.67 | 2.67 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 9.50 |
Dispatch | 4.75 |
Overall L1 | 9.50 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 9% |
load | 9% |
store | 6% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 8% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 10% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput | Vectorization |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
SUB $0x18,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOVL $0,-0x2c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %R8,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %RCX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
MOV (%RDI),%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (6.3%) |
MOVQ $0,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOVQ $0x1,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x40(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV $0x5d9770,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %R12D,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (6.3%) |
LEA -0x2c(%RBP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x38(%RBP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA 0x18(%RBP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
CALL 410420 <__kmpc_for_static_init_8@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV 0x18(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV -0x38(%RBP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
SUB %RDI,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JB 55aaaf <hypre_IJMatrixAssembleParCSR.extracted.25+0x11f> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV (%R13,%RDI,8),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
MOV %EAX,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (6.3%) |
SUB %EDI,%R8D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
INC %R8D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
AND $0x7,%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JE 55aaa3 <hypre_IJMatrixAssembleParCSR.extracted.25+0x113> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
XOR %R10D,%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | scal (6.3%) |
JMP 55aa3e <hypre_IJMatrixAssembleParCSR.extracted.25+0xae> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
MOV %R9,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %RDI,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
CMP $0x7,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JAE 55aad5 <hypre_IJMatrixAssembleParCSR.extracted.25+0x145> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV $0x5d9790,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %R12D,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (6.3%) |
ADD $0x18,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
JMP 410170 <__kmpc_for_static_fini@plt> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_IJMatrixAssembleParCSR.extracted.25– | 0.57 | 0.43 |
▼Loop 5757 - IJMatrix_parcsr.c:2798-2812 - exec– | 0.00 | 0.00 |
○Loop 5765 - IJMatrix_parcsr.c:2803-2812 - exec | 0.11 | 0.08 |
○Loop 5763 - IJMatrix_parcsr.c:2803-2812 - exec | 0.11 | 0.08 |
○Loop 5761 - IJMatrix_parcsr.c:2803-2812 - exec | 0.11 | 0.08 |
○Loop 5759 - IJMatrix_parcsr.c:2803-2812 - exec | 0.11 | 0.08 |
○Loop 5760 - IJMatrix_parcsr.c:2803-2812 - exec | 0.03 | 0.02 |
○Loop 5762 - IJMatrix_parcsr.c:2803-2812 - exec | 0.03 | 0.02 |
○Loop 5758 - IJMatrix_parcsr.c:2803-2812 - exec | 0.03 | 0.02 |
○Loop 5764 - IJMatrix_parcsr.c:2803-2812 - exec | 0.03 | 0.02 |
▼Loop 5766 - IJMatrix_parcsr.c:2798-2812 - exec– | 0.00 | 0.00 |
○Loop 5767 - IJMatrix_parcsr.c:2803-2812 - exec | 0.00 | 0.00 |