Function: hypre_CSRMatrixMatvecOutOfPlace.extracted.19 | Module: exec | Source: csr_matvec.c:178-204 [...] | Coverage: 0.03% |
---|
Function: hypre_CSRMatrixMatvecOutOfPlace.extracted.19 | Module: exec | Source: csr_matvec.c:178-204 [...] | Coverage: 0.03% |
---|
/home/eoseret/qaas_runs_CPU_9468/171-586-9096/intel/AMG/build/AMG/AMG/seq_mv/csr_matvec.c: 178 - 204 |
-------------------------------------------------------------------------------- |
178: #pragma omp parallel for private(i,j,jj,m,tempx) HYPRE_SMP_SCHEDULE |
179: #endif |
180: |
181: for (i = 0; i < num_rownnz; i++) |
182: { |
183: m = A_rownnz[i]; |
[...] |
191: if ( num_vectors==1 ) |
192: { |
193: tempx = 0; |
194: for (jj = A_i[m]; jj < A_i[m+1]; jj++) |
195: tempx += A_data[jj] * x_data[A_j[jj]]; |
196: y_data[m] += tempx; |
197: } |
198: else |
199: for ( j=0; j<num_vectors; ++j ) |
200: { |
201: tempx = 0; |
202: for (jj = A_i[m]; jj < A_i[m+1]; jj++) |
203: tempx += A_data[jj] * x_data[ j*vecstride_x + A_j[jj]*idxstride_x ]; |
204: y_data[ j*vecstride_y + m*idxstride_y] += tempx; |
0x4c8570 PUSH %RBP |
0x4c8571 MOV %RSP,%RBP |
0x4c8574 PUSH %R15 |
0x4c8576 PUSH %R14 |
0x4c8578 PUSH %R13 |
0x4c857a PUSH %R12 |
0x4c857c PUSH %RBX |
0x4c857d SUB $0xc8,%RSP |
0x4c8584 MOV %R9,-0xb8(%RBP) |
0x4c858b MOV %R8,-0x88(%RBP) |
0x4c8592 MOV %RCX,-0x50(%RBP) |
0x4c8596 MOV %RDX,-0x80(%RBP) |
0x4c859a MOV 0x40(%RBP),%RBX |
0x4c859e MOV 0x38(%RBP),%R15 |
0x4c85a2 MOV 0x30(%RBP),%R14 |
0x4c85a6 MOV 0x28(%RBP),%RAX |
0x4c85aa MOV %RAX,-0xa0(%RBP) |
0x4c85b1 MOV 0x20(%RBP),%RAX |
0x4c85b5 MOV %RAX,-0x58(%RBP) |
0x4c85b9 MOV 0x18(%RBP),%RAX |
0x4c85bd MOV %RAX,-0x48(%RBP) |
0x4c85c1 MOV 0x10(%RBP),%RAX |
0x4c85c5 MOV %RAX,-0x78(%RBP) |
0x4c85c9 MOVL $0,-0x40(%RBP) |
0x4c85d0 MOV (%RDI),%ESI |
0x4c85d2 MOVQ $0,-0x98(%RBP) |
0x4c85dd MOVQ $0x1,-0xe8(%RBP) |
0x4c85e8 SUB $0x8,%RSP |
0x4c85ec LEA -0xe8(%RBP),%RAX |
0x4c85f3 LEA -0x40(%RBP),%RCX |
0x4c85f7 LEA -0x98(%RBP),%R8 |
0x4c85fe LEA 0x50(%RBP),%R9 |
0x4c8602 MOV $0x520db0,%EDI |
0x4c8607 MOV %ESI,-0x3c(%RBP) |
0x4c860a MOV $0x22,%EDX |
0x4c860f PUSH $0x1 |
0x4c8611 PUSH $0x1 |
0x4c8613 PUSH %RAX |
0x4c8614 CALL 410430 <__kmpc_for_static_init_8@plt> |
0x4c8619 ADD $0x20,%RSP |
0x4c861d MOV -0x98(%RBP),%RAX |
0x4c8624 MOV 0x50(%RBP),%RCX |
0x4c8628 MOV %RAX,-0xb0(%RBP) |
0x4c862f SUB %RAX,%RCX |
0x4c8632 MOV %RCX,-0xa8(%RBP) |
0x4c8639 JAE 4c865c |
0x4c863b MOV $0x520dd0,%EDI |
0x4c8640 MOV -0x3c(%RBP),%ESI |
0x4c8643 ADD $0xc8,%RSP |
0x4c864a POP %RBX |
0x4c864b POP %R12 |
0x4c864d POP %R13 |
0x4c864f POP %R14 |
0x4c8651 POP %R15 |
0x4c8653 POP %RBP |
0x4c8654 VZEROUPPER |
0x4c8657 JMP 410180 |
0x4c865c MOV -0x58(%RBP),%RAX |
0x4c8660 LEA -0x1(%RAX),%R11 |
0x4c8664 XOR %EDX,%EDX |
0x4c8666 MOV %RBX,-0x70(%RBP) |
0x4c866a MOV %R14,-0x68(%RBP) |
0x4c866e MOV %R11,-0x60(%RBP) |
0x4c8672 JMP 4c86a7 |
0x4c8674 NOPW %CS:(%RAX,%RAX,1) |
(3820) 0x4c8680 MOV -0x48(%RBP),%RAX |
(3820) 0x4c8684 MOV (%RAX),%RAX |
(3820) 0x4c8687 VADDSD (%RAX,%R12,8),%XMM0,%XMM0 |
(3820) 0x4c868d VMOVSD %XMM0,(%RAX,%R12,8) |
(3820) 0x4c8693 MOV -0xc0(%RBP),%RCX |
(3820) 0x4c869a LEA 0x1(%RCX),%RDX |
(3820) 0x4c869e CMP -0xa8(%RBP),%RCX |
(3820) 0x4c86a5 JE 4c863b |
(3820) 0x4c86a7 MOV -0xb0(%RBP),%RAX |
(3820) 0x4c86ae ADD %RDX,%RAX |
(3820) 0x4c86b1 MOV -0xb8(%RBP),%RCX |
(3820) 0x4c86b8 MOV (%RCX,%RAX,8),%R12 |
(3820) 0x4c86bc CMPQ $0x1,-0x58(%RBP) |
(3820) 0x4c86c1 MOV %RDX,-0xc0(%RBP) |
(3820) 0x4c86c8 JNE 4c8780 |
(3820) 0x4c86ce MOV -0x50(%RBP),%RAX |
(3820) 0x4c86d2 MOV (%RAX),%RAX |
(3820) 0x4c86d5 MOV (%RAX,%R12,8),%R10 |
(3820) 0x4c86d9 MOV 0x8(%RAX,%R12,8),%RAX |
(3820) 0x4c86de VXORPD %XMM0,%XMM0,%XMM0 |
(3820) 0x4c86e2 MOV %RAX,%RDX |
(3820) 0x4c86e5 SUB %R10,%RDX |
(3820) 0x4c86e8 JLE 4c8680 |
(3820) 0x4c86ea MOV -0x80(%RBP),%RCX |
(3820) 0x4c86ee MOV (%RCX),%RCX |
(3820) 0x4c86f1 MOV -0x78(%RBP),%RSI |
(3820) 0x4c86f5 MOV (%RSI),%RSI |
(3820) 0x4c86f8 MOV -0x88(%RBP),%RDI |
(3820) 0x4c86ff MOV (%RDI),%R8 |
(3820) 0x4c8702 MOV %RDX,%R9 |
(3820) 0x4c8705 AND $-0x2,%R9 |
(3820) 0x4c8709 JE 4c8945 |
(3820) 0x4c870f MOV %R12,-0x38(%RBP) |
(3820) 0x4c8713 LEA -0x1(%R9),%RDI |
(3820) 0x4c8717 LEA (%RCX,%R10,8),%R11 |
(3820) 0x4c871b LEA (%R8,%R10,8),%RBX |
(3820) 0x4c871f VXORPD %XMM0,%XMM0,%XMM0 |
(3820) 0x4c8723 XOR %R14D,%R14D |
(3820) 0x4c8726 NOPW %CS:(%RAX,%RAX,1) |
(3825) 0x4c8730 MOV (%RBX,%R14,8),%R12 |
(3825) 0x4c8734 MOV 0x8(%RBX,%R14,8),%R13 |
(3825) 0x4c8739 VMOVSD (%RSI,%R12,8),%XMM1 |
(3825) 0x4c873f VMOVHPD (%RSI,%R13,8),%XMM1,%XMM1 |
(3825) 0x4c8745 VFMADD231PD (%R11,%R14,8),%XMM1,%XMM0 |
(3825) 0x4c874b ADD $0x2,%R14 |
(3825) 0x4c874f CMP %RDI,%R14 |
(3825) 0x4c8752 JBE 4c8730 |
(3820) 0x4c8754 VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(3820) 0x4c8759 VADDSD %XMM1,%XMM0,%XMM0 |
(3820) 0x4c875d CMP %R9,%RDX |
(3820) 0x4c8760 MOV -0x70(%RBP),%RBX |
(3820) 0x4c8764 MOV -0x68(%RBP),%R14 |
(3820) 0x4c8768 MOV -0x60(%RBP),%R11 |
(3820) 0x4c876c MOV -0x38(%RBP),%R12 |
(3820) 0x4c8770 JE 4c8680 |
(3820) 0x4c8776 JMP 4c8948 |
0x4c877b NOPL (%RAX,%RAX,1) |
(3820) 0x4c8780 JL 4c8693 |
(3820) 0x4c8786 MOV -0x50(%RBP),%RAX |
(3820) 0x4c878a MOV (%RAX),%RAX |
(3820) 0x4c878d MOV (%RAX,%R12,8),%R10 |
(3820) 0x4c8791 MOV 0x8(%RAX,%R12,8),%R9 |
(3820) 0x4c8796 MOV -0x48(%RBP),%RAX |
(3820) 0x4c879a MOV (%RAX),%RAX |
(3820) 0x4c879d MOV %RAX,-0xe0(%RBP) |
(3820) 0x4c87a4 MOV %R9,%RAX |
(3820) 0x4c87a7 SUB %R10,%RAX |
(3820) 0x4c87aa MOV %RAX,-0xd0(%RBP) |
(3820) 0x4c87b1 AND $-0x4,%RAX |
(3820) 0x4c87b5 MOV %RAX,-0x90(%RBP) |
(3820) 0x4c87bc LEA -0x1(%RAX),%RCX |
(3820) 0x4c87c0 IMUL -0xa0(%RBP),%R12 |
(3820) 0x4c87c8 LEA (,%R10,8),%RAX |
(3820) 0x4c87d0 MOV %RAX,-0xc8(%RBP) |
(3820) 0x4c87d7 MOVQ $0,-0x30(%RBP) |
(3820) 0x4c87df MOV %R12,-0x38(%RBP) |
(3820) 0x4c87e3 MOV %R10,-0xd8(%RBP) |
(3820) 0x4c87ea JMP 4c8820 |
0x4c87ec NOPL (%RAX) |
(3821) 0x4c87f0 MOV -0x30(%RBP),%RSI |
(3821) 0x4c87f4 MOV %RSI,%RAX |
(3821) 0x4c87f7 IMUL %R14,%RAX |
(3821) 0x4c87fb ADD %R12,%RAX |
(3821) 0x4c87fe MOV -0xe0(%RBP),%RDX |
(3821) 0x4c8805 VADDSD (%RDX,%RAX,8),%XMM0,%XMM0 |
(3821) 0x4c880a VMOVSD %XMM0,(%RDX,%RAX,8) |
(3821) 0x4c880f LEA 0x1(%RSI),%RAX |
(3821) 0x4c8813 CMP %R11,%RSI |
(3821) 0x4c8816 MOV %RAX,-0x30(%RBP) |
(3821) 0x4c881a JE 4c8693 |
(3821) 0x4c8820 VXORPD %XMM0,%XMM0,%XMM0 |
(3821) 0x4c8824 CMP %R10,%R9 |
(3821) 0x4c8827 JLE 4c87f0 |
(3821) 0x4c8829 MOV -0x80(%RBP),%RAX |
(3821) 0x4c882d MOV (%RAX),%R13 |
(3821) 0x4c8830 MOV -0x78(%RBP),%RAX |
(3821) 0x4c8834 MOV (%RAX),%RSI |
(3821) 0x4c8837 MOV -0x88(%RBP),%RAX |
(3821) 0x4c883e MOV (%RAX),%RAX |
(3821) 0x4c8841 CMPQ $0,-0x90(%RBP) |
(3821) 0x4c8849 JE 4c890e |
(3821) 0x4c884f MOV -0x30(%RBP),%R14 |
(3821) 0x4c8853 IMUL %RBX,%R14 |
(3821) 0x4c8857 MOV -0xc8(%RBP),%RDI |
(3821) 0x4c885e LEA (%RDI,%R13,1),%RDX |
(3821) 0x4c8862 LEA (%RAX,%RDI,1),%R12 |
(3821) 0x4c8866 VXORPD %XMM0,%XMM0,%XMM0 |
(3821) 0x4c886a XOR %EDI,%EDI |
(3821) 0x4c886c NOPL (%RAX) |
(3823) 0x4c8870 MOV (%R12,%RDI,8),%R11 |
(3823) 0x4c8874 IMUL %R15,%R11 |
(3823) 0x4c8878 ADD %R14,%R11 |
(3823) 0x4c887b MOV 0x8(%R12,%RDI,8),%R8 |
(3823) 0x4c8880 IMUL %R15,%R8 |
(3823) 0x4c8884 ADD %R14,%R8 |
(3823) 0x4c8887 MOV 0x10(%R12,%RDI,8),%R10 |
(3823) 0x4c888c IMUL %R15,%R10 |
(3823) 0x4c8890 ADD %R14,%R10 |
(3823) 0x4c8893 MOV 0x18(%R12,%RDI,8),%RBX |
(3823) 0x4c8898 IMUL %R15,%RBX |
(3823) 0x4c889c ADD %R14,%RBX |
(3823) 0x4c889f VMOVSD (%RSI,%R10,8),%XMM1 |
(3823) 0x4c88a5 VMOVHPD (%RSI,%RBX,8),%XMM1,%XMM1 |
(3823) 0x4c88aa VMOVSD (%RSI,%R11,8),%XMM2 |
(3823) 0x4c88b0 VMOVHPD (%RSI,%R8,8),%XMM2,%XMM2 |
(3823) 0x4c88b6 VINSERTF128 $0x1,%XMM1,%YMM2,%YMM1 |
(3823) 0x4c88bc VFMADD231PD (%RDX,%RDI,8),%YMM1,%YMM0 |
(3823) 0x4c88c2 ADD $0x4,%RDI |
(3823) 0x4c88c6 CMP %RCX,%RDI |
(3823) 0x4c88c9 JBE 4c8870 |
(3821) 0x4c88cb VEXTRACTF128 $0x1,%YMM0,%XMM1 |
(3821) 0x4c88d1 VADDPD %XMM1,%XMM0,%XMM0 |
(3821) 0x4c88d5 VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(3821) 0x4c88da VADDSD %XMM1,%XMM0,%XMM0 |
(3821) 0x4c88de MOV -0x90(%RBP),%RDI |
(3821) 0x4c88e5 MOV %RDI,%RDX |
(3821) 0x4c88e8 CMP %RDI,-0xd0(%RBP) |
(3821) 0x4c88ef MOV -0x70(%RBP),%RBX |
(3821) 0x4c88f3 MOV -0x68(%RBP),%R14 |
(3821) 0x4c88f7 MOV -0x60(%RBP),%R11 |
(3821) 0x4c88fb MOV -0x38(%RBP),%R12 |
(3821) 0x4c88ff MOV -0xd8(%RBP),%R10 |
(3821) 0x4c8906 JE 4c87f0 |
(3821) 0x4c890c JMP 4c8910 |
(3821) 0x4c890e XOR %EDX,%EDX |
(3821) 0x4c8910 MOV -0x30(%RBP),%RDI |
(3821) 0x4c8914 IMUL %RBX,%RDI |
(3821) 0x4c8918 ADD %R10,%RDX |
(3821) 0x4c891b NOPL (%RAX,%RAX,1) |
(3822) 0x4c8920 MOV (%RAX,%RDX,8),%R8 |
(3822) 0x4c8924 IMUL %R15,%R8 |
(3822) 0x4c8928 ADD %RDI,%R8 |
(3822) 0x4c892b VMOVSD (%RSI,%R8,8),%XMM1 |
(3822) 0x4c8931 VFMADD231SD (%R13,%RDX,8),%XMM1,%XMM0 |
(3822) 0x4c8938 INC %RDX |
(3822) 0x4c893b CMP %RDX,%R9 |
(3822) 0x4c893e JNE 4c8920 |
(3821) 0x4c8940 JMP 4c87f0 |
(3820) 0x4c8945 XOR %R9D,%R9D |
(3820) 0x4c8948 ADD %R10,%R9 |
(3820) 0x4c894b NOPL (%RAX,%RAX,1) |
(3824) 0x4c8950 MOV (%R8,%R9,8),%RDX |
(3824) 0x4c8954 VMOVSD (%RSI,%RDX,8),%XMM1 |
(3824) 0x4c8959 VFMADD231SD (%RCX,%R9,8),%XMM1,%XMM0 |
(3824) 0x4c895f INC %R9 |
(3824) 0x4c8962 CMP %R9,%RAX |
(3824) 0x4c8965 JNE 4c8950 |
(3820) 0x4c8967 JMP 4c8680 |
0x4c896c NOPL (%RAX) |
Path / |
Source file and lines | csr_matvec.c:178-204 |
Module | exec |
nb instructions | 68 |
nb uops | 70 |
loop length | 285 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 25 |
micro-operation queue | 11.67 cycles |
front end | 11.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 1.50 | 1.40 | 6.00 | 6.00 | 13.50 | 1.40 | 1.30 | 13.50 | 13.50 | 13.50 | 1.40 | 6.00 |
cycles | 1.50 | 1.40 | 6.00 | 6.00 | 13.50 | 1.40 | 1.30 | 13.50 | 13.50 | 13.50 | 1.40 | 6.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 13.58 |
Stall cycles | 1.80-1.80 |
RS full (events) | 5.23-4.97 |
Front-end | 11.67 |
Dispatch | 13.50 |
Overall L1 | 13.50 |
all | 3% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 33% |
all | 11% |
load | 10% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0xc8,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x28(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x18(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVL $0,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVQ $0x1,-0xe8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0xe8(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x40(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x98(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x50(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x520db0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,-0x3c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x22,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
CALL 410430 <__kmpc_for_static_init_8@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x20,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x98(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x50(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JAE 4c865c <hypre_CSRMatrixMatvecOutOfPlace.extracted.19+0xec> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x520dd0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x3c(%RBP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD $0xc8,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JMP 410180 <__kmpc_for_static_fini@plt> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x1(%RAX),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RBX,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c86a7 <hypre_CSRMatrixMatvecOutOfPlace.extracted.19+0x137> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | csr_matvec.c:178-204 |
Module | exec |
nb instructions | 68 |
nb uops | 70 |
loop length | 285 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 25 |
micro-operation queue | 11.67 cycles |
front end | 11.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 1.50 | 1.40 | 6.00 | 6.00 | 13.50 | 1.40 | 1.30 | 13.50 | 13.50 | 13.50 | 1.40 | 6.00 |
cycles | 1.50 | 1.40 | 6.00 | 6.00 | 13.50 | 1.40 | 1.30 | 13.50 | 13.50 | 13.50 | 1.40 | 6.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 13.58 |
Stall cycles | 1.80-1.80 |
RS full (events) | 5.23-4.97 |
Front-end | 11.67 |
Dispatch | 13.50 |
Overall L1 | 13.50 |
all | 3% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 33% |
all | 11% |
load | 10% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0xc8,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x28(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x18(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVL $0,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVQ $0x1,-0xe8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0xe8(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x40(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x98(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x50(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x520db0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,-0x3c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x22,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
CALL 410430 <__kmpc_for_static_init_8@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x20,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x98(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x50(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JAE 4c865c <hypre_CSRMatrixMatvecOutOfPlace.extracted.19+0xec> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x520dd0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x3c(%RBP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD $0xc8,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JMP 410180 <__kmpc_for_static_fini@plt> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x1(%RAX),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RBX,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c86a7 <hypre_CSRMatrixMatvecOutOfPlace.extracted.19+0x137> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_CSRMatrixMatvecOutOfPlace.extracted.19– | 0.03 | 0.01 |
▼Loop 3820 - csr_matvec.c:178-204 - exec– | 0 | 0 |
○Loop 3825 - csr_matvec.c:194-195 - exec | 0.02 | 0.01 |
○Loop 3824 - csr_matvec.c:194-195 - exec | 0 | 0 |
▼Loop 3821 - csr_matvec.c:199-204 - exec– | 0 | 0 |
○Loop 3822 - csr_matvec.c:202-203 - exec | 0 | 0 |
○Loop 3823 - csr_matvec.c:202-203 - exec | 0 | 0 |