Function: hypre_CSRMatrixMatvecT.extracted.49 | Module: exec | Source: csr_matvec.c:554-579 [...] | Coverage: 1.26% |
---|
Function: hypre_CSRMatrixMatvecT.extracted.49 | Module: exec | Source: csr_matvec.c:554-579 [...] | Coverage: 1.26% |
---|
/home/eoseret/qaas_runs_CPU_9468/172-019-1763/intel/AMG/build/AMG/AMG/seq_mv/csr_matvec.c: 554 - 579 |
-------------------------------------------------------------------------------- |
554: #pragma omp parallel private(i,jj,j,my_thread_num,offset) |
555: #endif |
556: { |
557: my_thread_num = hypre_GetThreadNum(); |
558: offset = y_size*my_thread_num; |
559: #ifdef HYPRE_USING_OPENMP |
560: #pragma omp for HYPRE_SMP_SCHEDULE |
561: #endif |
562: for (i = 0; i < num_rows; i++) |
563: { |
564: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
565: { |
566: j = A_j[jj]; |
567: y_data_expand[offset + j] += A_data[jj] * x_data[i]; |
[...] |
573: #pragma omp for HYPRE_SMP_SCHEDULE |
574: #endif |
575: for (i = 0; i < y_size; i++) |
576: { |
577: for (j = 0; j < num_threads; j++) |
578: { |
579: y_data[i] += y_data_expand[j*y_size + i]; |
0x5786a0 PUSH %RBP |
0x5786a1 MOV %RSP,%RBP |
0x5786a4 PUSH %R15 |
0x5786a6 PUSH %R14 |
0x5786a8 PUSH %R13 |
0x5786aa PUSH %R12 |
0x5786ac PUSH %RBX |
0x5786ad SUB $0x98,%RSP |
0x5786b4 MOV %R9,-0x40(%RBP) |
0x5786b8 MOV %RCX,-0x50(%RBP) |
0x5786bc MOV %R8,%R14 |
0x5786bf MOV %RDX,%R12 |
0x5786c2 MOV %RDI,%R13 |
0x5786c5 MOV 0x30(%RBP),%RAX |
0x5786c9 MOV %RAX,-0x30(%RBP) |
0x5786cd MOV 0x20(%RBP),%RAX |
0x5786d1 MOV 0x28(%RBP),%RBX |
0x5786d5 MOV %RAX,-0x38(%RBP) |
0x5786d9 MOV 0x18(%RBP),%RAX |
0x5786dd MOV %RAX,-0x48(%RBP) |
0x5786e1 MOV 0x10(%RBP),%R15 |
0x5786e5 CALL 586110 <hypre_GetThreadNum> |
0x5786ea MOV -0x40(%RBP),%RCX |
0x5786ee MOV %R13,%RDX |
0x5786f1 MOV %R13,-0x70(%RBP) |
0x5786f5 TEST %RCX,%RCX |
0x5786f8 JLE 57894b |
0x5786fe MOVL $0,-0x84(%RBP) |
0x578708 DEC %RCX |
0x57870b MOV %RAX,%R13 |
0x57870e MOV (%RDX),%ESI |
0x578710 MOVQ $0,-0xa8(%RBP) |
0x57871b MOV %RCX,-0xa0(%RBP) |
0x578722 MOVQ $0x1,-0xb8(%RBP) |
0x57872d SUB $0x8,%RSP |
0x578731 LEA -0xb8(%RBP),%RAX |
0x578738 LEA -0x84(%RBP),%RCX |
0x57873f LEA -0xa8(%RBP),%R8 |
0x578746 LEA -0xa0(%RBP),%R9 |
0x57874d MOV $0x5d9fb0,%EDI |
0x578752 MOV %ESI,-0x78(%RBP) |
0x578755 MOV $0x22,%EDX |
0x57875a PUSH $0x1 |
0x57875c PUSH $0x1 |
0x57875e PUSH %RAX |
0x57875f CALL 410420 <__kmpc_for_static_init_8@plt> |
0x578764 ADD $0x20,%RSP |
0x578768 MOV -0xa8(%RBP),%RDX |
0x57876f MOV -0xa0(%RBP),%RAX |
0x578776 SUB %RDX,%RAX |
0x578779 MOV %RDX,%RCX |
0x57877c MOV %RDX,-0x40(%RBP) |
0x578780 JB 57892b |
0x578786 IMUL -0x38(%RBP),%R13 |
0x57878b LEA 0x1(%RAX),%RDX |
0x57878f VPBROADCASTQ %RBX,%ZMM0 |
0x578795 MOV %EDX,%ECX |
0x578797 AND $0x3,%ECX |
0x57879a MOV %RCX,-0x60(%RBP) |
0x57879e VPBROADCASTQ %R13,%ZMM1 |
0x5787a4 CMP $0x3,%RAX |
0x5787a8 JAE 578a8a |
0x5787ae XOR %R11D,%R11D |
0x5787b1 CMPQ $0,-0x60(%RBP) |
0x5787b6 JE 57892b |
0x5787bc VPBROADCASTQ 0x25cfa(%RIP),%ZMM2 |
0x5787c6 VPTERNLOGD $-0x1,%ZMM3,%ZMM3,%ZMM3 |
0x5787cd XOR %ESI,%ESI |
0x5787cf JMP 5787f0 |
0x5787d1 NOPW %CS:(%RAX,%RAX,1) |
(6538) 0x5787e0 INC %R11 |
(6538) 0x5787e3 INC %RSI |
(6538) 0x5787e6 CMP -0x60(%RBP),%RSI |
(6538) 0x5787ea JE 57892b |
(6538) 0x5787f0 MOV -0x40(%RBP),%RAX |
(6538) 0x5787f4 MOV -0x50(%RBP),%RCX |
(6538) 0x5787f8 LEA (%RAX,%R11,1),%RDI |
(6538) 0x5787fc MOV (%RCX,%RDI,8),%R10 |
(6538) 0x578800 MOV 0x8(%RCX,%RDI,8),%R8 |
(6538) 0x578805 MOV %R8,%RCX |
(6538) 0x578808 SUB %R10,%RCX |
(6538) 0x57880b JLE 5787e0 |
(6538) 0x57880d MOV %RCX,%R9 |
(6538) 0x578810 AND $-0x8,%R9 |
(6538) 0x578814 JE 5788ef |
(6538) 0x57881a MOV %R11,-0x58(%RBP) |
(6538) 0x57881e LEA -0x1(%R9),%R11 |
(6538) 0x578822 XOR %EAX,%EAX |
(6538) 0x578824 JMP 57886a |
0x578826 NOPW %CS:(%RAX,%RAX,1) |
(6540) 0x578830 KXNORW %K0,%K0,%K1 |
(6540) 0x578834 VXORPD %XMM7,%XMM7,%XMM7 |
(6540) 0x578838 VPSLLQ $0x3,%ZMM5,%ZMM6 |
(6540) 0x57883f ADD $0x8,%RAX |
(6540) 0x578843 VGATHERQPD (%RBX,%ZMM5,8),%ZMM7{%K1} |
(6540) 0x57884a VPADDQ %ZMM6,%ZMM0,%ZMM6 |
(6540) 0x578850 KXNORW %K0,%K0,%K1 |
(6540) 0x578854 VADDPD %ZMM4,%ZMM7,%ZMM4 |
(6540) 0x57885a VSCATTERQPD %ZMM4,(,%ZMM6,1){%K1} |
(6540) 0x578865 CMP %R11,%RAX |
(6540) 0x578868 JA 5788e0 |
(6540) 0x57886a VBROADCASTSD (%R15,%RDI,8),%ZMM4 |
(6540) 0x578871 LEA (%R10,%RAX,1),%RDX |
(6540) 0x578875 VPADDQ (%R14,%RDX,8),%ZMM1,%ZMM5 |
(6540) 0x57887c VPCONFLICTQ %ZMM5,%ZMM6 |
(6540) 0x578882 VPTESTMQ %ZMM6,%ZMM6,%K1 |
(6540) 0x578888 KORTESTB %K1,%K1 |
(6540) 0x57888c VMULPD (%R12,%RDX,8),%ZMM4,%ZMM4 |
(6540) 0x578893 JE 578830 |
(6540) 0x578895 VPLZCNTQ %ZMM6,%ZMM6 |
(6540) 0x57889b VPSUBQ %ZMM6,%ZMM2,%ZMM6 |
(6540) 0x5788a1 NOPW %CS:(%RAX,%RAX,1) |
(6541) 0x5788b0 VPERMQ %ZMM4,%ZMM6,%ZMM7 |
(6541) 0x5788b6 VPERMQ %ZMM6,%ZMM6,%ZMM6{%K1} |
(6541) 0x5788bc VADDPD %ZMM7,%ZMM4,%ZMM4{%K1} |
(6541) 0x5788c2 VPCMPNEQQ %ZMM3,%ZMM6,%K1 |
(6541) 0x5788c9 KORTESTB %K1,%K1 |
(6541) 0x5788cd JNE 5788b0 |
(6540) 0x5788cf JMP 578830 |
0x5788d4 NOPW %CS:(%RAX,%RAX,1) |
(6538) 0x5788e0 MOV -0x58(%RBP),%R11 |
(6538) 0x5788e4 CMP %R9,%RCX |
(6538) 0x5788e7 JE 5787e0 |
(6538) 0x5788ed JMP 5788f2 |
(6538) 0x5788ef XOR %R9D,%R9D |
(6538) 0x5788f2 ADD %R10,%R9 |
(6538) 0x5788f5 NOPW %CS:(%RAX,%RAX,1) |
(6539) 0x578900 VMOVSD (%R15,%RDI,8),%XMM4 |
(6539) 0x578906 MOV (%R14,%R9,8),%RAX |
(6539) 0x57890a VMOVSD (%R12,%R9,8),%XMM5 |
(6539) 0x578910 INC %R9 |
(6539) 0x578913 ADD %R13,%RAX |
(6539) 0x578916 VFMADD213SD (%RBX,%RAX,8),%XMM4,%XMM5 |
(6539) 0x57891c VMOVSD %XMM5,(%RBX,%RAX,8) |
(6539) 0x578921 CMP %R9,%R8 |
(6539) 0x578924 JNE 578900 |
(6538) 0x578926 JMP 5787e0 |
0x57892b MOV -0x78(%RBP),%ESI |
0x57892e MOV $0x5d9fd0,%EDI |
0x578933 VZEROUPPER |
0x578936 CALL 410170 <__kmpc_for_static_fini@plt> |
0x57893b MOV -0x70(%RBP),%RAX |
0x57893f MOV $0x5d9ff0,%EDI |
0x578944 MOV (%RAX),%ESI |
0x578946 CALL 410560 <__kmpc_barrier@plt> |
0x57894b MOV -0x38(%RBP),%R12 |
0x57894f TEST %R12,%R12 |
0x578952 JLE 578a78 |
0x578958 MOV -0x70(%RBP),%R15 |
0x57895c MOVL $0,-0x80(%RBP) |
0x578963 LEA -0x1(%R12),%RAX |
0x578968 MOV (%R15),%ESI |
0x57896b MOVQ $0,-0x98(%RBP) |
0x578976 MOV %RAX,-0x90(%RBP) |
0x57897d MOVQ $0x1,-0xb0(%RBP) |
0x578988 SUB $0x8,%RSP |
0x57898c LEA -0xb0(%RBP),%RAX |
0x578993 LEA -0x80(%RBP),%RCX |
0x578997 MOV $0x22,%EDX |
0x57899c LEA -0x98(%RBP),%R8 |
0x5789a3 LEA -0x90(%RBP),%R9 |
0x5789aa MOV $0x5d9f50,%EDI |
0x5789af MOV %ESI,-0x7c(%RBP) |
0x5789b2 PUSH $0x1 |
0x5789b4 PUSH $0x1 |
0x5789b6 PUSH %RAX |
0x5789b7 CALL 410420 <__kmpc_for_static_init_8@plt> |
0x5789bc ADD $0x20,%RSP |
0x5789c0 MOV -0x90(%RBP),%RDX |
0x5789c7 MOV -0x98(%RBP),%RAX |
0x5789ce MOV -0x30(%RBP),%R13 |
0x5789d2 MOV -0x48(%RBP),%R11 |
0x5789d6 MOV %RDX,%RCX |
0x5789d9 SUB %RAX,%RCX |
0x5789dc JB 5790b2 |
0x5789e2 MOV %R12,%R8 |
0x5789e5 SAR $0x3f,%R8 |
0x5789e9 MOV %RAX,%RSI |
0x5789ec LEA (%R11,%RDX,8),%RDI |
0x5789f0 AND %R12,%R8 |
0x5789f3 SUB %R8,%RSI |
0x5789f6 IMUL %R13,%R8 |
0x5789fa ADD %RSI,%R8 |
0x5789fd XOR %ESI,%ESI |
0x5789ff TEST %R12,%R12 |
0x578a02 LEA (%RBX,%R8,8),%R8 |
0x578a06 CMOVG %R12,%RSI |
0x578a0a CMP %R8,%RDI |
0x578a0d JB 578f7b |
0x578a13 SUB %RSI,%RDX |
0x578a16 IMUL %R13,%RSI |
0x578a1a LEA (%R11,%RAX,8),%RDI |
0x578a1e ADD %RDX,%RSI |
0x578a21 LEA (%RBX,%RSI,8),%RDX |
0x578a25 CMP %RDI,%RDX |
0x578a28 JB 578f7b |
0x578a2e LEA (%RBX,%RAX,8),%RDX |
0x578a32 SAL $0x3,%R12 |
0x578a36 XOR %ESI,%ESI |
0x578a38 NOPL (%RAX,%RAX,1) |
(6537) 0x578a40 LEA (%RAX,%RSI,1),%RDI |
(6537) 0x578a44 MOV %RDX,%R8 |
(6537) 0x578a47 MOV %R13,%R9 |
(6537) 0x578a4a VMOVSD (%R11,%RDI,8),%XMM0 |
(6536) 0x578a50 VADDSD (%R8),%XMM0,%XMM0 |
(6536) 0x578a55 ADD %R12,%R8 |
(6536) 0x578a58 DEC %R9 |
(6536) 0x578a5b VMOVSD %XMM0,(%R11,%RDI,8) |
(6536) 0x578a61 JNE 578a50 |
(6537) 0x578a63 ADD $0x8,%RDX |
(6537) 0x578a67 LEA 0x1(%RSI),%RDI |
(6537) 0x578a6b CMP %RCX,%RSI |
(6537) 0x578a6e MOV %RDI,%RSI |
(6537) 0x578a71 JNE 578a40 |
0x578a73 JMP 5790b2 |
0x578a78 ADD $0x98,%RSP |
0x578a7f POP %RBX |
0x578a80 POP %R12 |
0x578a82 POP %R13 |
0x578a84 POP %R14 |
0x578a86 POP %R15 |
0x578a88 POP %RBP |
0x578a89 RET |
0x578a8a VPBROADCASTQ 0x25a2c(%RIP),%ZMM2 |
0x578a94 MOV -0x50(%RBP),%RSI |
0x578a98 AND $-0x4,%RDX |
0x578a9c VPTERNLOGD $-0x1,%ZMM3,%ZMM3,%ZMM3 |
0x578aa3 XOR %R11D,%R11D |
0x578aa6 MOV %RDX,-0x68(%RBP) |
0x578aaa JMP 578ac1 |
0x578aac NOPL (%RAX) |
(6542) 0x578ab0 MOV -0x68(%RBP),%RDX |
(6542) 0x578ab4 ADD $0x4,%R11 |
(6542) 0x578ab8 CMP %RDX,%R11 |
(6542) 0x578abb JE 5787b1 |
(6542) 0x578ac1 MOV -0x40(%RBP),%RAX |
(6542) 0x578ac5 MOV %R11,-0x58(%RBP) |
(6542) 0x578ac9 LEA (%RAX,%R11,1),%RDI |
(6542) 0x578acd MOV 0x8(%RSI,%RDI,8),%R8 |
(6542) 0x578ad2 MOV (%RSI,%RDI,8),%R10 |
(6542) 0x578ad6 MOV %R8,%RCX |
(6542) 0x578ad9 SUB %R10,%RCX |
(6542) 0x578adc JLE 578be6 |
(6542) 0x578ae2 MOV %RCX,%R9 |
(6542) 0x578ae5 AND $-0x8,%R9 |
(6542) 0x578ae9 JE 578bb7 |
(6542) 0x578aef LEA -0x1(%R9),%R11 |
(6542) 0x578af3 XOR %EAX,%EAX |
(6542) 0x578af5 JMP 578b3a |
0x578af7 NOPW (%RAX,%RAX,1) |
(6553) 0x578b00 KXNORW %K0,%K0,%K1 |
(6553) 0x578b04 VXORPD %XMM7,%XMM7,%XMM7 |
(6553) 0x578b08 VPSLLQ $0x3,%ZMM5,%ZMM6 |
(6553) 0x578b0f ADD $0x8,%RAX |
(6553) 0x578b13 VGATHERQPD (%RBX,%ZMM5,8),%ZMM7{%K1} |
(6553) 0x578b1a VPADDQ %ZMM6,%ZMM0,%ZMM6 |
(6553) 0x578b20 KXNORW %K0,%K0,%K1 |
(6553) 0x578b24 VADDPD %ZMM4,%ZMM7,%ZMM4 |
(6553) 0x578b2a VSCATTERQPD %ZMM4,(,%ZMM6,1){%K1} |
(6553) 0x578b35 CMP %R11,%RAX |
(6553) 0x578b38 JA 578bb0 |
(6553) 0x578b3a VBROADCASTSD (%R15,%RDI,8),%ZMM4 |
(6553) 0x578b41 LEA (%R10,%RAX,1),%RDX |
(6553) 0x578b45 VPADDQ (%R14,%RDX,8),%ZMM1,%ZMM5 |
(6553) 0x578b4c VPCONFLICTQ %ZMM5,%ZMM6 |
(6553) 0x578b52 VPTESTMQ %ZMM6,%ZMM6,%K1 |
(6553) 0x578b58 KORTESTB %K1,%K1 |
(6553) 0x578b5c VMULPD (%R12,%RDX,8),%ZMM4,%ZMM4 |
(6553) 0x578b63 JE 578b00 |
(6553) 0x578b65 VPLZCNTQ %ZMM6,%ZMM6 |
(6553) 0x578b6b VPSUBQ %ZMM6,%ZMM2,%ZMM6 |
(6553) 0x578b71 NOPW %CS:(%RAX,%RAX,1) |
(6554) 0x578b80 VPERMQ %ZMM4,%ZMM6,%ZMM7 |
(6554) 0x578b86 VPERMQ %ZMM6,%ZMM6,%ZMM6{%K1} |
(6554) 0x578b8c VADDPD %ZMM7,%ZMM4,%ZMM4{%K1} |
(6554) 0x578b92 VPCMPNEQQ %ZMM3,%ZMM6,%K1 |
(6554) 0x578b99 KORTESTB %K1,%K1 |
(6554) 0x578b9d JNE 578b80 |
(6553) 0x578b9f JMP 578b00 |
0x578ba4 NOPW %CS:(%RAX,%RAX,1) |
(6542) 0x578bb0 CMP %R9,%RCX |
(6542) 0x578bb3 JNE 578bba |
(6542) 0x578bb5 JMP 578be6 |
(6542) 0x578bb7 XOR %R9D,%R9D |
(6542) 0x578bba ADD %R10,%R9 |
(6542) 0x578bbd NOPL (%RAX) |
(6552) 0x578bc0 VMOVSD (%R15,%RDI,8),%XMM4 |
(6552) 0x578bc6 MOV (%R14,%R9,8),%RAX |
(6552) 0x578bca VMOVSD (%R12,%R9,8),%XMM5 |
(6552) 0x578bd0 INC %R9 |
(6552) 0x578bd3 ADD %R13,%RAX |
(6552) 0x578bd6 VFMADD213SD (%RBX,%RAX,8),%XMM4,%XMM5 |
(6552) 0x578bdc VMOVSD %XMM5,(%RBX,%RAX,8) |
(6552) 0x578be1 CMP %R9,%R8 |
(6552) 0x578be4 JNE 578bc0 |
(6542) 0x578be6 MOV 0x10(%RSI,%RDI,8),%R8 |
(6542) 0x578beb MOV 0x8(%RSI,%RDI,8),%R11 |
(6542) 0x578bf0 MOV %R8,%RCX |
(6542) 0x578bf3 SUB %R11,%RCX |
(6542) 0x578bf6 JLE 578d16 |
(6542) 0x578bfc MOV -0x40(%RBP),%RAX |
(6542) 0x578c00 MOV -0x58(%RBP),%RDX |
(6542) 0x578c04 MOV %RCX,%R10 |
(6542) 0x578c07 AND $-0x8,%R10 |
(6542) 0x578c0b LEA 0x1(%RDX,%RAX,1),%R9 |
(6542) 0x578c10 JE 578cdb |
(6542) 0x578c16 LEA -0x1(%R10),%RSI |
(6542) 0x578c1a XOR %EAX,%EAX |
(6542) 0x578c1c JMP 578c5a |
0x578c1e XCHG %AX,%AX |
(6550) 0x578c20 KXNORW %K0,%K0,%K1 |
(6550) 0x578c24 VXORPD %XMM7,%XMM7,%XMM7 |
(6550) 0x578c28 VPSLLQ $0x3,%ZMM5,%ZMM6 |
(6550) 0x578c2f ADD $0x8,%RAX |
(6550) 0x578c33 VGATHERQPD (%RBX,%ZMM5,8),%ZMM7{%K1} |
(6550) 0x578c3a VPADDQ %ZMM6,%ZMM0,%ZMM6 |
(6550) 0x578c40 KXNORW %K0,%K0,%K1 |
(6550) 0x578c44 VADDPD %ZMM4,%ZMM7,%ZMM4 |
(6550) 0x578c4a VSCATTERQPD %ZMM4,(,%ZMM6,1){%K1} |
(6550) 0x578c55 CMP %RSI,%RAX |
(6550) 0x578c58 JA 578cd0 |
(6550) 0x578c5a VBROADCASTSD (%R15,%R9,8),%ZMM4 |
(6550) 0x578c61 LEA (%R11,%RAX,1),%RDX |
(6550) 0x578c65 VPADDQ (%R14,%RDX,8),%ZMM1,%ZMM5 |
(6550) 0x578c6c VPCONFLICTQ %ZMM5,%ZMM6 |
(6550) 0x578c72 VPTESTMQ %ZMM6,%ZMM6,%K1 |
(6550) 0x578c78 KORTESTB %K1,%K1 |
(6550) 0x578c7c VMULPD (%R12,%RDX,8),%ZMM4,%ZMM4 |
(6550) 0x578c83 JE 578c20 |
(6550) 0x578c85 VPLZCNTQ %ZMM6,%ZMM6 |
(6550) 0x578c8b VPSUBQ %ZMM6,%ZMM2,%ZMM6 |
(6550) 0x578c91 NOPW %CS:(%RAX,%RAX,1) |
(6551) 0x578ca0 VPERMQ %ZMM4,%ZMM6,%ZMM7 |
(6551) 0x578ca6 VPERMQ %ZMM6,%ZMM6,%ZMM6{%K1} |
(6551) 0x578cac VADDPD %ZMM7,%ZMM4,%ZMM4{%K1} |
(6551) 0x578cb2 VPCMPNEQQ %ZMM3,%ZMM6,%K1 |
(6551) 0x578cb9 KORTESTB %K1,%K1 |
(6551) 0x578cbd JNE 578ca0 |
(6550) 0x578cbf JMP 578c20 |
0x578cc4 NOPW %CS:(%RAX,%RAX,1) |
(6542) 0x578cd0 MOV -0x50(%RBP),%RSI |
(6542) 0x578cd4 CMP %R10,%RCX |
(6542) 0x578cd7 JNE 578cde |
(6542) 0x578cd9 JMP 578d16 |
(6542) 0x578cdb XOR %R10D,%R10D |
(6542) 0x578cde ADD %R11,%R10 |
(6542) 0x578ce1 NOPW %CS:(%RAX,%RAX,1) |
(6549) 0x578cf0 VMOVSD (%R15,%R9,8),%XMM4 |
(6549) 0x578cf6 MOV (%R14,%R10,8),%RAX |
(6549) 0x578cfa VMOVSD (%R12,%R10,8),%XMM5 |
(6549) 0x578d00 INC %R10 |
(6549) 0x578d03 ADD %R13,%RAX |
(6549) 0x578d06 VFMADD213SD (%RBX,%RAX,8),%XMM4,%XMM5 |
(6549) 0x578d0c VMOVSD %XMM5,(%RBX,%RAX,8) |
(6549) 0x578d11 CMP %R10,%R8 |
(6549) 0x578d14 JNE 578cf0 |
(6542) 0x578d16 MOV 0x18(%RSI,%RDI,8),%R8 |
(6542) 0x578d1b MOV 0x10(%RSI,%RDI,8),%R11 |
(6542) 0x578d20 MOV %R8,%RCX |
(6542) 0x578d23 SUB %R11,%RCX |
(6542) 0x578d26 JLE 578e46 |
(6542) 0x578d2c MOV -0x40(%RBP),%RAX |
(6542) 0x578d30 MOV -0x58(%RBP),%RDX |
(6542) 0x578d34 MOV %RCX,%R10 |
(6542) 0x578d37 AND $-0x8,%R10 |
(6542) 0x578d3b LEA 0x2(%RDX,%RAX,1),%R9 |
(6542) 0x578d40 JE 578e0b |
(6542) 0x578d46 LEA -0x1(%R10),%RSI |
(6542) 0x578d4a XOR %EAX,%EAX |
(6542) 0x578d4c JMP 578d8a |
0x578d4e XCHG %AX,%AX |
(6547) 0x578d50 KXNORW %K0,%K0,%K1 |
(6547) 0x578d54 VXORPD %XMM7,%XMM7,%XMM7 |
(6547) 0x578d58 VPSLLQ $0x3,%ZMM5,%ZMM6 |
(6547) 0x578d5f ADD $0x8,%RAX |
(6547) 0x578d63 VGATHERQPD (%RBX,%ZMM5,8),%ZMM7{%K1} |
(6547) 0x578d6a VPADDQ %ZMM6,%ZMM0,%ZMM6 |
(6547) 0x578d70 KXNORW %K0,%K0,%K1 |
(6547) 0x578d74 VADDPD %ZMM4,%ZMM7,%ZMM4 |
(6547) 0x578d7a VSCATTERQPD %ZMM4,(,%ZMM6,1){%K1} |
(6547) 0x578d85 CMP %RSI,%RAX |
(6547) 0x578d88 JA 578e00 |
(6547) 0x578d8a VBROADCASTSD (%R15,%R9,8),%ZMM4 |
(6547) 0x578d91 LEA (%R11,%RAX,1),%RDX |
(6547) 0x578d95 VPADDQ (%R14,%RDX,8),%ZMM1,%ZMM5 |
(6547) 0x578d9c VPCONFLICTQ %ZMM5,%ZMM6 |
(6547) 0x578da2 VPTESTMQ %ZMM6,%ZMM6,%K1 |
(6547) 0x578da8 KORTESTB %K1,%K1 |
(6547) 0x578dac VMULPD (%R12,%RDX,8),%ZMM4,%ZMM4 |
(6547) 0x578db3 JE 578d50 |
(6547) 0x578db5 VPLZCNTQ %ZMM6,%ZMM6 |
(6547) 0x578dbb VPSUBQ %ZMM6,%ZMM2,%ZMM6 |
(6547) 0x578dc1 NOPW %CS:(%RAX,%RAX,1) |
(6548) 0x578dd0 VPERMQ %ZMM4,%ZMM6,%ZMM7 |
(6548) 0x578dd6 VPERMQ %ZMM6,%ZMM6,%ZMM6{%K1} |
(6548) 0x578ddc VADDPD %ZMM7,%ZMM4,%ZMM4{%K1} |
(6548) 0x578de2 VPCMPNEQQ %ZMM3,%ZMM6,%K1 |
(6548) 0x578de9 KORTESTB %K1,%K1 |
(6548) 0x578ded JNE 578dd0 |
(6547) 0x578def JMP 578d50 |
0x578df4 NOPW %CS:(%RAX,%RAX,1) |
(6542) 0x578e00 MOV -0x50(%RBP),%RSI |
(6542) 0x578e04 CMP %R10,%RCX |
(6542) 0x578e07 JNE 578e0e |
(6542) 0x578e09 JMP 578e46 |
(6542) 0x578e0b XOR %R10D,%R10D |
(6542) 0x578e0e ADD %R11,%R10 |
(6542) 0x578e11 NOPW %CS:(%RAX,%RAX,1) |
(6546) 0x578e20 VMOVSD (%R15,%R9,8),%XMM4 |
(6546) 0x578e26 MOV (%R14,%R10,8),%RAX |
(6546) 0x578e2a VMOVSD (%R12,%R10,8),%XMM5 |
(6546) 0x578e30 INC %R10 |
(6546) 0x578e33 ADD %R13,%RAX |
(6546) 0x578e36 VFMADD213SD (%RBX,%RAX,8),%XMM4,%XMM5 |
(6546) 0x578e3c VMOVSD %XMM5,(%RBX,%RAX,8) |
(6546) 0x578e41 CMP %R10,%R8 |
(6546) 0x578e44 JNE 578e20 |
(6542) 0x578e46 MOV 0x18(%RSI,%RDI,8),%R10 |
(6542) 0x578e4b MOV 0x20(%RSI,%RDI,8),%RDI |
(6542) 0x578e50 MOV -0x58(%RBP),%R11 |
(6542) 0x578e54 MOV %RDI,%RCX |
(6542) 0x578e57 SUB %R10,%RCX |
(6542) 0x578e5a JLE 578ab0 |
(6542) 0x578e60 MOV -0x40(%RBP),%RAX |
(6542) 0x578e64 MOV %RCX,%R9 |
(6542) 0x578e67 AND $-0x8,%R9 |
(6542) 0x578e6b LEA 0x3(%R11,%RAX,1),%R8 |
(6542) 0x578e70 JE 578f3f |
(6542) 0x578e76 LEA -0x1(%R9),%RSI |
(6542) 0x578e7a XOR %EAX,%EAX |
(6542) 0x578e7c JMP 578eba |
0x578e7e XCHG %AX,%AX |
(6544) 0x578e80 KXNORW %K0,%K0,%K1 |
(6544) 0x578e84 VXORPD %XMM7,%XMM7,%XMM7 |
(6544) 0x578e88 VPSLLQ $0x3,%ZMM5,%ZMM6 |
(6544) 0x578e8f ADD $0x8,%RAX |
(6544) 0x578e93 VGATHERQPD (%RBX,%ZMM5,8),%ZMM7{%K1} |
(6544) 0x578e9a VPADDQ %ZMM6,%ZMM0,%ZMM6 |
(6544) 0x578ea0 KXNORW %K0,%K0,%K1 |
(6544) 0x578ea4 VADDPD %ZMM4,%ZMM7,%ZMM4 |
(6544) 0x578eaa VSCATTERQPD %ZMM4,(,%ZMM6,1){%K1} |
(6544) 0x578eb5 CMP %RSI,%RAX |
(6544) 0x578eb8 JA 578f30 |
(6544) 0x578eba VBROADCASTSD (%R15,%R8,8),%ZMM4 |
(6544) 0x578ec1 LEA (%R10,%RAX,1),%RDX |
(6544) 0x578ec5 VPADDQ (%R14,%RDX,8),%ZMM1,%ZMM5 |
(6544) 0x578ecc VPCONFLICTQ %ZMM5,%ZMM6 |
(6544) 0x578ed2 VPTESTMQ %ZMM6,%ZMM6,%K1 |
(6544) 0x578ed8 KORTESTB %K1,%K1 |
(6544) 0x578edc VMULPD (%R12,%RDX,8),%ZMM4,%ZMM4 |
(6544) 0x578ee3 JE 578e80 |
(6544) 0x578ee5 VPLZCNTQ %ZMM6,%ZMM6 |
(6544) 0x578eeb VPSUBQ %ZMM6,%ZMM2,%ZMM6 |
(6544) 0x578ef1 NOPW %CS:(%RAX,%RAX,1) |
(6545) 0x578f00 VPERMQ %ZMM4,%ZMM6,%ZMM7 |
(6545) 0x578f06 VPERMQ %ZMM6,%ZMM6,%ZMM6{%K1} |
(6545) 0x578f0c VADDPD %ZMM7,%ZMM4,%ZMM4{%K1} |
(6545) 0x578f12 VPCMPNEQQ %ZMM3,%ZMM6,%K1 |
(6545) 0x578f19 KORTESTB %K1,%K1 |
(6545) 0x578f1d JNE 578f00 |
(6544) 0x578f1f JMP 578e80 |
0x578f24 NOPW %CS:(%RAX,%RAX,1) |
(6542) 0x578f30 MOV -0x50(%RBP),%RSI |
(6542) 0x578f34 CMP %R9,%RCX |
(6542) 0x578f37 JE 578ab0 |
(6542) 0x578f3d JMP 578f42 |
(6542) 0x578f3f XOR %R9D,%R9D |
(6542) 0x578f42 ADD %R10,%R9 |
(6542) 0x578f45 NOPW %CS:(%RAX,%RAX,1) |
(6543) 0x578f50 VMOVSD (%R15,%R8,8),%XMM4 |
(6543) 0x578f56 MOV (%R14,%R9,8),%RAX |
(6543) 0x578f5a VMOVSD (%R12,%R9,8),%XMM5 |
(6543) 0x578f60 INC %R9 |
(6543) 0x578f63 ADD %R13,%RAX |
(6543) 0x578f66 VFMADD213SD (%RBX,%RAX,8),%XMM4,%XMM5 |
(6543) 0x578f6c VMOVSD %XMM5,(%RBX,%RAX,8) |
(6543) 0x578f71 CMP %R9,%RDI |
(6543) 0x578f74 JNE 578f50 |
(6542) 0x578f76 JMP 578ab0 |
0x578f7b LEA 0x1(%RCX),%R15 |
0x578f7f VPBROADCASTQ %R12,%ZMM0 |
0x578f85 MOV %R15D,%EDX |
0x578f88 AND $0x7,%EDX |
0x578f8b MOV %RDX,-0x68(%RBP) |
0x578f8f CMP $0x7,%RCX |
0x578f93 JAE 5790e0 |
0x578f99 XOR %EDX,%EDX |
0x578f9b CMPQ $0,-0x68(%RBP) |
0x578fa0 MOV -0x70(%RBP),%R15 |
0x578fa4 JE 5790b2 |
0x578faa VMOVDQU64 0x3c38c(%RIP),%ZMM1 |
0x578fb4 MOV %R13,%RCX |
0x578fb7 AND $-0x8,%RCX |
0x578fbb LEA (,%R12,8),%R8 |
0x578fc3 LEA (%RDX,%RAX,1),%RDI |
0x578fc7 XOR %R9D,%R9D |
0x578fca LEA -0x1(%RCX),%RSI |
0x578fce JMP 578fed |
(6525) 0x578fd0 MOV -0x48(%RBP),%R11 |
(6525) 0x578fd4 INC %RDX |
(6525) 0x578fd7 INC %R9 |
(6525) 0x578fda INC %RDI |
(6525) 0x578fdd VMOVSD %XMM2,(%R11,%R10,8) |
(6525) 0x578fe3 CMP -0x68(%RBP),%R9 |
(6525) 0x578fe7 JE 5790b2 |
(6525) 0x578fed LEA (%RAX,%RDX,1),%R10 |
(6525) 0x578ff1 VMOVSD (%R11,%R10,8),%XMM2 |
(6525) 0x578ff7 TEST %RCX,%RCX |
(6525) 0x578ffa JE 579080 |
(6525) 0x579000 VPBROADCASTQ %R10,%ZMM4 |
(6525) 0x579006 VPXOR %XMM3,%XMM3,%XMM3 |
(6525) 0x57900a XOR %R11D,%R11D |
(6525) 0x57900d NOPL (%RAX) |
(6526) 0x579010 VPBROADCASTQ %R11,%ZMM5 |
(6526) 0x579016 KXNORW %K0,%K0,%K1 |
(6526) 0x57901a VXORPD %XMM6,%XMM6,%XMM6 |
(6526) 0x57901e ADD $0x8,%R11 |
(6526) 0x579022 VPADDQ %ZMM1,%ZMM5,%ZMM5 |
(6526) 0x579028 VPMULLQ %ZMM5,%ZMM0,%ZMM5 |
(6526) 0x57902e VPADDQ %ZMM5,%ZMM4,%ZMM5 |
(6526) 0x579034 VGATHERQPD (%RBX,%ZMM5,8),%ZMM6{%K1} |
(6526) 0x57903b VADDPD %ZMM6,%ZMM3,%ZMM3 |
(6526) 0x579041 CMP %RSI,%R11 |
(6526) 0x579044 JLE 579010 |
(6525) 0x579046 VEXTRACTF64X4 $0x1,%ZMM3,%YMM4 |
(6525) 0x57904d MOV %RCX,%R14 |
(6525) 0x579050 VADDPD %ZMM4,%ZMM3,%ZMM3 |
(6525) 0x579056 VEXTRACTF128 $0x1,%YMM3,%XMM4 |
(6525) 0x57905c VADDPD %XMM4,%XMM3,%XMM3 |
(6525) 0x579060 VPERMILPD $0x1,%XMM3,%XMM4 |
(6525) 0x579066 VADDSD %XMM4,%XMM3,%XMM3 |
(6525) 0x57906a VADDSD %XMM3,%XMM2,%XMM2 |
(6525) 0x57906e CMP %R13,%RCX |
(6525) 0x579071 JE 578fd0 |
(6525) 0x579077 JMP 579083 |
0x579079 NOPL (%RAX) |
(6525) 0x579080 XOR %R14D,%R14D |
(6525) 0x579083 MOV %R13,%R11 |
(6525) 0x579086 SUB %R14,%R11 |
(6525) 0x579089 IMUL %R12,%R14 |
(6525) 0x57908d ADD %RDI,%R14 |
(6525) 0x579090 LEA (%RBX,%R14,8),%R14 |
(6525) 0x579094 NOPW %CS:(%RAX,%RAX,1) |
(6524) 0x5790a0 VADDSD (%R14),%XMM2,%XMM2 |
(6524) 0x5790a5 ADD %R8,%R14 |
(6524) 0x5790a8 DEC %R11 |
(6524) 0x5790ab JNE 5790a0 |
(6525) 0x5790ad JMP 578fd0 |
0x5790b2 MOV -0x7c(%RBP),%ESI |
0x5790b5 MOV $0x5d9f70,%EDI |
0x5790ba VZEROUPPER |
0x5790bd CALL 410170 <__kmpc_for_static_fini@plt> |
0x5790c2 MOV (%R15),%ESI |
0x5790c5 MOV $0x5d9f90,%EDI |
0x5790ca ADD $0x98,%RSP |
0x5790d1 POP %RBX |
0x5790d2 POP %R12 |
0x5790d4 POP %R13 |
0x5790d6 POP %R14 |
0x5790d8 POP %R15 |
0x5790da POP %RBP |
0x5790db JMP 410560 |
0x5790e0 VMOVDQU64 0x3c256(%RIP),%ZMM1 |
0x5790ea LEA 0x1(%RAX),%RCX |
0x5790ee MOV %R13,%RDI |
0x5790f1 AND $-0x8,%RDI |
0x5790f5 LEA (,%R12,8),%R9 |
0x5790fd AND $-0x8,%R15 |
0x579101 LEA 0x5(%RAX),%R14 |
0x579105 LEA 0x6(%RAX),%RSI |
0x579109 XOR %EDX,%EDX |
0x57910b MOV %RAX,%R10 |
0x57910e MOV %RCX,-0x40(%RBP) |
0x579112 LEA 0x2(%RAX),%RCX |
0x579116 LEA -0x1(%RDI),%R8 |
0x57911a MOV %RCX,-0x58(%RBP) |
0x57911e LEA 0x3(%RAX),%RCX |
0x579122 MOV %RCX,-0x50(%RBP) |
0x579126 LEA 0x4(%RAX),%RCX |
0x57912a MOV %RCX,-0x60(%RBP) |
0x57912e LEA 0x7(%RAX),%RCX |
0x579132 MOV %R15,-0x78(%RBP) |
0x579136 JMP 579186 |
0x579138 NOPL (%RAX,%RAX,1) |
(6527) 0x579140 MOV -0x48(%RBP),%R15 |
(6527) 0x579144 ADDQ $0x8,-0x40(%RBP) |
(6527) 0x579149 ADDQ $0x8,-0x58(%RBP) |
(6527) 0x57914e ADDQ $0x8,-0x50(%RBP) |
(6527) 0x579153 ADDQ $0x8,-0x60(%RBP) |
(6527) 0x579158 ADD $0x8,%RDX |
(6527) 0x57915c ADD $0x8,%R10 |
(6527) 0x579160 ADD $0x8,%R14 |
(6527) 0x579164 ADD $0x8,%RSI |
(6527) 0x579168 ADD $0x8,%RCX |
(6527) 0x57916c MOV -0x78(%RBP),%R12 |
(6527) 0x579170 VMOVSD %XMM2,(%R15,%R11,8) |
(6527) 0x579176 MOV %R15,%R11 |
(6527) 0x579179 CMP %R12,%RDX |
(6527) 0x57917c MOV -0x38(%RBP),%R12 |
(6527) 0x579180 JE 578f9b |
(6527) 0x579186 LEA (%RAX,%RDX,1),%R15 |
(6527) 0x57918a VMOVSD (%R11,%R15,8),%XMM2 |
(6527) 0x579190 TEST %RDI,%RDI |
(6527) 0x579193 JE 579220 |
(6527) 0x579199 VPBROADCASTQ %R15,%ZMM4 |
(6527) 0x57919f VPXOR %XMM3,%XMM3,%XMM3 |
(6527) 0x5791a3 XOR %R11D,%R11D |
(6527) 0x5791a6 NOPW %CS:(%RAX,%RAX,1) |
(6535) 0x5791b0 VPBROADCASTQ %R11,%ZMM5 |
(6535) 0x5791b6 VXORPD %XMM6,%XMM6,%XMM6 |
(6535) 0x5791ba KXNORW %K0,%K0,%K1 |
(6535) 0x5791be ADD $0x8,%R11 |
(6535) 0x5791c2 VPADDQ %ZMM1,%ZMM5,%ZMM5 |
(6535) 0x5791c8 VPMULLQ %ZMM5,%ZMM0,%ZMM5 |
(6535) 0x5791ce VPADDQ %ZMM5,%ZMM4,%ZMM5 |
(6535) 0x5791d4 VGATHERQPD (%RBX,%ZMM5,8),%ZMM6{%K1} |
(6535) 0x5791db VADDPD %ZMM6,%ZMM3,%ZMM3 |
(6535) 0x5791e1 CMP %R8,%R11 |
(6535) 0x5791e4 JLE 5791b0 |
(6527) 0x5791e6 VEXTRACTF64X4 $0x1,%ZMM3,%YMM4 |
(6527) 0x5791ed MOV %RDI,%R12 |
(6527) 0x5791f0 VADDPD %ZMM4,%ZMM3,%ZMM3 |
(6527) 0x5791f6 VEXTRACTF128 $0x1,%YMM3,%XMM4 |
(6527) 0x5791fc VADDPD %XMM4,%XMM3,%XMM3 |
(6527) 0x579200 VPERMILPD $0x1,%XMM3,%XMM4 |
(6527) 0x579206 VADDSD %XMM4,%XMM3,%XMM3 |
(6527) 0x57920a VADDSD %XMM3,%XMM2,%XMM2 |
(6527) 0x57920e CMP %R13,%RDI |
(6527) 0x579211 JNE 579223 |
(6527) 0x579213 JMP 57924e |
0x579215 NOPW %CS:(%RAX,%RAX,1) |
(6527) 0x579220 XOR %R12D,%R12D |
(6527) 0x579223 MOV %R13,%R11 |
(6527) 0x579226 SUB %R12,%R11 |
(6527) 0x579229 IMUL -0x38(%RBP),%R12 |
(6527) 0x57922e ADD %R10,%R12 |
(6527) 0x579231 LEA (%RBX,%R12,8),%R12 |
(6527) 0x579235 NOPW %CS:(%RAX,%RAX,1) |
(6516) 0x579240 VADDSD (%R12),%XMM2,%XMM2 |
(6516) 0x579246 ADD %R9,%R12 |
(6516) 0x579249 DEC %R11 |
(6516) 0x57924c JNE 579240 |
(6527) 0x57924e MOV -0x48(%RBP),%R12 |
(6527) 0x579252 LEA 0x1(%RDX,%RAX,1),%R11 |
(6527) 0x579257 VMOVSD %XMM2,(%R12,%R15,8) |
(6527) 0x57925d VMOVSD 0x8(%R12,%R15,8),%XMM2 |
(6527) 0x579264 TEST %RDI,%RDI |
(6527) 0x579267 JE 5792f0 |
(6527) 0x57926d VPBROADCASTQ %R11,%ZMM4 |
(6527) 0x579273 VXORPD %XMM3,%XMM3,%XMM3 |
(6527) 0x579277 XOR %R12D,%R12D |
(6527) 0x57927a NOPW (%RAX,%RAX,1) |
(6534) 0x579280 VPBROADCASTQ %R12,%ZMM5 |
(6534) 0x579286 VXORPD %XMM6,%XMM6,%XMM6 |
(6534) 0x57928a KXNORW %K0,%K0,%K1 |
(6534) 0x57928e ADD $0x8,%R12 |
(6534) 0x579292 VPADDQ %ZMM1,%ZMM5,%ZMM5 |
(6534) 0x579298 VPMULLQ %ZMM5,%ZMM0,%ZMM5 |
(6534) 0x57929e VPADDQ %ZMM5,%ZMM4,%ZMM5 |
(6534) 0x5792a4 VGATHERQPD (%RBX,%ZMM5,8),%ZMM6{%K1} |
(6534) 0x5792ab VADDPD %ZMM6,%ZMM3,%ZMM3 |
(6534) 0x5792b1 CMP %R8,%R12 |
(6534) 0x5792b4 JLE 579280 |
(6527) 0x5792b6 VEXTRACTF64X4 $0x1,%ZMM3,%YMM4 |
(6527) 0x5792bd MOV %RDI,%R13 |
(6527) 0x5792c0 VADDPD %ZMM4,%ZMM3,%ZMM3 |
(6527) 0x5792c6 VEXTRACTF128 $0x1,%YMM3,%XMM4 |
(6527) 0x5792cc VADDPD %XMM4,%XMM3,%XMM3 |
(6527) 0x5792d0 VPERMILPD $0x1,%XMM3,%XMM4 |
(6527) 0x5792d6 VADDSD %XMM4,%XMM3,%XMM3 |
(6527) 0x5792da VADDSD %XMM3,%XMM2,%XMM2 |
(6527) 0x5792de CMP -0x30(%RBP),%RDI |
(6527) 0x5792e2 JNE 5792f3 |
(6527) 0x5792e4 JMP 57931e |
0x5792e6 NOPW %CS:(%RAX,%RAX,1) |
(6527) 0x5792f0 XOR %R13D,%R13D |
(6527) 0x5792f3 MOV -0x30(%RBP),%R12 |
(6527) 0x5792f7 SUB %R13,%R12 |
(6527) 0x5792fa IMUL -0x38(%RBP),%R13 |
(6527) 0x5792ff ADD -0x40(%RBP),%R13 |
(6527) 0x579303 LEA (%RBX,%R13,8),%R13 |
(6527) 0x579307 NOPW (%RAX,%RAX,1) |
(6517) 0x579310 VADDSD (%R13),%XMM2,%XMM2 |
(6517) 0x579316 ADD %R9,%R13 |
(6517) 0x579319 DEC %R12 |
(6517) 0x57931c JNE 579310 |
(6527) 0x57931e MOV -0x48(%RBP),%R12 |
(6527) 0x579322 VMOVSD %XMM2,(%R12,%R11,8) |
(6527) 0x579328 LEA 0x2(%RDX,%RAX,1),%R11 |
(6527) 0x57932d VMOVSD 0x10(%R12,%R15,8),%XMM2 |
(6527) 0x579334 TEST %RDI,%RDI |
(6527) 0x579337 JE 5793c0 |
(6527) 0x57933d VPBROADCASTQ %R11,%ZMM4 |
(6527) 0x579343 VXORPD %XMM3,%XMM3,%XMM3 |
(6527) 0x579347 XOR %R12D,%R12D |
(6527) 0x57934a NOPW (%RAX,%RAX,1) |
(6533) 0x579350 VPBROADCASTQ %R12,%ZMM5 |
(6533) 0x579356 VXORPD %XMM6,%XMM6,%XMM6 |
(6533) 0x57935a KXNORW %K0,%K0,%K1 |
(6533) 0x57935e ADD $0x8,%R12 |
(6533) 0x579362 VPADDQ %ZMM1,%ZMM5,%ZMM5 |
(6533) 0x579368 VPMULLQ %ZMM5,%ZMM0,%ZMM5 |
(6533) 0x57936e VPADDQ %ZMM5,%ZMM4,%ZMM5 |
(6533) 0x579374 VGATHERQPD (%RBX,%ZMM5,8),%ZMM6{%K1} |
(6533) 0x57937b VADDPD %ZMM6,%ZMM3,%ZMM3 |
(6533) 0x579381 CMP %R8,%R12 |
(6533) 0x579384 JLE 579350 |
(6527) 0x579386 VEXTRACTF64X4 $0x1,%ZMM3,%YMM4 |
(6527) 0x57938d MOV %RDI,%R13 |
(6527) 0x579390 VADDPD %ZMM4,%ZMM3,%ZMM3 |
(6527) 0x579396 VEXTRACTF128 $0x1,%YMM3,%XMM4 |
(6527) 0x57939c VADDPD %XMM4,%XMM3,%XMM3 |
(6527) 0x5793a0 VPERMILPD $0x1,%XMM3,%XMM4 |
(6527) 0x5793a6 VADDSD %XMM4,%XMM3,%XMM3 |
(6527) 0x5793aa VADDSD %XMM3,%XMM2,%XMM2 |
(6527) 0x5793ae CMP -0x30(%RBP),%RDI |
(6527) 0x5793b2 JNE 5793c3 |
(6527) 0x5793b4 JMP 5793ee |
0x5793b6 NOPW %CS:(%RAX,%RAX,1) |
(6527) 0x5793c0 XOR %R13D,%R13D |
(6527) 0x5793c3 MOV -0x30(%RBP),%R12 |
(6527) 0x5793c7 SUB %R13,%R12 |
(6527) 0x5793ca IMUL -0x38(%RBP),%R13 |
(6527) 0x5793cf ADD -0x58(%RBP),%R13 |
(6527) 0x5793d3 LEA (%RBX,%R13,8),%R13 |
(6527) 0x5793d7 NOPW (%RAX,%RAX,1) |
(6518) 0x5793e0 VADDSD (%R13),%XMM2,%XMM2 |
(6518) 0x5793e6 ADD %R9,%R13 |
(6518) 0x5793e9 DEC %R12 |
(6518) 0x5793ec JNE 5793e0 |
(6527) 0x5793ee MOV -0x48(%RBP),%R12 |
(6527) 0x5793f2 VMOVSD %XMM2,(%R12,%R11,8) |
(6527) 0x5793f8 LEA 0x3(%RDX,%RAX,1),%R11 |
(6527) 0x5793fd VMOVSD 0x18(%R12,%R15,8),%XMM2 |
(6527) 0x579404 TEST %RDI,%RDI |
(6527) 0x579407 JE 579490 |
(6527) 0x57940d VPBROADCASTQ %R11,%ZMM4 |
(6527) 0x579413 VXORPD %XMM3,%XMM3,%XMM3 |
(6527) 0x579417 XOR %R12D,%R12D |
(6527) 0x57941a NOPW (%RAX,%RAX,1) |
(6532) 0x579420 VPBROADCASTQ %R12,%ZMM5 |
(6532) 0x579426 VXORPD %XMM6,%XMM6,%XMM6 |
(6532) 0x57942a KXNORW %K0,%K0,%K1 |
(6532) 0x57942e ADD $0x8,%R12 |
(6532) 0x579432 VPADDQ %ZMM1,%ZMM5,%ZMM5 |
(6532) 0x579438 VPMULLQ %ZMM5,%ZMM0,%ZMM5 |
(6532) 0x57943e VPADDQ %ZMM5,%ZMM4,%ZMM5 |
(6532) 0x579444 VGATHERQPD (%RBX,%ZMM5,8),%ZMM6{%K1} |
(6532) 0x57944b VADDPD %ZMM6,%ZMM3,%ZMM3 |
(6532) 0x579451 CMP %R8,%R12 |
(6532) 0x579454 JLE 579420 |
(6527) 0x579456 VEXTRACTF64X4 $0x1,%ZMM3,%YMM4 |
(6527) 0x57945d MOV %RDI,%R13 |
(6527) 0x579460 VADDPD %ZMM4,%ZMM3,%ZMM3 |
(6527) 0x579466 VEXTRACTF128 $0x1,%YMM3,%XMM4 |
(6527) 0x57946c VADDPD %XMM4,%XMM3,%XMM3 |
(6527) 0x579470 VPERMILPD $0x1,%XMM3,%XMM4 |
(6527) 0x579476 VADDSD %XMM4,%XMM3,%XMM3 |
(6527) 0x57947a VADDSD %XMM3,%XMM2,%XMM2 |
(6527) 0x57947e CMP -0x30(%RBP),%RDI |
(6527) 0x579482 JNE 579493 |
(6527) 0x579484 JMP 5794be |
0x579486 NOPW %CS:(%RAX,%RAX,1) |
(6527) 0x579490 XOR %R13D,%R13D |
(6527) 0x579493 MOV -0x30(%RBP),%R12 |
(6527) 0x579497 SUB %R13,%R12 |
(6527) 0x57949a IMUL -0x38(%RBP),%R13 |
(6527) 0x57949f ADD -0x50(%RBP),%R13 |
(6527) 0x5794a3 LEA (%RBX,%R13,8),%R13 |
(6527) 0x5794a7 NOPW (%RAX,%RAX,1) |
(6519) 0x5794b0 VADDSD (%R13),%XMM2,%XMM2 |
(6519) 0x5794b6 ADD %R9,%R13 |
(6519) 0x5794b9 DEC %R12 |
(6519) 0x5794bc JNE 5794b0 |
(6527) 0x5794be MOV -0x48(%RBP),%R12 |
(6527) 0x5794c2 VMOVSD %XMM2,(%R12,%R11,8) |
(6527) 0x5794c8 LEA 0x4(%RDX,%RAX,1),%R11 |
(6527) 0x5794cd VMOVSD 0x20(%R12,%R15,8),%XMM2 |
(6527) 0x5794d4 TEST %RDI,%RDI |
(6527) 0x5794d7 JE 579560 |
(6527) 0x5794dd VPBROADCASTQ %R11,%ZMM4 |
(6527) 0x5794e3 VXORPD %XMM3,%XMM3,%XMM3 |
(6527) 0x5794e7 XOR %R12D,%R12D |
(6527) 0x5794ea NOPW (%RAX,%RAX,1) |
(6531) 0x5794f0 VPBROADCASTQ %R12,%ZMM5 |
(6531) 0x5794f6 VXORPD %XMM6,%XMM6,%XMM6 |
(6531) 0x5794fa KXNORW %K0,%K0,%K1 |
(6531) 0x5794fe ADD $0x8,%R12 |
(6531) 0x579502 VPADDQ %ZMM1,%ZMM5,%ZMM5 |
(6531) 0x579508 VPMULLQ %ZMM5,%ZMM0,%ZMM5 |
(6531) 0x57950e VPADDQ %ZMM5,%ZMM4,%ZMM5 |
(6531) 0x579514 VGATHERQPD (%RBX,%ZMM5,8),%ZMM6{%K1} |
(6531) 0x57951b VADDPD %ZMM6,%ZMM3,%ZMM3 |
(6531) 0x579521 CMP %R8,%R12 |
(6531) 0x579524 JLE 5794f0 |
(6527) 0x579526 VEXTRACTF64X4 $0x1,%ZMM3,%YMM4 |
(6527) 0x57952d MOV %RDI,%R13 |
(6527) 0x579530 VADDPD %ZMM4,%ZMM3,%ZMM3 |
(6527) 0x579536 VEXTRACTF128 $0x1,%YMM3,%XMM4 |
(6527) 0x57953c VADDPD %XMM4,%XMM3,%XMM3 |
(6527) 0x579540 VPERMILPD $0x1,%XMM3,%XMM4 |
(6527) 0x579546 VADDSD %XMM4,%XMM3,%XMM3 |
(6527) 0x57954a VADDSD %XMM3,%XMM2,%XMM2 |
(6527) 0x57954e CMP -0x30(%RBP),%RDI |
(6527) 0x579552 JNE 579563 |
(6527) 0x579554 JMP 57958e |
0x579556 NOPW %CS:(%RAX,%RAX,1) |
(6527) 0x579560 XOR %R13D,%R13D |
(6527) 0x579563 MOV -0x30(%RBP),%R12 |
(6527) 0x579567 SUB %R13,%R12 |
(6527) 0x57956a IMUL -0x38(%RBP),%R13 |
(6527) 0x57956f ADD -0x60(%RBP),%R13 |
(6527) 0x579573 LEA (%RBX,%R13,8),%R13 |
(6527) 0x579577 NOPW (%RAX,%RAX,1) |
(6520) 0x579580 VADDSD (%R13),%XMM2,%XMM2 |
(6520) 0x579586 ADD %R9,%R13 |
(6520) 0x579589 DEC %R12 |
(6520) 0x57958c JNE 579580 |
(6527) 0x57958e MOV -0x48(%RBP),%R12 |
(6527) 0x579592 VMOVSD %XMM2,(%R12,%R11,8) |
(6527) 0x579598 LEA 0x5(%RDX,%RAX,1),%R11 |
(6527) 0x57959d VMOVSD 0x28(%R12,%R15,8),%XMM2 |
(6527) 0x5795a4 TEST %RDI,%RDI |
(6527) 0x5795a7 JE 579630 |
(6527) 0x5795ad VPBROADCASTQ %R11,%ZMM4 |
(6527) 0x5795b3 VXORPD %XMM3,%XMM3,%XMM3 |
(6527) 0x5795b7 XOR %R12D,%R12D |
(6527) 0x5795ba NOPW (%RAX,%RAX,1) |
(6530) 0x5795c0 VPBROADCASTQ %R12,%ZMM5 |
(6530) 0x5795c6 VXORPD %XMM6,%XMM6,%XMM6 |
(6530) 0x5795ca KXNORW %K0,%K0,%K1 |
(6530) 0x5795ce ADD $0x8,%R12 |
(6530) 0x5795d2 VPADDQ %ZMM1,%ZMM5,%ZMM5 |
(6530) 0x5795d8 VPMULLQ %ZMM5,%ZMM0,%ZMM5 |
(6530) 0x5795de VPADDQ %ZMM5,%ZMM4,%ZMM5 |
(6530) 0x5795e4 VGATHERQPD (%RBX,%ZMM5,8),%ZMM6{%K1} |
(6530) 0x5795eb VADDPD %ZMM6,%ZMM3,%ZMM3 |
(6530) 0x5795f1 CMP %R8,%R12 |
(6530) 0x5795f4 JLE 5795c0 |
(6527) 0x5795f6 VEXTRACTF64X4 $0x1,%ZMM3,%YMM4 |
(6527) 0x5795fd MOV %RDI,%R13 |
(6527) 0x579600 VADDPD %ZMM4,%ZMM3,%ZMM3 |
(6527) 0x579606 VEXTRACTF128 $0x1,%YMM3,%XMM4 |
(6527) 0x57960c VADDPD %XMM4,%XMM3,%XMM3 |
(6527) 0x579610 VPERMILPD $0x1,%XMM3,%XMM4 |
(6527) 0x579616 VADDSD %XMM4,%XMM3,%XMM3 |
(6527) 0x57961a VADDSD %XMM3,%XMM2,%XMM2 |
(6527) 0x57961e CMP -0x30(%RBP),%RDI |
(6527) 0x579622 JNE 579633 |
(6527) 0x579624 JMP 57965e |
0x579626 NOPW %CS:(%RAX,%RAX,1) |
(6527) 0x579630 XOR %R13D,%R13D |
(6527) 0x579633 MOV -0x30(%RBP),%R12 |
(6527) 0x579637 SUB %R13,%R12 |
(6527) 0x57963a IMUL -0x38(%RBP),%R13 |
(6527) 0x57963f ADD %R14,%R13 |
(6527) 0x579642 LEA (%RBX,%R13,8),%R13 |
(6527) 0x579646 NOPW %CS:(%RAX,%RAX,1) |
(6521) 0x579650 VADDSD (%R13),%XMM2,%XMM2 |
(6521) 0x579656 ADD %R9,%R13 |
(6521) 0x579659 DEC %R12 |
(6521) 0x57965c JNE 579650 |
(6527) 0x57965e MOV -0x48(%RBP),%R12 |
(6527) 0x579662 VMOVSD %XMM2,(%R12,%R11,8) |
(6527) 0x579668 LEA 0x6(%RDX,%RAX,1),%R11 |
(6527) 0x57966d VMOVSD 0x30(%R12,%R15,8),%XMM2 |
(6527) 0x579674 TEST %RDI,%RDI |
(6527) 0x579677 JE 579700 |
(6527) 0x57967d VPBROADCASTQ %R11,%ZMM4 |
(6527) 0x579683 VXORPD %XMM3,%XMM3,%XMM3 |
(6527) 0x579687 XOR %R12D,%R12D |
(6527) 0x57968a NOPW (%RAX,%RAX,1) |
(6529) 0x579690 VPBROADCASTQ %R12,%ZMM5 |
(6529) 0x579696 VXORPD %XMM6,%XMM6,%XMM6 |
(6529) 0x57969a KXNORW %K0,%K0,%K1 |
(6529) 0x57969e ADD $0x8,%R12 |
(6529) 0x5796a2 VPADDQ %ZMM1,%ZMM5,%ZMM5 |
(6529) 0x5796a8 VPMULLQ %ZMM5,%ZMM0,%ZMM5 |
(6529) 0x5796ae VPADDQ %ZMM5,%ZMM4,%ZMM5 |
(6529) 0x5796b4 VGATHERQPD (%RBX,%ZMM5,8),%ZMM6{%K1} |
(6529) 0x5796bb VADDPD %ZMM6,%ZMM3,%ZMM3 |
(6529) 0x5796c1 CMP %R8,%R12 |
(6529) 0x5796c4 JLE 579690 |
(6527) 0x5796c6 VEXTRACTF64X4 $0x1,%ZMM3,%YMM4 |
(6527) 0x5796cd MOV %RDI,%R13 |
(6527) 0x5796d0 VADDPD %ZMM4,%ZMM3,%ZMM3 |
(6527) 0x5796d6 VEXTRACTF128 $0x1,%YMM3,%XMM4 |
(6527) 0x5796dc VADDPD %XMM4,%XMM3,%XMM3 |
(6527) 0x5796e0 VPERMILPD $0x1,%XMM3,%XMM4 |
(6527) 0x5796e6 VADDSD %XMM4,%XMM3,%XMM3 |
(6527) 0x5796ea VADDSD %XMM3,%XMM2,%XMM2 |
(6527) 0x5796ee CMP -0x30(%RBP),%RDI |
(6527) 0x5796f2 JNE 579703 |
(6527) 0x5796f4 JMP 57972e |
0x5796f6 NOPW %CS:(%RAX,%RAX,1) |
(6527) 0x579700 XOR %R13D,%R13D |
(6527) 0x579703 MOV -0x30(%RBP),%R12 |
(6527) 0x579707 SUB %R13,%R12 |
(6527) 0x57970a IMUL -0x38(%RBP),%R13 |
(6527) 0x57970f ADD %RSI,%R13 |
(6527) 0x579712 LEA (%RBX,%R13,8),%R13 |
(6527) 0x579716 NOPW %CS:(%RAX,%RAX,1) |
(6522) 0x579720 VADDSD (%R13),%XMM2,%XMM2 |
(6522) 0x579726 ADD %R9,%R13 |
(6522) 0x579729 DEC %R12 |
(6522) 0x57972c JNE 579720 |
(6527) 0x57972e MOV -0x48(%RBP),%R12 |
(6527) 0x579732 VMOVSD %XMM2,(%R12,%R11,8) |
(6527) 0x579738 LEA 0x7(%RDX,%RAX,1),%R11 |
(6527) 0x57973d VMOVSD 0x38(%R12,%R15,8),%XMM2 |
(6527) 0x579744 TEST %RDI,%RDI |
(6527) 0x579747 JE 5797d0 |
(6527) 0x57974d VPBROADCASTQ %R11,%ZMM4 |
(6527) 0x579753 VXORPD %XMM3,%XMM3,%XMM3 |
(6527) 0x579757 XOR %R15D,%R15D |
(6527) 0x57975a NOPW (%RAX,%RAX,1) |
(6528) 0x579760 VPBROADCASTQ %R15,%ZMM5 |
(6528) 0x579766 VXORPD %XMM6,%XMM6,%XMM6 |
(6528) 0x57976a KXNORW %K0,%K0,%K1 |
(6528) 0x57976e ADD $0x8,%R15 |
(6528) 0x579772 VPADDQ %ZMM1,%ZMM5,%ZMM5 |
(6528) 0x579778 VPMULLQ %ZMM5,%ZMM0,%ZMM5 |
(6528) 0x57977e VPADDQ %ZMM5,%ZMM4,%ZMM5 |
(6528) 0x579784 VGATHERQPD (%RBX,%ZMM5,8),%ZMM6{%K1} |
(6528) 0x57978b VADDPD %ZMM6,%ZMM3,%ZMM3 |
(6528) 0x579791 CMP %R8,%R15 |
(6528) 0x579794 JLE 579760 |
(6527) 0x579796 VEXTRACTF64X4 $0x1,%ZMM3,%YMM4 |
(6527) 0x57979d MOV -0x30(%RBP),%R13 |
(6527) 0x5797a1 MOV %RDI,%R12 |
(6527) 0x5797a4 VADDPD %ZMM4,%ZMM3,%ZMM3 |
(6527) 0x5797aa VEXTRACTF128 $0x1,%YMM3,%XMM4 |
(6527) 0x5797b0 VADDPD %XMM4,%XMM3,%XMM3 |
(6527) 0x5797b4 VPERMILPD $0x1,%XMM3,%XMM4 |
(6527) 0x5797ba VADDSD %XMM4,%XMM3,%XMM3 |
(6527) 0x5797be VADDSD %XMM3,%XMM2,%XMM2 |
(6527) 0x5797c2 CMP %R13,%RDI |
(6527) 0x5797c5 JE 579140 |
(6527) 0x5797cb JMP 5797d7 |
0x5797cd NOPL (%RAX) |
(6527) 0x5797d0 MOV -0x30(%RBP),%R13 |
(6527) 0x5797d4 XOR %R12D,%R12D |
(6527) 0x5797d7 MOV %R13,%R15 |
(6527) 0x5797da SUB %R12,%R15 |
(6527) 0x5797dd IMUL -0x38(%RBP),%R12 |
(6527) 0x5797e2 ADD %RCX,%R12 |
(6527) 0x5797e5 LEA (%RBX,%R12,8),%R12 |
(6527) 0x5797e9 NOPL (%RAX) |
(6523) 0x5797f0 VADDSD (%R12),%XMM2,%XMM2 |
(6523) 0x5797f6 ADD %R9,%R12 |
(6523) 0x5797f9 DEC %R15 |
(6523) 0x5797fc JNE 5797f0 |
(6527) 0x5797fe JMP 579140 |
0x579803 NOPW %CS:(%RAX,%RAX,1) |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►100.00+ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Path / |
Source file and lines | csr_matvec.c:554-579 |
Module | exec |
nb instructions | 225 |
nb uops | 210 |
loop length | 1064 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 4 |
nb stack references | 24 |
micro-operation queue | 35.00 cycles |
front end | 35.00 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 21.00 | 21.00 | 20.75 | 20.75 | 11.50 | 20.33 | 20.33 | 20.33 | 1.00 | 3.00 | 3.00 | 1.00 | 0.00 | 0.00 |
cycles | 21.00 | 21.00 | 20.75 | 20.75 | 11.50 | 21.00 | 21.00 | 21.00 | 1.00 | 3.00 | 3.00 | 1.00 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 35.00 |
Dispatch | 21.00 |
Overall L1 | 35.00 |
all | 11% |
load | 25% |
store | 0% |
mul | 0% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 17% |
all | 18% |
load | 34% |
store | 10% |
mul | 12% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 20% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput | Vectorization |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
SUB $0x98,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %R9,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %RCX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %R8,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %RDX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
MOV %RDI,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV 0x30(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RAX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV 0x28(%RBP),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RAX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV 0x18(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV 0x10(%RBP),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
CALL 586110 <hypre_GetThreadNum> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
MOV -0x40(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
MOV %R13,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
TEST %RCX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JLE 57894b <hypre_CSRMatrixMatvecT.extracted.49+0x2ab> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOVL $0,-0x84(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
DEC %RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RAX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV (%RDX),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOVQ $0,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOV %RCX,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOVQ $0x1,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0xb8(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x84(%RBP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0xa8(%RBP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0xa0(%RBP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV $0x5d9fb0,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %ESI,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
CALL 410420 <__kmpc_for_static_init_8@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV -0xa8(%RBP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV -0xa0(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
SUB %RDX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RDX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
MOV %RDX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
JB 57892b <hypre_CSRMatrixMatvecT.extracted.49+0x28b> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
IMUL -0x38(%RBP),%R13 | 1 | 0 | 1 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | scal (12.5%) |
LEA 0x1(%RAX),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
VPBROADCASTQ %RBX,%ZMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 | scal (12.5%) |
MOV %EDX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
AND $0x3,%ECX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RCX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
VPBROADCASTQ %R13,%ZMM1 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 | scal (12.5%) |
CMP $0x3,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JAE 578a8a <hypre_CSRMatrixMatvecT.extracted.49+0x3ea> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
XOR %R11D,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | N/A |
CMPQ $0,-0x60(%RBP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (12.5%) |
JE 57892b <hypre_CSRMatrixMatvecT.extracted.49+0x28b> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
VPBROADCASTQ 0x25cfa(%RIP),%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 5 | 0.50 | scal (12.5%) |
VPTERNLOGD $-0x1,%ZMM3,%ZMM3,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.50 | vect (100.0%) |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | N/A |
JMP 5787f0 <hypre_CSRMatrixMatvecT.extracted.49+0x150> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
MOV -0x78(%RBP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV $0x5d9fd0,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | vect (25.0%) |
CALL 410170 <__kmpc_for_static_fini@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
MOV -0x70(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV $0x5d9ff0,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
CALL 410560 <__kmpc_barrier@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
MOV -0x38(%RBP),%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
TEST %R12,%R12 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JLE 578a78 <hypre_CSRMatrixMatvecT.extracted.49+0x3d8> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV -0x70(%RBP),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOVL $0,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
LEA -0x1(%R12),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV (%R15),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOVQ $0,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOV %RAX,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOVQ $0x1,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0xb0(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x80(%RBP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x98(%RBP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x90(%RBP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV $0x5d9f50,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %ESI,-0x7c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
CALL 410420 <__kmpc_for_static_init_8@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV -0x90(%RBP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV -0x98(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV -0x30(%RBP),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
MOV -0x48(%RBP),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RDX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
SUB %RAX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
JB 5790b2 <hypre_CSRMatrixMatvecT.extracted.49+0xa12> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV %R12,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
SAR $0x3f,%R8 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
LEA (%R11,%RDX,8),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
AND %R12,%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
SUB %R8,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
IMUL %R13,%R8 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | N/A |
ADD %RSI,%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | N/A |
TEST %R12,%R12 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
LEA (%RBX,%R8,8),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CMOVG %R12,%RSI | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
CMP %R8,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JB 578f7b <hypre_CSRMatrixMatvecT.extracted.49+0x8db> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
SUB %RSI,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
IMUL %R13,%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | N/A |
LEA (%R11,%RAX,8),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
ADD %RDX,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA (%RBX,%RSI,8),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CMP %RDI,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JB 578f7b <hypre_CSRMatrixMatvecT.extracted.49+0x8db> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
LEA (%RBX,%RAX,8),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
SAL $0x3,%R12 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
JMP 5790b2 <hypre_CSRMatrixMatvecT.extracted.49+0xa12> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
ADD $0x98,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
VPBROADCASTQ 0x25a2c(%RIP),%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 5 | 0.50 | scal (12.5%) |
MOV -0x50(%RBP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
AND $-0x4,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
VPTERNLOGD $-0x1,%ZMM3,%ZMM3,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.50 | vect (100.0%) |
XOR %R11D,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | N/A |
MOV %RDX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
JMP 578ac1 <hypre_CSRMatrixMatvecT.extracted.49+0x421> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
LEA 0x1(%RCX),%R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
VPBROADCASTQ %R12,%ZMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 | scal (12.5%) |
MOV %R15D,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
AND $0x7,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RDX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
CMP $0x7,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JAE 5790e0 <hypre_CSRMatrixMatvecT.extracted.49+0xa40> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | N/A |
CMPQ $0,-0x68(%RBP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (12.5%) |
MOV -0x70(%RBP),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
JE 5790b2 <hypre_CSRMatrixMatvecT.extracted.49+0xa12> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
VMOVDQU64 0x3c38c(%RIP),%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | vect (100.0%) |
MOV %R13,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
AND $-0x8,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA (,%R12,8),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA (%RDX,%RAX,1),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | scal (6.3%) |
LEA -0x1(%RCX),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
JMP 578fed <hypre_CSRMatrixMatvecT.extracted.49+0x94d> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
MOV -0x7c(%RBP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV $0x5d9f70,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | vect (25.0%) |
CALL 410170 <__kmpc_for_static_fini@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
MOV (%R15),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV $0x5d9f90,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
ADD $0x98,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
JMP 410560 <__kmpc_barrier@plt> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
VMOVDQU64 0x3c256(%RIP),%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | vect (100.0%) |
LEA 0x1(%RAX),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
AND $-0x8,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA (,%R12,8),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
AND $-0x8,%R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA 0x5(%RAX),%R14 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA 0x6(%RAX),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | N/A |
MOV %RAX,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %RCX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA 0x2(%RAX),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x1(%RDI),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RCX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA 0x3(%RAX),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RCX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA 0x4(%RAX),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RCX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA 0x7(%RAX),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %R15,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
JMP 579186 <hypre_CSRMatrixMatvecT.extracted.49+0xae6> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
Source file and lines | csr_matvec.c:554-579 |
Module | exec |
nb instructions | 225 |
nb uops | 210 |
loop length | 1064 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 4 |
nb stack references | 24 |
micro-operation queue | 35.00 cycles |
front end | 35.00 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 21.00 | 21.00 | 20.75 | 20.75 | 11.50 | 20.33 | 20.33 | 20.33 | 1.00 | 3.00 | 3.00 | 1.00 | 0.00 | 0.00 |
cycles | 21.00 | 21.00 | 20.75 | 20.75 | 11.50 | 21.00 | 21.00 | 21.00 | 1.00 | 3.00 | 3.00 | 1.00 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 35.00 |
Dispatch | 21.00 |
Overall L1 | 35.00 |
all | 11% |
load | 25% |
store | 0% |
mul | 0% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 17% |
all | 18% |
load | 34% |
store | 10% |
mul | 12% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 20% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput | Vectorization |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
SUB $0x98,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %R9,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %RCX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %R8,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %RDX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
MOV %RDI,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV 0x30(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RAX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV 0x28(%RBP),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RAX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV 0x18(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV 0x10(%RBP),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
CALL 586110 <hypre_GetThreadNum> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
MOV -0x40(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
MOV %R13,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
TEST %RCX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JLE 57894b <hypre_CSRMatrixMatvecT.extracted.49+0x2ab> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOVL $0,-0x84(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
DEC %RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RAX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV (%RDX),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOVQ $0,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOV %RCX,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOVQ $0x1,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0xb8(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x84(%RBP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0xa8(%RBP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0xa0(%RBP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV $0x5d9fb0,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %ESI,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
CALL 410420 <__kmpc_for_static_init_8@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV -0xa8(%RBP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV -0xa0(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
SUB %RDX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RDX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
MOV %RDX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
JB 57892b <hypre_CSRMatrixMatvecT.extracted.49+0x28b> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
IMUL -0x38(%RBP),%R13 | 1 | 0 | 1 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | scal (12.5%) |
LEA 0x1(%RAX),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
VPBROADCASTQ %RBX,%ZMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 | scal (12.5%) |
MOV %EDX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
AND $0x3,%ECX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RCX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
VPBROADCASTQ %R13,%ZMM1 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 | scal (12.5%) |
CMP $0x3,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JAE 578a8a <hypre_CSRMatrixMatvecT.extracted.49+0x3ea> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
XOR %R11D,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | N/A |
CMPQ $0,-0x60(%RBP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (12.5%) |
JE 57892b <hypre_CSRMatrixMatvecT.extracted.49+0x28b> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
VPBROADCASTQ 0x25cfa(%RIP),%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 5 | 0.50 | scal (12.5%) |
VPTERNLOGD $-0x1,%ZMM3,%ZMM3,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.50 | vect (100.0%) |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | N/A |
JMP 5787f0 <hypre_CSRMatrixMatvecT.extracted.49+0x150> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
MOV -0x78(%RBP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV $0x5d9fd0,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | vect (25.0%) |
CALL 410170 <__kmpc_for_static_fini@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
MOV -0x70(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV $0x5d9ff0,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
CALL 410560 <__kmpc_barrier@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
MOV -0x38(%RBP),%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
TEST %R12,%R12 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JLE 578a78 <hypre_CSRMatrixMatvecT.extracted.49+0x3d8> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV -0x70(%RBP),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOVL $0,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
LEA -0x1(%R12),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV (%R15),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOVQ $0,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOV %RAX,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOVQ $0x1,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0xb0(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x80(%RBP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x98(%RBP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x90(%RBP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV $0x5d9f50,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %ESI,-0x7c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
CALL 410420 <__kmpc_for_static_init_8@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV -0x90(%RBP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV -0x98(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV -0x30(%RBP),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
MOV -0x48(%RBP),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RDX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
SUB %RAX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
JB 5790b2 <hypre_CSRMatrixMatvecT.extracted.49+0xa12> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV %R12,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
SAR $0x3f,%R8 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
LEA (%R11,%RDX,8),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
AND %R12,%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
SUB %R8,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
IMUL %R13,%R8 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | N/A |
ADD %RSI,%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | N/A |
TEST %R12,%R12 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
LEA (%RBX,%R8,8),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CMOVG %R12,%RSI | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
CMP %R8,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JB 578f7b <hypre_CSRMatrixMatvecT.extracted.49+0x8db> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
SUB %RSI,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
IMUL %R13,%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | N/A |
LEA (%R11,%RAX,8),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
ADD %RDX,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA (%RBX,%RSI,8),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CMP %RDI,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JB 578f7b <hypre_CSRMatrixMatvecT.extracted.49+0x8db> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
LEA (%RBX,%RAX,8),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
SAL $0x3,%R12 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
JMP 5790b2 <hypre_CSRMatrixMatvecT.extracted.49+0xa12> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
ADD $0x98,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
VPBROADCASTQ 0x25a2c(%RIP),%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 5 | 0.50 | scal (12.5%) |
MOV -0x50(%RBP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
AND $-0x4,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
VPTERNLOGD $-0x1,%ZMM3,%ZMM3,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.50 | vect (100.0%) |
XOR %R11D,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | N/A |
MOV %RDX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
JMP 578ac1 <hypre_CSRMatrixMatvecT.extracted.49+0x421> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
LEA 0x1(%RCX),%R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
VPBROADCASTQ %R12,%ZMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 | scal (12.5%) |
MOV %R15D,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
AND $0x7,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RDX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
CMP $0x7,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JAE 5790e0 <hypre_CSRMatrixMatvecT.extracted.49+0xa40> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | N/A |
CMPQ $0,-0x68(%RBP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (12.5%) |
MOV -0x70(%RBP),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
JE 5790b2 <hypre_CSRMatrixMatvecT.extracted.49+0xa12> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
VMOVDQU64 0x3c38c(%RIP),%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | vect (100.0%) |
MOV %R13,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
AND $-0x8,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA (,%R12,8),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA (%RDX,%RAX,1),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | scal (6.3%) |
LEA -0x1(%RCX),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
JMP 578fed <hypre_CSRMatrixMatvecT.extracted.49+0x94d> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
MOV -0x7c(%RBP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV $0x5d9f70,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | vect (25.0%) |
CALL 410170 <__kmpc_for_static_fini@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
MOV (%R15),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV $0x5d9f90,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
ADD $0x98,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
JMP 410560 <__kmpc_barrier@plt> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
VMOVDQU64 0x3c256(%RIP),%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | vect (100.0%) |
LEA 0x1(%RAX),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
AND $-0x8,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA (,%R12,8),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
AND $-0x8,%R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA 0x5(%RAX),%R14 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA 0x6(%RAX),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | N/A |
MOV %RAX,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %RCX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA 0x2(%RAX),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x1(%RDI),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RCX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA 0x3(%RAX),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RCX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA 0x4(%RAX),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RCX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA 0x7(%RAX),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %R15,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
JMP 579186 <hypre_CSRMatrixMatvecT.extracted.49+0xae6> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_CSRMatrixMatvecT.extracted.49– | 1.26 | 0.93 |
▼Loop 6542 - csr_matvec.c:560-567 - exec– | 0.34 | 0.24 |
○Loop 6546 - csr_matvec.c:564-567 - exec | 0.21 | 0.15 |
○Loop 6552 - csr_matvec.c:564-567 - exec | 0.21 | 0.15 |
○Loop 6549 - csr_matvec.c:564-567 - exec | 0.21 | 0.15 |
○Loop 6543 - csr_matvec.c:564-567 - exec | 0.20 | 0.14 |
▼Loop 6553 - csr_matvec.c:560-567 - exec– | 0.01 | 0.01 |
○Loop 6554 - csr_matvec.c:560-564 - exec | 0.00 | 0.00 |
▼Loop 6544 - csr_matvec.c:560-567 - exec– | 0.01 | 0.01 |
○Loop 6545 - csr_matvec.c:560-564 - exec | 0.00 | 0.00 |
▼Loop 6547 - csr_matvec.c:560-567 - exec– | 0.01 | 0.01 |
○Loop 6548 - csr_matvec.c:560-564 - exec | 0.00 | 0.00 |
▼Loop 6550 - csr_matvec.c:560-567 - exec– | 0.01 | 0.01 |
○Loop 6551 - csr_matvec.c:560-564 - exec | 0.00 | 0.00 |
▼Loop 6527 - csr_matvec.c:560-579 - exec– | 0.01 | 0.00 |
○Loop 6529 - csr_matvec.c:577-579 - exec | 0.01 | 0.00 |
○Loop 6533 - csr_matvec.c:577-579 - exec | 0.01 | 0.00 |
○Loop 6535 - csr_matvec.c:577-579 - exec | 0.01 | 0.00 |
○Loop 6531 - csr_matvec.c:577-579 - exec | 0.01 | 0.00 |
○Loop 6534 - csr_matvec.c:577-579 - exec | 0.00 | 0.00 |
○Loop 6530 - csr_matvec.c:577-579 - exec | 0.00 | 0.00 |
○Loop 6528 - csr_matvec.c:577-579 - exec | 0.00 | 0.00 |
○Loop 6532 - csr_matvec.c:577-579 - exec | 0.00 | 0.00 |
○Loop 6520 - csr_matvec.c:577-579 - exec | 0.00 | 0.00 |
○Loop 6521 - csr_matvec.c:577-579 - exec | 0.00 | 0.00 |
○Loop 6517 - csr_matvec.c:577-579 - exec | 0.00 | 0.00 |
○Loop 6516 - csr_matvec.c:577-579 - exec | 0.00 | 0.00 |
○Loop 6523 - csr_matvec.c:577-579 - exec | 0.00 | 0.00 |
○Loop 6518 - csr_matvec.c:577-579 - exec | 0.00 | 0.00 |
○Loop 6519 - csr_matvec.c:577-579 - exec | 0.00 | 0.00 |
○Loop 6522 - csr_matvec.c:577-579 - exec | 0.00 | 0.00 |
▼Loop 6538 - csr_matvec.c:560-567 - exec– | 0.00 | 0.00 |
○Loop 6539 - csr_matvec.c:564-567 - exec | 0.00 | 0.00 |
▼Loop 6540 - csr_matvec.c:560-567 - exec– | 0.00 | 0.00 |
○Loop 6541 - csr_matvec.c:560-564 - exec | 0.00 | 0.00 |
▼Loop 6525 - csr_matvec.c:560-579 - exec– | 0.00 | 0.00 |
○Loop 6526 - csr_matvec.c:577-579 - exec | 0.00 | 0.00 |
○Loop 6524 - csr_matvec.c:577-579 - exec | 0.00 | 0.00 |
▼Loop 6537 - csr_matvec.c:573-579 - exec– | 0.00 | 0.00 |
○Loop 6536 - csr_matvec.c:577-579 - exec | 0.00 | 0.00 |