Function: hypre_CSRMatrixTranspose.extracted | Module: exec | Source: csr_matop.c:380-560 [...] | Coverage: 0.15% |
---|
Function: hypre_CSRMatrixTranspose.extracted | Module: exec | Source: csr_matop.c:380-560 [...] | Coverage: 0.15% |
---|
/home/eoseret/qaas_runs_CPU_9468/171-586-9096/intel/AMG/build/AMG/AMG/seq_mv/csr_matop.c: 380 - 560 |
-------------------------------------------------------------------------------- |
380: return idx%dim1*dim2 + idx/dim1; |
[...] |
463: #pragma omp parallel |
464: #endif |
465: { |
466: HYPRE_Int num_threads = hypre_NumActiveThreads(); |
467: HYPRE_Int my_thread_num = hypre_GetThreadNum(); |
468: |
469: HYPRE_Int iBegin = hypre_CSRMatrixGetLoadBalancedPartitionBegin(A); |
470: HYPRE_Int iEnd = hypre_CSRMatrixGetLoadBalancedPartitionEnd(A); |
471: hypre_assert(iBegin <= iEnd); |
472: hypre_assert(iBegin >= 0 && iBegin <= num_rowsA); |
473: hypre_assert(iEnd >= 0 && iEnd <= num_rowsA); |
474: |
475: HYPRE_Int i, j; |
476: memset(bucket + my_thread_num*num_colsA, 0, sizeof(HYPRE_Int)*num_colsA); |
[...] |
483: for (j = A_i[iBegin]; j < A_i[iEnd]; ++j) { |
484: HYPRE_Int idx = A_j[j]; |
485: bucket[my_thread_num*num_colsA + idx]++; |
[...] |
496: for (i = my_thread_num*num_colsA + 1; i < (my_thread_num + 1)*num_colsA; ++i) { |
497: HYPRE_Int transpose_i = transpose_idx(i, num_threads, num_colsA); |
498: HYPRE_Int transpose_i_minus_1 = transpose_idx(i - 1, num_threads, num_colsA); |
499: |
500: bucket[transpose_i] += bucket[transpose_i_minus_1]; |
501: } |
502: |
503: #ifdef HYPRE_USING_OPENMP |
504: #pragma omp barrier |
505: #pragma omp master |
506: #endif |
507: { |
508: for (i = 1; i < num_threads; ++i) { |
509: HYPRE_Int j0 = num_colsA*i - 1, j1 = num_colsA*(i + 1) - 1; |
510: HYPRE_Int transpose_j0 = transpose_idx(j0, num_threads, num_colsA); |
511: HYPRE_Int transpose_j1 = transpose_idx(j1, num_threads, num_colsA); |
512: |
513: bucket[transpose_j1] += bucket[transpose_j0]; |
[...] |
520: if (my_thread_num > 0) { |
521: HYPRE_Int transpose_i0 = transpose_idx(num_colsA*my_thread_num - 1, num_threads, num_colsA); |
522: HYPRE_Int offset = bucket[transpose_i0]; |
523: |
524: for (i = my_thread_num*num_colsA; i < (my_thread_num + 1)*num_colsA - 1; ++i) { |
525: HYPRE_Int transpose_i = transpose_idx(i, num_threads, num_colsA); |
526: |
527: bucket[transpose_i] += offset; |
[...] |
539: if (data) { |
540: for (i = iEnd - 1; i >= iBegin; --i) { |
541: for (j = A_i[i + 1] - 1; j >= A_i[i]; --j) { |
542: HYPRE_Int idx = A_j[j]; |
543: --bucket[my_thread_num*num_colsA + idx]; |
544: |
545: HYPRE_Int offset = bucket[my_thread_num*num_colsA + idx]; |
546: |
547: AT_data[offset] = A_data[j]; |
548: AT_j[offset] = i; |
549: } |
550: } |
551: } |
552: else { |
553: for (i = iEnd - 1; i >= iBegin; --i) { |
554: for (j = A_i[i + 1] - 1; j >= A_i[i]; --j) { |
555: HYPRE_Int idx = A_j[j]; |
556: --bucket[my_thread_num*num_colsA + idx]; |
557: |
558: HYPRE_Int offset = bucket[my_thread_num*num_colsA + idx]; |
559: |
560: AT_j[offset] = i; |
0x4c3d30 PUSH %RBP |
0x4c3d31 MOV %RSP,%RBP |
0x4c3d34 PUSH %R15 |
0x4c3d36 PUSH %R14 |
0x4c3d38 PUSH %R13 |
0x4c3d3a PUSH %R12 |
0x4c3d3c PUSH %RBX |
0x4c3d3d SUB $0x48,%RSP |
0x4c3d41 MOV %R9,-0x40(%RBP) |
0x4c3d45 MOV %R8,-0x58(%RBP) |
0x4c3d49 MOV %RCX,-0x68(%RBP) |
0x4c3d4d MOV %RDX,%R12 |
0x4c3d50 MOV %RDI,%R15 |
0x4c3d53 CALL 4d1400 <hypre_NumActiveThreads> |
0x4c3d58 MOV %RAX,-0x48(%RBP) |
0x4c3d5c CALL 4d1410 <hypre_GetThreadNum> |
0x4c3d61 MOV %RAX,%R14 |
0x4c3d64 MOV %R12,%RDI |
0x4c3d67 CALL 4c5bc0 <hypre_CSRMatrixGetLoadBalancedPartitionBegin> |
0x4c3d6c MOV %RAX,%RBX |
0x4c3d6f MOV %R12,%RDI |
0x4c3d72 CALL 4c5c40 <hypre_CSRMatrixGetLoadBalancedPartitionEnd> |
0x4c3d77 MOV %RBX,%RCX |
0x4c3d7a MOV %RAX,%R12 |
0x4c3d7d CMP %RBX,%RAX |
0x4c3d80 MOV %RBX,%RAX |
0x4c3d83 MOV %RBX,-0x30(%RBP) |
0x4c3d87 JGE 4c3dbb |
0x4c3d89 MOV 0x5de70(%RIP),%RDI |
0x4c3d90 MOV $0x4fa05a,%ESI |
0x4c3d95 MOV $0x4fc003,%EDX |
0x4c3d9a XOR %EAX,%EAX |
0x4c3d9c CALL 4cf9e0 <hypre_fprintf> |
0x4c3da1 MOV $0x4fbf80,%EDI |
0x4c3da6 MOV $0x1d7,%ESI |
0x4c3dab MOV $0x1,%EDX |
0x4c3db0 XOR %ECX,%ECX |
0x4c3db2 CALL 4d2330 <hypre_error_handler> |
0x4c3db7 MOV -0x30(%RBP),%RCX |
0x4c3dbb MOV %R15,-0x38(%RBP) |
0x4c3dbf MOV 0x18(%RBP),%RBX |
0x4c3dc3 TEST %RCX,%RCX |
0x4c3dc6 JS 4c3dcd |
0x4c3dc8 CMP %RBX,%RCX |
0x4c3dcb JLE 4c3dfb |
0x4c3dcd MOV 0x5de2c(%RIP),%RDI |
0x4c3dd4 MOV $0x4fa05a,%ESI |
0x4c3dd9 MOV $0x4fc012,%EDX |
0x4c3dde XOR %EAX,%EAX |
0x4c3de0 CALL 4cf9e0 <hypre_fprintf> |
0x4c3de5 MOV $0x4fbf80,%EDI |
0x4c3dea MOV $0x1d8,%ESI |
0x4c3def MOV $0x1,%EDX |
0x4c3df4 XOR %ECX,%ECX |
0x4c3df6 CALL 4d2330 <hypre_error_handler> |
0x4c3dfb MOV 0x38(%RBP),%R15 |
0x4c3dff MOV 0x20(%RBP),%R13 |
0x4c3e03 TEST %R12,%R12 |
0x4c3e06 JS 4c3e0d |
0x4c3e08 CMP %RBX,%R12 |
0x4c3e0b JLE 4c3e3b |
0x4c3e0d MOV 0x5ddec(%RIP),%RDI |
0x4c3e14 MOV $0x4fa05a,%ESI |
0x4c3e19 MOV $0x4fc035,%EDX |
0x4c3e1e XOR %EAX,%EAX |
0x4c3e20 CALL 4cf9e0 <hypre_fprintf> |
0x4c3e25 MOV $0x4fbf80,%EDI |
0x4c3e2a MOV $0x1d9,%ESI |
0x4c3e2f MOV $0x1,%EDX |
0x4c3e34 XOR %ECX,%ECX |
0x4c3e36 CALL 4d2330 <hypre_error_handler> |
0x4c3e3b MOV 0x10(%RBP),%RBX |
0x4c3e3f MOV (%R13),%RDX |
0x4c3e43 MOV %RDX,%RAX |
0x4c3e46 IMUL %R14,%RAX |
0x4c3e4a LEA (%R15,%RAX,8),%RDI |
0x4c3e4e SAL $0x3,%RDX |
0x4c3e52 XOR %ESI,%ESI |
0x4c3e54 CALL 4d8930 <_intel_fast_memset> |
0x4c3e59 MOV -0x40(%RBP),%RDX |
0x4c3e5d MOV -0x30(%RBP),%RAX |
0x4c3e61 MOV (%RDX,%RAX,8),%RAX |
0x4c3e65 CMP (%RDX,%R12,8),%RAX |
0x4c3e69 JGE 4c3e89 |
0x4c3e6b MOV %RBX,%RSI |
0x4c3e6e XCHG %AX,%AX |
(3709) 0x4c3e70 MOV (%R13),%RCX |
(3709) 0x4c3e74 IMUL %R14,%RCX |
(3709) 0x4c3e78 ADD (%RSI,%RAX,8),%RCX |
(3709) 0x4c3e7c INCQ (%R15,%RCX,8) |
(3709) 0x4c3e80 INC %RAX |
(3709) 0x4c3e83 CMP (%RDX,%R12,8),%RAX |
(3709) 0x4c3e87 JL 4c3e70 |
0x4c3e89 MOV -0x38(%RBP),%RAX |
0x4c3e8d MOV (%RAX),%ESI |
0x4c3e8f MOV $0x520ab0,%EDI |
0x4c3e94 CALL 410570 <__kmpc_barrier@plt> |
0x4c3e99 MOV (%R13),%R9 |
0x4c3e9d MOV %R9,%RCX |
0x4c3ea0 IMUL %R14,%RCX |
0x4c3ea4 LEA 0x1(%R14),%RBX |
0x4c3ea8 LEA 0x1(%RCX),%RAX |
0x4c3eac MOV %R9,%RDX |
0x4c3eaf IMUL %RBX,%RDX |
0x4c3eb3 CMP %RDX,%RAX |
0x4c3eb6 MOV -0x48(%RBP),%R11 |
0x4c3eba JL 4c3fe9 |
0x4c3ec0 MOV %RBX,-0x60(%RBP) |
0x4c3ec4 MOV -0x38(%RBP),%RBX |
0x4c3ec8 MOV (%RBX),%ESI |
0x4c3eca MOV $0x520ad0,%EDI |
0x4c3ecf CALL 410570 <__kmpc_barrier@plt> |
0x4c3ed4 MOV (%RBX),%ESI |
0x4c3ed6 MOV $0x520af0,%EDI |
0x4c3edb XOR %EDX,%EDX |
0x4c3edd CALL 4106e0 <__kmpc_masked@plt> |
0x4c3ee2 CMP $0x1,%EAX |
0x4c3ee5 JNE 4c4144 |
0x4c3eeb MOV -0x48(%RBP),%RBX |
0x4c3eef CMP $0x1,%RBX |
0x4c3ef3 JLE 4c4134 |
0x4c3ef9 LEA -0x1(%RBX),%RAX |
0x4c3efd MOV %RAX,-0x50(%RBP) |
0x4c3f01 CMP $0x4,%RAX |
0x4c3f05 JAE 4c43ad |
0x4c3f0b MOV -0x50(%RBP),%RAX |
0x4c3f0f MOV %RAX,%R8 |
0x4c3f12 AND $-0x4,%R8 |
0x4c3f16 CMP %RAX,%R8 |
0x4c3f19 JAE 4c4134 |
0x4c3f1f INC %R8 |
0x4c3f22 JMP 4c3f54 |
0x4c3f24 NOPW %CS:(%RAX,%RAX,1) |
(3706) 0x4c3f30 CQTO |
(3706) 0x4c3f32 IDIV %RBX |
(3706) 0x4c3f35 IMUL %RDI,%RCX |
(3706) 0x4c3f39 ADD %RSI,%RCX |
(3706) 0x4c3f3c MOV (%R15,%RCX,8),%RCX |
(3706) 0x4c3f40 IMUL %RDI,%RDX |
(3706) 0x4c3f44 ADD %RAX,%RDX |
(3706) 0x4c3f47 ADD %RCX,(%R15,%RDX,8) |
(3706) 0x4c3f4b CMP %R8,%RBX |
(3706) 0x4c3f4e JE 4c4134 |
(3706) 0x4c3f54 MOV (%R13),%RDI |
(3706) 0x4c3f58 MOV %RDI,%RAX |
(3706) 0x4c3f5b IMUL %R8,%RAX |
(3706) 0x4c3f5f DEC %RAX |
(3706) 0x4c3f62 MOV %RAX,%RCX |
(3706) 0x4c3f65 OR %RBX,%RCX |
(3706) 0x4c3f68 SHR $0x20,%RCX |
(3706) 0x4c3f6c JE 4c3f80 |
(3706) 0x4c3f6e CQTO |
(3706) 0x4c3f70 IDIV %RBX |
(3706) 0x4c3f73 MOV %RDX,%RCX |
(3706) 0x4c3f76 MOV %RAX,%RSI |
(3706) 0x4c3f79 JMP 4c3f88 |
0x4c3f7b NOPL (%RAX,%RAX,1) |
(3706) 0x4c3f80 XOR %EDX,%EDX |
(3706) 0x4c3f82 DIV %EBX |
(3706) 0x4c3f84 MOV %EDX,%ECX |
(3706) 0x4c3f86 MOV %EAX,%ESI |
(3706) 0x4c3f88 INC %R8 |
(3706) 0x4c3f8b MOV %RDI,%RAX |
(3706) 0x4c3f8e IMUL %R8,%RAX |
(3706) 0x4c3f92 DEC %RAX |
(3706) 0x4c3f95 MOV %RAX,%RDX |
(3706) 0x4c3f98 OR %RBX,%RDX |
(3706) 0x4c3f9b SHR $0x20,%RDX |
(3706) 0x4c3f9f JNE 4c3f30 |
(3706) 0x4c3fa1 XOR %EDX,%EDX |
(3706) 0x4c3fa3 DIV %EBX |
(3706) 0x4c3fa5 JMP 4c3f35 |
0x4c3fa7 NOPW (%RAX,%RAX,1) |
(3708) 0x4c3fb0 MOV %R8,%RAX |
(3708) 0x4c3fb3 CQTO |
(3708) 0x4c3fb5 IDIV %R11 |
(3708) 0x4c3fb8 IMUL %R9,%RDI |
(3708) 0x4c3fbc ADD %RDI,%RSI |
(3708) 0x4c3fbf MOV (%R15,%RSI,8),%RSI |
(3708) 0x4c3fc3 IMUL %R9,%RDX |
(3708) 0x4c3fc7 ADD %RAX,%RDX |
(3708) 0x4c3fca ADD %RSI,(%R15,%RDX,8) |
(3708) 0x4c3fce MOV (%R13),%R9 |
(3708) 0x4c3fd2 MOV %RBX,%RAX |
(3708) 0x4c3fd5 IMUL %R9,%RAX |
(3708) 0x4c3fd9 ADD $0x5,%RCX |
(3708) 0x4c3fdd CMP %RAX,%RCX |
(3708) 0x4c3fe0 MOV %R8,%RCX |
(3708) 0x4c3fe3 JGE 4c3ec0 |
(3708) 0x4c3fe9 LEA 0x1(%RCX),%RAX |
(3708) 0x4c3fed MOV %RAX,%RDX |
(3708) 0x4c3ff0 OR %R11,%RDX |
(3708) 0x4c3ff3 SHR $0x20,%RDX |
(3708) 0x4c3ff7 JE 4c4010 |
(3708) 0x4c3ff9 CQTO |
(3708) 0x4c3ffb IDIV %R11 |
(3708) 0x4c3ffe MOV %RDX,%RDI |
(3708) 0x4c4001 MOV %RAX,%RSI |
(3708) 0x4c4004 JMP 4c4019 |
0x4c4006 NOPW %CS:(%RAX,%RAX,1) |
(3708) 0x4c4010 XOR %EDX,%EDX |
(3708) 0x4c4012 DIV %R11D |
(3708) 0x4c4015 MOV %EDX,%EDI |
(3708) 0x4c4017 MOV %EAX,%ESI |
(3708) 0x4c4019 MOV %RCX,%RAX |
(3708) 0x4c401c OR %R11,%RAX |
(3708) 0x4c401f SHR $0x20,%RAX |
(3708) 0x4c4023 JE 4c4030 |
(3708) 0x4c4025 MOV %RCX,%RAX |
(3708) 0x4c4028 CQTO |
(3708) 0x4c402a IDIV %R11 |
(3708) 0x4c402d JMP 4c4037 |
0x4c402f NOP |
(3708) 0x4c4030 MOV %ECX,%EAX |
(3708) 0x4c4032 XOR %EDX,%EDX |
(3708) 0x4c4034 DIV %R11D |
(3708) 0x4c4037 IMUL %R9,%RDX |
(3708) 0x4c403b ADD %RAX,%RDX |
(3708) 0x4c403e MOV (%R15,%RDX,8),%RAX |
(3708) 0x4c4042 IMUL %RDI,%R9 |
(3708) 0x4c4046 ADD %RSI,%R9 |
(3708) 0x4c4049 ADD %RAX,(%R15,%R9,8) |
(3708) 0x4c404d MOV (%R13),%R10 |
(3708) 0x4c4051 LEA 0x2(%RCX),%RAX |
(3708) 0x4c4055 MOV %RBX,%RDX |
(3708) 0x4c4058 IMUL %R10,%RDX |
(3708) 0x4c405c CMP %RDX,%RAX |
(3708) 0x4c405f JGE 4c3ec0 |
(3708) 0x4c4065 MOV %RAX,%RDX |
(3708) 0x4c4068 OR %R11,%RDX |
(3708) 0x4c406b SHR $0x20,%RDX |
(3708) 0x4c406f JE 4c4080 |
(3708) 0x4c4071 CQTO |
(3708) 0x4c4073 IDIV %R11 |
(3708) 0x4c4076 MOV %RDX,%R9 |
(3708) 0x4c4079 MOV %RAX,%R8 |
(3708) 0x4c407c JMP 4c408b |
0x4c407e XCHG %AX,%AX |
(3708) 0x4c4080 XOR %EDX,%EDX |
(3708) 0x4c4082 DIV %R11D |
(3708) 0x4c4085 MOV %EDX,%R9D |
(3708) 0x4c4088 MOV %EAX,%R8D |
(3708) 0x4c408b IMUL %R10,%RDI |
(3708) 0x4c408f ADD %RDI,%RSI |
(3708) 0x4c4092 MOV (%R15,%RSI,8),%RAX |
(3708) 0x4c4096 IMUL %R9,%R10 |
(3708) 0x4c409a ADD %R8,%R10 |
(3708) 0x4c409d ADD %RAX,(%R15,%R10,8) |
(3708) 0x4c40a1 MOV (%R13),%R10 |
(3708) 0x4c40a5 LEA 0x3(%RCX),%RAX |
(3708) 0x4c40a9 MOV %RBX,%RDX |
(3708) 0x4c40ac IMUL %R10,%RDX |
(3708) 0x4c40b0 CMP %RDX,%RAX |
(3708) 0x4c40b3 JGE 4c3ec0 |
(3708) 0x4c40b9 MOV %RAX,%RDX |
(3708) 0x4c40bc OR %R11,%RDX |
(3708) 0x4c40bf SHR $0x20,%RDX |
(3708) 0x4c40c3 JE 4c40e0 |
(3708) 0x4c40c5 CQTO |
(3708) 0x4c40c7 IDIV %R11 |
(3708) 0x4c40ca MOV %RDX,%RDI |
(3708) 0x4c40cd MOV %RAX,%RSI |
(3708) 0x4c40d0 JMP 4c40e9 |
0x4c40d2 NOPW %CS:(%RAX,%RAX,1) |
(3708) 0x4c40e0 XOR %EDX,%EDX |
(3708) 0x4c40e2 DIV %R11D |
(3708) 0x4c40e5 MOV %EDX,%EDI |
(3708) 0x4c40e7 MOV %EAX,%ESI |
(3708) 0x4c40e9 IMUL %R10,%R9 |
(3708) 0x4c40ed ADD %R9,%R8 |
(3708) 0x4c40f0 MOV (%R15,%R8,8),%RAX |
(3708) 0x4c40f4 IMUL %RDI,%R10 |
(3708) 0x4c40f8 ADD %RSI,%R10 |
(3708) 0x4c40fb ADD %RAX,(%R15,%R10,8) |
(3708) 0x4c40ff MOV (%R13),%R9 |
(3708) 0x4c4103 LEA 0x4(%RCX),%R8 |
(3708) 0x4c4107 MOV %RBX,%RAX |
(3708) 0x4c410a IMUL %R9,%RAX |
(3708) 0x4c410e CMP %RAX,%R8 |
(3708) 0x4c4111 JGE 4c3ec0 |
(3708) 0x4c4117 MOV %R8,%RAX |
(3708) 0x4c411a OR %R11,%RAX |
(3708) 0x4c411d SHR $0x20,%RAX |
(3708) 0x4c4121 JNE 4c3fb0 |
(3708) 0x4c4127 MOV %R8D,%EAX |
(3708) 0x4c412a XOR %EDX,%EDX |
(3708) 0x4c412c DIV %R11D |
(3708) 0x4c412f JMP 4c3fb8 |
0x4c4134 MOV -0x38(%RBP),%RBX |
0x4c4138 MOV (%RBX),%ESI |
0x4c413a MOV $0x520b10,%EDI |
0x4c413f CALL 410500 <__kmpc_end_masked@plt> |
0x4c4144 MOV (%RBX),%ESI |
0x4c4146 MOV $0x520b30,%EDI |
0x4c414b CALL 410570 <__kmpc_barrier@plt> |
0x4c4150 TEST %R14,%R14 |
0x4c4153 MOV -0x48(%RBP),%R8 |
0x4c4157 MOV -0x60(%RBP),%R9 |
0x4c415b JLE 4c42c1 |
0x4c4161 MOV (%R13),%RDI |
0x4c4165 MOV %R14,%RCX |
0x4c4168 IMUL %RDI,%RCX |
0x4c416c LEA -0x1(%RCX),%RAX |
0x4c4170 MOV %RAX,%RDX |
0x4c4173 OR %R8,%RDX |
0x4c4176 SHR $0x20,%RDX |
0x4c417a JE 4c4183 |
0x4c417c CQTO |
0x4c417e IDIV %R8 |
0x4c4181 JMP 4c4188 |
0x4c4183 XOR %EDX,%EDX |
0x4c4185 DIV %R8D |
0x4c4188 MOV %RDI,%RSI |
0x4c418b IMUL %R9,%RSI |
0x4c418f DEC %RSI |
0x4c4192 CMP %RSI,%RCX |
0x4c4195 JGE 4c42c1 |
0x4c419b IMUL %RDI,%RDX |
0x4c419f ADD %RAX,%RDX |
0x4c41a2 MOV (%R15,%RDX,8),%RSI |
0x4c41a6 JMP 4c41db |
0x4c41a8 NOPL (%RAX,%RAX,1) |
(3705) 0x4c41b0 CQTO |
(3705) 0x4c41b2 IDIV %R8 |
(3705) 0x4c41b5 IMUL %RDX,%RDI |
(3705) 0x4c41b9 ADD %RAX,%RDI |
(3705) 0x4c41bc ADD %RSI,(%R15,%RDI,8) |
(3705) 0x4c41c0 MOV (%R13),%RDI |
(3705) 0x4c41c4 MOV %R9,%RAX |
(3705) 0x4c41c7 IMUL %RDI,%RAX |
(3705) 0x4c41cb DEC %RAX |
(3705) 0x4c41ce ADD $0x4,%RCX |
(3705) 0x4c41d2 CMP %RAX,%RCX |
(3705) 0x4c41d5 JGE 4c42c1 |
(3705) 0x4c41db MOV %RCX,%RAX |
(3705) 0x4c41de OR %R8,%RAX |
(3705) 0x4c41e1 SHR $0x20,%RAX |
(3705) 0x4c41e5 JE 4c4200 |
(3705) 0x4c41e7 MOV %RCX,%RAX |
(3705) 0x4c41ea CQTO |
(3705) 0x4c41ec IDIV %R8 |
(3705) 0x4c41ef JMP 4c4207 |
0x4c41f1 NOPW %CS:(%RAX,%RAX,1) |
(3705) 0x4c4200 MOV %ECX,%EAX |
(3705) 0x4c4202 XOR %EDX,%EDX |
(3705) 0x4c4204 DIV %R8D |
(3705) 0x4c4207 IMUL %RDX,%RDI |
(3705) 0x4c420b ADD %RAX,%RDI |
(3705) 0x4c420e ADD %RSI,(%R15,%RDI,8) |
(3705) 0x4c4212 MOV (%R13),%RDI |
(3705) 0x4c4216 LEA 0x1(%RCX),%RAX |
(3705) 0x4c421a MOV %R9,%RDX |
(3705) 0x4c421d IMUL %RDI,%RDX |
(3705) 0x4c4221 DEC %RDX |
(3705) 0x4c4224 CMP %RDX,%RAX |
(3705) 0x4c4227 JGE 4c42c1 |
(3705) 0x4c422d MOV %RAX,%RDX |
(3705) 0x4c4230 OR %R8,%RDX |
(3705) 0x4c4233 SHR $0x20,%RDX |
(3705) 0x4c4237 JE 4c4240 |
(3705) 0x4c4239 CQTO |
(3705) 0x4c423b IDIV %R8 |
(3705) 0x4c423e JMP 4c4245 |
(3705) 0x4c4240 XOR %EDX,%EDX |
(3705) 0x4c4242 DIV %R8D |
(3705) 0x4c4245 IMUL %RDX,%RDI |
(3705) 0x4c4249 ADD %RAX,%RDI |
(3705) 0x4c424c ADD %RSI,(%R15,%RDI,8) |
(3705) 0x4c4250 MOV (%R13),%RDI |
(3705) 0x4c4254 LEA 0x2(%RCX),%RAX |
(3705) 0x4c4258 MOV %R9,%RDX |
(3705) 0x4c425b IMUL %RDI,%RDX |
(3705) 0x4c425f DEC %RDX |
(3705) 0x4c4262 CMP %RDX,%RAX |
(3705) 0x4c4265 JGE 4c42c1 |
(3705) 0x4c4267 MOV %RAX,%RDX |
(3705) 0x4c426a OR %R8,%RDX |
(3705) 0x4c426d SHR $0x20,%RDX |
(3705) 0x4c4271 JE 4c4280 |
(3705) 0x4c4273 CQTO |
(3705) 0x4c4275 IDIV %R8 |
(3705) 0x4c4278 JMP 4c4285 |
0x4c427a NOPW (%RAX,%RAX,1) |
(3705) 0x4c4280 XOR %EDX,%EDX |
(3705) 0x4c4282 DIV %R8D |
(3705) 0x4c4285 IMUL %RDX,%RDI |
(3705) 0x4c4289 ADD %RAX,%RDI |
(3705) 0x4c428c ADD %RSI,(%R15,%RDI,8) |
(3705) 0x4c4290 MOV (%R13),%RDI |
(3705) 0x4c4294 LEA 0x3(%RCX),%RAX |
(3705) 0x4c4298 MOV %R9,%RDX |
(3705) 0x4c429b IMUL %RDI,%RDX |
(3705) 0x4c429f DEC %RDX |
(3705) 0x4c42a2 CMP %RDX,%RAX |
(3705) 0x4c42a5 JGE 4c42c1 |
(3705) 0x4c42a7 MOV %RAX,%RDX |
(3705) 0x4c42aa OR %R8,%RDX |
(3705) 0x4c42ad SHR $0x20,%RDX |
(3705) 0x4c42b1 JNE 4c41b0 |
(3705) 0x4c42b7 XOR %EDX,%EDX |
(3705) 0x4c42b9 DIV %R8D |
(3705) 0x4c42bc JMP 4c41b5 |
0x4c42c1 MOV 0x30(%RBP),%RBX |
0x4c42c5 MOV -0x38(%RBP),%RAX |
0x4c42c9 MOV (%RAX),%ESI |
0x4c42cb MOV $0x520b50,%EDI |
0x4c42d0 CALL 410570 <__kmpc_barrier@plt> |
0x4c42d5 CMPQ $0,-0x68(%RBP) |
0x4c42da JE 4c4371 |
0x4c42e0 MOV -0x30(%RBP),%R8 |
0x4c42e4 CMP %R8,%R12 |
0x4c42e7 MOV -0x40(%RBP),%RDI |
0x4c42eb MOV 0x10(%RBP),%R9 |
0x4c42ef MOV -0x58(%RBP),%R10 |
0x4c42f3 JLE 4c461e |
0x4c42f9 MOV 0x28(%RBP),%RAX |
0x4c42fd MOV (%RDI,%R12,8),%RCX |
0x4c4301 JMP 4c431c |
0x4c4303 NOPW %CS:(%RAX,%RAX,1) |
(3703) 0x4c4310 MOV %RDX,%RCX |
(3703) 0x4c4313 CMP %R8,%R12 |
(3703) 0x4c4316 JLE 4c461e |
(3703) 0x4c431c MOV -0x8(%RDI,%R12,8),%RDX |
(3703) 0x4c4321 DEC %R12 |
(3703) 0x4c4324 CMP %RDX,%RCX |
(3703) 0x4c4327 JLE 4c4310 |
(3703) 0x4c4329 NOPL (%RAX) |
(3704) 0x4c4330 MOV -0x8(%R9,%RCX,8),%RDX |
(3704) 0x4c4335 MOV (%R13),%RSI |
(3704) 0x4c4339 IMUL %R14,%RSI |
(3704) 0x4c433d ADD %RDX,%RSI |
(3704) 0x4c4340 DECQ (%R15,%RSI,8) |
(3704) 0x4c4344 MOV (%R13),%RSI |
(3704) 0x4c4348 IMUL %R14,%RSI |
(3704) 0x4c434c ADD %RDX,%RSI |
(3704) 0x4c434f MOV (%R15,%RSI,8),%RDX |
(3704) 0x4c4353 VMOVSD -0x8(%R10,%RCX,8),%XMM0 |
(3704) 0x4c435a VMOVSD %XMM0,(%RAX,%RDX,8) |
(3704) 0x4c435f DEC %RCX |
(3704) 0x4c4362 MOV %R12,(%RBX,%RDX,8) |
(3704) 0x4c4366 MOV (%RDI,%R12,8),%RDX |
(3704) 0x4c436a CMP %RDX,%RCX |
(3704) 0x4c436d JG 4c4330 |
(3703) 0x4c436f JMP 4c4310 |
0x4c4371 MOV -0x30(%RBP),%R9 |
0x4c4375 CMP %R9,%R12 |
0x4c4378 MOV -0x40(%RBP),%R8 |
0x4c437c MOV 0x10(%RBP),%R10 |
0x4c4380 JLE 4c461e |
0x4c4386 MOV (%R8,%R12,8),%RCX |
0x4c438a MOV %R12D,%EAX |
0x4c438d SUB %R9D,%EAX |
0x4c4390 LEA 0x1(%R9),%RDX |
0x4c4394 TEST $0x1,%AL |
0x4c4396 JNE 4c45db |
0x4c439c MOV %R12,%RAX |
0x4c439f CMP %RDX,%R12 |
0x4c43a2 JNE 4c4635 |
0x4c43a8 JMP 4c461e |
0x4c43ad MOV -0x50(%RBP),%R8 |
0x4c43b1 SHR $0x2,%R8 |
0x4c43b5 XOR %R9D,%R9D |
0x4c43b8 JMP 4c43e7 |
0x4c43ba NOPW (%RAX,%RAX,1) |
(3707) 0x4c43c0 CQTO |
(3707) 0x4c43c2 IDIV %RBX |
(3707) 0x4c43c5 IMUL %R10,%RCX |
(3707) 0x4c43c9 ADD %RSI,%RCX |
(3707) 0x4c43cc MOV (%R15,%RCX,8),%RCX |
(3707) 0x4c43d0 IMUL %R10,%RDX |
(3707) 0x4c43d4 ADD %RAX,%RDX |
(3707) 0x4c43d7 ADD %RCX,(%R15,%RDX,8) |
(3707) 0x4c43db INC %R9 |
(3707) 0x4c43de CMP %R9,%R8 |
(3707) 0x4c43e1 JE 4c3f0b |
(3707) 0x4c43e7 MOV (%R13),%R10 |
(3707) 0x4c43eb MOV %R10,%R11 |
(3707) 0x4c43ee IMUL %R9,%R11 |
(3707) 0x4c43f2 LEA (%R10,%R11,4),%RAX |
(3707) 0x4c43f6 DEC %RAX |
(3707) 0x4c43f9 MOV %RAX,%RCX |
(3707) 0x4c43fc OR %RBX,%RCX |
(3707) 0x4c43ff SHR $0x20,%RCX |
(3707) 0x4c4403 JE 4c4420 |
(3707) 0x4c4405 CQTO |
(3707) 0x4c4407 IDIV %RBX |
(3707) 0x4c440a MOV %RDX,%RCX |
(3707) 0x4c440d MOV %RAX,%RSI |
(3707) 0x4c4410 JMP 4c4428 |
0x4c4412 NOPW %CS:(%RAX,%RAX,1) |
(3707) 0x4c4420 XOR %EDX,%EDX |
(3707) 0x4c4422 DIV %EBX |
(3707) 0x4c4424 MOV %EDX,%ECX |
(3707) 0x4c4426 MOV %EAX,%ESI |
(3707) 0x4c4428 SAL $0x2,%R11 |
(3707) 0x4c442c LEA (%R11,%R10,2),%RAX |
(3707) 0x4c4430 DEC %RAX |
(3707) 0x4c4433 MOV %RAX,%RDX |
(3707) 0x4c4436 OR %RBX,%RDX |
(3707) 0x4c4439 SHR $0x20,%RDX |
(3707) 0x4c443d JE 4c4450 |
(3707) 0x4c443f CQTO |
(3707) 0x4c4441 IDIV %RBX |
(3707) 0x4c4444 JMP 4c4454 |
0x4c4446 NOPW %CS:(%RAX,%RAX,1) |
(3707) 0x4c4450 XOR %EDX,%EDX |
(3707) 0x4c4452 DIV %EBX |
(3707) 0x4c4454 IMUL %R10,%RCX |
(3707) 0x4c4458 ADD %RSI,%RCX |
(3707) 0x4c445b MOV (%R15,%RCX,8),%RCX |
(3707) 0x4c445f IMUL %R10,%RDX |
(3707) 0x4c4463 ADD %RAX,%RDX |
(3707) 0x4c4466 ADD %RCX,(%R15,%RDX,8) |
(3707) 0x4c446a MOV (%R13),%R10 |
(3707) 0x4c446e MOV %R10,%R11 |
(3707) 0x4c4471 IMUL %R9,%R11 |
(3707) 0x4c4475 SAL $0x2,%R11 |
(3707) 0x4c4479 LEA (%R11,%R10,2),%RAX |
(3707) 0x4c447d DEC %RAX |
(3707) 0x4c4480 MOV %RAX,%RCX |
(3707) 0x4c4483 OR %RBX,%RCX |
(3707) 0x4c4486 SHR $0x20,%RCX |
(3707) 0x4c448a JE 4c44a0 |
(3707) 0x4c448c CQTO |
(3707) 0x4c448e IDIV %RBX |
(3707) 0x4c4491 MOV %RDX,%RCX |
(3707) 0x4c4494 MOV %RAX,%RSI |
(3707) 0x4c4497 JMP 4c44a8 |
0x4c4499 NOPL (%RAX) |
(3707) 0x4c44a0 XOR %EDX,%EDX |
(3707) 0x4c44a2 DIV %EBX |
(3707) 0x4c44a4 MOV %EDX,%ECX |
(3707) 0x4c44a6 MOV %EAX,%ESI |
(3707) 0x4c44a8 LEA (%R10,%R10,2),%RAX |
(3707) 0x4c44ac ADD %R11,%RAX |
(3707) 0x4c44af DEC %RAX |
(3707) 0x4c44b2 MOV %RAX,%RDX |
(3707) 0x4c44b5 OR %RBX,%RDX |
(3707) 0x4c44b8 SHR $0x20,%RDX |
(3707) 0x4c44bc JE 4c44d0 |
(3707) 0x4c44be CQTO |
(3707) 0x4c44c0 IDIV %RBX |
(3707) 0x4c44c3 JMP 4c44d4 |
0x4c44c5 NOPW %CS:(%RAX,%RAX,1) |
(3707) 0x4c44d0 XOR %EDX,%EDX |
(3707) 0x4c44d2 DIV %EBX |
(3707) 0x4c44d4 MOV %RBX,%RDI |
(3707) 0x4c44d7 IMUL %R10,%RCX |
(3707) 0x4c44db ADD %RSI,%RCX |
(3707) 0x4c44de MOV (%R15,%RCX,8),%RCX |
(3707) 0x4c44e2 IMUL %R10,%RDX |
(3707) 0x4c44e6 ADD %RAX,%RDX |
(3707) 0x4c44e9 ADD %RCX,(%R15,%RDX,8) |
(3707) 0x4c44ed MOV (%R13),%R10 |
(3707) 0x4c44f1 LEA (%R10,%R10,2),%RAX |
(3707) 0x4c44f5 LEA (,%R10,4),%R11 |
(3707) 0x4c44fd MOV %R11,%RBX |
(3707) 0x4c4500 IMUL %R9,%RBX |
(3707) 0x4c4504 ADD %RBX,%RAX |
(3707) 0x4c4507 DEC %RAX |
(3707) 0x4c450a MOV %RAX,%RCX |
(3707) 0x4c450d OR %RDI,%RCX |
(3707) 0x4c4510 SHR $0x20,%RCX |
(3707) 0x4c4514 JE 4c4530 |
(3707) 0x4c4516 CQTO |
(3707) 0x4c4518 IDIV %RDI |
(3707) 0x4c451b MOV %RDX,%RCX |
(3707) 0x4c451e MOV %RAX,%RSI |
(3707) 0x4c4521 JMP 4c4538 |
0x4c4523 NOPW %CS:(%RAX,%RAX,1) |
(3707) 0x4c4530 XOR %EDX,%EDX |
(3707) 0x4c4532 DIV %EDI |
(3707) 0x4c4534 MOV %EDX,%ECX |
(3707) 0x4c4536 MOV %EAX,%ESI |
(3707) 0x4c4538 LEA (%R11,%RBX,1),%RAX |
(3707) 0x4c453c DEC %RAX |
(3707) 0x4c453f MOV %RAX,%RDX |
(3707) 0x4c4542 OR %RDI,%RDX |
(3707) 0x4c4545 SHR $0x20,%RDX |
(3707) 0x4c4549 MOV %RDI,%RBX |
(3707) 0x4c454c JE 4c4560 |
(3707) 0x4c454e CQTO |
(3707) 0x4c4550 IDIV %RBX |
(3707) 0x4c4553 JMP 4c4564 |
0x4c4555 NOPW %CS:(%RAX,%RAX,1) |
(3707) 0x4c4560 XOR %EDX,%EDX |
(3707) 0x4c4562 DIV %EBX |
(3707) 0x4c4564 IMUL %R10,%RCX |
(3707) 0x4c4568 ADD %RSI,%RCX |
(3707) 0x4c456b MOV (%R15,%RCX,8),%RCX |
(3707) 0x4c456f IMUL %R10,%RDX |
(3707) 0x4c4573 ADD %RAX,%RDX |
(3707) 0x4c4576 ADD %RCX,(%R15,%RDX,8) |
(3707) 0x4c457a MOV (%R13),%R10 |
(3707) 0x4c457e LEA (,%R10,4),%R11 |
(3707) 0x4c4586 IMUL %R9,%R11 |
(3707) 0x4c458a LEA (%R11,%R10,4),%RAX |
(3707) 0x4c458e DEC %RAX |
(3707) 0x4c4591 MOV %RAX,%RCX |
(3707) 0x4c4594 OR %RBX,%RCX |
(3707) 0x4c4597 SHR $0x20,%RCX |
(3707) 0x4c459b JE 4c45b0 |
(3707) 0x4c459d CQTO |
(3707) 0x4c459f IDIV %RBX |
(3707) 0x4c45a2 MOV %RDX,%RCX |
(3707) 0x4c45a5 MOV %RAX,%RSI |
(3707) 0x4c45a8 JMP 4c45b8 |
0x4c45aa NOPW (%RAX,%RAX,1) |
(3707) 0x4c45b0 XOR %EDX,%EDX |
(3707) 0x4c45b2 DIV %EBX |
(3707) 0x4c45b4 MOV %EDX,%ECX |
(3707) 0x4c45b6 MOV %EAX,%ESI |
(3707) 0x4c45b8 LEA (%R10,%R10,4),%RAX |
(3707) 0x4c45bc ADD %R11,%RAX |
(3707) 0x4c45bf DEC %RAX |
(3707) 0x4c45c2 MOV %RAX,%RDX |
(3707) 0x4c45c5 OR %RBX,%RDX |
(3707) 0x4c45c8 SHR $0x20,%RDX |
(3707) 0x4c45cc JNE 4c43c0 |
(3707) 0x4c45d2 XOR %EDX,%EDX |
(3707) 0x4c45d4 DIV %EBX |
(3707) 0x4c45d6 JMP 4c43c5 |
0x4c45db LEA -0x1(%R12),%RAX |
(3702) 0x4c45e0 MOV -0x8(%R8,%R12,8),%RSI |
(3702) 0x4c45e5 CMP %RSI,%RCX |
(3702) 0x4c45e8 JLE 4c4616 |
(3702) 0x4c45ea MOV -0x8(%R10,%RCX,8),%RSI |
(3702) 0x4c45ef MOV (%R13),%RDI |
(3702) 0x4c45f3 IMUL %R14,%RDI |
(3702) 0x4c45f7 ADD %RSI,%RDI |
(3702) 0x4c45fa DECQ (%R15,%RDI,8) |
(3702) 0x4c45fe DEC %RCX |
(3702) 0x4c4601 MOV (%R13),%RDI |
(3702) 0x4c4605 IMUL %R14,%RDI |
(3702) 0x4c4609 ADD %RSI,%RDI |
(3702) 0x4c460c MOV (%R15,%RDI,8),%RSI |
(3702) 0x4c4610 MOV %RAX,(%RBX,%RSI,8) |
(3702) 0x4c4614 JMP 4c45e0 |
0x4c4616 MOV %RSI,%RCX |
0x4c4619 CMP %RDX,%R12 |
0x4c461c JNE 4c4635 |
0x4c461e ADD $0x48,%RSP |
0x4c4622 POP %RBX |
0x4c4623 POP %R12 |
0x4c4625 POP %R13 |
0x4c4627 POP %R14 |
0x4c4629 POP %R15 |
0x4c462b POP %RBP |
0x4c462c RET |
0x4c462d NOPL (%RAX) |
(3699) 0x4c4630 CMP %R9,%RAX |
(3699) 0x4c4633 JLE 4c461e |
(3699) 0x4c4635 MOV -0x8(%R8,%RAX,8),%RDX |
(3699) 0x4c463a CMP %RDX,%RCX |
(3699) 0x4c463d JLE 4c4684 |
(3699) 0x4c463f LEA -0x1(%RAX),%RSI |
(3699) 0x4c4643 NOPW %CS:(%RAX,%RAX,1) |
(3701) 0x4c4650 MOV -0x8(%R10,%RCX,8),%RDX |
(3701) 0x4c4655 MOV (%R13),%RDI |
(3701) 0x4c4659 IMUL %R14,%RDI |
(3701) 0x4c465d ADD %RDX,%RDI |
(3701) 0x4c4660 DECQ (%R15,%RDI,8) |
(3701) 0x4c4664 DEC %RCX |
(3701) 0x4c4667 MOV (%R13),%RDI |
(3701) 0x4c466b IMUL %R14,%RDI |
(3701) 0x4c466f ADD %RDX,%RDI |
(3701) 0x4c4672 MOV (%R15,%RDI,8),%RDX |
(3701) 0x4c4676 MOV %RSI,(%RBX,%RDX,8) |
(3701) 0x4c467a MOV -0x8(%R8,%RAX,8),%RDX |
(3701) 0x4c467f CMP %RDX,%RCX |
(3701) 0x4c4682 JG 4c4650 |
(3699) 0x4c4684 MOV -0x10(%R8,%RAX,8),%RCX |
(3699) 0x4c4689 ADD $-0x2,%RAX |
(3699) 0x4c468d CMP %RCX,%RDX |
(3699) 0x4c4690 JLE 4c4630 |
(3699) 0x4c4692 NOPW %CS:(%RAX,%RAX,1) |
(3700) 0x4c46a0 MOV -0x8(%R10,%RDX,8),%RCX |
(3700) 0x4c46a5 MOV (%R13),%RSI |
(3700) 0x4c46a9 IMUL %R14,%RSI |
(3700) 0x4c46ad ADD %RCX,%RSI |
(3700) 0x4c46b0 DECQ (%R15,%RSI,8) |
(3700) 0x4c46b4 DEC %RDX |
(3700) 0x4c46b7 MOV (%R13),%RSI |
(3700) 0x4c46bb IMUL %R14,%RSI |
(3700) 0x4c46bf ADD %RCX,%RSI |
(3700) 0x4c46c2 MOV (%R15,%RSI,8),%RCX |
(3700) 0x4c46c6 MOV %RAX,(%RBX,%RCX,8) |
(3700) 0x4c46ca MOV (%R8,%RAX,8),%RCX |
(3700) 0x4c46ce CMP %RCX,%RDX |
(3700) 0x4c46d1 JG 4c46a0 |
(3699) 0x4c46d3 JMP 4c4630 |
0x4c46d8 NOPL (%RAX,%RAX,1) |
Path / |
Source file and lines | csr_matop.c:380-560 |
Module | exec |
nb instructions | 226 |
nb uops | 250 |
loop length | 942 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 14 |
micro-operation queue | 41.83 cycles |
front end | 41.83 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 16.30 | 16.20 | 17.00 | 17.00 | 15.50 | 16.20 | 16.10 | 15.50 | 15.50 | 15.50 | 16.20 | 17.00 |
cycles | 16.30 | 20.80 | 17.00 | 17.00 | 15.50 | 16.20 | 16.10 | 15.50 | 15.50 | 15.50 | 16.20 | 17.00 |
Cycles executing div or sqrt instructions | 16.00 |
FE+BE cycles | 38.73-38.76 |
Stall cycles | 0.00 |
Front-end | 41.83 |
Dispatch | 20.80 |
DIV/SQRT | 16.00 |
Overall L1 | 41.83 |
all | 0% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 0% |
all | 10% |
load | 9% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 10% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x48,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4d1400 <hypre_NumActiveThreads> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 4d1410 <hypre_GetThreadNum> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4c5bc0 <hypre_CSRMatrixGetLoadBalancedPartitionBegin> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4c5c40 <hypre_CSRMatrixGetLoadBalancedPartitionEnd> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RBX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RBX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RBX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4c3dbb <hypre_CSRMatrixTranspose.extracted+0x8b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x5de70(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4fa05a,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4fc003,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4cf9e0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4fbf80,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1d7,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d2330 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x30(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x18(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RCX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4c3dcd <hypre_CSRMatrixTranspose.extracted+0x9d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RBX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4c3dfb <hypre_CSRMatrixTranspose.extracted+0xcb> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x5de2c(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4fa05a,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4fc012,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4cf9e0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4fbf80,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1d8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d2330 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x38(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4c3e0d <hypre_CSRMatrixTranspose.extracted+0xdd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RBX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4c3e3b <hypre_CSRMatrixTranspose.extracted+0x10b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x5ddec(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4fa05a,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4fc035,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4cf9e0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4fbf80,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1d9,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d2330 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x10(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R13),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%R15,%RAX,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d8930 <_intel_fast_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x40(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDX,%RAX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP (%RDX,%R12,8),%RAX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JGE 4c3e89 <hypre_CSRMatrixTranspose.extracted+0x159> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RBX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x520ab0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 410570 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%R13),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA 0x1(%R14),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x1(%RCX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R9,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %RBX,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x48(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JL 4c3fe9 <hypre_CSRMatrixTranspose.extracted+0x2b9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RBX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x38(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x520ad0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 410570 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%RBX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x520af0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4106e0 <__kmpc_masked@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
CMP $0x1,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4c4144 <hypre_CSRMatrixTranspose.extracted+0x414> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x48(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x1,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4c4134 <hypre_CSRMatrixTranspose.extracted+0x404> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RBX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP $0x4,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 4c43ad <hypre_CSRMatrixTranspose.extracted+0x67d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RAX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 4c4134 <hypre_CSRMatrixTranspose.extracted+0x404> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INC %R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 4c3f54 <hypre_CSRMatrixTranspose.extracted+0x224> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x38(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x520b10,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 410500 <__kmpc_end_masked@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%RBX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x520b30,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 410570 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV -0x48(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x60(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4c42c1 <hypre_CSRMatrixTranspose.extracted+0x591> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R13),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %RDI,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA -0x1(%RCX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %R8,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE 4c4183 <hypre_CSRMatrixTranspose.extracted+0x453> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %R8 | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
JMP 4c4188 <hypre_CSRMatrixTranspose.extracted+0x458> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %R8D | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV %RDI,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R9,%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
DEC %RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RSI,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c42c1 <hypre_CSRMatrixTranspose.extracted+0x591> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
IMUL %RDI,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RAX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV (%R15,%RDX,8),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4c41db <hypre_CSRMatrixTranspose.extracted+0x4ab> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x30(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x520b50,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 410570 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
CMPQ $0,-0x68(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 4c4371 <hypre_CSRMatrixTranspose.extracted+0x641> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R8,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x40(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x58(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4c461e <hypre_CSRMatrixTranspose.extracted+0x8ee> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x28(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDI,%R12,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4c431c <hypre_CSRMatrixTranspose.extracted+0x5ec> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x30(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R9,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x40(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4c461e <hypre_CSRMatrixTranspose.extracted+0x8ee> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R8,%R12,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R9D,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA 0x1(%R9),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST $0x1,%AL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 4c45db <hypre_CSRMatrixTranspose.extracted+0x8ab> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RDX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4c4635 <hypre_CSRMatrixTranspose.extracted+0x905> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4c461e <hypre_CSRMatrixTranspose.extracted+0x8ee> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x50(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SHR $0x2,%R8 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4c43e7 <hypre_CSRMatrixTranspose.extracted+0x6b7> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x1(%R12),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RDX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4c4635 <hypre_CSRMatrixTranspose.extracted+0x905> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x48,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | csr_matop.c:380-560 |
Module | exec |
nb instructions | 226 |
nb uops | 250 |
loop length | 942 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 14 |
micro-operation queue | 41.83 cycles |
front end | 41.83 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 16.30 | 16.20 | 17.00 | 17.00 | 15.50 | 16.20 | 16.10 | 15.50 | 15.50 | 15.50 | 16.20 | 17.00 |
cycles | 16.30 | 20.80 | 17.00 | 17.00 | 15.50 | 16.20 | 16.10 | 15.50 | 15.50 | 15.50 | 16.20 | 17.00 |
Cycles executing div or sqrt instructions | 16.00 |
FE+BE cycles | 38.73-38.76 |
Stall cycles | 0.00 |
Front-end | 41.83 |
Dispatch | 20.80 |
DIV/SQRT | 16.00 |
Overall L1 | 41.83 |
all | 0% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 0% |
all | 10% |
load | 9% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 10% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x48,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4d1400 <hypre_NumActiveThreads> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 4d1410 <hypre_GetThreadNum> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4c5bc0 <hypre_CSRMatrixGetLoadBalancedPartitionBegin> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4c5c40 <hypre_CSRMatrixGetLoadBalancedPartitionEnd> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RBX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RBX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RBX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4c3dbb <hypre_CSRMatrixTranspose.extracted+0x8b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x5de70(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4fa05a,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4fc003,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4cf9e0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4fbf80,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1d7,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d2330 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x30(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x18(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RCX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4c3dcd <hypre_CSRMatrixTranspose.extracted+0x9d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RBX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4c3dfb <hypre_CSRMatrixTranspose.extracted+0xcb> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x5de2c(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4fa05a,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4fc012,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4cf9e0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4fbf80,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1d8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d2330 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x38(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4c3e0d <hypre_CSRMatrixTranspose.extracted+0xdd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RBX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4c3e3b <hypre_CSRMatrixTranspose.extracted+0x10b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x5ddec(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4fa05a,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4fc035,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4cf9e0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4fbf80,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1d9,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d2330 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x10(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R13),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%R15,%RAX,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d8930 <_intel_fast_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x40(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDX,%RAX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP (%RDX,%R12,8),%RAX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JGE 4c3e89 <hypre_CSRMatrixTranspose.extracted+0x159> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RBX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x520ab0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 410570 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%R13),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA 0x1(%R14),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x1(%RCX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R9,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %RBX,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x48(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JL 4c3fe9 <hypre_CSRMatrixTranspose.extracted+0x2b9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RBX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x38(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x520ad0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 410570 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%RBX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x520af0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4106e0 <__kmpc_masked@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
CMP $0x1,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4c4144 <hypre_CSRMatrixTranspose.extracted+0x414> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x48(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x1,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4c4134 <hypre_CSRMatrixTranspose.extracted+0x404> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RBX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP $0x4,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 4c43ad <hypre_CSRMatrixTranspose.extracted+0x67d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RAX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 4c4134 <hypre_CSRMatrixTranspose.extracted+0x404> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INC %R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 4c3f54 <hypre_CSRMatrixTranspose.extracted+0x224> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x38(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x520b10,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 410500 <__kmpc_end_masked@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%RBX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x520b30,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 410570 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV -0x48(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x60(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4c42c1 <hypre_CSRMatrixTranspose.extracted+0x591> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R13),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %RDI,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA -0x1(%RCX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %R8,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE 4c4183 <hypre_CSRMatrixTranspose.extracted+0x453> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %R8 | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
JMP 4c4188 <hypre_CSRMatrixTranspose.extracted+0x458> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %R8D | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV %RDI,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R9,%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
DEC %RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RSI,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c42c1 <hypre_CSRMatrixTranspose.extracted+0x591> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
IMUL %RDI,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RAX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV (%R15,%RDX,8),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4c41db <hypre_CSRMatrixTranspose.extracted+0x4ab> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x30(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x520b50,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 410570 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
CMPQ $0,-0x68(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 4c4371 <hypre_CSRMatrixTranspose.extracted+0x641> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R8,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x40(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x58(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4c461e <hypre_CSRMatrixTranspose.extracted+0x8ee> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x28(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDI,%R12,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4c431c <hypre_CSRMatrixTranspose.extracted+0x5ec> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x30(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R9,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x40(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4c461e <hypre_CSRMatrixTranspose.extracted+0x8ee> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R8,%R12,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R9D,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA 0x1(%R9),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST $0x1,%AL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 4c45db <hypre_CSRMatrixTranspose.extracted+0x8ab> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RDX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4c4635 <hypre_CSRMatrixTranspose.extracted+0x905> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4c461e <hypre_CSRMatrixTranspose.extracted+0x8ee> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x50(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SHR $0x2,%R8 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4c43e7 <hypre_CSRMatrixTranspose.extracted+0x6b7> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x1(%R12),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RDX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4c4635 <hypre_CSRMatrixTranspose.extracted+0x905> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x48,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_CSRMatrixTranspose.extracted– | 0.15 | 0.06 |
▼Loop 3703 - csr_matop.c:540-548 - exec– | 0.02 | 0.01 |
○Loop 3704 - csr_matop.c:541-548 - exec | 0.09 | 0.03 |
○Loop 3705 - csr_matop.c:380-527 - exec | 0.01 | 0.01 |
○Loop 3708 - csr_matop.c:380-500 - exec | 0.01 | 0.01 |
○Loop 3709 - csr_matop.c:483-485 - exec | 0.01 | 0.01 |
▼Loop 3699 - csr_matop.c:553-560 - exec– | 0 | 0 |
○Loop 3701 - csr_matop.c:554-560 - exec | 0 | 0 |
○Loop 3700 - csr_matop.c:554-560 - exec | 0 | 0 |
○Loop 3706 - csr_matop.c:380-513 - exec | 0 | 0 |
○Loop 3707 - csr_matop.c:380-513 - exec | 0 | 0 |
○Loop 3702 - csr_matop.c:554-560 - exec | 0 | 0 |