Function: hypre_CSRMatrixTranspose.extracted | Module: exec | Source: csr_matop.c:380-560 [...] | Coverage: 0.18% |
---|
Function: hypre_CSRMatrixTranspose.extracted | Module: exec | Source: csr_matop.c:380-560 [...] | Coverage: 0.18% |
---|
/home/kcamus/qaas_runs/169-443-9681/intel/AMG/build/AMG/AMG/seq_mv/csr_matop.c: 380 - 560 |
-------------------------------------------------------------------------------- |
380: return idx%dim1*dim2 + idx/dim1; |
[...] |
463: #pragma omp parallel |
464: #endif |
465: { |
466: HYPRE_Int num_threads = hypre_NumActiveThreads(); |
467: HYPRE_Int my_thread_num = hypre_GetThreadNum(); |
468: |
469: HYPRE_Int iBegin = hypre_CSRMatrixGetLoadBalancedPartitionBegin(A); |
470: HYPRE_Int iEnd = hypre_CSRMatrixGetLoadBalancedPartitionEnd(A); |
471: hypre_assert(iBegin <= iEnd); |
472: hypre_assert(iBegin >= 0 && iBegin <= num_rowsA); |
473: hypre_assert(iEnd >= 0 && iEnd <= num_rowsA); |
474: |
475: HYPRE_Int i, j; |
476: memset(bucket + my_thread_num*num_colsA, 0, sizeof(HYPRE_Int)*num_colsA); |
[...] |
483: for (j = A_i[iBegin]; j < A_i[iEnd]; ++j) { |
484: HYPRE_Int idx = A_j[j]; |
485: bucket[my_thread_num*num_colsA + idx]++; |
[...] |
496: for (i = my_thread_num*num_colsA + 1; i < (my_thread_num + 1)*num_colsA; ++i) { |
497: HYPRE_Int transpose_i = transpose_idx(i, num_threads, num_colsA); |
498: HYPRE_Int transpose_i_minus_1 = transpose_idx(i - 1, num_threads, num_colsA); |
499: |
500: bucket[transpose_i] += bucket[transpose_i_minus_1]; |
501: } |
502: |
503: #ifdef HYPRE_USING_OPENMP |
504: #pragma omp barrier |
505: #pragma omp master |
506: #endif |
507: { |
508: for (i = 1; i < num_threads; ++i) { |
509: HYPRE_Int j0 = num_colsA*i - 1, j1 = num_colsA*(i + 1) - 1; |
510: HYPRE_Int transpose_j0 = transpose_idx(j0, num_threads, num_colsA); |
511: HYPRE_Int transpose_j1 = transpose_idx(j1, num_threads, num_colsA); |
512: |
513: bucket[transpose_j1] += bucket[transpose_j0]; |
[...] |
520: if (my_thread_num > 0) { |
521: HYPRE_Int transpose_i0 = transpose_idx(num_colsA*my_thread_num - 1, num_threads, num_colsA); |
522: HYPRE_Int offset = bucket[transpose_i0]; |
523: |
524: for (i = my_thread_num*num_colsA; i < (my_thread_num + 1)*num_colsA - 1; ++i) { |
525: HYPRE_Int transpose_i = transpose_idx(i, num_threads, num_colsA); |
526: |
527: bucket[transpose_i] += offset; |
[...] |
539: if (data) { |
540: for (i = iEnd - 1; i >= iBegin; --i) { |
541: for (j = A_i[i + 1] - 1; j >= A_i[i]; --j) { |
542: HYPRE_Int idx = A_j[j]; |
543: --bucket[my_thread_num*num_colsA + idx]; |
544: |
545: HYPRE_Int offset = bucket[my_thread_num*num_colsA + idx]; |
546: |
547: AT_data[offset] = A_data[j]; |
548: AT_j[offset] = i; |
549: } |
550: } |
551: } |
552: else { |
553: for (i = iEnd - 1; i >= iBegin; --i) { |
554: for (j = A_i[i + 1] - 1; j >= A_i[i]; --j) { |
555: HYPRE_Int idx = A_j[j]; |
556: --bucket[my_thread_num*num_colsA + idx]; |
557: |
558: HYPRE_Int offset = bucket[my_thread_num*num_colsA + idx]; |
559: |
560: AT_j[offset] = i; |
0x4d08a0 PUSH %RBP |
0x4d08a1 MOV %RSP,%RBP |
0x4d08a4 PUSH %R15 |
0x4d08a6 PUSH %R14 |
0x4d08a8 PUSH %R13 |
0x4d08aa PUSH %R12 |
0x4d08ac PUSH %RBX |
0x4d08ad SUB $0x58,%RSP |
0x4d08b1 MOV %R9,%R14 |
0x4d08b4 MOV %R8,-0x70(%RBP) |
0x4d08b8 MOV %RCX,-0x78(%RBP) |
0x4d08bc MOV %RDX,%RBX |
0x4d08bf MOV %RDI,-0x40(%RBP) |
0x4d08c3 CALL 4df9c0 <hypre_NumActiveThreads> |
0x4d08c8 MOV %RAX,%R13 |
0x4d08cb CALL 4df9d0 <hypre_GetThreadNum> |
0x4d08d0 MOV %RAX,-0x50(%RBP) |
0x4d08d4 MOV %RBX,%RDI |
0x4d08d7 CALL 4d3050 <hypre_CSRMatrixGetLoadBalancedPartitionBegin> |
0x4d08dc MOV %RAX,%R15 |
0x4d08df MOV %RBX,%RDI |
0x4d08e2 CALL 4d30d0 <hypre_CSRMatrixGetLoadBalancedPartitionEnd> |
0x4d08e7 MOV %RAX,%RCX |
0x4d08ea CMP %R15,%RAX |
0x4d08ed MOV %R15,%RAX |
0x4d08f0 MOV %R15,-0x38(%RBP) |
0x4d08f4 MOV %RCX,-0x30(%RBP) |
0x4d08f8 JGE 4d0930 |
0x4d08fa MOV 0x5c2bf(%RIP),%RDI |
0x4d0901 MOV $0x505dec,%ESI |
0x4d0906 MOV $0x507bbf,%EDX |
0x4d090b XOR %EAX,%EAX |
0x4d090d CALL 4ddb80 <hypre_fprintf> |
0x4d0912 MOV $0x507b46,%EDI |
0x4d0917 MOV $0x1d7,%ESI |
0x4d091c MOV $0x1,%EDX |
0x4d0921 XOR %ECX,%ECX |
0x4d0923 CALL 4dfac0 <hypre_error_handler> |
0x4d0928 MOV -0x30(%RBP),%RCX |
0x4d092c MOV -0x38(%RBP),%R15 |
0x4d0930 MOV 0x18(%RBP),%RBX |
0x4d0934 TEST %R15,%R15 |
0x4d0937 JS 4d093e |
0x4d0939 CMP %RBX,%R15 |
0x4d093c JLE 4d0970 |
0x4d093e MOV 0x5c27b(%RIP),%RDI |
0x4d0945 MOV $0x505dec,%ESI |
0x4d094a MOV $0x507bce,%EDX |
0x4d094f XOR %EAX,%EAX |
0x4d0951 CALL 4ddb80 <hypre_fprintf> |
0x4d0956 MOV $0x507b46,%EDI |
0x4d095b MOV $0x1d8,%ESI |
0x4d0960 MOV $0x1,%EDX |
0x4d0965 XOR %ECX,%ECX |
0x4d0967 CALL 4dfac0 <hypre_error_handler> |
0x4d096c MOV -0x30(%RBP),%RCX |
0x4d0970 MOV 0x38(%RBP),%R12 |
0x4d0974 MOV 0x20(%RBP),%RAX |
0x4d0978 TEST %RCX,%RCX |
0x4d097b JS 4d0982 |
0x4d097d CMP %RBX,%RCX |
0x4d0980 JLE 4d09b4 |
0x4d0982 MOV 0x5c237(%RIP),%RDI |
0x4d0989 MOV $0x505dec,%ESI |
0x4d098e MOV $0x507bf1,%EDX |
0x4d0993 XOR %EAX,%EAX |
0x4d0995 CALL 4ddb80 <hypre_fprintf> |
0x4d099a MOV $0x507b46,%EDI |
0x4d099f MOV $0x1d9,%ESI |
0x4d09a4 MOV $0x1,%EDX |
0x4d09a9 XOR %ECX,%ECX |
0x4d09ab CALL 4dfac0 <hypre_error_handler> |
0x4d09b0 MOV 0x20(%RBP),%RAX |
0x4d09b4 MOV 0x10(%RBP),%RBX |
0x4d09b8 MOV -0x50(%RBP),%R15 |
0x4d09bc IMUL %RAX,%R15 |
0x4d09c0 LEA (%R12,%R15,8),%RDI |
0x4d09c4 LEA (,%RAX,8),%RDX |
0x4d09cc XOR %ESI,%ESI |
0x4d09ce CALL 4e6020 <_intel_fast_memset> |
0x4d09d3 MOV -0x30(%RBP),%RSI |
0x4d09d7 MOV -0x38(%RBP),%RAX |
0x4d09db MOV (%R14,%RAX,8),%RAX |
0x4d09df CMP (%R14,%RSI,8),%RAX |
0x4d09e3 JGE 4d0a04 |
0x4d09e5 MOV %RBX,%RDX |
0x4d09e8 NOPL (%RAX,%RAX,1) |
(3855) 0x4d09f0 MOV (%RDX,%RAX,8),%RCX |
(3855) 0x4d09f4 ADD %R15,%RCX |
(3855) 0x4d09f7 INCQ (%R12,%RCX,8) |
(3855) 0x4d09fb INC %RAX |
(3855) 0x4d09fe CMP (%R14,%RSI,8),%RAX |
(3855) 0x4d0a02 JL 4d09f0 |
0x4d0a04 MOV -0x40(%RBP),%RAX |
0x4d0a08 MOV (%RAX),%ESI |
0x4d0a0a MOV $0x52ba70,%EDI |
0x4d0a0f CALL 410560 <__kmpc_barrier@plt> |
0x4d0a14 MOV -0x50(%RBP),%RAX |
0x4d0a18 LEA 0x1(%RAX),%RCX |
0x4d0a1c MOV 0x20(%RBP),%R10 |
0x4d0a20 IMUL %R10,%RCX |
0x4d0a24 LEA 0x1(%R15),%RAX |
0x4d0a28 MOV %RCX,-0x60(%RBP) |
0x4d0a2c CMP %RCX,%RAX |
0x4d0a2f JGE 4d0ae1 |
0x4d0a35 LEA -0x1(%R10),%R8 |
0x4d0a39 CMP $0x4,%R8 |
0x4d0a3d JAE 4d0c3a |
0x4d0a43 MOV %R8,%RBX |
0x4d0a46 AND $-0x4,%RBX |
0x4d0a4a CMP %R8,%RBX |
0x4d0a4d JAE 4d0ae1 |
0x4d0a53 LEA (%R15,%RBX,1),%RDI |
0x4d0a57 NOT %RBX |
0x4d0a5a ADD %R10,%RBX |
0x4d0a5d JMP 4d0a86 |
0x4d0a5f NOP |
(3853) 0x4d0a60 MOV %RDI,%RAX |
(3853) 0x4d0a63 CQTO |
(3853) 0x4d0a65 IDIV %R13 |
(3853) 0x4d0a68 IMUL %R10,%RDX |
(3853) 0x4d0a6c ADD %RAX,%RDX |
(3853) 0x4d0a6f MOV (%R12,%RDX,8),%RAX |
(3853) 0x4d0a73 IMUL %R10,%RSI |
(3853) 0x4d0a77 ADD %R8,%RSI |
(3853) 0x4d0a7a ADD %RAX,(%R12,%RSI,8) |
(3853) 0x4d0a7e MOV %RCX,%RDI |
(3853) 0x4d0a81 DEC %RBX |
(3853) 0x4d0a84 JE 4d0ae1 |
(3853) 0x4d0a86 LEA 0x1(%RDI),%RCX |
(3853) 0x4d0a8a MOV %RCX,%RAX |
(3853) 0x4d0a8d OR %R13,%RAX |
(3853) 0x4d0a90 SHR $0x20,%RAX |
(3853) 0x4d0a94 JE 4d0ac0 |
(3853) 0x4d0a96 MOV %RCX,%RAX |
(3853) 0x4d0a99 CQTO |
(3853) 0x4d0a9b IDIV %R13 |
(3853) 0x4d0a9e MOV %RDX,%RSI |
(3853) 0x4d0aa1 MOV %RAX,%R8 |
(3853) 0x4d0aa4 MOV %RDI,%RAX |
(3853) 0x4d0aa7 OR %R13,%RAX |
(3853) 0x4d0aaa SHR $0x20,%RAX |
(3853) 0x4d0aae JNE 4d0a60 |
(3853) 0x4d0ab0 JMP 4d0ad8 |
0x4d0ab2 NOPW %CS:(%RAX,%RAX,1) |
(3853) 0x4d0ac0 MOV %ECX,%EAX |
(3853) 0x4d0ac2 XOR %EDX,%EDX |
(3853) 0x4d0ac4 DIV %R13D |
(3853) 0x4d0ac7 MOV %EDX,%ESI |
(3853) 0x4d0ac9 MOV %EAX,%R8D |
(3853) 0x4d0acc MOV %RDI,%RAX |
(3853) 0x4d0acf OR %R13,%RAX |
(3853) 0x4d0ad2 SHR $0x20,%RAX |
(3853) 0x4d0ad6 JNE 4d0a60 |
(3853) 0x4d0ad8 MOV %EDI,%EAX |
(3853) 0x4d0ada XOR %EDX,%EDX |
(3853) 0x4d0adc DIV %R13D |
(3853) 0x4d0adf JMP 4d0a68 |
0x4d0ae1 MOV -0x40(%RBP),%RBX |
0x4d0ae5 MOV (%RBX),%ESI |
0x4d0ae7 MOV $0x52ba90,%EDI |
0x4d0aec CALL 410560 <__kmpc_barrier@plt> |
0x4d0af1 MOV (%RBX),%ESI |
0x4d0af3 MOV $0x52bab0,%EDI |
0x4d0af8 XOR %EDX,%EDX |
0x4d0afa CALL 4106b0 <__kmpc_masked@plt> |
0x4d0aff CMP $0x1,%EAX |
0x4d0b02 JNE 4d0bf1 |
0x4d0b08 CMP $0x1,%R13 |
0x4d0b0c MOV 0x20(%RBP),%R11 |
0x4d0b10 JLE 4d0be1 |
0x4d0b16 LEA -0x1(%R13),%RAX |
0x4d0b1a MOV %RAX,-0x58(%RBP) |
0x4d0b1e CMP $0x4,%RAX |
0x4d0b22 JAE 4d107f |
0x4d0b28 MOV -0x58(%RBP),%RAX |
0x4d0b2c MOV %RAX,%RCX |
0x4d0b2f AND $-0x4,%RCX |
0x4d0b33 CMP %RAX,%RCX |
0x4d0b36 JAE 4d0be1 |
0x4d0b3c LEA 0x1(%RCX),%RBX |
0x4d0b40 MOV %R11,%RSI |
0x4d0b43 IMUL %RBX,%RSI |
0x4d0b47 DEC %RSI |
0x4d0b4a ADD $0x2,%RCX |
0x4d0b4e IMUL %R11,%RCX |
0x4d0b52 DEC %RCX |
0x4d0b55 JMP 4d0b8c |
0x4d0b57 NOPW (%RAX,%RAX,1) |
(3851) 0x4d0b60 MOV %RCX,%RAX |
(3851) 0x4d0b63 CQTO |
(3851) 0x4d0b65 IDIV %R13 |
(3851) 0x4d0b68 IMUL %R11,%RDI |
(3851) 0x4d0b6c ADD %R8,%RDI |
(3851) 0x4d0b6f MOV (%R12,%RDI,8),%RDI |
(3851) 0x4d0b73 IMUL %R11,%RDX |
(3851) 0x4d0b77 ADD %RAX,%RDX |
(3851) 0x4d0b7a ADD %RDI,(%R12,%RDX,8) |
(3851) 0x4d0b7e ADD %R11,%RSI |
(3851) 0x4d0b81 ADD %R11,%RCX |
(3851) 0x4d0b84 INC %RBX |
(3851) 0x4d0b87 CMP %RBX,%R13 |
(3851) 0x4d0b8a JE 4d0be1 |
(3851) 0x4d0b8c MOV %RSI,%RAX |
(3851) 0x4d0b8f OR %R13,%RAX |
(3851) 0x4d0b92 SHR $0x20,%RAX |
(3851) 0x4d0b96 JE 4d0bc0 |
(3851) 0x4d0b98 MOV %RSI,%RAX |
(3851) 0x4d0b9b CQTO |
(3851) 0x4d0b9d IDIV %R13 |
(3851) 0x4d0ba0 MOV %RDX,%RDI |
(3851) 0x4d0ba3 MOV %RAX,%R8 |
(3851) 0x4d0ba6 MOV %RCX,%RAX |
(3851) 0x4d0ba9 OR %R13,%RAX |
(3851) 0x4d0bac SHR $0x20,%RAX |
(3851) 0x4d0bb0 JNE 4d0b60 |
(3851) 0x4d0bb2 JMP 4d0bd8 |
0x4d0bb4 NOPW %CS:(%RAX,%RAX,1) |
(3851) 0x4d0bc0 MOV %ESI,%EAX |
(3851) 0x4d0bc2 XOR %EDX,%EDX |
(3851) 0x4d0bc4 DIV %R13D |
(3851) 0x4d0bc7 MOV %EDX,%EDI |
(3851) 0x4d0bc9 MOV %EAX,%R8D |
(3851) 0x4d0bcc MOV %RCX,%RAX |
(3851) 0x4d0bcf OR %R13,%RAX |
(3851) 0x4d0bd2 SHR $0x20,%RAX |
(3851) 0x4d0bd6 JNE 4d0b60 |
(3851) 0x4d0bd8 MOV %ECX,%EAX |
(3851) 0x4d0bda XOR %EDX,%EDX |
(3851) 0x4d0bdc DIV %R13D |
(3851) 0x4d0bdf JMP 4d0b68 |
0x4d0be1 MOV -0x40(%RBP),%RBX |
0x4d0be5 MOV (%RBX),%ESI |
0x4d0be7 MOV $0x52bad0,%EDI |
0x4d0bec CALL 4104f0 <__kmpc_end_masked@plt> |
0x4d0bf1 MOV (%RBX),%ESI |
0x4d0bf3 MOV $0x52baf0,%EDI |
0x4d0bf8 CALL 410560 <__kmpc_barrier@plt> |
0x4d0bfd CMPQ $0,-0x50(%RBP) |
0x4d0c02 MOV 0x20(%RBP),%RBX |
0x4d0c06 JLE 4d0dd0 |
0x4d0c0c LEA -0x1(%R15),%RAX |
0x4d0c10 MOV %RAX,%RCX |
0x4d0c13 OR %R13,%RCX |
0x4d0c16 SHR $0x20,%RCX |
0x4d0c1a JE 4d0d54 |
0x4d0c20 CQTO |
0x4d0c22 IDIV %R13 |
0x4d0c25 MOV -0x60(%RBP),%RCX |
0x4d0c29 DEC %RCX |
0x4d0c2c CMP %RCX,%R15 |
0x4d0c2f JL 4d0d65 |
0x4d0c35 JMP 4d0dd0 |
0x4d0c3a MOV %R8,%RBX |
0x4d0c3d SHR $0x2,%RBX |
0x4d0c41 MOV %R15,%RCX |
0x4d0c44 JMP 4d0c6c |
0x4d0c46 NOPW %CS:(%RAX,%RAX,1) |
(3854) 0x4d0c50 MOV %RCX,%RAX |
(3854) 0x4d0c53 CQTO |
(3854) 0x4d0c55 IDIV %R13 |
(3854) 0x4d0c58 IMUL %R10,%RDX |
(3854) 0x4d0c5c ADD %RAX,%RDX |
(3854) 0x4d0c5f ADD %RDI,(%R12,%RDX,8) |
(3854) 0x4d0c63 DEC %RBX |
(3854) 0x4d0c66 JE 4d0a43 |
(3854) 0x4d0c6c LEA 0x1(%RCX),%RAX |
(3854) 0x4d0c70 MOV %RAX,%RDX |
(3854) 0x4d0c73 OR %R13,%RDX |
(3854) 0x4d0c76 SHR $0x20,%RDX |
(3854) 0x4d0c7a JE 4d0ca0 |
(3854) 0x4d0c7c CQTO |
(3854) 0x4d0c7e IDIV %R13 |
(3854) 0x4d0c81 MOV %RDX,%RSI |
(3854) 0x4d0c84 MOV %RAX,%R9 |
(3854) 0x4d0c87 MOV %RCX,%RAX |
(3854) 0x4d0c8a OR %R13,%RAX |
(3854) 0x4d0c8d SHR $0x20,%RAX |
(3854) 0x4d0c91 JE 4d0cb6 |
(3854) 0x4d0c93 MOV %RCX,%RAX |
(3854) 0x4d0c96 CQTO |
(3854) 0x4d0c98 IDIV %R13 |
(3854) 0x4d0c9b JMP 4d0cbd |
0x4d0c9d NOPL (%RAX) |
(3854) 0x4d0ca0 XOR %EDX,%EDX |
(3854) 0x4d0ca2 DIV %R13D |
(3854) 0x4d0ca5 MOV %EDX,%ESI |
(3854) 0x4d0ca7 MOV %EAX,%R9D |
(3854) 0x4d0caa MOV %RCX,%RAX |
(3854) 0x4d0cad OR %R13,%RAX |
(3854) 0x4d0cb0 SHR $0x20,%RAX |
(3854) 0x4d0cb4 JNE 4d0c93 |
(3854) 0x4d0cb6 MOV %ECX,%EAX |
(3854) 0x4d0cb8 XOR %EDX,%EDX |
(3854) 0x4d0cba DIV %R13D |
(3854) 0x4d0cbd IMUL %R10,%RDX |
(3854) 0x4d0cc1 ADD %RAX,%RDX |
(3854) 0x4d0cc4 MOV (%R12,%RDX,8),%RDI |
(3854) 0x4d0cc8 IMUL %R10,%RSI |
(3854) 0x4d0ccc ADD %R9,%RSI |
(3854) 0x4d0ccf ADD (%R12,%RSI,8),%RDI |
(3854) 0x4d0cd3 MOV %RDI,(%R12,%RSI,8) |
(3854) 0x4d0cd7 LEA 0x2(%RCX),%RAX |
(3854) 0x4d0cdb MOV %RAX,%RDX |
(3854) 0x4d0cde OR %R13,%RDX |
(3854) 0x4d0ce1 SHR $0x20,%RDX |
(3854) 0x4d0ce5 JE 4d0cf0 |
(3854) 0x4d0ce7 CQTO |
(3854) 0x4d0ce9 IDIV %R13 |
(3854) 0x4d0cec JMP 4d0cf5 |
0x4d0cee XCHG %AX,%AX |
(3854) 0x4d0cf0 XOR %EDX,%EDX |
(3854) 0x4d0cf2 DIV %R13D |
(3854) 0x4d0cf5 IMUL %R10,%RDX |
(3854) 0x4d0cf9 ADD %RAX,%RDX |
(3854) 0x4d0cfc ADD (%R12,%RDX,8),%RDI |
(3854) 0x4d0d00 MOV %RDI,(%R12,%RDX,8) |
(3854) 0x4d0d04 LEA 0x3(%RCX),%RAX |
(3854) 0x4d0d08 MOV %RAX,%RDX |
(3854) 0x4d0d0b OR %R13,%RDX |
(3854) 0x4d0d0e SHR $0x20,%RDX |
(3854) 0x4d0d12 JE 4d0d20 |
(3854) 0x4d0d14 CQTO |
(3854) 0x4d0d16 IDIV %R13 |
(3854) 0x4d0d19 JMP 4d0d25 |
0x4d0d1b NOPL (%RAX,%RAX,1) |
(3854) 0x4d0d20 XOR %EDX,%EDX |
(3854) 0x4d0d22 DIV %R13D |
(3854) 0x4d0d25 IMUL %R10,%RDX |
(3854) 0x4d0d29 ADD %RAX,%RDX |
(3854) 0x4d0d2c ADD (%R12,%RDX,8),%RDI |
(3854) 0x4d0d30 MOV %RDI,(%R12,%RDX,8) |
(3854) 0x4d0d34 ADD $0x4,%RCX |
(3854) 0x4d0d38 MOV %RCX,%RAX |
(3854) 0x4d0d3b OR %R13,%RAX |
(3854) 0x4d0d3e SHR $0x20,%RAX |
(3854) 0x4d0d42 JNE 4d0c50 |
(3854) 0x4d0d48 MOV %ECX,%EAX |
(3854) 0x4d0d4a XOR %EDX,%EDX |
(3854) 0x4d0d4c DIV %R13D |
(3854) 0x4d0d4f JMP 4d0c58 |
0x4d0d54 XOR %EDX,%EDX |
0x4d0d56 DIV %R13D |
0x4d0d59 MOV -0x60(%RBP),%RCX |
0x4d0d5d DEC %RCX |
0x4d0d60 CMP %RCX,%R15 |
0x4d0d63 JGE 4d0dd0 |
0x4d0d65 IMUL %RBX,%RDX |
0x4d0d69 ADD %RAX,%RDX |
0x4d0d6c MOV (%R12,%RDX,8),%RSI |
0x4d0d70 LEA -0x1(%RBX),%R8 |
0x4d0d74 CMP $0x8,%R8 |
0x4d0d78 JAE 4d0e6c |
0x4d0d7e MOV %R8,%RDI |
0x4d0d81 AND $-0x8,%RDI |
0x4d0d85 CMP %R8,%RDI |
0x4d0d88 JAE 4d0dd0 |
0x4d0d8a LEA (%R15,%RDI,1),%RCX |
0x4d0d8e NOT %RDI |
0x4d0d91 ADD %RBX,%RDI |
0x4d0d94 JMP 4d0dbb |
0x4d0d96 NOPW %CS:(%RAX,%RAX,1) |
(3849) 0x4d0da0 MOV %RCX,%RAX |
(3849) 0x4d0da3 CQTO |
(3849) 0x4d0da5 IDIV %R13 |
(3849) 0x4d0da8 IMUL %RBX,%RDX |
(3849) 0x4d0dac ADD %RAX,%RDX |
(3849) 0x4d0daf ADD %RSI,(%R12,%RDX,8) |
(3849) 0x4d0db3 INC %RCX |
(3849) 0x4d0db6 DEC %RDI |
(3849) 0x4d0db9 JE 4d0dd0 |
(3849) 0x4d0dbb MOV %RCX,%RAX |
(3849) 0x4d0dbe OR %R13,%RAX |
(3849) 0x4d0dc1 SHR $0x20,%RAX |
(3849) 0x4d0dc5 JNE 4d0da0 |
(3849) 0x4d0dc7 MOV %ECX,%EAX |
(3849) 0x4d0dc9 XOR %EDX,%EDX |
(3849) 0x4d0dcb DIV %R13D |
(3849) 0x4d0dce JMP 4d0da8 |
0x4d0dd0 MOV 0x30(%RBP),%R13 |
0x4d0dd4 MOV -0x40(%RBP),%RAX |
0x4d0dd8 MOV (%RAX),%ESI |
0x4d0dda MOV $0x52bb10,%EDI |
0x4d0ddf CALL 410560 <__kmpc_barrier@plt> |
0x4d0de4 CMPQ $0,-0x78(%RBP) |
0x4d0de9 JE 4d0e30 |
0x4d0deb MOV -0x38(%RBP),%R11 |
0x4d0def MOV -0x30(%RBP),%R8 |
0x4d0df3 CMP %R11,%R8 |
0x4d0df6 MOV -0x70(%RBP),%R9 |
0x4d0dfa JLE 4d12ea |
0x4d0e00 MOV 0x28(%RBP),%R10 |
0x4d0e04 MOV (%R14,%R8,8),%RDX |
0x4d0e08 MOV %R8D,%ECX |
0x4d0e0b SUB %R11D,%ECX |
0x4d0e0e LEA 0x1(%R11),%RAX |
0x4d0e12 TEST $0x1,%CL |
0x4d0e15 JNE 4d100c |
0x4d0e1b MOV %R8,%RCX |
0x4d0e1e CMP %RAX,%R8 |
0x4d0e21 MOV 0x10(%RBP),%R8 |
0x4d0e25 JNE 4d1305 |
0x4d0e2b JMP 4d12ea |
0x4d0e30 MOV -0x38(%RBP),%R9 |
0x4d0e34 MOV -0x30(%RBP),%R10 |
0x4d0e38 CMP %R9,%R10 |
0x4d0e3b JLE 4d12ea |
0x4d0e41 MOV (%R14,%R10,8),%RCX |
0x4d0e45 MOV %R10D,%EAX |
0x4d0e48 SUB %R9D,%EAX |
0x4d0e4b LEA 0x1(%R9),%R8 |
0x4d0e4f TEST $0x1,%AL |
0x4d0e51 JNE 4d11f2 |
0x4d0e57 MOV %R10,%RAX |
0x4d0e5a CMP %R8,%R10 |
0x4d0e5d MOV 0x10(%RBP),%R8 |
0x4d0e61 JNE 4d1259 |
0x4d0e67 JMP 4d12ea |
0x4d0e6c MOV %R8,%RDI |
0x4d0e6f SHR $0x3,%RDI |
0x4d0e73 LEA 0x7(%R15),%RCX |
0x4d0e77 JMP 4d0ea0 |
0x4d0e79 NOPL (%RAX) |
(3850) 0x4d0e80 MOV %RCX,%RAX |
(3850) 0x4d0e83 CQTO |
(3850) 0x4d0e85 IDIV %R13 |
(3850) 0x4d0e88 IMUL %RBX,%RDX |
(3850) 0x4d0e8c ADD %RAX,%RDX |
(3850) 0x4d0e8f ADD %RSI,(%R12,%RDX,8) |
(3850) 0x4d0e93 ADD $0x8,%RCX |
(3850) 0x4d0e97 DEC %RDI |
(3850) 0x4d0e9a JE 4d0d7e |
(3850) 0x4d0ea0 LEA -0x7(%RCX),%RAX |
(3850) 0x4d0ea4 MOV %RAX,%RDX |
(3850) 0x4d0ea7 OR %R13,%RDX |
(3850) 0x4d0eaa SHR $0x20,%RDX |
(3850) 0x4d0eae JE 4d0ec0 |
(3850) 0x4d0eb0 CQTO |
(3850) 0x4d0eb2 IDIV %R13 |
(3850) 0x4d0eb5 JMP 4d0ec5 |
0x4d0eb7 NOPW (%RAX,%RAX,1) |
(3850) 0x4d0ec0 XOR %EDX,%EDX |
(3850) 0x4d0ec2 DIV %R13D |
(3850) 0x4d0ec5 IMUL %RBX,%RDX |
(3850) 0x4d0ec9 ADD %RAX,%RDX |
(3850) 0x4d0ecc ADD %RSI,(%R12,%RDX,8) |
(3850) 0x4d0ed0 LEA -0x6(%RCX),%RAX |
(3850) 0x4d0ed4 MOV %RAX,%RDX |
(3850) 0x4d0ed7 OR %R13,%RDX |
(3850) 0x4d0eda SHR $0x20,%RDX |
(3850) 0x4d0ede JE 4d0ef0 |
(3850) 0x4d0ee0 CQTO |
(3850) 0x4d0ee2 IDIV %R13 |
(3850) 0x4d0ee5 JMP 4d0ef5 |
0x4d0ee7 NOPW (%RAX,%RAX,1) |
(3850) 0x4d0ef0 XOR %EDX,%EDX |
(3850) 0x4d0ef2 DIV %R13D |
(3850) 0x4d0ef5 IMUL %RBX,%RDX |
(3850) 0x4d0ef9 ADD %RAX,%RDX |
(3850) 0x4d0efc ADD %RSI,(%R12,%RDX,8) |
(3850) 0x4d0f00 LEA -0x5(%RCX),%RAX |
(3850) 0x4d0f04 MOV %RAX,%RDX |
(3850) 0x4d0f07 OR %R13,%RDX |
(3850) 0x4d0f0a SHR $0x20,%RDX |
(3850) 0x4d0f0e JE 4d0f20 |
(3850) 0x4d0f10 CQTO |
(3850) 0x4d0f12 IDIV %R13 |
(3850) 0x4d0f15 JMP 4d0f25 |
0x4d0f17 NOPW (%RAX,%RAX,1) |
(3850) 0x4d0f20 XOR %EDX,%EDX |
(3850) 0x4d0f22 DIV %R13D |
(3850) 0x4d0f25 IMUL %RBX,%RDX |
(3850) 0x4d0f29 ADD %RAX,%RDX |
(3850) 0x4d0f2c ADD %RSI,(%R12,%RDX,8) |
(3850) 0x4d0f30 LEA -0x4(%RCX),%RAX |
(3850) 0x4d0f34 MOV %RAX,%RDX |
(3850) 0x4d0f37 OR %R13,%RDX |
(3850) 0x4d0f3a SHR $0x20,%RDX |
(3850) 0x4d0f3e JE 4d0f50 |
(3850) 0x4d0f40 CQTO |
(3850) 0x4d0f42 IDIV %R13 |
(3850) 0x4d0f45 JMP 4d0f55 |
0x4d0f47 NOPW (%RAX,%RAX,1) |
(3850) 0x4d0f50 XOR %EDX,%EDX |
(3850) 0x4d0f52 DIV %R13D |
(3850) 0x4d0f55 IMUL %RBX,%RDX |
(3850) 0x4d0f59 ADD %RAX,%RDX |
(3850) 0x4d0f5c ADD %RSI,(%R12,%RDX,8) |
(3850) 0x4d0f60 LEA -0x3(%RCX),%RAX |
(3850) 0x4d0f64 MOV %RAX,%RDX |
(3850) 0x4d0f67 OR %R13,%RDX |
(3850) 0x4d0f6a SHR $0x20,%RDX |
(3850) 0x4d0f6e JE 4d0f80 |
(3850) 0x4d0f70 CQTO |
(3850) 0x4d0f72 IDIV %R13 |
(3850) 0x4d0f75 JMP 4d0f85 |
0x4d0f77 NOPW (%RAX,%RAX,1) |
(3850) 0x4d0f80 XOR %EDX,%EDX |
(3850) 0x4d0f82 DIV %R13D |
(3850) 0x4d0f85 IMUL %RBX,%RDX |
(3850) 0x4d0f89 ADD %RAX,%RDX |
(3850) 0x4d0f8c ADD %RSI,(%R12,%RDX,8) |
(3850) 0x4d0f90 LEA -0x2(%RCX),%RAX |
(3850) 0x4d0f94 MOV %RAX,%RDX |
(3850) 0x4d0f97 OR %R13,%RDX |
(3850) 0x4d0f9a SHR $0x20,%RDX |
(3850) 0x4d0f9e JE 4d0fb0 |
(3850) 0x4d0fa0 CQTO |
(3850) 0x4d0fa2 IDIV %R13 |
(3850) 0x4d0fa5 JMP 4d0fb5 |
0x4d0fa7 NOPW (%RAX,%RAX,1) |
(3850) 0x4d0fb0 XOR %EDX,%EDX |
(3850) 0x4d0fb2 DIV %R13D |
(3850) 0x4d0fb5 IMUL %RBX,%RDX |
(3850) 0x4d0fb9 ADD %RAX,%RDX |
(3850) 0x4d0fbc ADD %RSI,(%R12,%RDX,8) |
(3850) 0x4d0fc0 LEA -0x1(%RCX),%RAX |
(3850) 0x4d0fc4 MOV %RAX,%RDX |
(3850) 0x4d0fc7 OR %R13,%RDX |
(3850) 0x4d0fca SHR $0x20,%RDX |
(3850) 0x4d0fce JE 4d0fe0 |
(3850) 0x4d0fd0 CQTO |
(3850) 0x4d0fd2 IDIV %R13 |
(3850) 0x4d0fd5 JMP 4d0fe5 |
0x4d0fd7 NOPW (%RAX,%RAX,1) |
(3850) 0x4d0fe0 XOR %EDX,%EDX |
(3850) 0x4d0fe2 DIV %R13D |
(3850) 0x4d0fe5 IMUL %RBX,%RDX |
(3850) 0x4d0fe9 ADD %RAX,%RDX |
(3850) 0x4d0fec ADD %RSI,(%R12,%RDX,8) |
(3850) 0x4d0ff0 MOV %RCX,%RAX |
(3850) 0x4d0ff3 OR %R13,%RAX |
(3850) 0x4d0ff6 SHR $0x20,%RAX |
(3850) 0x4d0ffa JNE 4d0e80 |
(3850) 0x4d1000 MOV %ECX,%EAX |
(3850) 0x4d1002 XOR %EDX,%EDX |
(3850) 0x4d1004 DIV %R13D |
(3850) 0x4d1007 JMP 4d0e88 |
0x4d100c LEA -0x1(%R8),%RCX |
0x4d1010 MOV -0x8(%R14,%R8,8),%RDI |
0x4d1015 CMP %RDI,%RDX |
0x4d1018 JLE 4d12da |
0x4d101e MOV %RAX,-0x48(%RBP) |
0x4d1022 MOV 0x10(%RBP),%RAX |
0x4d1026 MOV %R9,%RBX |
0x4d1029 MOV -0x30(%RBP),%R8 |
0x4d102d NOPL (%RAX) |
(3848) 0x4d1030 MOV -0x8(%RAX,%RDX,8),%RDI |
(3848) 0x4d1035 ADD %R15,%RDI |
(3848) 0x4d1038 MOV (%R12,%RDI,8),%R9 |
(3848) 0x4d103c LEA -0x1(%R9),%RSI |
(3848) 0x4d1040 MOV %RSI,(%R12,%RDI,8) |
(3848) 0x4d1044 VMOVSD -0x8(%RBX,%RDX,8),%XMM0 |
(3848) 0x4d104a DEC %RDX |
(3848) 0x4d104d VMOVSD %XMM0,-0x8(%R10,%R9,8) |
(3848) 0x4d1054 MOV %RCX,-0x8(%R13,%R9,8) |
(3848) 0x4d1059 MOV -0x8(%R14,%R8,8),%RDI |
(3848) 0x4d105e CMP %RDI,%RDX |
(3848) 0x4d1061 JG 4d1030 |
0x4d1063 MOV %RDI,%RDX |
0x4d1066 MOV %RBX,%R9 |
0x4d1069 MOV -0x48(%RBP),%RAX |
0x4d106d CMP %RAX,%R8 |
0x4d1070 MOV 0x10(%RBP),%R8 |
0x4d1074 JNE 4d1305 |
0x4d107a JMP 4d12ea |
0x4d107f MOV -0x58(%RBP),%RDI |
0x4d1083 SHR $0x2,%RDI |
0x4d1087 LEA (,%R11,4),%RAX |
0x4d108f MOV %RAX,-0x80(%RBP) |
0x4d1093 LEA (%R11,%R11,4),%RCX |
0x4d1097 DEC %RCX |
0x4d109a LEA -0x1(,%R11,4),%RSI |
0x4d10a2 LEA (%R11,%R11,2),%R8 |
0x4d10a6 DEC %R8 |
0x4d10a9 LEA (%R11,%R11,1),%R9 |
0x4d10ad DEC %R9 |
0x4d10b0 LEA -0x1(%R11),%R10 |
0x4d10b4 JMP 4d10ef |
0x4d10b6 NOPW %CS:(%RAX,%RAX,1) |
(3852) 0x4d10c0 MOV %RCX,%RAX |
(3852) 0x4d10c3 CQTO |
(3852) 0x4d10c5 IDIV %R13 |
(3852) 0x4d10c8 IMUL %R11,%RDX |
(3852) 0x4d10cc ADD %RAX,%RDX |
(3852) 0x4d10cf ADD %RBX,(%R12,%RDX,8) |
(3852) 0x4d10d3 MOV -0x80(%RBP),%RAX |
(3852) 0x4d10d7 ADD %RAX,%RCX |
(3852) 0x4d10da ADD %RAX,%RSI |
(3852) 0x4d10dd ADD %RAX,%R8 |
(3852) 0x4d10e0 ADD %RAX,%R9 |
(3852) 0x4d10e3 ADD %RAX,%R10 |
(3852) 0x4d10e6 DEC %RDI |
(3852) 0x4d10e9 JE 4d0b28 |
(3852) 0x4d10ef MOV %R10,%RAX |
(3852) 0x4d10f2 OR %R13,%RAX |
(3852) 0x4d10f5 SHR $0x20,%RAX |
(3852) 0x4d10f9 JE 4d1110 |
(3852) 0x4d10fb MOV %R10,%RAX |
(3852) 0x4d10fe CQTO |
(3852) 0x4d1100 IDIV %R13 |
(3852) 0x4d1103 MOV %RDX,%RBX |
(3852) 0x4d1106 JMP 4d111a |
0x4d1108 NOPL (%RAX,%RAX,1) |
(3852) 0x4d1110 MOV %R10D,%EAX |
(3852) 0x4d1113 XOR %EDX,%EDX |
(3852) 0x4d1115 DIV %R13D |
(3852) 0x4d1118 MOV %EDX,%EBX |
(3852) 0x4d111a MOV %RAX,-0x68(%RBP) |
(3852) 0x4d111e MOV %R9,%RAX |
(3852) 0x4d1121 OR %R13,%RAX |
(3852) 0x4d1124 SHR $0x20,%RAX |
(3852) 0x4d1128 MOV %RDI,-0x48(%RBP) |
(3852) 0x4d112c JE 4d1140 |
(3852) 0x4d112e MOV %R9,%RAX |
(3852) 0x4d1131 CQTO |
(3852) 0x4d1133 IDIV %R13 |
(3852) 0x4d1136 JMP 4d1148 |
0x4d1138 NOPL (%RAX,%RAX,1) |
(3852) 0x4d1140 MOV %R9D,%EAX |
(3852) 0x4d1143 XOR %EDX,%EDX |
(3852) 0x4d1145 DIV %R13D |
(3852) 0x4d1148 MOV 0x20(%RBP),%R11 |
(3852) 0x4d114c IMUL %R11,%RBX |
(3852) 0x4d1150 ADD -0x68(%RBP),%RBX |
(3852) 0x4d1154 MOV (%R12,%RBX,8),%RBX |
(3852) 0x4d1158 IMUL %R11,%RDX |
(3852) 0x4d115c ADD %RAX,%RDX |
(3852) 0x4d115f ADD (%R12,%RDX,8),%RBX |
(3852) 0x4d1163 MOV %RBX,(%R12,%RDX,8) |
(3852) 0x4d1167 MOV %R8,%RAX |
(3852) 0x4d116a OR %R13,%RAX |
(3852) 0x4d116d SHR $0x20,%RAX |
(3852) 0x4d1171 JE 4d1180 |
(3852) 0x4d1173 MOV %R8,%RAX |
(3852) 0x4d1176 CQTO |
(3852) 0x4d1178 IDIV %R13 |
(3852) 0x4d117b JMP 4d1188 |
0x4d117d NOPL (%RAX) |
(3852) 0x4d1180 MOV %R8D,%EAX |
(3852) 0x4d1183 XOR %EDX,%EDX |
(3852) 0x4d1185 DIV %R13D |
(3852) 0x4d1188 MOV -0x48(%RBP),%RDI |
(3852) 0x4d118c IMUL %R11,%RDX |
(3852) 0x4d1190 ADD %RAX,%RDX |
(3852) 0x4d1193 ADD (%R12,%RDX,8),%RBX |
(3852) 0x4d1197 MOV %RBX,(%R12,%RDX,8) |
(3852) 0x4d119b MOV %RSI,%RAX |
(3852) 0x4d119e OR %R13,%RAX |
(3852) 0x4d11a1 SHR $0x20,%RAX |
(3852) 0x4d11a5 JE 4d11c0 |
(3852) 0x4d11a7 MOV %RSI,%RAX |
(3852) 0x4d11aa CQTO |
(3852) 0x4d11ac IDIV %R13 |
(3852) 0x4d11af JMP 4d11c7 |
0x4d11b1 NOPW %CS:(%RAX,%RAX,1) |
(3852) 0x4d11c0 MOV %ESI,%EAX |
(3852) 0x4d11c2 XOR %EDX,%EDX |
(3852) 0x4d11c4 DIV %R13D |
(3852) 0x4d11c7 IMUL %R11,%RDX |
(3852) 0x4d11cb ADD %RAX,%RDX |
(3852) 0x4d11ce ADD (%R12,%RDX,8),%RBX |
(3852) 0x4d11d2 MOV %RBX,(%R12,%RDX,8) |
(3852) 0x4d11d6 MOV %RCX,%RAX |
(3852) 0x4d11d9 OR %R13,%RAX |
(3852) 0x4d11dc SHR $0x20,%RAX |
(3852) 0x4d11e0 JNE 4d10c0 |
(3852) 0x4d11e6 MOV %ECX,%EAX |
(3852) 0x4d11e8 XOR %EDX,%EDX |
(3852) 0x4d11ea DIV %R13D |
(3852) 0x4d11ed JMP 4d10c8 |
0x4d11f2 LEA -0x1(%R10),%RAX |
0x4d11f6 MOV -0x8(%R14,%R10,8),%RSI |
0x4d11fb CMP %RSI,%RCX |
0x4d11fe JLE 4d1236 |
0x4d1200 MOV 0x10(%RBP),%RBX |
0x4d1204 NOPW %CS:(%RAX,%RAX,1) |
(3844) 0x4d1210 MOV -0x8(%RBX,%RCX,8),%RSI |
(3844) 0x4d1215 ADD %R15,%RSI |
(3844) 0x4d1218 DEC %RCX |
(3844) 0x4d121b MOV (%R12,%RSI,8),%RDI |
(3844) 0x4d121f LEA -0x1(%RDI),%RDX |
(3844) 0x4d1223 MOV %RDX,(%R12,%RSI,8) |
(3844) 0x4d1227 MOV %RAX,-0x8(%R13,%RDI,8) |
(3844) 0x4d122c MOV -0x8(%R14,%R10,8),%RSI |
(3844) 0x4d1231 CMP %RSI,%RCX |
(3844) 0x4d1234 JG 4d1210 |
0x4d1236 MOV %RSI,%RCX |
0x4d1239 CMP %R8,%R10 |
0x4d123c MOV 0x10(%RBP),%R8 |
0x4d1240 JNE 4d1259 |
0x4d1242 JMP 4d12ea |
0x4d1247 NOPW (%RAX,%RAX,1) |
(3841) 0x4d1250 CMP %R9,%RAX |
(3841) 0x4d1253 JLE 4d12ea |
(3841) 0x4d1259 MOV -0x8(%R14,%RAX,8),%RDX |
(3841) 0x4d125e CMP %RDX,%RCX |
(3841) 0x4d1261 JLE 4d1296 |
(3841) 0x4d1263 LEA -0x1(%RAX),%RSI |
(3841) 0x4d1267 NOPW (%RAX,%RAX,1) |
(3843) 0x4d1270 MOV -0x8(%R8,%RCX,8),%RDX |
(3843) 0x4d1275 ADD %R15,%RDX |
(3843) 0x4d1278 DEC %RCX |
(3843) 0x4d127b MOV (%R12,%RDX,8),%RDI |
(3843) 0x4d127f LEA -0x1(%RDI),%RBX |
(3843) 0x4d1283 MOV %RBX,(%R12,%RDX,8) |
(3843) 0x4d1287 MOV %RSI,-0x8(%R13,%RDI,8) |
(3843) 0x4d128c MOV -0x8(%R14,%RAX,8),%RDX |
(3843) 0x4d1291 CMP %RDX,%RCX |
(3843) 0x4d1294 JG 4d1270 |
(3841) 0x4d1296 MOV -0x10(%R14,%RAX,8),%RCX |
(3841) 0x4d129b ADD $-0x2,%RAX |
(3841) 0x4d129f CMP %RCX,%RDX |
(3841) 0x4d12a2 JLE 4d1250 |
(3841) 0x4d12a4 NOPW %CS:(%RAX,%RAX,1) |
(3842) 0x4d12b0 MOV -0x8(%R8,%RDX,8),%RCX |
(3842) 0x4d12b5 ADD %R15,%RCX |
(3842) 0x4d12b8 DEC %RDX |
(3842) 0x4d12bb MOV (%R12,%RCX,8),%RSI |
(3842) 0x4d12bf LEA -0x1(%RSI),%RDI |
(3842) 0x4d12c3 MOV %RDI,(%R12,%RCX,8) |
(3842) 0x4d12c7 MOV %RAX,-0x8(%R13,%RSI,8) |
(3842) 0x4d12cc MOV (%R14,%RAX,8),%RCX |
(3842) 0x4d12d0 CMP %RCX,%RDX |
(3842) 0x4d12d3 JG 4d12b0 |
(3841) 0x4d12d5 JMP 4d1250 |
0x4d12da MOV %RDI,%RDX |
0x4d12dd MOV -0x30(%RBP),%R8 |
0x4d12e1 CMP %RAX,%R8 |
0x4d12e4 MOV 0x10(%RBP),%R8 |
0x4d12e8 JNE 4d1305 |
0x4d12ea ADD $0x58,%RSP |
0x4d12ee POP %RBX |
0x4d12ef POP %R12 |
0x4d12f1 POP %R13 |
0x4d12f3 POP %R14 |
0x4d12f5 POP %R15 |
0x4d12f7 POP %RBP |
0x4d12f8 RET |
0x4d12f9 NOPL (%RAX) |
(3845) 0x4d1300 CMP %R11,%RCX |
(3845) 0x4d1303 JLE 4d12ea |
(3845) 0x4d1305 MOV -0x8(%R14,%RCX,8),%RSI |
(3845) 0x4d130a CMP %RSI,%RDX |
(3845) 0x4d130d JLE 4d1354 |
(3845) 0x4d130f LEA -0x1(%RCX),%RDI |
(3845) 0x4d1313 NOPW %CS:(%RAX,%RAX,1) |
(3847) 0x4d1320 MOV -0x8(%R8,%RDX,8),%RSI |
(3847) 0x4d1325 ADD %R15,%RSI |
(3847) 0x4d1328 MOV (%R12,%RSI,8),%RBX |
(3847) 0x4d132c LEA -0x1(%RBX),%RAX |
(3847) 0x4d1330 MOV %RAX,(%R12,%RSI,8) |
(3847) 0x4d1334 VMOVSD -0x8(%R9,%RDX,8),%XMM0 |
(3847) 0x4d133b DEC %RDX |
(3847) 0x4d133e VMOVSD %XMM0,-0x8(%R10,%RBX,8) |
(3847) 0x4d1345 MOV %RDI,-0x8(%R13,%RBX,8) |
(3847) 0x4d134a MOV -0x8(%R14,%RCX,8),%RSI |
(3847) 0x4d134f CMP %RSI,%RDX |
(3847) 0x4d1352 JG 4d1320 |
(3845) 0x4d1354 MOV -0x10(%R14,%RCX,8),%RDX |
(3845) 0x4d1359 ADD $-0x2,%RCX |
(3845) 0x4d135d CMP %RDX,%RSI |
(3845) 0x4d1360 JLE 4d1300 |
(3845) 0x4d1362 NOPW %CS:(%RAX,%RAX,1) |
(3846) 0x4d1370 MOV -0x8(%R8,%RSI,8),%RDX |
(3846) 0x4d1375 ADD %R15,%RDX |
(3846) 0x4d1378 MOV (%R12,%RDX,8),%RDI |
(3846) 0x4d137c LEA -0x1(%RDI),%RBX |
(3846) 0x4d1380 MOV %RBX,(%R12,%RDX,8) |
(3846) 0x4d1384 VMOVSD -0x8(%R9,%RSI,8),%XMM0 |
(3846) 0x4d138b DEC %RSI |
(3846) 0x4d138e VMOVSD %XMM0,-0x8(%R10,%RDI,8) |
(3846) 0x4d1395 MOV %RCX,-0x8(%R13,%RDI,8) |
(3846) 0x4d139a MOV (%R14,%RCX,8),%RDX |
(3846) 0x4d139e CMP %RDX,%RSI |
(3846) 0x4d13a1 JG 4d1370 |
(3845) 0x4d13a3 JMP 4d1300 |
0x4d13a8 NOPL (%RAX,%RAX,1) |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►100.00+ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_fork_call | libiomp5.so | |
○ | __kmpc_fork_call | libiomp5.so | |
○ | hypre_CSRMatrixTranspose | csr_matop.c:463 | exec |
○ | hypre_ParTMatmul | par_csr_matop.c:3282 | exec |
○ | hypre_BoomerAMGSetup | par_amg_setup.c:1227 | exec |
○ | hypre_PCGSetup | pcg.c:234 | exec |
○ | main | amg.c:398 | exec |
○ | __libc_init_first | libc.so.6 |
Path / |
Source file and lines | csr_matop.c:380-560 |
Module | exec |
nb instructions | 307 |
nb uops | 389 |
loop length | 1282 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 16 |
micro-operation queue | 97.50 cycles |
front end | 97.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | |
---|---|---|---|---|---|---|---|---|
uops | 57.75 | 57.75 | 32.67 | 32.67 | 33.00 | 57.75 | 57.75 | 32.67 |
cycles | 57.75 | 57.75 | 32.67 | 32.67 | 33.00 | 57.75 | 57.75 | 32.67 |
Cycles executing div or sqrt instructions | 30.00-96.00 |
FE+BE cycles | 78.52-137.59 |
Stall cycles | 0.00-59.04 |
Front-end | 97.50 |
Dispatch | 57.75 |
DIV/SQRT | 30.00-96.00 |
Overall L1 | 97.50 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 0% |
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSH %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
SUB $0x58,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %R9,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R8,-0x70(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RCX,-0x78(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RDX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RDI,-0x40(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CALL 4df9c0 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV %RAX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 4df9d0 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV %RAX,-0x50(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 4d3050 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 4d30d0 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CMP %R15,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RCX,-0x30(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
JGE 4d0930 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV 0x5c2bf(%RIP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV $0x505dec,%ESI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x507bbf,%EDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 4ddb80 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV $0x507b46,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x1d7,%ESI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x1,%EDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 4dfac0 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV -0x30(%RBP),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x38(%RBP),%R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x18(%RBP),%RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
TEST %R15,%R15 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JS 4d093e | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMP %RBX,%R15 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JLE 4d0970 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV 0x5c27b(%RIP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV $0x505dec,%ESI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x507bce,%EDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 4ddb80 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV $0x507b46,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x1d8,%ESI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x1,%EDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 4dfac0 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV -0x30(%RBP),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x38(%RBP),%R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
TEST %RCX,%RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JS 4d0982 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMP %RBX,%RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JLE 4d09b4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV 0x5c237(%RIP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV $0x505dec,%ESI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x507bf1,%EDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 4ddb80 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV $0x507b46,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x1d9,%ESI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x1,%EDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 4dfac0 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x10(%RBP),%RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x50(%RBP),%R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
IMUL %RAX,%R15 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%R12,%R15,8),%RDI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (,%RAX,8),%RDX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 4e6020 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV -0x30(%RBP),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV (%R14,%RAX,8),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
CMP (%R14,%RSI,8),%RAX | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
JGE 4d0a04 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV %RBX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV $0x52ba70,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CALL 410560 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA 0x1(%RAX),%RCX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RBP),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
IMUL %R10,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA 0x1(%R15),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x60(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CMP %RCX,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JGE 4d0ae1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
LEA -0x1(%R10),%R8 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP $0x4,%R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JAE 4d0c3a | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV %R8,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
AND $-0x4,%RBX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMP %R8,%RBX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JAE 4d0ae1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
LEA (%R15,%RBX,1),%RDI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
NOT %RBX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD %R10,%RBX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JMP 4d0a86 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV -0x40(%RBP),%RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV (%RBX),%ESI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV $0x52ba90,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CALL 410560 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV (%RBX),%ESI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV $0x52bab0,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 4106b0 <__kmpc_masked@plt> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
CMP $0x1,%EAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JNE 4d0bf1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMP $0x1,%R13 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV 0x20(%RBP),%R11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
JLE 4d0be1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
LEA -0x1(%R13),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,-0x58(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CMP $0x4,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JAE 4d107f | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV -0x58(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
AND $-0x4,%RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMP %RAX,%RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JAE 4d0be1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
LEA 0x1(%RCX),%RBX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
IMUL %RBX,%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
DEC %RSI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD $0x2,%RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
IMUL %R11,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
DEC %RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JMP 4d0b8c | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV -0x40(%RBP),%RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV (%RBX),%ESI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV $0x52bad0,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CALL 4104f0 <__kmpc_end_masked@plt> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV (%RBX),%ESI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV $0x52baf0,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CALL 410560 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
CMPQ $0,-0x50(%RBP) | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
MOV 0x20(%RBP),%RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
JLE 4d0dd0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
LEA -0x1(%R15),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
OR %R13,%RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SHR $0x20,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
JE 4d0d54 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
IDIV %R13 | 57 | 14.25 | 14.25 | 0 | 0 | 0 | 14.25 | 14.25 | 0 | 42-95 | 24-90 |
MOV -0x60(%RBP),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
DEC %RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMP %RCX,%R15 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JL 4d0d65 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
JMP 4d0dd0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
MOV %R8,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
SHR $0x2,%RBX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
MOV %R15,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
JMP 4d0c6c | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
DIV %R13D | 10 | 2.50 | 2.50 | 0 | 0 | 0 | 2.50 | 2.50 | 0 | 26 | 6 |
MOV -0x60(%RBP),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
DEC %RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMP %RCX,%R15 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JGE 4d0dd0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
IMUL %RBX,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RAX,%RDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV (%R12,%RDX,8),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA -0x1(%RBX),%R8 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP $0x8,%R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JAE 4d0e6c | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV %R8,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
AND $-0x8,%RDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMP %R8,%RDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JAE 4d0dd0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
LEA (%R15,%RDI,1),%RCX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
NOT %RDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD %RBX,%RDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JMP 4d0dbb | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV 0x30(%RBP),%R13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV $0x52bb10,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CALL 410560 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
CMPQ $0,-0x78(%RBP) | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
JE 4d0e30 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV -0x38(%RBP),%R11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x30(%RBP),%R8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
CMP %R11,%R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV -0x70(%RBP),%R9 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
JLE 4d12ea | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV 0x28(%RBP),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV (%R14,%R8,8),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %R8D,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
SUB %R11D,%ECX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
LEA 0x1(%R11),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST $0x1,%CL | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JNE 4d100c | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV %R8,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CMP %RAX,%R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV 0x10(%RBP),%R8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
JNE 4d1305 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
JMP 4d12ea | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
MOV -0x38(%RBP),%R9 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x30(%RBP),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
CMP %R9,%R10 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JLE 4d12ea | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV (%R14,%R10,8),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %R10D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
SUB %R9D,%EAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
LEA 0x1(%R9),%R8 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST $0x1,%AL | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JNE 4d11f2 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV %R10,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CMP %R8,%R10 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV 0x10(%RBP),%R8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
JNE 4d1259 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
JMP 4d12ea | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
MOV %R8,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
SHR $0x3,%RDI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
LEA 0x7(%R15),%RCX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4d0ea0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
LEA -0x1(%R8),%RCX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x8(%R14,%R8,8),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
CMP %RDI,%RDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JLE 4d12da | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x10(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV -0x30(%RBP),%R8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RDI,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RBX,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
CMP %RAX,%R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV 0x10(%RBP),%R8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
JNE 4d1305 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
JMP 4d12ea | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
MOV -0x58(%RBP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
SHR $0x2,%RDI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
LEA (,%R11,4),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,-0x80(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA (%R11,%R11,4),%RCX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
DEC %RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
LEA -0x1(,%R11,4),%RSI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R11,%R11,2),%R8 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
DEC %R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
LEA (%R11,%R11,1),%R9 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
DEC %R9 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
LEA -0x1(%R11),%R10 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4d10ef | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
LEA -0x1(%R10),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x8(%R14,%R10,8),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
CMP %RSI,%RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JLE 4d1236 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV 0x10(%RBP),%RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RSI,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CMP %R8,%R10 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV 0x10(%RBP),%R8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
JNE 4d1259 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
JMP 4d12ea | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RDI,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV -0x30(%RBP),%R8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
CMP %RAX,%R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV 0x10(%RBP),%R8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
JNE 4d1305 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
ADD $0x58,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %RBP | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
RET | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 | 0 | 1 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
Source file and lines | csr_matop.c:380-560 |
Module | exec |
nb instructions | 307 |
nb uops | 389 |
loop length | 1282 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 16 |
micro-operation queue | 97.50 cycles |
front end | 97.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | |
---|---|---|---|---|---|---|---|---|
uops | 57.75 | 57.75 | 32.67 | 32.67 | 33.00 | 57.75 | 57.75 | 32.67 |
cycles | 57.75 | 57.75 | 32.67 | 32.67 | 33.00 | 57.75 | 57.75 | 32.67 |
Cycles executing div or sqrt instructions | 30.00-96.00 |
FE+BE cycles | 78.52-137.59 |
Stall cycles | 0.00-59.04 |
Front-end | 97.50 |
Dispatch | 57.75 |
DIV/SQRT | 30.00-96.00 |
Overall L1 | 97.50 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 0% |
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
PUSH %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
PUSH %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
SUB $0x58,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %R9,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R8,-0x70(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RCX,-0x78(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RDX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RDI,-0x40(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CALL 4df9c0 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV %RAX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 4df9d0 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV %RAX,-0x50(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 4d3050 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 4d30d0 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CMP %R15,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV %RCX,-0x30(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
JGE 4d0930 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV 0x5c2bf(%RIP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV $0x505dec,%ESI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x507bbf,%EDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 4ddb80 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV $0x507b46,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x1d7,%ESI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x1,%EDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 4dfac0 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV -0x30(%RBP),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x38(%RBP),%R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x18(%RBP),%RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
TEST %R15,%R15 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JS 4d093e | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMP %RBX,%R15 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JLE 4d0970 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV 0x5c27b(%RIP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV $0x505dec,%ESI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x507bce,%EDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 4ddb80 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV $0x507b46,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x1d8,%ESI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x1,%EDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 4dfac0 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV -0x30(%RBP),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x38(%RBP),%R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
TEST %RCX,%RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JS 4d0982 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMP %RBX,%RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JLE 4d09b4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV 0x5c237(%RIP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV $0x505dec,%ESI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x507bf1,%EDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 4ddb80 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV $0x507b46,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x1d9,%ESI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV $0x1,%EDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 4dfac0 | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV 0x10(%RBP),%RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x50(%RBP),%R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
IMUL %RAX,%R15 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%R12,%R15,8),%RDI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (,%RAX,8),%RDX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 4e6020 <_intel_fast_memset> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV -0x30(%RBP),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV (%R14,%RAX,8),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
CMP (%R14,%RSI,8),%RAX | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
JGE 4d0a04 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV %RBX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV $0x52ba70,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CALL 410560 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA 0x1(%RAX),%RCX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RBP),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
IMUL %R10,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA 0x1(%R15),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x60(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CMP %RCX,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JGE 4d0ae1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
LEA -0x1(%R10),%R8 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP $0x4,%R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JAE 4d0c3a | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV %R8,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
AND $-0x4,%RBX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMP %R8,%RBX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JAE 4d0ae1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
LEA (%R15,%RBX,1),%RDI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
NOT %RBX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD %R10,%RBX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JMP 4d0a86 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV -0x40(%RBP),%RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV (%RBX),%ESI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV $0x52ba90,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CALL 410560 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV (%RBX),%ESI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV $0x52bab0,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CALL 4106b0 <__kmpc_masked@plt> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
CMP $0x1,%EAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JNE 4d0bf1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CMP $0x1,%R13 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV 0x20(%RBP),%R11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
JLE 4d0be1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
LEA -0x1(%R13),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,-0x58(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
CMP $0x4,%RAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JAE 4d107f | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV -0x58(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
AND $-0x4,%RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMP %RAX,%RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JAE 4d0be1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
LEA 0x1(%RCX),%RBX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
IMUL %RBX,%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
DEC %RSI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD $0x2,%RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
IMUL %R11,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
DEC %RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JMP 4d0b8c | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV -0x40(%RBP),%RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV (%RBX),%ESI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV $0x52bad0,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CALL 4104f0 <__kmpc_end_masked@plt> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
MOV (%RBX),%ESI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV $0x52baf0,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CALL 410560 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
CMPQ $0,-0x50(%RBP) | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
MOV 0x20(%RBP),%RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
JLE 4d0dd0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
LEA -0x1(%R15),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
OR %R13,%RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
SHR $0x20,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
JE 4d0d54 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
IDIV %R13 | 57 | 14.25 | 14.25 | 0 | 0 | 0 | 14.25 | 14.25 | 0 | 42-95 | 24-90 |
MOV -0x60(%RBP),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
DEC %RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMP %RCX,%R15 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JL 4d0d65 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
JMP 4d0dd0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
MOV %R8,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
SHR $0x2,%RBX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
MOV %R15,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
JMP 4d0c6c | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
DIV %R13D | 10 | 2.50 | 2.50 | 0 | 0 | 0 | 2.50 | 2.50 | 0 | 26 | 6 |
MOV -0x60(%RBP),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
DEC %RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMP %RCX,%R15 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JGE 4d0dd0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
IMUL %RBX,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RAX,%RDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV (%R12,%RDX,8),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
LEA -0x1(%RBX),%R8 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP $0x8,%R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JAE 4d0e6c | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV %R8,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
AND $-0x8,%RDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CMP %R8,%RDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JAE 4d0dd0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
LEA (%R15,%RDI,1),%RCX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
NOT %RDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
ADD %RBX,%RDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JMP 4d0dbb | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV 0x30(%RBP),%R13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV $0x52bb10,%EDI | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
CALL 410560 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 1 | 0.33 | 0 | 1 |
CMPQ $0,-0x78(%RBP) | 1 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0.25 | 0.25 | 0 | 1 | 0.50 |
JE 4d0e30 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV -0x38(%RBP),%R11 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x30(%RBP),%R8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
CMP %R11,%R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV -0x70(%RBP),%R9 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
JLE 4d12ea | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV 0x28(%RBP),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV (%R14,%R8,8),%RDX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %R8D,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
SUB %R11D,%ECX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
LEA 0x1(%R11),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST $0x1,%CL | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JNE 4d100c | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV %R8,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CMP %RAX,%R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV 0x10(%RBP),%R8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
JNE 4d1305 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
JMP 4d12ea | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
MOV -0x38(%RBP),%R9 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV -0x30(%RBP),%R10 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
CMP %R9,%R10 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JLE 4d12ea | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV (%R14,%R10,8),%RCX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %R10D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
SUB %R9D,%EAX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
LEA 0x1(%R9),%R8 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST $0x1,%AL | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JNE 4d11f2 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV %R10,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CMP %R8,%R10 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV 0x10(%RBP),%R8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
JNE 4d1259 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
JMP 4d12ea | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
MOV %R8,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
SHR $0x3,%RDI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
LEA 0x7(%R15),%RCX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4d0ea0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
LEA -0x1(%R8),%RCX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x8(%R14,%R8,8),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
CMP %RDI,%RDX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JLE 4d12da | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x10(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV -0x30(%RBP),%R8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RDI,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RBX,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
CMP %RAX,%R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV 0x10(%RBP),%R8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
JNE 4d1305 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
JMP 4d12ea | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
MOV -0x58(%RBP),%RDI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
SHR $0x2,%RDI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 1 | 0.50 |
LEA (,%R11,4),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,-0x80(%RBP) | 1 | 0 | 0 | 0.33 | 0.33 | 1 | 0 | 0 | 0.33 | 3 | 1 |
LEA (%R11,%R11,4),%RCX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
DEC %RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
LEA -0x1(,%R11,4),%RSI | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R11,%R11,2),%R8 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
DEC %R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
LEA (%R11,%R11,1),%R9 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
DEC %R9 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
LEA -0x1(%R11),%R10 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4d10ef | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
LEA -0x1(%R10),%RAX | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x8(%R14,%R10,8),%RSI | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
CMP %RSI,%RCX | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
JLE 4d1236 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
MOV 0x10(%RBP),%RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RSI,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
CMP %R8,%R10 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV 0x10(%RBP),%R8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
JNE 4d1259 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
JMP 4d12ea | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 1-2 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %RDI,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV -0x30(%RBP),%R8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
CMP %RAX,%R8 | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
MOV 0x10(%RBP),%R8 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 4-5 | 0.50 |
JNE 4d1305 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50-1 |
ADD $0x58,%RSP | 1 | 0.25 | 0.25 | 0 | 0 | 0 | 0.25 | 0.25 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R12 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R13 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R14 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %R15 | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
POP %RBP | 1 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 2 | 0.50 |
RET | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 | 0 | 1 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_CSRMatrixTranspose.extracted– | 0.18 | 0.06 |
○Loop 3855 - csr_matop.c:483-485 - exec | 0.03 | 0.01 |
○Loop 3844 - csr_matop.c:554-560 - exec | 0 | 0 |
▼Loop 3845 - csr_matop.c:540-548 - exec– | 0 | 0 |
○Loop 3846 - csr_matop.c:541-548 - exec | 0.08 | 0.03 |
○Loop 3847 - csr_matop.c:541-548 - exec | 0.07 | 0.02 |
○Loop 3854 - csr_matop.c:380-500 - exec | 0 | 0 |
○Loop 3850 - csr_matop.c:380-527 - exec | 0 | 0 |
○Loop 3848 - csr_matop.c:541-548 - exec | 0 | 0 |
○Loop 3852 - csr_matop.c:380-513 - exec | 0 | 0 |
○Loop 3853 - csr_matop.c:380-500 - exec | 0 | 0 |
▼Loop 3841 - csr_matop.c:553-560 - exec– | 0 | 0 |
○Loop 3843 - csr_matop.c:554-560 - exec | 0 | 0 |
○Loop 3842 - csr_matop.c:554-560 - exec | 0 | 0 |
○Loop 3851 - csr_matop.c:380-513 - exec | 0 | 0 |
○Loop 3849 - csr_matop.c:380-527 - exec | 0 | 0 |