Function: hypre_ParMatmul_RowSizes.extracted | Module: exec | Source: par_csr_matop.c:102-276 [...] | Coverage: 1.15% |
---|
Function: hypre_ParMatmul_RowSizes.extracted | Module: exec | Source: par_csr_matop.c:102-276 [...] | Coverage: 1.15% |
---|
/scratch_na/users/xoserete/qaas_runs/171-415-3872/intel/AMG/build/AMG/AMG/parcsr_mv/par_csr_matop.c: 102 - 276 |
-------------------------------------------------------------------------------- |
102: #pragma omp parallel private(ii, i1, jj_row_begin_diag, jj_row_begin_offd, jj_count_diag, jj_count_offd, jj2, i2, jj3, i3) |
[...] |
108: ii = hypre_GetThreadNum(); |
109: if (ii < rest) |
110: { |
111: ns = ii*size+ii; |
112: ne = (ii+1)*size+ii+1; |
113: } |
114: else |
115: { |
116: ns = ii*size+rest; |
117: ne = (ii+1)*size+rest; |
118: } |
119: jj_count_diag = start_indexing; |
120: jj_count_offd = start_indexing; |
121: |
122: if (num_cols_diag_B || num_cols_offd_C) |
123: B_marker = hypre_CTAlloc(HYPRE_Int, num_cols_diag_B+num_cols_offd_C); |
124: for (i1 = 0; i1 < num_cols_diag_B+num_cols_offd_C; i1++) |
125: B_marker[i1] = -1; |
126: |
127: for (i1 = ns; i1 < ne; i1++) |
[...] |
135: if ( allsquare ) { |
136: B_marker[i1] = jj_count_diag; |
137: jj_count_diag++; |
[...] |
144: if (num_cols_offd_A) |
145: { |
146: for (jj2 = A_offd_i[i1]; jj2 < A_offd_i[i1+1]; jj2++) |
147: { |
148: i2 = A_offd_j[jj2]; |
[...] |
154: for (jj3 = B_ext_offd_i[i2]; jj3 < B_ext_offd_i[i2+1]; jj3++) |
[...] |
164: if (B_marker[i3] < jj_row_begin_offd) |
165: { |
166: B_marker[i3] = jj_count_offd; |
167: jj_count_offd++; |
168: } |
169: } |
170: for (jj3 = B_ext_diag_i[i2]; jj3 < B_ext_diag_i[i2+1]; jj3++) |
171: { |
172: i3 = B_ext_diag_j[jj3]; |
173: |
174: if (B_marker[i3] < jj_row_begin_diag) |
175: { |
176: B_marker[i3] = jj_count_diag; |
177: jj_count_diag++; |
[...] |
187: for (jj2 = A_diag_i[i1]; jj2 < A_diag_i[i1+1]; jj2++) |
188: { |
189: i2 = A_diag_j[jj2]; |
[...] |
195: for (jj3 = B_diag_i[i2]; jj3 < B_diag_i[i2+1]; jj3++) |
196: { |
197: i3 = B_diag_j[jj3]; |
[...] |
205: if (B_marker[i3] < jj_row_begin_diag) |
206: { |
207: B_marker[i3] = jj_count_diag; |
208: jj_count_diag++; |
[...] |
216: if (num_cols_offd_B) |
217: { |
218: for (jj3 = B_offd_i[i2]; jj3 < B_offd_i[i2+1]; jj3++) |
219: { |
220: i3 = num_cols_diag_B+map_B_to_C[B_offd_j[jj3]]; |
[...] |
228: if (B_marker[i3] < jj_row_begin_offd) |
229: { |
230: B_marker[i3] = jj_count_offd; |
231: jj_count_offd++; |
[...] |
241: (*C_diag_i)[i1] = jj_row_begin_diag; |
242: (*C_offd_i)[i1] = jj_row_begin_offd; |
243: |
244: } |
245: jj_count_diag_array[ii] = jj_count_diag; |
246: jj_count_offd_array[ii] = jj_count_offd; |
247: |
248: hypre_TFree(B_marker); |
249: #ifdef HYPRE_USING_OPENMP |
250: #pragma omp barrier |
251: #endif |
252: |
253: if (ii) |
254: { |
255: jj_count_diag = jj_count_diag_array[0]; |
256: jj_count_offd = jj_count_offd_array[0]; |
257: for (i1 = 1; i1 < ii; i1++) |
258: { |
259: jj_count_diag += jj_count_diag_array[i1]; |
260: jj_count_offd += jj_count_offd_array[i1]; |
261: } |
262: |
263: for (i1 = ns; i1 < ne; i1++) |
264: { |
265: (*C_diag_i)[i1] += jj_count_diag; |
266: (*C_offd_i)[i1] += jj_count_offd; |
267: } |
268: } |
269: else |
270: { |
271: (*C_diag_i)[num_rows_diag_A] = 0; |
272: (*C_offd_i)[num_rows_diag_A] = 0; |
273: for (i1 = 0; i1 < num_threads; i1++) |
274: { |
275: (*C_diag_i)[num_rows_diag_A] += jj_count_diag_array[i1]; |
276: (*C_offd_i)[num_rows_diag_A] += jj_count_offd_array[i1]; |
0x4bbd50 PUSH %RBP |
0x4bbd51 MOV %RSP,%RBP |
0x4bbd54 PUSH %R15 |
0x4bbd56 PUSH %R14 |
0x4bbd58 PUSH %R13 |
0x4bbd5a PUSH %R12 |
0x4bbd5c PUSH %RBX |
0x4bbd5d SUB $0xb8,%RSP |
0x4bbd64 MOV %R9,-0x80(%RBP) |
0x4bbd68 MOV %R8,-0xb0(%RBP) |
0x4bbd6f MOV %RCX,-0x48(%RBP) |
0x4bbd73 MOV %RDX,-0x40(%RBP) |
0x4bbd77 MOV %RDI,-0x88(%RBP) |
0x4bbd7e MOV 0xc0(%RBP),%R14 |
0x4bbd85 MOV 0xb8(%RBP),%R13 |
0x4bbd8c MOV 0x90(%RBP),%R12 |
0x4bbd93 MOV 0x80(%RBP),%R15 |
0x4bbd9a CALL 4e86c0 <hypre_GetThreadNum> |
0x4bbd9f MOV %RAX,%RCX |
0x4bbda2 LEA 0x1(%RAX),%RBX |
0x4bbda6 MOV %RBX,%RAX |
0x4bbda9 IMUL %R14,%RAX |
0x4bbdad CMP %R13,%RCX |
0x4bbdb0 JGE 4bbef4 |
0x4bbdb6 LEA 0x1(%R14),%RDX |
0x4bbdba IMUL %RCX,%RDX |
0x4bbdbe MOV %RDX,-0x58(%RBP) |
0x4bbdc2 ADD %RAX,%RBX |
0x4bbdc5 MOV %R15,%RAX |
0x4bbdc8 OR %R12,%RAX |
0x4bbdcb MOV %RCX,-0x50(%RBP) |
0x4bbdcf JE 4bbf18 |
0x4bbdd5 LEA (%R12,%R15,1),%RDI |
0x4bbdd9 MOV $0x8,%ESI |
0x4bbdde CALL 4e6980 <hypre_CAlloc> |
0x4bbde3 MOV %RAX,%R14 |
0x4bbde6 ADD %R15,%R12 |
0x4bbde9 JLE 4bbdff |
0x4bbdeb SAL $0x3,%R12 |
0x4bbdef MOV %R14,%RDI |
0x4bbdf2 MOV $0xff,%ESI |
0x4bbdf7 MOV %R12,%RDX |
0x4bbdfa CALL 4efbb0 <_intel_fast_memset> |
0x4bbdff MOV -0x50(%RBP),%RCX |
0x4bbe03 CMP %RBX,-0x58(%RBP) |
0x4bbe07 MOV %RBX,-0x68(%RBP) |
0x4bbe0b JL 4bbf29 |
0x4bbe11 XOR %EBX,%EBX |
0x4bbe13 XOR %EDX,%EDX |
0x4bbe15 MOV 0xa8(%RBP),%R15 |
0x4bbe1c MOV -0x50(%RBP),%R12 |
0x4bbe20 MOV %RBX,(%R15,%R12,8) |
0x4bbe24 MOV 0xb0(%RBP),%RBX |
0x4bbe2b MOV %RDX,(%RBX,%R12,8) |
0x4bbe2f MOV %R14,%RDI |
0x4bbe32 CALL 4e6a60 <hypre_Free> |
0x4bbe37 MOV -0x88(%RBP),%RAX |
0x4bbe3e MOV (%RAX),%ESI |
0x4bbe40 MOV $0x736190,%EDI |
0x4bbe45 CALL 410030 <__kmpc_barrier@plt> |
0x4bbe4a TEST %R12,%R12 |
0x4bbe4d JE 4bc88a |
0x4bbe53 MOV %R12,%RDI |
0x4bbe56 MOV (%R15),%RAX |
0x4bbe59 MOV (%RBX),%RCX |
0x4bbe5c CMP $0x1,%R12 |
0x4bbe60 JLE 4bc9c3 |
0x4bbe66 LEA -0x1(%RDI),%RSI |
0x4bbe6a MOV %RSI,%RDX |
0x4bbe6d AND $-0x4,%RDX |
0x4bbe71 MOV -0x68(%RBP),%R11 |
0x4bbe75 MOV 0xc0(%RBP),%R14 |
0x4bbe7c JE 4bca07 |
0x4bbe82 VMOVQ %RAX,%XMM1 |
0x4bbe87 VMOVQ %RCX,%XMM0 |
0x4bbe8c LEA -0x1(%RDX),%RAX |
0x4bbe90 XOR %ECX,%ECX |
0x4bbe92 NOPW %CS:(%RAX,%RAX,1) |
(3562) 0x4bbea0 VPADDQ 0x8(%R15,%RCX,8),%YMM1,%YMM1 |
(3562) 0x4bbea7 VPADDQ 0x8(%RBX,%RCX,8),%YMM0,%YMM0 |
(3562) 0x4bbead ADD $0x4,%RCX |
(3562) 0x4bbeb1 CMP %RAX,%RCX |
(3562) 0x4bbeb4 JLE 4bbea0 |
0x4bbeb6 VEXTRACTI128 $0x1,%YMM1,%XMM2 |
0x4bbebc VPADDQ %XMM2,%XMM1,%XMM1 |
0x4bbec0 VPSHUFD $-0x12,%XMM1,%XMM2 |
0x4bbec5 VPADDQ %XMM2,%XMM1,%XMM1 |
0x4bbec9 VMOVQ %XMM1,%RAX |
0x4bbece VEXTRACTI128 $0x1,%YMM0,%XMM1 |
0x4bbed4 VPADDQ %XMM1,%XMM0,%XMM0 |
0x4bbed8 VPSHUFD $-0x12,%XMM0,%XMM1 |
0x4bbedd VPADDQ %XMM1,%XMM0,%XMM0 |
0x4bbee1 VMOVQ %XMM0,%RCX |
0x4bbee6 CMP %RDX,%RSI |
0x4bbee9 JNE 4bca09 |
0x4bbeef JMP 4bca20 |
0x4bbef4 MOV %RCX,%RDX |
0x4bbef7 IMUL %R14,%RDX |
0x4bbefb ADD %R13,%RDX |
0x4bbefe MOV %RDX,-0x58(%RBP) |
0x4bbf02 ADD %R13,%RAX |
0x4bbf05 MOV %RAX,%RBX |
0x4bbf08 MOV %R15,%RAX |
0x4bbf0b OR %R12,%RAX |
0x4bbf0e MOV %RCX,-0x50(%RBP) |
0x4bbf12 JNE 4bbdd5 |
0x4bbf18 XOR %R14D,%R14D |
0x4bbf1b CMP %RBX,-0x58(%RBP) |
0x4bbf1f MOV %RBX,-0x68(%RBP) |
0x4bbf23 JGE 4bbe11 |
0x4bbf29 MOV 0x60(%RBP),%RSI |
0x4bbf2d MOV 0x58(%RBP),%RDX |
0x4bbf31 MOV 0x48(%RBP),%RDI |
0x4bbf35 MOV 0x38(%RBP),%R8 |
0x4bbf39 MOV 0x28(%RBP),%R9 |
0x4bbf3d MOV 0xb8(%RBP),%RAX |
0x4bbf44 CMP %RAX,%RCX |
0x4bbf47 CMOVL %RCX,%RAX |
0x4bbf4b IMUL 0xc0(%RBP),%RCX |
0x4bbf53 ADD %RAX,%RCX |
0x4bbf56 MOV %RCX,-0xa8(%RBP) |
0x4bbf5d NOT %RCX |
0x4bbf60 ADD %RBX,%RCX |
0x4bbf63 MOV %RCX,-0xa0(%RBP) |
0x4bbf6a MOV -0x40(%RBP),%RAX |
0x4bbf6e MOV (%RAX),%RAX |
0x4bbf71 MOV %RAX,-0x98(%RBP) |
0x4bbf78 MOV -0x48(%RBP),%RAX |
0x4bbf7c MOV (%RAX),%RAX |
0x4bbf7f MOV %RAX,-0x90(%RBP) |
0x4bbf86 LEA 0x38(%RDX),%RAX |
0x4bbf8a MOV %RAX,-0xd0(%RBP) |
0x4bbf91 LEA 0x38(%RDI),%RAX |
0x4bbf95 MOV %RAX,-0xc8(%RBP) |
0x4bbf9c LEA 0x38(%R9),%RAX |
0x4bbfa0 MOV %RAX,-0x78(%RBP) |
0x4bbfa4 LEA 0x18(%R8),%RAX |
0x4bbfa8 MOV %RAX,-0xc0(%RBP) |
0x4bbfaf XOR %EDI,%EDI |
0x4bbfb1 XOR %R10D,%R10D |
0x4bbfb4 XOR %R8D,%R8D |
0x4bbfb7 MOV %R8,%RBX |
0x4bbfba JMP 4bbff8 |
0x4bbfbc NOPL (%RAX) |
(3563) 0x4bbfc0 MOV -0x98(%RBP),%RAX |
(3563) 0x4bbfc7 MOV -0x70(%RBP),%RCX |
(3563) 0x4bbfcb MOV %R8,(%RAX,%RCX,8) |
(3563) 0x4bbfcf MOV -0x90(%RBP),%RAX |
(3563) 0x4bbfd6 MOV %R10,(%RAX,%RCX,8) |
(3563) 0x4bbfda MOV -0xb8(%RBP),%RCX |
(3563) 0x4bbfe1 LEA 0x1(%RCX),%RDI |
(3563) 0x4bbfe5 MOV %RDX,%R10 |
(3563) 0x4bbfe8 MOV %RBX,%R8 |
(3563) 0x4bbfeb CMP -0xa0(%RBP),%RCX |
(3563) 0x4bbff2 JE 4bbe15 |
(3563) 0x4bbff8 MOV 0x78(%RBP),%RAX |
(3563) 0x4bbffc TEST %RAX,%RAX |
(3563) 0x4bbfff MOV -0xa8(%RBP),%RCX |
(3563) 0x4bc006 JE 4bc014 |
(3563) 0x4bc008 LEA (%RCX,%RDI,1),%RAX |
(3563) 0x4bc00c MOV %R8,(%R14,%RAX,8) |
(3563) 0x4bc010 LEA 0x1(%R8),%RBX |
(3563) 0x4bc014 ADD %RDI,%RCX |
(3563) 0x4bc017 CMPQ $0,0x70(%RBP) |
(3563) 0x4bc01c MOV %RCX,-0x70(%RBP) |
(3563) 0x4bc020 MOV %RDI,-0xb8(%RBP) |
(3563) 0x4bc027 JE 4bc400 |
(3563) 0x4bc02d MOV 0x10(%RBP),%RAX |
(3563) 0x4bc031 MOV (%RAX,%RCX,8),%R13 |
(3563) 0x4bc035 MOV 0x8(%RAX,%RCX,8),%RDX |
(3563) 0x4bc03a LEA 0x1(%RCX),%R9 |
(3563) 0x4bc03e CMP %RDX,%R13 |
(3563) 0x4bc041 JGE 4bc404 |
(3563) 0x4bc047 MOV %R13,%RAX |
(3563) 0x4bc04a NOT %RAX |
(3563) 0x4bc04d ADD %RAX,%RDX |
(3563) 0x4bc050 MOV %RDX,-0xd8(%RBP) |
(3563) 0x4bc057 XOR %EAX,%EAX |
(3563) 0x4bc059 MOV %R10,%RDX |
(3563) 0x4bc05c MOV %R9,-0x38(%RBP) |
(3563) 0x4bc060 MOV %R13,-0x30(%RBP) |
(3563) 0x4bc064 JMP 4bc08d |
0x4bc066 NOPW %CS:(%RAX,%RAX,1) |
(3572) 0x4bc070 MOV -0x30(%RBP),%R13 |
(3572) 0x4bc074 MOV -0x60(%RBP),%RCX |
(3572) 0x4bc078 LEA 0x1(%RCX),%RAX |
(3572) 0x4bc07c CMP -0xd8(%RBP),%RCX |
(3572) 0x4bc083 MOV -0x38(%RBP),%R9 |
(3572) 0x4bc087 JE 4bc410 |
(3572) 0x4bc08d MOV %RAX,-0x60(%RBP) |
(3572) 0x4bc091 ADD %R13,%RAX |
(3572) 0x4bc094 MOV 0x18(%RBP),%RCX |
(3572) 0x4bc098 MOV (%RCX,%RAX,8),%RAX |
(3572) 0x4bc09c MOV 0x50(%RBP),%RCX |
(3572) 0x4bc0a0 MOV (%RCX,%RAX,8),%R13 |
(3572) 0x4bc0a4 MOV 0x8(%RCX,%RAX,8),%RDI |
(3572) 0x4bc0a9 MOV %RDI,%R11 |
(3572) 0x4bc0ac SUB %R13,%R11 |
(3572) 0x4bc0af JLE 4bc0c7 |
(3572) 0x4bc0b1 CMP $0x8,%R11 |
(3572) 0x4bc0b5 JAE 4bc130 |
(3572) 0x4bc0b7 MOV %R11,%RCX |
(3572) 0x4bc0ba AND $-0x8,%RCX |
(3572) 0x4bc0be CMP %R11,%RCX |
(3572) 0x4bc0c1 JNE 4bc2b0 |
(3572) 0x4bc0c7 MOV 0x40(%RBP),%RCX |
(3572) 0x4bc0cb MOV (%RCX,%RAX,8),%RDI |
(3572) 0x4bc0cf MOV 0x8(%RCX,%RAX,8),%RAX |
(3572) 0x4bc0d4 MOV %RAX,%R9 |
(3572) 0x4bc0d7 SUB %RDI,%R9 |
(3572) 0x4bc0da JLE 4bc070 |
(3572) 0x4bc0dc CMP $0x8,%R9 |
(3572) 0x4bc0e0 MOV -0x30(%RBP),%R13 |
(3572) 0x4bc0e4 JAE 4bc2f0 |
(3572) 0x4bc0ea MOV %R9,%RCX |
(3572) 0x4bc0ed AND $-0x8,%RCX |
(3572) 0x4bc0f1 CMP %R9,%RCX |
(3572) 0x4bc0f4 JE 4bc074 |
(3572) 0x4bc0fa ADD %RCX,%RDI |
(3572) 0x4bc0fd MOV 0x48(%RBP),%R9 |
(3572) 0x4bc101 JMP 4bc11c |
0x4bc103 NOPW %CS:(%RAX,%RAX,1) |
(3573) 0x4bc110 INC %RDI |
(3573) 0x4bc113 CMP %RDI,%RAX |
(3573) 0x4bc116 JE 4bc074 |
(3573) 0x4bc11c MOV (%R9,%RDI,8),%RCX |
(3573) 0x4bc120 CMP %R8,(%R14,%RCX,8) |
(3573) 0x4bc124 JGE 4bc110 |
(3573) 0x4bc126 MOV %RBX,(%R14,%RCX,8) |
(3573) 0x4bc12a INC %RBX |
(3573) 0x4bc12d JMP 4bc110 |
0x4bc12f NOP |
(3572) 0x4bc130 MOV %R11,%R9 |
(3572) 0x4bc133 SHR $0x3,%R9 |
(3572) 0x4bc137 MOV -0xd0(%RBP),%RCX |
(3572) 0x4bc13e LEA (%RCX,%R13,8),%RCX |
(3572) 0x4bc142 JMP 4bc15d |
0x4bc144 NOPW %CS:(%RAX,%RAX,1) |
(3576) 0x4bc150 ADD $0x40,%RCX |
(3576) 0x4bc154 DEC %R9 |
(3576) 0x4bc157 JE 4bc0b7 |
(3576) 0x4bc15d MOV -0x38(%RCX),%R12 |
(3576) 0x4bc161 ADD %R15,%R12 |
(3576) 0x4bc164 CMP %R10,(%R14,%R12,8) |
(3576) 0x4bc168 JGE 4bc210 |
(3576) 0x4bc16e MOV %RDX,(%R14,%R12,8) |
(3576) 0x4bc172 INC %RDX |
(3576) 0x4bc175 MOV -0x30(%RCX),%R12 |
(3576) 0x4bc179 ADD %R15,%R12 |
(3576) 0x4bc17c CMP %R10,(%R14,%R12,8) |
(3576) 0x4bc180 JL 4bc221 |
(3576) 0x4bc186 MOV -0x28(%RCX),%R12 |
(3576) 0x4bc18a ADD %R15,%R12 |
(3576) 0x4bc18d CMP %R10,(%R14,%R12,8) |
(3576) 0x4bc191 JGE 4bc239 |
(3576) 0x4bc197 MOV %RDX,(%R14,%R12,8) |
(3576) 0x4bc19b INC %RDX |
(3576) 0x4bc19e MOV -0x20(%RCX),%R12 |
(3576) 0x4bc1a2 ADD %R15,%R12 |
(3576) 0x4bc1a5 CMP %R10,(%R14,%R12,8) |
(3576) 0x4bc1a9 JL 4bc24a |
(3576) 0x4bc1af MOV -0x18(%RCX),%R12 |
(3576) 0x4bc1b3 ADD %R15,%R12 |
(3576) 0x4bc1b6 CMP %R10,(%R14,%R12,8) |
(3576) 0x4bc1ba JGE 4bc262 |
(3576) 0x4bc1c0 MOV %RDX,(%R14,%R12,8) |
(3576) 0x4bc1c4 INC %RDX |
(3576) 0x4bc1c7 MOV -0x10(%RCX),%R12 |
(3576) 0x4bc1cb ADD %R15,%R12 |
(3576) 0x4bc1ce CMP %R10,(%R14,%R12,8) |
(3576) 0x4bc1d2 JL 4bc273 |
(3576) 0x4bc1d8 MOV -0x8(%RCX),%R12 |
(3576) 0x4bc1dc ADD %R15,%R12 |
(3576) 0x4bc1df CMP %R10,(%R14,%R12,8) |
(3576) 0x4bc1e3 JGE 4bc28b |
(3576) 0x4bc1e9 MOV %RDX,(%R14,%R12,8) |
(3576) 0x4bc1ed INC %RDX |
(3576) 0x4bc1f0 MOV (%RCX),%R12 |
(3576) 0x4bc1f3 ADD %R15,%R12 |
(3576) 0x4bc1f6 CMP %R10,(%R14,%R12,8) |
(3576) 0x4bc1fa JGE 4bc150 |
(3576) 0x4bc200 JMP 4bc29b |
0x4bc205 NOPW %CS:(%RAX,%RAX,1) |
(3576) 0x4bc210 MOV -0x30(%RCX),%R12 |
(3576) 0x4bc214 ADD %R15,%R12 |
(3576) 0x4bc217 CMP %R10,(%R14,%R12,8) |
(3576) 0x4bc21b JGE 4bc186 |
(3576) 0x4bc221 MOV %RDX,(%R14,%R12,8) |
(3576) 0x4bc225 INC %RDX |
(3576) 0x4bc228 MOV -0x28(%RCX),%R12 |
(3576) 0x4bc22c ADD %R15,%R12 |
(3576) 0x4bc22f CMP %R10,(%R14,%R12,8) |
(3576) 0x4bc233 JL 4bc197 |
(3576) 0x4bc239 MOV -0x20(%RCX),%R12 |
(3576) 0x4bc23d ADD %R15,%R12 |
(3576) 0x4bc240 CMP %R10,(%R14,%R12,8) |
(3576) 0x4bc244 JGE 4bc1af |
(3576) 0x4bc24a MOV %RDX,(%R14,%R12,8) |
(3576) 0x4bc24e INC %RDX |
(3576) 0x4bc251 MOV -0x18(%RCX),%R12 |
(3576) 0x4bc255 ADD %R15,%R12 |
(3576) 0x4bc258 CMP %R10,(%R14,%R12,8) |
(3576) 0x4bc25c JL 4bc1c0 |
(3576) 0x4bc262 MOV -0x10(%RCX),%R12 |
(3576) 0x4bc266 ADD %R15,%R12 |
(3576) 0x4bc269 CMP %R10,(%R14,%R12,8) |
(3576) 0x4bc26d JGE 4bc1d8 |
(3576) 0x4bc273 MOV %RDX,(%R14,%R12,8) |
(3576) 0x4bc277 INC %RDX |
(3576) 0x4bc27a MOV -0x8(%RCX),%R12 |
(3576) 0x4bc27e ADD %R15,%R12 |
(3576) 0x4bc281 CMP %R10,(%R14,%R12,8) |
(3576) 0x4bc285 JL 4bc1e9 |
(3576) 0x4bc28b MOV (%RCX),%R12 |
(3576) 0x4bc28e ADD %R15,%R12 |
(3576) 0x4bc291 CMP %R10,(%R14,%R12,8) |
(3576) 0x4bc295 JGE 4bc150 |
(3576) 0x4bc29b MOV %RDX,(%R14,%R12,8) |
(3576) 0x4bc29f INC %RDX |
(3576) 0x4bc2a2 JMP 4bc150 |
0x4bc2a7 NOPW (%RAX,%RAX,1) |
(3572) 0x4bc2b0 ADD %RCX,%R13 |
(3572) 0x4bc2b3 MOV 0x58(%RBP),%R9 |
(3572) 0x4bc2b7 JMP 4bc2cc |
0x4bc2b9 NOPL (%RAX) |
(3575) 0x4bc2c0 INC %R13 |
(3575) 0x4bc2c3 CMP %R13,%RDI |
(3575) 0x4bc2c6 JE 4bc0c7 |
(3575) 0x4bc2cc MOV (%R9,%R13,8),%RCX |
(3575) 0x4bc2d0 ADD %R15,%RCX |
(3575) 0x4bc2d3 CMP %R10,(%R14,%RCX,8) |
(3575) 0x4bc2d7 JGE 4bc2c0 |
(3575) 0x4bc2d9 MOV %RDX,(%R14,%RCX,8) |
(3575) 0x4bc2dd INC %RDX |
(3575) 0x4bc2e0 JMP 4bc2c0 |
0x4bc2e2 NOPW %CS:(%RAX,%RAX,1) |
(3572) 0x4bc2f0 MOV %R9,%RCX |
(3572) 0x4bc2f3 SHR $0x3,%RCX |
(3572) 0x4bc2f7 MOV -0xc8(%RBP),%R11 |
(3572) 0x4bc2fe LEA (%R11,%RDI,8),%R11 |
(3572) 0x4bc302 JMP 4bc31d |
0x4bc304 NOPW %CS:(%RAX,%RAX,1) |
(3574) 0x4bc310 ADD $0x40,%R11 |
(3574) 0x4bc314 DEC %RCX |
(3574) 0x4bc317 JE 4bc0ea |
(3574) 0x4bc31d MOV -0x38(%R11),%R12 |
(3574) 0x4bc321 CMP %R8,(%R14,%R12,8) |
(3574) 0x4bc325 JGE 4bc390 |
(3574) 0x4bc327 MOV %RBX,(%R14,%R12,8) |
(3574) 0x4bc32b INC %RBX |
(3574) 0x4bc32e MOV -0x30(%R11),%R12 |
(3574) 0x4bc332 CMP %R8,(%R14,%R12,8) |
(3574) 0x4bc336 JL 4bc39a |
(3574) 0x4bc338 MOV -0x28(%R11),%R12 |
(3574) 0x4bc33c CMP %R8,(%R14,%R12,8) |
(3574) 0x4bc340 JGE 4bc3ab |
(3574) 0x4bc342 MOV %RBX,(%R14,%R12,8) |
(3574) 0x4bc346 INC %RBX |
(3574) 0x4bc349 MOV -0x20(%R11),%R12 |
(3574) 0x4bc34d CMP %R8,(%R14,%R12,8) |
(3574) 0x4bc351 JL 4bc3b5 |
(3574) 0x4bc353 MOV -0x18(%R11),%R12 |
(3574) 0x4bc357 CMP %R8,(%R14,%R12,8) |
(3574) 0x4bc35b JGE 4bc3c6 |
(3574) 0x4bc35d MOV %RBX,(%R14,%R12,8) |
(3574) 0x4bc361 INC %RBX |
(3574) 0x4bc364 MOV -0x10(%R11),%R12 |
(3574) 0x4bc368 CMP %R8,(%R14,%R12,8) |
(3574) 0x4bc36c JL 4bc3d0 |
(3574) 0x4bc36e MOV -0x8(%R11),%R12 |
(3574) 0x4bc372 CMP %R8,(%R14,%R12,8) |
(3574) 0x4bc376 JGE 4bc3e1 |
(3574) 0x4bc378 MOV %RBX,(%R14,%R12,8) |
(3574) 0x4bc37c INC %RBX |
(3574) 0x4bc37f MOV (%R11),%R12 |
(3574) 0x4bc382 CMP %R8,(%R14,%R12,8) |
(3574) 0x4bc386 JGE 4bc310 |
(3574) 0x4bc388 JMP 4bc3ee |
0x4bc38a NOPW (%RAX,%RAX,1) |
(3574) 0x4bc390 MOV -0x30(%R11),%R12 |
(3574) 0x4bc394 CMP %R8,(%R14,%R12,8) |
(3574) 0x4bc398 JGE 4bc338 |
(3574) 0x4bc39a MOV %RBX,(%R14,%R12,8) |
(3574) 0x4bc39e INC %RBX |
(3574) 0x4bc3a1 MOV -0x28(%R11),%R12 |
(3574) 0x4bc3a5 CMP %R8,(%R14,%R12,8) |
(3574) 0x4bc3a9 JL 4bc342 |
(3574) 0x4bc3ab MOV -0x20(%R11),%R12 |
(3574) 0x4bc3af CMP %R8,(%R14,%R12,8) |
(3574) 0x4bc3b3 JGE 4bc353 |
(3574) 0x4bc3b5 MOV %RBX,(%R14,%R12,8) |
(3574) 0x4bc3b9 INC %RBX |
(3574) 0x4bc3bc MOV -0x18(%R11),%R12 |
(3574) 0x4bc3c0 CMP %R8,(%R14,%R12,8) |
(3574) 0x4bc3c4 JL 4bc35d |
(3574) 0x4bc3c6 MOV -0x10(%R11),%R12 |
(3574) 0x4bc3ca CMP %R8,(%R14,%R12,8) |
(3574) 0x4bc3ce JGE 4bc36e |
(3574) 0x4bc3d0 MOV %RBX,(%R14,%R12,8) |
(3574) 0x4bc3d4 INC %RBX |
(3574) 0x4bc3d7 MOV -0x8(%R11),%R12 |
(3574) 0x4bc3db CMP %R8,(%R14,%R12,8) |
(3574) 0x4bc3df JL 4bc378 |
(3574) 0x4bc3e1 MOV (%R11),%R12 |
(3574) 0x4bc3e4 CMP %R8,(%R14,%R12,8) |
(3574) 0x4bc3e8 JGE 4bc310 |
(3574) 0x4bc3ee MOV %RBX,(%R14,%R12,8) |
(3574) 0x4bc3f2 INC %RBX |
(3574) 0x4bc3f5 JMP 4bc310 |
0x4bc3fa NOPW (%RAX,%RAX,1) |
(3563) 0x4bc400 LEA 0x1(%RCX),%R9 |
(3563) 0x4bc404 MOV %R10,%RDX |
(3563) 0x4bc407 JMP 4bc414 |
0x4bc409 NOPL (%RAX) |
(3563) 0x4bc410 MOV -0x70(%RBP),%RCX |
(3563) 0x4bc414 MOV -0xb0(%RBP),%RAX |
(3563) 0x4bc41b MOV (%RAX,%RCX,8),%R11 |
(3563) 0x4bc41f MOV (%RAX,%R9,8),%RCX |
(3563) 0x4bc423 CMP %RCX,%R11 |
(3563) 0x4bc426 JGE 4bbfc0 |
(3563) 0x4bc42c MOV %R11,%RAX |
(3563) 0x4bc42f NOT %RAX |
(3563) 0x4bc432 ADD %RAX,%RCX |
(3563) 0x4bc435 MOV %RCX,-0x38(%RBP) |
(3563) 0x4bc439 CMPQ $0,0x88(%RBP) |
(3563) 0x4bc441 MOV %R11,-0x30(%RBP) |
(3563) 0x4bc445 JE 4bc6ee |
(3563) 0x4bc44b XOR %EAX,%EAX |
(3563) 0x4bc44d JMP 4bc469 |
0x4bc44f NOP |
(3567) 0x4bc450 MOV -0x30(%RBP),%R11 |
(3567) 0x4bc454 MOV -0x60(%RBP),%RDI |
(3567) 0x4bc458 LEA 0x1(%RDI),%RAX |
(3567) 0x4bc45c MOV -0x38(%RBP),%RCX |
(3567) 0x4bc460 CMP %RCX,%RDI |
(3567) 0x4bc463 JE 4bbfc0 |
(3567) 0x4bc469 MOV %RAX,-0x60(%RBP) |
(3567) 0x4bc46d ADD %R11,%RAX |
(3567) 0x4bc470 MOV -0x80(%RBP),%RCX |
(3567) 0x4bc474 MOV (%RCX,%RAX,8),%RDI |
(3567) 0x4bc478 MOV 0x20(%RBP),%RCX |
(3567) 0x4bc47c MOV (%RCX,%RDI,8),%RAX |
(3567) 0x4bc480 MOV 0x8(%RCX,%RDI,8),%R13 |
(3567) 0x4bc485 MOV %R13,%R9 |
(3567) 0x4bc488 SUB %RAX,%R9 |
(3567) 0x4bc48b JLE 4bc4ab |
(3567) 0x4bc48d CMP $0x8,%R9 |
(3567) 0x4bc491 JAE 4bc520 |
(3567) 0x4bc497 MOV %R9,%RCX |
(3567) 0x4bc49a AND $-0x8,%RCX |
(3567) 0x4bc49e CMP %R9,%RCX |
(3567) 0x4bc4a1 JNE 4bc630 |
(3567) 0x4bc4a7 MOV -0x30(%RBP),%R11 |
(3567) 0x4bc4ab MOV 0x30(%RBP),%RCX |
(3567) 0x4bc4af MOV (%RCX,%RDI,8),%RAX |
(3567) 0x4bc4b3 MOV 0x8(%RCX,%RDI,8),%RCX |
(3567) 0x4bc4b8 MOV %RCX,%RDI |
(3567) 0x4bc4bb SUB %RAX,%RDI |
(3567) 0x4bc4be JLE 4bc454 |
(3567) 0x4bc4c0 CMP $0x4,%RDI |
(3567) 0x4bc4c4 JAE 4bc660 |
(3567) 0x4bc4ca MOV %RDI,%R9 |
(3567) 0x4bc4cd AND $-0x4,%R9 |
(3567) 0x4bc4d1 CMP %RDI,%R9 |
(3567) 0x4bc4d4 JE 4bc450 |
(3567) 0x4bc4da ADD %R9,%RAX |
(3567) 0x4bc4dd MOV 0x38(%RBP),%R9 |
(3567) 0x4bc4e1 MOV -0x30(%RBP),%R11 |
(3567) 0x4bc4e5 JMP 4bc4fc |
0x4bc4e7 NOPW (%RAX,%RAX,1) |
(3568) 0x4bc4f0 INC %RAX |
(3568) 0x4bc4f3 CMP %RAX,%RCX |
(3568) 0x4bc4f6 JE 4bc454 |
(3568) 0x4bc4fc MOV (%R9,%RAX,8),%RDI |
(3568) 0x4bc500 MOV (%RSI,%RDI,8),%RDI |
(3568) 0x4bc504 ADD %R15,%RDI |
(3568) 0x4bc507 CMP %R10,(%R14,%RDI,8) |
(3568) 0x4bc50b JGE 4bc4f0 |
(3568) 0x4bc50d MOV %RDX,(%R14,%RDI,8) |
(3568) 0x4bc511 INC %RDX |
(3568) 0x4bc514 JMP 4bc4f0 |
0x4bc516 NOPW %CS:(%RAX,%RAX,1) |
(3567) 0x4bc520 MOV %R9,%RCX |
(3567) 0x4bc523 SHR $0x3,%RCX |
(3567) 0x4bc527 MOV -0x78(%RBP),%R11 |
(3567) 0x4bc52b LEA (%R11,%RAX,8),%R11 |
(3567) 0x4bc52f JMP 4bc54d |
0x4bc531 NOPW %CS:(%RAX,%RAX,1) |
(3571) 0x4bc540 ADD $0x40,%R11 |
(3571) 0x4bc544 DEC %RCX |
(3571) 0x4bc547 JE 4bc497 |
(3571) 0x4bc54d MOV -0x38(%R11),%R12 |
(3571) 0x4bc551 CMP %R8,(%R14,%R12,8) |
(3571) 0x4bc555 JGE 4bc5c0 |
(3571) 0x4bc557 MOV %RBX,(%R14,%R12,8) |
(3571) 0x4bc55b INC %RBX |
(3571) 0x4bc55e MOV -0x30(%R11),%R12 |
(3571) 0x4bc562 CMP %R8,(%R14,%R12,8) |
(3571) 0x4bc566 JL 4bc5ca |
(3571) 0x4bc568 MOV -0x28(%R11),%R12 |
(3571) 0x4bc56c CMP %R8,(%R14,%R12,8) |
(3571) 0x4bc570 JGE 4bc5db |
(3571) 0x4bc572 MOV %RBX,(%R14,%R12,8) |
(3571) 0x4bc576 INC %RBX |
(3571) 0x4bc579 MOV -0x20(%R11),%R12 |
(3571) 0x4bc57d CMP %R8,(%R14,%R12,8) |
(3571) 0x4bc581 JL 4bc5e5 |
(3571) 0x4bc583 MOV -0x18(%R11),%R12 |
(3571) 0x4bc587 CMP %R8,(%R14,%R12,8) |
(3571) 0x4bc58b JGE 4bc5f6 |
(3571) 0x4bc58d MOV %RBX,(%R14,%R12,8) |
(3571) 0x4bc591 INC %RBX |
(3571) 0x4bc594 MOV -0x10(%R11),%R12 |
(3571) 0x4bc598 CMP %R8,(%R14,%R12,8) |
(3571) 0x4bc59c JL 4bc600 |
(3571) 0x4bc59e MOV -0x8(%R11),%R12 |
(3571) 0x4bc5a2 CMP %R8,(%R14,%R12,8) |
(3571) 0x4bc5a6 JGE 4bc611 |
(3571) 0x4bc5a8 MOV %RBX,(%R14,%R12,8) |
(3571) 0x4bc5ac INC %RBX |
(3571) 0x4bc5af MOV (%R11),%R12 |
(3571) 0x4bc5b2 CMP %R8,(%R14,%R12,8) |
(3571) 0x4bc5b6 JGE 4bc540 |
(3571) 0x4bc5b8 JMP 4bc61e |
0x4bc5ba NOPW (%RAX,%RAX,1) |
(3571) 0x4bc5c0 MOV -0x30(%R11),%R12 |
(3571) 0x4bc5c4 CMP %R8,(%R14,%R12,8) |
(3571) 0x4bc5c8 JGE 4bc568 |
(3571) 0x4bc5ca MOV %RBX,(%R14,%R12,8) |
(3571) 0x4bc5ce INC %RBX |
(3571) 0x4bc5d1 MOV -0x28(%R11),%R12 |
(3571) 0x4bc5d5 CMP %R8,(%R14,%R12,8) |
(3571) 0x4bc5d9 JL 4bc572 |
(3571) 0x4bc5db MOV -0x20(%R11),%R12 |
(3571) 0x4bc5df CMP %R8,(%R14,%R12,8) |
(3571) 0x4bc5e3 JGE 4bc583 |
(3571) 0x4bc5e5 MOV %RBX,(%R14,%R12,8) |
(3571) 0x4bc5e9 INC %RBX |
(3571) 0x4bc5ec MOV -0x18(%R11),%R12 |
(3571) 0x4bc5f0 CMP %R8,(%R14,%R12,8) |
(3571) 0x4bc5f4 JL 4bc58d |
(3571) 0x4bc5f6 MOV -0x10(%R11),%R12 |
(3571) 0x4bc5fa CMP %R8,(%R14,%R12,8) |
(3571) 0x4bc5fe JGE 4bc59e |
(3571) 0x4bc600 MOV %RBX,(%R14,%R12,8) |
(3571) 0x4bc604 INC %RBX |
(3571) 0x4bc607 MOV -0x8(%R11),%R12 |
(3571) 0x4bc60b CMP %R8,(%R14,%R12,8) |
(3571) 0x4bc60f JL 4bc5a8 |
(3571) 0x4bc611 MOV (%R11),%R12 |
(3571) 0x4bc614 CMP %R8,(%R14,%R12,8) |
(3571) 0x4bc618 JGE 4bc540 |
(3571) 0x4bc61e MOV %RBX,(%R14,%R12,8) |
(3571) 0x4bc622 INC %RBX |
(3571) 0x4bc625 JMP 4bc540 |
0x4bc62a NOPW (%RAX,%RAX,1) |
(3567) 0x4bc630 ADD %RCX,%RAX |
(3567) 0x4bc633 MOV 0x28(%RBP),%R9 |
(3567) 0x4bc637 MOV -0x30(%RBP),%R11 |
(3567) 0x4bc63b JMP 4bc64c |
0x4bc63d NOPL (%RAX) |
(3570) 0x4bc640 INC %RAX |
(3570) 0x4bc643 CMP %RAX,%R13 |
(3570) 0x4bc646 JE 4bc4ab |
(3570) 0x4bc64c MOV (%R9,%RAX,8),%RCX |
(3570) 0x4bc650 CMP %R8,(%R14,%RCX,8) |
(3570) 0x4bc654 JGE 4bc640 |
(3570) 0x4bc656 MOV %RBX,(%R14,%RCX,8) |
(3570) 0x4bc65a INC %RBX |
(3570) 0x4bc65d JMP 4bc640 |
0x4bc65f NOP |
(3567) 0x4bc660 MOV %RDI,%R9 |
(3567) 0x4bc663 SHR $0x2,%R9 |
(3567) 0x4bc667 MOV -0xc0(%RBP),%R11 |
(3567) 0x4bc66e LEA (%R11,%RAX,8),%R11 |
(3567) 0x4bc672 JMP 4bc68d |
0x4bc674 NOPW %CS:(%RAX,%RAX,1) |
(3569) 0x4bc680 ADD $0x20,%R11 |
(3569) 0x4bc684 DEC %R9 |
(3569) 0x4bc687 JE 4bc4ca |
(3569) 0x4bc68d MOV -0x18(%R11),%R12 |
(3569) 0x4bc691 MOV (%RSI,%R12,8),%R13 |
(3569) 0x4bc695 ADD %R15,%R13 |
(3569) 0x4bc698 CMP %R10,(%R14,%R13,8) |
(3569) 0x4bc69c JGE 4bc6a5 |
(3569) 0x4bc69e MOV %RDX,(%R14,%R13,8) |
(3569) 0x4bc6a2 INC %RDX |
(3569) 0x4bc6a5 MOV -0x10(%R11),%R12 |
(3569) 0x4bc6a9 MOV (%RSI,%R12,8),%R13 |
(3569) 0x4bc6ad ADD %R15,%R13 |
(3569) 0x4bc6b0 CMP %R10,(%R14,%R13,8) |
(3569) 0x4bc6b4 JGE 4bc6bd |
(3569) 0x4bc6b6 MOV %RDX,(%R14,%R13,8) |
(3569) 0x4bc6ba INC %RDX |
(3569) 0x4bc6bd MOV -0x8(%R11),%R12 |
(3569) 0x4bc6c1 MOV (%RSI,%R12,8),%R13 |
(3569) 0x4bc6c5 ADD %R15,%R13 |
(3569) 0x4bc6c8 CMP %R10,(%R14,%R13,8) |
(3569) 0x4bc6cc JGE 4bc6d5 |
(3569) 0x4bc6ce MOV %RDX,(%R14,%R13,8) |
(3569) 0x4bc6d2 INC %RDX |
(3569) 0x4bc6d5 MOV (%R11),%R12 |
(3569) 0x4bc6d8 MOV (%RSI,%R12,8),%R13 |
(3569) 0x4bc6dc ADD %R15,%R13 |
(3569) 0x4bc6df CMP %R10,(%R14,%R13,8) |
(3569) 0x4bc6e3 JGE 4bc680 |
(3569) 0x4bc6e5 MOV %RDX,(%R14,%R13,8) |
(3569) 0x4bc6e9 INC %RDX |
(3569) 0x4bc6ec JMP 4bc680 |
(3563) 0x4bc6ee XOR %R12D,%R12D |
(3563) 0x4bc6f1 JMP 4bc719 |
0x4bc6f3 NOPW %CS:(%RAX,%RAX,1) |
(3564) 0x4bc700 MOV -0x30(%RBP),%R11 |
(3564) 0x4bc704 LEA 0x1(%R12),%RAX |
(3564) 0x4bc709 MOV -0x38(%RBP),%RCX |
(3564) 0x4bc70d CMP %RCX,%R12 |
(3564) 0x4bc710 MOV %RAX,%R12 |
(3564) 0x4bc713 JE 4bbfc0 |
(3564) 0x4bc719 LEA (%R11,%R12,1),%RAX |
(3564) 0x4bc71d MOV -0x80(%RBP),%RCX |
(3564) 0x4bc721 MOV (%RCX,%RAX,8),%RAX |
(3564) 0x4bc725 MOV 0x20(%RBP),%RCX |
(3564) 0x4bc729 MOV (%RCX,%RAX,8),%RDI |
(3564) 0x4bc72d MOV 0x8(%RCX,%RAX,8),%RAX |
(3564) 0x4bc732 MOV %RAX,%R9 |
(3564) 0x4bc735 SUB %RDI,%R9 |
(3564) 0x4bc738 JLE 4bc704 |
(3564) 0x4bc73a CMP $0x8,%R9 |
(3564) 0x4bc73e JAE 4bc780 |
(3564) 0x4bc740 MOV %R9,%RCX |
(3564) 0x4bc743 AND $-0x8,%RCX |
(3564) 0x4bc747 CMP %R9,%RCX |
(3564) 0x4bc74a JE 4bc700 |
(3564) 0x4bc74c ADD %RCX,%RDI |
(3564) 0x4bc74f MOV 0x28(%RBP),%R9 |
(3564) 0x4bc753 MOV -0x30(%RBP),%R11 |
(3564) 0x4bc757 JMP 4bc768 |
0x4bc759 NOPL (%RAX) |
(3565) 0x4bc760 INC %RDI |
(3565) 0x4bc763 CMP %RDI,%RAX |
(3565) 0x4bc766 JE 4bc704 |
(3565) 0x4bc768 MOV (%R9,%RDI,8),%RCX |
(3565) 0x4bc76c CMP %R8,(%R14,%RCX,8) |
(3565) 0x4bc770 JGE 4bc760 |
(3565) 0x4bc772 MOV %RBX,(%R14,%RCX,8) |
(3565) 0x4bc776 INC %RBX |
(3565) 0x4bc779 JMP 4bc760 |
0x4bc77b NOPL (%RAX,%RAX,1) |
(3564) 0x4bc780 MOV %R9,%RCX |
(3564) 0x4bc783 SHR $0x3,%RCX |
(3564) 0x4bc787 MOV -0x78(%RBP),%R11 |
(3564) 0x4bc78b LEA (%R11,%RDI,8),%R11 |
(3564) 0x4bc78f JMP 4bc7a9 |
0x4bc791 NOPW %CS:(%RAX,%RAX,1) |
(3566) 0x4bc7a0 ADD $0x40,%R11 |
(3566) 0x4bc7a4 DEC %RCX |
(3566) 0x4bc7a7 JE 4bc740 |
(3566) 0x4bc7a9 MOV -0x38(%R11),%R13 |
(3566) 0x4bc7ad CMP %R8,(%R14,%R13,8) |
(3566) 0x4bc7b1 JGE 4bc820 |
(3566) 0x4bc7b3 MOV %RBX,(%R14,%R13,8) |
(3566) 0x4bc7b7 INC %RBX |
(3566) 0x4bc7ba MOV -0x30(%R11),%R13 |
(3566) 0x4bc7be CMP %R8,(%R14,%R13,8) |
(3566) 0x4bc7c2 JL 4bc82a |
(3566) 0x4bc7c4 MOV -0x28(%R11),%R13 |
(3566) 0x4bc7c8 CMP %R8,(%R14,%R13,8) |
(3566) 0x4bc7cc JGE 4bc83b |
(3566) 0x4bc7ce MOV %RBX,(%R14,%R13,8) |
(3566) 0x4bc7d2 INC %RBX |
(3566) 0x4bc7d5 MOV -0x20(%R11),%R13 |
(3566) 0x4bc7d9 CMP %R8,(%R14,%R13,8) |
(3566) 0x4bc7dd JL 4bc845 |
(3566) 0x4bc7df MOV -0x18(%R11),%R13 |
(3566) 0x4bc7e3 CMP %R8,(%R14,%R13,8) |
(3566) 0x4bc7e7 JGE 4bc856 |
(3566) 0x4bc7e9 MOV %RBX,(%R14,%R13,8) |
(3566) 0x4bc7ed INC %RBX |
(3566) 0x4bc7f0 MOV -0x10(%R11),%R13 |
(3566) 0x4bc7f4 CMP %R8,(%R14,%R13,8) |
(3566) 0x4bc7f8 JL 4bc860 |
(3566) 0x4bc7fa MOV -0x8(%R11),%R13 |
(3566) 0x4bc7fe CMP %R8,(%R14,%R13,8) |
(3566) 0x4bc802 JGE 4bc871 |
(3566) 0x4bc804 MOV %RBX,(%R14,%R13,8) |
(3566) 0x4bc808 INC %RBX |
(3566) 0x4bc80b MOV (%R11),%R13 |
(3566) 0x4bc80e CMP %R8,(%R14,%R13,8) |
(3566) 0x4bc812 JGE 4bc7a0 |
(3566) 0x4bc814 JMP 4bc87e |
0x4bc816 NOPW %CS:(%RAX,%RAX,1) |
(3566) 0x4bc820 MOV -0x30(%R11),%R13 |
(3566) 0x4bc824 CMP %R8,(%R14,%R13,8) |
(3566) 0x4bc828 JGE 4bc7c4 |
(3566) 0x4bc82a MOV %RBX,(%R14,%R13,8) |
(3566) 0x4bc82e INC %RBX |
(3566) 0x4bc831 MOV -0x28(%R11),%R13 |
(3566) 0x4bc835 CMP %R8,(%R14,%R13,8) |
(3566) 0x4bc839 JL 4bc7ce |
(3566) 0x4bc83b MOV -0x20(%R11),%R13 |
(3566) 0x4bc83f CMP %R8,(%R14,%R13,8) |
(3566) 0x4bc843 JGE 4bc7df |
(3566) 0x4bc845 MOV %RBX,(%R14,%R13,8) |
(3566) 0x4bc849 INC %RBX |
(3566) 0x4bc84c MOV -0x18(%R11),%R13 |
(3566) 0x4bc850 CMP %R8,(%R14,%R13,8) |
(3566) 0x4bc854 JL 4bc7e9 |
(3566) 0x4bc856 MOV -0x10(%R11),%R13 |
(3566) 0x4bc85a CMP %R8,(%R14,%R13,8) |
(3566) 0x4bc85e JGE 4bc7fa |
(3566) 0x4bc860 MOV %RBX,(%R14,%R13,8) |
(3566) 0x4bc864 INC %RBX |
(3566) 0x4bc867 MOV -0x8(%R11),%R13 |
(3566) 0x4bc86b CMP %R8,(%R14,%R13,8) |
(3566) 0x4bc86f JL 4bc804 |
(3566) 0x4bc871 MOV (%R11),%R13 |
(3566) 0x4bc874 CMP %R8,(%R14,%R13,8) |
(3566) 0x4bc878 JGE 4bc7a0 |
(3566) 0x4bc87e MOV %RBX,(%R14,%R13,8) |
(3566) 0x4bc882 INC %RBX |
(3566) 0x4bc885 JMP 4bc7a0 |
0x4bc88a MOV 0xa0(%RBP),%RAX |
0x4bc891 MOV 0x68(%RBP),%RDX |
0x4bc895 MOV -0x40(%RBP),%RCX |
0x4bc899 MOV (%RCX),%RSI |
0x4bc89c MOVQ $0,(%RSI,%RDX,8) |
0x4bc8a4 MOV -0x48(%RBP),%RCX |
0x4bc8a8 MOV (%RCX),%RDI |
0x4bc8ab MOVQ $0,(%RDI,%RDX,8) |
0x4bc8b3 TEST %RAX,%RAX |
0x4bc8b6 JLE 4bcb56 |
0x4bc8bc LEA (%RSI,%RDX,8),%RCX |
0x4bc8c0 LEA (%RDI,%RDX,8),%RDX |
0x4bc8c4 LEA -0x8(%R15,%RAX,8),%R8 |
0x4bc8c9 CMP %RCX,%R8 |
0x4bc8cc MOV %R15,%R9 |
0x4bc8cf SETAE %R15B |
0x4bc8d3 CMP %R9,%RCX |
0x4bc8d6 SETAE %R12B |
0x4bc8da CMP %RDX,%R8 |
0x4bc8dd MOV %RBX,%R10 |
0x4bc8e0 SETB %BL |
0x4bc8e3 CMP %R9,%RDX |
0x4bc8e6 SETB %R14B |
0x4bc8ea CMP %R10,%RCX |
0x4bc8ed SETB %R8B |
0x4bc8f1 LEA -0x8(%R10,%RAX,8),%R9 |
0x4bc8f6 CMP %RCX,%R9 |
0x4bc8f9 SETB %R11B |
0x4bc8fd CMP %RDX,%R9 |
0x4bc900 SETB %R9B |
0x4bc904 CMP %R10,%RDX |
0x4bc907 SETB %R10B |
0x4bc90b TEST %R12B,%R15B |
0x4bc90e JNE 4bc9d0 |
0x4bc914 OR %R14B,%BL |
0x4bc917 JE 4bc9d0 |
0x4bc91d CMP %RSI,%RDI |
0x4bc920 JE 4bc9d0 |
0x4bc926 OR %R11B,%R8B |
0x4bc929 JE 4bc9d0 |
0x4bc92f OR %R10B,%R9B |
0x4bc932 JE 4bc9d0 |
0x4bc938 MOV %RAX,%RSI |
0x4bc93b AND $-0x4,%RSI |
0x4bc93f JE 4bcb24 |
0x4bc945 LEA -0x1(%RSI),%RDI |
0x4bc949 VPXOR %XMM0,%XMM0,%XMM0 |
0x4bc94d XOR %R8D,%R8D |
0x4bc950 VPXOR %XMM1,%XMM1,%XMM1 |
0x4bc954 MOV 0xb0(%RBP),%R9 |
0x4bc95b MOV 0xa8(%RBP),%R10 |
0x4bc962 NOPW %CS:(%RAX,%RAX,1) |
(3557) 0x4bc970 VPADDQ (%R10,%R8,8),%YMM1,%YMM1 |
(3557) 0x4bc976 VPADDQ (%R9,%R8,8),%YMM0,%YMM0 |
(3557) 0x4bc97c ADD $0x4,%R8 |
(3557) 0x4bc980 CMP %RDI,%R8 |
(3557) 0x4bc983 JLE 4bc970 |
0x4bc985 VEXTRACTI128 $0x1,%YMM1,%XMM2 |
0x4bc98b VPADDQ %XMM2,%XMM1,%XMM1 |
0x4bc98f VPSHUFD $-0x12,%XMM1,%XMM2 |
0x4bc994 VPADDQ %XMM2,%XMM1,%XMM1 |
0x4bc998 VMOVQ %XMM1,%RDI |
0x4bc99d VEXTRACTI128 $0x1,%YMM0,%XMM1 |
0x4bc9a3 VPADDQ %XMM1,%XMM0,%XMM0 |
0x4bc9a7 VPSHUFD $-0x12,%XMM0,%XMM1 |
0x4bc9ac VPADDQ %XMM1,%XMM0,%XMM0 |
0x4bc9b0 VMOVQ %XMM0,%R8 |
0x4bc9b5 CMP %RAX,%RSI |
0x4bc9b8 JNE 4bcb40 |
0x4bc9be JMP 4bcb50 |
0x4bc9c3 MOV -0x68(%RBP),%R11 |
0x4bc9c7 MOV 0xc0(%RBP),%R14 |
0x4bc9ce JMP 4bca20 |
0x4bc9d0 XOR %ESI,%ESI |
0x4bc9d2 MOV 0xb0(%RBP),%R9 |
0x4bc9d9 MOV 0xa8(%RBP),%R10 |
(3555) 0x4bc9e0 MOV (%R10,%RSI,8),%RDI |
(3555) 0x4bc9e4 MOV (%RCX),%R8 |
(3555) 0x4bc9e7 ADD %RDI,%R8 |
(3555) 0x4bc9ea MOV %R8,(%RCX) |
(3555) 0x4bc9ed MOV (%R9,%RSI,8),%RDI |
(3555) 0x4bc9f1 MOV (%RDX),%R8 |
(3555) 0x4bc9f4 ADD %RDI,%R8 |
(3555) 0x4bc9f7 MOV %R8,(%RDX) |
(3555) 0x4bc9fa INC %RSI |
(3555) 0x4bc9fd CMP %RSI,%RAX |
(3555) 0x4bca00 JNE 4bc9e0 |
0x4bca02 JMP 4bcb56 |
0x4bca07 XOR %EDX,%EDX |
0x4bca09 INC %RDX |
0x4bca0c NOPL (%RAX) |
(3561) 0x4bca10 ADD (%R15,%RDX,8),%RAX |
(3561) 0x4bca14 ADD (%RBX,%RDX,8),%RCX |
(3561) 0x4bca18 INC %RDX |
(3561) 0x4bca1b CMP %RDX,%RDI |
(3561) 0x4bca1e JNE 4bca10 |
0x4bca20 CMP %R11,-0x58(%RBP) |
0x4bca24 JGE 4bcb56 |
0x4bca2a MOV -0x40(%RBP),%RDX |
0x4bca2e MOV (%RDX),%RDX |
0x4bca31 MOV -0x48(%RBP),%RSI |
0x4bca35 MOV (%RSI),%RSI |
0x4bca38 LEA -0x8(%RDX,%R11,8),%R10 |
0x4bca3d MOV 0xb8(%RBP),%R12 |
0x4bca44 CMP %R12,%RDI |
0x4bca47 CMOVL %RDI,%R12 |
0x4bca4b IMUL %RDI,%R14 |
0x4bca4f LEA (%R12,%R14,1),%RDI |
0x4bca53 LEA (%RSI,%RDI,8),%R8 |
0x4bca57 LEA (%RDX,%RDI,8),%R9 |
0x4bca5b CMP %R8,%R10 |
0x4bca5e JB 4bca97 |
0x4bca60 LEA -0x8(%RSI,%R11,8),%R10 |
0x4bca65 CMP %R9,%R10 |
0x4bca68 JB 4bca97 |
0x4bca6a NOPW (%RAX,%RAX,1) |
(3560) 0x4bca70 LEA (%RDX,%RDI,8),%R8 |
(3560) 0x4bca74 MOV (%R8),%R9 |
(3560) 0x4bca77 ADD %RAX,%R9 |
(3560) 0x4bca7a MOV %R9,(%R8) |
(3560) 0x4bca7d LEA (%RSI,%RDI,8),%R8 |
(3560) 0x4bca81 MOV (%R8),%R9 |
(3560) 0x4bca84 ADD %RCX,%R9 |
(3560) 0x4bca87 MOV %R9,(%R8) |
(3560) 0x4bca8a INC %RDI |
(3560) 0x4bca8d CMP %RDI,%R11 |
(3560) 0x4bca90 JNE 4bca70 |
0x4bca92 JMP 4bcb56 |
0x4bca97 MOV %R11,%R10 |
0x4bca9a SUB %RDI,%R10 |
0x4bca9d MOV %R10,%RDI |
0x4bcaa0 AND $-0x4,%RDI |
0x4bcaa4 JE 4bcaee |
0x4bcaa6 MOV %R14,%R15 |
0x4bcaa9 MOV %R11,%R14 |
0x4bcaac LEA -0x1(%RDI),%R11 |
0x4bcab0 VPBROADCASTQ %RAX,%YMM0 |
0x4bcab6 VPBROADCASTQ %RCX,%YMM1 |
0x4bcabc XOR %EBX,%EBX |
0x4bcabe XCHG %AX,%AX |
(3559) 0x4bcac0 VPADDQ (%R9,%RBX,8),%YMM0,%YMM2 |
(3559) 0x4bcac6 VMOVDQU %YMM2,(%R9,%RBX,8) |
(3559) 0x4bcacc VPADDQ (%R8,%RBX,8),%YMM1,%YMM2 |
(3559) 0x4bcad2 VMOVDQU %YMM2,(%R8,%RBX,8) |
(3559) 0x4bcad8 ADD $0x4,%RBX |
(3559) 0x4bcadc CMP %R11,%RBX |
(3559) 0x4bcadf JBE 4bcac0 |
0x4bcae1 CMP %RDI,%R10 |
0x4bcae4 MOV %R14,%R11 |
0x4bcae7 MOV %R15,%R14 |
0x4bcaea JNE 4bcaf0 |
0x4bcaec JMP 4bcb56 |
0x4bcaee XOR %EDI,%EDI |
0x4bcaf0 ADD %R12,%RDI |
0x4bcaf3 ADD %R14,%RDI |
0x4bcaf6 NOPW %CS:(%RAX,%RAX,1) |
(3558) 0x4bcb00 LEA (%RDX,%RDI,8),%R8 |
(3558) 0x4bcb04 MOV (%R8),%R9 |
(3558) 0x4bcb07 ADD %RAX,%R9 |
(3558) 0x4bcb0a MOV %R9,(%R8) |
(3558) 0x4bcb0d LEA (%RSI,%RDI,8),%R8 |
(3558) 0x4bcb11 MOV (%R8),%R9 |
(3558) 0x4bcb14 ADD %RCX,%R9 |
(3558) 0x4bcb17 MOV %R9,(%R8) |
(3558) 0x4bcb1a INC %RDI |
(3558) 0x4bcb1d CMP %RDI,%R11 |
(3558) 0x4bcb20 JNE 4bcb00 |
0x4bcb22 JMP 4bcb56 |
0x4bcb24 XOR %R8D,%R8D |
0x4bcb27 XOR %EDI,%EDI |
0x4bcb29 XOR %ESI,%ESI |
0x4bcb2b MOV 0xb0(%RBP),%R9 |
0x4bcb32 MOV 0xa8(%RBP),%R10 |
0x4bcb39 NOPL (%RAX) |
(3556) 0x4bcb40 ADD (%R10,%RSI,8),%RDI |
(3556) 0x4bcb44 ADD (%R9,%RSI,8),%R8 |
(3556) 0x4bcb48 INC %RSI |
(3556) 0x4bcb4b CMP %RSI,%RAX |
(3556) 0x4bcb4e JNE 4bcb40 |
0x4bcb50 ADD %RDI,(%RCX) |
0x4bcb53 MOV %R8,(%RDX) |
0x4bcb56 ADD $0xb8,%RSP |
0x4bcb5d POP %RBX |
0x4bcb5e POP %R12 |
0x4bcb60 POP %R13 |
0x4bcb62 POP %R14 |
0x4bcb64 POP %R15 |
0x4bcb66 POP %RBP |
0x4bcb67 VZEROUPPER |
0x4bcb6a RET |
0x4bcb6b NOPL (%RAX,%RAX,1) |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►100.00+ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Path / |
Source file and lines | par_csr_matop.c:102-276 |
Module | exec |
nb instructions | 301 |
nb uops | 308 |
loop length | 1377 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 2 |
used zmm registers | 0 |
nb stack references | 29 |
micro-operation queue | 51.33 cycles |
front end | 51.33 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 23.10 | 23.30 | 18.33 | 18.33 | 18.00 | 23.30 | 23.10 | 18.00 | 18.00 | 18.00 | 23.20 | 18.33 |
cycles | 23.10 | 23.30 | 18.33 | 18.33 | 18.00 | 23.30 | 23.10 | 18.00 | 18.00 | 18.00 | 23.20 | 18.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 50.67-50.65 |
Stall cycles | 0.00 |
Front-end | 51.33 |
Dispatch | 23.30 |
Overall L1 | 51.33 |
all | 25% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 100% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 26% |
all | 15% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 25% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0xb8,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc0(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xb8(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x90(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x80(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 4e86c0 <hypre_GetThreadNum> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0x1(%RAX),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %R13,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4bbef4 <hypre_ParMatmul_RowSizes.extracted+0x1a4> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA 0x1(%R14),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
IMUL %RCX,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RDX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RAX,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %RCX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 4bbf18 <hypre_ParMatmul_RowSizes.extracted+0x1c8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R12,%R15,1),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4e6980 <hypre_CAlloc> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
ADD %R15,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4bbdff <hypre_ParMatmul_RowSizes.extracted+0xaf> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SAL $0x3,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R12,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4efbb0 <_intel_fast_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x50(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RBX,-0x58(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV %RBX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JL 4bbf29 <hypre_ParMatmul_RowSizes.extracted+0x1d9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xa8(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x50(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,(%R15,%R12,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xb0(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,(%RBX,%R12,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4e6a60 <hypre_Free> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x88(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x736190,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 410030 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 4bc88a <hypre_ParMatmul_RowSizes.extracted+0xb3a> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV (%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x1,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4bc9c3 <hypre_ParMatmul_RowSizes.extracted+0xc73> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RDI),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV -0x68(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xc0(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JE 4bca07 <hypre_ParMatmul_RowSizes.extracted+0xcb7> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ %RAX,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VMOVQ %RCX,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
LEA -0x1(%RDX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VEXTRACTI128 $0x1,%YMM1,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %XMM2,%XMM1,%XMM1 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VPSHUFD $-0x12,%XMM1,%XMM2 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %XMM2,%XMM1,%XMM1 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VMOVQ %XMM1,%RAX | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VEXTRACTI128 $0x1,%YMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %XMM1,%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VPSHUFD $-0x12,%XMM0,%XMM1 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %XMM1,%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VMOVQ %XMM0,%RCX | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
CMP %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4bca09 <hypre_ParMatmul_RowSizes.extracted+0xcb9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4bca20 <hypre_ParMatmul_RowSizes.extracted+0xcd0> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %RCX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %R13,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %R13,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %RCX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JNE 4bbdd5 <hypre_ParMatmul_RowSizes.extracted+0x85> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %R14D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RBX,-0x58(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV %RBX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4bbe11 <hypre_ParMatmul_RowSizes.extracted+0xc1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x60(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x58(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x28(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xb8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVL %RCX,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IMUL 0xc0(%RBP),%RCX | 1 | 0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
ADD %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
NOT %RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RBX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x38(%RDX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x38(%RDI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x38(%R9),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x18(%R8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R10D,%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R8,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 4bbff8 <hypre_ParMatmul_RowSizes.extracted+0x2a8> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x68(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x40(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,(%RSI,%RDX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x48(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,(%RDI,%RDX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4bcb56 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%RSI,%RDX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RDI,%RDX,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x8(%R15,%RAX,8),%R8 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %RCX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R15,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SETAE %R15B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %R9,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETAE %R12B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %RDX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SETB %BL | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %R9,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %R14B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %R10,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %R8B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LEA -0x8(%R10,%RAX,8),%R9 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %RCX,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %R11B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %RDX,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %R9B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %R10,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %R10B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %R12B,%R15B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 4bc9d0 <hypre_ParMatmul_RowSizes.extracted+0xc80> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
OR %R14B,%BL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bc9d0 <hypre_ParMatmul_RowSizes.extracted+0xc80> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JE 4bc9d0 <hypre_ParMatmul_RowSizes.extracted+0xc80> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
OR %R11B,%R8B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bc9d0 <hypre_ParMatmul_RowSizes.extracted+0xc80> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
OR %R10B,%R9B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bc9d0 <hypre_ParMatmul_RowSizes.extracted+0xc80> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bcb24 <hypre_ParMatmul_RowSizes.extracted+0xdd4> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RSI),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPXOR %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPXOR %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xb0(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VEXTRACTI128 $0x1,%YMM1,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %XMM2,%XMM1,%XMM1 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VPSHUFD $-0x12,%XMM1,%XMM2 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %XMM2,%XMM1,%XMM1 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VMOVQ %XMM1,%RDI | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VEXTRACTI128 $0x1,%YMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %XMM1,%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VPSHUFD $-0x12,%XMM0,%XMM1 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %XMM1,%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VMOVQ %XMM0,%R8 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
CMP %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4bcb40 <hypre_ParMatmul_RowSizes.extracted+0xdf0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4bcb50 <hypre_ParMatmul_RowSizes.extracted+0xe00> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x68(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xc0(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4bca20 <hypre_ParMatmul_RowSizes.extracted+0xcd0> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xb0(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4bcb56 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
INC %RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R11,-0x58(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JGE 4bcb56 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x40(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x48(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x8(%RDX,%R11,8),%R10 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0xb8(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R12,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVL %RDI,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IMUL %RDI,%R14 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%R12,%R14,1),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RSI,%RDI,8),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RDX,%RDI,8),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R8,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4bca97 <hypre_ParMatmul_RowSizes.extracted+0xd47> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x8(%RSI,%R11,8),%R10 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %R9,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4bca97 <hypre_ParMatmul_RowSizes.extracted+0xd47> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4bcb56 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R11,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RDI,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R10,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bcaee <hypre_ParMatmul_RowSizes.extracted+0xd9e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R14,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R11,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x1(%RDI),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPBROADCASTQ %RAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %RCX,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDI,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R14,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R15,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JNE 4bcaf0 <hypre_ParMatmul_RowSizes.extracted+0xda0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4bcb56 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD %R12,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %R14,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4bcb56 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xb0(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD %RDI,(%RCX) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
MOV %R8,(%RDX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $0xb8,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | par_csr_matop.c:102-276 |
Module | exec |
nb instructions | 301 |
nb uops | 308 |
loop length | 1377 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 2 |
used zmm registers | 0 |
nb stack references | 29 |
micro-operation queue | 51.33 cycles |
front end | 51.33 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 23.10 | 23.30 | 18.33 | 18.33 | 18.00 | 23.30 | 23.10 | 18.00 | 18.00 | 18.00 | 23.20 | 18.33 |
cycles | 23.10 | 23.30 | 18.33 | 18.33 | 18.00 | 23.30 | 23.10 | 18.00 | 18.00 | 18.00 | 23.20 | 18.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 50.67-50.65 |
Stall cycles | 0.00 |
Front-end | 51.33 |
Dispatch | 23.30 |
Overall L1 | 51.33 |
all | 25% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 100% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 26% |
all | 15% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 25% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0xb8,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc0(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xb8(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x90(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x80(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 4e86c0 <hypre_GetThreadNum> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0x1(%RAX),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %R13,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4bbef4 <hypre_ParMatmul_RowSizes.extracted+0x1a4> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA 0x1(%R14),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
IMUL %RCX,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RDX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RAX,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %RCX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 4bbf18 <hypre_ParMatmul_RowSizes.extracted+0x1c8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R12,%R15,1),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4e6980 <hypre_CAlloc> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
ADD %R15,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4bbdff <hypre_ParMatmul_RowSizes.extracted+0xaf> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SAL $0x3,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R12,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4efbb0 <_intel_fast_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x50(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RBX,-0x58(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV %RBX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JL 4bbf29 <hypre_ParMatmul_RowSizes.extracted+0x1d9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xa8(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x50(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,(%R15,%R12,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xb0(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,(%RBX,%R12,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4e6a60 <hypre_Free> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x88(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x736190,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 410030 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 4bc88a <hypre_ParMatmul_RowSizes.extracted+0xb3a> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV (%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x1,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4bc9c3 <hypre_ParMatmul_RowSizes.extracted+0xc73> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RDI),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV -0x68(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xc0(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JE 4bca07 <hypre_ParMatmul_RowSizes.extracted+0xcb7> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ %RAX,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VMOVQ %RCX,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
LEA -0x1(%RDX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VEXTRACTI128 $0x1,%YMM1,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %XMM2,%XMM1,%XMM1 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VPSHUFD $-0x12,%XMM1,%XMM2 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %XMM2,%XMM1,%XMM1 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VMOVQ %XMM1,%RAX | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VEXTRACTI128 $0x1,%YMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %XMM1,%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VPSHUFD $-0x12,%XMM0,%XMM1 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %XMM1,%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VMOVQ %XMM0,%RCX | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
CMP %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4bca09 <hypre_ParMatmul_RowSizes.extracted+0xcb9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4bca20 <hypre_ParMatmul_RowSizes.extracted+0xcd0> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %RCX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %R13,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %R13,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %RCX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JNE 4bbdd5 <hypre_ParMatmul_RowSizes.extracted+0x85> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %R14D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RBX,-0x58(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV %RBX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4bbe11 <hypre_ParMatmul_RowSizes.extracted+0xc1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x60(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x58(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x28(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xb8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVL %RCX,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IMUL 0xc0(%RBP),%RCX | 1 | 0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
ADD %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
NOT %RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RBX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x38(%RDX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x38(%RDI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x38(%R9),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x18(%R8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R10D,%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R8,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 4bbff8 <hypre_ParMatmul_RowSizes.extracted+0x2a8> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x68(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x40(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,(%RSI,%RDX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x48(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,(%RDI,%RDX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4bcb56 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%RSI,%RDX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RDI,%RDX,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x8(%R15,%RAX,8),%R8 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %RCX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R15,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SETAE %R15B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %R9,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETAE %R12B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %RDX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SETB %BL | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %R9,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %R14B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %R10,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %R8B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LEA -0x8(%R10,%RAX,8),%R9 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %RCX,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %R11B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %RDX,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %R9B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %R10,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %R10B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %R12B,%R15B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 4bc9d0 <hypre_ParMatmul_RowSizes.extracted+0xc80> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
OR %R14B,%BL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bc9d0 <hypre_ParMatmul_RowSizes.extracted+0xc80> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JE 4bc9d0 <hypre_ParMatmul_RowSizes.extracted+0xc80> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
OR %R11B,%R8B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bc9d0 <hypre_ParMatmul_RowSizes.extracted+0xc80> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
OR %R10B,%R9B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bc9d0 <hypre_ParMatmul_RowSizes.extracted+0xc80> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bcb24 <hypre_ParMatmul_RowSizes.extracted+0xdd4> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RSI),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPXOR %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPXOR %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xb0(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VEXTRACTI128 $0x1,%YMM1,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %XMM2,%XMM1,%XMM1 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VPSHUFD $-0x12,%XMM1,%XMM2 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %XMM2,%XMM1,%XMM1 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VMOVQ %XMM1,%RDI | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VEXTRACTI128 $0x1,%YMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %XMM1,%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VPSHUFD $-0x12,%XMM0,%XMM1 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %XMM1,%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VMOVQ %XMM0,%R8 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
CMP %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4bcb40 <hypre_ParMatmul_RowSizes.extracted+0xdf0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4bcb50 <hypre_ParMatmul_RowSizes.extracted+0xe00> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x68(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xc0(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4bca20 <hypre_ParMatmul_RowSizes.extracted+0xcd0> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xb0(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4bcb56 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
INC %RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R11,-0x58(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JGE 4bcb56 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x40(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x48(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x8(%RDX,%R11,8),%R10 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0xb8(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R12,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVL %RDI,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IMUL %RDI,%R14 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%R12,%R14,1),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RSI,%RDI,8),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RDX,%RDI,8),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R8,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4bca97 <hypre_ParMatmul_RowSizes.extracted+0xd47> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x8(%RSI,%R11,8),%R10 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %R9,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4bca97 <hypre_ParMatmul_RowSizes.extracted+0xd47> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4bcb56 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R11,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RDI,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R10,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bcaee <hypre_ParMatmul_RowSizes.extracted+0xd9e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R14,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R11,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x1(%RDI),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPBROADCASTQ %RAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %RCX,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDI,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R14,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R15,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JNE 4bcaf0 <hypre_ParMatmul_RowSizes.extracted+0xda0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4bcb56 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD %R12,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %R14,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4bcb56 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xb0(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD %RDI,(%RCX) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
MOV %R8,(%RDX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $0xb8,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_ParMatmul_RowSizes.extracted– | 1.15 | 0.23 |
▼Loop 3563 - par_csr_matop.c:109-242 - exec– | 0.03 | 0.01 |
▼Loop 3567 - par_csr_matop.c:109-231 - exec– | 0.49 | 0.09 |
○Loop 3570 - par_csr_matop.c:195-208 - exec | 0.58 | 0.11 |
○Loop 3571 - par_csr_matop.c:195-208 - exec | 0.02 | 0.01 |
○Loop 3568 - par_csr_matop.c:218-231 - exec | 0 | 0 |
○Loop 3569 - par_csr_matop.c:218-231 - exec | 0 | 0 |
▼Loop 3564 - par_csr_matop.c:109-231 - exec– | 0 | 0 |
○Loop 3565 - par_csr_matop.c:195-208 - exec | 0 | 0 |
○Loop 3566 - par_csr_matop.c:195-208 - exec | 0 | 0 |
▼Loop 3572 - par_csr_matop.c:109-177 - exec– | 0 | 0 |
○Loop 3573 - par_csr_matop.c:170-177 - exec | 0 | 0 |
○Loop 3576 - par_csr_matop.c:154-167 - exec | 0 | 0 |
○Loop 3574 - par_csr_matop.c:170-177 - exec | 0 | 0 |
○Loop 3575 - par_csr_matop.c:154-167 - exec | 0 | 0 |
○Loop 3559 - par_csr_matop.c:263-266 - exec | 0.02 | 0 |
○Loop 3557 - par_csr_matop.c:109-273 - exec | 0 | 0 |
○Loop 3562 - par_csr_matop.c:257-260 - exec | 0 | 0 |
○Loop 3561 - par_csr_matop.c:257-260 - exec | 0 | 0 |
○Loop 3560 - par_csr_matop.c:263-266 - exec | 0 | 0 |
○Loop 3556 - par_csr_matop.c:109-273 - exec | 0 | 0 |
○Loop 3555 - par_csr_matop.c:273-276 - exec | 0 | 0 |
○Loop 3558 - par_csr_matop.c:263-266 - exec | 0 | 0 |