Function: hypre_BoomerAMGCoarsenPMIS.extracted.10 | Module: exec | Source: par_coarsen.c:2435-2477 [...] | Coverage: 0.53% |
---|
Function: hypre_BoomerAMGCoarsenPMIS.extracted.10 | Module: exec | Source: par_coarsen.c:2435-2477 [...] | Coverage: 0.53% |
---|
/home/eoseret/qaas_runs_CPU_9468/172-019-1763/intel/AMG/build/AMG/AMG/parcsr_ls/par_coarsen.c: 2435 - 2477 |
-------------------------------------------------------------------------------- |
2435: #pragma omp parallel for private(ig, i, jS, j) HYPRE_SMP_SCHEDULE |
2436: #endif |
2437: for (ig = 0; ig < graph_size; ig++) { |
2438: i = graph_array[ig]; |
[...] |
2446: if(measure_array[i]<1.) CF_marker[i]= F_PT; |
[...] |
2453: if (CF_marker[i] > 0) CF_marker[i] = C_PT; |
[...] |
2465: for (jS = S_diag_i[i]; jS < S_diag_i[i+1]; jS++) |
2466: { |
2467: /* j is the column number, or the local number of the point influencing i */ |
2468: j = S_diag_j[jS]; |
2469: if (CF_marker[j] > 0) /* j is a C-point */ |
2470: CF_marker[i] = F_PT; |
2471: } |
2472: /* now the external part */ |
2473: for (jS = S_offd_i[i]; jS < S_offd_i[i+1]; jS++) |
2474: { |
2475: j = S_offd_j[jS]; |
2476: if (CF_marker_offd[j] > 0) /* j is a C-point */ |
2477: CF_marker[i] = F_PT; |
0x42a0f0 PUSH %RBP |
0x42a0f1 MOV %RSP,%RBP |
0x42a0f4 PUSH %R15 |
0x42a0f6 PUSH %R14 |
0x42a0f8 PUSH %R13 |
0x42a0fa PUSH %R12 |
0x42a0fc PUSH %RBX |
0x42a0fd SUB $0x48,%RSP |
0x42a101 MOV %R8,-0x60(%RBP) |
0x42a105 MOV %R9,%RBX |
0x42a108 MOV %RCX,%R15 |
0x42a10b MOV %RDX,%R12 |
0x42a10e MOV 0x28(%RBP),%RAX |
0x42a112 MOV %RAX,-0x58(%RBP) |
0x42a116 MOV 0x20(%RBP),%RAX |
0x42a11a MOV %RAX,-0x40(%RBP) |
0x42a11e MOV 0x18(%RBP),%R13 |
0x42a122 MOV 0x10(%RBP),%R14 |
0x42a126 MOVL $0,-0x30(%RBP) |
0x42a12d MOV (%RDI),%ESI |
0x42a12f MOVQ $0,-0x48(%RBP) |
0x42a137 MOVQ $0x1,-0x68(%RBP) |
0x42a13f SUB $0x8,%RSP |
0x42a143 LEA -0x68(%RBP),%RAX |
0x42a147 MOV $0x22,%EDX |
0x42a14c LEA -0x30(%RBP),%RCX |
0x42a150 LEA -0x48(%RBP),%R8 |
0x42a154 LEA 0x38(%RBP),%R9 |
0x42a158 MOV $0x5d4470,%EDI |
0x42a15d MOV %ESI,-0x2c(%RBP) |
0x42a160 PUSH $0x1 |
0x42a162 PUSH $0x1 |
0x42a164 PUSH %RAX |
0x42a165 CALL 410420 <__kmpc_for_static_init_8@plt> |
0x42a16a MOV -0x58(%RBP),%R11 |
0x42a16e MOV -0x60(%RBP),%R10 |
0x42a172 ADD $0x20,%RSP |
0x42a176 MOV 0x38(%RBP),%RDX |
0x42a17a MOV -0x48(%RBP),%RAX |
0x42a17e MOV %RDX,-0x38(%RBP) |
0x42a182 SUB %RAX,%RDX |
0x42a185 JB 42a2a2 |
0x42a18b MOV %RDX,-0x50(%RBP) |
0x42a18f MOV -0x38(%RBP),%RSI |
0x42a193 SUB %EAX,%ESI |
0x42a195 INC %ESI |
0x42a197 AND $0x7,%RSI |
0x42a19b JE 42a297 |
0x42a1a1 VMOVSD 0x172e67(%RIP),%XMM0 |
0x42a1a9 XOR %EDI,%EDI |
0x42a1ab MOV %R10,%RCX |
0x42a1ae MOV %R11,%RDX |
0x42a1b1 JMP 42a1dd |
0x42a1b3 NOPW %CS:(%RAX,%RAX,1) |
(429) 0x42a1c0 MOVQ $0x1,(%R14,%R8,8) |
(429) 0x42a1c8 INC %RAX |
(429) 0x42a1cb INC %RDI |
(429) 0x42a1ce MOV %RCX,%R10 |
(429) 0x42a1d1 MOV %RDX,%R11 |
(429) 0x42a1d4 CMP %RSI,%RDI |
(429) 0x42a1d7 JE 42a297 |
(429) 0x42a1dd MOV (%R11,%RAX,8),%R8 |
(429) 0x42a1e1 MOV -0x40(%RBP),%R9 |
(429) 0x42a1e5 VUCOMISD (%R9,%R8,8),%XMM0 |
(429) 0x42a1eb JBE 42a210 |
(429) 0x42a1ed MOV $-0x1,%R9 |
(429) 0x42a1f4 MOVQ $-0x1,(%R14,%R8,8) |
(429) 0x42a1fc TEST %R9,%R9 |
(429) 0x42a1ff JG 42a1c0 |
(429) 0x42a201 JMP 42a219 |
0x42a203 NOPW %CS:(%RAX,%RAX,1) |
(429) 0x42a210 MOV (%R14,%R8,8),%R9 |
(429) 0x42a214 TEST %R9,%R9 |
(429) 0x42a217 JG 42a1c0 |
(429) 0x42a219 MOV (%R12,%R8,8),%R9 |
(429) 0x42a21d MOV 0x8(%R12,%R8,8),%R10 |
(429) 0x42a222 JMP 42a233 |
0x42a224 NOPW %CS:(%RAX,%RAX,1) |
(431) 0x42a230 INC %R9 |
(431) 0x42a233 CMP %R10,%R9 |
(431) 0x42a236 JGE 42a260 |
(431) 0x42a238 MOV (%R15,%R9,8),%R11 |
(431) 0x42a23c CMPQ $0,(%R14,%R11,8) |
(431) 0x42a241 JLE 42a230 |
(431) 0x42a243 MOVQ $-0x1,(%R14,%R8,8) |
(431) 0x42a24b MOV 0x8(%R12,%R8,8),%R10 |
(431) 0x42a250 JMP 42a230 |
0x42a252 NOPW %CS:(%RAX,%RAX,1) |
(429) 0x42a260 MOV %RCX,%R10 |
(429) 0x42a263 MOV (%RCX,%R8,8),%R9 |
(429) 0x42a267 MOV 0x8(%RCX,%R8,8),%R10 |
(429) 0x42a26c JMP 42a273 |
0x42a26e XCHG %AX,%AX |
(430) 0x42a270 INC %R9 |
(430) 0x42a273 CMP %R10,%R9 |
(430) 0x42a276 JGE 42a1c8 |
(430) 0x42a27c MOV (%RBX,%R9,8),%R11 |
(430) 0x42a280 CMPQ $0,(%R13,%R11,8) |
(430) 0x42a286 JLE 42a270 |
(430) 0x42a288 MOVQ $-0x1,(%R14,%R8,8) |
(430) 0x42a290 MOV 0x8(%RCX,%R8,8),%R10 |
(430) 0x42a295 JMP 42a270 |
0x42a297 CMPQ $0x7,-0x50(%RBP) |
0x42a29c MOV -0x40(%RBP),%RCX |
0x42a2a0 JAE 42a2bd |
0x42a2a2 MOV -0x2c(%RBP),%ESI |
0x42a2a5 MOV $0x5d4490,%EDI |
0x42a2aa ADD $0x48,%RSP |
0x42a2ae POP %RBX |
0x42a2af POP %R12 |
0x42a2b1 POP %R13 |
0x42a2b3 POP %R14 |
0x42a2b5 POP %R15 |
0x42a2b7 POP %RBP |
0x42a2b8 JMP 410170 |
0x42a2bd VMOVSD 0x172d4b(%RIP),%XMM0 |
0x42a2c5 JMP 42a2e2 |
0x42a2c7 NOPW (%RAX,%RAX,1) |
(412) 0x42a2d0 MOVQ $0x1,(%R14,%RDX,8) |
(412) 0x42a2d8 ADD $0x8,%RAX |
(412) 0x42a2dc CMP -0x38(%RBP),%RSI |
(412) 0x42a2e0 JE 42a2a2 |
(412) 0x42a2e2 MOV (%R11,%RAX,8),%RDX |
(412) 0x42a2e6 VUCOMISD (%RCX,%RDX,8),%XMM0 |
(412) 0x42a2eb JBE 42a340 |
(412) 0x42a2ed MOV $-0x1,%RSI |
(412) 0x42a2f4 MOVQ $-0x1,(%R14,%RDX,8) |
(412) 0x42a2fc TEST %RSI,%RSI |
(412) 0x42a2ff JG 42a349 |
(412) 0x42a301 MOV (%R12,%RDX,8),%RSI |
(412) 0x42a305 MOV 0x8(%R12,%RDX,8),%RDI |
(412) 0x42a30a JMP 42a313 |
0x42a30c NOPL (%RAX) |
(428) 0x42a310 INC %RSI |
(428) 0x42a313 CMP %RDI,%RSI |
(428) 0x42a316 JGE 42a670 |
(428) 0x42a31c MOV (%R15,%RSI,8),%R8 |
(428) 0x42a320 CMPQ $0,(%R14,%R8,8) |
(428) 0x42a325 JLE 42a310 |
(428) 0x42a327 MOVQ $-0x1,(%R14,%RDX,8) |
(428) 0x42a32f MOV 0x8(%R12,%RDX,8),%RDI |
(428) 0x42a334 JMP 42a310 |
0x42a336 NOPW %CS:(%RAX,%RAX,1) |
(412) 0x42a340 MOV (%R14,%RDX,8),%RSI |
(412) 0x42a344 TEST %RSI,%RSI |
(412) 0x42a347 JLE 42a301 |
(412) 0x42a349 MOVQ $0x1,(%R14,%RDX,8) |
(412) 0x42a351 MOV 0x8(%R11,%RAX,8),%RDX |
(412) 0x42a356 VUCOMISD (%RCX,%RDX,8),%XMM0 |
(412) 0x42a35b JBE 42a3b0 |
(412) 0x42a35d MOV $-0x1,%RSI |
(412) 0x42a364 MOVQ $-0x1,(%R14,%RDX,8) |
(412) 0x42a36c TEST %RSI,%RSI |
(412) 0x42a36f JG 42a3b9 |
(412) 0x42a371 MOV (%R12,%RDX,8),%RSI |
(412) 0x42a375 MOV 0x8(%R12,%RDX,8),%RDI |
(412) 0x42a37a JMP 42a383 |
0x42a37c NOPL (%RAX) |
(426) 0x42a380 INC %RSI |
(426) 0x42a383 CMP %RDI,%RSI |
(426) 0x42a386 JGE 42a6b0 |
(426) 0x42a38c MOV (%R15,%RSI,8),%R8 |
(426) 0x42a390 CMPQ $0,(%R14,%R8,8) |
(426) 0x42a395 JLE 42a380 |
(426) 0x42a397 MOVQ $-0x1,(%R14,%RDX,8) |
(426) 0x42a39f MOV 0x8(%R12,%RDX,8),%RDI |
(426) 0x42a3a4 JMP 42a380 |
0x42a3a6 NOPW %CS:(%RAX,%RAX,1) |
(412) 0x42a3b0 MOV (%R14,%RDX,8),%RSI |
(412) 0x42a3b4 TEST %RSI,%RSI |
(412) 0x42a3b7 JLE 42a371 |
(412) 0x42a3b9 MOVQ $0x1,(%R14,%RDX,8) |
(412) 0x42a3c1 MOV 0x10(%R11,%RAX,8),%RDX |
(412) 0x42a3c6 VUCOMISD (%RCX,%RDX,8),%XMM0 |
(412) 0x42a3cb JBE 42a420 |
(412) 0x42a3cd MOV $-0x1,%RSI |
(412) 0x42a3d4 MOVQ $-0x1,(%R14,%RDX,8) |
(412) 0x42a3dc TEST %RSI,%RSI |
(412) 0x42a3df JG 42a429 |
(412) 0x42a3e1 MOV (%R12,%RDX,8),%RSI |
(412) 0x42a3e5 MOV 0x8(%R12,%RDX,8),%RDI |
(412) 0x42a3ea JMP 42a3f3 |
0x42a3ec NOPL (%RAX) |
(424) 0x42a3f0 INC %RSI |
(424) 0x42a3f3 CMP %RDI,%RSI |
(424) 0x42a3f6 JGE 42a6f0 |
(424) 0x42a3fc MOV (%R15,%RSI,8),%R8 |
(424) 0x42a400 CMPQ $0,(%R14,%R8,8) |
(424) 0x42a405 JLE 42a3f0 |
(424) 0x42a407 MOVQ $-0x1,(%R14,%RDX,8) |
(424) 0x42a40f MOV 0x8(%R12,%RDX,8),%RDI |
(424) 0x42a414 JMP 42a3f0 |
0x42a416 NOPW %CS:(%RAX,%RAX,1) |
(412) 0x42a420 MOV (%R14,%RDX,8),%RSI |
(412) 0x42a424 TEST %RSI,%RSI |
(412) 0x42a427 JLE 42a3e1 |
(412) 0x42a429 MOVQ $0x1,(%R14,%RDX,8) |
(412) 0x42a431 MOV 0x18(%R11,%RAX,8),%RDX |
(412) 0x42a436 VUCOMISD (%RCX,%RDX,8),%XMM0 |
(412) 0x42a43b JBE 42a490 |
(412) 0x42a43d MOV $-0x1,%RSI |
(412) 0x42a444 MOVQ $-0x1,(%R14,%RDX,8) |
(412) 0x42a44c TEST %RSI,%RSI |
(412) 0x42a44f JG 42a499 |
(412) 0x42a451 MOV (%R12,%RDX,8),%RSI |
(412) 0x42a455 MOV 0x8(%R12,%RDX,8),%RDI |
(412) 0x42a45a JMP 42a463 |
0x42a45c NOPL (%RAX) |
(422) 0x42a460 INC %RSI |
(422) 0x42a463 CMP %RDI,%RSI |
(422) 0x42a466 JGE 42a730 |
(422) 0x42a46c MOV (%R15,%RSI,8),%R8 |
(422) 0x42a470 CMPQ $0,(%R14,%R8,8) |
(422) 0x42a475 JLE 42a460 |
(422) 0x42a477 MOVQ $-0x1,(%R14,%RDX,8) |
(422) 0x42a47f MOV 0x8(%R12,%RDX,8),%RDI |
(422) 0x42a484 JMP 42a460 |
0x42a486 NOPW %CS:(%RAX,%RAX,1) |
(412) 0x42a490 MOV (%R14,%RDX,8),%RSI |
(412) 0x42a494 TEST %RSI,%RSI |
(412) 0x42a497 JLE 42a451 |
(412) 0x42a499 MOVQ $0x1,(%R14,%RDX,8) |
(412) 0x42a4a1 MOV 0x20(%R11,%RAX,8),%RDX |
(412) 0x42a4a6 VUCOMISD (%RCX,%RDX,8),%XMM0 |
(412) 0x42a4ab JBE 42a500 |
(412) 0x42a4ad MOV $-0x1,%RSI |
(412) 0x42a4b4 MOVQ $-0x1,(%R14,%RDX,8) |
(412) 0x42a4bc TEST %RSI,%RSI |
(412) 0x42a4bf JG 42a509 |
(412) 0x42a4c1 MOV (%R12,%RDX,8),%RSI |
(412) 0x42a4c5 MOV 0x8(%R12,%RDX,8),%RDI |
(412) 0x42a4ca JMP 42a4d3 |
0x42a4cc NOPL (%RAX) |
(420) 0x42a4d0 INC %RSI |
(420) 0x42a4d3 CMP %RDI,%RSI |
(420) 0x42a4d6 JGE 42a770 |
(420) 0x42a4dc MOV (%R15,%RSI,8),%R8 |
(420) 0x42a4e0 CMPQ $0,(%R14,%R8,8) |
(420) 0x42a4e5 JLE 42a4d0 |
(420) 0x42a4e7 MOVQ $-0x1,(%R14,%RDX,8) |
(420) 0x42a4ef MOV 0x8(%R12,%RDX,8),%RDI |
(420) 0x42a4f4 JMP 42a4d0 |
0x42a4f6 NOPW %CS:(%RAX,%RAX,1) |
(412) 0x42a500 MOV (%R14,%RDX,8),%RSI |
(412) 0x42a504 TEST %RSI,%RSI |
(412) 0x42a507 JLE 42a4c1 |
(412) 0x42a509 MOVQ $0x1,(%R14,%RDX,8) |
(412) 0x42a511 MOV 0x28(%R11,%RAX,8),%RDX |
(412) 0x42a516 VUCOMISD (%RCX,%RDX,8),%XMM0 |
(412) 0x42a51b JBE 42a570 |
(412) 0x42a51d MOV $-0x1,%RSI |
(412) 0x42a524 MOVQ $-0x1,(%R14,%RDX,8) |
(412) 0x42a52c TEST %RSI,%RSI |
(412) 0x42a52f JG 42a579 |
(412) 0x42a531 MOV (%R12,%RDX,8),%RSI |
(412) 0x42a535 MOV 0x8(%R12,%RDX,8),%RDI |
(412) 0x42a53a JMP 42a543 |
0x42a53c NOPL (%RAX) |
(418) 0x42a540 INC %RSI |
(418) 0x42a543 CMP %RDI,%RSI |
(418) 0x42a546 JGE 42a7b0 |
(418) 0x42a54c MOV (%R15,%RSI,8),%R8 |
(418) 0x42a550 CMPQ $0,(%R14,%R8,8) |
(418) 0x42a555 JLE 42a540 |
(418) 0x42a557 MOVQ $-0x1,(%R14,%RDX,8) |
(418) 0x42a55f MOV 0x8(%R12,%RDX,8),%RDI |
(418) 0x42a564 JMP 42a540 |
0x42a566 NOPW %CS:(%RAX,%RAX,1) |
(412) 0x42a570 MOV (%R14,%RDX,8),%RSI |
(412) 0x42a574 TEST %RSI,%RSI |
(412) 0x42a577 JLE 42a531 |
(412) 0x42a579 MOVQ $0x1,(%R14,%RDX,8) |
(412) 0x42a581 MOV 0x30(%R11,%RAX,8),%RDX |
(412) 0x42a586 VUCOMISD (%RCX,%RDX,8),%XMM0 |
(412) 0x42a58b JBE 42a5e0 |
(412) 0x42a58d MOV $-0x1,%RSI |
(412) 0x42a594 MOVQ $-0x1,(%R14,%RDX,8) |
(412) 0x42a59c TEST %RSI,%RSI |
(412) 0x42a59f JG 42a5e9 |
(412) 0x42a5a1 MOV (%R12,%RDX,8),%RSI |
(412) 0x42a5a5 MOV 0x8(%R12,%RDX,8),%RDI |
(412) 0x42a5aa JMP 42a5b3 |
0x42a5ac NOPL (%RAX) |
(416) 0x42a5b0 INC %RSI |
(416) 0x42a5b3 CMP %RDI,%RSI |
(416) 0x42a5b6 JGE 42a7f0 |
(416) 0x42a5bc MOV (%R15,%RSI,8),%R8 |
(416) 0x42a5c0 CMPQ $0,(%R14,%R8,8) |
(416) 0x42a5c5 JLE 42a5b0 |
(416) 0x42a5c7 MOVQ $-0x1,(%R14,%RDX,8) |
(416) 0x42a5cf MOV 0x8(%R12,%RDX,8),%RDI |
(416) 0x42a5d4 JMP 42a5b0 |
0x42a5d6 NOPW %CS:(%RAX,%RAX,1) |
(412) 0x42a5e0 MOV (%R14,%RDX,8),%RSI |
(412) 0x42a5e4 TEST %RSI,%RSI |
(412) 0x42a5e7 JLE 42a5a1 |
(412) 0x42a5e9 MOVQ $0x1,(%R14,%RDX,8) |
(412) 0x42a5f1 MOV 0x38(%R11,%RAX,8),%RDX |
(412) 0x42a5f6 VUCOMISD (%RCX,%RDX,8),%XMM0 |
(412) 0x42a5fb JBE 42a620 |
(412) 0x42a5fd MOV $-0x1,%RDI |
(412) 0x42a604 MOVQ $-0x1,(%R14,%RDX,8) |
(412) 0x42a60c LEA 0x7(%RAX),%RSI |
(412) 0x42a610 TEST %RDI,%RDI |
(412) 0x42a613 JG 42a2d0 |
(412) 0x42a619 JMP 42a631 |
0x42a61b NOPL (%RAX,%RAX,1) |
(412) 0x42a620 MOV (%R14,%RDX,8),%RDI |
(412) 0x42a624 LEA 0x7(%RAX),%RSI |
(412) 0x42a628 TEST %RDI,%RDI |
(412) 0x42a62b JG 42a2d0 |
(412) 0x42a631 MOV (%R12,%RDX,8),%RDI |
(412) 0x42a635 MOV 0x8(%R12,%RDX,8),%R8 |
(412) 0x42a63a JMP 42a643 |
0x42a63c NOPL (%RAX) |
(414) 0x42a640 INC %RDI |
(414) 0x42a643 CMP %R8,%RDI |
(414) 0x42a646 JGE 42a830 |
(414) 0x42a64c MOV (%R15,%RDI,8),%R9 |
(414) 0x42a650 CMPQ $0,(%R14,%R9,8) |
(414) 0x42a655 JLE 42a640 |
(414) 0x42a657 MOVQ $-0x1,(%R14,%RDX,8) |
(414) 0x42a65f MOV 0x8(%R12,%RDX,8),%R8 |
(414) 0x42a664 JMP 42a640 |
0x42a666 NOPW %CS:(%RAX,%RAX,1) |
(412) 0x42a670 MOV (%R10,%RDX,8),%RSI |
(412) 0x42a674 MOV 0x8(%R10,%RDX,8),%RDI |
(412) 0x42a679 JMP 42a683 |
0x42a67b NOPL (%RAX,%RAX,1) |
(427) 0x42a680 INC %RSI |
(427) 0x42a683 CMP %RDI,%RSI |
(427) 0x42a686 JGE 42a351 |
(427) 0x42a68c MOV (%RBX,%RSI,8),%R8 |
(427) 0x42a690 CMPQ $0,(%R13,%R8,8) |
(427) 0x42a696 JLE 42a680 |
(427) 0x42a698 MOVQ $-0x1,(%R14,%RDX,8) |
(427) 0x42a6a0 MOV 0x8(%R10,%RDX,8),%RDI |
(427) 0x42a6a5 JMP 42a680 |
0x42a6a7 NOPW (%RAX,%RAX,1) |
(412) 0x42a6b0 MOV (%R10,%RDX,8),%RSI |
(412) 0x42a6b4 MOV 0x8(%R10,%RDX,8),%RDI |
(412) 0x42a6b9 JMP 42a6c3 |
0x42a6bb NOPL (%RAX,%RAX,1) |
(425) 0x42a6c0 INC %RSI |
(425) 0x42a6c3 CMP %RDI,%RSI |
(425) 0x42a6c6 JGE 42a3c1 |
(425) 0x42a6cc MOV (%RBX,%RSI,8),%R8 |
(425) 0x42a6d0 CMPQ $0,(%R13,%R8,8) |
(425) 0x42a6d6 JLE 42a6c0 |
(425) 0x42a6d8 MOVQ $-0x1,(%R14,%RDX,8) |
(425) 0x42a6e0 MOV 0x8(%R10,%RDX,8),%RDI |
(425) 0x42a6e5 JMP 42a6c0 |
0x42a6e7 NOPW (%RAX,%RAX,1) |
(412) 0x42a6f0 MOV (%R10,%RDX,8),%RSI |
(412) 0x42a6f4 MOV 0x8(%R10,%RDX,8),%RDI |
(412) 0x42a6f9 JMP 42a703 |
0x42a6fb NOPL (%RAX,%RAX,1) |
(423) 0x42a700 INC %RSI |
(423) 0x42a703 CMP %RDI,%RSI |
(423) 0x42a706 JGE 42a431 |
(423) 0x42a70c MOV (%RBX,%RSI,8),%R8 |
(423) 0x42a710 CMPQ $0,(%R13,%R8,8) |
(423) 0x42a716 JLE 42a700 |
(423) 0x42a718 MOVQ $-0x1,(%R14,%RDX,8) |
(423) 0x42a720 MOV 0x8(%R10,%RDX,8),%RDI |
(423) 0x42a725 JMP 42a700 |
0x42a727 NOPW (%RAX,%RAX,1) |
(412) 0x42a730 MOV (%R10,%RDX,8),%RSI |
(412) 0x42a734 MOV 0x8(%R10,%RDX,8),%RDI |
(412) 0x42a739 JMP 42a743 |
0x42a73b NOPL (%RAX,%RAX,1) |
(421) 0x42a740 INC %RSI |
(421) 0x42a743 CMP %RDI,%RSI |
(421) 0x42a746 JGE 42a4a1 |
(421) 0x42a74c MOV (%RBX,%RSI,8),%R8 |
(421) 0x42a750 CMPQ $0,(%R13,%R8,8) |
(421) 0x42a756 JLE 42a740 |
(421) 0x42a758 MOVQ $-0x1,(%R14,%RDX,8) |
(421) 0x42a760 MOV 0x8(%R10,%RDX,8),%RDI |
(421) 0x42a765 JMP 42a740 |
0x42a767 NOPW (%RAX,%RAX,1) |
(412) 0x42a770 MOV (%R10,%RDX,8),%RSI |
(412) 0x42a774 MOV 0x8(%R10,%RDX,8),%RDI |
(412) 0x42a779 JMP 42a783 |
0x42a77b NOPL (%RAX,%RAX,1) |
(419) 0x42a780 INC %RSI |
(419) 0x42a783 CMP %RDI,%RSI |
(419) 0x42a786 JGE 42a511 |
(419) 0x42a78c MOV (%RBX,%RSI,8),%R8 |
(419) 0x42a790 CMPQ $0,(%R13,%R8,8) |
(419) 0x42a796 JLE 42a780 |
(419) 0x42a798 MOVQ $-0x1,(%R14,%RDX,8) |
(419) 0x42a7a0 MOV 0x8(%R10,%RDX,8),%RDI |
(419) 0x42a7a5 JMP 42a780 |
0x42a7a7 NOPW (%RAX,%RAX,1) |
(412) 0x42a7b0 MOV (%R10,%RDX,8),%RSI |
(412) 0x42a7b4 MOV 0x8(%R10,%RDX,8),%RDI |
(412) 0x42a7b9 JMP 42a7c3 |
0x42a7bb NOPL (%RAX,%RAX,1) |
(417) 0x42a7c0 INC %RSI |
(417) 0x42a7c3 CMP %RDI,%RSI |
(417) 0x42a7c6 JGE 42a581 |
(417) 0x42a7cc MOV (%RBX,%RSI,8),%R8 |
(417) 0x42a7d0 CMPQ $0,(%R13,%R8,8) |
(417) 0x42a7d6 JLE 42a7c0 |
(417) 0x42a7d8 MOVQ $-0x1,(%R14,%RDX,8) |
(417) 0x42a7e0 MOV 0x8(%R10,%RDX,8),%RDI |
(417) 0x42a7e5 JMP 42a7c0 |
0x42a7e7 NOPW (%RAX,%RAX,1) |
(412) 0x42a7f0 MOV (%R10,%RDX,8),%RSI |
(412) 0x42a7f4 MOV 0x8(%R10,%RDX,8),%RDI |
(412) 0x42a7f9 JMP 42a803 |
0x42a7fb NOPL (%RAX,%RAX,1) |
(415) 0x42a800 INC %RSI |
(415) 0x42a803 CMP %RDI,%RSI |
(415) 0x42a806 JGE 42a5f1 |
(415) 0x42a80c MOV (%RBX,%RSI,8),%R8 |
(415) 0x42a810 CMPQ $0,(%R13,%R8,8) |
(415) 0x42a816 JLE 42a800 |
(415) 0x42a818 MOVQ $-0x1,(%R14,%RDX,8) |
(415) 0x42a820 MOV 0x8(%R10,%RDX,8),%RDI |
(415) 0x42a825 JMP 42a800 |
0x42a827 NOPW (%RAX,%RAX,1) |
(412) 0x42a830 MOV (%R10,%RDX,8),%RDI |
(412) 0x42a834 MOV 0x8(%R10,%RDX,8),%R8 |
(412) 0x42a839 JMP 42a843 |
0x42a83b NOPL (%RAX,%RAX,1) |
(413) 0x42a840 INC %RDI |
(413) 0x42a843 CMP %R8,%RDI |
(413) 0x42a846 JGE 42a2d8 |
(413) 0x42a84c MOV (%RBX,%RDI,8),%R9 |
(413) 0x42a850 CMPQ $0,(%R13,%R9,8) |
(413) 0x42a856 JLE 42a840 |
(413) 0x42a858 MOVQ $-0x1,(%R14,%RDX,8) |
(413) 0x42a860 MOV 0x8(%R10,%RDX,8),%R8 |
(413) 0x42a865 JMP 42a840 |
0x42a867 NOPW (%RAX,%RAX,1) |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►100.00+ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Path / |
Source file and lines | par_coarsen.c:2435-2477 |
Module | exec |
nb instructions | 107 |
nb uops | 69 |
loop length | 535 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 1 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 14 |
micro-operation queue | 11.50 cycles |
front end | 11.50 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 5.00 | 5.00 | 4.75 | 4.75 | 3.50 | 8.33 | 8.33 | 8.33 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
cycles | 5.00 | 5.00 | 4.75 | 4.75 | 3.50 | 8.33 | 8.33 | 8.33 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 11.50 |
Dispatch | 8.33 |
Overall L1 | 11.50 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 0% |
all | 0% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 10% |
load | 11% |
store | 9% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 8% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 12% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 10% |
load | 11% |
store | 9% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 8% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 11% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput | Vectorization |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
SUB $0x48,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %R8,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %RCX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %RDX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV 0x28(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RAX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RAX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV 0x18(%RBP),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
MOV 0x10(%RBP),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
MOVL $0,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (6.3%) |
MOVQ $0,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOVQ $0x1,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x68(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
LEA -0x30(%RBP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x48(%RBP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA 0x38(%RBP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV $0x5d4470,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %ESI,-0x2c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
CALL 410420 <__kmpc_for_static_init_8@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
MOV -0x58(%RBP),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
MOV -0x60(%RBP),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV 0x38(%RBP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RDX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
SUB %RAX,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JB 42a2a2 <hypre_BoomerAMGCoarsenPMIS.extracted.10+0x1b2> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV %RDX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV -0x38(%RBP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
SUB %EAX,%ESI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
INC %ESI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
AND $0x7,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JE 42a297 <hypre_BoomerAMGCoarsenPMIS.extracted.10+0x1a7> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
VMOVSD 0x172e67(%RIP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (12.5%) |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | N/A |
MOV %R10,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %R11,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
JMP 42a1dd <hypre_BoomerAMGCoarsenPMIS.extracted.10+0xed> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
CMPQ $0x7,-0x50(%RBP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (12.5%) |
MOV -0x40(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
JAE 42a2bd <hypre_BoomerAMGCoarsenPMIS.extracted.10+0x1cd> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV -0x2c(%RBP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (6.3%) |
MOV $0x5d4490,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
ADD $0x48,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
JMP 410170 <__kmpc_for_static_fini@plt> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
VMOVSD 0x172d4b(%RIP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (12.5%) |
JMP 42a2e2 <hypre_BoomerAMGCoarsenPMIS.extracted.10+0x1f2> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
Source file and lines | par_coarsen.c:2435-2477 |
Module | exec |
nb instructions | 107 |
nb uops | 69 |
loop length | 535 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 1 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 14 |
micro-operation queue | 11.50 cycles |
front end | 11.50 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 5.00 | 5.00 | 4.75 | 4.75 | 3.50 | 8.33 | 8.33 | 8.33 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
cycles | 5.00 | 5.00 | 4.75 | 4.75 | 3.50 | 8.33 | 8.33 | 8.33 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 11.50 |
Dispatch | 8.33 |
Overall L1 | 11.50 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 0% |
all | 0% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 10% |
load | 11% |
store | 9% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 8% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 12% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 10% |
load | 11% |
store | 9% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 8% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 11% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput | Vectorization |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
SUB $0x48,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %R8,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %RCX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %RDX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV 0x28(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RAX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RAX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV 0x18(%RBP),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
MOV 0x10(%RBP),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
MOVL $0,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (6.3%) |
MOVQ $0,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOVQ $0x1,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x68(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
LEA -0x30(%RBP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x48(%RBP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA 0x38(%RBP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV $0x5d4470,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %ESI,-0x2c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
CALL 410420 <__kmpc_for_static_init_8@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
MOV -0x58(%RBP),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
MOV -0x60(%RBP),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV 0x38(%RBP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RDX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
SUB %RAX,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JB 42a2a2 <hypre_BoomerAMGCoarsenPMIS.extracted.10+0x1b2> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV %RDX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV -0x38(%RBP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
SUB %EAX,%ESI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
INC %ESI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
AND $0x7,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JE 42a297 <hypre_BoomerAMGCoarsenPMIS.extracted.10+0x1a7> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
VMOVSD 0x172e67(%RIP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (12.5%) |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | N/A |
MOV %R10,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %R11,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
JMP 42a1dd <hypre_BoomerAMGCoarsenPMIS.extracted.10+0xed> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
CMPQ $0x7,-0x50(%RBP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (12.5%) |
MOV -0x40(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
JAE 42a2bd <hypre_BoomerAMGCoarsenPMIS.extracted.10+0x1cd> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV -0x2c(%RBP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (6.3%) |
MOV $0x5d4490,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
ADD $0x48,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
JMP 410170 <__kmpc_for_static_fini@plt> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
VMOVSD 0x172d4b(%RIP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (12.5%) |
JMP 42a2e2 <hypre_BoomerAMGCoarsenPMIS.extracted.10+0x1f2> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_BoomerAMGCoarsenPMIS.extracted.10– | 0.53 | 0.39 |
▼Loop 412 - par_coarsen.c:2435-2477 - exec– | 0.06 | 0.04 |
○Loop 422 - par_coarsen.c:2465-2470 - exec | 0.06 | 0.04 |
○Loop 416 - par_coarsen.c:2465-2470 - exec | 0.06 | 0.04 |
○Loop 414 - par_coarsen.c:2465-2470 - exec | 0.06 | 0.04 |
○Loop 426 - par_coarsen.c:2465-2470 - exec | 0.06 | 0.04 |
○Loop 428 - par_coarsen.c:2465-2470 - exec | 0.06 | 0.04 |
○Loop 418 - par_coarsen.c:2465-2470 - exec | 0.06 | 0.04 |
○Loop 424 - par_coarsen.c:2465-2470 - exec | 0.06 | 0.04 |
○Loop 420 - par_coarsen.c:2465-2470 - exec | 0.05 | 0.04 |
○Loop 413 - par_coarsen.c:2473-2477 - exec | 0.00 | 0.00 |
○Loop 423 - par_coarsen.c:2473-2477 - exec | 0.00 | 0.00 |
○Loop 417 - par_coarsen.c:2473-2477 - exec | 0.00 | 0.00 |
○Loop 415 - par_coarsen.c:2473-2477 - exec | 0.00 | 0.00 |
○Loop 427 - par_coarsen.c:2473-2477 - exec | 0.00 | 0.00 |
○Loop 425 - par_coarsen.c:2473-2477 - exec | 0.00 | 0.01 |
○Loop 419 - par_coarsen.c:2473-2477 - exec | 0.00 | 0.00 |
○Loop 421 - par_coarsen.c:2473-2477 - exec | 0.00 | 0.01 |
▼Loop 429 - par_coarsen.c:2435-2477 - exec– | 0.00 | 0.00 |
○Loop 431 - par_coarsen.c:2465-2470 - exec | 0.00 | 0.00 |
○Loop 430 - par_coarsen.c:2473-2477 - exec | 0.00 | 0.00 |