Function: hypre_BoomerAMGCoarsenPMIS.extracted.15 | Module: exec | Source: par_coarsen.c:2354-2381 | Coverage: 0.94% |
---|
Function: hypre_BoomerAMGCoarsenPMIS.extracted.15 | Module: exec | Source: par_coarsen.c:2354-2381 | Coverage: 0.94% |
---|
/home/eoseret/qaas_runs_CPU_9468/172-019-1763/intel/AMG/build/AMG/AMG/parcsr_ls/par_coarsen.c: 2354 - 2381 |
-------------------------------------------------------------------------------- |
2354: #pragma omp parallel for private(ig, i, jS, j, jj) HYPRE_SMP_SCHEDULE |
2355: #endif |
2356: for (ig = 0; ig < graph_size; ig++) |
2357: { |
2358: i = graph_array[ig]; |
2359: if (measure_array[i] > 1) |
2360: { |
2361: for (jS = S_diag_i[i]; jS < S_diag_i[i+1]; jS++) |
2362: { |
2363: j = S_diag_j[jS]; |
2364: if (measure_array[j] > 1) |
2365: { |
2366: if (measure_array[i] > measure_array[j]) |
2367: CF_marker[j] = 0; |
2368: else if (measure_array[j] > measure_array[i]) |
2369: CF_marker[i] = 0; |
2370: } |
2371: } /* for each local neighbor j of i */ |
2372: for (jS = S_offd_i[i]; jS < S_offd_i[i+1]; jS++) |
2373: { |
2374: jj = S_offd_j[jS]; |
2375: j = num_variables+jj; |
2376: if (measure_array[j] > 1) |
2377: { |
2378: if (measure_array[i] > measure_array[j]) |
2379: CF_marker_offd[jj] = 0; |
2380: else if (measure_array[j] > measure_array[i]) |
2381: CF_marker[i] = 0; |
0x42a870 PUSH %RBP |
0x42a871 MOV %RSP,%RBP |
0x42a874 PUSH %R15 |
0x42a876 PUSH %R14 |
0x42a878 PUSH %R13 |
0x42a87a PUSH %R12 |
0x42a87c PUSH %RBX |
0x42a87d SUB $0x58,%RSP |
0x42a881 MOV %R9,-0x68(%RBP) |
0x42a885 MOV %R8,%R14 |
0x42a888 MOV %RCX,%R15 |
0x42a88b MOV %RDX,%R12 |
0x42a88e MOV 0x30(%RBP),%RAX |
0x42a892 MOV %RAX,-0x60(%RBP) |
0x42a896 MOV 0x20(%RBP),%RAX |
0x42a89a MOV 0x28(%RBP),%R13 |
0x42a89e MOV %RAX,-0x38(%RBP) |
0x42a8a2 MOV 0x18(%RBP),%RAX |
0x42a8a6 MOV %RAX,-0x30(%RBP) |
0x42a8aa MOV 0x10(%RBP),%RBX |
0x42a8ae MOVL $0,-0x40(%RBP) |
0x42a8b5 MOV (%RDI),%ESI |
0x42a8b7 MOVQ $0,-0x50(%RBP) |
0x42a8bf MOVQ $0x1,-0x78(%RBP) |
0x42a8c7 SUB $0x8,%RSP |
0x42a8cb LEA -0x78(%RBP),%RAX |
0x42a8cf LEA -0x40(%RBP),%RCX |
0x42a8d3 LEA -0x50(%RBP),%R8 |
0x42a8d7 LEA 0x40(%RBP),%R9 |
0x42a8db MOV $0x5d44d0,%EDI |
0x42a8e0 MOV %ESI,-0x3c(%RBP) |
0x42a8e3 MOV $0x22,%EDX |
0x42a8e8 PUSH $0x1 |
0x42a8ea PUSH $0x1 |
0x42a8ec PUSH %RAX |
0x42a8ed CALL 410420 <__kmpc_for_static_init_8@plt> |
0x42a8f2 MOV -0x60(%RBP),%R10 |
0x42a8f6 MOV -0x68(%RBP),%R11 |
0x42a8fa ADD $0x20,%RSP |
0x42a8fe MOV 0x40(%RBP),%RCX |
0x42a902 MOV -0x50(%RBP),%RAX |
0x42a906 MOV %RCX,-0x48(%RBP) |
0x42a90a SUB %RAX,%RCX |
0x42a90d JB 42aa20 |
0x42a913 MOV %RCX,-0x58(%RBP) |
0x42a917 MOV -0x48(%RBP),%RCX |
0x42a91b SUB %EAX,%ECX |
0x42a91d INC %ECX |
0x42a91f AND $0x7,%RCX |
0x42a923 MOV %RCX,-0x70(%RBP) |
0x42a927 JE 42aa19 |
0x42a92d VMOVSD 0x1726db(%RIP),%XMM0 |
0x42a935 XOR %EDI,%EDI |
0x42a937 JMP 42a953 |
0x42a939 NOPL (%RAX) |
(449) 0x42a940 INC %RAX |
(449) 0x42a943 INC %RDI |
(449) 0x42a946 MOV %RSI,%R10 |
(449) 0x42a949 CMP -0x70(%RBP),%RDI |
(449) 0x42a94d JE 42aa19 |
(449) 0x42a953 MOV (%R10,%RAX,8),%R8 |
(449) 0x42a957 MOV %R10,%RSI |
(449) 0x42a95a VMOVSD (%R13,%R8,8),%XMM1 |
(449) 0x42a961 VUCOMISD %XMM1,%XMM0 |
(449) 0x42a965 JAE 42a940 |
(449) 0x42a967 MOV (%R12,%R8,8),%R9 |
(449) 0x42a96b MOV -0x30(%RBP),%RCX |
(449) 0x42a96f CMP 0x8(%R12,%R8,8),%R9 |
(449) 0x42a974 JL 42a9a2 |
(449) 0x42a976 MOV (%R14,%R8,8),%R9 |
(449) 0x42a97a CMP 0x8(%R14,%R8,8),%R9 |
(449) 0x42a97f JGE 42a940 |
(449) 0x42a981 MOV -0x30(%RBP),%RCX |
(449) 0x42a985 LEA (%RCX,%R8,8),%R10 |
(449) 0x42a989 JMP 42a9f0 |
0x42a98b NOPL (%RAX,%RAX,1) |
(451) 0x42a990 MOVQ $0,(%RCX,%R10,8) |
(451) 0x42a998 INC %R9 |
(451) 0x42a99b CMP 0x8(%R12,%R8,8),%R9 |
(451) 0x42a9a0 JGE 42a976 |
(451) 0x42a9a2 MOV (%R15,%R9,8),%R10 |
(451) 0x42a9a6 VMOVSD (%R13,%R10,8),%XMM2 |
(451) 0x42a9ad VUCOMISD %XMM2,%XMM0 |
(451) 0x42a9b1 JAE 42a998 |
(451) 0x42a9b3 VUCOMISD %XMM2,%XMM1 |
(451) 0x42a9b7 JA 42a990 |
(451) 0x42a9b9 VUCOMISD %XMM1,%XMM2 |
(451) 0x42a9bd MOV %R8,%R10 |
(451) 0x42a9c0 JA 42a990 |
(451) 0x42a9c2 JMP 42a998 |
0x42a9c4 NOPW %CS:(%RAX,%RAX,1) |
(450) 0x42a9d0 MOV -0x38(%RBP),%RCX |
(450) 0x42a9d4 LEA (%RCX,%R11,8),%R11 |
(450) 0x42a9d8 MOVQ $0,(%R11) |
(450) 0x42a9df INC %R9 |
(450) 0x42a9e2 MOV %RDX,%R11 |
(450) 0x42a9e5 CMP 0x8(%R14,%R8,8),%R9 |
(450) 0x42a9ea JGE 42a940 |
(450) 0x42a9f0 MOV %R11,%RDX |
(450) 0x42a9f3 MOV (%R11,%R9,8),%R11 |
(450) 0x42a9f7 LEA (%R11,%RBX,1),%RCX |
(450) 0x42a9fb VMOVSD (%R13,%RCX,8),%XMM2 |
(450) 0x42aa02 VUCOMISD %XMM2,%XMM0 |
(450) 0x42aa06 JAE 42a9df |
(450) 0x42aa08 VUCOMISD %XMM2,%XMM1 |
(450) 0x42aa0c JA 42a9d0 |
(450) 0x42aa0e VUCOMISD %XMM1,%XMM2 |
(450) 0x42aa12 MOV %R10,%R11 |
(450) 0x42aa15 JA 42a9d8 |
(450) 0x42aa17 JMP 42a9df |
0x42aa19 CMPQ $0x7,-0x58(%RBP) |
0x42aa1e JAE 42aa3b |
0x42aa20 MOV -0x3c(%RBP),%ESI |
0x42aa23 MOV $0x5d44f0,%EDI |
0x42aa28 ADD $0x58,%RSP |
0x42aa2c POP %RBX |
0x42aa2d POP %R12 |
0x42aa2f POP %R13 |
0x42aa31 POP %R14 |
0x42aa33 POP %R15 |
0x42aa35 POP %RBP |
0x42aa36 JMP 410170 |
0x42aa3b VMOVSD 0x1725cd(%RIP),%XMM0 |
0x42aa43 JMP 42aa5a |
0x42aa45 NOPW %CS:(%RAX,%RAX,1) |
(432) 0x42aa50 ADD $0x8,%RAX |
(432) 0x42aa54 CMP -0x48(%RBP),%RDX |
(432) 0x42aa58 JE 42aa20 |
(432) 0x42aa5a MOV (%R10,%RAX,8),%RDX |
(432) 0x42aa5e MOV -0x38(%RBP),%R9 |
(432) 0x42aa62 VMOVSD (%R13,%RDX,8),%XMM1 |
(432) 0x42aa69 VUCOMISD %XMM1,%XMM0 |
(432) 0x42aa6d JAE 42ab20 |
(432) 0x42aa73 MOV (%R12,%RDX,8),%RSI |
(432) 0x42aa77 MOV -0x30(%RBP),%RCX |
(432) 0x42aa7b CMP 0x8(%R12,%RDX,8),%RSI |
(432) 0x42aa80 JL 42aab2 |
(432) 0x42aa82 MOV (%R14,%RDX,8),%RSI |
(432) 0x42aa86 CMP 0x8(%R14,%RDX,8),%RSI |
(432) 0x42aa8b JGE 42ab20 |
(432) 0x42aa91 MOV -0x30(%RBP),%RCX |
(432) 0x42aa95 LEA (%RCX,%RDX,8),%RDI |
(432) 0x42aa99 JMP 42aaf5 |
0x42aa9b NOPL (%RAX,%RAX,1) |
(448) 0x42aaa0 MOVQ $0,(%RCX,%RDI,8) |
(448) 0x42aaa8 INC %RSI |
(448) 0x42aaab CMP 0x8(%R12,%RDX,8),%RSI |
(448) 0x42aab0 JGE 42aa82 |
(448) 0x42aab2 MOV (%R15,%RSI,8),%RDI |
(448) 0x42aab6 VMOVSD (%R13,%RDI,8),%XMM2 |
(448) 0x42aabd VUCOMISD %XMM2,%XMM0 |
(448) 0x42aac1 JAE 42aaa8 |
(448) 0x42aac3 VUCOMISD %XMM2,%XMM1 |
(448) 0x42aac7 JA 42aaa0 |
(448) 0x42aac9 VUCOMISD %XMM1,%XMM2 |
(448) 0x42aacd MOV %RDX,%RDI |
(448) 0x42aad0 JA 42aaa0 |
(448) 0x42aad2 JMP 42aaa8 |
0x42aad4 NOPW %CS:(%RAX,%RAX,1) |
(447) 0x42aae0 LEA (%R9,%R8,8),%R8 |
(447) 0x42aae4 MOVQ $0,(%R8) |
(447) 0x42aaeb INC %RSI |
(447) 0x42aaee CMP 0x8(%R14,%RDX,8),%RSI |
(447) 0x42aaf3 JGE 42ab20 |
(447) 0x42aaf5 MOV (%R11,%RSI,8),%R8 |
(447) 0x42aaf9 LEA (%R8,%RBX,1),%RCX |
(447) 0x42aafd VMOVSD (%R13,%RCX,8),%XMM2 |
(447) 0x42ab04 VUCOMISD %XMM2,%XMM0 |
(447) 0x42ab08 JAE 42aaeb |
(447) 0x42ab0a VUCOMISD %XMM2,%XMM1 |
(447) 0x42ab0e JA 42aae0 |
(447) 0x42ab10 VUCOMISD %XMM1,%XMM2 |
(447) 0x42ab14 MOV %RDI,%R8 |
(447) 0x42ab17 JA 42aae4 |
(447) 0x42ab19 JMP 42aaeb |
0x42ab1b NOPL (%RAX,%RAX,1) |
(432) 0x42ab20 MOV 0x8(%R10,%RAX,8),%RDX |
(432) 0x42ab25 VMOVSD (%R13,%RDX,8),%XMM1 |
(432) 0x42ab2c VUCOMISD %XMM1,%XMM0 |
(432) 0x42ab30 JAE 42abe0 |
(432) 0x42ab36 MOV (%R12,%RDX,8),%RSI |
(432) 0x42ab3a MOV -0x30(%RBP),%RCX |
(432) 0x42ab3e CMP 0x8(%R12,%RDX,8),%RSI |
(432) 0x42ab43 JL 42ab72 |
(432) 0x42ab45 MOV (%R14,%RDX,8),%RSI |
(432) 0x42ab49 CMP 0x8(%R14,%RDX,8),%RSI |
(432) 0x42ab4e JGE 42abe0 |
(432) 0x42ab54 MOV -0x30(%RBP),%RCX |
(432) 0x42ab58 LEA (%RCX,%RDX,8),%RDI |
(432) 0x42ab5c JMP 42abb5 |
0x42ab5e XCHG %AX,%AX |
(446) 0x42ab60 MOVQ $0,(%RCX,%RDI,8) |
(446) 0x42ab68 INC %RSI |
(446) 0x42ab6b CMP 0x8(%R12,%RDX,8),%RSI |
(446) 0x42ab70 JGE 42ab45 |
(446) 0x42ab72 MOV (%R15,%RSI,8),%RDI |
(446) 0x42ab76 VMOVSD (%R13,%RDI,8),%XMM2 |
(446) 0x42ab7d VUCOMISD %XMM2,%XMM0 |
(446) 0x42ab81 JAE 42ab68 |
(446) 0x42ab83 VUCOMISD %XMM2,%XMM1 |
(446) 0x42ab87 JA 42ab60 |
(446) 0x42ab89 VUCOMISD %XMM1,%XMM2 |
(446) 0x42ab8d MOV %RDX,%RDI |
(446) 0x42ab90 JA 42ab60 |
(446) 0x42ab92 JMP 42ab68 |
0x42ab94 NOPW %CS:(%RAX,%RAX,1) |
(445) 0x42aba0 LEA (%R9,%R8,8),%R8 |
(445) 0x42aba4 MOVQ $0,(%R8) |
(445) 0x42abab INC %RSI |
(445) 0x42abae CMP 0x8(%R14,%RDX,8),%RSI |
(445) 0x42abb3 JGE 42abe0 |
(445) 0x42abb5 MOV (%R11,%RSI,8),%R8 |
(445) 0x42abb9 LEA (%R8,%RBX,1),%RCX |
(445) 0x42abbd VMOVSD (%R13,%RCX,8),%XMM2 |
(445) 0x42abc4 VUCOMISD %XMM2,%XMM0 |
(445) 0x42abc8 JAE 42abab |
(445) 0x42abca VUCOMISD %XMM2,%XMM1 |
(445) 0x42abce JA 42aba0 |
(445) 0x42abd0 VUCOMISD %XMM1,%XMM2 |
(445) 0x42abd4 MOV %RDI,%R8 |
(445) 0x42abd7 JA 42aba4 |
(445) 0x42abd9 JMP 42abab |
0x42abdb NOPL (%RAX,%RAX,1) |
(432) 0x42abe0 MOV 0x10(%R10,%RAX,8),%RDX |
(432) 0x42abe5 VMOVSD (%R13,%RDX,8),%XMM1 |
(432) 0x42abec VUCOMISD %XMM1,%XMM0 |
(432) 0x42abf0 JAE 42aca0 |
(432) 0x42abf6 MOV (%R12,%RDX,8),%RSI |
(432) 0x42abfa MOV -0x30(%RBP),%RCX |
(432) 0x42abfe CMP 0x8(%R12,%RDX,8),%RSI |
(432) 0x42ac03 JL 42ac32 |
(432) 0x42ac05 MOV (%R14,%RDX,8),%RSI |
(432) 0x42ac09 CMP 0x8(%R14,%RDX,8),%RSI |
(432) 0x42ac0e JGE 42aca0 |
(432) 0x42ac14 MOV -0x30(%RBP),%RCX |
(432) 0x42ac18 LEA (%RCX,%RDX,8),%RDI |
(432) 0x42ac1c JMP 42ac75 |
0x42ac1e XCHG %AX,%AX |
(444) 0x42ac20 MOVQ $0,(%RCX,%RDI,8) |
(444) 0x42ac28 INC %RSI |
(444) 0x42ac2b CMP 0x8(%R12,%RDX,8),%RSI |
(444) 0x42ac30 JGE 42ac05 |
(444) 0x42ac32 MOV (%R15,%RSI,8),%RDI |
(444) 0x42ac36 VMOVSD (%R13,%RDI,8),%XMM2 |
(444) 0x42ac3d VUCOMISD %XMM2,%XMM0 |
(444) 0x42ac41 JAE 42ac28 |
(444) 0x42ac43 VUCOMISD %XMM2,%XMM1 |
(444) 0x42ac47 JA 42ac20 |
(444) 0x42ac49 VUCOMISD %XMM1,%XMM2 |
(444) 0x42ac4d MOV %RDX,%RDI |
(444) 0x42ac50 JA 42ac20 |
(444) 0x42ac52 JMP 42ac28 |
0x42ac54 NOPW %CS:(%RAX,%RAX,1) |
(443) 0x42ac60 LEA (%R9,%R8,8),%R8 |
(443) 0x42ac64 MOVQ $0,(%R8) |
(443) 0x42ac6b INC %RSI |
(443) 0x42ac6e CMP 0x8(%R14,%RDX,8),%RSI |
(443) 0x42ac73 JGE 42aca0 |
(443) 0x42ac75 MOV (%R11,%RSI,8),%R8 |
(443) 0x42ac79 LEA (%R8,%RBX,1),%RCX |
(443) 0x42ac7d VMOVSD (%R13,%RCX,8),%XMM2 |
(443) 0x42ac84 VUCOMISD %XMM2,%XMM0 |
(443) 0x42ac88 JAE 42ac6b |
(443) 0x42ac8a VUCOMISD %XMM2,%XMM1 |
(443) 0x42ac8e JA 42ac60 |
(443) 0x42ac90 VUCOMISD %XMM1,%XMM2 |
(443) 0x42ac94 MOV %RDI,%R8 |
(443) 0x42ac97 JA 42ac64 |
(443) 0x42ac99 JMP 42ac6b |
0x42ac9b NOPL (%RAX,%RAX,1) |
(432) 0x42aca0 MOV 0x18(%R10,%RAX,8),%RDX |
(432) 0x42aca5 VMOVSD (%R13,%RDX,8),%XMM1 |
(432) 0x42acac VUCOMISD %XMM1,%XMM0 |
(432) 0x42acb0 JAE 42ad60 |
(432) 0x42acb6 MOV (%R12,%RDX,8),%RSI |
(432) 0x42acba MOV -0x30(%RBP),%RCX |
(432) 0x42acbe CMP 0x8(%R12,%RDX,8),%RSI |
(432) 0x42acc3 JL 42acf2 |
(432) 0x42acc5 MOV (%R14,%RDX,8),%RSI |
(432) 0x42acc9 CMP 0x8(%R14,%RDX,8),%RSI |
(432) 0x42acce JGE 42ad60 |
(432) 0x42acd4 MOV -0x30(%RBP),%RCX |
(432) 0x42acd8 LEA (%RCX,%RDX,8),%RDI |
(432) 0x42acdc JMP 42ad35 |
0x42acde XCHG %AX,%AX |
(442) 0x42ace0 MOVQ $0,(%RCX,%RDI,8) |
(442) 0x42ace8 INC %RSI |
(442) 0x42aceb CMP 0x8(%R12,%RDX,8),%RSI |
(442) 0x42acf0 JGE 42acc5 |
(442) 0x42acf2 MOV (%R15,%RSI,8),%RDI |
(442) 0x42acf6 VMOVSD (%R13,%RDI,8),%XMM2 |
(442) 0x42acfd VUCOMISD %XMM2,%XMM0 |
(442) 0x42ad01 JAE 42ace8 |
(442) 0x42ad03 VUCOMISD %XMM2,%XMM1 |
(442) 0x42ad07 JA 42ace0 |
(442) 0x42ad09 VUCOMISD %XMM1,%XMM2 |
(442) 0x42ad0d MOV %RDX,%RDI |
(442) 0x42ad10 JA 42ace0 |
(442) 0x42ad12 JMP 42ace8 |
0x42ad14 NOPW %CS:(%RAX,%RAX,1) |
(441) 0x42ad20 LEA (%R9,%R8,8),%R8 |
(441) 0x42ad24 MOVQ $0,(%R8) |
(441) 0x42ad2b INC %RSI |
(441) 0x42ad2e CMP 0x8(%R14,%RDX,8),%RSI |
(441) 0x42ad33 JGE 42ad60 |
(441) 0x42ad35 MOV (%R11,%RSI,8),%R8 |
(441) 0x42ad39 LEA (%R8,%RBX,1),%RCX |
(441) 0x42ad3d VMOVSD (%R13,%RCX,8),%XMM2 |
(441) 0x42ad44 VUCOMISD %XMM2,%XMM0 |
(441) 0x42ad48 JAE 42ad2b |
(441) 0x42ad4a VUCOMISD %XMM2,%XMM1 |
(441) 0x42ad4e JA 42ad20 |
(441) 0x42ad50 VUCOMISD %XMM1,%XMM2 |
(441) 0x42ad54 MOV %RDI,%R8 |
(441) 0x42ad57 JA 42ad24 |
(441) 0x42ad59 JMP 42ad2b |
0x42ad5b NOPL (%RAX,%RAX,1) |
(432) 0x42ad60 MOV 0x20(%R10,%RAX,8),%RDX |
(432) 0x42ad65 VMOVSD (%R13,%RDX,8),%XMM1 |
(432) 0x42ad6c VUCOMISD %XMM1,%XMM0 |
(432) 0x42ad70 JAE 42ae20 |
(432) 0x42ad76 MOV (%R12,%RDX,8),%RSI |
(432) 0x42ad7a MOV -0x30(%RBP),%RCX |
(432) 0x42ad7e CMP 0x8(%R12,%RDX,8),%RSI |
(432) 0x42ad83 JL 42adb2 |
(432) 0x42ad85 MOV (%R14,%RDX,8),%RSI |
(432) 0x42ad89 CMP 0x8(%R14,%RDX,8),%RSI |
(432) 0x42ad8e JGE 42ae20 |
(432) 0x42ad94 MOV -0x30(%RBP),%RCX |
(432) 0x42ad98 LEA (%RCX,%RDX,8),%RDI |
(432) 0x42ad9c JMP 42adf5 |
0x42ad9e XCHG %AX,%AX |
(440) 0x42ada0 MOVQ $0,(%RCX,%RDI,8) |
(440) 0x42ada8 INC %RSI |
(440) 0x42adab CMP 0x8(%R12,%RDX,8),%RSI |
(440) 0x42adb0 JGE 42ad85 |
(440) 0x42adb2 MOV (%R15,%RSI,8),%RDI |
(440) 0x42adb6 VMOVSD (%R13,%RDI,8),%XMM2 |
(440) 0x42adbd VUCOMISD %XMM2,%XMM0 |
(440) 0x42adc1 JAE 42ada8 |
(440) 0x42adc3 VUCOMISD %XMM2,%XMM1 |
(440) 0x42adc7 JA 42ada0 |
(440) 0x42adc9 VUCOMISD %XMM1,%XMM2 |
(440) 0x42adcd MOV %RDX,%RDI |
(440) 0x42add0 JA 42ada0 |
(440) 0x42add2 JMP 42ada8 |
0x42add4 NOPW %CS:(%RAX,%RAX,1) |
(439) 0x42ade0 LEA (%R9,%R8,8),%R8 |
(439) 0x42ade4 MOVQ $0,(%R8) |
(439) 0x42adeb INC %RSI |
(439) 0x42adee CMP 0x8(%R14,%RDX,8),%RSI |
(439) 0x42adf3 JGE 42ae20 |
(439) 0x42adf5 MOV (%R11,%RSI,8),%R8 |
(439) 0x42adf9 LEA (%R8,%RBX,1),%RCX |
(439) 0x42adfd VMOVSD (%R13,%RCX,8),%XMM2 |
(439) 0x42ae04 VUCOMISD %XMM2,%XMM0 |
(439) 0x42ae08 JAE 42adeb |
(439) 0x42ae0a VUCOMISD %XMM2,%XMM1 |
(439) 0x42ae0e JA 42ade0 |
(439) 0x42ae10 VUCOMISD %XMM1,%XMM2 |
(439) 0x42ae14 MOV %RDI,%R8 |
(439) 0x42ae17 JA 42ade4 |
(439) 0x42ae19 JMP 42adeb |
0x42ae1b NOPL (%RAX,%RAX,1) |
(432) 0x42ae20 MOV 0x28(%R10,%RAX,8),%RDX |
(432) 0x42ae25 VMOVSD (%R13,%RDX,8),%XMM1 |
(432) 0x42ae2c VUCOMISD %XMM1,%XMM0 |
(432) 0x42ae30 JAE 42aee0 |
(432) 0x42ae36 MOV (%R12,%RDX,8),%RSI |
(432) 0x42ae3a MOV -0x30(%RBP),%RCX |
(432) 0x42ae3e CMP 0x8(%R12,%RDX,8),%RSI |
(432) 0x42ae43 JL 42ae72 |
(432) 0x42ae45 MOV (%R14,%RDX,8),%RSI |
(432) 0x42ae49 CMP 0x8(%R14,%RDX,8),%RSI |
(432) 0x42ae4e JGE 42aee0 |
(432) 0x42ae54 MOV -0x30(%RBP),%RCX |
(432) 0x42ae58 LEA (%RCX,%RDX,8),%RDI |
(432) 0x42ae5c JMP 42aeb5 |
0x42ae5e XCHG %AX,%AX |
(438) 0x42ae60 MOVQ $0,(%RCX,%RDI,8) |
(438) 0x42ae68 INC %RSI |
(438) 0x42ae6b CMP 0x8(%R12,%RDX,8),%RSI |
(438) 0x42ae70 JGE 42ae45 |
(438) 0x42ae72 MOV (%R15,%RSI,8),%RDI |
(438) 0x42ae76 VMOVSD (%R13,%RDI,8),%XMM2 |
(438) 0x42ae7d VUCOMISD %XMM2,%XMM0 |
(438) 0x42ae81 JAE 42ae68 |
(438) 0x42ae83 VUCOMISD %XMM2,%XMM1 |
(438) 0x42ae87 JA 42ae60 |
(438) 0x42ae89 VUCOMISD %XMM1,%XMM2 |
(438) 0x42ae8d MOV %RDX,%RDI |
(438) 0x42ae90 JA 42ae60 |
(438) 0x42ae92 JMP 42ae68 |
0x42ae94 NOPW %CS:(%RAX,%RAX,1) |
(437) 0x42aea0 LEA (%R9,%R8,8),%R8 |
(437) 0x42aea4 MOVQ $0,(%R8) |
(437) 0x42aeab INC %RSI |
(437) 0x42aeae CMP 0x8(%R14,%RDX,8),%RSI |
(437) 0x42aeb3 JGE 42aee0 |
(437) 0x42aeb5 MOV (%R11,%RSI,8),%R8 |
(437) 0x42aeb9 LEA (%R8,%RBX,1),%RCX |
(437) 0x42aebd VMOVSD (%R13,%RCX,8),%XMM2 |
(437) 0x42aec4 VUCOMISD %XMM2,%XMM0 |
(437) 0x42aec8 JAE 42aeab |
(437) 0x42aeca VUCOMISD %XMM2,%XMM1 |
(437) 0x42aece JA 42aea0 |
(437) 0x42aed0 VUCOMISD %XMM1,%XMM2 |
(437) 0x42aed4 MOV %RDI,%R8 |
(437) 0x42aed7 JA 42aea4 |
(437) 0x42aed9 JMP 42aeab |
0x42aedb NOPL (%RAX,%RAX,1) |
(432) 0x42aee0 MOV 0x30(%R10,%RAX,8),%RDX |
(432) 0x42aee5 VMOVSD (%R13,%RDX,8),%XMM1 |
(432) 0x42aeec VUCOMISD %XMM1,%XMM0 |
(432) 0x42aef0 JAE 42afa0 |
(432) 0x42aef6 MOV (%R12,%RDX,8),%RSI |
(432) 0x42aefa MOV -0x30(%RBP),%RCX |
(432) 0x42aefe CMP 0x8(%R12,%RDX,8),%RSI |
(432) 0x42af03 JL 42af32 |
(432) 0x42af05 MOV (%R14,%RDX,8),%RSI |
(432) 0x42af09 CMP 0x8(%R14,%RDX,8),%RSI |
(432) 0x42af0e JGE 42afa0 |
(432) 0x42af14 MOV -0x30(%RBP),%RCX |
(432) 0x42af18 LEA (%RCX,%RDX,8),%RDI |
(432) 0x42af1c JMP 42af75 |
0x42af1e XCHG %AX,%AX |
(436) 0x42af20 MOVQ $0,(%RCX,%RDI,8) |
(436) 0x42af28 INC %RSI |
(436) 0x42af2b CMP 0x8(%R12,%RDX,8),%RSI |
(436) 0x42af30 JGE 42af05 |
(436) 0x42af32 MOV (%R15,%RSI,8),%RDI |
(436) 0x42af36 VMOVSD (%R13,%RDI,8),%XMM2 |
(436) 0x42af3d VUCOMISD %XMM2,%XMM0 |
(436) 0x42af41 JAE 42af28 |
(436) 0x42af43 VUCOMISD %XMM2,%XMM1 |
(436) 0x42af47 JA 42af20 |
(436) 0x42af49 VUCOMISD %XMM1,%XMM2 |
(436) 0x42af4d MOV %RDX,%RDI |
(436) 0x42af50 JA 42af20 |
(436) 0x42af52 JMP 42af28 |
0x42af54 NOPW %CS:(%RAX,%RAX,1) |
(435) 0x42af60 LEA (%R9,%R8,8),%R8 |
(435) 0x42af64 MOVQ $0,(%R8) |
(435) 0x42af6b INC %RSI |
(435) 0x42af6e CMP 0x8(%R14,%RDX,8),%RSI |
(435) 0x42af73 JGE 42afa0 |
(435) 0x42af75 MOV (%R11,%RSI,8),%R8 |
(435) 0x42af79 LEA (%R8,%RBX,1),%RCX |
(435) 0x42af7d VMOVSD (%R13,%RCX,8),%XMM2 |
(435) 0x42af84 VUCOMISD %XMM2,%XMM0 |
(435) 0x42af88 JAE 42af6b |
(435) 0x42af8a VUCOMISD %XMM2,%XMM1 |
(435) 0x42af8e JA 42af60 |
(435) 0x42af90 VUCOMISD %XMM1,%XMM2 |
(435) 0x42af94 MOV %RDI,%R8 |
(435) 0x42af97 JA 42af64 |
(435) 0x42af99 JMP 42af6b |
0x42af9b NOPL (%RAX,%RAX,1) |
(432) 0x42afa0 MOV 0x38(%R10,%RAX,8),%RSI |
(432) 0x42afa5 LEA 0x7(%RAX),%RDX |
(432) 0x42afa9 VMOVSD (%R13,%RSI,8),%XMM1 |
(432) 0x42afb0 VUCOMISD %XMM1,%XMM0 |
(432) 0x42afb4 JAE 42aa50 |
(432) 0x42afba MOV (%R12,%RSI,8),%RDI |
(432) 0x42afbe MOV -0x30(%RBP),%RCX |
(432) 0x42afc2 CMP 0x8(%R12,%RSI,8),%RDI |
(432) 0x42afc7 JL 42b002 |
(432) 0x42afc9 MOV (%R14,%RSI,8),%RDI |
(432) 0x42afcd CMP 0x8(%R14,%RSI,8),%RDI |
(432) 0x42afd2 JGE 42aa50 |
(432) 0x42afd8 MOV -0x30(%RBP),%RCX |
(432) 0x42afdc LEA (%RCX,%RSI,8),%R8 |
(432) 0x42afe0 JMP 42b04d |
0x42afe2 NOPW %CS:(%RAX,%RAX,1) |
(434) 0x42aff0 MOVQ $0,(%RCX,%R8,8) |
(434) 0x42aff8 INC %RDI |
(434) 0x42affb CMP 0x8(%R12,%RSI,8),%RDI |
(434) 0x42b000 JGE 42afc9 |
(434) 0x42b002 MOV (%R15,%RDI,8),%R8 |
(434) 0x42b006 VMOVSD (%R13,%R8,8),%XMM2 |
(434) 0x42b00d VUCOMISD %XMM2,%XMM0 |
(434) 0x42b011 JAE 42aff8 |
(434) 0x42b013 VUCOMISD %XMM2,%XMM1 |
(434) 0x42b017 JA 42aff0 |
(434) 0x42b019 VUCOMISD %XMM1,%XMM2 |
(434) 0x42b01d MOV %RSI,%R8 |
(434) 0x42b020 JA 42aff0 |
(434) 0x42b022 JMP 42aff8 |
0x42b024 NOPW %CS:(%RAX,%RAX,1) |
(433) 0x42b030 MOV -0x38(%RBP),%RCX |
(433) 0x42b034 LEA (%RCX,%R9,8),%R9 |
(433) 0x42b038 MOVQ $0,(%R9) |
(433) 0x42b03f INC %RDI |
(433) 0x42b042 CMP 0x8(%R14,%RSI,8),%RDI |
(433) 0x42b047 JGE 42aa50 |
(433) 0x42b04d MOV (%R11,%RDI,8),%R9 |
(433) 0x42b051 LEA (%R9,%RBX,1),%RCX |
(433) 0x42b055 VMOVSD (%R13,%RCX,8),%XMM2 |
(433) 0x42b05c VUCOMISD %XMM2,%XMM0 |
(433) 0x42b060 JAE 42b03f |
(433) 0x42b062 VUCOMISD %XMM2,%XMM1 |
(433) 0x42b066 JA 42b030 |
(433) 0x42b068 VUCOMISD %XMM1,%XMM2 |
(433) 0x42b06c MOV %R8,%R9 |
(433) 0x42b06f JA 42b038 |
(433) 0x42b071 JMP 42b03f |
0x42b073 NOPW %CS:(%RAX,%RAX,1) |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►98.11+ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so | |
○1.89 | __kmp_invoke_microtask | libiomp5.so |
Path / |
Source file and lines | par_coarsen.c:2354-2381 |
Module | exec |
nb instructions | 96 |
nb uops | 69 |
loop length | 455 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 1 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 17 |
micro-operation queue | 11.50 cycles |
front end | 11.50 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 5.00 | 5.00 | 4.75 | 4.75 | 3.50 | 9.00 | 9.00 | 9.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
cycles | 5.00 | 5.00 | 4.75 | 4.75 | 3.50 | 9.00 | 9.00 | 9.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 11.50 |
Dispatch | 9.00 |
Overall L1 | 11.50 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 0% |
all | 0% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 10% |
load | 11% |
store | 10% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 8% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 12% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 10% |
load | 11% |
store | 10% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 8% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 11% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput | Vectorization |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
SUB $0x58,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %R9,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %R8,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %RCX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %RDX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV 0x30(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RAX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV 0x28(%RBP),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
MOV %RAX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV 0x18(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RAX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV 0x10(%RBP),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
MOVL $0,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (6.3%) |
MOVQ $0,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOVQ $0x1,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x78(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x40(%RBP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x50(%RBP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA 0x40(%RBP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV $0x5d44d0,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %ESI,-0x3c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
CALL 410420 <__kmpc_for_static_init_8@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
MOV -0x60(%RBP),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
MOV -0x68(%RBP),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV 0x40(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RCX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
SUB %RAX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JB 42aa20 <hypre_BoomerAMGCoarsenPMIS.extracted.15+0x1b0> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV %RCX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV -0x48(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
SUB %EAX,%ECX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
INC %ECX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
AND $0x7,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
MOV %RCX,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
JE 42aa19 <hypre_BoomerAMGCoarsenPMIS.extracted.15+0x1a9> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
VMOVSD 0x1726db(%RIP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (12.5%) |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | N/A |
JMP 42a953 <hypre_BoomerAMGCoarsenPMIS.extracted.15+0xe3> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
CMPQ $0x7,-0x58(%RBP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (12.5%) |
JAE 42aa3b <hypre_BoomerAMGCoarsenPMIS.extracted.15+0x1cb> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV -0x3c(%RBP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (6.3%) |
MOV $0x5d44f0,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
ADD $0x58,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
JMP 410170 <__kmpc_for_static_fini@plt> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
VMOVSD 0x1725cd(%RIP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (12.5%) |
JMP 42aa5a <hypre_BoomerAMGCoarsenPMIS.extracted.15+0x1ea> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
Source file and lines | par_coarsen.c:2354-2381 |
Module | exec |
nb instructions | 96 |
nb uops | 69 |
loop length | 455 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 1 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 17 |
micro-operation queue | 11.50 cycles |
front end | 11.50 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 5.00 | 5.00 | 4.75 | 4.75 | 3.50 | 9.00 | 9.00 | 9.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
cycles | 5.00 | 5.00 | 4.75 | 4.75 | 3.50 | 9.00 | 9.00 | 9.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 11.50 |
Dispatch | 9.00 |
Overall L1 | 11.50 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 0% |
all | 0% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 10% |
load | 11% |
store | 10% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 8% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 12% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 10% |
load | 11% |
store | 10% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 8% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 11% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput | Vectorization |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
SUB $0x58,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %R9,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %R8,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %RCX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %RDX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV 0x30(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RAX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV 0x28(%RBP),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
MOV %RAX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV 0x18(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RAX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV 0x10(%RBP),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
MOVL $0,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (6.3%) |
MOVQ $0,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOVQ $0x1,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x78(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x40(%RBP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x50(%RBP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA 0x40(%RBP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV $0x5d44d0,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %ESI,-0x3c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
CALL 410420 <__kmpc_for_static_init_8@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
MOV -0x60(%RBP),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
MOV -0x68(%RBP),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV 0x40(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RCX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
SUB %RAX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JB 42aa20 <hypre_BoomerAMGCoarsenPMIS.extracted.15+0x1b0> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV %RCX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV -0x48(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
SUB %EAX,%ECX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
INC %ECX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
AND $0x7,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
MOV %RCX,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
JE 42aa19 <hypre_BoomerAMGCoarsenPMIS.extracted.15+0x1a9> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
VMOVSD 0x1726db(%RIP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (12.5%) |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | N/A |
JMP 42a953 <hypre_BoomerAMGCoarsenPMIS.extracted.15+0xe3> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
CMPQ $0x7,-0x58(%RBP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (12.5%) |
JAE 42aa3b <hypre_BoomerAMGCoarsenPMIS.extracted.15+0x1cb> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV -0x3c(%RBP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (6.3%) |
MOV $0x5d44f0,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
ADD $0x58,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
JMP 410170 <__kmpc_for_static_fini@plt> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
VMOVSD 0x1725cd(%RIP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (12.5%) |
JMP 42aa5a <hypre_BoomerAMGCoarsenPMIS.extracted.15+0x1ea> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_BoomerAMGCoarsenPMIS.extracted.15– | 0.94 | 0.70 |
▼Loop 432 - par_coarsen.c:2354-2381 - exec– | 0.07 | 0.05 |
○Loop 434 - par_coarsen.c:2361-2381 - exec | 0.11 | 0.08 |
○Loop 446 - par_coarsen.c:2361-2381 - exec | 0.11 | 0.08 |
○Loop 438 - par_coarsen.c:2361-2381 - exec | 0.11 | 0.08 |
○Loop 436 - par_coarsen.c:2361-2381 - exec | 0.11 | 0.08 |
○Loop 448 - par_coarsen.c:2361-2381 - exec | 0.11 | 0.08 |
○Loop 442 - par_coarsen.c:2361-2381 - exec | 0.11 | 0.07 |
○Loop 444 - par_coarsen.c:2361-2381 - exec | 0.11 | 0.07 |
○Loop 440 - par_coarsen.c:2361-2381 - exec | 0.11 | 0.07 |
○Loop 435 - par_coarsen.c:2372-2380 - exec | 0.00 | 0.00 |
○Loop 441 - par_coarsen.c:2372-2380 - exec | 0.00 | 0.00 |
○Loop 445 - par_coarsen.c:2372-2380 - exec | 0.00 | 0.00 |
○Loop 447 - par_coarsen.c:2372-2380 - exec | 0.00 | 0.00 |
○Loop 443 - par_coarsen.c:2372-2380 - exec | 0.00 | 0.00 |
○Loop 439 - par_coarsen.c:2372-2380 - exec | 0.00 | 0.00 |
○Loop 437 - par_coarsen.c:2372-2380 - exec | 0.00 | 0.00 |
○Loop 433 - par_coarsen.c:2368-2380 - exec | 0.00 | 0.00 |
▼Loop 449 - par_coarsen.c:2354-2381 - exec– | 0.00 | 0.00 |
○Loop 451 - par_coarsen.c:2361-2381 - exec | 0.00 | 0.00 |
○Loop 450 - par_coarsen.c:2368-2380 - exec | 0.00 | 0.00 |