Function: hypre_qsort2abs.A | Module: libparcsr_ls.so | Source: par_interp.c:3180-3192 | Coverage: 0.02% |
---|
Function: hypre_qsort2abs.A | Module: libparcsr_ls.so | Source: par_interp.c:3180-3192 | Coverage: 0.02% |
---|
/home/eoseret/qaas_runs_CPU_9468/172-019-1763/intel/AMG/build/AMG/AMG/parcsr_ls/par_interp.c: 3180 - 3192 |
-------------------------------------------------------------------------------- |
3180: if (left >= right) |
3181: return; |
3182: hypre_swap2( v, w, left, (left+right)/2); |
3183: last = left; |
3184: for (i = left+1; i <= right; i++) |
3185: if (fabs(w[i]) > fabs(w[left])) |
3186: { |
3187: hypre_swap2(v, w, ++last, i); |
3188: } |
3189: hypre_swap2(v, w, left, last); |
3190: hypre_qsort2abs(v, w, left, last-1); |
3191: hypre_qsort2abs(v, w, last+1, right); |
3192: } |
0x520a0 CMP %RCX,%RDX |
0x520a3 JGE 52478 |
0x520a9 PUSH %RBP |
0x520aa MOV %RSP,%RBP |
0x520ad PUSH %R15 |
0x520af PUSH %R14 |
0x520b1 PUSH %R13 |
0x520b3 PUSH %R12 |
0x520b5 PUSH %RBX |
0x520b6 SUB $0x28,%RSP |
0x520ba MOV %RCX,%R15 |
0x520bd MOV %RDX,%R12 |
0x520c0 MOV %RSI,%R14 |
0x520c3 MOV %RDI,%RBX |
0x520c6 MOV %RDX,%R13 |
0x520c9 MOV %RCX,-0x38(%RBP) |
0x520cd MOV %RDI,-0x30(%RBP) |
0x520d1 JMP 5211a |
0x520d3 NOPW %CS:(%RAX,%RAX,1) |
(923) 0x520e0 MOV -0x38(%RBP),%R15 |
(923) 0x520e4 MOV -0x30(%RBP),%RBX |
(923) 0x520e8 MOV %RBX,%RDI |
(923) 0x520eb MOV %R14,%RSI |
(923) 0x520ee MOV %R12,%RDX |
(923) 0x520f1 MOV %R13,%RCX |
(923) 0x520f4 CALL 15470 <hypre_swap2@plt> |
(923) 0x520f9 LEA -0x1(%R13),%RCX |
(923) 0x520fd MOV %RBX,%RDI |
(923) 0x52100 MOV %R14,%RSI |
(923) 0x52103 MOV %R12,%RDX |
(923) 0x52106 CALL 163e0 <hypre_qsort2abs.A@plt> |
(923) 0x5210b INC %R13 |
(923) 0x5210e MOV %R13,%R12 |
(923) 0x52111 CMP %R15,%R13 |
(923) 0x52114 JGE 5246a |
(923) 0x5211a LEA (%R12,%R15,1),%RAX |
(923) 0x5211e MOV %RAX,%RCX |
(923) 0x52121 SHR $0x3f,%RCX |
(923) 0x52125 ADD %RAX,%RCX |
(923) 0x52128 SAR $0x1,%RCX |
(923) 0x5212b MOV %RBX,%RDI |
(923) 0x5212e MOV %R14,%RSI |
(923) 0x52131 MOV %R12,%RDX |
(923) 0x52134 CALL 15470 <hypre_swap2@plt> |
(923) 0x52139 LEA 0x1(%R12),%RAX |
(923) 0x5213e CMP %RAX,%R15 |
(923) 0x52141 CMOVG %R15,%RAX |
(923) 0x52145 MOV %RAX,-0x48(%RBP) |
(923) 0x52149 SUB %R12,%RAX |
(923) 0x5214c MOV %RAX,-0x40(%RBP) |
(923) 0x52150 CMP $0x8,%RAX |
(923) 0x52154 JAE 521d0 |
(923) 0x52156 MOV -0x40(%RBP),%RCX |
(923) 0x5215a MOV %RCX,%RAX |
(923) 0x5215d AND $-0x8,%RAX |
(923) 0x52161 CMP %RCX,%RAX |
(923) 0x52164 JAE 520e0 |
(923) 0x5216a LEA (%R12,%RAX,1),%RBX |
(923) 0x5216e INC %RBX |
(923) 0x52171 NEGQ -0x48(%RBP) |
(923) 0x52175 MOV -0x38(%RBP),%R15 |
(923) 0x52179 JMP 52197 |
0x5217b NOPL (%RAX,%RAX,1) |
(924) 0x52180 MOV -0x48(%RBP),%RAX |
(924) 0x52184 ADD %RBX,%RAX |
(924) 0x52187 INC %RAX |
(924) 0x5218a INC %RBX |
(924) 0x5218d CMP $0x1,%RAX |
(924) 0x52191 JE 520e4 |
(924) 0x52197 MOVSD (%R14,%RBX,8),%XMM0 |
(924) 0x5219d MOVAPD 0xe2f6b(%RIP),%XMM2 |
(924) 0x521a5 ANDPD %XMM2,%XMM0 |
(924) 0x521a9 MOVSD (%R14,%R12,8),%XMM1 |
(924) 0x521af ANDPD %XMM2,%XMM1 |
(924) 0x521b3 UCOMISD %XMM1,%XMM0 |
(924) 0x521b7 JBE 52180 |
(924) 0x521b9 INC %R13 |
(924) 0x521bc MOV -0x30(%RBP),%RDI |
(924) 0x521c0 MOV %R14,%RSI |
(924) 0x521c3 MOV %R13,%RDX |
(924) 0x521c6 MOV %RBX,%RCX |
(924) 0x521c9 CALL 15470 <hypre_swap2@plt> |
(924) 0x521ce JMP 52180 |
(923) 0x521d0 MOV -0x40(%RBP),%R15 |
(923) 0x521d4 SHR $0x3,%R15 |
(923) 0x521d8 LEA 0x8(%R12),%RBX |
(923) 0x521dd MOV %R12,%R13 |
(923) 0x521e0 JMP 521fd |
0x521e2 NOPW %CS:(%RAX,%RAX,1) |
(925) 0x521f0 ADD $0x8,%RBX |
(925) 0x521f4 DEC %R15 |
(925) 0x521f7 JE 52156 |
(925) 0x521fd MOVSD -0x38(%R14,%RBX,8),%XMM1 |
(925) 0x52204 MOVAPD 0xe2f04(%RIP),%XMM2 |
(925) 0x5220c ANDPD %XMM2,%XMM1 |
(925) 0x52210 MOVSD (%R14,%R12,8),%XMM0 |
(925) 0x52216 ANDPD %XMM2,%XMM0 |
(925) 0x5221a UCOMISD %XMM0,%XMM1 |
(925) 0x5221e JBE 52260 |
(925) 0x52220 LEA -0x7(%RBX),%RCX |
(925) 0x52224 INC %R13 |
(925) 0x52227 MOV -0x30(%RBP),%RDI |
(925) 0x5222b MOV %R14,%RSI |
(925) 0x5222e MOV %R13,%RDX |
(925) 0x52231 CALL 15470 <hypre_swap2@plt> |
(925) 0x52236 MOVSD (%R14,%R12,8),%XMM0 |
(925) 0x5223c MOVAPD 0xe2ecc(%RIP),%XMM2 |
(925) 0x52244 ANDPD %XMM2,%XMM0 |
(925) 0x52248 MOVSD -0x30(%R14,%RBX,8),%XMM1 |
(925) 0x5224f ANDPD %XMM2,%XMM1 |
(925) 0x52253 UCOMISD %XMM0,%XMM1 |
(925) 0x52257 JA 52279 |
(925) 0x52259 JMP 522a1 |
0x5225b NOPL (%RAX,%RAX,1) |
(925) 0x52260 MOVAPD 0xe2ea8(%RIP),%XMM2 |
(925) 0x52268 MOVSD -0x30(%R14,%RBX,8),%XMM1 |
(925) 0x5226f ANDPD %XMM2,%XMM1 |
(925) 0x52273 UCOMISD %XMM0,%XMM1 |
(925) 0x52277 JBE 522a1 |
(925) 0x52279 LEA -0x6(%RBX),%RCX |
(925) 0x5227d INC %R13 |
(925) 0x52280 MOV -0x30(%RBP),%RDI |
(925) 0x52284 MOV %R14,%RSI |
(925) 0x52287 MOV %R13,%RDX |
(925) 0x5228a CALL 15470 <hypre_swap2@plt> |
(925) 0x5228f MOVAPD 0xe2e79(%RIP),%XMM2 |
(925) 0x52297 MOVSD (%R14,%R12,8),%XMM0 |
(925) 0x5229d ANDPD %XMM2,%XMM0 |
(925) 0x522a1 MOVSD -0x28(%R14,%RBX,8),%XMM1 |
(925) 0x522a8 ANDPD %XMM2,%XMM1 |
(925) 0x522ac UCOMISD %XMM0,%XMM1 |
(925) 0x522b0 JA 52320 |
(925) 0x522b2 MOVSD -0x20(%R14,%RBX,8),%XMM1 |
(925) 0x522b9 ANDPD %XMM2,%XMM1 |
(925) 0x522bd UCOMISD %XMM0,%XMM1 |
(925) 0x522c1 JA 5235d |
(925) 0x522c7 MOVSD -0x18(%R14,%RBX,8),%XMM1 |
(925) 0x522ce ANDPD %XMM2,%XMM1 |
(925) 0x522d2 UCOMISD %XMM0,%XMM1 |
(925) 0x522d6 JA 5239a |
(925) 0x522dc MOVSD -0x10(%R14,%RBX,8),%XMM1 |
(925) 0x522e3 ANDPD %XMM2,%XMM1 |
(925) 0x522e7 UCOMISD %XMM0,%XMM1 |
(925) 0x522eb JA 523d7 |
(925) 0x522f1 MOVSD -0x8(%R14,%RBX,8),%XMM1 |
(925) 0x522f8 ANDPD %XMM2,%XMM1 |
(925) 0x522fc UCOMISD %XMM0,%XMM1 |
(925) 0x52300 JA 52414 |
(925) 0x52306 MOVSD (%R14,%RBX,8),%XMM1 |
(925) 0x5230c ANDPD %XMM2,%XMM1 |
(925) 0x52310 UCOMISD %XMM0,%XMM1 |
(925) 0x52314 JBE 521f0 |
(925) 0x5231a JMP 52450 |
0x5231f NOP |
(925) 0x52320 LEA -0x5(%RBX),%RCX |
(925) 0x52324 INC %R13 |
(925) 0x52327 MOV -0x30(%RBP),%RDI |
(925) 0x5232b MOV %R14,%RSI |
(925) 0x5232e MOV %R13,%RDX |
(925) 0x52331 CALL 15470 <hypre_swap2@plt> |
(925) 0x52336 MOVAPD 0xe2dd2(%RIP),%XMM2 |
(925) 0x5233e MOVSD (%R14,%R12,8),%XMM0 |
(925) 0x52344 ANDPD %XMM2,%XMM0 |
(925) 0x52348 MOVSD -0x20(%R14,%RBX,8),%XMM1 |
(925) 0x5234f ANDPD %XMM2,%XMM1 |
(925) 0x52353 UCOMISD %XMM0,%XMM1 |
(925) 0x52357 JBE 522c7 |
(925) 0x5235d LEA -0x4(%RBX),%RCX |
(925) 0x52361 INC %R13 |
(925) 0x52364 MOV -0x30(%RBP),%RDI |
(925) 0x52368 MOV %R14,%RSI |
(925) 0x5236b MOV %R13,%RDX |
(925) 0x5236e CALL 15470 <hypre_swap2@plt> |
(925) 0x52373 MOVAPD 0xe2d95(%RIP),%XMM2 |
(925) 0x5237b MOVSD (%R14,%R12,8),%XMM0 |
(925) 0x52381 ANDPD %XMM2,%XMM0 |
(925) 0x52385 MOVSD -0x18(%R14,%RBX,8),%XMM1 |
(925) 0x5238c ANDPD %XMM2,%XMM1 |
(925) 0x52390 UCOMISD %XMM0,%XMM1 |
(925) 0x52394 JBE 522dc |
(925) 0x5239a LEA -0x3(%RBX),%RCX |
(925) 0x5239e INC %R13 |
(925) 0x523a1 MOV -0x30(%RBP),%RDI |
(925) 0x523a5 MOV %R14,%RSI |
(925) 0x523a8 MOV %R13,%RDX |
(925) 0x523ab CALL 15470 <hypre_swap2@plt> |
(925) 0x523b0 MOVAPD 0xe2d58(%RIP),%XMM2 |
(925) 0x523b8 MOVSD (%R14,%R12,8),%XMM0 |
(925) 0x523be ANDPD %XMM2,%XMM0 |
(925) 0x523c2 MOVSD -0x10(%R14,%RBX,8),%XMM1 |
(925) 0x523c9 ANDPD %XMM2,%XMM1 |
(925) 0x523cd UCOMISD %XMM0,%XMM1 |
(925) 0x523d1 JBE 522f1 |
(925) 0x523d7 LEA -0x2(%RBX),%RCX |
(925) 0x523db INC %R13 |
(925) 0x523de MOV -0x30(%RBP),%RDI |
(925) 0x523e2 MOV %R14,%RSI |
(925) 0x523e5 MOV %R13,%RDX |
(925) 0x523e8 CALL 15470 <hypre_swap2@plt> |
(925) 0x523ed MOVAPD 0xe2d1b(%RIP),%XMM2 |
(925) 0x523f5 MOVSD (%R14,%R12,8),%XMM0 |
(925) 0x523fb ANDPD %XMM2,%XMM0 |
(925) 0x523ff MOVSD -0x8(%R14,%RBX,8),%XMM1 |
(925) 0x52406 ANDPD %XMM2,%XMM1 |
(925) 0x5240a UCOMISD %XMM0,%XMM1 |
(925) 0x5240e JBE 52306 |
(925) 0x52414 LEA -0x1(%RBX),%RCX |
(925) 0x52418 INC %R13 |
(925) 0x5241b MOV -0x30(%RBP),%RDI |
(925) 0x5241f MOV %R14,%RSI |
(925) 0x52422 MOV %R13,%RDX |
(925) 0x52425 CALL 15470 <hypre_swap2@plt> |
(925) 0x5242a MOVAPD 0xe2cde(%RIP),%XMM2 |
(925) 0x52432 MOVSD (%R14,%R12,8),%XMM0 |
(925) 0x52438 ANDPD %XMM2,%XMM0 |
(925) 0x5243c MOVSD (%R14,%RBX,8),%XMM1 |
(925) 0x52442 ANDPD %XMM2,%XMM1 |
(925) 0x52446 UCOMISD %XMM0,%XMM1 |
(925) 0x5244a JBE 521f0 |
(925) 0x52450 INC %R13 |
(925) 0x52453 MOV -0x30(%RBP),%RDI |
(925) 0x52457 MOV %R14,%RSI |
(925) 0x5245a MOV %R13,%RDX |
(925) 0x5245d MOV %RBX,%RCX |
(925) 0x52460 CALL 15470 <hypre_swap2@plt> |
(925) 0x52465 JMP 521f0 |
0x5246a ADD $0x28,%RSP |
0x5246e POP %RBX |
0x5246f POP %R12 |
0x52471 POP %R13 |
0x52473 POP %R14 |
0x52475 POP %R15 |
0x52477 POP %RBP |
0x52478 RET |
0x52479 NOPL (%RAX) |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►44.12+ | hypre_qsort2abs | par_rap.c:199 | libparcsr_ls.so |
○ | hypre_BoomerAMGInterpTruncatio[...] | ams.c:3855 | libparcsr_ls.so |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_fork_call | libiomp5.so | |
○ | __kmpc_fork_call | libiomp5.so | |
○ | hypre_BoomerAMGInterpTruncatio[...] | ams.c:3855 | libparcsr_ls.so |
○ | hypre_BoomerAMGBuildExtPIInter[...] | ams.c:3855 | libparcsr_ls.so |
○ | hypre_BoomerAMGSetup.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_BoomerAMGSetup | ams.c:3550 | libparcsr_ls.so |
○ | hypre_PCGSetup | gmres.c:1245 | libkrylov.so |
○ | main.A | amg.c:398 | exec |
○ | __libc_start_call_main | libc.so.6 | |
►36.27+ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs | par_rap.c:199 | libparcsr_ls.so |
○ | hypre_BoomerAMGInterpTruncatio[...] | ams.c:3855 | libparcsr_ls.so |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_fork_call | libiomp5.so | |
○ | __kmpc_fork_call | libiomp5.so | |
○ | hypre_BoomerAMGInterpTruncatio[...] | ams.c:3855 | libparcsr_ls.so |
○ | hypre_BoomerAMGBuildExtPIInter[...] | ams.c:3855 | libparcsr_ls.so |
○ | hypre_BoomerAMGSetup.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_BoomerAMGSetup | ams.c:3550 | libparcsr_ls.so |
○ | hypre_PCGSetup | gmres.c:1245 | libkrylov.so |
○ | main.A | amg.c:398 | exec |
○ | __libc_start_call_main | libc.so.6 | |
►11.76+ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs | par_rap.c:199 | libparcsr_ls.so |
○ | hypre_BoomerAMGInterpTruncatio[...] | ams.c:3855 | libparcsr_ls.so |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_fork_call | libiomp5.so | |
○ | __kmpc_fork_call | libiomp5.so | |
○ | hypre_BoomerAMGInterpTruncatio[...] | ams.c:3855 | libparcsr_ls.so |
○ | hypre_BoomerAMGBuildExtPIInter[...] | ams.c:3855 | libparcsr_ls.so |
○ | hypre_BoomerAMGSetup.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_BoomerAMGSetup | ams.c:3550 | libparcsr_ls.so |
○ | hypre_PCGSetup | gmres.c:1245 | libkrylov.so |
○ | main.A | amg.c:398 | exec |
○ | __libc_start_call_main | libc.so.6 | |
►6.86+ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs | par_rap.c:199 | libparcsr_ls.so |
○ | hypre_BoomerAMGInterpTruncatio[...] | ams.c:3855 | libparcsr_ls.so |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_fork_call | libiomp5.so | |
○ | __kmpc_fork_call | libiomp5.so | |
○ | hypre_BoomerAMGInterpTruncatio[...] | ams.c:3855 | libparcsr_ls.so |
○ | hypre_BoomerAMGBuildExtPIInter[...] | ams.c:3855 | libparcsr_ls.so |
○ | hypre_BoomerAMGSetup.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_BoomerAMGSetup | ams.c:3550 | libparcsr_ls.so |
○ | hypre_PCGSetup | gmres.c:1245 | libkrylov.so |
○ | main.A | amg.c:398 | exec |
○ | __libc_start_call_main | libc.so.6 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►53.33+ | hypre_qsort2abs | par_rap.c:199 | libparcsr_ls.so |
○ | hypre_BoomerAMGInterpTruncatio[...] | ams.c:3855 | libparcsr_ls.so |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so | |
►27.62+ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs | par_rap.c:199 | libparcsr_ls.so |
○ | hypre_BoomerAMGInterpTruncatio[...] | ams.c:3855 | libparcsr_ls.so |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so | |
►15.24+ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs | par_rap.c:199 | libparcsr_ls.so |
○ | hypre_BoomerAMGInterpTruncatio[...] | ams.c:3855 | libparcsr_ls.so |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so | |
►1.90+ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs | par_rap.c:199 | libparcsr_ls.so |
○ | hypre_BoomerAMGInterpTruncatio[...] | ams.c:3855 | libparcsr_ls.so |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so | |
►1.90+ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs | par_rap.c:199 | libparcsr_ls.so |
○ | hypre_BoomerAMGInterpTruncatio[...] | ams.c:3855 | libparcsr_ls.so |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►52.58+ | hypre_qsort2abs | par_rap.c:199 | libparcsr_ls.so |
○ | hypre_BoomerAMGInterpTruncatio[...] | ams.c:3855 | libparcsr_ls.so |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so | |
►36.08+ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs | par_rap.c:199 | libparcsr_ls.so |
○ | hypre_BoomerAMGInterpTruncatio[...] | ams.c:3855 | libparcsr_ls.so |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so | |
►8.25+ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs | par_rap.c:199 | libparcsr_ls.so |
○ | hypre_BoomerAMGInterpTruncatio[...] | ams.c:3855 | libparcsr_ls.so |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so | |
►3.09+ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs | par_rap.c:199 | libparcsr_ls.so |
○ | hypre_BoomerAMGInterpTruncatio[...] | ams.c:3855 | libparcsr_ls.so |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►42.72+ | hypre_qsort2abs | par_rap.c:199 | libparcsr_ls.so |
○ | hypre_BoomerAMGInterpTruncatio[...] | ams.c:3855 | libparcsr_ls.so |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so | |
►34.95+ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs | par_rap.c:199 | libparcsr_ls.so |
○ | hypre_BoomerAMGInterpTruncatio[...] | ams.c:3855 | libparcsr_ls.so |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so | |
►16.50+ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs | par_rap.c:199 | libparcsr_ls.so |
○ | hypre_BoomerAMGInterpTruncatio[...] | ams.c:3855 | libparcsr_ls.so |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so | |
►4.85+ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs | par_rap.c:199 | libparcsr_ls.so |
○ | hypre_BoomerAMGInterpTruncatio[...] | ams.c:3855 | libparcsr_ls.so |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►48.15+ | hypre_qsort2abs | par_rap.c:199 | libparcsr_ls.so |
○ | hypre_BoomerAMGInterpTruncatio[...] | ams.c:3855 | libparcsr_ls.so |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so | |
►35.19+ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs | par_rap.c:199 | libparcsr_ls.so |
○ | hypre_BoomerAMGInterpTruncatio[...] | ams.c:3855 | libparcsr_ls.so |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so | |
►14.81+ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs | par_rap.c:199 | libparcsr_ls.so |
○ | hypre_BoomerAMGInterpTruncatio[...] | ams.c:3855 | libparcsr_ls.so |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►42.86+ | hypre_qsort2abs | par_rap.c:199 | libparcsr_ls.so |
○ | hypre_BoomerAMGInterpTruncatio[...] | ams.c:3855 | libparcsr_ls.so |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so | |
►34.13+ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs | par_rap.c:199 | libparcsr_ls.so |
○ | hypre_BoomerAMGInterpTruncatio[...] | ams.c:3855 | libparcsr_ls.so |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so | |
►19.05+ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs.A | ams.c:3855 | libparcsr_ls.so |
○ | hypre_qsort2abs | par_rap.c:199 | libparcsr_ls.so |
○ | hypre_BoomerAMGInterpTruncatio[...] | ams.c:3855 | libparcsr_ls.so |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so | |
►1.59+ | hypre_BoomerAMGInterpTruncatio[...] | ams.c:3855 | libparcsr_ls.so |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Path / |
Source file and lines | par_interp.c:3180-3192 |
Module | libparcsr_ls.so |
nb instructions | 32 |
nb uops | 26 |
loop length | 111 |
used x86 registers | 12 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 2 |
micro-operation queue | 4.33 cycles |
front end | 4.33 cycles |
| ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 1.50 | 1.00 | 1.00 | 1.00 | 1.50 | 0.67 | 0.67 | 0.67 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
cycles | 1.50 | 1.00 | 1.00 | 1.00 | 1.50 | 0.67 | 0.67 | 0.67 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 4.33 |
Dispatch | 1.50 |
Overall L1 | 4.33 |
all | 0% |
load | NA (no load vectorizable/vectorized instructions) |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 12% |
load | NA (no load vectorizable/vectorized instructions) |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput | Vectorization |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
CMP %RCX,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JGE 52478 <hypre_qsort2abs.A+0x3d8> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
SUB $0x28,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RCX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %RDX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %RSI,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %RCX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %RDI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
JMP 5211a <hypre_qsort2abs.A+0x7a> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
ADD $0x28,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
Source file and lines | par_interp.c:3180-3192 |
Module | libparcsr_ls.so |
nb instructions | 32 |
nb uops | 26 |
loop length | 111 |
used x86 registers | 12 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 2 |
micro-operation queue | 4.33 cycles |
front end | 4.33 cycles |
| ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 1.50 | 1.00 | 1.00 | 1.00 | 1.50 | 0.67 | 0.67 | 0.67 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
cycles | 1.50 | 1.00 | 1.00 | 1.00 | 1.50 | 0.67 | 0.67 | 0.67 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 4.33 |
Dispatch | 1.50 |
Overall L1 | 4.33 |
all | 0% |
load | NA (no load vectorizable/vectorized instructions) |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 12% |
load | NA (no load vectorizable/vectorized instructions) |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput | Vectorization |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
CMP %RCX,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JGE 52478 <hypre_qsort2abs.A+0x3d8> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
SUB $0x28,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RCX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %RDX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %RSI,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV %RCX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %RDI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
JMP 5211a <hypre_qsort2abs.A+0x7a> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
ADD $0x28,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
Run 8x1 | Number processes: 8; Number nodes: 1; Run Command: <executable> -n 400 400 400; MPI Command: mpirun -n <number_processes>; Dataset: (empty); Run Directory: /home/eoseret/qaas_runs_CPU_9468/172-019-1763/intel/AMG/run/oneview_runs/multicore/icx_9/oneview_run_1720211326; OMP_PROC_BIND: spread; I_MPI_PIN_DOMAIN: auto:scatter; OMP_PLACES: threads; OMP_NUM_THREADS: 1 |
---|---|
Run 8x2 | Number processes: 8; OMP_NUM_THREADS: 2; OMP_PROC_BIND: spread; I_MPI_PIN_DOMAIN: auto:scatter; OMP_PLACES: threads |
Run 8x4 | Number processes: 8; OMP_NUM_THREADS: 4; OMP_PROC_BIND: spread; I_MPI_PIN_DOMAIN: auto:scatter; OMP_PLACES: threads |
Run 8x8 | Number processes: 8; OMP_NUM_THREADS: 8; OMP_PROC_BIND: spread; I_MPI_PIN_DOMAIN: auto:scatter; OMP_PLACES: threads |
Run 8x16 | Number processes: 8; OMP_NUM_THREADS: 16; OMP_PROC_BIND: spread; I_MPI_PIN_DOMAIN: auto:scatter; OMP_PLACES: threads |
Run 8x24 | Number processes: 8; OMP_NUM_THREADS: 24; OMP_PROC_BIND: spread; I_MPI_PIN_DOMAIN: auto:scatter; OMP_PLACES: threads |
(8x1) Efficiency | (8x1) Potential Speed-Up (%) | (8x2) Efficiency | (8x2) Potential Speed-Up (%) | (8x4) Efficiency | (8x4) Potential Speed-Up (%) | (8x8) Efficiency | (8x8) Potential Speed-Up (%) | (8x16) Efficiency | (8x16) Potential Speed-Up (%) | (8x24) Efficiency | (8x24) Potential Speed-Up (%) |
---|---|---|---|---|---|---|---|---|---|---|---|
1 | 0 | 1.91 | 0 | 4.06 | 0 | 7.54 | 0 | 14.31 | 0 | 18.3 | 0 |
Run | Number of threads | Efficiency (ideal is 1) | Speedup | Ideal Speedup | Time (s) | Coverage (%) |
---|---|---|---|---|---|---|
8x1 | 8 | 1 | 1 | 1 | 0.079999998211861 | 0.018906891345978 |
8x2 | 16 | 1.91 | 1.91 | 2 | 0.049999989569187 | 0.019424706697464 |
8x4 | 32 | 4.06 | 4.06 | 4 | 0.029999997466803 | 0.012917910702527 |
8x8 | 64 | 7.54 | 7.54 | 8 | 0.019999999552965 | 0.0095599349588156 |
8x16 | 128 | 14.31 | 14.31 | 16 | 0.014999999664724 | 0.0054605696350336 |
8x24 | 190 | 18.3 | 18.3 | 24 | 0.014999999664724 | 0.004682547878474 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_qsort2abs.A– | 0.02 | 0.06 |
▼Loop 923 - par_interp.c:3180-3191 - libparcsr_ls.so– | 0.00 | 0.01 |
○Loop 924 - par_interp.c:3180-3187 - libparcsr_ls.so | 0.01 | 0.03 |
○Loop 925 - par_interp.c:3184-3187 - libparcsr_ls.so | 0.00 | 0.01 |