| | | | | | | requested parallelism | walltime sum (s) | nb instances | any sync average per thread time (s) | any wait average per thread time (s) | parallelism overhead (%) | local speedup if perfectly balanced | global speedup if perfectly balanced |
start addr | function name | source location | level | ancestor thread num | invoker | parallel or teams | 2x1 | 2x2 | 2x4 | 2x8 | 2x16 | 2x32 | 2x64 | 2x96 | 2x1 | 2x2 | 2x4 | 2x8 | 2x16 | 2x32 | 2x64 | 2x96 | 2x1 | 2x2 | 2x4 | 2x8 | 2x16 | 2x32 | 2x64 | 2x96 | 2x1 | 2x2 | 2x4 | 2x8 | 2x16 | 2x32 | 2x64 | 2x96 | 2x1 | 2x2 | 2x4 | 2x8 | 2x16 | 2x32 | 2x64 | 2x96 | 2x1 | 2x2 | 2x4 | 2x8 | 2x16 | 2x32 | 2x64 | 2x96 | 2x1 | 2x2 | 2x4 | 2x8 | 2x16 | 2x32 | 2x64 | 2x96 | 2x1 | 2x2 | 2x4 | 2x8 | 2x16 | 2x32 | 2x64 | 2x96 |
exec:0x58c258 | hypre_CSRMatrixMatvecOutOfPlace.A | csr_matvec.c:243 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 76.051 | 14.840 | 9.313 | 4.906 | 4.259 | 3.117 | 2.766 | 2.768 | 1.39 E3 | 480 | 480 | 480 | 480 | 480 | 480 | 480 | 0.0 | 0.174 | 0.727 | 0.381 | 0.932 | 0.616 | 0.465 | 0.428 | 0.0 | 0.174 | 0.727 | 0.381 | 0.932 | 0.616 | 0.465 | 0.428 | 0 | 1.17 | 7.50 | 7.59 | 21.1 | 19.7 | 16.8 | 15.4 | 1.000 | 1.012 | 1.081 | 1.082 | 1.268 | 1.246 | 1.202 | 1.183 | 1.000 | 1.002 | 1.012 | 1.011 | 1.034 | 1.033 | 1.027 | 1.025 |
exec:0x466432 | hypre_BoomerAMGBuildMultipass.A | par_multi_interp.c:891 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 11.688 | 7.251 | 4.706 | 2.205 | 1.300 | 0.702 | 0.432 | 0.314 | 2.00 | 2.00 | 2.00 | 2.00 | 2.00 | 2.00 | 2.00 | 2.00 | 3.73 E-6 | 0.409 | 0.846 | 0.259 | 0.257 | 0.142 | 63.5 E-3 | 48.8 E-3 | 705 E-9 | 0.409 | 0.846 | 0.259 | 0.257 | 0.141 | 63.5 E-3 | 48.8 E-3 | 0.00 | 4.87 | 18.0 | 11.7 | 19.8 | 20.2 | 15.1 | 15.5 | 1.000 | 1.051 | 1.220 | 1.133 | 1.247 | 1.253 | 1.178 | 1.184 | 1.000 | 1.004 | 1.014 | 1.008 | 1.009 | 1.007 | 1.004 | 1.003 |
exec:0x4682df | hypre_BoomerAMGBuildMultipass.A | par_multi_interp.c:1737 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 11.470 | 6.860 | 4.182 | 2.160 | 1.214 | 0.757 | 0.611 | 0.654 | 2.00 | 2.00 | 2.00 | 2.00 | 2.00 | 2.00 | 2.00 | 2.00 | 0.0 | 29.5 E-3 | 0.516 | 0.255 | 0.175 | 0.119 | 74.3 E-3 | 68.0 E-3 | 0.0 | 29.5 E-3 | 0.516 | 0.255 | 0.175 | 0.119 | 74.3 E-3 | 68.0 E-3 | 0 | 0.43 | 12.3 | 11.8 | 14.4 | 15.8 | 12.1 | 10.4 | 1.000 | 1.004 | 1.140 | 1.134 | 1.169 | 1.187 | 1.138 | 1.116 | 1.000 | 1.000 | 1.009 | 1.008 | 1.006 | 1.006 | 1.004 | 1.004 |
exec:0x4f89a5 | hypre_BoomerAMGCreate2ndS.A | par_strength.c:1668 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 10.175 | 5.192 | 2.747 | 1.425 | 0.755 | 0.398 | 0.224 | 0.183 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 2.12 E-6 | 43.8 E-3 | 75.9 E-3 | 69.6 E-3 | 54.3 E-3 | 24.4 E-3 | 11.9 E-3 | 12.7 E-3 | 570 E-9 | 43.8 E-3 | 75.9 E-3 | 69.6 E-3 | 54.3 E-3 | 24.4 E-3 | 11.9 E-3 | 12.7 E-3 | 0.00 | 0.84 | 2.76 | 4.89 | 7.19 | 6.16 | 5.34 | 6.93 | 1.000 | 1.008 | 1.028 | 1.051 | 1.078 | 1.066 | 1.056 | 1.074 | 1.000 | 1.000 | 1.001 | 1.002 | 1.002 | 1.001 | 1.001 | 1.001 |
exec:0x548b67 | hypre_ParMatmul.A | par_csr_matop.c:829 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 9.117 | 4.574 | 2.314 | 1.154 | 0.583 | 0.295 | 0.153 | 0.124 | 5.00 | 5.00 | 5.00 | 5.00 | 5.00 | 5.00 | 5.00 | 5.00 | 0.0 | 5.10 E-3 | 18.2 E-3 | 8.67 E-3 | 7.62 E-3 | 5.46 E-3 | 4.92 E-3 | 4.27 E-3 | 0.0 | 5.10 E-3 | 18.2 E-3 | 8.67 E-3 | 7.62 E-3 | 5.46 E-3 | 4.92 E-3 | 4.27 E-3 | 0 | 0.11 | 0.78 | 0.75 | 1.31 | 1.85 | 3.20 | 3.44 | 1.000 | 1.001 | 1.008 | 1.008 | 1.013 | 1.019 | 1.033 | 1.036 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x548a00 | hypre_ParMatmul.A | par_csr_matop.c:102 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 7.518 | 3.782 | 1.903 | 0.955 | 0.483 | 0.243 | 0.125 | 94.5 E-3 | 5.00 | 5.00 | 5.00 | 5.00 | 5.00 | 5.00 | 5.00 | 5.00 | 4.44 E-6 | 14.2 E-3 | 14.9 E-3 | 9.87 E-3 | 8.18 E-3 | 4.70 E-3 | 3.26 E-3 | 3.72 E-3 | 1.89 E-6 | 14.2 E-3 | 14.9 E-3 | 9.86 E-3 | 8.17 E-3 | 4.69 E-3 | 3.26 E-3 | 3.72 E-3 | 0.00 | 0.37 | 0.78 | 1.03 | 1.69 | 1.93 | 2.61 | 3.94 | 1.000 | 1.004 | 1.008 | 1.010 | 1.017 | 1.020 | 1.027 | 1.041 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x43c604 | hypre_BoomerAMGCoarsenPMIS.A | par_coarsen.c:2354 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 6.485 | 3.275 | 1.657 | 0.824 | 0.418 | 0.213 | 0.119 | 92.2 E-3 | 48.5 | 48.5 | 48.5 | 48.5 | 48.5 | 48.5 | 48.5 | 48.5 | 0.0 | 18.9 E-3 | 23.1 E-3 | 9.48 E-3 | 8.65 E-3 | 6.25 E-3 | 11.0 E-3 | 10.5 E-3 | 0.0 | 18.9 E-3 | 23.1 E-3 | 9.48 E-3 | 8.64 E-3 | 6.24 E-3 | 11.0 E-3 | 10.5 E-3 | 0 | 0.57 | 1.39 | 1.15 | 2.07 | 2.94 | 9.29 | 11.4 | 1.000 | 1.006 | 1.014 | 1.012 | 1.021 | 1.030 | 1.102 | 1.129 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.001 | 1.001 |
exec:0x5859bf | hypre_CSRMatrixMultiply | csr_matop.c:185 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 4.038 | 2.045 | 1.053 | 0.542 | 0.323 | 0.176 | 0.113 | 94.1 E-3 | 20.0 | 20.0 | 20.0 | 20.0 | 20.0 | 20.0 | 20.0 | 20.0 | 15.7 E-6 | 9.63 E-3 | 20.2 E-3 | 18.5 E-3 | 36.6 E-3 | 16.7 E-3 | 19.4 E-3 | 13.6 E-3 | 4.81 E-6 | 9.61 E-3 | 20.2 E-3 | 18.5 E-3 | 36.5 E-3 | 16.6 E-3 | 19.4 E-3 | 13.6 E-3 | 0.00 | 0.47 | 1.92 | 3.42 | 11.3 | 9.44 | 17.1 | 14.5 | 1.000 | 1.005 | 1.020 | 1.035 | 1.128 | 1.104 | 1.207 | 1.169 | 1.000 | 1.000 | 1.000 | 1.001 | 1.001 | 1.001 | 1.001 | 1.001 |
exec:0x574ec0 | hypre_IJMatrixSetValuesOMPParCSR.A | IJMatrix_parcsr.c:3240 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 2.515 | 1.270 | 0.661 | 0.332 | 0.223 | 0.161 | 0.188 | 0.183 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.82 E-6 | 2.67 E-3 | 7.15 E-3 | 4.58 E-3 | 35.1 E-3 | 16.5 E-3 | 28.3 E-3 | 11.2 E-3 | 600 E-9 | 2.66 E-3 | 7.15 E-3 | 4.58 E-3 | 35.1 E-3 | 16.5 E-3 | 28.3 E-3 | 11.2 E-3 | 0.00 | 0.21 | 1.08 | 1.38 | 15.7 | 10.2 | 15.1 | 6.12 | 1.000 | 1.002 | 1.011 | 1.014 | 1.187 | 1.114 | 1.177 | 1.065 | 1.000 | 1.000 | 1.000 | 1.000 | 1.001 | 1.001 | 1.002 | 1.001 |
exec:0x4f6bdd | hypre_BoomerAMGCreateS.A | par_strength.c:246 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 2.453 | 1.243 | 0.672 | 0.339 | 0.255 | 0.180 | 0.192 | 0.181 | 6.00 | 6.00 | 6.00 | 6.00 | 6.00 | 6.00 | 6.00 | 6.00 | 6.94 E-6 | 2.35 E-3 | 16.0 E-3 | 8.46 E-3 | 49.7 E-3 | 20.7 E-3 | 30.3 E-3 | 9.82 E-3 | 2.04 E-6 | 2.34 E-3 | 15.9 E-3 | 8.46 E-3 | 49.6 E-3 | 20.7 E-3 | 30.3 E-3 | 9.82 E-3 | 0.00 | 0.19 | 2.37 | 2.50 | 19.5 | 11.5 | 15.7 | 5.41 | 1.000 | 1.002 | 1.024 | 1.026 | 1.242 | 1.130 | 1.187 | 1.057 | 1.000 | 1.000 | 1.000 | 1.000 | 1.002 | 1.001 | 1.002 | 1.001 |
exec:0x41f994 | BuildIJLaplacian27pt.A | amg.c:760 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 2.408 | 1.455 | 0.949 | 0.754 | 0.477 | 0.294 | 0.268 | 0.282 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 6.35 E-6 | 34.1 E-3 | 86.7 E-3 | 0.128 | 0.136 | 79.6 E-3 | 90.4 E-3 | 97.0 E-3 | 1.12 E-6 | 34.1 E-3 | 86.7 E-3 | 0.128 | 0.136 | 79.6 E-3 | 90.4 E-3 | 97.0 E-3 | 0.00 | 2.35 | 8.99 | 17.0 | 28.6 | 27.1 | 33.8 | 34.4 | 1.000 | 1.024 | 1.099 | 1.204 | 1.400 | 1.372 | 1.510 | 1.525 | 1.000 | 1.000 | 1.001 | 1.004 | 1.005 | 1.004 | 1.005 | 1.006 |
exec:0x43bd83 | hypre_BoomerAMGCoarsenPMIS.A | par_coarsen.c:2132 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 2.310 | 1.160 | 0.582 | 0.294 | 0.151 | 78.4 E-3 | 47.0 E-3 | 36.7 E-3 | 7.00 | 7.00 | 7.00 | 7.00 | 7.00 | 7.00 | 7.00 | 7.00 | 0.0 | 3.01 E-3 | 2.52 E-3 | 2.71 E-3 | 3.89 E-3 | 3.41 E-3 | 6.56 E-3 | 7.67 E-3 | 0.0 | 3.01 E-3 | 2.52 E-3 | 2.71 E-3 | 3.89 E-3 | 3.41 E-3 | 6.56 E-3 | 7.67 E-3 | 0 | 0.26 | 0.43 | 0.92 | 2.58 | 4.35 | 14.0 | 20.9 | 1.000 | 1.003 | 1.004 | 1.009 | 1.026 | 1.045 | 1.162 | 1.264 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x467d1a | hypre_BoomerAMGBuildMultipass.A | par_multi_interp.c:1575 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 2.021 | 1.221 | 0.850 | 0.501 | 0.324 | 0.217 | 0.255 | 0.339 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 0.0 | 23.8 E-3 | 0.148 | 87.4 E-3 | 62.0 E-3 | 28.7 E-3 | 35.8 E-3 | 42.0 E-3 | 0.0 | 23.8 E-3 | 0.148 | 87.4 E-3 | 62.0 E-3 | 28.7 E-3 | 35.8 E-3 | 42.0 E-3 | 0 | 1.78 | 17.1 | 17.4 | 19.2 | 13.3 | 14.1 | 12.4 | 1.000 | 1.018 | 1.207 | 1.210 | 1.237 | 1.153 | 1.164 | 1.141 | 1.000 | 1.000 | 1.002 | 1.003 | 1.002 | 1.002 | 1.002 | 1.002 |
exec:0x476bce | hypre_BoomerAMGBuildExtPIInterp.A | par_lr_interp.c:1196 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 1.611 | 0.815 | 0.425 | 0.221 | 0.116 | 65.8 E-3 | 41.0 E-3 | 33.8 E-3 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 6.53 E-6 | 5.67 E-3 | 17.7 E-3 | 16.7 E-3 | 12.9 E-3 | 13.1 E-3 | 12.4 E-3 | 11.2 E-3 | 1.76 E-6 | 5.67 E-3 | 17.7 E-3 | 16.7 E-3 | 12.9 E-3 | 13.1 E-3 | 12.4 E-3 | 11.2 E-3 | 0.00 | 0.70 | 4.18 | 7.54 | 11.1 | 19.8 | 30.2 | 33.0 | 1.000 | 1.007 | 1.044 | 1.081 | 1.125 | 1.247 | 1.433 | 1.493 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.001 | 1.001 | 1.001 |
exec:0x43c720 | hypre_BoomerAMGCoarsenPMIS.A | par_coarsen.c:2435 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 1.478 | 0.761 | 0.387 | 0.196 | 0.107 | 80.1 E-3 | 70.6 E-3 | 65.6 E-3 | 49.5 | 49.5 | 49.5 | 49.5 | 49.5 | 49.5 | 49.5 | 49.5 | 0.0 | 8.59 E-3 | 8.08 E-3 | 5.47 E-3 | 8.53 E-3 | 18.2 E-3 | 14.8 E-3 | 11.4 E-3 | 0.0 | 8.58 E-3 | 8.07 E-3 | 5.47 E-3 | 8.52 E-3 | 18.2 E-3 | 14.8 E-3 | 11.4 E-3 | 0 | 1.13 | 2.09 | 2.79 | 7.88 | 22.7 | 21.0 | 17.4 | 1.000 | 1.011 | 1.021 | 1.029 | 1.086 | 1.293 | 1.266 | 1.211 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.001 | 1.001 | 1.001 |
exec:0x58c35d | hypre_CSRMatrixMatvecOutOfPlace.A | csr_matvec.c:158 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 1.273 | 0.143 | 86.5 E-3 | 34.6 E-3 | 28.8 E-3 | 32.3 E-3 | 30.0 E-3 | 25.2 E-3 | 121 | 25.0 | 25.0 | 25.0 | 25.0 | 25.0 | 25.0 | 25.0 | 0.0 | 324 E-6 | 6.15 E-3 | 1.56 E-3 | 7.24 E-3 | 7.02 E-3 | 5.02 E-3 | 1.91 E-3 | 0.0 | 320 E-6 | 6.14 E-3 | 1.55 E-3 | 7.24 E-3 | 7.02 E-3 | 5.01 E-3 | 1.91 E-3 | 0 | 0.23 | 7.11 | 4.50 | 25.1 | 21.7 | 16.7 | 7.58 | 1.000 | 1.002 | 1.076 | 1.047 | 1.336 | 1.277 | 1.201 | 1.082 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x58c4ab | hypre_CSRMatrixMatvecOutOfPlace.A | csr_matvec.c:234 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 1.241 | 0.144 | 0.101 | 37.9 E-3 | 25.5 E-3 | 22.7 E-3 | 24.9 E-3 | 22.4 E-3 | 121 | 25.0 | 25.0 | 25.0 | 25.0 | 25.0 | 25.0 | 25.0 | 0.0 | 549 E-6 | 10.6 E-3 | 3.27 E-3 | 10.6 E-3 | 9.31 E-3 | 7.70 E-3 | 6.34 E-3 | 0.0 | 545 E-6 | 10.6 E-3 | 3.27 E-3 | 10.6 E-3 | 9.31 E-3 | 7.70 E-3 | 6.34 E-3 | 0 | 0.38 | 10.5 | 8.61 | 41.7 | 41.1 | 30.9 | 28.4 | 1.000 | 1.004 | 1.118 | 1.094 | 1.716 | 1.698 | 1.448 | 1.397 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x592c07 | hypre_SeqVectorCopy.A | vector.c:334 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 1.130 | 15.7 E-3 | 9.91 E-3 | 5.01 E-3 | 3.90 E-3 | 3.09 E-3 | 2.74 E-3 | 2.36 E-3 | 505 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 0.0 | 31.6 E-6 | 799 E-6 | 262 E-6 | 928 E-6 | 755 E-6 | 565 E-6 | 568 E-6 | 0.0 | 31.4 E-6 | 799 E-6 | 262 E-6 | 928 E-6 | 755 E-6 | 564 E-6 | 568 E-6 | 0 | 0.20 | 8.05 | 5.22 | 23.8 | 24.5 | 20.6 | 24.0 | 1.000 | 1.002 | 1.088 | 1.055 | 1.312 | 1.324 | 1.259 | 1.316 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x54e782 | hypre_ParTMatmul.A | par_csr_matop.c:3454 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 1.116 | 0.583 | 0.304 | 0.181 | 96.4 E-3 | 49.0 E-3 | 30.1 E-3 | 21.8 E-3 | 5.00 | 5.00 | 5.00 | 5.00 | 5.00 | 5.00 | 5.00 | 5.00 | 4.70 E-6 | 4.73 E-3 | 6.77 E-3 | 13.7 E-3 | 14.4 E-3 | 8.57 E-3 | 9.56 E-3 | 6.42 E-3 | 1.50 E-6 | 4.72 E-3 | 6.77 E-3 | 13.7 E-3 | 14.4 E-3 | 8.57 E-3 | 9.56 E-3 | 6.41 E-3 | 0.00 | 0.81 | 2.23 | 7.59 | 15.0 | 17.2 | 31.5 | 28.7 | 1.000 | 1.008 | 1.023 | 1.082 | 1.176 | 1.208 | 1.459 | 1.403 | 1.000 | 1.000 | 1.000 | 1.000 | 1.001 | 1.000 | 1.001 | 1.000 |
exec:0x592e5a | hypre_SeqVectorAxpy | vector.c:449 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 1.063 | 0.606 | 0.453 | 0.219 | 0.204 | 0.147 | 0.135 | 0.117 | 68.0 | 68.0 | 68.0 | 68.0 | 68.0 | 68.0 | 68.0 | 68.0 | 0.0 | 2.31 E-3 | 45.0 E-3 | 16.7 E-3 | 63.9 E-3 | 25.8 E-3 | 27.2 E-3 | 18.4 E-3 | 0.0 | 2.30 E-3 | 45.0 E-3 | 16.7 E-3 | 63.9 E-3 | 25.8 E-3 | 27.2 E-3 | 18.4 E-3 | 0 | 0.38 | 9.94 | 7.64 | 31.3 | 17.6 | 20.0 | 15.8 | 1.000 | 1.004 | 1.110 | 1.083 | 1.455 | 1.214 | 1.250 | 1.188 | 1.000 | 1.000 | 1.001 | 1.000 | 1.002 | 1.001 | 1.002 | 1.001 |
exec:0x592eb8 | hypre_SeqVectorInnerProd | vector.c:483 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 1.008 | 0.511 | 0.296 | 0.153 | 0.132 | 0.114 | 0.108 | 91.0 E-3 | 71.0 | 71.0 | 71.0 | 71.0 | 71.0 | 71.0 | 71.0 | 71.0 | 77.3 E-6 | 5.58 E-3 | 10.1 E-3 | 9.73 E-3 | 31.6 E-3 | 25.0 E-3 | 23.4 E-3 | 14.5 E-3 | 38.8 E-6 | 5.52 E-3 | 10.1 E-3 | 9.67 E-3 | 31.5 E-3 | 25.0 E-3 | 23.4 E-3 | 14.5 E-3 | 0.01 | 1.09 | 3.42 | 6.36 | 23.8 | 21.5 | 20.7 | 15.6 | 1.000 | 1.011 | 1.035 | 1.068 | 1.312 | 1.273 | 1.260 | 1.184 | 1.000 | 1.000 | 1.000 | 1.000 | 1.001 | 1.001 | 1.001 | 1.001 |
exec:0x5747b3 | hypre_IJMatrixAssembleParCSR.A | IJMatrix_parcsr.c:2798 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 0.487 | 0.293 | 0.224 | 0.112 | 83.4 E-3 | 60.5 E-3 | 59.8 E-3 | 54.3 E-3 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 0.0 | 1.00 E-3 | 25.9 E-3 | 7.83 E-3 | 16.1 E-3 | 7.07 E-3 | 8.35 E-3 | 3.05 E-3 | 0.0 | 1.00 E-3 | 25.9 E-3 | 7.83 E-3 | 16.1 E-3 | 7.07 E-3 | 8.35 E-3 | 3.05 E-3 | 0 | 0.30 | 11.6 | 7.00 | 19.3 | 11.6 | 13.9 | 5.63 | 1.000 | 1.003 | 1.131 | 1.075 | 1.239 | 1.131 | 1.162 | 1.060 | 1.000 | 1.000 | 1.000 | 1.000 | 1.001 | 1.000 | 1.000 | 1.000 |
exec:0x585f0c | hypre_CSRMatrixTranspose.A | csr_matop.c:463 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 0.379 | 0.200 | 0.111 | 60.5 E-3 | 41.6 E-3 | 34.4 E-3 | 35.1 E-3 | 37.2 E-3 | 10.0 | 10.0 | 10.0 | 10.0 | 10.0 | 10.0 | 10.0 | 10.0 | 12.4 E-6 | 2.83 E-3 | 4.73 E-3 | 3.97 E-3 | 7.40 E-3 | 7.36 E-3 | 9.42 E-3 | 8.06 E-3 | 3.98 E-6 | 2.82 E-3 | 4.71 E-3 | 3.95 E-3 | 7.39 E-3 | 7.34 E-3 | 9.40 E-3 | 8.05 E-3 | 0.00 | 1.42 | 4.27 | 6.55 | 17.8 | 21.3 | 26.9 | 21.7 | 1.000 | 1.014 | 1.045 | 1.070 | 1.216 | 1.270 | 1.368 | 1.277 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.001 | 1.000 |
exec:0x43c4c5 | hypre_BoomerAMGCoarsenPMIS.A | par_coarsen.c:2516 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 0.250 | 0.130 | 69.7 E-3 | 39.5 E-3 | 33.6 E-3 | 31.8 E-3 | 32.9 E-3 | 30.5 E-3 | 52.0 | 52.0 | 52.0 | 52.0 | 52.0 | 52.0 | 52.0 | 52.0 | 45.4 E-6 | 2.97 E-3 | 3.44 E-3 | 3.96 E-3 | 8.77 E-3 | 10.3 E-3 | 12.0 E-3 | 10.7 E-3 | 23.2 E-6 | 2.93 E-3 | 3.40 E-3 | 3.92 E-3 | 8.73 E-3 | 10.3 E-3 | 12.0 E-3 | 10.7 E-3 | 0.02 | 2.22 | 4.93 | 10.0 | 26.1 | 32.6 | 36.8 | 35.5 | 1.000 | 1.023 | 1.052 | 1.111 | 1.353 | 1.484 | 1.583 | 1.550 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.001 | 1.001 | 1.001 |
exec:0x592a5e | hypre_SeqVectorSetConstantValues | vector.c:268 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 0.241 | 0.140 | 0.101 | 44.9 E-3 | 93.3 E-3 | 79.6 E-3 | 39.8 E-3 | 38.3 E-3 | 144 | 144 | 144 | 144 | 144 | 144 | 144 | 144 | 0.0 | 1.17 E-3 | 11.3 E-3 | 6.27 E-3 | 63.8 E-3 | 50.9 E-3 | 16.2 E-3 | 20.4 E-3 | 0.0 | 1.16 E-3 | 11.3 E-3 | 6.26 E-3 | 63.8 E-3 | 50.8 E-3 | 16.2 E-3 | 20.4 E-3 | 0 | 0.85 | 11.2 | 13.9 | 68.0 | 63.0 | 40.8 | 52.8 | 1.000 | 1.009 | 1.126 | 1.162 | 3.122 | 2.701 | 1.689 | 2.120 | 1.000 | 1.000 | 1.000 | 1.000 | 1.002 | 1.003 | 1.001 | 1.001 |
exec:0x592e0e | hypre_SeqVectorScale | vector.c:413 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 0.222 | 0.121 | 76.5 E-3 | 29.2 E-3 | 28.5 E-3 | 30.8 E-3 | 26.2 E-3 | 21.8 E-3 | 22.0 | 22.0 | 22.0 | 22.0 | 22.0 | 22.0 | 22.0 | 22.0 | 0.0 | 725 E-6 | 7.53 E-3 | 1.96 E-3 | 8.70 E-3 | 6.53 E-3 | 4.02 E-3 | 971 E-6 | 0.0 | 720 E-6 | 7.53 E-3 | 1.95 E-3 | 8.70 E-3 | 6.53 E-3 | 4.02 E-3 | 969 E-6 | 0 | 0.60 | 9.84 | 6.68 | 30.4 | 21.2 | 15.3 | 4.44 | 1.000 | 1.006 | 1.109 | 1.072 | 1.437 | 1.269 | 1.181 | 1.047 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x58c462 | hypre_CSRMatrixMatvecOutOfPlace.A | csr_matvec.c:211 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 0.120 | 24.0 E-3 | 16.0 E-3 | 9.26 E-3 | 6.95 E-3 | 6.11 E-3 | 7.79 E-3 | 5.47 E-3 | 144 | 48.0 | 48.0 | 48.0 | 48.0 | 48.0 | 48.0 | 48.0 | 0.0 | 776 E-6 | 1.61 E-3 | 2.06 E-3 | 1.65 E-3 | 1.34 E-3 | 2.61 E-3 | 1.11 E-3 | 0.0 | 773 E-6 | 1.61 E-3 | 2.05 E-3 | 1.65 E-3 | 1.34 E-3 | 2.60 E-3 | 1.10 E-3 | 0 | 3.24 | 10.1 | 20.7 | 23.8 | 21.9 | 32.7 | 20.2 | 1.000 | 1.033 | 1.112 | 1.261 | 1.312 | 1.281 | 1.485 | 1.254 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x467514 | hypre_BoomerAMGBuildMultipass.A | par_multi_interp.c:1167 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 72.8 E-3 | 42.7 E-3 | 22.2 E-3 | 14.0 E-3 | 8.15 E-3 | 5.52 E-3 | 5.47 E-3 | 5.16 E-3 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 0.0 | 1.98 E-3 | 1.03 E-3 | 2.64 E-3 | 1.70 E-3 | 827 E-6 | 1.22 E-3 | 762 E-6 | 0.0 | 1.98 E-3 | 1.03 E-3 | 2.64 E-3 | 1.70 E-3 | 827 E-6 | 1.22 E-3 | 762 E-6 | 0 | 4.33 | 4.64 | 18.8 | 20.9 | 14.8 | 22.1 | 14.8 | 1.000 | 1.045 | 1.049 | 1.231 | 1.264 | 1.174 | 1.284 | 1.174 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x43c572 | hypre_BoomerAMGCoarsenPMIS.A | par_coarsen.c:2327 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 64.2 E-3 | 42.5 E-3 | 28.3 E-3 | 19.5 E-3 | 17.9 E-3 | 16.9 E-3 | 18.1 E-3 | 18.4 E-3 | 48.5 | 48.5 | 48.5 | 48.5 | 48.5 | 48.5 | 48.5 | 48.5 | 0.0 | 2.94 E-3 | 2.96 E-3 | 3.37 E-3 | 5.23 E-3 | 4.67 E-3 | 5.59 E-3 | 5.86 E-3 | 0.0 | 2.94 E-3 | 2.95 E-3 | 3.36 E-3 | 5.23 E-3 | 4.66 E-3 | 5.59 E-3 | 5.86 E-3 | 0 | 6.79 | 10.5 | 17.3 | 29.3 | 27.7 | 31.1 | 31.6 | 1.000 | 1.073 | 1.117 | 1.209 | 1.414 | 1.383 | 1.450 | 1.462 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x45233d | hypre_BoomerAMGInterpTruncation.A | par_interp.c:2726 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 62.3 E-3 | 35.8 E-3 | 20.2 E-3 | 12.6 E-3 | 7.82 E-3 | 4.73 E-3 | 4.36 E-3 | 3.69 E-3 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 9.96 E-6 | 2.85 E-3 | 2.29 E-3 | 2.41 E-3 | 2.48 E-3 | 1.86 E-3 | 2.44 E-3 | 1.79 E-3 | 2.72 E-6 | 2.84 E-3 | 2.28 E-3 | 2.40 E-3 | 2.47 E-3 | 1.86 E-3 | 2.43 E-3 | 1.78 E-3 | 0.02 | 7.89 | 11.3 | 19.1 | 31.7 | 39.2 | 55.8 | 48.4 | 1.000 | 1.086 | 1.128 | 1.236 | 1.464 | 1.646 | 2.265 | 1.937 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x4f7f0c | hypre_BoomerAMGCreate2ndS.A | par_strength.c:1253 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 59.5 E-3 | 30.9 E-3 | 18.3 E-3 | 11.9 E-3 | 9.09 E-3 | 9.29 E-3 | 9.20 E-3 | 9.77 E-3 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.06 E-6 | 672 E-6 | 1.52 E-3 | 1.64 E-3 | 2.45 E-3 | 3.30 E-3 | 3.12 E-3 | 2.89 E-3 | 415 E-9 | 671 E-6 | 1.51 E-3 | 1.64 E-3 | 2.44 E-3 | 3.30 E-3 | 3.12 E-3 | 2.89 E-3 | 0.00 | 2.17 | 8.08 | 13.7 | 27.0 | 35.9 | 34.1 | 29.8 | 1.000 | 1.022 | 1.088 | 1.158 | 1.369 | 1.559 | 1.517 | 1.424 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x570599 | hypre_IJMatrixInitializeParCSR | IJMatrix_parcsr.c:302 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 58.5 E-3 | 42.2 E-3 | 23.2 E-3 | 12.9 E-3 | 12.7 E-3 | 14.0 E-3 | 14.4 E-3 | 12.6 E-3 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 0.0 | 2.65 E-3 | 1.11 E-3 | 1.12 E-3 | 2.39 E-3 | 3.21 E-3 | 3.82 E-3 | 2.55 E-3 | 0.0 | 2.65 E-3 | 1.11 E-3 | 1.12 E-3 | 2.39 E-3 | 3.21 E-3 | 3.82 E-3 | 2.55 E-3 | 0 | 5.69 | 4.86 | 8.42 | 18.8 | 23.0 | 26.2 | 20.2 | 1.000 | 1.060 | 1.051 | 1.092 | 1.231 | 1.298 | 1.356 | 1.253 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x580247 | hypre_IJVectorSetValuesPar.A | IJVector_parcsr.c:440 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 53.9 E-3 | 49.8 E-3 | 22.1 E-3 | 11.5 E-3 | 10.7 E-3 | 9.28 E-3 | 9.74 E-3 | 9.60 E-3 | 2.00 | 2.00 | 2.00 | 2.00 | 2.00 | 2.00 | 2.00 | 2.00 | 0.0 | 10.5 E-3 | 3.75 E-3 | 1.49 E-3 | 2.42 E-3 | 2.03 E-3 | 2.54 E-3 | 2.99 E-3 | 0.0 | 10.5 E-3 | 3.75 E-3 | 1.49 E-3 | 2.42 E-3 | 2.03 E-3 | 2.54 E-3 | 2.99 E-3 | 0 | 21.0 | 15.8 | 12.9 | 22.3 | 21.9 | 26.2 | 30.6 | 1.000 | 1.265 | 1.187 | 1.148 | 1.288 | 1.281 | 1.355 | 1.440 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x43bdb9 | hypre_BoomerAMGCoarsenPMIS.A | par_coarsen.c:2139 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 34.7 E-3 | 19.0 E-3 | 10.7 E-3 | 5.66 E-3 | 3.96 E-3 | 3.07 E-3 | 2.92 E-3 | 2.61 E-3 | 7.00 | 7.00 | 7.00 | 7.00 | 7.00 | 7.00 | 7.00 | 7.00 | 0.0 | 629 E-6 | 842 E-6 | 700 E-6 | 989 E-6 | 768 E-6 | 812 E-6 | 712 E-6 | 0.0 | 627 E-6 | 838 E-6 | 699 E-6 | 988 E-6 | 767 E-6 | 811 E-6 | 711 E-6 | 0 | 3.32 | 7.86 | 12.3 | 25.0 | 25.0 | 27.8 | 27.3 | 1.000 | 1.034 | 1.085 | 1.140 | 1.333 | 1.333 | 1.385 | 1.375 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x5749bf | hypre_IJMatrixAssembleParCSR.A | IJMatrix_parcsr.c:2843 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 30.5 E-3 | 17.7 E-3 | 10.2 E-3 | 4.89 E-3 | 2.56 E-3 | 1.43 E-3 | 710 E-6 | 455 E-6 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 0.0 | 1.24 E-3 | 1.04 E-3 | 371 E-6 | 319 E-6 | 277 E-6 | 129 E-6 | 65.7 E-6 | 0.0 | 1.24 E-3 | 1.04 E-3 | 370 E-6 | 319 E-6 | 276 E-6 | 129 E-6 | 65.6 E-6 | 0 | 6.49 | 10.2 | 7.71 | 12.5 | 18.6 | 17.9 | 14.4 | 1.000 | 1.069 | 1.113 | 1.084 | 1.142 | 1.229 | 1.218 | 1.168 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x56536d | hypre_ParCSRMatrixMatvecOutOfPlace.A | par_csr_matvec.c:151 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 20.5 E-3 | 5.01 E-3 | 3.66 E-3 | 2.84 E-3 | 2.88 E-3 | 2.85 E-3 | 2.79 E-3 | 2.64 E-3 | 768 | 264 | 264 | 264 | 264 | 264 | 264 | 264 | 0.0 | 575 E-6 | 675 E-6 | 824 E-6 | 945 E-6 | 1.03 E-3 | 976 E-6 | 947 E-6 | 0.0 | 550 E-6 | 656 E-6 | 805 E-6 | 923 E-6 | 1.00 E-3 | 955 E-6 | 923 E-6 | 0 | 11.4 | 18.4 | 29.1 | 32.9 | 36.3 | 35.0 | 35.9 | 1.000 | 1.128 | 1.225 | 1.409 | 1.490 | 1.569 | 1.538 | 1.560 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x4650f6 | hypre_BoomerAMGBuildMultipass.A | par_multi_interp.c:272 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 16.2 E-3 | 8.49 E-3 | 4.33 E-3 | 4.85 E-3 | 4.57 E-3 | 4.17 E-3 | 4.35 E-3 | 4.38 E-3 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 965 E-9 | 185 E-6 | 124 E-6 | 988 E-6 | 1.63 E-3 | 1.38 E-3 | 1.52 E-3 | 1.47 E-3 | 435 E-9 | 184 E-6 | 123 E-6 | 986 E-6 | 1.63 E-3 | 1.38 E-3 | 1.52 E-3 | 1.47 E-3 | 0.01 | 2.16 | 2.82 | 20.0 | 36.1 | 33.9 | 35.7 | 34.2 | 1.000 | 1.022 | 1.029 | 1.249 | 1.564 | 1.512 | 1.556 | 1.520 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x548788 | hypre_ParMatmul.A | par_csr_matop.c:442 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 10.1 E-3 | 12.9 E-3 | 11.7 E-3 | 11.2 E-3 | 8.72 E-3 | 6.30 E-3 | 6.87 E-3 | 6.61 E-3 | 5.00 | 5.00 | 5.00 | 5.00 | 5.00 | 5.00 | 5.00 | 5.00 | 3.17 E-6 | 1.72 E-3 | 3.04 E-3 | 5.50 E-3 | 5.72 E-3 | 4.66 E-3 | 5.86 E-3 | 5.83 E-3 | 850 E-9 | 1.71 E-3 | 3.03 E-3 | 5.50 E-3 | 5.72 E-3 | 4.66 E-3 | 5.86 E-3 | 5.83 E-3 | 0.03 | 12.9 | 25.9 | 49.1 | 65.2 | 73.3 | 85.4 | 88.1 | 1.000 | 1.149 | 1.349 | 1.964 | 2.871 | 3.751 | 6.831 | 8.407 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x4f869d | hypre_BoomerAMGCreate2ndS.A | par_strength.c:1446 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 8.80 E-3 | 9.41 E-3 | 6.82 E-3 | 4.00 E-3 | 2.38 E-3 | 1.27 E-3 | 1.26 E-3 | 1.15 E-3 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 955 E-9 | 315 E-6 | 679 E-6 | 395 E-6 | 242 E-6 | 135 E-6 | 198 E-6 | 186 E-6 | 315 E-9 | 314 E-6 | 678 E-6 | 393 E-6 | 241 E-6 | 134 E-6 | 197 E-6 | 185 E-6 | 0.01 | 3.37 | 9.96 | 9.87 | 10.2 | 10.8 | 15.7 | 16.1 | 1.000 | 1.035 | 1.111 | 1.109 | 1.114 | 1.122 | 1.186 | 1.192 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x549398 | hypre_ParCSRMatrixExtractBExt_Arrays_Overlap.A | par_csr_matop.c:1153 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 8.07 E-3 | 5.36 E-3 | 3.97 E-3 | 2.01 E-3 | 2.23 E-3 | 1.69 E-3 | 1.14 E-3 | 1.64 E-3 | 13.0 | 13.0 | 13.0 | 13.0 | 13.0 | 13.0 | 13.0 | 13.0 | 9.63 E-6 | 895 E-6 | 1.12 E-3 | 545 E-6 | 1.26 E-3 | 1.09 E-3 | 694 E-6 | 1.23 E-3 | 2.17 E-6 | 885 E-6 | 1.11 E-3 | 535 E-6 | 1.25 E-3 | 1.08 E-3 | 684 E-6 | 1.22 E-3 | 0.12 | 15.9 | 28.4 | 27.1 | 56.6 | 64.5 | 59.2 | 67.5 | 1.001 | 1.189 | 1.396 | 1.371 | 2.302 | 2.815 | 2.454 | 3.081 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x58c71d | hypre_CSRMatrixMatvecT.A | csr_matvec.c:527 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 4.81 E-3 | 3.29 E-3 | 2.70 E-3 | 2.33 E-3 | 3.19 E-3 | 3.81 E-3 | 3.19 E-3 | 3.55 E-3 | 240 | 240 | 240 | 240 | 240 | 240 | 240 | 240 | 0.0 | 626 E-6 | 673 E-6 | 700 E-6 | 1.23 E-3 | 1.51 E-3 | 1.34 E-3 | 1.37 E-3 | 0.0 | 609 E-6 | 654 E-6 | 679 E-6 | 1.21 E-3 | 1.49 E-3 | 1.32 E-3 | 1.35 E-3 | 0 | 17.5 | 24.9 | 29.9 | 37.9 | 39.7 | 41.7 | 39.7 | 1.000 | 1.211 | 1.331 | 1.427 | 1.612 | 1.659 | 1.714 | 1.658 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x43bce1 | hypre_BoomerAMGCoarsenPMIS.A | par_coarsen.c:2106 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 2.94 E-3 | 1.66 E-3 | 975 E-6 | 993 E-6 | 547 E-6 | 378 E-6 | 362 E-6 | 451 E-6 | 7.00 | 7.00 | 7.00 | 7.00 | 7.00 | 7.00 | 7.00 | 7.00 | 0.0 | 73.4 E-6 | 97.2 E-6 | 355 E-6 | 138 E-6 | 87.3 E-6 | 97.3 E-6 | 147 E-6 | 0.0 | 71.8 E-6 | 96.5 E-6 | 352 E-6 | 129 E-6 | 86.6 E-6 | 96.7 E-6 | 147 E-6 | 0 | 4.40 | 9.72 | 29.5 | 25.2 | 23.1 | 26.8 | 32.6 | 1.000 | 1.046 | 1.108 | 1.419 | 1.337 | 1.301 | 1.367 | 1.484 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x5369ca | hypre_exchange_interp_data.A | aux_interp.c:347 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 2.46 E-3 | 1.98 E-3 | 1.18 E-3 | 699 E-6 | 414 E-6 | 374 E-6 | 215 E-6 | 268 E-6 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 1.36 E-6 | 234 E-6 | 144 E-6 | 120 E-6 | 92.1 E-6 | 87.7 E-6 | 82.2 E-6 | 81.1 E-6 | 335 E-9 | 232 E-6 | 142 E-6 | 118 E-6 | 90.2 E-6 | 86.0 E-6 | 80.6 E-6 | 79.4 E-6 | 0.06 | 11.1 | 11.8 | 17.1 | 22.3 | 23.4 | 38.3 | 32.1 | 1.001 | 1.125 | 1.134 | 1.206 | 1.286 | 1.305 | 1.620 | 1.473 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x4f8194 | hypre_BoomerAMGCreate2ndS.A | par_strength.c:1338 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 1.74 E-3 | 1.01 E-3 | 523 E-6 | 273 E-6 | 162 E-6 | 182 E-6 | 146 E-6 | 134 E-6 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 2.38 E-6 | 51.9 E-6 | 37.4 E-6 | 30.8 E-6 | 23.4 E-6 | 52.5 E-6 | 31.8 E-6 | 34.4 E-6 | 450 E-9 | 51.3 E-6 | 36.6 E-6 | 29.4 E-6 | 22.3 E-6 | 51.4 E-6 | 30.8 E-6 | 33.8 E-6 | 0.14 | 5.00 | 6.97 | 11.3 | 14.4 | 26.5 | 21.9 | 24.4 | 1.001 | 1.053 | 1.075 | 1.127 | 1.169 | 1.360 | 1.281 | 1.324 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x548819 | hypre_ParMatmul.A | par_csr_matop.c:563 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 1.48 E-3 | 974 E-6 | 625 E-6 | 389 E-6 | 249 E-6 | 170 E-6 | 118 E-6 | 98.0 E-6 | 5.00 | 5.00 | 5.00 | 5.00 | 5.00 | 5.00 | 5.00 | 5.00 | 0.0 | 21.3 E-6 | 51.0 E-6 | 53.6 E-6 | 52.1 E-6 | 41.8 E-6 | 36.3 E-6 | 35.5 E-6 | 0.0 | 20.9 E-6 | 50.7 E-6 | 53.2 E-6 | 51.7 E-6 | 41.3 E-6 | 35.8 E-6 | 35.2 E-6 | 0 | 2.11 | 8.17 | 13.7 | 21.0 | 24.7 | 30.7 | 36.2 | 1.000 | 1.022 | 1.089 | 1.159 | 1.265 | 1.328 | 1.444 | 1.566 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x5a3d36 | hypre_sort_and_create_inverse_map | hypre_merge_sort.c:355 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 1.29 E-3 | 3.01 E-3 | 2.48 E-3 | 1.53 E-3 | 988 E-6 | 625 E-6 | 382 E-6 | 316 E-6 | 14.0 | 14.0 | 14.0 | 14.0 | 14.0 | 14.0 | 14.0 | 14.0 | 0.0 | 116 E-6 | 229 E-6 | 207 E-6 | 189 E-6 | 144 E-6 | 98.7 E-6 | 83.4 E-6 | 0.0 | 115 E-6 | 228 E-6 | 206 E-6 | 182 E-6 | 143 E-6 | 97.6 E-6 | 82.3 E-6 | 0 | 3.94 | 9.29 | 13.8 | 19.2 | 23.3 | 25.7 | 26.3 | 1.000 | 1.041 | 1.102 | 1.160 | 1.238 | 1.304 | 1.347 | 1.356 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x5a3cea | hypre_sort_and_create_inverse_map | hypre_merge_sort.c:326 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 1.29 E-3 | 794 E-6 | 550 E-6 | 481 E-6 | 487 E-6 | 475 E-6 | 549 E-6 | 603 E-6 | 14.0 | 14.0 | 14.0 | 14.0 | 14.0 | 14.0 | 14.0 | 14.0 | 0.0 | 65.2 E-6 | 98.7 E-6 | 162 E-6 | 221 E-6 | 286 E-6 | 371 E-6 | 414 E-6 | 0.0 | 60.5 E-6 | 91.5 E-6 | 152 E-6 | 210 E-6 | 275 E-6 | 359 E-6 | 400 E-6 | 0 | 8.06 | 17.9 | 33.7 | 45.2 | 60.2 | 67.5 | 68.7 | 1.000 | 1.088 | 1.218 | 1.508 | 1.826 | 2.516 | 3.074 | 3.191 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x5a51c7 | hypre_UnorderedIntSetCopyToArray | hypre_hopscotch_hash.c:197 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 1.24 E-3 | 1.22 E-3 | 947 E-6 | 672 E-6 | 564 E-6 | 448 E-6 | 426 E-6 | 506 E-6 | 10.0 | 10.0 | 10.0 | 10.0 | 10.0 | 10.0 | 10.0 | 10.0 | 8.68 E-6 | 91.8 E-6 | 182 E-6 | 195 E-6 | 209 E-6 | 235 E-6 | 239 E-6 | 283 E-6 | 1.32 E-6 | 80.3 E-6 | 166 E-6 | 183 E-6 | 187 E-6 | 226 E-6 | 229 E-6 | 274 E-6 | 0.70 | 7.55 | 19.2 | 29.0 | 37.0 | 52.5 | 56.0 | 55.6 | 1.007 | 1.082 | 1.238 | 1.408 | 1.588 | 2.106 | 2.273 | 2.252 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x4f862f | hypre_BoomerAMGCreate2ndS.A | par_strength.c:1444 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 1.19 E-3 | 2.26 E-3 | 1.55 E-3 | 1.37 E-3 | 949 E-6 | 510 E-6 | 629 E-6 | 773 E-6 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 0.0 | 844 E-6 | 617 E-6 | 636 E-6 | 350 E-6 | 225 E-6 | 322 E-6 | 402 E-6 | 0.0 | 844 E-6 | 617 E-6 | 636 E-6 | 350 E-6 | 225 E-6 | 322 E-6 | 402 E-6 | 0 | 35.7 | 39.9 | 46.1 | 35.3 | 41.9 | 50.6 | 51.7 | 1.000 | 1.556 | 1.663 | 1.854 | 1.547 | 1.721 | 2.025 | 2.070 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x4f8729 | hypre_BoomerAMGCreate2ndS.A | par_strength.c:1512 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 1.04 E-3 | 928 E-6 | 670 E-6 | 352 E-6 | 210 E-6 | 107 E-6 | 65.9 E-6 | 53.0 E-6 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 0.0 | 10.4 E-6 | 58.8 E-6 | 34.8 E-6 | 30.7 E-6 | 19.1 E-6 | 19.6 E-6 | 20.3 E-6 | 0.0 | 10.4 E-6 | 58.7 E-6 | 34.7 E-6 | 30.6 E-6 | 19.1 E-6 | 19.5 E-6 | 20.2 E-6 | 0 | 1.13 | 8.97 | 9.66 | 14.7 | 18.3 | 29.8 | 38.4 | 1.000 | 1.011 | 1.099 | 1.107 | 1.172 | 1.223 | 1.425 | 1.623 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x536596 | hypre_initialize_vecs | aux_interp.c:313 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 864 E-6 | 240 E-6 | 484 E-6 | 248 E-6 | 488 E-6 | 177 E-6 | 160 E-6 | 480 E-6 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 0.0 | 91.1 E-6 | 170 E-6 | 112 E-6 | 305 E-6 | 54.9 E-6 | 47.1 E-6 | 330 E-6 | 0.0 | 90.6 E-6 | 170 E-6 | 111 E-6 | 305 E-6 | 54.4 E-6 | 46.7 E-6 | 329 E-6 | 0 | 37.3 | 36.8 | 43.3 | 53.9 | 30.9 | 29.4 | 53.6 | 1.000 | 1.594 | 1.582 | 1.762 | 2.171 | 1.448 | 1.417 | 2.157 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x536a5f | hypre_exchange_interp_data.A | aux_interp.c:409 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 853 E-6 | 483 E-6 | 282 E-6 | 169 E-6 | 111 E-6 | 72.8 E-6 | 54.2 E-6 | 47.4 E-6 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 0.0 | 8.48 E-6 | 15.8 E-6 | 20.0 E-6 | 20.7 E-6 | 17.7 E-6 | 19.0 E-6 | 18.1 E-6 | 0.0 | 8.10 E-6 | 15.5 E-6 | 19.6 E-6 | 20.3 E-6 | 17.2 E-6 | 18.7 E-6 | 17.7 E-6 | 0 | 1.76 | 5.57 | 11.8 | 18.6 | 24.3 | 35.1 | 38.1 | 1.000 | 1.018 | 1.059 | 1.134 | 1.229 | 1.320 | 1.541 | 1.617 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x55def8 | hypre_MergeDiagAndOffd | par_csr_matrix.c:1459 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 695 E-6 | 1.35 E-3 | 787 E-6 | 897 E-6 | 409 E-6 | 322 E-6 | 349 E-6 | 308 E-6 | 5.00 | 5.00 | 5.00 | 5.00 | 5.00 | 5.00 | 5.00 | 5.00 | 0.0 | 485 E-6 | 194 E-6 | 209 E-6 | 103 E-6 | 88.8 E-6 | 94.6 E-6 | 104 E-6 | 0.0 | 484 E-6 | 194 E-6 | 208 E-6 | 103 E-6 | 88.3 E-6 | 94.2 E-6 | 104 E-6 | 0 | 34.9 | 24.7 | 23.3 | 25.1 | 27.6 | 27.3 | 33.8 | 1.000 | 1.537 | 1.328 | 1.304 | 1.335 | 1.381 | 1.376 | 1.512 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x53697d | hypre_exchange_interp_data.A | aux_interp.c:347 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 640 E-6 | 3.10 E-3 | 2.27 E-3 | 1.27 E-3 | 848 E-6 | 442 E-6 | 288 E-6 | 335 E-6 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 0.0 | 1.09 E-3 | 925 E-6 | 412 E-6 | 339 E-6 | 140 E-6 | 125 E-6 | 120 E-6 | 0.0 | 1.09 E-3 | 924 E-6 | 412 E-6 | 339 E-6 | 139 E-6 | 125 E-6 | 120 E-6 | 0 | 32.8 | 40.1 | 33.2 | 40.3 | 31.5 | 44.3 | 36.9 | 1.000 | 1.488 | 1.669 | 1.497 | 1.674 | 1.460 | 1.794 | 1.585 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x536957 | hypre_exchange_interp_data.A | aux_interp.c:336 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 613 E-6 | 1.47 E-3 | 1.21 E-3 | 758 E-6 | 479 E-6 | 295 E-6 | 188 E-6 | 150 E-6 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 0.0 | 63.6 E-6 | 152 E-6 | 77.0 E-6 | 79.7 E-6 | 50.5 E-6 | 44.4 E-6 | 35.9 E-6 | 0.0 | 63.1 E-6 | 152 E-6 | 76.7 E-6 | 79.4 E-6 | 50.1 E-6 | 44.0 E-6 | 35.6 E-6 | 0 | 4.36 | 12.8 | 10.1 | 16.8 | 17.2 | 23.6 | 24.1 | 1.000 | 1.046 | 1.147 | 1.113 | 1.202 | 1.208 | 1.309 | 1.318 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x466579 | hypre_BoomerAMGBuildMultipass.A | par_multi_interp.c:706 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 595 E-6 | 11.5 E-3 | 313 E-6 | 9.81 E-3 | 181 E-6 | 206 E-6 | 182 E-6 | 204 E-6 | 2.00 | 2.00 | 2.00 | 2.00 | 2.00 | 2.00 | 2.00 | 2.00 | 2.85 E-6 | 5.57 E-3 | 76.9 E-6 | 4.20 E-3 | 59.1 E-6 | 73.2 E-6 | 68.2 E-6 | 79.3 E-6 | 1.76 E-6 | 5.57 E-3 | 75.4 E-6 | 4.19 E-3 | 56.7 E-6 | 71.6 E-6 | 66.7 E-6 | 77.9 E-6 | 0.48 | 26.1 | 24.4 | 44.0 | 32.9 | 36.1 | 37.9 | 39.9 | 1.005 | 1.352 | 1.323 | 1.786 | 1.490 | 1.565 | 1.611 | 1.663 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x4f6a4f | hypre_BoomerAMGCreateS.A | par_strength.c:201 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 295 E-6 | 551 E-6 | 414 E-6 | 257 E-6 | 260 E-6 | 383 E-6 | 649 E-6 | 468 E-6 | 6.00 | 6.00 | 6.00 | 6.00 | 6.00 | 6.00 | 6.00 | 6.00 | 0.0 | 32.2 E-6 | 87.6 E-6 | 67.8 E-6 | 82.7 E-6 | 140 E-6 | 277 E-6 | 169 E-6 | 0.0 | 31.6 E-6 | 87.0 E-6 | 67.0 E-6 | 82.0 E-6 | 123 E-6 | 209 E-6 | 156 E-6 | 0 | 6.67 | 24.1 | 26.6 | 32.1 | 36.7 | 42.7 | 36.9 | 1.000 | 1.071 | 1.317 | 1.362 | 1.472 | 1.580 | 1.745 | 1.585 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x43bd16 | hypre_BoomerAMGCoarsenPMIS.A | par_coarsen.c:2113 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 294 E-6 | 308 E-6 | 261 E-6 | 294 E-6 | 263 E-6 | 181 E-6 | 180 E-6 | 207 E-6 | 7.00 | 7.00 | 7.00 | 7.00 | 7.00 | 7.00 | 7.00 | 7.00 | 0.0 | 49.2 E-6 | 38.1 E-6 | 50.8 E-6 | 57.5 E-6 | 49.5 E-6 | 56.0 E-6 | 72.8 E-6 | 0.0 | 48.7 E-6 | 37.4 E-6 | 50.0 E-6 | 54.8 E-6 | 48.8 E-6 | 55.4 E-6 | 72.2 E-6 | 0 | 15.9 | 14.6 | 17.2 | 21.9 | 27.4 | 31.1 | 35.1 | 1.000 | 1.188 | 1.171 | 1.208 | 1.280 | 1.377 | 1.451 | 1.542 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x4f8795 | hypre_BoomerAMGCreate2ndS.A | par_strength.c:1614 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 274 E-6 | 272 E-6 | 162 E-6 | 79.2 E-6 | 53.1 E-6 | 36.7 E-6 | 36.0 E-6 | 32.1 E-6 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 0.0 | 14.2 E-6 | 49.1 E-6 | 24.7 E-6 | 18.7 E-6 | 11.4 E-6 | 10.7 E-6 | 9.21 E-6 | 0.0 | 14.1 E-6 | 49.1 E-6 | 24.6 E-6 | 18.7 E-6 | 11.3 E-6 | 10.6 E-6 | 9.13 E-6 | 0 | 4.78 | 26.7 | 27.5 | 34.8 | 29.3 | 29.8 | 28.8 | 1.000 | 1.050 | 1.364 | 1.380 | 1.533 | 1.414 | 1.425 | 1.404 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x43c5b4 | hypre_BoomerAMGCoarsenPMIS.A | par_coarsen.c:2338 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 256 E-6 | 296 E-6 | 290 E-6 | 312 E-6 | 300 E-6 | 276 E-6 | 303 E-6 | 286 E-6 | 39.0 | 39.0 | 39.0 | 39.0 | 39.0 | 39.0 | 39.0 | 39.0 | 0.0 | 60.2 E-6 | 84.2 E-6 | 114 E-6 | 122 E-6 | 121 E-6 | 130 E-6 | 130 E-6 | 0.0 | 57.3 E-6 | 80.5 E-6 | 111 E-6 | 118 E-6 | 118 E-6 | 127 E-6 | 127 E-6 | 0 | 19.6 | 28.9 | 36.6 | 40.7 | 44.0 | 42.9 | 45.5 | 1.000 | 1.244 | 1.407 | 1.578 | 1.686 | 1.785 | 1.751 | 1.835 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x54fc9e | hypre_ParMatmul.extracted | par_csr_matop.c:520 | 1 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 227 E-6 | 967 E-6 | 1.42 E-3 | 4.12 E-3 | 4.00 E-3 | 2.50 E-3 | 3.77 E-3 | 3.17 E-3 | 5.00 | 5.00 | 5.00 | 5.00 | 5.00 | 5.00 | 5.00 | 5.00 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x466265 | hypre_BoomerAMGBuildMultipass.A | par_multi_interp.c:685 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 224 E-6 | 207 E-6 | 139 E-6 | 84.6 E-6 | 105 E-6 | 91.4 E-6 | 112 E-6 | 114 E-6 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 0.0 | 43.9 E-6 | 33.2 E-6 | 20.6 E-6 | 27.1 E-6 | 21.6 E-6 | 27.9 E-6 | 34.8 E-6 | 0.0 | 43.8 E-6 | 33.0 E-6 | 20.4 E-6 | 26.9 E-6 | 21.5 E-6 | 27.8 E-6 | 34.6 E-6 | 0 | 21.2 | 24.0 | 24.3 | 26.2 | 24.8 | 24.9 | 30.5 | 1.000 | 1.270 | 1.315 | 1.321 | 1.355 | 1.329 | 1.332 | 1.438 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x5a3d0a | hypre_sort_and_create_inverse_map | hypre_merge_sort.c:329 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 197 E-6 | 917 E-6 | 695 E-6 | 590 E-6 | 420 E-6 | 328 E-6 | 273 E-6 | 279 E-6 | 14.0 | 14.0 | 14.0 | 14.0 | 14.0 | 14.0 | 14.0 | 14.0 | 0.0 | 196 E-6 | 202 E-6 | 212 E-6 | 152 E-6 | 117 E-6 | 95.8 E-6 | 103 E-6 | 0.0 | 195 E-6 | 201 E-6 | 211 E-6 | 147 E-6 | 116 E-6 | 94.7 E-6 | 101 E-6 | 0 | 21.0 | 29.1 | 36.0 | 36.1 | 35.7 | 35.2 | 36.6 | 1.000 | 1.265 | 1.410 | 1.563 | 1.565 | 1.556 | 1.544 | 1.577 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x468725 | hypre_BoomerAMGBuildMultipass.A | par_multi_interp.c:1997 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 145 E-6 | 82.8 E-6 | 50.6 E-6 | 29.7 E-6 | 21.1 E-6 | 17.1 E-6 | 12.4 E-6 | 13.9 E-6 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 0.0 | 4.47 E-6 | 6.28 E-6 | 4.21 E-6 | 5.01 E-6 | 5.10 E-6 | 3.78 E-6 | 4.55 E-6 | 0.0 | 4.40 E-6 | 6.22 E-6 | 4.09 E-6 | 4.88 E-6 | 4.99 E-6 | 3.65 E-6 | 4.45 E-6 | 0 | 5.42 | 12.4 | 14.2 | 23.5 | 30.0 | 30.5 | 32.9 | 1.000 | 1.057 | 1.141 | 1.165 | 1.308 | 1.429 | 1.439 | 1.490 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x476d22 | hypre_BoomerAMGBuildExtPIInterp.A | par_lr_interp.c:1829 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 139 E-6 | 104 E-6 | 69.2 E-6 | 53.3 E-6 | 39.3 E-6 | 37.0 E-6 | 41.9 E-6 | 52.2 E-6 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 0.0 | 11.8 E-6 | 11.2 E-6 | 13.7 E-6 | 13.2 E-6 | 16.1 E-6 | 16.1 E-6 | 19.8 E-6 | 0.0 | 11.4 E-6 | 10.7 E-6 | 13.4 E-6 | 12.8 E-6 | 15.7 E-6 | 15.7 E-6 | 19.4 E-6 | 0 | 10.7 | 16.0 | 25.8 | 33.8 | 43.5 | 38.7 | 38.0 | 1.000 | 1.120 | 1.190 | 1.348 | 1.510 | 1.770 | 1.630 | 1.612 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x4f7fe3 | hypre_BoomerAMGCreate2ndS.A | par_strength.c:1301 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 125 E-6 | 231 E-6 | 164 E-6 | 116 E-6 | 110 E-6 | 126 E-6 | 80.5 E-6 | 101 E-6 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 0.0 | 83.5 E-6 | 49.0 E-6 | 26.8 E-6 | 27.8 E-6 | 30.6 E-6 | 19.6 E-6 | 21.0 E-6 | 0.0 | 83.4 E-6 | 48.9 E-6 | 26.7 E-6 | 27.7 E-6 | 30.4 E-6 | 19.5 E-6 | 20.9 E-6 | 0 | 35.2 | 30.4 | 24.1 | 26.1 | 24.5 | 24.3 | 20.5 | 1.000 | 1.544 | 1.436 | 1.317 | 1.353 | 1.325 | 1.322 | 1.258 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x4f803c | hypre_BoomerAMGCreate2ndS.A | par_strength.c:1314 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 113 E-6 | 92.9 E-6 | 115 E-6 | 86.3 E-6 | 66.4 E-6 | 51.2 E-6 | 44.2 E-6 | 49.4 E-6 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 0.0 | 15.6 E-6 | 52.8 E-6 | 41.3 E-6 | 35.5 E-6 | 27.6 E-6 | 20.2 E-6 | 24.3 E-6 | 0.0 | 15.6 E-6 | 52.7 E-6 | 41.2 E-6 | 35.4 E-6 | 27.5 E-6 | 20.1 E-6 | 24.2 E-6 | 0 | 16.0 | 45.7 | 47.9 | 53.4 | 54.1 | 45.9 | 49.3 | 1.000 | 1.190 | 1.842 | 1.921 | 2.146 | 2.178 | 1.850 | 1.972 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x537499 | hypre_build_interp_colmap.A | aux_interp.c:754 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 111 E-6 | 164 E-6 | 160 E-6 | 122 E-6 | 80.4 E-6 | 63.9 E-6 | 52.0 E-6 | 42.2 E-6 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 0.0 | 28.3 E-6 | 56.0 E-6 | 54.4 E-6 | 34.6 E-6 | 27.8 E-6 | 21.3 E-6 | 18.1 E-6 | 0.0 | 27.8 E-6 | 55.7 E-6 | 54.1 E-6 | 34.2 E-6 | 27.4 E-6 | 21.0 E-6 | 17.7 E-6 | 0 | 16.7 | 35.0 | 44.6 | 43.0 | 43.7 | 41.0 | 42.8 | 1.000 | 1.201 | 1.538 | 1.806 | 1.753 | 1.777 | 1.695 | 1.747 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x536925 | hypre_exchange_interp_data.A | aux_interp.c:337 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 60.1 E-6 | 473 E-6 | 264 E-6 | 150 E-6 | 134 E-6 | 81.9 E-6 | 87.3 E-6 | 97.3 E-6 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 0.0 | 208 E-6 | 108 E-6 | 58.5 E-6 | 43.7 E-6 | 29.9 E-6 | 31.1 E-6 | 37.5 E-6 | 0.0 | 207 E-6 | 108 E-6 | 58.1 E-6 | 43.3 E-6 | 29.5 E-6 | 30.7 E-6 | 37.1 E-6 | 0 | 42.2 | 41.0 | 39.6 | 31.9 | 37.1 | 35.7 | 38.8 | 1.000 | 1.730 | 1.694 | 1.655 | 1.469 | 1.590 | 1.556 | 1.634 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x4654c6 | hypre_BoomerAMGBuildMultipass.A | par_multi_interp.c:340 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 56.5 E-6 | 35.5 E-6 | 37.5 E-6 | 38.6 E-6 | 44.2 E-6 | 37.9 E-6 | 40.0 E-6 | 33.1 E-6 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 675 E-9 | 4.04 E-6 | 8.77 E-6 | 14.0 E-6 | 19.6 E-6 | 16.3 E-6 | 20.4 E-6 | 16.6 E-6 | 325 E-9 | 3.62 E-6 | 8.25 E-6 | 13.1 E-6 | 18.5 E-6 | 15.5 E-6 | 19.7 E-6 | 15.9 E-6 | 1.20 | 11.3 | 23.6 | 36.5 | 45.0 | 42.9 | 50.7 | 50.3 | 1.012 | 1.127 | 1.309 | 1.574 | 1.819 | 1.751 | 2.028 | 2.012 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x53744e | hypre_build_interp_colmap.A | aux_interp.c:721 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 47.1 E-6 | 53.9 E-6 | 59.2 E-6 | 68.1 E-6 | 69.8 E-6 | 80.0 E-6 | 80.5 E-6 | 82.8 E-6 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 2.69 E-6 | 18.7 E-6 | 28.0 E-6 | 39.5 E-6 | 41.3 E-6 | 55.6 E-6 | 55.9 E-6 | 57.7 E-6 | 335 E-9 | 15.3 E-6 | 24.3 E-6 | 35.1 E-6 | 37.4 E-6 | 52.3 E-6 | 52.6 E-6 | 54.5 E-6 | 5.68 | 34.6 | 47.3 | 58.0 | 59.2 | 69.5 | 69.4 | 69.8 | 1.060 | 1.530 | 1.899 | 2.380 | 2.453 | 3.284 | 3.264 | 3.310 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x46875e | hypre_BoomerAMGBuildMultipass.A | par_multi_interp.c:2007 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 35.1 E-6 | 248 E-6 | 166 E-6 | 88.3 E-6 | 48.5 E-6 | 42.8 E-6 | 51.8 E-6 | 48.2 E-6 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 0.0 | 114 E-6 | 54.2 E-6 | 24.6 E-6 | 11.8 E-6 | 10.5 E-6 | 14.7 E-6 | 14.5 E-6 | 0.0 | 114 E-6 | 54.1 E-6 | 24.5 E-6 | 11.7 E-6 | 10.4 E-6 | 14.6 E-6 | 14.4 E-6 | 0 | 45.6 | 33.0 | 27.9 | 24.5 | 25.1 | 28.6 | 30.6 | 1.000 | 1.837 | 1.492 | 1.387 | 1.325 | 1.335 | 1.400 | 1.441 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x5373eb | hypre_build_interp_colmap.A | aux_interp.c:710 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 25.9 E-6 | 34.8 E-6 | 52.7 E-6 | 53.0 E-6 | 65.5 E-6 | 62.8 E-6 | 57.0 E-6 | 54.2 E-6 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 0.0 | 9.14 E-6 | 18.9 E-6 | 19.8 E-6 | 25.1 E-6 | 23.5 E-6 | 20.3 E-6 | 19.9 E-6 | 0.0 | 8.79 E-6 | 18.5 E-6 | 19.4 E-6 | 24.6 E-6 | 23.0 E-6 | 19.9 E-6 | 19.5 E-6 | 0 | 23.6 | 35.8 | 37.3 | 38.4 | 37.3 | 35.5 | 36.7 | 1.000 | 1.310 | 1.557 | 1.596 | 1.622 | 1.595 | 1.550 | 1.580 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x548895 | hypre_ParMatmul.A | par_csr_matop.c:581 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 22.7 E-6 | 25.8 E-6 | 28.6 E-6 | 29.2 E-6 | 33.9 E-6 | 36.8 E-6 | 36.9 E-6 | 39.9 E-6 | 5.00 | 5.00 | 5.00 | 5.00 | 5.00 | 5.00 | 5.00 | 5.00 | 0.0 | 5.61 E-6 | 8.36 E-6 | 10.7 E-6 | 12.3 E-6 | 16.4 E-6 | 15.4 E-6 | 19.0 E-6 | 0.0 | 5.18 E-6 | 7.68 E-6 | 10.0 E-6 | 11.8 E-6 | 15.9 E-6 | 14.9 E-6 | 18.5 E-6 | 0 | 21.3 | 29.2 | 36.7 | 36.4 | 44.8 | 41.7 | 47.5 | 1.000 | 1.270 | 1.412 | 1.579 | 1.571 | 1.810 | 1.716 | 1.904 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x535f9c | hypre_alt_insert_new_nodes.A | aux_interp.c:75 | 1 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 20.8 E-6 | 25.1 E-6 | 20.7 E-6 | 21.2 E-6 | 18.2 E-6 | 19.4 E-6 | 20.2 E-6 | 21.5 E-6 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x46622e | hypre_BoomerAMGBuildMultipass.A | par_multi_interp.c:680 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 18.5 E-6 | 284 E-6 | 214 E-6 | 362 E-6 | 203 E-6 | 230 E-6 | 219 E-6 | 250 E-6 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 0.0 | 132 E-6 | 68.1 E-6 | 123 E-6 | 69.3 E-6 | 92.0 E-6 | 68.0 E-6 | 104 E-6 | 0.0 | 132 E-6 | 68.1 E-6 | 123 E-6 | 69.2 E-6 | 91.9 E-6 | 67.9 E-6 | 104 E-6 | 0 | 46.4 | 32.2 | 34.2 | 34.1 | 39.9 | 30.9 | 41.8 | 1.000 | 1.867 | 1.476 | 1.519 | 1.518 | 1.664 | 1.448 | 1.720 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x5367b3 | hypre_exchange_interp_data.A | aux_interp.c:559 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 11.8 E-6 | 31.2 E-6 | 36.1 E-6 | 35.7 E-6 | 37.5 E-6 | 36.6 E-6 | 35.3 E-6 | 35.1 E-6 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 0.0 | 11.4 E-6 | 12.5 E-6 | 13.2 E-6 | 14.6 E-6 | 14.3 E-6 | 13.9 E-6 | 13.6 E-6 | 0.0 | 11.1 E-6 | 12.2 E-6 | 12.7 E-6 | 14.1 E-6 | 13.8 E-6 | 13.5 E-6 | 13.3 E-6 | 0 | 36.5 | 34.8 | 36.8 | 38.7 | 39.1 | 39.4 | 38.8 | 1.000 | 1.575 | 1.534 | 1.583 | 1.631 | 1.642 | 1.650 | 1.635 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x5374df | hypre_build_interp_colmap.A | aux_interp.c:762 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 11.3 E-6 | 19.6 E-6 | 28.1 E-6 | 29.5 E-6 | 30.0 E-6 | 31.8 E-6 | 31.4 E-6 | 48.5 E-6 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 0.0 | 5.37 E-6 | 9.09 E-6 | 10.4 E-6 | 11.3 E-6 | 14.1 E-6 | 13.5 E-6 | 29.5 E-6 | 0.0 | 4.97 E-6 | 8.71 E-6 | 9.95 E-6 | 10.7 E-6 | 13.6 E-6 | 13.2 E-6 | 29.1 E-6 | 0 | 28.0 | 32.4 | 35.1 | 37.7 | 44.5 | 43.3 | 56.9 | 1.000 | 1.389 | 1.479 | 1.541 | 1.606 | 1.802 | 1.764 | 2.322 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x5373a0 | hypre_build_interp_colmap.A | aux_interp.c:700 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 10.8 E-6 | 38.8 E-6 | 35.3 E-6 | 35.2 E-6 | 31.7 E-6 | 31.7 E-6 | 32.9 E-6 | 33.1 E-6 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 0.0 | 10.6 E-6 | 11.7 E-6 | 13.4 E-6 | 11.0 E-6 | 13.1 E-6 | 12.7 E-6 | 14.0 E-6 | 0.0 | 10.3 E-6 | 11.4 E-6 | 13.0 E-6 | 10.4 E-6 | 12.7 E-6 | 12.3 E-6 | 13.6 E-6 | 0 | 27.3 | 33.3 | 38.3 | 34.6 | 41.4 | 38.4 | 42.3 | 1.000 | 1.375 | 1.498 | 1.620 | 1.529 | 1.706 | 1.625 | 1.733 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x536566 | hypre_initialize_vecs | aux_interp.c:264 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 7.98 E-6 | 69.2 E-6 | 62.0 E-6 | 43.2 E-6 | 44.0 E-6 | 40.7 E-6 | 40.2 E-6 | 41.1 E-6 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 0.0 | 30.4 E-6 | 26.5 E-6 | 16.6 E-6 | 17.3 E-6 | 16.1 E-6 | 16.2 E-6 | 15.9 E-6 | 0.0 | 29.9 E-6 | 26.1 E-6 | 16.2 E-6 | 16.8 E-6 | 15.6 E-6 | 15.8 E-6 | 15.6 E-6 | 0 | 44.0 | 42.8 | 38.3 | 39.2 | 39.7 | 40.4 | 38.8 | 1.000 | 1.786 | 1.748 | 1.620 | 1.645 | 1.658 | 1.677 | 1.634 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x468591 | hypre_BoomerAMGBuildMultipass.A | par_multi_interp.c:1962 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 4.90 E-6 | 19.4 E-6 | 20.6 E-6 | 20.4 E-6 | 18.0 E-6 | 17.6 E-6 | 16.7 E-6 | 18.4 E-6 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 0.0 | 7.19 E-6 | 5.99 E-6 | 6.28 E-6 | 5.93 E-6 | 5.37 E-6 | 4.45 E-6 | 6.01 E-6 | 0.0 | 7.11 E-6 | 5.78 E-6 | 6.10 E-6 | 5.74 E-6 | 5.24 E-6 | 4.31 E-6 | 5.91 E-6 | 0 | 36.3 | 28.3 | 30.6 | 33.0 | 30.7 | 26.6 | 32.7 | 1.000 | 1.571 | 1.395 | 1.440 | 1.493 | 1.444 | 1.363 | 1.485 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x53600c | hypre_alt_insert_new_nodes.A | aux_interp.c:99 | 1 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 4.79 E-6 | 5.19 E-6 | 5.74 E-6 | 5.98 E-6 | 4.81 E-6 | 6.67 E-6 | 6.32 E-6 | 5.91 E-6 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x536b28 | hypre_exchange_interp_data.A | aux_interp.c:559 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 4.77 E-6 | 17.8 E-6 | 23.2 E-6 | 27.4 E-6 | 27.7 E-6 | 29.6 E-6 | 28.7 E-6 | 34.1 E-6 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 4.00 | 0.0 | 6.99 E-6 | 7.40 E-6 | 11.0 E-6 | 10.4 E-6 | 13.5 E-6 | 12.1 E-6 | 14.9 E-6 | 0.0 | 6.52 E-6 | 6.78 E-6 | 10.3 E-6 | 9.75 E-6 | 13.0 E-6 | 11.7 E-6 | 14.6 E-6 | 0 | 39.0 | 32.0 | 40.2 | 37.4 | 45.6 | 42.0 | 44.0 | 1.000 | 1.640 | 1.470 | 1.672 | 1.597 | 1.837 | 1.724 | 1.785 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x468659 | hypre_BoomerAMGBuildMultipass.A | par_multi_interp.c:1976 | 0 | 0 | runtime | parallel | 1 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 1.06 E-6 | 5.15 E-6 | 6.96 E-6 | 6.67 E-6 | 7.01 E-6 | 7.58 E-6 | 8.44 E-6 | 8.73 E-6 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 | 0.0 | 2.11 E-6 | 2.50 E-6 | 2.46 E-6 | 2.67 E-6 | 3.32 E-6 | 3.53 E-6 | 3.43 E-6 | 0.0 | 2.04 E-6 | 2.38 E-6 | 2.29 E-6 | 2.43 E-6 | 3.13 E-6 | 3.40 E-6 | 3.30 E-6 | 0 | 40.7 | 35.8 | 37.0 | 38.1 | 43.9 | 42.0 | 39.5 | 1.000 | 1.687 | 1.557 | 1.588 | 1.616 | 1.781 | 1.723 | 1.652 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 | 1.000 |
exec:0x520a97 | hypre_ParCSRComputeL1NormsThreads.A | ams.c:3363 | 0 | 0 | runtime | parallel | 0 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 0.0 | 0.284 | 0.176 | 96.1 E-3 | 69.7 E-3 | 48.0 E-3 | 38.9 E-3 | 37.7 E-3 | 0.0 | 6.00 | 6.00 | 6.00 | 6.00 | 6.00 | 6.00 | 6.00 | -nan E2147483643 | 1.18 E-3 | 19.1 E-3 | 14.1 E-3 | 16.5 E-3 | 11.9 E-3 | 7.76 E-3 | 5.70 E-3 | -nan E2147483643 | 1.18 E-3 | 19.1 E-3 | 14.1 E-3 | 16.5 E-3 | 11.9 E-3 | 7.76 E-3 | 5.69 E-3 | 0 | 0.41 | 10.3 | 14.7 | 23.5 | 24.8 | 19.9 | 15.0 | 1.000 | 1.004 | 1.115 | 1.172 | 1.307 | 1.330 | 1.249 | 1.176 | 1.000 | 1.000 | 1.000 | 1.000 | 1.001 | 1.001 | 1.000 | 1.000 |
exec:0x58c7b6 | hypre_CSRMatrixMatvecT.A | csr_matvec.c:554 | 0 | 0 | runtime | parallel | 0 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 0.0 | 2.337 | 1.186 | 0.602 | 0.392 | 0.317 | 0.355 | 0.401 | 0.0 | 240 | 240 | 240 | 240 | 240 | 240 | 240 | -nan E2147483643 | 5.50 E-3 | 14.0 E-3 | 7.36 E-3 | 29.9 E-3 | 55.0 E-3 | 84.2 E-3 | 0.112 | -nan E2147483643 | 5.38 E-3 | 13.9 E-3 | 7.22 E-3 | 29.8 E-3 | 54.8 E-3 | 84.0 E-3 | 0.112 | 0 | 0.24 | 1.18 | 1.22 | 7.62 | 16.9 | 24.0 | 28.0 | 1.000 | 1.002 | 1.012 | 1.012 | 1.083 | 1.204 | 1.315 | 1.389 | 1.000 | 1.000 | 1.000 | 1.000 | 1.001 | 1.003 | 1.005 | 1.006 |
exec:0x520e19 | hypre_ParCSRRelaxThreads.A | ams.c:3866 | 0 | 0 | runtime | parallel | 0 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 0.0 | 25.885 | 16.089 | 8.542 | 8.125 | 5.814 | 5.189 | 5.189 | 0.0 | 504 | 504 | 504 | 504 | 504 | 504 | 504 | -nan E2147483643 | 0.244 | 1.168 | 0.596 | 1.880 | 1.055 | 0.826 | 0.730 | -nan E2147483643 | 0.243 | 1.168 | 0.596 | 1.880 | 1.055 | 0.826 | 0.730 | 0 | 0.93 | 6.94 | 6.59 | 22.1 | 18.1 | 15.8 | 13.9 | 1.000 | 1.009 | 1.075 | 1.071 | 1.283 | 1.222 | 1.188 | 1.162 | 1.000 | 1.003 | 1.019 | 1.017 | 1.070 | 1.058 | 1.050 | 1.043 |
exec:0x520d9e | hypre_ParCSRRelaxThreads.A | ams.c:3655 | 0 | 0 | runtime | parallel | 0 | 2 | 4 | 8 | 16 | 32 | 64 | 96 | 0.0 | 0.633 | 0.464 | 0.259 | 0.236 | 0.173 | 0.178 | 0.151 | 0.0 | 504 | 504 | 504 | 504 | 504 | 504 | 504 | -nan E2147483643 | 8.86 E-3 | 50.6 E-3 | 36.8 E-3 | 80.9 E-3 | 35.6 E-3 | 42.1 E-3 | 21.0 E-3 | -nan E2147483643 | 8.82 E-3 | 50.6 E-3 | 36.7 E-3 | 80.9 E-3 | 35.6 E-3 | 42.1 E-3 | 21.0 E-3 | 0 | 1.43 | 10.9 | 14.2 | 34.3 | 20.6 | 23.5 | 14.0 | 1.000 | 1.015 | 1.123 | 1.165 | 1.522 | 1.259 | 1.308 | 1.162 | 1.000 | 1.000 | 1.001 | 1.001 | 1.003 | 1.002 | 1.002 | 1.001 |