options

Profiling node gpu04sas.benchmarkcenter.megware.com - process 17331 - thread 17365

NameModuleCoverage (%)Time (s)
hypre_ParCSRRelaxThreads.extracted.57+exec47.9633.44
Loop 4557 - ams.c:3662-3682 - exec+24.0216.74
Loop 4559 - ams.c:3672-3675 - exec14.6210.19
Loop 4561 - ams.c:3672-3675 - exec9.386.54
Loop 4558 - ams.c:3677-3680 - exec0.010.01
Loop 4560 - ams.c:3677-3680 - exec0.010.01
hypre_CSRMatrixMatvecOutOfPlace.extracted+exec24.5517.11
Loop 6434 - csr_matvec.c:248-314 - exec+6.464.50
Loop 6442 - csr_matvec.c:310-312 - exec2.071.44
Loop 6435 - csr_matvec.c:310-312 - exec1.070.74
Loop 6436 - csr_matvec.c:310-312 - exec0.900.63
Loop 6437 - csr_matvec.c:310-312 - exec0.850.59
Loop 6438 - csr_matvec.c:310-312 - exec0.560.39
Loop 6439 - csr_matvec.c:310-312 - exec0.370.25
Loop 6441 - csr_matvec.c:310-312 - exec0.320.23
Loop 6440 - csr_matvec.c:310-312 - exec0.320.22
Loop 6478 - csr_matvec.c:248-263 - exec+6.384.45
Loop 6486 - csr_matvec.c:259-261 - exec2.471.72
Loop 6479 - csr_matvec.c:259-261 - exec1.020.71
Loop 6481 - csr_matvec.c:259-261 - exec0.850.59
Loop 6480 - csr_matvec.c:259-261 - exec0.630.44
Loop 6482 - csr_matvec.c:259-261 - exec0.450.31
Loop 6483 - csr_matvec.c:259-261 - exec0.370.25
Loop 6484 - csr_matvec.c:259-261 - exec0.300.21
Loop 6485 - csr_matvec.c:259-261 - exec0.290.20
Loop 6416 - csr_matvec.c:248-341 - exec+0.040.02
Loop 6423 - csr_matvec.c:337-339 - exec0.020.01
Loop 6418 - csr_matvec.c:337-339 - exec0.010.01
bool _INTERNAL1311483b::__kmp_wait_template, true, false, true>(kmp_info*, kmp_flag_64*, void*)libiomp5.so4.503.14
hypre_BoomerAMGCreate2ndS.extracted.17+exec1.741.21
Loop 3478 - par_strength.c:1714-1797 - exec+0.660.46
Loop 3488 - par_strength.c:1731-1765 - exec+0.360.25
Loop 3490 - par_strength.c:1743-1752 - exec0.360.25
Loop 3482 - par_strength.c:1731-1765 - exec+0.300.21
Loop 3484 - par_strength.c:1743-1752 - exec0.300.21
Loop 3436 - par_strength.c:2000-2083 - exec+0.630.44
Loop 3446 - par_strength.c:2011-2048 - exec+0.350.24
Loop 3448 - par_strength.c:2024-2034 - exec0.350.24
Loop 3440 - par_strength.c:2011-2048 - exec+0.280.19
Loop 3442 - par_strength.c:2024-2034 - exec0.280.19
Loop 3458 - par_strength.c:1951-1953 - exec0.030.02
Loop 3492 - par_strength.c:1691-1693 - exec0.010.01
Loop 3456 - par_strength.c:1679-1984 - exec0.010.01
__intel_avx_rep_memcpy+exec1.711.20
Loop 6767 - - exec1.681.17
hypre_BoomerAMGBuildMultipass.extracted.34+exec1.691.18
Loop 1492 - par_multi_interp.c:917-997 - exec+0.240.17
Loop 1496 - par_multi_interp.c:917-970 - exec+0.240.17
Loop 1499 - par_multi_interp.c:951-958 - exec0.240.17
Loop 1480 - par_multi_interp.c:917-1125 - exec+0.190.13
Loop 1484 - par_multi_interp.c:917-1099 - exec+0.190.13
Loop 1487 - par_multi_interp.c:1082-1088 - exec0.190.13
Loop 1490 - par_multi_interp.c:1030-1034 - exec0.040.03
hypre_SeqVectorAxpy.extracted+exec1.641.14
Loop 6590 - vector.c:449-452 - exec1.641.14
hypre_BoomerAMGBuildMultipass.extracted.28+exec1.521.06
Loop 1437 - par_multi_interp.c:1747-1876 - exec+0.700.49
Loop 1471 - par_multi_interp.c:1799-1803 - exec0.370.25
Loop 1451 - par_multi_interp.c:1747-1837 - exec+0.320.22
Loop 1461 - par_multi_interp.c:1816-1822 - exec0.160.11
Loop 1455 - par_multi_interp.c:1816-1822 - exec0.160.11
Loop 1475 - par_multi_interp.c:1782-1787 - exec0.020.01
hypre_IJMatrixSetValuesOMPParCSR.extracted.28+exec1.400.98
Loop 5838 - IJMatrix_parcsr.c:3274-3275 - exec0.010.01
hypre_BoomerAMGCreateS.extracted+exec1.310.91
Loop 3386 - par_strength.c:253-472 - exec+0.670.46
Loop 3388 - par_strength.c:451-460 - exec0.510.35
Loop 3400 - par_strength.c:324-327 - exec0.150.11
Loop 3399 - par_strength.c:324-327 - exec0.010.01
Loop 3366 - par_strength.c:492-513 - exec+0.420.29
Loop 3378 - par_strength.c:498-503 - exec0.070.05
Loop 3374 - par_strength.c:498-503 - exec0.060.05
Loop 3368 - par_strength.c:498-503 - exec0.060.04
Loop 3370 - par_strength.c:498-503 - exec0.060.04
Loop 3380 - par_strength.c:498-503 - exec0.050.04
Loop 3372 - par_strength.c:498-503 - exec0.040.03
Loop 3376 - par_strength.c:498-503 - exec0.040.03
Loop 3382 - par_strength.c:498-503 - exec0.040.03
hypre_CSRMatrixMatvecT.extracted.49+exec1.290.90
Loop 6542 - csr_matvec.c:560-567 - exec+0.870.61
Loop 6552 - csr_matvec.c:564-567 - exec0.240.16
Loop 6546 - csr_matvec.c:564-567 - exec0.230.16
Loop 6549 - csr_matvec.c:564-567 - exec0.220.15
Loop 6543 - csr_matvec.c:564-567 - exec0.190.13
Loop 6527 - csr_matvec.c:560-579 - exec+0.020.02
Loop 6531 - csr_matvec.c:577-579 - exec0.010.01
Loop 6532 - csr_matvec.c:577-579 - exec0.010.01
hypre_ParMatmul.extracted.12+exec1.280.89
Loop 5094 - par_csr_matop.c:865-989 - exec+0.980.68
Loop 5095 - par_csr_matop.c:937-989 - exec+0.980.68
Loop 5097 - par_csr_matop.c:946-965 - exec0.970.68
Loop 5096 - par_csr_matop.c:970-989 - exec0.010.01
Loop 5101 - par_csr_matop.c:858-859 - exec0.010.01
hypre_ParMatmul_RowSizes.extracted+exec0.980.68
Loop 5043 - par_csr_matop.c:109-242 - exec+0.520.36
Loop 5060 - par_csr_matop.c:109-231 - exec+0.490.34
Loop 5067 - par_csr_matop.c:195-208 - exec0.250.17
Loop 5063 - par_csr_matop.c:195-208 - exec0.220.15
Loop 5068 - par_csr_matop.c:195-208 - exec0.010.01
Loop 5064 - par_csr_matop.c:195-208 - exec0.010.01
Loop 5061 - par_csr_matop.c:218-231 - exec0.010.01
Loop 5073 - par_csr_matop.c:109-177 - exec+0.020.02
Loop 5076 - par_csr_matop.c:154-167 - exec0.010.01
Loop 5080 - par_csr_matop.c:154-167 - exec0.010.01
Loop 5058 - par_csr_matop.c:195-208 - exec0.010.01
Loop 5040 - par_csr_matop.c:263-266 - exec0.030.02
hypre_BoomerAMGCoarsenPMIS.extracted.15+exec0.950.66
Loop 432 - par_coarsen.c:2354-2381 - exec+0.870.61
Loop 444 - par_coarsen.c:2361-2381 - exec0.170.12
Loop 434 - par_coarsen.c:2361-2381 - exec0.140.10
Loop 440 - par_coarsen.c:2361-2381 - exec0.130.09
Loop 442 - par_coarsen.c:2361-2381 - exec0.110.07
Loop 438 - par_coarsen.c:2361-2381 - exec0.100.07
Loop 436 - par_coarsen.c:2361-2381 - exec0.090.07
Loop 448 - par_coarsen.c:2361-2381 - exec0.070.05
Loop 446 - par_coarsen.c:2361-2381 - exec0.060.05
hypre_CSRMatrixMultiply.extracted+exec0.920.64
Loop 6021 - csr_matop.c:272-298 - exec+0.420.29
Loop 6022 - csr_matop.c:282-298 - exec+0.420.29
Loop 6023 - csr_matop.c:286-298 - exec0.420.29
Loop 6029 - csr_matop.c:214-231 - exec+0.230.16
Loop 6030 - csr_matop.c:222-231 - exec+0.230.16
Loop 6031 - csr_matop.c:225-231 - exec0.230.16
hypre_SeqVectorInnerProd.extracted+exec0.880.61
Loop 6592 - vector.c:483-486 - exec0.880.61
BuildIJLaplacian27pt.extracted+exec0.670.46
Loop 6 - amg.c:1402-2344 - exec+0.420.29
Loop 7 - amg.c:1404-2344 - exec+0.420.29
Loop 8 - amg.c:1406-2344 - exec0.420.29
Loop 11 - amg.c:794-1367 - exec+0.240.17
Loop 12 - amg.c:796-1367 - exec+0.240.17
Loop 13 - amg.c:798-1367 - exec0.240.17
hypre_IJMatrixAssembleParCSR.extracted.25+exec0.580.40
Loop 5757 - IJMatrix_parcsr.c:2798-2812 - exec+0.580.41
Loop 5761 - IJMatrix_parcsr.c:2803-2812 - exec0.130.09
Loop 5763 - IJMatrix_parcsr.c:2803-2812 - exec0.130.09
Loop 5759 - IJMatrix_parcsr.c:2803-2812 - exec0.110.07
Loop 5765 - IJMatrix_parcsr.c:2803-2812 - exec0.100.07
Loop 5762 - IJMatrix_parcsr.c:2803-2812 - exec0.050.04
Loop 5764 - IJMatrix_parcsr.c:2803-2812 - exec0.050.04
Loop 5760 - IJMatrix_parcsr.c:2803-2812 - exec0.010.01
Loop 5758 - IJMatrix_parcsr.c:2803-2812 - exec0.010.01
hypre_BoomerAMGCoarsenPMIS.extracted.10+exec0.550.38
Loop 412 - par_coarsen.c:2435-2477 - exec+0.480.34
Loop 414 - par_coarsen.c:2465-2470 - exec0.090.07
Loop 420 - par_coarsen.c:2465-2470 - exec0.080.06
Loop 416 - par_coarsen.c:2465-2470 - exec0.070.05
Loop 424 - par_coarsen.c:2465-2470 - exec0.060.05
Loop 428 - par_coarsen.c:2465-2470 - exec0.060.04
Loop 418 - par_coarsen.c:2465-2470 - exec0.050.04
Loop 426 - par_coarsen.c:2465-2470 - exec0.040.03
Loop 422 - par_coarsen.c:2465-2470 - exec0.030.02
hypre_BoomerAMGBuildMultipass.extracted.27+exec0.450.31
Loop 1428 - par_multi_interp.c:1585-1660 - exec+0.310.21
Loop 1434 - par_multi_interp.c:1618-1628 - exec0.290.20
Loop 1435 - par_multi_interp.c:1612-1615 - exec0.010.01
hypre_CSRMatrixMatvecOutOfPlace.extracted.9+exec0.410.28
Loop 6487 - csr_matvec.c:234-237 - exec0.410.28
__intel_avx_rep_memsetexec0.390.27
hypre_CSRMatrixMatvecOutOfPlace.extracted.24+exec0.350.25
Loop 6512 - csr_matvec.c:158-161 - exec0.350.25
hypre_SeqVectorSetConstantValues.extracted+exec0.340.24
Loop 6585 - vector.c:268-271 - exec0.340.24
hypre_ParCSRComputeL1NormsThreads.extracted+exec0.320.22
Loop 4488 - ams.c:3382-3401 - exec+0.140.10
Loop 4491 - ams.c:3388-3389 - exec0.070.05
Loop 4495 - ams.c:3388-3389 - exec0.060.05
Loop 4384 - ams.c:3363-3540 - exec+0.070.05
Loop 4387 - ams.c:3532-3534 - exec0.070.05
hypre_SeqVectorScale.extracted+exec0.300.21
Loop 6589 - vector.c:413-416 - exec0.300.21
hypre_BoomerAMGCoarsenPMIS.extracted.35+exec0.270.19
Loop 457 - par_coarsen.c:2132-2136 - exec0.270.19
hypre_BoomerAMGBuildExtPIInterp.extracted+exec0.230.16
Loop 1786 - par_lr_interp.c:1221-1748 - exec+0.110.08
Loop 1794 - par_lr_interp.c:1221-1675 - exec+0.090.07
Loop 1797 - par_lr_interp.c:1644-1650 - exec0.070.05
Loop 1800 - par_lr_interp.c:1221-1627 - exec0.020.01
Loop 1803 - par_lr_interp.c:1494-1545 - exec+0.010.01
Loop 1806 - par_lr_interp.c:1516-1526 - exec0.010.01
Loop 1789 - par_lr_interp.c:1221-1736 - exec+0.010.01
Loop 1792 - par_lr_interp.c:1688-1723 - exec0.010.01
Loop 1824 - par_lr_interp.c:1244-1350 - exec+0.020.02
Loop 1833 - par_lr_interp.c:1264-1303 - exec+0.010.01
Loop 1836 - par_lr_interp.c:1277-1285 - exec0.010.01
Loop 1827 - par_lr_interp.c:1264-1303 - exec+0.010.01
Loop 1830 - par_lr_interp.c:1277-1285 - exec0.010.01
hypre_CSRMatrixTranspose.extracted+exec0.190.13
Loop 6043 - csr_matop.c:540-548 - exec+0.140.10
Loop 6047 - csr_matop.c:540-548 - exec0.040.03
Loop 6048 - csr_matop.c:540-548 - exec0.020.01
Loop 6045 - csr_matop.c:540-548 - exec0.020.01
Loop 6051 - csr_matop.c:540-548 - exec0.020.01
Loop 6044 - csr_matop.c:541-548 - exec0.010.01
Loop 6050 - csr_matop.c:540-548 - exec0.010.01
Loop 6049 - csr_matop.c:540-548 - exec0.010.01
Loop 6046 - csr_matop.c:540-548 - exec0.010.01
Loop 6060 - csr_matop.c:483-485 - exec0.020.01
Loop 6059 - csr_matop.c:380-500 - exec0.010.01
kmp_flag_native::notdone_check()libiomp5.so0.140.10
hypre_BoomerAMGCoarsenPMIS.extracted+exec0.100.07
Loop 411 - par_coarsen.c:2528-2536 - exec0.060.05
Loop 407 - par_coarsen.c:2562-2567 - exec0.040.03
hypre_ParTMatmul.extracted+exec0.090.07
Loop 5173 - par_csr_matop.c:3467-3634 - exec+0.050.03
Loop 5174 - par_csr_matop.c:3467-3634 - exec+0.040.03
Loop 5178 - par_csr_matop.c:3505-3608 - exec0.040.03
Loop 5202 - par_csr_matop.c:3590-3596 - exec0.010.01
Loop 5207 - par_csr_matop.c:3467-3528 - exec+0.040.03
Loop 5208 - par_csr_matop.c:3467-3522 - exec+0.030.02
Loop 5212 - par_csr_matop.c:3504-3505 - exec0.020.01
Loop 5213 - par_csr_matop.c:3504-3505 - exec0.010.01
Loop 5236 - par_csr_matop.c:3491-3495 - exec0.010.01
hypre_BoomerAMGCoarsenPMIS.extracted.25+exec0.060.04
Loop 455 - par_coarsen.c:2327-2334 - exec0.060.04
__GI___sched_yieldlibc.so.60.060.04
hypre_CSRMatrixMatvecOutOfPlace.extracted.19+exec0.040.03
Loop 6506 - csr_matvec.c:178-196 - exec+0.010.01
Loop 6507 - csr_matvec.c:194-195 - exec0.010.01
__memset_avx512_unaligned_ermslibc.so.60.030.02
hypre_BoomerAMGCreate2ndS.extracted+exec0.020.01
Loop 3422 - par_strength.c:1268-1278 - exec0.010.01
Loop 3423 - par_strength.c:1261-1263 - exec0.010.01
_INTERNAL1311483b::__kmp_hyper_barrier_gather(barrier_type, kmp_info*, int, int, void (*)(void*, void*), void*)libiomp5.so0.010.01
hypre_BoomerAMGCoarsenPMIS.extracted.30+exec0.010.01
Loop 456 - par_coarsen.c:2139-2142 - exec0.010.01
_ZN17_INTERNAL1311483b26__kmp_hyper_barrier_gatherE12barrier_typeP8kmp_infoiiPFvPvS3_ES3_..0libiomp5.so0.000.00
×