options

Profiling node gpu04sas.benchmarkcenter.megware.com - process 17338 - thread 17338

NameModuleCoverage (%)Time (s)
hypre_ParCSRRelaxThreads.extracted.57+exec44.4632.82
Loop 4557 - ams.c:3662-3682 - exec+21.0015.50
Loop 4559 - ams.c:3672-3675 - exec12.639.32
Loop 4561 - ams.c:3672-3675 - exec8.326.14
Loop 4558 - ams.c:3677-3680 - exec0.030.02
Loop 4560 - ams.c:3677-3680 - exec0.010.00
hypre_CSRMatrixMatvecOutOfPlace.extracted+exec23.1717.10
Loop 6478 - csr_matvec.c:248-263 - exec+6.204.57
Loop 6481 - csr_matvec.c:259-261 - exec2.661.96
Loop 6482 - csr_matvec.c:259-261 - exec0.840.62
Loop 6483 - csr_matvec.c:259-261 - exec0.830.61
Loop 6484 - csr_matvec.c:259-261 - exec0.810.60
Loop 6485 - csr_matvec.c:259-261 - exec0.400.29
Loop 6486 - csr_matvec.c:259-261 - exec0.300.22
Loop 6479 - csr_matvec.c:259-261 - exec0.180.13
Loop 6480 - csr_matvec.c:259-261 - exec0.170.12
Loop 6434 - csr_matvec.c:248-314 - exec+6.174.55
Loop 6437 - csr_matvec.c:310-312 - exec2.231.64
Loop 6438 - csr_matvec.c:310-312 - exec1.040.77
Loop 6440 - csr_matvec.c:310-312 - exec0.750.55
Loop 6439 - csr_matvec.c:310-312 - exec0.680.50
Loop 6441 - csr_matvec.c:310-312 - exec0.520.38
Loop 6442 - csr_matvec.c:310-312 - exec0.390.28
Loop 6435 - csr_matvec.c:310-312 - exec0.310.23
Loop 6436 - csr_matvec.c:310-312 - exec0.250.18
Loop 6416 - csr_matvec.c:248-341 - exec+0.030.02
Loop 6422 - csr_matvec.c:337-339 - exec0.010.01
Loop 6418 - csr_matvec.c:337-339 - exec0.010.00
Loop 6420 - csr_matvec.c:337-339 - exec0.010.00
Loop 6419 - csr_matvec.c:337-339 - exec0.010.00
hypre_BoomerAMGBuildMultipass+exec6.594.86
Loop 1297 - par_multi_interp.c:646-661 - exec+2.191.62
Loop 1299 - par_multi_interp.c:651-655 - exec2.191.62
Loop 1300 - par_multi_interp.c:205-600 - exec+1.641.21
Loop 1311 - par_multi_interp.c:205-571 - exec+1.641.21
Loop 1313 - par_multi_interp.c:554-557 - exec1.631.20
Loop 1312 - par_multi_interp.c:568-571 - exec0.010.00
Loop 1325 - par_multi_interp.c:488-514 - exec+1.551.14
Loop 1327 - par_multi_interp.c:491-498 - exec1.551.14
Loop 1247 - par_multi_interp.c:1158-1161 - exec0.170.12
Loop 1352 - par_multi_interp.c:385-399 - exec0.070.05
Loop 1251 - par_multi_interp.c:205-891 - exec+0.010.01
Loop 1270 - par_multi_interp.c:205-758 - exec+0.010.01
Loop 1271 - par_multi_interp.c:205-758 - exec+0.010.01
Loop 1272 - par_multi_interp.c:749-758 - exec+0.010.00
Loop 1273 - par_multi_interp.c:753-755 - exec0.010.00
Loop 1274 - par_multi_interp.c:742-745 - exec0.010.00
_ZN17_INTERNAL1311483b26__kmp_hyper_barrier_gatherE12barrier_typeP8kmp_infoiiPFvPvS3_ES3_..0libiomp5.so1.821.34
hypre_BoomerAMGCreate2ndS.extracted.17+exec1.561.15
Loop 3436 - par_strength.c:2000-2083 - exec+0.600.44
Loop 3446 - par_strength.c:2011-2048 - exec+0.320.23
Loop 3448 - par_strength.c:2024-2034 - exec0.320.23
Loop 3440 - par_strength.c:2011-2048 - exec+0.280.21
Loop 3442 - par_strength.c:2024-2034 - exec0.280.21
Loop 3478 - par_strength.c:1714-1797 - exec+0.580.43
Loop 3482 - par_strength.c:1731-1765 - exec+0.340.25
Loop 3484 - par_strength.c:1743-1752 - exec0.340.25
Loop 3488 - par_strength.c:1731-1765 - exec+0.240.18
Loop 3490 - par_strength.c:1743-1752 - exec0.240.18
Loop 3458 - par_strength.c:1951-1953 - exec0.030.02
Loop 3456 - par_strength.c:1679-1984 - exec0.010.00
Loop 3492 - par_strength.c:1691-1693 - exec0.010.00
__intel_avx_rep_memcpy+exec1.521.12
Loop 6767 - - exec1.521.12
hypre_SeqVectorAxpy.extracted+exec1.501.10
Loop 6590 - vector.c:449-452 - exec1.501.10
hypre_BoomerAMGBuildMultipass.extracted.34+exec1.461.08
Loop 1492 - par_multi_interp.c:917-997 - exec+0.180.13
Loop 1496 - par_multi_interp.c:917-970 - exec+0.180.13
Loop 1499 - par_multi_interp.c:951-958 - exec0.180.13
Loop 1480 - par_multi_interp.c:917-1125 - exec+0.160.12
Loop 1484 - par_multi_interp.c:917-1099 - exec+0.160.11
Loop 1487 - par_multi_interp.c:1082-1088 - exec0.160.11
Loop 1481 - par_multi_interp.c:1104-1125 - exec+0.010.00
Loop 1482 - par_multi_interp.c:1111-1125 - exec0.010.00
hypre_BoomerAMGBuildMultipass.extracted.28+exec1.391.02
Loop 1437 - par_multi_interp.c:1747-1876 - exec+0.740.54
Loop 1471 - par_multi_interp.c:1799-1803 - exec0.380.28
Loop 1451 - par_multi_interp.c:1747-1837 - exec+0.340.25
Loop 1455 - par_multi_interp.c:1816-1822 - exec0.190.14
Loop 1461 - par_multi_interp.c:1816-1822 - exec0.150.11
Loop 1475 - par_multi_interp.c:1782-1787 - exec0.020.01
hypre_CSRMatrixMatvecT.extracted.49+exec1.200.88
Loop 6542 - csr_matvec.c:560-567 - exec+0.820.60
Loop 6543 - csr_matvec.c:564-567 - exec0.240.18
Loop 6549 - csr_matvec.c:564-567 - exec0.220.16
Loop 6552 - csr_matvec.c:564-567 - exec0.210.15
Loop 6546 - csr_matvec.c:564-567 - exec0.150.11
Loop 6527 - csr_matvec.c:560-579 - exec+0.030.02
Loop 6533 - csr_matvec.c:577-579 - exec0.010.01
Loop 6529 - csr_matvec.c:577-579 - exec0.010.00
Loop 6532 - csr_matvec.c:577-579 - exec0.010.00
hypre_BoomerAMGCreateS.extracted+exec1.160.85
Loop 3386 - par_strength.c:253-472 - exec+0.590.43
Loop 3388 - par_strength.c:451-460 - exec0.390.28
Loop 3400 - par_strength.c:324-327 - exec0.180.13
Loop 3399 - par_strength.c:324-327 - exec0.020.01
Loop 3387 - par_strength.c:463-472 - exec0.010.00
Loop 3366 - par_strength.c:492-513 - exec+0.330.24
Loop 3374 - par_strength.c:498-503 - exec0.070.05
Loop 3380 - par_strength.c:498-503 - exec0.050.04
Loop 3372 - par_strength.c:498-503 - exec0.050.03
Loop 3382 - par_strength.c:498-503 - exec0.050.03
Loop 3376 - par_strength.c:498-503 - exec0.040.03
Loop 3370 - par_strength.c:498-503 - exec0.030.02
Loop 3378 - par_strength.c:498-503 - exec0.030.02
Loop 3368 - par_strength.c:498-503 - exec0.020.01
hypre_ParMatmul.extracted.12+exec1.150.85
Loop 5094 - par_csr_matop.c:865-989 - exec+0.780.57
Loop 5095 - par_csr_matop.c:937-989 - exec+0.780.57
Loop 5097 - par_csr_matop.c:946-965 - exec0.770.57
Loop 5096 - par_csr_matop.c:970-989 - exec0.010.00
Loop 5101 - par_csr_matop.c:858-859 - exec0.010.01
hypre_IJMatrixSetValuesOMPParCSR.extracted.28+exec1.120.83
Loop 5838 - IJMatrix_parcsr.c:3274-3275 - exec0.010.00
hypre_CSRMatrixMatvecOutOfPlace+exec1.110.82
Loop 6305 - csr_matvec.c:166-167 - exec1.110.82
hypre_ParMatmul_RowSizes.extracted+exec0.840.62
Loop 5043 - par_csr_matop.c:109-242 - exec+0.470.34
Loop 5060 - par_csr_matop.c:109-231 - exec+0.440.32
Loop 5063 - par_csr_matop.c:195-208 - exec0.220.16
Loop 5067 - par_csr_matop.c:195-208 - exec0.180.13
Loop 5068 - par_csr_matop.c:195-208 - exec0.030.02
Loop 5064 - par_csr_matop.c:195-208 - exec0.010.01
Loop 5058 - par_csr_matop.c:195-208 - exec0.020.01
Loop 5073 - par_csr_matop.c:109-177 - exec+0.010.00
Loop 5078 - par_csr_matop.c:170-177 - exec0.010.00
hypre_SeqVectorInnerProd.extracted+exec0.840.62
Loop 6592 - vector.c:483-486 - exec0.840.62
hypre_BoomerAMGCoarsenPMIS.extracted.15+exec0.830.62
Loop 432 - par_coarsen.c:2354-2381 - exec+0.790.58
Loop 444 - par_coarsen.c:2361-2381 - exec0.120.08
Loop 436 - par_coarsen.c:2361-2381 - exec0.120.08
Loop 440 - par_coarsen.c:2361-2381 - exec0.120.08
Loop 442 - par_coarsen.c:2361-2381 - exec0.100.07
Loop 438 - par_coarsen.c:2361-2381 - exec0.090.07
Loop 448 - par_coarsen.c:2361-2381 - exec0.090.07
Loop 434 - par_coarsen.c:2361-2381 - exec0.080.06
Loop 446 - par_coarsen.c:2361-2381 - exec0.070.05
hypre_CSRMatrixMultiply.extracted+exec0.780.57
Loop 6021 - csr_matop.c:272-298 - exec+0.350.25
Loop 6022 - csr_matop.c:282-298 - exec+0.350.25
Loop 6023 - csr_matop.c:286-298 - exec0.350.25
Loop 6029 - csr_matop.c:214-231 - exec+0.180.13
Loop 6030 - csr_matop.c:222-231 - exec+0.180.13
Loop 6031 - csr_matop.c:225-231 - exec0.180.13
BuildIJLaplacian27pt.extracted+exec0.600.45
Loop 6 - amg.c:1402-2344 - exec+0.360.26
Loop 7 - amg.c:1404-2344 - exec+0.360.26
Loop 8 - amg.c:1406-2344 - exec0.360.26
Loop 11 - amg.c:794-1367 - exec+0.240.18
Loop 12 - amg.c:796-1367 - exec+0.240.18
Loop 13 - amg.c:798-1367 - exec0.240.18
hypre_IJMatrixAssembleParCSR.extracted.25+exec0.540.40
Loop 5757 - IJMatrix_parcsr.c:2798-2812 - exec+0.540.40
Loop 5759 - IJMatrix_parcsr.c:2803-2812 - exec0.140.10
Loop 5763 - IJMatrix_parcsr.c:2803-2812 - exec0.110.08
Loop 5765 - IJMatrix_parcsr.c:2803-2812 - exec0.100.07
Loop 5761 - IJMatrix_parcsr.c:2803-2812 - exec0.080.06
Loop 5762 - IJMatrix_parcsr.c:2803-2812 - exec0.040.03
Loop 5760 - IJMatrix_parcsr.c:2803-2812 - exec0.030.02
Loop 5764 - IJMatrix_parcsr.c:2803-2812 - exec0.030.02
Loop 5758 - IJMatrix_parcsr.c:2803-2812 - exec0.010.00
hypre_BoomerAMGCoarsenPMIS.extracted.10+exec0.490.36
Loop 412 - par_coarsen.c:2435-2477 - exec+0.430.31
Loop 424 - par_coarsen.c:2465-2470 - exec0.070.05
Loop 422 - par_coarsen.c:2465-2470 - exec0.070.05
Loop 418 - par_coarsen.c:2465-2470 - exec0.070.05
Loop 420 - par_coarsen.c:2465-2470 - exec0.050.04
Loop 426 - par_coarsen.c:2465-2470 - exec0.050.04
Loop 416 - par_coarsen.c:2465-2470 - exec0.050.04
Loop 414 - par_coarsen.c:2465-2470 - exec0.040.03
Loop 428 - par_coarsen.c:2465-2470 - exec0.020.01
hypre_Randexec0.430.32
hypre_BoomerAMGBuildMultipass.extracted.27+exec0.410.30
Loop 1428 - par_multi_interp.c:1585-1660 - exec+0.330.24
Loop 1434 - par_multi_interp.c:1618-1628 - exec0.320.23
Loop 1435 - par_multi_interp.c:1612-1615 - exec0.010.01
__intel_avx_rep_memsetexec0.360.26
hypre_CSRMatrixMatvecOutOfPlace.extracted.9+exec0.360.26
Loop 6487 - csr_matvec.c:234-237 - exec0.360.26
hypre_SeqVectorSetConstantValues.extracted+exec0.350.26
Loop 6585 - vector.c:268-271 - exec0.350.26
_INTERNAL1311483b::__kmp_hyper_barrier_gather(barrier_type, kmp_info*, int, int, void (*)(void*, void*), void*)libiomp5.so0.330.24
hypre_CSRMatrixMatvecOutOfPlace.extracted.24+exec0.320.23
Loop 6512 - csr_matvec.c:158-161 - exec0.320.23
hypre_ParCSRComputeL1NormsThreads.extracted+exec0.310.23
Loop 4488 - ams.c:3382-3401 - exec+0.120.09
Loop 4495 - ams.c:3388-3389 - exec0.080.06
Loop 4491 - ams.c:3388-3389 - exec0.040.03
Loop 4384 - ams.c:3363-3540 - exec+0.070.05
Loop 4387 - ams.c:3532-3534 - exec0.070.05
Loop 4385 - ams.c:3534-3538 - exec0.010.00
ADIOI_GEN_SetLockDirect64libmpi.so.12.0.00.300.22
hypre_SeqVectorScale.extracted+exec0.290.21
Loop 6589 - vector.c:413-416 - exec0.290.21
hypre_BoomerAMGCoarsenPMIS.extracted.35+exec0.260.19
Loop 457 - par_coarsen.c:2132-2136 - exec0.260.19
MPIDI_Bcast_intra_composition_epsilon_checklibmpi.so.12.0.00.220.16
__memset_avx512_unaligned_ermslibc.so.60.180.13
hypre_BoomerAMGBuildExtPIInterp.extracted+exec0.170.12
Loop 1786 - par_lr_interp.c:1221-1748 - exec+0.060.04
Loop 1794 - par_lr_interp.c:1221-1675 - exec+0.040.03
Loop 1800 - par_lr_interp.c:1221-1627 - exec0.030.02
Loop 1797 - par_lr_interp.c:1644-1650 - exec0.010.01
Loop 1803 - par_lr_interp.c:1494-1545 - exec+0.020.01
Loop 1806 - par_lr_interp.c:1516-1526 - exec0.020.01
Loop 1824 - par_lr_interp.c:1244-1350 - exec+0.020.01
Loop 1827 - par_lr_interp.c:1264-1303 - exec+0.010.01
Loop 1830 - par_lr_interp.c:1277-1285 - exec0.010.01
Loop 1833 - par_lr_interp.c:1264-1303 - exec+0.010.00
Loop 1836 - par_lr_interp.c:1277-1285 - exec0.010.00
Loop 1809 - par_lr_interp.c:1444-1445 - exec0.010.00
hypre_CSRMatrixTranspose.extracted+exec0.150.11
Loop 6043 - csr_matop.c:540-548 - exec+0.120.08
Loop 6046 - csr_matop.c:540-548 - exec0.020.01
Loop 6044 - csr_matop.c:541-548 - exec0.020.01
Loop 6049 - csr_matop.c:540-548 - exec0.020.01
Loop 6047 - csr_matop.c:540-548 - exec0.020.01
Loop 6050 - csr_matop.c:540-548 - exec0.020.01
Loop 6045 - csr_matop.c:540-548 - exec0.010.00
Loop 6051 - csr_matop.c:540-548 - exec0.010.00
Loop 6060 - csr_matop.c:483-485 - exec0.010.01
Loop 6059 - csr_matop.c:380-500 - exec0.010.00
hypre_qsort0exec0.140.10
I_MPI_memcpy_multipage_sselibmpi.so.12.0.00.120.08
hypre_ParTMatmul.extracted+exec0.110.08
Loop 5173 - par_csr_matop.c:3467-3634 - exec+0.050.04
Loop 5174 - par_csr_matop.c:3467-3634 - exec+0.050.04
Loop 5178 - par_csr_matop.c:3505-3608 - exec0.050.04
Loop 5207 - par_csr_matop.c:3467-3528 - exec+0.050.04
Loop 5208 - par_csr_matop.c:3467-3522 - exec+0.050.04
Loop 5212 - par_csr_matop.c:3504-3505 - exec0.050.03
Loop 5213 - par_csr_matop.c:3504-3505 - exec0.010.00
hypre_BoomerAMGCoarsenPMIS.extracted+exec0.110.08
Loop 411 - par_coarsen.c:2528-2536 - exec0.060.04
Loop 407 - par_coarsen.c:2562-2567 - exec0.050.03
hypre_IJMatrixSetDiagOffdSizesParCSRexec0.070.05
hypre_BoomerAMGCoarsenPMISexec0.070.05
hypre_CSRMatrixMatvecOutOfPlace.extracted.19+exec0.060.04
Loop 6506 - csr_matvec.c:178-196 - exec+0.010.00
Loop 6507 - csr_matvec.c:194-195 - exec0.010.00
hypre_CSRMatrixSetRownnzexec0.060.04
hypre_BoomerAMGCorrectCFMarkerexec0.060.04
hypre_BoomerAMGCoarsenPMIS.extracted.25+exec0.050.04
Loop 455 - par_coarsen.c:2327-2334 - exec0.050.04
I_MPI_memcpy_nontemporal_multipage_sselibmpi.so.12.0.00.050.03
kmp_flag_native::notdone_check()libiomp5.so0.050.03
mainexec0.050.03
hypre_BinarySearchexec0.040.03
MPIDI_SHMI_progresslibmpi.so.12.0.00.030.02
MPIR_Progress_hook_exec_on_vcilibmpi.so.12.0.00.030.02
hypre_BoomerAMGCoarseParmsexec0.030.02
MPID_Progress_waitlibmpi.so.12.0.00.030.02
hypre_ParCSRRelaxThreadsexec0.030.02
hypre_BoomerAMGCreate2ndS.extracted+exec0.020.01
Loop 3422 - par_strength.c:1268-1278 - exec0.010.01
Loop 3423 - par_strength.c:1261-1263 - exec0.010.00
hypre_BoomerAMGBuildMultipass.extracted.31exec0.020.01
hypre_BoomerAMGIndepSetInitexec0.020.01
__GI___sched_yieldlibc.so.60.010.01
impi_shm_heap_progresslibmpi.so.12.0.00.010.01
hypre_BoomerAMGCreate2ndSexec0.010.01
hypre_qsort2absexec0.010.01
hypre_BoomerAMGCoarsenPMIS.extracted.30+exec0.010.01
Loop 456 - par_coarsen.c:2139-2142 - exec0.010.01
×