options

Profiling node gpu04sas.benchmarkcenter.megware.com - process 17335 - thread 17335

NameModuleCoverage (%)Time (s)
hypre_ParCSRRelaxThreads.extracted.57+exec44.5132.81
Loop 4557 - ams.c:3662-3682 - exec+21.2115.63
Loop 4559 - ams.c:3672-3675 - exec12.819.44
Loop 4561 - ams.c:3672-3675 - exec8.346.14
Loop 4558 - ams.c:3677-3680 - exec0.050.04
Loop 4560 - ams.c:3677-3680 - exec0.010.01
hypre_CSRMatrixMatvecOutOfPlace.extracted+exec23.1317.05
Loop 6478 - csr_matvec.c:248-263 - exec+6.204.57
Loop 6481 - csr_matvec.c:259-261 - exec2.812.07
Loop 6482 - csr_matvec.c:259-261 - exec0.790.58
Loop 6483 - csr_matvec.c:259-261 - exec0.650.48
Loop 6484 - csr_matvec.c:259-261 - exec0.610.45
Loop 6485 - csr_matvec.c:259-261 - exec0.520.38
Loop 6479 - csr_matvec.c:259-261 - exec0.300.22
Loop 6486 - csr_matvec.c:259-261 - exec0.280.21
Loop 6480 - csr_matvec.c:259-261 - exec0.240.18
Loop 6434 - csr_matvec.c:248-314 - exec+6.004.42
Loop 6437 - csr_matvec.c:310-312 - exec2.181.61
Loop 6438 - csr_matvec.c:310-312 - exec0.950.70
Loop 6440 - csr_matvec.c:310-312 - exec0.820.61
Loop 6439 - csr_matvec.c:310-312 - exec0.690.51
Loop 6441 - csr_matvec.c:310-312 - exec0.510.37
Loop 6436 - csr_matvec.c:310-312 - exec0.350.25
Loop 6442 - csr_matvec.c:310-312 - exec0.320.23
Loop 6435 - csr_matvec.c:310-312 - exec0.180.13
Loop 6416 - csr_matvec.c:248-341 - exec+0.050.04
Loop 6417 - csr_matvec.c:337-339 - exec0.020.01
Loop 6420 - csr_matvec.c:337-339 - exec0.010.01
Loop 6421 - csr_matvec.c:337-339 - exec0.010.00
Loop 6423 - csr_matvec.c:337-339 - exec0.010.00
Loop 6419 - csr_matvec.c:337-339 - exec0.010.00
hypre_BoomerAMGBuildMultipass+exec6.684.92
Loop 1297 - par_multi_interp.c:646-661 - exec+2.291.68
Loop 1299 - par_multi_interp.c:651-655 - exec2.291.68
Loop 1300 - par_multi_interp.c:205-600 - exec+1.691.25
Loop 1311 - par_multi_interp.c:205-571 - exec+1.691.25
Loop 1313 - par_multi_interp.c:554-557 - exec1.681.24
Loop 1312 - par_multi_interp.c:568-571 - exec0.010.00
Loop 1325 - par_multi_interp.c:488-514 - exec+1.491.10
Loop 1327 - par_multi_interp.c:491-498 - exec1.491.10
Loop 1247 - par_multi_interp.c:1158-1161 - exec0.180.13
Loop 1352 - par_multi_interp.c:385-399 - exec0.130.09
_ZN17_INTERNAL1311483b26__kmp_hyper_barrier_gatherE12barrier_typeP8kmp_infoiiPFvPvS3_ES3_..0libiomp5.so1.801.33
__intel_avx_rep_memcpy+exec1.621.19
Loop 6767 - - exec1.591.17
hypre_BoomerAMGCreate2ndS.extracted.17+exec1.581.17
Loop 3478 - par_strength.c:1714-1797 - exec+0.640.47
Loop 3488 - par_strength.c:1731-1765 - exec+0.350.26
Loop 3490 - par_strength.c:1743-1752 - exec0.350.26
Loop 3482 - par_strength.c:1731-1765 - exec+0.280.21
Loop 3484 - par_strength.c:1743-1752 - exec0.280.21
Loop 3436 - par_strength.c:2000-2083 - exec+0.630.46
Loop 3440 - par_strength.c:2011-2048 - exec+0.320.23
Loop 3442 - par_strength.c:2024-2034 - exec0.310.23
Loop 3441 - par_strength.c:2038-2048 - exec0.010.00
Loop 3446 - par_strength.c:2011-2048 - exec+0.310.23
Loop 3448 - par_strength.c:2024-2034 - exec0.310.22
Loop 3447 - par_strength.c:2038-2048 - exec0.010.00
Loop 3458 - par_strength.c:1951-1953 - exec0.030.02
Loop 3492 - par_strength.c:1691-1693 - exec0.010.01
hypre_BoomerAMGBuildMultipass.extracted.34+exec1.491.10
Loop 1492 - par_multi_interp.c:917-997 - exec+0.200.15
Loop 1496 - par_multi_interp.c:917-970 - exec+0.200.15
Loop 1499 - par_multi_interp.c:951-958 - exec0.200.15
Loop 1480 - par_multi_interp.c:917-1125 - exec+0.180.13
Loop 1484 - par_multi_interp.c:917-1099 - exec+0.180.13
Loop 1487 - par_multi_interp.c:1082-1088 - exec0.170.12
Loop 1488 - par_multi_interp.c:1082-1088 - exec0.010.00
hypre_SeqVectorAxpy.extracted+exec1.491.09
Loop 6590 - vector.c:449-452 - exec1.481.09
hypre_BoomerAMGBuildMultipass.extracted.28+exec1.381.02
Loop 1437 - par_multi_interp.c:1747-1876 - exec+0.810.59
Loop 1471 - par_multi_interp.c:1799-1803 - exec0.460.34
Loop 1451 - par_multi_interp.c:1747-1837 - exec+0.320.23
Loop 1455 - par_multi_interp.c:1816-1822 - exec0.190.14
Loop 1461 - par_multi_interp.c:1816-1822 - exec0.130.09
Loop 1475 - par_multi_interp.c:1782-1787 - exec0.020.01
Loop 1470 - par_multi_interp.c:1805-1809 - exec0.010.00
hypre_CSRMatrixMatvecT.extracted.49+exec1.230.91
Loop 6542 - csr_matvec.c:560-567 - exec+0.790.58
Loop 6546 - csr_matvec.c:564-567 - exec0.240.17
Loop 6552 - csr_matvec.c:564-567 - exec0.220.16
Loop 6543 - csr_matvec.c:564-567 - exec0.190.14
Loop 6549 - csr_matvec.c:564-567 - exec0.140.10
Loop 6527 - csr_matvec.c:560-579 - exec+0.080.06
Loop 6535 - csr_matvec.c:577-579 - exec0.040.03
Loop 6530 - csr_matvec.c:577-579 - exec0.010.01
Loop 6529 - csr_matvec.c:577-579 - exec0.010.01
Loop 6531 - csr_matvec.c:577-579 - exec0.010.00
Loop 6532 - csr_matvec.c:577-579 - exec0.010.00
hypre_ParMatmul.extracted.12+exec1.130.83
Loop 5094 - par_csr_matop.c:865-989 - exec+0.840.62
Loop 5095 - par_csr_matop.c:937-989 - exec+0.840.62
Loop 5097 - par_csr_matop.c:946-965 - exec0.830.61
Loop 5096 - par_csr_matop.c:970-989 - exec0.010.01
hypre_CSRMatrixMatvecOutOfPlace+exec1.130.83
Loop 6305 - csr_matvec.c:166-167 - exec1.130.83
hypre_BoomerAMGCreateS.extracted+exec1.120.83
Loop 3386 - par_strength.c:253-472 - exec+0.600.44
Loop 3388 - par_strength.c:451-460 - exec0.410.30
Loop 3400 - par_strength.c:324-327 - exec0.180.13
Loop 3399 - par_strength.c:324-327 - exec0.020.01
Loop 3366 - par_strength.c:492-513 - exec+0.330.24
Loop 3378 - par_strength.c:498-503 - exec0.070.05
Loop 3370 - par_strength.c:498-503 - exec0.060.04
Loop 3372 - par_strength.c:498-503 - exec0.060.04
Loop 3382 - par_strength.c:498-503 - exec0.030.02
Loop 3368 - par_strength.c:498-503 - exec0.030.02
Loop 3380 - par_strength.c:498-503 - exec0.030.02
Loop 3374 - par_strength.c:498-503 - exec0.020.01
Loop 3376 - par_strength.c:498-503 - exec0.010.00
Loop 3375 - par_strength.c:508-513 - exec0.010.00
hypre_IJMatrixSetValuesOMPParCSR.extracted.28+exec1.030.76
Loop 5838 - IJMatrix_parcsr.c:3274-3275 - exec0.010.00
hypre_ParMatmul_RowSizes.extracted+exec0.840.62
Loop 5043 - par_csr_matop.c:109-242 - exec+0.490.36
Loop 5060 - par_csr_matop.c:109-231 - exec+0.470.35
Loop 5063 - par_csr_matop.c:195-208 - exec0.250.18
Loop 5067 - par_csr_matop.c:195-208 - exec0.220.16
Loop 5068 - par_csr_matop.c:195-208 - exec0.010.00
Loop 5073 - par_csr_matop.c:109-177 - exec+0.010.00
Loop 5076 - par_csr_matop.c:154-167 - exec0.010.00
Loop 5058 - par_csr_matop.c:195-208 - exec0.010.00
hypre_BoomerAMGCoarsenPMIS.extracted.15+exec0.840.62
Loop 432 - par_coarsen.c:2354-2381 - exec+0.790.58
Loop 434 - par_coarsen.c:2361-2381 - exec0.130.09
Loop 438 - par_coarsen.c:2361-2381 - exec0.120.09
Loop 442 - par_coarsen.c:2361-2381 - exec0.090.07
Loop 446 - par_coarsen.c:2361-2381 - exec0.090.07
Loop 448 - par_coarsen.c:2361-2381 - exec0.090.06
Loop 444 - par_coarsen.c:2361-2381 - exec0.090.06
Loop 440 - par_coarsen.c:2361-2381 - exec0.090.06
Loop 436 - par_coarsen.c:2361-2381 - exec0.080.06
Loop 435 - par_coarsen.c:2372-2380 - exec0.010.00
hypre_SeqVectorInnerProd.extracted+exec0.830.61
Loop 6592 - vector.c:483-486 - exec0.830.61
hypre_CSRMatrixMultiply.extracted+exec0.750.55
Loop 6021 - csr_matop.c:272-298 - exec+0.350.25
Loop 6022 - csr_matop.c:282-298 - exec+0.350.25
Loop 6023 - csr_matop.c:286-298 - exec0.350.25
Loop 6029 - csr_matop.c:214-231 - exec+0.170.12
Loop 6030 - csr_matop.c:222-231 - exec+0.170.12
Loop 6031 - csr_matop.c:225-231 - exec0.170.12
BuildIJLaplacian27pt.extracted+exec0.570.42
Loop 6 - amg.c:1402-2344 - exec+0.330.24
Loop 7 - amg.c:1404-2344 - exec+0.330.24
Loop 8 - amg.c:1406-2344 - exec0.330.24
Loop 11 - amg.c:794-1367 - exec+0.220.16
Loop 12 - amg.c:796-1367 - exec+0.220.16
Loop 13 - amg.c:798-1367 - exec0.220.16
hypre_IJMatrixAssembleParCSR.extracted.25+exec0.540.40
Loop 5757 - IJMatrix_parcsr.c:2798-2812 - exec+0.540.40
Loop 5765 - IJMatrix_parcsr.c:2803-2812 - exec0.140.10
Loop 5763 - IJMatrix_parcsr.c:2803-2812 - exec0.140.10
Loop 5761 - IJMatrix_parcsr.c:2803-2812 - exec0.120.09
Loop 5758 - IJMatrix_parcsr.c:2803-2812 - exec0.050.04
Loop 5759 - IJMatrix_parcsr.c:2803-2812 - exec0.050.04
Loop 5760 - IJMatrix_parcsr.c:2803-2812 - exec0.020.01
Loop 5762 - IJMatrix_parcsr.c:2803-2812 - exec0.020.01
Loop 5764 - IJMatrix_parcsr.c:2803-2812 - exec0.010.01
hypre_BoomerAMGCoarsenPMIS.extracted.10+exec0.490.36
Loop 412 - par_coarsen.c:2435-2477 - exec+0.420.31
Loop 416 - par_coarsen.c:2465-2470 - exec0.070.05
Loop 422 - par_coarsen.c:2465-2470 - exec0.070.05
Loop 424 - par_coarsen.c:2465-2470 - exec0.070.05
Loop 414 - par_coarsen.c:2465-2470 - exec0.060.04
Loop 426 - par_coarsen.c:2465-2470 - exec0.060.04
Loop 418 - par_coarsen.c:2465-2470 - exec0.040.03
Loop 420 - par_coarsen.c:2465-2470 - exec0.030.02
Loop 428 - par_coarsen.c:2465-2470 - exec0.020.01
hypre_Randexec0.440.32
hypre_BoomerAMGBuildMultipass.extracted.27+exec0.410.30
Loop 1428 - par_multi_interp.c:1585-1660 - exec+0.350.25
Loop 1434 - par_multi_interp.c:1618-1628 - exec0.350.25
_INTERNAL1311483b::__kmp_hyper_barrier_gather(barrier_type, kmp_info*, int, int, void (*)(void*, void*), void*)libiomp5.so0.370.27
hypre_CSRMatrixMatvecOutOfPlace.extracted.9+exec0.350.26
Loop 6487 - csr_matvec.c:234-237 - exec0.350.26
hypre_CSRMatrixMatvecOutOfPlace.extracted.24+exec0.340.25
Loop 6512 - csr_matvec.c:158-161 - exec0.340.25
hypre_SeqVectorSetConstantValues.extracted+exec0.330.24
Loop 6585 - vector.c:268-271 - exec0.330.24
MPIDI_Bcast_intra_composition_epsilon_checklibmpi.so.12.0.00.310.22
hypre_ParCSRComputeL1NormsThreads.extracted+exec0.300.22
Loop 4488 - ams.c:3382-3401 - exec+0.140.10
Loop 4495 - ams.c:3388-3389 - exec0.090.07
Loop 4491 - ams.c:3388-3389 - exec0.050.04
Loop 4384 - ams.c:3363-3540 - exec+0.070.05
Loop 4387 - ams.c:3532-3534 - exec0.070.05
hypre_SeqVectorScale.extracted+exec0.290.21
Loop 6589 - vector.c:413-416 - exec0.290.21
__intel_avx_rep_memsetexec0.260.20
hypre_BoomerAMGCoarsenPMIS.extracted.35+exec0.240.18
Loop 457 - par_coarsen.c:2132-2136 - exec0.240.18
ADIOI_GEN_SetLockDirect64libmpi.so.12.0.00.200.15
hypre_BoomerAMGBuildExtPIInterp.extracted+exec0.160.11
Loop 1786 - par_lr_interp.c:1221-1748 - exec+0.100.07
Loop 1794 - par_lr_interp.c:1221-1675 - exec+0.070.05
Loop 1800 - par_lr_interp.c:1221-1627 - exec0.060.04
Loop 1797 - par_lr_interp.c:1644-1650 - exec0.010.01
Loop 1803 - par_lr_interp.c:1494-1545 - exec+0.030.02
Loop 1806 - par_lr_interp.c:1516-1526 - exec0.030.02
Loop 1824 - par_lr_interp.c:1244-1350 - exec+0.010.01
Loop 1827 - par_lr_interp.c:1264-1303 - exec+0.010.01
Loop 1830 - par_lr_interp.c:1277-1285 - exec0.010.01
Loop 1809 - par_lr_interp.c:1444-1445 - exec0.010.00
hypre_CSRMatrixTranspose.extracted+exec0.150.11
Loop 6043 - csr_matop.c:540-548 - exec+0.120.09
Loop 6047 - csr_matop.c:540-548 - exec0.030.02
Loop 6045 - csr_matop.c:540-548 - exec0.030.02
Loop 6051 - csr_matop.c:540-548 - exec0.020.01
Loop 6046 - csr_matop.c:540-548 - exec0.010.01
Loop 6044 - csr_matop.c:541-548 - exec0.010.01
Loop 6048 - csr_matop.c:540-548 - exec0.010.00
Loop 6049 - csr_matop.c:540-548 - exec0.010.00
Loop 6060 - csr_matop.c:483-485 - exec0.020.01
I_MPI_memcpy_multipage_sselibmpi.so.12.0.00.140.10
hypre_qsort0exec0.140.10
__memset_avx512_unaligned_ermslibc.so.60.120.09
hypre_ParTMatmul.extracted+exec0.120.08
Loop 5173 - par_csr_matop.c:3467-3634 - exec+0.060.04
Loop 5174 - par_csr_matop.c:3467-3634 - exec+0.060.04
Loop 5178 - par_csr_matop.c:3505-3608 - exec0.060.04
Loop 5207 - par_csr_matop.c:3467-3528 - exec+0.050.03
Loop 5208 - par_csr_matop.c:3467-3522 - exec+0.040.03
Loop 5212 - par_csr_matop.c:3504-3505 - exec0.040.03
Loop 5236 - par_csr_matop.c:3491-3495 - exec0.010.00
hypre_BoomerAMGCoarsenPMIS.extracted+exec0.090.06
Loop 411 - par_coarsen.c:2528-2536 - exec0.050.04
Loop 407 - par_coarsen.c:2562-2567 - exec0.030.02
hypre_ParCSRRelaxThreadsexec0.080.06
hypre_BoomerAMGCoarsenPMISexec0.080.06
hypre_CSRMatrixMatvecOutOfPlace.extracted.19+exec0.070.05
Loop 6506 - csr_matvec.c:178-196 - exec+0.030.02
Loop 6508 - csr_matvec.c:194-195 - exec0.020.01
Loop 6507 - csr_matvec.c:194-195 - exec0.010.01
hypre_BoomerAMGCoarsenPMIS.extracted.25+exec0.070.05
Loop 455 - par_coarsen.c:2327-2334 - exec0.070.05
hypre_CSRMatrixSetRownnzexec0.070.05
hypre_BoomerAMGCorrectCFMarkerexec0.070.05
hypre_IJMatrixSetDiagOffdSizesParCSRexec0.050.04
hypre_BinarySearchexec0.050.04
hypre_BoomerAMGCoarseParmsexec0.050.04
MPIR_Progress_hook_exec_on_vcilibmpi.so.12.0.00.040.03
MPIDI_SHMI_progresslibmpi.so.12.0.00.030.02
kmp_flag_native::notdone_check()libiomp5.so0.030.02
__GI___sched_yieldlibc.so.60.030.02
impi_shm_heap_progresslibmpi.so.12.0.00.030.02
MPID_Progress_waitlibmpi.so.12.0.00.030.02
mainexec0.030.02
hypre_BoomerAMGCoarsenPMIS.extracted.30+exec0.020.01
Loop 456 - par_coarsen.c:2139-2142 - exec0.020.01
I_MPI_memcpy_nontemporal_multipage_sselibmpi.so.12.0.00.010.01
hypre_BoomerAMGCreate2ndS.extracted+exec0.010.01
Loop 3422 - par_strength.c:1268-1278 - exec0.010.00
Loop 3423 - par_strength.c:1261-1263 - exec0.010.00
hypre_BoomerAMGCreate2ndSexec0.010.01
hypre_BoomerAMGBuildMultipass.extracted.31exec0.010.01
hypre_BoomerAMGIndepSetInitexec0.010.01
×