options

Profiling node gpu04sas.benchmarkcenter.megware.com - process 17336 - thread 17398

NameModuleCoverage (%)Time (s)
hypre_ParCSRRelaxThreads.extracted.57+exec47.9633.32
Loop 4557 - ams.c:3662-3682 - exec+23.3316.21
Loop 4559 - ams.c:3672-3675 - exec14.289.92
Loop 4561 - ams.c:3672-3675 - exec9.006.25
Loop 4558 - ams.c:3677-3680 - exec0.040.03
Loop 4560 - ams.c:3677-3680 - exec0.010.01
hypre_CSRMatrixMatvecOutOfPlace.extracted+exec24.5117.03
Loop 6478 - csr_matvec.c:248-263 - exec+6.404.45
Loop 6480 - csr_matvec.c:259-261 - exec2.741.90
Loop 6481 - csr_matvec.c:259-261 - exec0.890.62
Loop 6482 - csr_matvec.c:259-261 - exec0.840.59
Loop 6483 - csr_matvec.c:259-261 - exec0.680.47
Loop 6484 - csr_matvec.c:259-261 - exec0.500.35
Loop 6485 - csr_matvec.c:259-261 - exec0.300.21
Loop 6486 - csr_matvec.c:259-261 - exec0.260.18
Loop 6479 - csr_matvec.c:259-261 - exec0.190.13
Loop 6434 - csr_matvec.c:248-314 - exec+5.944.13
Loop 6436 - csr_matvec.c:310-312 - exec1.861.29
Loop 6437 - csr_matvec.c:310-312 - exec1.050.73
Loop 6439 - csr_matvec.c:310-312 - exec0.890.62
Loop 6438 - csr_matvec.c:310-312 - exec0.830.57
Loop 6440 - csr_matvec.c:310-312 - exec0.470.33
Loop 6442 - csr_matvec.c:310-312 - exec0.330.23
Loop 6441 - csr_matvec.c:310-312 - exec0.300.21
Loop 6435 - csr_matvec.c:310-312 - exec0.210.14
Loop 6416 - csr_matvec.c:248-341 - exec+0.010.01
Loop 6422 - csr_matvec.c:337-339 - exec0.010.00
Loop 6419 - csr_matvec.c:337-339 - exec0.010.00
bool _INTERNAL1311483b::__kmp_wait_template, true, false, true>(kmp_info*, kmp_flag_64*, void*)libiomp5.so4.873.38
hypre_BoomerAMGCreate2ndS.extracted.17+exec1.731.20
Loop 3436 - par_strength.c:2000-2083 - exec+0.650.45
Loop 3446 - par_strength.c:2011-2048 - exec+0.390.27
Loop 3448 - par_strength.c:2024-2034 - exec0.380.27
Loop 3447 - par_strength.c:2038-2048 - exec0.010.00
Loop 3440 - par_strength.c:2011-2048 - exec+0.260.18
Loop 3442 - par_strength.c:2024-2034 - exec0.260.18
Loop 3478 - par_strength.c:1714-1797 - exec+0.650.45
Loop 3488 - par_strength.c:1731-1765 - exec+0.370.25
Loop 3490 - par_strength.c:1743-1752 - exec0.370.25
Loop 3482 - par_strength.c:1731-1765 - exec+0.280.19
Loop 3484 - par_strength.c:1743-1752 - exec0.280.19
Loop 3458 - par_strength.c:1951-1953 - exec0.030.02
Loop 3492 - par_strength.c:1691-1693 - exec0.010.01
Loop 3456 - par_strength.c:1679-1984 - exec0.010.00
hypre_BoomerAMGBuildMultipass.extracted.34+exec1.671.16
Loop 1492 - par_multi_interp.c:917-997 - exec+0.240.17
Loop 1496 - par_multi_interp.c:917-970 - exec+0.240.17
Loop 1499 - par_multi_interp.c:951-958 - exec0.240.16
Loop 1497 - par_multi_interp.c:963-970 - exec0.010.00
Loop 1480 - par_multi_interp.c:917-1125 - exec+0.220.15
Loop 1484 - par_multi_interp.c:917-1099 - exec+0.220.15
Loop 1487 - par_multi_interp.c:1082-1088 - exec0.220.15
Loop 1490 - par_multi_interp.c:1030-1034 - exec0.040.03
__intel_avx_rep_memcpy+exec1.641.14
Loop 6767 - - exec1.631.13
hypre_SeqVectorAxpy.extracted+exec1.601.11
Loop 6590 - vector.c:449-452 - exec1.601.11
hypre_BoomerAMGBuildMultipass.extracted.28+exec1.531.06
Loop 1437 - par_multi_interp.c:1747-1876 - exec+0.810.57
Loop 1471 - par_multi_interp.c:1799-1803 - exec0.380.27
Loop 1451 - par_multi_interp.c:1747-1837 - exec+0.370.26
Loop 1461 - par_multi_interp.c:1816-1822 - exec0.190.13
Loop 1455 - par_multi_interp.c:1816-1822 - exec0.180.13
Loop 1475 - par_multi_interp.c:1782-1787 - exec0.060.04
hypre_IJMatrixSetValuesOMPParCSR.extracted.28+exec1.290.89
Loop 5838 - IJMatrix_parcsr.c:3274-3275 - exec0.010.00
hypre_ParMatmul.extracted.12+exec1.270.88
Loop 5094 - par_csr_matop.c:865-989 - exec+0.990.69
Loop 5095 - par_csr_matop.c:937-989 - exec+0.990.69
Loop 5097 - par_csr_matop.c:946-965 - exec0.990.69
Loop 5098 - par_csr_matop.c:888-928 - exec+0.010.00
Loop 5100 - par_csr_matop.c:897-915 - exec0.010.00
hypre_CSRMatrixMatvecT.extracted.49+exec1.260.87
Loop 6542 - csr_matvec.c:560-567 - exec+0.850.59
Loop 6552 - csr_matvec.c:564-567 - exec0.280.19
Loop 6549 - csr_matvec.c:564-567 - exec0.230.16
Loop 6546 - csr_matvec.c:564-567 - exec0.210.14
Loop 6543 - csr_matvec.c:564-567 - exec0.130.09
Loop 6527 - csr_matvec.c:560-579 - exec+0.030.02
Loop 6533 - csr_matvec.c:577-579 - exec0.020.01
Loop 6530 - csr_matvec.c:577-579 - exec0.010.00
hypre_BoomerAMGCreateS.extracted+exec1.240.86
Loop 3386 - par_strength.c:253-472 - exec+0.610.42
Loop 3388 - par_strength.c:451-460 - exec0.420.29
Loop 3400 - par_strength.c:324-327 - exec0.180.12
Loop 3399 - par_strength.c:324-327 - exec0.010.01
Loop 3366 - par_strength.c:492-513 - exec+0.360.25
Loop 3382 - par_strength.c:498-503 - exec0.080.05
Loop 3372 - par_strength.c:498-503 - exec0.060.04
Loop 3376 - par_strength.c:498-503 - exec0.050.03
Loop 3374 - par_strength.c:498-503 - exec0.050.03
Loop 3370 - par_strength.c:498-503 - exec0.040.03
Loop 3380 - par_strength.c:498-503 - exec0.040.03
Loop 3378 - par_strength.c:498-503 - exec0.040.03
Loop 3368 - par_strength.c:498-503 - exec0.010.01
hypre_ParMatmul_RowSizes.extracted+exec0.990.69
Loop 5043 - par_csr_matop.c:109-242 - exec+0.600.41
Loop 5060 - par_csr_matop.c:109-231 - exec+0.580.40
Loop 5063 - par_csr_matop.c:195-208 - exec0.280.19
Loop 5067 - par_csr_matop.c:195-208 - exec0.280.19
Loop 5068 - par_csr_matop.c:195-208 - exec0.010.00
Loop 5061 - par_csr_matop.c:218-231 - exec0.010.00
Loop 5073 - par_csr_matop.c:109-177 - exec+0.010.01
Loop 5074 - par_csr_matop.c:170-177 - exec0.010.00
Loop 5076 - par_csr_matop.c:154-167 - exec0.010.00
Loop 5058 - par_csr_matop.c:195-208 - exec0.010.00
Loop 5040 - par_csr_matop.c:263-266 - exec0.030.02
hypre_BoomerAMGCoarsenPMIS.extracted.15+exec0.960.67
Loop 432 - par_coarsen.c:2354-2381 - exec+0.890.62
Loop 448 - par_coarsen.c:2361-2381 - exec0.160.11
Loop 440 - par_coarsen.c:2361-2381 - exec0.140.10
Loop 436 - par_coarsen.c:2361-2381 - exec0.130.09
Loop 446 - par_coarsen.c:2361-2381 - exec0.120.08
Loop 444 - par_coarsen.c:2361-2381 - exec0.120.08
Loop 442 - par_coarsen.c:2361-2381 - exec0.090.07
Loop 438 - par_coarsen.c:2361-2381 - exec0.090.06
Loop 434 - par_coarsen.c:2361-2381 - exec0.040.03
Loop 439 - par_coarsen.c:2372-2380 - exec0.010.00
hypre_CSRMatrixMultiply.extracted+exec0.940.66
Loop 6021 - csr_matop.c:272-298 - exec+0.400.28
Loop 6022 - csr_matop.c:282-298 - exec+0.400.28
Loop 6023 - csr_matop.c:286-298 - exec0.400.28
Loop 6029 - csr_matop.c:214-231 - exec+0.250.18
Loop 6030 - csr_matop.c:222-231 - exec+0.250.18
Loop 6031 - csr_matop.c:225-231 - exec0.250.18
hypre_SeqVectorInnerProd.extracted+exec0.900.62
Loop 6592 - vector.c:483-486 - exec0.900.62
BuildIJLaplacian27pt.extracted+exec0.610.43
Loop 6 - amg.c:1402-2344 - exec+0.340.24
Loop 7 - amg.c:1404-2344 - exec+0.340.24
Loop 8 - amg.c:1406-2344 - exec0.340.24
Loop 11 - amg.c:794-1367 - exec+0.270.19
Loop 12 - amg.c:796-1367 - exec+0.270.19
Loop 13 - amg.c:798-1367 - exec0.270.19
hypre_IJMatrixAssembleParCSR.extracted.25+exec0.580.41
Loop 5757 - IJMatrix_parcsr.c:2798-2812 - exec+0.580.40
Loop 5759 - IJMatrix_parcsr.c:2803-2812 - exec0.160.11
Loop 5765 - IJMatrix_parcsr.c:2803-2812 - exec0.120.08
Loop 5763 - IJMatrix_parcsr.c:2803-2812 - exec0.120.08
Loop 5761 - IJMatrix_parcsr.c:2803-2812 - exec0.060.04
Loop 5764 - IJMatrix_parcsr.c:2803-2812 - exec0.040.03
Loop 5762 - IJMatrix_parcsr.c:2803-2812 - exec0.030.02
Loop 5760 - IJMatrix_parcsr.c:2803-2812 - exec0.020.01
Loop 5758 - IJMatrix_parcsr.c:2803-2812 - exec0.020.01
hypre_BoomerAMGCoarsenPMIS.extracted.10+exec0.530.36
Loop 412 - par_coarsen.c:2435-2477 - exec+0.430.30
Loop 416 - par_coarsen.c:2465-2470 - exec0.090.06
Loop 422 - par_coarsen.c:2465-2470 - exec0.060.05
Loop 428 - par_coarsen.c:2465-2470 - exec0.060.05
Loop 414 - par_coarsen.c:2465-2470 - exec0.050.04
Loop 418 - par_coarsen.c:2465-2470 - exec0.050.03
Loop 426 - par_coarsen.c:2465-2470 - exec0.040.03
Loop 424 - par_coarsen.c:2465-2470 - exec0.040.03
Loop 420 - par_coarsen.c:2465-2470 - exec0.030.02
hypre_BoomerAMGBuildMultipass.extracted.27+exec0.450.31
Loop 1428 - par_multi_interp.c:1585-1660 - exec+0.390.27
Loop 1434 - par_multi_interp.c:1618-1628 - exec0.370.25
Loop 1435 - par_multi_interp.c:1612-1615 - exec0.020.01
hypre_CSRMatrixMatvecOutOfPlace.extracted.9+exec0.360.25
Loop 6487 - csr_matvec.c:234-237 - exec0.360.25
hypre_CSRMatrixMatvecOutOfPlace.extracted.24+exec0.350.24
Loop 6512 - csr_matvec.c:158-161 - exec0.350.24
hypre_ParCSRComputeL1NormsThreads.extracted+exec0.340.23
Loop 4488 - ams.c:3382-3401 - exec+0.170.11
Loop 4491 - ams.c:3388-3389 - exec0.090.06
Loop 4495 - ams.c:3388-3389 - exec0.080.05
Loop 4384 - ams.c:3363-3540 - exec+0.070.05
Loop 4387 - ams.c:3532-3534 - exec0.060.05
Loop 4385 - ams.c:3534-3538 - exec0.010.00
__intel_avx_rep_memsetexec0.340.23
hypre_SeqVectorSetConstantValues.extracted+exec0.330.23
Loop 6585 - vector.c:268-271 - exec0.330.23
hypre_SeqVectorScale.extracted+exec0.300.21
Loop 6589 - vector.c:413-416 - exec0.300.21
hypre_BoomerAMGCoarsenPMIS.extracted.35+exec0.270.19
Loop 457 - par_coarsen.c:2132-2136 - exec0.270.19
hypre_BoomerAMGBuildExtPIInterp.extracted+exec0.240.17
Loop 1786 - par_lr_interp.c:1221-1748 - exec+0.170.12
Loop 1794 - par_lr_interp.c:1221-1675 - exec+0.120.08
Loop 1800 - par_lr_interp.c:1221-1627 - exec0.060.05
Loop 1797 - par_lr_interp.c:1644-1650 - exec0.050.04
Loop 1803 - par_lr_interp.c:1494-1545 - exec+0.040.03
Loop 1806 - par_lr_interp.c:1516-1526 - exec0.040.03
Loop 1801 - par_lr_interp.c:1534-1596 - exec+0.010.00
Loop 1802 - par_lr_interp.c:1573-1596 - exec0.010.00
Loop 1789 - par_lr_interp.c:1221-1736 - exec+0.010.00
Loop 1793 - par_lr_interp.c:1688-1700 - exec0.010.00
Loop 1824 - par_lr_interp.c:1244-1350 - exec+0.040.02
Loop 1833 - par_lr_interp.c:1264-1303 - exec+0.030.02
Loop 1836 - par_lr_interp.c:1277-1285 - exec0.030.02
Loop 1827 - par_lr_interp.c:1264-1303 - exec+0.010.00
Loop 1830 - par_lr_interp.c:1277-1285 - exec0.010.00
hypre_CSRMatrixTranspose.extracted+exec0.160.11
Loop 6043 - csr_matop.c:540-548 - exec+0.110.07
Loop 6044 - csr_matop.c:541-548 - exec0.040.03
Loop 6047 - csr_matop.c:540-548 - exec0.010.01
Loop 6049 - csr_matop.c:540-548 - exec0.010.01
Loop 6051 - csr_matop.c:540-548 - exec0.010.00
Loop 6050 - csr_matop.c:540-548 - exec0.010.00
Loop 6048 - csr_matop.c:540-548 - exec0.010.00
Loop 6045 - csr_matop.c:540-548 - exec0.010.00
Loop 6046 - csr_matop.c:540-548 - exec0.010.00
Loop 6060 - csr_matop.c:483-485 - exec0.010.01
Loop 6055 - csr_matop.c:380-527 - exec0.010.00
_ZN17_INTERNAL1311483b26__kmp_hyper_barrier_gatherE12barrier_typeP8kmp_infoiiPFvPvS3_ES3_..0libiomp5.so0.130.09
hypre_ParTMatmul.extracted+exec0.120.08
Loop 5207 - par_csr_matop.c:3467-3528 - exec+0.060.04
Loop 5208 - par_csr_matop.c:3467-3522 - exec+0.060.04
Loop 5212 - par_csr_matop.c:3504-3505 - exec0.060.04
Loop 5236 - par_csr_matop.c:3491-3495 - exec0.010.00
Loop 5173 - par_csr_matop.c:3467-3634 - exec+0.060.04
Loop 5174 - par_csr_matop.c:3467-3634 - exec+0.050.03
Loop 5178 - par_csr_matop.c:3505-3608 - exec0.050.03
Loop 5202 - par_csr_matop.c:3590-3596 - exec0.010.00
hypre_BoomerAMGCoarsenPMIS.extracted+exec0.110.08
Loop 411 - par_coarsen.c:2528-2536 - exec0.070.05
Loop 407 - par_coarsen.c:2562-2567 - exec0.040.03
hypre_CSRMatrixMatvecOutOfPlace.extracted.19+exec0.090.06
Loop 6506 - csr_matvec.c:178-196 - exec+0.030.02
Loop 6509 - csr_matvec.c:194-195 - exec0.030.02
kmp_flag_native::notdone_check()libiomp5.so0.090.06
hypre_BoomerAMGCoarsenPMIS.extracted.25+exec0.060.05
Loop 455 - par_coarsen.c:2327-2334 - exec0.060.05
_INTERNAL1311483b::__kmp_hyper_barrier_gather(barrier_type, kmp_info*, int, int, void (*)(void*, void*), void*)libiomp5.so0.050.03
__memset_avx512_unaligned_ermslibc.so.60.040.03
hypre_BoomerAMGCreate2ndS.extracted+exec0.030.02
Loop 3422 - par_strength.c:1268-1278 - exec0.010.01
Loop 3423 - par_strength.c:1261-1263 - exec0.010.01
__kmp_acquire_queuing_locklibiomp5.so0.010.01
hypre_BoomerAMGCoarsenPMIS.extracted.30+exec0.010.01
Loop 456 - par_coarsen.c:2139-2142 - exec0.010.01
__GI___sched_yieldlibc.so.60.010.00
×