options

Profiling node gpu04sas.benchmarkcenter.megware.com - process 17333 - thread 17574

NameModuleCoverage (%)Time (s)
hypre_ParCSRRelaxThreads.extracted.57+exec46.8832.59
Loop 4557 - ams.c:3662-3682 - exec+22.2215.45
Loop 4561 - ams.c:3672-3675 - exec13.079.08
Loop 4559 - ams.c:3672-3675 - exec9.106.33
Loop 4560 - ams.c:3677-3680 - exec0.040.03
Loop 4558 - ams.c:3677-3680 - exec0.010.00
hypre_CSRMatrixMatvecOutOfPlace.extracted+exec23.8816.60
Loop 6478 - csr_matvec.c:248-263 - exec+6.384.43
Loop 6480 - csr_matvec.c:259-261 - exec2.611.81
Loop 6481 - csr_matvec.c:259-261 - exec0.890.62
Loop 6482 - csr_matvec.c:259-261 - exec0.780.54
Loop 6483 - csr_matvec.c:259-261 - exec0.760.53
Loop 6484 - csr_matvec.c:259-261 - exec0.480.33
Loop 6485 - csr_matvec.c:259-261 - exec0.370.26
Loop 6479 - csr_matvec.c:259-261 - exec0.240.17
Loop 6486 - csr_matvec.c:259-261 - exec0.240.16
Loop 6434 - csr_matvec.c:248-314 - exec+5.994.16
Loop 6436 - csr_matvec.c:310-312 - exec2.031.41
Loop 6439 - csr_matvec.c:310-312 - exec0.930.65
Loop 6437 - csr_matvec.c:310-312 - exec0.870.60
Loop 6438 - csr_matvec.c:310-312 - exec0.800.55
Loop 6440 - csr_matvec.c:310-312 - exec0.490.34
Loop 6441 - csr_matvec.c:310-312 - exec0.380.26
Loop 6442 - csr_matvec.c:310-312 - exec0.280.19
Loop 6435 - csr_matvec.c:310-312 - exec0.210.14
Loop 6416 - csr_matvec.c:248-341 - exec+0.010.01
Loop 6424 - csr_matvec.c:337-339 - exec0.010.00
Loop 6421 - csr_matvec.c:337-339 - exec0.010.00
bool _INTERNAL1311483b::__kmp_wait_template, true, false, true>(kmp_info*, kmp_flag_64*, void*)libiomp5.so7.004.87
hypre_BoomerAMGCreate2ndS.extracted.17+exec1.701.18
Loop 3436 - par_strength.c:2000-2083 - exec+0.680.47
Loop 3440 - par_strength.c:2011-2048 - exec+0.400.28
Loop 3442 - par_strength.c:2024-2034 - exec0.400.28
Loop 3446 - par_strength.c:2011-2048 - exec+0.270.19
Loop 3448 - par_strength.c:2024-2034 - exec0.270.18
Loop 3447 - par_strength.c:2038-2048 - exec0.010.00
Loop 3478 - par_strength.c:1714-1797 - exec+0.660.46
Loop 3482 - par_strength.c:1731-1765 - exec+0.340.23
Loop 3484 - par_strength.c:1743-1752 - exec0.340.23
Loop 3488 - par_strength.c:1731-1765 - exec+0.320.22
Loop 3490 - par_strength.c:1743-1752 - exec0.320.22
Loop 3458 - par_strength.c:1951-1953 - exec0.030.02
Loop 3456 - par_strength.c:1679-1984 - exec0.010.00
hypre_BoomerAMGBuildMultipass.extracted.34+exec1.661.15
Loop 1492 - par_multi_interp.c:917-997 - exec+0.270.19
Loop 1496 - par_multi_interp.c:917-970 - exec+0.270.19
Loop 1499 - par_multi_interp.c:951-958 - exec0.270.19
Loop 1480 - par_multi_interp.c:917-1125 - exec+0.190.13
Loop 1484 - par_multi_interp.c:917-1099 - exec+0.190.13
Loop 1487 - par_multi_interp.c:1082-1088 - exec0.190.13
Loop 1488 - par_multi_interp.c:1082-1088 - exec0.010.00
Loop 1490 - par_multi_interp.c:1030-1034 - exec0.040.03
__intel_avx_rep_memcpy+exec1.551.08
Loop 6767 - - exec1.541.07
hypre_BoomerAMGBuildMultipass.extracted.28+exec1.551.08
Loop 1437 - par_multi_interp.c:1747-1876 - exec+0.760.53
Loop 1451 - par_multi_interp.c:1747-1837 - exec+0.400.27
Loop 1461 - par_multi_interp.c:1816-1822 - exec0.210.14
Loop 1455 - par_multi_interp.c:1816-1822 - exec0.190.13
Loop 1471 - par_multi_interp.c:1799-1803 - exec0.350.24
Loop 1475 - par_multi_interp.c:1782-1787 - exec0.010.01
hypre_SeqVectorAxpy.extracted+exec1.521.06
Loop 6590 - vector.c:449-452 - exec1.521.06
hypre_IJMatrixSetValuesOMPParCSR.extracted.28+exec1.260.87
Loop 5838 - IJMatrix_parcsr.c:3274-3275 - exec0.010.00
hypre_BoomerAMGCreateS.extracted+exec1.250.87
Loop 3386 - par_strength.c:253-472 - exec+0.580.40
Loop 3388 - par_strength.c:451-460 - exec0.400.27
Loop 3400 - par_strength.c:324-327 - exec0.170.11
Loop 3399 - par_strength.c:324-327 - exec0.010.01
Loop 3366 - par_strength.c:492-513 - exec+0.370.26
Loop 3376 - par_strength.c:498-503 - exec0.070.05
Loop 3380 - par_strength.c:498-503 - exec0.060.04
Loop 3374 - par_strength.c:498-503 - exec0.050.03
Loop 3372 - par_strength.c:498-503 - exec0.050.03
Loop 3368 - par_strength.c:498-503 - exec0.040.03
Loop 3370 - par_strength.c:498-503 - exec0.040.03
Loop 3378 - par_strength.c:498-503 - exec0.040.02
Loop 3382 - par_strength.c:498-503 - exec0.020.01
hypre_CSRMatrixMatvecT.extracted.49+exec1.240.86
Loop 6542 - csr_matvec.c:560-567 - exec+0.810.56
Loop 6552 - csr_matvec.c:564-567 - exec0.230.16
Loop 6546 - csr_matvec.c:564-567 - exec0.210.14
Loop 6549 - csr_matvec.c:564-567 - exec0.190.13
Loop 6543 - csr_matvec.c:564-567 - exec0.180.12
Loop 6527 - csr_matvec.c:560-579 - exec+0.030.02
Loop 6533 - csr_matvec.c:577-579 - exec0.010.01
Loop 6531 - csr_matvec.c:577-579 - exec0.010.00
Loop 6532 - csr_matvec.c:577-579 - exec0.010.00
hypre_ParMatmul.extracted.12+exec1.240.86
Loop 5094 - par_csr_matop.c:865-989 - exec+1.010.70
Loop 5095 - par_csr_matop.c:937-989 - exec+0.990.69
Loop 5097 - par_csr_matop.c:946-965 - exec0.990.69
Loop 5098 - par_csr_matop.c:888-928 - exec+0.010.01
Loop 5099 - par_csr_matop.c:917-928 - exec0.010.00
Loop 5100 - par_csr_matop.c:897-915 - exec0.010.00
hypre_ParMatmul_RowSizes.extracted+exec0.990.68
Loop 5043 - par_csr_matop.c:109-242 - exec+0.600.41
Loop 5060 - par_csr_matop.c:109-231 - exec+0.570.39
Loop 5067 - par_csr_matop.c:195-208 - exec0.310.21
Loop 5063 - par_csr_matop.c:195-208 - exec0.220.15
Loop 5064 - par_csr_matop.c:195-208 - exec0.040.02
Loop 5068 - par_csr_matop.c:195-208 - exec0.010.00
Loop 5058 - par_csr_matop.c:195-208 - exec0.020.01
Loop 5073 - par_csr_matop.c:109-177 - exec+0.010.00
Loop 5080 - par_csr_matop.c:154-167 - exec0.010.00
Loop 5040 - par_csr_matop.c:263-266 - exec0.030.02
hypre_BoomerAMGCoarsenPMIS.extracted.15+exec0.950.66
Loop 432 - par_coarsen.c:2354-2381 - exec+0.900.62
Loop 448 - par_coarsen.c:2361-2381 - exec0.140.10
Loop 440 - par_coarsen.c:2361-2381 - exec0.140.09
Loop 438 - par_coarsen.c:2361-2381 - exec0.130.09
Loop 442 - par_coarsen.c:2361-2381 - exec0.120.08
Loop 444 - par_coarsen.c:2361-2381 - exec0.100.07
Loop 436 - par_coarsen.c:2361-2381 - exec0.100.07
Loop 446 - par_coarsen.c:2361-2381 - exec0.100.07
Loop 434 - par_coarsen.c:2361-2381 - exec0.070.05
hypre_CSRMatrixMultiply.extracted+exec0.890.62
Loop 6021 - csr_matop.c:272-298 - exec+0.370.26
Loop 6022 - csr_matop.c:282-298 - exec+0.370.26
Loop 6023 - csr_matop.c:286-298 - exec0.370.26
Loop 6029 - csr_matop.c:214-231 - exec+0.180.12
Loop 6030 - csr_matop.c:222-231 - exec+0.180.12
Loop 6031 - csr_matop.c:225-231 - exec0.180.12
hypre_SeqVectorInnerProd.extracted+exec0.860.60
Loop 6592 - vector.c:483-486 - exec0.860.60
BuildIJLaplacian27pt.extracted+exec0.600.42
Loop 6 - amg.c:1402-2344 - exec+0.320.23
Loop 7 - amg.c:1404-2344 - exec+0.320.23
Loop 8 - amg.c:1406-2344 - exec0.320.23
Loop 11 - amg.c:794-1367 - exec+0.280.19
Loop 12 - amg.c:796-1367 - exec+0.280.19
Loop 13 - amg.c:798-1367 - exec0.280.19
hypre_IJMatrixAssembleParCSR.extracted.25+exec0.570.39
Loop 5757 - IJMatrix_parcsr.c:2798-2812 - exec+0.570.39
Loop 5765 - IJMatrix_parcsr.c:2803-2812 - exec0.140.10
Loop 5761 - IJMatrix_parcsr.c:2803-2812 - exec0.120.08
Loop 5763 - IJMatrix_parcsr.c:2803-2812 - exec0.090.06
Loop 5759 - IJMatrix_parcsr.c:2803-2812 - exec0.090.06
Loop 5760 - IJMatrix_parcsr.c:2803-2812 - exec0.050.03
Loop 5764 - IJMatrix_parcsr.c:2803-2812 - exec0.030.02
Loop 5762 - IJMatrix_parcsr.c:2803-2812 - exec0.020.01
Loop 5758 - IJMatrix_parcsr.c:2803-2812 - exec0.020.01
hypre_BoomerAMGCoarsenPMIS.extracted.10+exec0.510.35
Loop 412 - par_coarsen.c:2435-2477 - exec+0.430.30
Loop 428 - par_coarsen.c:2465-2470 - exec0.120.08
Loop 424 - par_coarsen.c:2465-2470 - exec0.080.05
Loop 426 - par_coarsen.c:2465-2470 - exec0.080.05
Loop 420 - par_coarsen.c:2465-2470 - exec0.040.03
Loop 418 - par_coarsen.c:2465-2470 - exec0.030.02
Loop 416 - par_coarsen.c:2465-2470 - exec0.030.02
Loop 414 - par_coarsen.c:2465-2470 - exec0.030.02
Loop 422 - par_coarsen.c:2465-2470 - exec0.020.01
Loop 419 - par_coarsen.c:2473-2477 - exec0.010.00
hypre_BoomerAMGBuildMultipass.extracted.27+exec0.470.33
Loop 1428 - par_multi_interp.c:1585-1660 - exec+0.320.22
Loop 1434 - par_multi_interp.c:1618-1628 - exec0.320.22
Loop 1435 - par_multi_interp.c:1612-1615 - exec0.010.00
hypre_CSRMatrixMatvecOutOfPlace.extracted.9+exec0.360.25
Loop 6487 - csr_matvec.c:234-237 - exec0.360.25
hypre_SeqVectorSetConstantValues.extracted+exec0.340.23
Loop 6585 - vector.c:268-271 - exec0.340.23
hypre_CSRMatrixMatvecOutOfPlace.extracted.24+exec0.330.23
Loop 6512 - csr_matvec.c:158-161 - exec0.330.23
hypre_ParCSRComputeL1NormsThreads.extracted+exec0.320.22
Loop 4488 - ams.c:3382-3401 - exec+0.140.10
Loop 4495 - ams.c:3388-3389 - exec0.100.07
Loop 4491 - ams.c:3388-3389 - exec0.040.03
Loop 4384 - ams.c:3363-3540 - exec+0.070.05
Loop 4387 - ams.c:3532-3534 - exec0.070.05
__intel_avx_rep_memsetexec0.320.22
hypre_SeqVectorScale.extracted+exec0.290.20
Loop 6589 - vector.c:413-416 - exec0.290.20
hypre_BoomerAMGCoarsenPMIS.extracted.35+exec0.270.19
Loop 457 - par_coarsen.c:2132-2136 - exec0.270.19
hypre_BoomerAMGBuildExtPIInterp.extracted+exec0.220.16
Loop 1786 - par_lr_interp.c:1221-1748 - exec+0.110.07
Loop 1803 - par_lr_interp.c:1494-1545 - exec+0.050.03
Loop 1806 - par_lr_interp.c:1516-1526 - exec0.050.03
Loop 1794 - par_lr_interp.c:1221-1675 - exec+0.050.03
Loop 1800 - par_lr_interp.c:1221-1627 - exec0.030.02
Loop 1797 - par_lr_interp.c:1644-1650 - exec0.020.01
Loop 1789 - par_lr_interp.c:1221-1736 - exec+0.010.00
Loop 1792 - par_lr_interp.c:1688-1723 - exec0.010.00
Loop 1824 - par_lr_interp.c:1244-1350 - exec+0.030.02
Loop 1833 - par_lr_interp.c:1264-1303 - exec+0.020.01
Loop 1836 - par_lr_interp.c:1277-1285 - exec0.020.01
Loop 1827 - par_lr_interp.c:1264-1303 - exec+0.010.00
Loop 1830 - par_lr_interp.c:1277-1285 - exec0.010.00
kmp_flag_native::notdone_check()libiomp5.so0.180.12
hypre_CSRMatrixTranspose.extracted+exec0.160.11
Loop 6043 - csr_matop.c:540-548 - exec+0.120.08
Loop 6047 - csr_matop.c:540-548 - exec0.040.02
Loop 6045 - csr_matop.c:540-548 - exec0.020.01
Loop 6049 - csr_matop.c:540-548 - exec0.020.01
Loop 6044 - csr_matop.c:541-548 - exec0.010.01
Loop 6051 - csr_matop.c:540-548 - exec0.010.01
Loop 6048 - csr_matop.c:540-548 - exec0.010.00
Loop 6046 - csr_matop.c:540-548 - exec0.010.00
Loop 6060 - csr_matop.c:483-485 - exec0.010.01
Loop 6059 - csr_matop.c:380-500 - exec0.010.00
hypre_ParTMatmul.extracted+exec0.130.09
Loop 5207 - par_csr_matop.c:3467-3528 - exec+0.070.05
Loop 5208 - par_csr_matop.c:3467-3522 - exec+0.070.05
Loop 5212 - par_csr_matop.c:3504-3505 - exec0.070.05
Loop 5173 - par_csr_matop.c:3467-3634 - exec+0.060.04
Loop 5174 - par_csr_matop.c:3467-3634 - exec+0.040.03
Loop 5178 - par_csr_matop.c:3505-3608 - exec0.040.02
Loop 5176 - par_csr_matop.c:3610-3621 - exec0.010.00
Loop 5202 - par_csr_matop.c:3590-3596 - exec0.010.01
hypre_BoomerAMGCoarsenPMIS.extracted+exec0.100.07
Loop 411 - par_coarsen.c:2528-2536 - exec0.060.04
Loop 407 - par_coarsen.c:2562-2567 - exec0.040.02
__GI___sched_yieldlibc.so.60.090.06
hypre_CSRMatrixMatvecOutOfPlace.extracted.19+exec0.060.04
Loop 6506 - csr_matvec.c:178-196 - exec+0.010.01
Loop 6507 - csr_matvec.c:194-195 - exec0.010.01
hypre_BoomerAMGCoarsenPMIS.extracted.25+exec0.060.04
Loop 455 - par_coarsen.c:2327-2334 - exec0.060.04
__memset_avx512_unaligned_ermslibc.so.60.050.03
hypre_BoomerAMGCreate2ndS.extracted+exec0.040.02
Loop 3422 - par_strength.c:1268-1278 - exec0.020.01
Loop 3423 - par_strength.c:1261-1263 - exec0.010.01
__kmp_yieldlibiomp5.so0.010.01
hypre_BoomerAMGCoarsenPMIS.extracted.30+exec0.010.01
Loop 456 - par_coarsen.c:2139-2142 - exec0.010.01
×