| | | | | | | requested parallelism | walltime sum (s) | nb instances | any sync average per thread time (s) | any wait average per thread time (s) | parallelism overhead (%) | local speedup if perfectly balanced | global speedup if perfectly balanced |
start addr | function name | source location | level | ancestor thread num | invoker | parallel or teams | 64x8 | 64x8 | 64x8 | 64x8 | 64x8 | 64x8 | 64x8 | 64x8 |
libraveloPlugin.so:0x103804 | void _INTERNAL8a16bd7d::exanb::compute_pair_singlemat<_INTER... | compute_pair_singlemat.h:103 | 0 | 0 | runtime | parallel | 8 | 190.912 | 501 | 0.323 | 0.323 | 1.14 | 1.012 | 1.004 |
libraveloPlugin.so:0x100386 | void _INTERNAL8a16bd7d::exanb::compute_pair_singlemat<_INTER... | compute_pair_singlemat.h:103 | 0 | 0 | runtime | parallel | 8 | 166.254 | 501 | 0.229 | 0.229 | 0.82 | 1.008 | 1.002 |
libexanbParticleNeighborsPlugin.so:0x1ee832 | void exanb::chunk_neighbors_execute<exanb::OperatorNode::Ope... | chunk_neighbors_execute.h:92 | 0 | 0 | runtime | parallel | 8 | 21.973 | 35.0 | 30.5 E-3 | 30.4 E-3 | 0.17 | 1.002 | 1.000 |
libexaStampAnalyticsPlugin.so:0x279fd0 | L__ZN8exaStamp25GridCellParticleSplattingIN5exanb4GridIN5oni... | grid_cell_particle_splatting.cpp:392 | 0 | 0 | runtime | parallel | 8 | 11.716 | 50.0 | 15.5 E-3 | 15.5 E-3 | 0.14 | 1.001 | 1.000 |
libexaStampAnalyticsPlugin.so:0x29f829 | void exaStamp::GridConnectedComponents::execute_with_filter_... | grid_connected_components.cpp:239 | 0 | 0 | runtime | parallel | 8 | 8.354 | 50.0 | 6.861 | 6.861 | 82.5 | 5.713 | 1.012 |
libexaStampComputePlugin.so:0x2383a9 | void _INTERNAL52c8d60b::exanb::compute_cell_particles<_INTER... | compute_cell_particles.h:80 | 0 | 0 | runtime | parallel | 8 | 3.693 | 501 | 7.63 E-3 | 7.35 E-3 | 1.56 | 1.016 | 1.000 |
libexanbMPIPlugin.so:0x3229b7 | void exanb::MigrateCellParticlesImpl<exanb::Grid<onika::soat... | migrate_cell_particles.h:339 | 0 | 0 | runtime | parallel | 8 | 1.071 | 35.0 | 0.936 | 0.936 | 87.4 | 7.957 | 1.002 |
libexanbDefBoxPlugin.so:0x10a5ae | void _INTERNALfd8b84a7::exanb::compute_cell_particles<_INTER... | compute_cell_particles.h:80 | 0 | 0 | runtime | parallel | 8 | 1.034 | 1.00 E3 | 4.39 E-3 | 4.03 E-3 | 1.49 | 1.015 | 1.000 |
libexanbDefBoxPlugin.so:0x14988c | void _INTERNAL199001ba::exanb::compute_cell_particles<_INTER... | compute_cell_particles.h:80 | 0 | 0 | runtime | parallel | 8 | 0.796 | 500 | 2.69 E-3 | 2.49 E-3 | 1.44 | 1.015 | 1.000 |
libexanbMPIPlugin.so:0x323c14 | void exanb::MigrateCellParticlesImpl<exanb::Grid<onika::soat... | migrate_cell_particles.h:865 | 0 | 0 | runtime | parallel | 8 | 0.681 | 35.0 | 0.595 | 0.595 | 87.5 | 7.993 | 1.001 |
libexanbAMRPlugin.so:0xc2c13 | void exanb::project_particles_in_sub_grids<exanb::OperatorNo... | amr_grid_algorithm.h:113 | 0 | 0 | runtime | parallel | 8 | 0.505 | 35.0 | 995 E-6 | 974 E-6 | 0.97 | 1.010 | 1.000 |
libexanbMPIPlugin.so:0x1a863b | unsigned long long _INTERNAL92320475::exanb::reduce_cell_par... | reduce_cell_particles.h:116 | 0 | 0 | runtime | parallel | 8 | 0.419 | 500 | 1.92 E-3 | 1.75 E-3 | 1.28 | 1.013 | 1.000 |
libexaStampComputePlugin.so:0x1b46ee | void _INTERNALcdc1e29b::exanb::compute_cell_particles<_INTER... | compute_cell_particles.h:80 | 0 | 0 | runtime | parallel | 8 | 0.356 | 501 | 2.31 E-3 | 2.09 E-3 | 1.66 | 1.017 | 1.000 |
libexanbIOPlugin.so:0x223026 | L__ZN5exanb17GridMemoryCompactINS_4GridIN5onika5soatl8FieldI... | grid_memory_compact.cpp:45 | 0 | 0 | runtime | parallel | 8 | 0.247 | 36.0 | 13.4 E-3 | 13.4 E-3 | 6.30 | 1.067 | 1.000 |
libexaStampAnalyticsPlugin.so:0x2fe329 | exaStamp::GridSliceAnalysis<exanb::Grid<onika::soatl::FieldI... | grid_slice_analysis.cpp:477 | 0 | 0 | runtime | parallel | 8 | 0.237 | 50.0 | 0.114 | 0.114 | 29.0 | 1.408 | 1.000 |
libexanbGridCellParticlesPlugin.so:0x1876ee | void exanb::move_particles_across_cells<exanb::OperatorNode:... | move_particles_across_cells.h:130 | 0 | 0 | runtime | parallel | 8 | 0.140 | 35.0 | 873 E-6 | 850 E-6 | 1.39 | 1.014 | 1.000 |
libexanbMPIPlugin.so:0x3239a0 | void exanb::MigrateCellParticlesImpl<exanb::Grid<onika::soat... | migrate_cell_particles.h:825 | 0 | 0 | runtime | parallel | 8 | 0.137 | 35.0 | 0.119 | 0.119 | 80.0 | 4.998 | 1.000 |
libexaStampComputePlugin.so:0x391bb3 | exaStamp::ThermodynamicStateNode<exanb::Grid<onika::soatl::F... | simulation_thermodynamic_state.cpp:88 | 0 | 0 | runtime | parallel | 8 | 0.119 | 52.0 | 3.20 E-3 | 3.16 E-3 | 6.41 | 1.069 | 1.000 |
libexanbGridCellParticlesPlugin.so:0x1872f9 | void exanb::move_particles_across_cells<exanb::OperatorNode:... | move_particles_across_cells.h:70 | 0 | 0 | runtime | parallel | 8 | 98.1 E-3 | 35.0 | 316 E-6 | 302 E-6 | 0.58 | 1.006 | 1.000 |
libexanbIOPlugin.so:0x1515a6 | exanb::PositionBackupNode<exanb::Grid<onika::soatl::FieldIds... | backup_r.cpp:37 | 0 | 0 | runtime | parallel | 8 | 88.8 E-3 | 35.0 | 4.64 E-3 | 4.63 E-3 | 7.60 | 1.082 | 1.000 |
libexanbMPIPlugin.so:0x2e3c24 | exanb::UpdateGhostsCommSchemeNode<exanb::Grid<onika::soatl::... | update_ghosts_comm_scheme.cpp:126 | 0 | 0 | runtime | parallel | 8 | 37.2 E-3 | 35.0 | 36.4 E-3 | 36.3 E-3 | 94.4 | 17.837 | 1.000 |
libexanbAMR.so:0x3f24 | exanb::max_distance_sub_cell_pairs(exanb::OperatorNode::Oper... | amr_grid_algorithm.cpp:95 | 0 | 0 | runtime | parallel | 8 | 2.28 E-3 | 35.0 | 246 E-6 | 228 E-6 | 15.8 | 1.187 | 1.000 |
libexanbAMRPlugin.so:0xc1674 | void exanb::rebuild_sub_grids<exanb::OperatorNode::OperatorD... | amr_grid_algorithm.h:382 | 0 | 0 | runtime | parallel | 8 | 764 E-6 | 35.0 | 191 E-6 | 171 E-6 | 29.5 | 1.418 | 1.000 |
libexanbCore.so:0xc991e | __sti__$E | thread.cpp:32 | 0 | 0 | runtime | parallel | 8 | 599 E-6 | 1.00 | 15.1 E-6 | 14.8 E-6 | 2.68 | 1.028 | 1.000 |
libexanbGridCellParticlesPlugin.so:0xf02ad | exanb::ExtendDomainOperator<exanb::Grid<onika::soatl::FieldI... | extend_domain.cpp:56 | 0 | 0 | runtime | parallel | 8 | 416 E-6 | 35.0 | 126 E-6 | 110 E-6 | 31.4 | 1.457 | 1.000 |
libexanbMPIPlugin.so:0x31fd3f | void exanb::MigrateCellParticlesImpl<exanb::Grid<onika::soat... | migrate_cell_particles.h:187 | 0 | 0 | runtime | parallel | 8 | 392 E-6 | 35.0 | 141 E-6 | 137 E-6 | 34.7 | 1.532 | 1.000 |
exaStamp:0x45ac55 | L_main_190__par_region0_2_439 | main.cpp:190 | 0 | 0 | runtime | parallel | 8 | 285 E-6 | 1.00 | 62.2 E-6 | 61.7 E-6 | 36.5 | 1.575 | 1.000 |
libexanbMPIPlugin.so:0x29c255 | exanb::SimpleCostModel<exanb::Grid<onika::soatl::FieldIds<ex... | simple_cost_model.h:104 | 0 | 0 | runtime | parallel | 8 | 222 E-6 | 8.00 | 31.0 E-6 | 27.3 E-6 | 14.0 | 1.162 | 1.000 |
libexanbCore.so:0xb7664 | exanb::rand::generate_seed() | parallel_random.cpp:24 | 0 | 0 | runtime | parallel | 8 | 94.1 E-6 | 1.00 | 27.8 E-6 | 27.7 E-6 | 29.5 | 1.419 | 1.000 |
libexanbMPIPlugin.so:0x28d23d | exanb::PerformanceAdviser<exanb::Grid<onika::soatl::FieldIds... | performance_adviser.cpp:39 | 0 | 0 | runtime | parallel | 8 | 16.6 E-6 | 1.00 | 6.44 E-6 | 6.02 E-6 | 38.8 | 1.633 | 1.000 |