options

Profiling node o401 - process 179497 - thread 179497

NameModuleCoverage (%)Time (s)
__svml_u64div8_z0exec20.215.67
__svml_i64rem8_z0exec19.114.82
advec_mom_kernel(int, int, int, int, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clo...+exec3.812.95
Loop 125 - advec_mom.cpp:181-211 - exec3.812.95
advec_mom_kernel(int, int, int, int, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clo...+exec3.562.76
Loop 133 - advec_mom.cpp:109-139 - exec3.562.76
calc_dt_kernel(int, int, int, int, double, double, double, double, double, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer1D&, clover::Buffer1D&, clover::Buffer1D&, clover::Buffer1D&, clover::Buffer2D+exec3.522.73
Loop 160 - calc_dt.cpp:50-76 - exec3.522.73
viscosity_kernel(int, int, int, int, clover::Buffer1D&, clover::Buffer1D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&) [clone .extracted]+exec3.452.67
Loop 662 - viscosity.cpp:37-66 - exec3.452.67
accelerate_kernel(int, int, int, int, double, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D+exec3.232.5
Loop 105 - accelerate.cpp:41-54 - exec3.232.5
ideal_gas_kernel(int, int, int, int, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&) [clone .extracted]+exec3.172.46
Loop 194 - ideal_gas.cpp:38-46 - exec3.172.46
PdV_kernel(bool, int, int, int, int, double, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D+exec3.122.42
Loop 243 - PdV.cpp:70-84 - exec3.122.42
kmp_flag_64::wait(kmp_info*, int, void*)libiomp5.so3.092.39
advec_cell_kernel(int, int, int, int, int, int, clover::Buffer1D&, clover::Buffer1D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D+exec2.892.24
Loop 109 - advec_cell.cpp:158-202 - exec2.892.24
PdV_kernel(bool, int, int, int, int, double, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D+exec2.622.03
Loop 245 - PdV.cpp:49-64 - exec2.622.03
advec_cell_kernel(int, int, int, int, int, int, clover::Buffer1D&, clover::Buffer1D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D+exec2.62.02
Loop 117 - advec_cell.cpp:66-110 - exec2.62.02
advec_mom_kernel(int, int, int, int, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clo...+exec2.551.97
Loop 131 - advec_mom.cpp:147-150 - exec2.551.97
advec_mom_kernel(int, int, int, int, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clo...+exec2.551.97
Loop 123 - advec_mom.cpp:219-222 - exec2.551.97
advec_cell_kernel(int, int, int, int, int, int, clover::Buffer1D&, clover::Buffer1D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D+exec1.731.34
Loop 107 - advec_cell.cpp:209-217 - exec1.731.34
advec_cell_kernel(int, int, int, int, int, int, clover::Buffer1D&, clover::Buffer1D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D+exec1.661.29
Loop 115 - advec_cell.cpp:118-126 - exec1.661.29
advec_mom_kernel(int, int, int, int, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clo...+exec1.611.25
Loop 127 - advec_mom.cpp:168-173 - exec1.611.25
flux_calc_kernel(int, int, int, int, double, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D+exec1.531.19
Loop 178 - flux_calc.cpp:37-41 - exec1.531.19
advec_mom_kernel(int, int, int, int, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clo...+exec1.270.98
Loop 135 - advec_mom.cpp:96-101 - exec1.270.98
advec_mom_kernel(int, int, int, int, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clo...+exec1.090.84
Loop 143 - advec_mom.cpp:54-58 - exec1.090.84
advec_mom_kernel(int, int, int, int, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clo...+exec1.070.83
Loop 139 - advec_mom.cpp:72-76 - exec1.070.83
advec_mom_kernel(int, int, int, int, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clo...+exec1.060.82
Loop 137 - advec_mom.cpp:86-89 - exec1.060.82
advec_mom_kernel(int, int, int, int, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clo...+exec1.040.8
Loop 145 - advec_mom.cpp:45-49 - exec1.040.8
advec_mom_kernel(int, int, int, int, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clo...+exec0.990.77
Loop 129 - advec_mom.cpp:158-161 - exec0.990.77
advec_mom_kernel(int, int, int, int, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clo...+exec0.90.69
Loop 141 - advec_mom.cpp:63-67 - exec0.90.69
reset_field_kernel(int, int, int, int, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&) [...+exec0.880.69
Loop 250 - reset_field.cpp:35-39 - exec0.880.69
revert_kernel(int, int, int, int, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&) [clone .extracted]+exec0.760.59
Loop 253 - revert.cpp:35-39 - exec0.760.59
advec_cell_kernel(int, int, int, int, int, int, clover::Buffer1D&, clover::Buffer1D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D+exec0.660.51
Loop 113 - advec_cell.cpp:137-141 - exec0.660.51
reset_field_kernel(int, int, int, int, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&) [...+exec0.620.48
Loop 248 - reset_field.cpp:45-49 - exec0.620.48
advec_cell_kernel(int, int, int, int, int, int, clover::Buffer1D&, clover::Buffer1D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D+exec0.610.47
Loop 121 - advec_cell.cpp:45-49 - exec0.610.47
advec_cell_kernel(int, int, int, int, int, int, clover::Buffer1D&, clover::Buffer1D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D+exec0.480.38
Loop 119 - advec_cell.cpp:55-59 - exec0.480.38
advec_cell_kernel(int, int, int, int, int, int, clover::Buffer1D&, clover::Buffer1D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D&, clover::Buffer2D+exec0.430.33
Loop 111 - advec_cell.cpp:147-151 - exec0.430.33
MPL_gpu_cuda_finalizelibmpi.so.12.0.00.250.19
field_summary(global_variables&, parallel_&) [clone .extracted]+exec0.250.19
Loop 173 - field_summary.cpp:76-92 - exec+0.080.06
Loop 174 - field_summary.cpp:80-82 - exec+0.080.06
Loop 175 - field_summary.cpp:81-82 - exec0.080.06
__GI___pthread_mutex_locklibpthread-2.28.so0.210.16
MPIR_Progress_hook_exec_on_vcilibmpi.so.12.0.00.180.14
__pthread_mutex_unlock_usercntlibpthread-2.28.so0.140.11
__svml_i64div8_z0exec0.120.09
MPIDI_Progress_testlibmpi.so.12.0.00.10.07
MPIDI_OFI_progresslibmpi.so.12.0.00.080.06
I_MPI_memcpy_stream_nontemporal_avx512libmpi.so.12.0.00.070.05
kmp_flag_native::notdone_check()libiomp5.so0.070.05
MPID_CH4_SHM_bcast_intra_heap_init_cntlibmpi.so.12.0.00.050.04
I_MPI_memcpy_multipage_avx512libmpi.so.12.0.00.050.03
clover_unpack_message_left(global_variables&, int, int, int, int, clover::Buffer2D&, clover::Buffer1D&, int, int, int, int, int, int, int) [clone .extracted]+exec0.040.03
Loop 218 - pack_kernel.cpp:89-94 - exec+0.040.03
Loop 219 - pack_kernel.cpp:90-92 - exec0.040.03
__kmp_hyper_barrier_release(barrier_type, kmp_info*, int, int, int, void*)libiomp5.so0.030.02
ofi_cq_progresslibmlx-fi.so0.030.02
uct_rc_mlx5_iface_progress_cycliclibuct_ib.so.0.0.00.030.02
unknown_kernel_regionkernel0.030.02
inflate_fastlibmpi.so.12.0.00.030.02
ucp_worker_progresslibucp.so.0.0.00.030.02
build_field(global_variables&) [clone .extracted.37]+exec0.030.02
Loop 158 - build_field.cpp:101-114 - exec0.030.02
__svml_idiv8_l9exec0.020.01
clover_pack_message_left(global_variables&, int, int, int, int, clover::Buffer2D&, clover::Buffer1D&, int, int, int, int, int, int, int) [clone .extracted]+exec0.020.01
Loop 215 - pack_kernel.cpp:56-61 - exec+0.020.01
Loop 216 - pack_kernel.cpp:57-59 - exec0.020.01
MPIDI_OFI_get_bufferedlibmpi.so.12.0.00.010.01
MPIDU_Init_shm_barrierlibmpi.so.12.0.00.010.01
impi_shm_heap_progresslibmpi.so.12.0.00.010.01
MPID_Progress_waitlibmpi.so.12.0.00.010.01
ofi_cq_readfromlibmlx-fi.so0.010.01
ofi_cq_readlibmlx-fi.so0.010.01
update_halo_kernel(int, int, int, int, std::array const&, std::array const&, field_type&, int const*, int) [clone .extracted.222]exec0.010.01
mlx_ep_progresslibmlx-fi.so0.010.01
ucp_worker_progress@pltlibmlx-fi.so0.010.01
build_field(global_variables&) [clone .extracted.27]+exec0.010.01
Loop 154 - build_field.cpp:119-129 - exec0.010.01
MPID_Progress_completion_count_getlibmpi.so.12.0.00.010
rml::internal::Backend::genericGetBlock(int, unsigned long, bool)libiomp5.so0.010
MPIDI_SHMI_progresslibmpi.so.12.0.00.010
__kmp_fork_calllibiomp5.so0.010
__kmp_acquire_ticket_lock_timed_template(kmp_ticket_lock*, int)libiomp5.so0.010
__kmpc_fork_calllibiomp5.so0.010
MPIDI_OFI_coll_selectlibmpi.so.12.0.00.010
MPI_Isendlibmpi.so.12.0.00.010
uct_ud_mlx5_iface_progresslibuct_ib.so.0.0.00.010
adler32_zlibmpi.so.12.0.00.010
ofi_mutex_unlock_nooplibmlx-fi.so0.010
ofi_mutex_lock_nooplibmlx-fi.so0.010
syscalllibc-2.28.so0.010
update_halo_kernel(int, int, int, int, std::array const&, std::array const&, field_type&, int const*, int) [clone .extracted.262]exec0.010
update_halo_kernel(int, int, int, int, std::array const&, std::array const&, field_type&, int const*, int) [clone .extracted.212]exec0.010
update_halo_kernel(int, int, int, int, std::array const&, std::array const&, field_type&, int const*, int) [clone .extracted.102]exec0.010
update_halo_kernel(int, int, int, int, std::array const&, std::array const&, field_type&, int const*, int) [clone .extracted.92]exec0.010
update_halo_kernel(int, int, int, int, std::array const&, std::array const&, field_type&, int const*, int) [clone .extracted.82]exec0.010
update_halo_kernel(int, int, int, int, std::array const&, std::array const&, field_type&, int const*, int) [clone .extracted]exec0.010
initialise_chunk(int, global_variables&) [clone .extracted.7]+exec0.010
Loop 197 - initialise_chunk.cpp:78-83 - exec0.010
generate_chunk(int, global_variables&) [clone .extracted]exec0.010
pthread_mutex_lock@pltlibmlx-fi.so0.010
build_field(global_variables&) [clone .extracted.32]+exec0.010
Loop 156 - build_field.cpp:134-139 - exec0.010
build_field(global_variables&) [clone .extracted.22]+exec0.010
Loop 152 - build_field.cpp:144-149 - exec0.010
_dl_relocate_objectld-2.28.so0.010
do_lookup_xld-2.28.so0.010
mlx5dv_dci_stream_id_resetlibmlx5.so.1.24.44.00.010
×