options

Profiling node o405 - process 152356 - thread 152356

Name | Module | Coverage (%) | Time (s)
miniqmcreference::einspline_spo_ref::evaluate(qmcplusplus::ParticleSet const&, int, qmcplusplus::Vector >&)+exec23.9327.01
Loop 843 - MultiBsplineRef.hpp:42-71 - exec+23.9226.99
Loop 844 - MultiBsplineRef.hpp:63-71 - exec+23.9226.99
Loop 845 - MultiBsplineRef.hpp:64-71 - exec+23.9226.99
Loop 846 - MultiBsplineRef.hpp:68-70 - exec23.9226.99
miniqmcreference::einspline_spo_ref::evaluate(qmcplusplus::ParticleSet const&, int, qmcplusplus::Vector >&, qmcplusplus::Vector, std::allocator >...+exec19.2421.71
Loop 849 - MultiBsplineRef.hpp:187-286 - exec+17.3819.61
Loop 852 - MultiBsplineRef.hpp:226-262 - exec+17.1319.33
Loop 853 - MultiBsplineRef.hpp:227-262 - exec+17.1319.33
Loop 858 - MultiBsplineRef.hpp:242-262 - exec+17.1319.33
Loop 860 - MultiBsplineRef.hpp:242-262 - exec11.1412.57
Loop 859 - MultiBsplineRef.hpp:242-261 - exec5.996.76
Loop 851 - MultiBsplineRef.hpp:276-286 - exec0.250.28
Loop 847 - einspline_spo_ref.hpp:219-227 - exec+0.810.91
Loop 848 - einspline_spo_ref.hpp:223-227 - exec0.810.91
mkl_blas_avx512_dgemm_kernel_nocopy_TN_b1libmkl_avx512.so.213.7815.55
mkl_blas_avx512_dgemm_kernel_0libmkl_avx512.so.211.9113.44
qmcplusplus::SoaDistanceTableABOMPTarget::evaluate(qmcplusplus::ParticleSet&)+exec7.528.48
Loop 2084 - SoaDistanceTableABOMPTarget.h:214-228 - exec+7.58.46
Loop 2085 - SoaDistanceTableABOMPTarget.h:215-228 - exec+7.58.46
Loop 2083 - SoaDistanceTableABOMPTarget.h:228-228 - exec7.58.46
Loop 2086 - SoaDistanceTableABOMPTarget.h:194-196 - exec0.010.01
qmcplusplus::SoaDistanceTableAAOMPTarget::update(int)+exec6.797.66
Loop 1858 - SoaDistanceTableAAOMPTarget.h:440-442 - exec6.797.66
__intel_avx_rep_memset+exec2.072.34
Loop 2345 - - exec1.111.25
miniqmcreference::TwoBodyJastrowRef >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector >&)+exec1.942.19
Loop 372 - TwoBodyJastrowRef.h:107-132 - exec+1.912.15
Loop 373 - BsplineFunctor.h:236-260 - exec+1.912.15
Loop 377 - BsplineFunctor.h:236-241 - exec1.792.02
Loop 375 - BsplineFunctor.h:246-260 - exec0.120.13
void qmcplusplus::DTD_BConds::computeDistances, qmcplusplus::VectorSoAContainer >, qmcplusplus::VectorSoAContainer+exec1.71.92
Loop 1352 - ParticleBConds3DSoa.h:235-256 - exec1.71.91
mkl_blas_avx512_dgemv_t_intrinsicslibmkl_avx512.so.21.431.61
miniqmcreference::TwoBodyJastrowRef >::acceptMove(qmcplusplus::ParticleSet&, int)+exec11.13
Loop 350 - TwoBodyJastrowRef.h:324-331 - exec0.310.34
Loop 345 - TwoBodyJastrowRef.h:342-347 - exec0.270.3
Loop 343 - TwoBodyJastrowRef.h:342-347 - exec0.220.24
Loop 347 - TwoBodyJastrowRef.h:342-347 - exec0.210.23
mkl_blas_avx512_dgemv_n_intrinsicslibmkl_avx512.so.20.951.07
mkl_blas_avx512_dgemm_kernel_nocopy_TN_b0libmkl_avx512.so.20.891
unknown_functionUnknown module0.770.86
miniqmcreference::DiracDeterminantRef >::evalGrad(qmcplusplus::ParticleSet&, int)+exec0.610.68
Loop 959 - inner_product.hpp:155-155 - exec0.60.68
kmp_flag_64::wait(kmp_info*, int, void*)libiomp5.so0.60.68
qmcplusplus::BsplineFunctor::evaluateVGL(int, int, int, double const*, double*, double*, double*, double*, int*) const+exec0.580.66
Loop 317 - BsplineFunctor.h:291-298 - exec0.480.55
Loop 315 - BsplineFunctor.h:303-338 - exec0.070.07
miniqmcreference::DiracDeterminantRef >::evaluateGL(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib, std::allocator > >&, qmcplusplus:...+exec0.530.59
Loop 970 - inner_product.hpp:82-155 - exec+0.530.59
Loop 972 - inner_product.hpp:155-155 - exec0.380.42
Loop 974 - inner_product.hpp:82-83 - exec0.150.17
miniqmcreference::TwoBodyJastrowRef >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector&)+exec0.450.5
Loop 338 - TwoBodyJastrowRef.h:155-156 - exec0.140.16
Loop 336 - TwoBodyJastrowRef.h:155-156 - exec0.120.13
Loop 337 - TwoBodyJastrowRef.h:155-156 - exec0.120.14
Loop 340 - stl_numeric.h:126-127 - exec0.050.06
miniqmcreference::DiracDeterminantRef >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector&)+exec0.310.35
Loop 960 - inner_product.hpp:155-155 - exec0.230.26
Loop 963 - inner_product.hpp:82-83 - exec0.070.08
qmcplusplus::SPOSet::evaluateDetRatios(qmcplusplus::VirtualParticleSet const&, qmcplusplus::Vector >&, qmcplusplus::Vector > const&, std::vector >&)+exec0.30.34
Loop 861 - inner_product.hpp:82-83 - exec+0.30.34
Loop 863 - inner_product.hpp:82-83 - exec0.30.34
__intel_avx_rep_memcpyexec0.260.29
unknown_kernel_regionkernel0.160.18
mkl_lapack_xdlaswplibmkl_core.so.20.160.18
qmcplusplus::DiracMatrix::invert_transpose(qmcplusplus::Matrix > const&, qmcplusplus::Matrix >&, double&, double&)+exec0.150.17
Loop 937 - inner_product.hpp:210-212 - exec+0.150.17
Loop 938 - inner_product.hpp:210-212 - exec+0.150.17
Loop 939 - inner_product.hpp:210-212 - exec+0.150.17
Loop 940 - inner_product.hpp:211-212 - exec0.150.17
mkl_blas_avx512_dgemm_kernel_nocopy_NN_b0libmkl_avx512.so.20.140.15
mkl_blas_avx512_dgemm_dcopy_right8_ealibmkl_avx512.so.20.110.12
miniqmcreference::TwoBodyJastrowRef >::evaluateGL(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib, std::allocator > >&, qmcplusplus::Particle...+exec0.090.1
Loop 355 - TwoBodyJastrowRef.h:268-420 - exec+0.080.08
Loop 356 - TwoBodyJastrowRef.h:268-420 - exec+0.080.08
Loop 358 - TwoBodyJastrowRef.h:393-398 - exec0.040.04
Loop 362 - TwoBodyJastrowRef.h:381-382 - exec0.020.02
Loop 364 - TwoBodyJastrowRef.h:381-382 - exec0.010.01
Loop 366 - TwoBodyJastrowRef.h:381-382 - exec0.010.01
MPIR_Progress_hook_exec_on_vcilibmpi.so.12.0.00.080.09
MPL_gpu_cuda_finalizelibmpi.so.12.0.00.080.09
qmcplusplus::NonLocalPP::evaluate(qmcplusplus::ParticleSet const&, qmcplusplus::WaveFunction&)+exec0.080.09
Loop 80 - NonLocalPP.hpp:122-135 - exec+0.010.01
Loop 81 - NonLocalPP.hpp:126-135 - exec+0.010.01
Loop 82 - NonLocalPP.hpp:131-132 - exec0.010.01
miniqmcreference::DiracDeterminantRef >::evaluateLog(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib, std::allocator > >&, qmcplusplus...+exec0.080.08
Loop 953 - inner_product.hpp:82-155 - exec+0.080.08
Loop 957 - inner_product.hpp:155-155 - exec0.060.06
Loop 955 - inner_product.hpp:82-83 - exec0.020.02
mkl_blas_avx512_dgemm_dcopy_down24_ealibmkl_avx512.so.20.070.08
unknown_function[vdso]0.070.07
pthread_spin_locklibpthread-2.28.so0.060.06
__pthread_mutex_unlock_usercntlibpthread-2.28.so0.060.06
miniqmcreference::OneBodyJastrowRef >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector&)+exec0.060.06
Loop 247 - OneBodyJastrowRef.h:192-193 - exec0.020.02
Loop 249 - OneBodyJastrowRef.h:192-193 - exec0.010.01
Loop 252 - OneBodyJastrowRef.h:186-187 - exec0.010.01
uct_ud_mlx5_iface_progresslibuct_ib.so.0.0.00.050.06
__GI___pthread_mutex_locklibpthread-2.28.so0.050.06
std::map, double, std::less >, std::allocator const, double> > >::operator[](qmcplusplus::StackKeyParam<2> const&)exec0.050.05
miniqmcreference::OneBodyJastrowRef >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector >&)+exec0.050.05
Loop 286 - OneBodyJastrowRef.h:134-155 - exec+0.040.04
Loop 288 - OneBodyJastrowRef.h:134-146 - exec+0.040.04
Loop 292 - BsplineFunctor.h:236-241 - exec0.040.04
mkl_blas_avx512_dtrsm_kernel_ll_0libmkl_avx512.so.20.040.05
qmcplusplus::TimerType::start()exec0.040.04
qmcplusplus::TimerType::stop()exec0.030.04
mkl_blas_avx512_dgemm_kernel_nocopy_NN_b1libmkl_avx512.so.20.030.03
std::map, long, std::less >, std::allocator const, long> > >::operator[](qmcplusplus::StackKeyParam<2> const&)exec0.030.03
uct_rc_mlx5_iface_progress_cycliclibuct_ib.so.0.0.00.030.03
qmcplusplus::SoaDistanceTableAAOMPTarget::move(qmcplusplus::ParticleSet const&, qmcplusplus::TinyVector const&, int, bool)exec0.020.02
qmcplusplus::Vector >::resize(unsigned long, double)+exec0.020.02
Loop 297 - stl_algobase.h:752-754 - exec0.020.02
mkl_blas_xdgemvlibmkl_core.so.20.020.02
MPIDI_OFI_get_bufferedlibmpi.so.12.0.00.020.02
__kmp_api_omp_get_levellibiomp5.so0.020.02
MPIDI_Progress_testlibmpi.so.12.0.00.020.02
qmcplusplus::SoaDistanceTableABOMPTarget::move(qmcplusplus::ParticleSet const&, qmcplusplus::TinyVector const&, int, bool)exec0.020.02
qmcplusplus::ParticleSet::makeMove(int, qmcplusplus::TinyVector const&, bool)exec0.020.02
miniqmcreference::DiracDeterminantRef >::resize(int, int)+exec0.020.02
Loop 982 - stl_algobase.h:740-742 - exec0.020.02
_dl_update_slotinfold-2.28.so0.020.02
qmcplusplus::WaveFunction::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector >&)exec0.020.02
mkl_blas_avx512_xdgemm_nocopy_driverlibmkl_avx512.so.20.010.01
inflate_fastlibmpi.so.12.0.00.010.01
qmcplusplus::SoaDistanceTableABOMPTarget::update(int)exec0.010.01
__cxxabiv1::__vmi_class_type_info::__do_dyncast(long, __cxxabiv1::__class_type_info::__sub_kind, __cxxabiv1::__class_type_info const*, void const*, __cxxabiv1::__class_type_info const*, void const*, __cxxabiv1::__class_type_info::__dyncast_result&) constlibstdc++.so.6.0.250.010.01
__cxxabiv1::__si_class_type_info::__do_dyncast(long, __cxxabiv1::__class_type_info::__sub_kind, __cxxabiv1::__class_type_info const*, void const*, __cxxabiv1::__class_type_info const*, void const*, __cxxabiv1::__class_type_info::__dyncast_result&) constlibstdc++.so.6.0.250.010.01
miniqmcreference::TwoBodyJastrowRef >::evalGrad(qmcplusplus::ParticleSet&, int)exec0.010.01
update_get_addrld-2.28.so0.010.01
qmcplusplus::WaveFunction::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector&)exec0.010.01
qmcplusplus::WaveFunction::evalGrad(qmcplusplus::ParticleSet&, int)+exec0.010.01
Loop 106 - WaveFunction.cpp:185-188 - exec0.010.01
main.extracted.110+exec0.010.01
Loop 23 - stl_vector.h:296-933 - exec+0.010.01
Loop 37 - random.tcc:401-3338 - exec+0.010.01
Loop 38 - miniqmc.cpp:429-458 - exec0.010.01
mkl_blas_avx512_xdgemvlibmkl_avx512.so.20.010.01
MPIDI_OFI_progresslibmpi.so.12.0.00.010.01
__kmp_get_global_thread_id_reglibiomp5.so0.010.01
_intel_fast_memsetexec0.010.01
__libm_exp_z0exec0.010.01
__kmp_api_omp_get_ancestor_thread_numlibiomp5.so0.010.01
kmp_flag_native::notdone_check()libiomp5.so0.010.01
ofi_cq_progresslibmlx-fi.so0.010.01
qmcplusplus::TimerManager >::pop_timer(qmcplusplus::TimerType*)exec0.010.01
qmcplusplus::TimerManager >::push_timer(qmcplusplus::TimerType*)exec0.010.01
std::chrono::_V2::system_clock::now()libstdc++.so.6.0.250.010.01
qmcplusplus::VirtualParticleSet::makeMoves(qmcplusplus::ParticleSet const&, int, std::vector, std::allocator > > const&, bool, int)exec0.010.01
qmcplusplus::ParticleSet::update(bool)+exec0.010.01
Loop 1213 - ParticleSet.cpp:242-243 - exec0.010.01
miniqmcreference::DiracDeterminantRef >::acceptMove(qmcplusplus::ParticleSet&, int)exec0.010.01
void qmcplusplus::DelayedUpdate::getInvRow > >(qmcplusplus::Matrix > const&, int, qmcplusplus::Vector >&)exec0.010.01
ucp_worker_progress@pltlibmlx-fi.so0.010.01
__tls_get_addr_slowld-2.28.so0.010.01
miniqmcreference::OneBodyJastrowRef >::evaluateGL(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib, std::allocator > >&, qmcplusplus::Particle...+exec0.010.01
Loop 273 - OneBodyJastrowRef.h:109-194 - exec+0.010.01
Loop 280 - OneBodyJastrowRef.h:192-193 - exec0.010.01
__dynamic_castlibstdc++.so.6.0.250.010.01
__tls_get_addrld-2.28.so0.010.01
unknown_functionexec0.010.01
mkl_blas_avx512_xdgerlibmkl_avx512.so.200
miniqmcreference::OneBodyJastrowRef >::computeU3(qmcplusplus::ParticleSet&, int, double const*)exec00
×