Loop id | Source Location | Source Function | Level | Coverage run_0 (%) | Max Time Over Threads run_0 (s) | Time w.r.t. Wall Time run_0 (s) | Nb Threads run_0 | GFLOPS run_0 | Vectorization Ratio (%) | Vector Length Use (%) | Speedup If No Scalar Integer | Speedup If FP Vectorized | Speedup If Fully Vectorized | Speedup If Perfect Load Balancing run_0 | Stride 0 | Stride 1 | Stride n | Stride Unknown | Stride Indirect |
---|
690 | libqmcwfs.so - MultiBsplineRef.hpp:68-71 | miniqmcreference::einspline_spo_ref<double>::evaluate(qmcplusplus::ParticleSet const&, int, qmcplusplus::Vector<double, std::allocator<double> >&) | Innermost | 22.6 | 28.18 | 26.92 | 112 | 227.64 | 100 | 50 | 1 | 1.95 | 2 | 1.09 | 1 | 7 | 4 | 0 | 0 |
692 | libqmcwfs.so - MultiBsplineRef.hpp:239-262 [...] | void miniqmcreference::MultiBsplineEvalRef::evaluate_vgh<double>(qmcplusplus::bspline_traits<double, 3u>::SplineType const*, double, double, double, double*, double*, double*, unsigned long) | Innermost | 20.09 | 32.52 | 23.93 | 112 | 368.99 | 20.93 | 15.12 | 1 | 1.94 | 6 | 1.42 | 1 | 12 | 1 | 0 | 0 |
480 | libqmcparticle_omptarget.so - ParticleBConds3DSoa.h:280-298 [...] | qmcplusplus::SoaDistanceTableABOMPTarget<double, 3u, 40>::evaluate(qmcplusplus::ParticleSet&) | Innermost | 8.16 | 10.38 | 9.72 | 112 | 313.32 | 12.24 | 14.03 | 1 | 3.33 | 6.67 | 1.11 | 0 | 7 | 0 | 0 | 0 |
226 | libqmcparticle_omptarget.so - SoaDistanceTableAAOMPTarget.h:440-442 [...] | qmcplusplus::SoaDistanceTableAAOMPTarget<double, 3u, 40>::update(int) | Single | 5.98 | 7.61 | 7.13 | 112 | 0.00 | 27.27 | 15.91 | 1.58 | 1 | 8 | 1.11 | 0 | 0 | 6 | 7 | 1 |
441 | libqmcparticle_omptarget.so - ParticleBConds3DSoa.h:237-255 | void qmcplusplus::DTD_BConds<double, 3u, 40>::computeDistances<qmcplusplus::TinyVector<double, 3u>, qmcplusplus::VectorSoAContainer<double, 3u, qmcplusplus::Mallocator<double, 64ul> >, qmcplusplus::VectorSoAContainer<double, 3... | Single | 1.67 | 2.24 | 1.98 | 112 | 1039.35 | 100 | 50 | 1 | 1.67 | 1.67 | 1.18 | 1 | 7 | 0 | 0 | 0 |
565 | libqmcwfs.so - BsplineFunctor.h:236-241 | miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector<double, std::allocator<double> >&) | Innermost | 1.63 | 2.37 | 1.95 | 112 | 0.25 | 0 | 10 | 1 | 1 | 12.12 | 1.27 | NA | NA | NA | NA | NA |
691 | libqmcwfs.so - MultiBsplineRef.hpp:276-286 | void miniqmcreference::MultiBsplineEvalRef::evaluate_vgh<double>(qmcplusplus::bspline_traits<double, 3u>::SplineType const*, double, double, double, double*, double*, double*, unsigned long) | Single | 1.05 | 1.95 | 1.26 | 112 | 103.32 | 0 | 12.5 | 1 | 1.04 | 8 | 1.63 | 0 | 9 | 0 | 0 | 0 |
696 | libqmcwfs.so - einspline_spo_ref.hpp:223-227 [...] | miniqmcreference::einspline_spo_ref<double>::evaluate(qmcplusplus::ParticleSet const&, int, qmcplusplus::Vector<double, std::allocator<double> >&, qmcplusplus::Vector<qmcplusplus::TinyVector<double, 3u>, std::allocator<... | Innermost | 0.91 | 1.29 | 1.08 | 112 | 0.00 | 11.11 | 13.89 | 1 | 1 | 6.4 | 1.24 | 0 | 5 | 5 | 0 | 0 |
494 | libqmcwfs.so - TwoBodyJastrowRef.h:342-347 | miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::acceptMove(qmcplusplus::ParticleSet&, int) | Innermost | 0.68 | 0.99 | 0.81 | 112 | 235.54 | 100 | 50 | 1 | 1.23 | 2 | 1.27 | 0 | 4 | 2 | 0 | 0 |
742 | libqmcwfs.so - OperatorTags.h:63-94 [...] | miniqmcreference::DiracDeterminantRef<qmcplusplus::DelayedUpdate<double, double> >::evaluateGL(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib<qmcplusplus::TinyVector<double, 3u>, std::allocator<qmcplusplus::TinyVector<... | Innermost | 0.42 | 0.66 | 0.5 | 112 | 126.45 | 100 | 50 | 1 | 1 | 2 | 1.38 | 0 | 2 | 0 | 0 | 0 |
495 | libqmcwfs.so - TwoBodyJastrowRef.h:324-331 [...] | miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::acceptMove(qmcplusplus::ParticleSet&, int) | Single | 0.39 | 0.59 | 0.46 | 112 | 205.03 | 0 | 12.5 | 1 | 1.31 | 8 | 1.31 | 0 | 8 | 0 | 0 | 0 |
554 | libqmcwfs.so - TwoBodyJastrow.h:155-156 | miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector<double, 3u>&) | Innermost | 0.36 | 0.51 | 0.43 | 112 | 292.07 | 100 | 50 | 1 | 1.38 | 2 | 1.24 | 0 | 2 | 0 | 0 | 0 |
746 | libqmcwfs.so - OperatorTags.h:63-94 [...] | miniqmcreference::DiracDeterminantRef<qmcplusplus::DelayedUpdate<double, double> >::evalGrad(qmcplusplus::ParticleSet&, int) | Single | 0.34 | 0.51 | 0.41 | 112 | 153.51 | 100 | 50 | 1 | 1 | 2 | 1.31 | 0 | 2 | 0 | 0 | 0 |
557 | libqmcwfs.so - BsplineFunctor.h:291-298 | miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector<double, 3u>&) | Innermost | 0.31 | 0.48 | 0.37 | 112 | 0.06 | 0 | 9.38 | 1.19 | 1 | 12.63 | 1.37 | NA | NA | NA | NA | NA |
41 | libqmcwfs.so - inner_product.hpp:82-83 | qmcplusplus::SPOSet::evaluateDetRatios(qmcplusplus::VirtualParticleSet const&, qmcplusplus::Vector<double, std::allocator<double> >&, qmcplusplus::Vector<double, std::allocator<double> > const&, std::vector<double, st... | Innermost | 0.26 | 0.45 | 0.31 | 112 | 269.87 | 100 | 50 | 1 | 1.38 | 2 | 1.55 | 0 | 2 | 0 | 0 | 0 |
743 | libqmcwfs.so - inner_product.hpp:82-83 | miniqmcreference::DiracDeterminantRef<qmcplusplus::DelayedUpdate<double, double> >::evaluateGL(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib<qmcplusplus::TinyVector<double, 3u>, std::allocator<qmcplusplus::TinyVector<... | Innermost | 0.25 | 0.44 | 0.3 | 112 | 69.92 | 100 | 50 | 1 | 1.38 | 2 | 1.57 | 0 | 2 | 0 | 0 | 0 |
258 | libqmcparticle_omptarget.so - ParticleBConds3DSoa.h:237-255 | qmcplusplus::SoaDistanceTableAAOMPTarget<double, 3u, 40>::evaluate(qmcplusplus::ParticleSet&) | Innermost | 0.24 | 0.45 | 0.28 | 112 | 333.88 | 100 | 50 | 1 | 1.67 | 1.67 | 1.67 | 1 | 7 | 0 | 0 | 0 |
711 | libqmcwfs.so - inner_product.hpp:211-212 | qmcplusplus::DiracMatrix<double, double>::invert_transpose(qmcplusplus::Matrix<double, std::allocator<double> > const&, qmcplusplus::Matrix<double, std::allocator<double> >&, double&, double&) | Innermost | 0.22 | 0.42 | 0.26 | 112 | 0.00 | 33.33 | 16.67 | 1 | 1 | 6.51 | 1.68 | 0 | 1 | 0 | 2 | 0 |
489 | libqmcwfs.so - BsplineFunctor.h:291-298 | miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::computeU3(qmcplusplus::ParticleSet const&, int, double const*, double*, double*, double*, bool) | Innermost | 0.22 | 0.35 | 0.26 | 112 | 0.09 | 0 | 9.38 | 1.19 | 1 | 12.63 | 1.4 | NA | NA | NA | NA | NA |
672 | libqmcwfs.so - inner_product.hpp:155-155 [...] | qmcplusplus::TinyVector<double, 3u> qmcplusplus::simd::dot<double, 3u>(double const*, qmcplusplus::TinyVector<double, 3u> const*, int) | Single | 0.11 | 0.19 | 0.13 | 112 | 483.50 | 100 | 50 | 1 | 1 | 2 | 1.58 | 0 | 2 | 0 | 0 | 0 |
749 | libqmcwfs.so - OperatorTags.h:63-94 [...] | miniqmcreference::DiracDeterminantRef<qmcplusplus::DelayedUpdate<double, double> >::evaluateLog(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib<qmcplusplus::TinyVector<double, 3u>, std::allocator<qmcplusplus::TinyVector&l... | Innermost | 0.09 | 0.14 | 0.11 | 112 | 115.62 | 100 | 50 | 1 | 1 | 2 | 1.4 | 0 | 2 | 0 | 0 | 0 |
745 | libqmcwfs.so - inner_product.hpp:82-83 | miniqmcreference::DiracDeterminantRef<qmcplusplus::DelayedUpdate<double, double> >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector<double, 3u>&) | Single | 0.08 | 0.14 | 0.1 | 112 | 213.17 | 100 | 50 | 1 | 1.38 | 2 | 1.56 | 0 | 2 | 0 | 0 | 0 |
555 | libqmcwfs.so - stl_numeric.h:140-141 | miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector<double, 3u>&) | Single | 0.07 | 0.14 | 0.09 | 112 | 230.91 | 100 | 50 | 1 | 1.47 | 2 | 1.75 | 0 | 1 | 0 | 0 | 0 |
43 | exec - | main._omp_fn.1 | InBetween | 0.07 | 0.17 | 0.09 | 112 | 0.42 | 23.08 | 15.22 | 1.73 | 1.81 | 9.67 | 2.13 | NA | NA | NA | NA | NA |
566 | libqmcwfs.so - BsplineFunctor.h:246-260 | miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector<double, std::allocator<double> >&) | Innermost | 0.07 | 0.14 | 0.08 | 112 | 764.95 | 100 | 48.46 | 1.09 | 1.43 | 2.15 | 1.75 | 7 | 1 | 0 | 0 | 1 |
463 | libqmcwfs.so - TwoBodyJastrowRef.h:381-382 | miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evaluateGL(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib<qmcplusplus::TinyVector<double, 3u>, std::allocator<qmcplusplus::TinyVector<double, ... | Innermost | 0.06 | 0.13 | 0.07 | 112 | 176.44 | 100 | 50 | 1 | 1.38 | 2 | 1.86 | 1 | 2 | 0 | 0 | 0 |
559 | libqmcwfs.so - BsplineFunctor.h:305-336 | miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector<double, 3u>&) | Innermost | 0.05 | 0.09 | 0.06 | 112 | 551.85 | 99.43 | 48.78 | 1.12 | 1.59 | 2.2 | 1.8 | 11 | 2 | 0 | 0 | 3 |
656 | libqmcwfs.so - BsplineFunctor.h:236-241 | miniqmcreference::OneBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector<double, std::allocator<double> >&) | Innermost | 0.04 | 0.11 | 0.05 | 112 | 0.56 | 0 | 10 | 1 | 1 | 12.12 | 2.2 | NA | NA | NA | NA | NA |
466 | libqmcwfs.so - BsplineFunctor.h:291-298 | miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evaluateGL(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib<qmcplusplus::TinyVector<double, 3u>, std::allocator<qmcplusplus::TinyVector<double, ... | Innermost | 0.03 | 0.07 | 0.04 | 112 | 0.11 | 0 | 9.38 | 1.19 | 1 | 12.63 | 2.33 | NA | NA | NA | NA | NA |
556 | libqmcwfs.so - TwoBodyJastrowRef.h:269-271 [...] | miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector<double, 3u>&) | Outermost | 0.03 | 0.07 | 0.03 | 112 | 121.99 | 44.9 | 19.59 | 1.21 | 1.52 | 6.13 | 2.33 | NA | NA | NA | NA | NA |
748 | libqmcwfs.so - inner_product.hpp:82-83 | miniqmcreference::DiracDeterminantRef<qmcplusplus::DelayedUpdate<double, double> >::evaluateLog(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib<qmcplusplus::TinyVector<double, 3u>, std::allocator<qmcplusplus::TinyVector&l... | Innermost | 0.03 | 0.05 | 0.03 | 112 | 136.37 | 100 | 50 | 1 | 1.38 | 2 | 1.67 | 1 | 2 | 0 | 0 | 0 |
491 | libqmcwfs.so - BsplineFunctor.h:305-336 | miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::computeU3(qmcplusplus::ParticleSet const&, int, double const*, double*, double*, double*, bool) | Innermost | 0.02 | 0.06 | 0.03 | 112 | 630.22 | 99.43 | 48.78 | 1.12 | 1.59 | 2.2 | 2 | 11 | 2 | 0 | 0 | 3 |
243 | libqmcwfs.so - stl_algobase.h:918-919 | qmcplusplus::Vector<qmcplusplus::TinyVector<double, 3u>, std::allocator<qmcplusplus::TinyVector<double, 3u> > >::resize(unsigned long, qmcplusplus::TinyVector<double, 3u>) | Single | 0.02 | 0.04 | 0.02 | 110 | 0.00 | 50 | 18.75 | 2 | 1 | 5.33 | 2 | 0 | 0 | 1 | 0 | 0 |
564 | libqmcwfs.so - BsplineFunctor.h:232-260 [...] | miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector<double, std::allocator<double> >&) | InBetween | 0.02 | 0.05 | 0.03 | 112 | 263.14 | 27.88 | 16.13 | 1.07 | 2.05 | 6.18 | 1.67 | NA | NA | NA | NA | NA |
607 | libqmcwfs.so - OneBodyJastrow.h:192-193 | miniqmcreference::OneBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector<double, 3u>&) | Innermost | 0.02 | 0.06 | 0.03 | 112 | 336.18 | 100 | 50 | 1 | 1.38 | 2 | 2 | 0 | 2 | 0 | 0 | 0 |
687 | libqmcwfs.so - einspline_spo_ref.hpp:175-176 [...] | miniqmcreference::einspline_spo_ref<double>::evaluate(qmcplusplus::ParticleSet const&, int, qmcplusplus::Vector<double, std::allocator<double> >&) | Outermost | 0.01 | 0.04 | 0.01 | 112 | 36.55 | 11.59 | 14.63 | 1.24 | 1.95 | 8.81 | 4 | NA | NA | NA | NA | NA |
74 | exec - | main._omp_fn.1 | Innermost | 0.01 | 0.04 | 0.02 | 107 | 4.13 | 30.95 | 14.96 | 7.11 | 1 | 14.37 | 2 | 2 | 0 | 0 | 2 | 7 |
693 | libqmcwfs.so - MultiBsplineRef.hpp:227-262 [...] | void miniqmcreference::MultiBsplineEvalRef::evaluate_vgh<double>(qmcplusplus::bspline_traits<double, 3u>::SplineType const*, double, double, double, double*, double*, double*, unsigned long) | InBetween | 0.01 | 0.04 | 0.02 | 112 | 203.88 | 0 | 12.5 | 1.56 | 2.38 | 8 | 2 | 1 | 0 | 0 | 14 | 0 |
488 | libqmcwfs.so - TwoBodyJastrowRef.h:269-271 [...] | miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::computeU3(qmcplusplus::ParticleSet const&, int, double const*, double*, double*, double*, bool) | Outermost | 0.01 | 0.04 | 0.01 | 112 | 182.01 | 45 | 19.6 | 1.21 | 1.53 | 6.14 | 4 | NA | NA | NA | NA | NA |
604 | libqmcwfs.so - OneBodyJastrowRef.h:214-216 | miniqmcreference::OneBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::computeU3(qmcplusplus::ParticleSet&, int, double const*) | Innermost | 0.01 | 0.04 | 0.01 | 74 | 0.10 | 0 | 12.5 | 1 | 1 | 8 | 4 | 0 | 1 | 0 | 0 | 0 |
461 | libqmcwfs.so - TwoBodyJastrowRef.h:397-398 | miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evaluateGL(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib<qmcplusplus::TinyVector<double, 3u>, std::allocator<qmcplusplus::TinyVector<double, ... | Innermost | 0.01 | 0.04 | 0.02 | 112 | 634.09 | 100 | 50 | 1 | 1.02 | 2 | 2 | 1 | 2 | 2 | 0 | 0 |
563 | libqmcwfs.so - TwoBodyJastrowRef.h:107-132 [...] | miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector<double, std::allocator<double> >&) | Outermost | 0.01 | 0.04 | 0.01 | 111 | 30.65 | 12.5 | 14.39 | 2.67 | 1.9 | 10.19 | 4 | NA | NA | NA | NA | NA |
620 | libqmcwfs.so - OneBodyJastrow.h:193-193 | miniqmcreference::OneBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evaluateLog(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib<qmcplusplus::TinyVector<double, 3u>, std::allocator<qmcplusplus::TinyVector<double,... | Innermost | 0.01 | 0.03 | 0.02 | 112 | 102.60 | 100 | 50 | 1 | 1.38 | 2 | 1.5 | 0 | 2 | 0 | 0 | 0 |
478 | libqmcparticle_omptarget.so - ParticleBConds3DSoa.h:280-298 [...] | qmcplusplus::SoaDistanceTableABOMPTarget<double, 3u, 40>::evaluate(qmcplusplus::ParticleSet&) | InBetween | 0.01 | 0.03 | 0.01 | 112 | 359.66 | 0 | 11.21 | 1.12 | 1 | 8.95 | 3 | 4.5 | 2.5 | 1 | 0 | 0 |
653 | libqmcwfs.so - OneBodyJastrowRef.h:134-155 [...] | miniqmcreference::OneBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector<double, std::allocator<double> >&) | Outermost | 0.01 | 0.03 | 0.01 | 92 | 1.65 | 6.06 | 13.45 | 1.72 | 1.98 | 10.23 | 3 | NA | NA | NA | NA | NA |
40 | libqmcwfs.so - SPOSet.h:83-88 [...] | qmcplusplus::SPOSet::evaluateDetRatios(qmcplusplus::VirtualParticleSet const&, qmcplusplus::Vector<double, std::allocator<double> >&, qmcplusplus::Vector<double, std::allocator<double> > const&, std::vector<double, st... | Outermost | 0.01 | 0.03 | 0.01 | 112 | 59.00 | 63.46 | 29.57 | 1.83 | 2.26 | 4.95 | 3 | NA | NA | NA | NA | NA |
299 | libqmcparticle.so - stl_vector.h:988-988 [...] | qmcplusplus::ParticleSet::update(bool) | Single | 0.01 | 0.04 | 0.01 | 94 | 0.00 | NA | NA | 1 | NA | NA | 4 | 1 | 1 | 0 | 1 | 1 |
462 | libqmcwfs.so - TwoBodyJastrowRef.h:388-391 | miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evaluateGL(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib<qmcplusplus::TinyVector<double, 3u>, std::allocator<qmcplusplus::TinyVector<double, ... | Innermost | 0.01 | 0.03 | 0.01 | 112 | 841.43 | 100 | 50 | 1 | 1.02 | 2 | 3 | 1 | 5 | 0 | 0 | 0 |
608 | libqmcwfs.so - OneBodyJastrow.h:186-187 | miniqmcreference::OneBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector<double, 3u>&) | Single | 0.01 | 0.03 | 0.01 | 112 | 503.42 | 100 | 50 | 1 | 1.38 | 2 | 3 | 0 | 2 | 0 | 0 | 0 |