Function: miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evaluateGL(qmcp ... | Module: exec | Source: TwoBodyJastrowRef.h:268-432 [...] | Coverage: 0.11% |
---|
Function: miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evaluateGL(qmcp ... | Module: exec | Source: TwoBodyJastrowRef.h:268-432 [...] | Coverage: 0.11% |
---|
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/shared_ptr_base.h: 1308 - 1308 |
-------------------------------------------------------------------------------- |
1308: { return _M_ptr; } |
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/VectorSoAContainer.h: 231 - 273 |
-------------------------------------------------------------------------------- |
231: inline const AoSElement_t operator[](size_t i) const { return AoSElement_t(myData + i, nGhosts); } |
[...] |
244: *(_base + M * i) = rhs[i]; |
[...] |
263: inline Accessor operator()(size_t i) { return Accessor(myData + i, nGhosts); } |
[...] |
273: inline const T* restrict data(size_t i) const { return myData + i * nGhosts; } |
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/OhmmsVector.h: 223 - 249 |
-------------------------------------------------------------------------------- |
223: return X[i]; |
[...] |
229: return X[i]; |
[...] |
249: inline const_pointer data() const { return X; } |
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/stl_numeric.h: 126 - 127 |
-------------------------------------------------------------------------------- |
126: for (; __first != __last; ++__first) |
127: __init = __init + *__first; |
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/stl_algobase.h: 200 - 754 |
-------------------------------------------------------------------------------- |
200: if (__b < __a) |
[...] |
752: for (__decltype(__n + 0) __niter = __n; |
753: __niter > 0; --__niter, (void) ++__first) |
754: *__first = __tmp; |
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/stl_iterator.h: 784 - 887 |
-------------------------------------------------------------------------------- |
784: : _M_current(__i) { } |
[...] |
887: { return __lhs.base() != __rhs.base(); } |
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/Jastrow/TwoBodyJastrowRef.h: 268 - 432 |
-------------------------------------------------------------------------------- |
268: const int igt = P.GroupID[iat] * NumGroups; |
269: for (int jg = 0; jg < NumGroups; ++jg) |
270: { |
271: const FuncType& f2(*F[igt + jg]); |
272: int iStart = P.first(jg); |
273: int iEnd = std::min(jelmax, P.last(jg)); |
274: f2.evaluateVGL(iat, iStart, iEnd, dist, u, du, d2u, DistCompressed.data(), DistIndice.data()); |
[...] |
360: const auto& d_table = P.getDistTableAA(myTableID); |
361: for (int ig = 0; ig < NumGroups; ++ig) |
362: { |
363: const int igt = ig * NumGroups; |
364: for (int iat = P.first(ig), last = P.last(ig); iat < last; ++iat) |
365: { |
366: computeU3(P, iat, d_table.getDistRow(iat).data(), cur_u.data(), cur_du.data(), cur_d2u.data(), true); |
367: Uat[iat] = std::accumulate(cur_u.begin(), cur_u.begin() + iat, valT()); |
[...] |
375: for (int jat = 0; jat < iat; ++jat) |
376: lap += d2u[jat] + lapfac * du[jat]; |
377: for (int idim = 0; idim < OHMMS_DIM; ++idim) |
378: { |
379: const valT* restrict dX = displ.data(idim); |
380: valT s = valT(); |
381: for (int jat = 0; jat < iat; ++jat) |
382: s += du[jat] * dX[jat]; |
383: grad[idim] = s; |
384: } |
385: dUat(iat) = grad; |
386: d2Uat[iat] = -lap; |
387: // add the contribution from the upper triangle |
388: for (int jat = 0; jat < iat; jat++) |
389: { |
390: Uat[jat] += u[jat]; |
391: d2Uat[jat] -= d2u[jat] + lapfac * du[jat]; |
392: } |
393: for (int idim = 0; idim < OHMMS_DIM; ++idim) |
394: { |
395: valT* restrict save_g = dUat.data(idim); |
396: const valT* restrict dX = displ.data(idim); |
397: for (int jat = 0; jat < iat; jat++) |
398: save_g[jat] -= du[jat] * dX[jat]; |
[...] |
419: { |
420: if (fromscratch) |
421: recompute(P); |
422: LogValue = valT(0); |
423: for (int iat = 0; iat < N; ++iat) |
424: { |
425: LogValue += Uat[iat]; |
426: G[iat] += dUat[iat]; |
427: L[iat] += d2Uat[iat]; |
428: } |
429: |
430: constexpr valT mhalf(-0.5); |
431: LogValue = mhalf * LogValue; |
432: } |
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/Particle/DistanceTable.h: 268 - 268 |
-------------------------------------------------------------------------------- |
268: const DistRow& getDistRow(int iel) const { return distances_[iel]; } |
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/Numerics/PETE/OperatorTags.h: 94 - 94 |
-------------------------------------------------------------------------------- |
94: (const_cast<T1&>(a) += b); |
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/stl_vector.h: 951 - 1056 |
-------------------------------------------------------------------------------- |
951: return *(this->_M_impl._M_start + __n); |
[...] |
1056: { return _M_data_ptr(this->_M_impl._M_start); } |
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/Particle/ParticleSet.h: 313 - 316 |
-------------------------------------------------------------------------------- |
313: inline int first(int igroup) const { return (*group_offsets_)[igroup]; } |
314: |
315: ///return the last index of a group i |
316: inline int last(int igroup) const { return (*group_offsets_)[igroup + 1]; } |
0x41f5b0 PUSH %RBP |
0x41f5b1 MOV %RSP,%RBP |
0x41f5b4 PUSH %R15 |
0x41f5b6 PUSH %R14 |
0x41f5b8 PUSH %R13 |
0x41f5ba PUSH %R12 |
0x41f5bc PUSH %RBX |
0x41f5bd SUB $0x98,%RSP |
0x41f5c4 MOV %RCX,-0x98(%RBP) |
0x41f5cb MOV %RDX,-0x90(%RBP) |
0x41f5d2 MOV %RDI,%R13 |
0x41f5d5 TEST %R8B,%R8B |
0x41f5d8 JE 41fe9c |
0x41f5de MOV %RSI,%R14 |
0x41f5e1 MOV 0x248(%R13),%ESI |
0x41f5e8 MOV %R14,%RDI |
0x41f5eb CALL 460cd0 <_ZNK11qmcplusplus11ParticleSet14getDistTableAAEi> |
0x41f5f0 MOV %RAX,-0x88(%RBP) |
0x41f5f7 MOV 0xa0(%R13),%R9 |
0x41f5fe TEST %R9,%R9 |
0x41f601 JE 41fe9c |
0x41f607 XOR %ECX,%ECX |
0x41f609 VMOVSD 0xd87d7(%RIP),%XMM5 |
0x41f611 VBROADCASTSD 0xd7606(%RIP),%YMM6 |
0x41f61a MOV %R9,%R12 |
0x41f61d MOV %R13,-0x70(%RBP) |
0x41f621 MOV %R14,-0x68(%RBP) |
0x41f625 JMP 41f64d |
0x41f627 NOPW (%RAX,%RAX,1) |
(355) 0x41f630 MOV %R12,%RAX |
(355) 0x41f633 MOV -0xa0(%RBP),%RCX |
(355) 0x41f63a INC %RCX |
(355) 0x41f63d MOV %RAX,%R12 |
(355) 0x41f640 CMP %RCX,%RAX |
(355) 0x41f643 MOV -0x68(%RBP),%R14 |
(355) 0x41f647 JBE 41fe9c |
(355) 0x41f64d MOV 0x268(%R14),%RAX |
(355) 0x41f654 MOV 0x18(%RAX),%RAX |
(355) 0x41f658 MOVSXD (%RAX,%RCX,4),%RSI |
(355) 0x41f65c MOV %RCX,-0xa0(%RBP) |
(355) 0x41f663 MOVSXD 0x4(%RAX,%RCX,4),%RAX |
(355) 0x41f668 MOV %RAX,-0xb0(%RBP) |
(355) 0x41f66f CMP %EAX,%ESI |
(355) 0x41f671 JGE 41f630 |
(355) 0x41f673 MOV 0x140(%R13),%R15 |
(355) 0x41f67a MOV 0x158(%R13),%R11 |
(355) 0x41f681 MOV 0x170(%R13),%RAX |
(355) 0x41f688 MOV %RAX,-0x40(%RBP) |
(355) 0x41f68c MOV $0x1fffffffffffffff,%RAX |
(355) 0x41f696 ADD %RSI,%RAX |
(355) 0x41f699 MOV %RAX,-0x78(%RBP) |
(355) 0x41f69d MOVQ $0,-0x80(%RBP) |
(355) 0x41f6a5 LEA -0x1(%RSI),%RAX |
(355) 0x41f6a9 MOV %RAX,-0xa8(%RBP) |
(355) 0x41f6b0 JMP 41f6db |
0x41f6b2 NOPW %CS:(%RAX,%RAX,1) |
(356) 0x41f6c0 INC %RSI |
(356) 0x41f6c3 INCQ -0x80(%RBP) |
(356) 0x41f6c7 INCQ -0x78(%RBP) |
(356) 0x41f6cb MOV %R9,%RAX |
(356) 0x41f6ce CMP -0xb0(%RBP),%RSI |
(356) 0x41f6d5 JE 41f633 |
(356) 0x41f6db MOV %R11,-0x38(%RBP) |
(356) 0x41f6df MOV -0x88(%RBP),%RAX |
(356) 0x41f6e6 MOV 0x48(%RAX),%RAX |
(356) 0x41f6ea LEA (%RSI,%RSI,4),%RCX |
(356) 0x41f6ee MOV %RCX,-0x58(%RBP) |
(356) 0x41f6f2 MOV 0x18(%RAX,%RCX,8),%R8 |
(356) 0x41f6f7 TEST %RSI,%RSI |
(356) 0x41f6fa MOV %RSI,-0x50(%RBP) |
(356) 0x41f6fe JLE 41f757 |
(356) 0x41f700 MOV %ESI,%EBX |
(356) 0x41f702 SAL $0x3,%RBX |
(356) 0x41f706 MOV %R15,%RDI |
(356) 0x41f709 XOR %ESI,%ESI |
(356) 0x41f70b MOV %RBX,%RDX |
(356) 0x41f70e MOV %R9,%R14 |
(356) 0x41f711 MOV %R8,%R13 |
(356) 0x41f714 VZEROUPPER |
(356) 0x41f717 CALL 4e7e80 <_intel_fast_memset> |
(356) 0x41f71c MOV -0x38(%RBP),%RDI |
(356) 0x41f720 XOR %ESI,%ESI |
(356) 0x41f722 MOV %RBX,%RDX |
(356) 0x41f725 CALL 4e7e80 <_intel_fast_memset> |
(356) 0x41f72a MOV -0x40(%RBP),%RDI |
(356) 0x41f72e XOR %ESI,%ESI |
(356) 0x41f730 MOV %RBX,%RDX |
(356) 0x41f733 CALL 4e7e80 <_intel_fast_memset> |
(356) 0x41f738 MOV %R13,%R8 |
(356) 0x41f73b MOV -0x70(%RBP),%R13 |
(356) 0x41f73f MOV -0x50(%RBP),%RSI |
(356) 0x41f743 MOV %R14,%R9 |
(356) 0x41f746 VBROADCASTSD 0xd74d1(%RIP),%YMM6 |
(356) 0x41f74f VMOVSD 0xd8691(%RIP),%XMM5 |
(356) 0x41f757 TEST %R12,%R12 |
(356) 0x41f75a JE 41f820 |
(356) 0x41f760 MOV -0x68(%RBP),%RAX |
(356) 0x41f764 MOV 0x18(%RAX),%RAX |
(356) 0x41f768 IMUL (%RAX,%RSI,4),%R12D |
(356) 0x41f76d MOV %R13,%RBX |
(356) 0x41f770 MOV %R15,-0x48(%RBP) |
(356) 0x41f774 MOVSXD %R12D,%RAX |
(356) 0x41f777 SAL $0x3,%RAX |
(356) 0x41f77b MOV %RAX,-0x60(%RBP) |
(356) 0x41f77f MOV $0x1,%R12D |
(356) 0x41f785 MOV -0x38(%RBP),%R14 |
(356) 0x41f789 MOV -0x40(%RBP),%R13 |
(356) 0x41f78d NOPL (%RAX) |
(371) 0x41f790 MOV 0x200(%RBX),%RAX |
(371) 0x41f797 ADD -0x60(%RBP),%RAX |
(371) 0x41f79b MOV -0x8(%RAX,%R12,8),%RDI |
(371) 0x41f7a0 MOV -0x68(%RBP),%RAX |
(371) 0x41f7a4 MOV 0x268(%RAX),%RAX |
(371) 0x41f7ab MOV 0x18(%RAX),%RAX |
(371) 0x41f7af MOV -0x4(%RAX,%R12,4),%EDX |
(371) 0x41f7b4 MOVSXD (%RAX,%R12,4),%RAX |
(371) 0x41f7b8 CMP %RAX,%RSI |
(371) 0x41f7bb MOV %ESI,%ECX |
(371) 0x41f7bd CMOVG %EAX,%ECX |
(371) 0x41f7c0 MOV %R8,%R15 |
(371) 0x41f7c3 MOV -0x48(%RBP),%R9 |
(371) 0x41f7c7 PUSHQ 0x1e8(%RBX) |
(371) 0x41f7cd PUSHQ 0x1d0(%RBX) |
(371) 0x41f7d3 PUSH %R13 |
(371) 0x41f7d5 PUSH %R14 |
(371) 0x41f7d7 VZEROUPPER |
(371) 0x41f7da CALL 41c590 <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi> |
(371) 0x41f7df MOV %R15,%R8 |
(371) 0x41f7e2 MOV -0x50(%RBP),%RSI |
(371) 0x41f7e6 ADD $0x20,%RSP |
(371) 0x41f7ea MOV %R12D,%EAX |
(371) 0x41f7ed MOV 0xa0(%RBX),%R9 |
(371) 0x41f7f4 INC %R12 |
(371) 0x41f7f7 CMP %RAX,%R9 |
(371) 0x41f7fa JA 41f790 |
(356) 0x41f7fc MOV 0x140(%RBX),%R15 |
(356) 0x41f803 MOV %R9,%R12 |
(356) 0x41f806 MOV %RBX,%R13 |
(356) 0x41f809 VMOVSD 0xd85d7(%RIP),%XMM5 |
(356) 0x41f811 VBROADCASTSD 0xd7406(%RIP),%YMM6 |
(356) 0x41f81a JMP 41f823 |
0x41f81c NOPL (%RAX) |
(356) 0x41f820 XOR %R12D,%R12D |
(356) 0x41f823 VXORPD %XMM0,%XMM0,%XMM0 |
(356) 0x41f827 VXORPD %XMM1,%XMM1,%XMM1 |
(356) 0x41f82b MOV $0x1fffffffffffffff,%RAX |
(356) 0x41f835 TEST %RAX,%RSI |
(356) 0x41f838 JE 41f8ae |
(356) 0x41f83a LEA (%RSI,%RAX,1),%RCX |
(356) 0x41f83e AND %RAX,%RCX |
(356) 0x41f841 INC %RCX |
(356) 0x41f844 MOV %RCX,%RAX |
(356) 0x41f847 MOV $0x3ffffffffffffffc,%RDX |
(356) 0x41f851 AND %RDX,%RAX |
(356) 0x41f854 JE 41f890 |
(356) 0x41f856 VXORPD %XMM1,%XMM1,%XMM1 |
(356) 0x41f85a XOR %EDX,%EDX |
(356) 0x41f85c NOPL (%RAX) |
(370) 0x41f860 VADDPD (%R15,%RDX,8),%YMM1,%YMM1 |
(370) 0x41f866 ADD $0x4,%RDX |
(370) 0x41f86a CMP %RAX,%RDX |
(370) 0x41f86d JB 41f860 |
(356) 0x41f86f VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(356) 0x41f875 VADDPD %XMM2,%XMM1,%XMM1 |
(356) 0x41f879 VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(356) 0x41f87e VADDSD %XMM2,%XMM1,%XMM1 |
(356) 0x41f882 CMP %RAX,%RCX |
(356) 0x41f885 JNE 41f892 |
(356) 0x41f887 JMP 41f8ae |
0x41f889 NOPL (%RAX) |
(356) 0x41f890 XOR %EAX,%EAX |
(356) 0x41f892 MOV $0x3d,%CL |
(356) 0x41f894 BZHI %RCX,-0x78(%RBP),%RCX |
(356) 0x41f89a INC %RCX |
(356) 0x41f89d NOPL (%RAX) |
(369) 0x41f8a0 VADDSD (%R15,%RAX,8),%XMM1,%XMM1 |
(369) 0x41f8a6 INC %RAX |
(369) 0x41f8a9 CMP %RAX,%RCX |
(369) 0x41f8ac JNE 41f8a0 |
(356) 0x41f8ae MOV 0xd8(%R13),%RDX |
(356) 0x41f8b5 VMOVSD %XMM1,(%RDX,%RSI,8) |
(356) 0x41f8ba MOV 0x158(%R13),%R11 |
(356) 0x41f8c1 MOV 0x170(%R13),%R10 |
(356) 0x41f8c8 MOV -0x88(%RBP),%RAX |
(356) 0x41f8cf MOV 0x60(%RAX),%RAX |
(356) 0x41f8d3 TEST %RSI,%RSI |
(356) 0x41f8d6 JLE 41f954 |
(356) 0x41f8d8 MOV %RSI,%RCX |
(356) 0x41f8db AND $-0x4,%RCX |
(356) 0x41f8df JE 41f930 |
(356) 0x41f8e1 LEA -0x1(%RCX),%R8 |
(356) 0x41f8e5 VXORPD %XMM0,%XMM0,%XMM0 |
(356) 0x41f8e9 XOR %EDI,%EDI |
(356) 0x41f8eb VBROADCASTSD 0xd84f4(%RIP),%YMM1 |
(356) 0x41f8f4 NOPW %CS:(%RAX,%RAX,1) |
(368) 0x41f900 VADDPD (%R10,%RDI,8),%YMM0,%YMM0 |
(368) 0x41f906 VFMADD231PD (%R11,%RDI,8),%YMM1,%YMM0 |
(368) 0x41f90c ADD $0x4,%RDI |
(368) 0x41f910 CMP %R8,%RDI |
(368) 0x41f913 JLE 41f900 |
(356) 0x41f915 VEXTRACTF128 $0x1,%YMM0,%XMM1 |
(356) 0x41f91b VADDPD %XMM1,%XMM0,%XMM0 |
(356) 0x41f91f VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(356) 0x41f924 VADDSD %XMM1,%XMM0,%XMM0 |
(356) 0x41f928 JMP 41f94f |
0x41f92a NOPW (%RAX,%RAX,1) |
(356) 0x41f930 VXORPD %XMM0,%XMM0,%XMM0 |
(356) 0x41f934 XOR %ECX,%ECX |
(356) 0x41f936 NOPW %CS:(%RAX,%RAX,1) |
(367) 0x41f940 VADDSD (%R10,%RCX,8),%XMM0,%XMM0 |
(367) 0x41f946 VFMADD231SD (%R11,%RCX,8),%XMM5,%XMM0 |
(367) 0x41f94c INC %RCX |
(367) 0x41f94f CMP %RCX,%RSI |
(367) 0x41f952 JNE 41f940 |
(356) 0x41f954 MOV -0x58(%RBP),%RCX |
(356) 0x41f958 MOV 0x8(%RAX,%RCX,8),%R14 |
(356) 0x41f95d MOV 0x18(%RAX,%RCX,8),%RAX |
(356) 0x41f962 VXORPD %XMM1,%XMM1,%XMM1 |
(356) 0x41f966 VXORPD %XMM2,%XMM2,%XMM2 |
(356) 0x41f96a TEST %RSI,%RSI |
(356) 0x41f96d JLE 41f9e4 |
(356) 0x41f96f MOV %RSI,%R8 |
(356) 0x41f972 AND $-0x4,%R8 |
(356) 0x41f976 JE 41f9c0 |
(356) 0x41f978 LEA -0x1(%R8),%RCX |
(356) 0x41f97c VXORPD %XMM2,%XMM2,%XMM2 |
(356) 0x41f980 XOR %EDI,%EDI |
(356) 0x41f982 NOPW %CS:(%RAX,%RAX,1) |
(366) 0x41f990 VMOVUPD (%RAX,%RDI,8),%YMM3 |
(366) 0x41f995 VFMADD231PD (%R11,%RDI,8),%YMM3,%YMM2 |
(366) 0x41f99b ADD $0x4,%RDI |
(366) 0x41f99f CMP %RCX,%RDI |
(366) 0x41f9a2 JLE 41f990 |
(356) 0x41f9a4 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(356) 0x41f9aa VADDPD %XMM3,%XMM2,%XMM2 |
(356) 0x41f9ae VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(356) 0x41f9b3 VADDSD %XMM3,%XMM2,%XMM2 |
(356) 0x41f9b7 JMP 41f9df |
0x41f9b9 NOPL (%RAX) |
(356) 0x41f9c0 XOR %R8D,%R8D |
(356) 0x41f9c3 NOPW %CS:(%RAX,%RAX,1) |
(365) 0x41f9d0 VMOVSD (%RAX,%R8,8),%XMM3 |
(365) 0x41f9d6 VFMADD231SD (%R11,%R8,8),%XMM3,%XMM2 |
(365) 0x41f9dc INC %R8 |
(365) 0x41f9df CMP %R8,%RSI |
(365) 0x41f9e2 JNE 41f9d0 |
(356) 0x41f9e4 MOV %R10,-0x40(%RBP) |
(356) 0x41f9e8 TEST %RSI,%RSI |
(356) 0x41f9eb JLE 41fa64 |
(356) 0x41f9ed MOV %RSI,%R10 |
(356) 0x41f9f0 AND $-0x4,%R10 |
(356) 0x41f9f4 JE 41fa40 |
(356) 0x41f9f6 LEA -0x1(%R10),%RCX |
(356) 0x41f9fa LEA (%RAX,%R14,8),%RDI |
(356) 0x41f9fe VXORPD %XMM1,%XMM1,%XMM1 |
(356) 0x41fa02 XOR %R8D,%R8D |
(356) 0x41fa05 NOPW %CS:(%RAX,%RAX,1) |
(364) 0x41fa10 VMOVUPD (%RDI,%R8,8),%YMM3 |
(364) 0x41fa16 VFMADD231PD (%R11,%R8,8),%YMM3,%YMM1 |
(364) 0x41fa1c ADD $0x4,%R8 |
(364) 0x41fa20 CMP %RCX,%R8 |
(364) 0x41fa23 JLE 41fa10 |
(356) 0x41fa25 VEXTRACTF128 $0x1,%YMM1,%XMM3 |
(356) 0x41fa2b VADDPD %XMM3,%XMM1,%XMM1 |
(356) 0x41fa2f VSHUFPD $0x1,%XMM1,%XMM1,%XMM3 |
(356) 0x41fa34 VADDSD %XMM3,%XMM1,%XMM1 |
(356) 0x41fa38 CMP %R10,%RSI |
(356) 0x41fa3b JNE 41fa47 |
(356) 0x41fa3d JMP 41fa64 |
0x41fa3f NOP |
(356) 0x41fa40 VXORPD %XMM1,%XMM1,%XMM1 |
(356) 0x41fa44 XOR %R10D,%R10D |
(356) 0x41fa47 LEA (%RAX,%R14,8),%RCX |
(356) 0x41fa4b NOPL (%RAX,%RAX,1) |
(363) 0x41fa50 VMOVSD (%RCX,%R10,8),%XMM3 |
(363) 0x41fa56 VFMADD231SD (%R11,%R10,8),%XMM3,%XMM1 |
(363) 0x41fa5c INC %R10 |
(363) 0x41fa5f CMP %R10,%RSI |
(363) 0x41fa62 JNE 41fa50 |
(356) 0x41fa64 TEST %RSI,%RSI |
(356) 0x41fa67 JLE 41fac0 |
(356) 0x41fa69 MOV %RSI,%R10 |
(356) 0x41fa6c AND $-0x4,%R10 |
(356) 0x41fa70 JE 41fad0 |
(356) 0x41fa72 LEA -0x1(%R10),%RCX |
(356) 0x41fa76 MOV %R14,%RDI |
(356) 0x41fa79 SAL $0x4,%RDI |
(356) 0x41fa7d ADD %RAX,%RDI |
(356) 0x41fa80 VXORPD %XMM3,%XMM3,%XMM3 |
(356) 0x41fa84 XOR %R8D,%R8D |
(356) 0x41fa87 NOPW (%RAX,%RAX,1) |
(362) 0x41fa90 VMOVUPD (%RDI,%R8,8),%YMM4 |
(362) 0x41fa96 VFMADD231PD (%R11,%R8,8),%YMM4,%YMM3 |
(362) 0x41fa9c ADD $0x4,%R8 |
(362) 0x41faa0 CMP %RCX,%R8 |
(362) 0x41faa3 JLE 41fa90 |
(356) 0x41faa5 VEXTRACTF128 $0x1,%YMM3,%XMM4 |
(356) 0x41faab VADDPD %XMM4,%XMM3,%XMM3 |
(356) 0x41faaf VSHUFPD $0x1,%XMM3,%XMM3,%XMM4 |
(356) 0x41fab4 VADDSD %XMM4,%XMM3,%XMM3 |
(356) 0x41fab8 CMP %R10,%RSI |
(356) 0x41fabb JNE 41fad7 |
(356) 0x41fabd JMP 41fb04 |
0x41fabf NOP |
(356) 0x41fac0 VXORPD %XMM3,%XMM3,%XMM3 |
(356) 0x41fac4 JMP 41fb04 |
0x41fac6 NOPW %CS:(%RAX,%RAX,1) |
(356) 0x41fad0 VXORPD %XMM3,%XMM3,%XMM3 |
(356) 0x41fad4 XOR %R10D,%R10D |
(356) 0x41fad7 MOV %R14,%RCX |
(356) 0x41fada SAL $0x4,%RCX |
(356) 0x41fade ADD %RAX,%RCX |
(356) 0x41fae1 NOPW %CS:(%RAX,%RAX,1) |
(361) 0x41faf0 VMOVSD (%RCX,%R10,8),%XMM4 |
(361) 0x41faf6 VFMADD231SD (%R11,%R10,8),%XMM4,%XMM3 |
(361) 0x41fafc INC %R10 |
(361) 0x41faff CMP %R10,%RSI |
(361) 0x41fb02 JNE 41faf0 |
(356) 0x41fb04 MOV %R14,-0x60(%RBP) |
(356) 0x41fb08 MOV 0xf0(%R13),%RDI |
(356) 0x41fb0f MOV 0x100(%R13),%R14 |
(356) 0x41fb16 LEA (%RSI,%RDI,1),%RCX |
(356) 0x41fb1a VMOVSD %XMM2,(%R14,%RSI,8) |
(356) 0x41fb20 VMOVSD %XMM1,(%R14,%RCX,8) |
(356) 0x41fb26 MOV %RDI,-0x58(%RBP) |
(356) 0x41fb2a LEA (%RSI,%RDI,2),%RCX |
(356) 0x41fb2e VMOVSD %XMM3,(%R14,%RCX,8) |
(356) 0x41fb34 VXORPD 0xd7124(%RIP),%XMM0,%XMM0 |
(356) 0x41fb3c MOV 0x128(%R13),%R8 |
(356) 0x41fb43 VMOVLPD %XMM0,(%R8,%RSI,8) |
(356) 0x41fb49 TEST %RSI,%RSI |
(356) 0x41fb4c JLE 41f6c0 |
(356) 0x41fb52 MOV %R12,-0xb8(%RBP) |
(356) 0x41fb59 MOV %R9,-0xc0(%RBP) |
(356) 0x41fb60 LEA -0x1(%RSI),%R9 |
(356) 0x41fb64 MOV %R11,%R13 |
(356) 0x41fb67 LEA (%RDX,%R9,8),%R11 |
(356) 0x41fb6b CMP %R8,%R11 |
(356) 0x41fb6e SETAEB -0x2d(%RBP) |
(356) 0x41fb72 LEA (%R8,%R9,8),%RDI |
(356) 0x41fb76 CMP %RDX,%RDI |
(356) 0x41fb79 SETAE %CL |
(356) 0x41fb7c CMP %R15,%R11 |
(356) 0x41fb7f MOV %R15,%RSI |
(356) 0x41fb82 SETB %R15B |
(356) 0x41fb86 LEA (%RSI,%R9,8),%R10 |
(356) 0x41fb8a CMP %RDX,%R10 |
(356) 0x41fb8d SETBB -0x2c(%RBP) |
(356) 0x41fb91 CMP %R8,%R10 |
(356) 0x41fb94 SETB %R12B |
(356) 0x41fb98 MOV %RSI,-0x48(%RBP) |
(356) 0x41fb9c CMP %RSI,%RDI |
(356) 0x41fb9f SETBB -0x2b(%RBP) |
(356) 0x41fba3 CMP %R13,%R11 |
(356) 0x41fba6 SETB %R10B |
(356) 0x41fbaa LEA (,%R9,8),%RBX |
(356) 0x41fbb2 ADD %R13,%RBX |
(356) 0x41fbb5 CMP %RDX,%RBX |
(356) 0x41fbb8 SETBB -0x2a(%RBP) |
(356) 0x41fbbc MOV -0x40(%RBP),%RSI |
(356) 0x41fbc0 CMP %RSI,%R11 |
(356) 0x41fbc3 SETB %R11B |
(356) 0x41fbc7 LEA (%RSI,%R9,8),%R9 |
(356) 0x41fbcb CMP %RDX,%R9 |
(356) 0x41fbce SETBB -0x29(%RBP) |
(356) 0x41fbd2 CMP %R8,%RBX |
(356) 0x41fbd5 SETB %BL |
(356) 0x41fbd8 MOV %R13,-0x38(%RBP) |
(356) 0x41fbdc CMP %R13,%RDI |
(356) 0x41fbdf SETB %R13B |
(356) 0x41fbe3 CMP %R8,%R9 |
(356) 0x41fbe6 SETB %R9B |
(356) 0x41fbea CMP %RSI,%RDI |
(356) 0x41fbed SETB %SIL |
(356) 0x41fbf1 TEST %CL,-0x2d(%RBP) |
(356) 0x41fbf4 JNE 41fc90 |
(356) 0x41fbfa OR -0x2c(%RBP),%R15B |
(356) 0x41fbfe JE 41fc90 |
(356) 0x41fc04 OR -0x2b(%RBP),%R12B |
(356) 0x41fc08 JE 41fc90 |
(356) 0x41fc0e OR -0x2a(%RBP),%R10B |
(356) 0x41fc12 JE 41fc90 |
(356) 0x41fc14 OR -0x29(%RBP),%R11B |
(356) 0x41fc18 JE 41fc90 |
(356) 0x41fc1a OR %R13B,%BL |
(356) 0x41fc1d JE 41fc90 |
(356) 0x41fc1f OR %SIL,%R9B |
(356) 0x41fc22 JE 41fc90 |
(356) 0x41fc24 MOV -0x50(%RBP),%RSI |
(356) 0x41fc28 MOV %RSI,%R9 |
(356) 0x41fc2b AND $-0x4,%R9 |
(356) 0x41fc2f VMOVSD 0xd6fe9(%RIP),%XMM1 |
(356) 0x41fc37 JE 41fce1 |
(356) 0x41fc3d LEA -0x1(%R9),%RCX |
(356) 0x41fc41 XOR %EDI,%EDI |
(356) 0x41fc43 MOV -0x48(%RBP),%R10 |
(356) 0x41fc47 MOV -0x38(%RBP),%R11 |
(356) 0x41fc4b MOV -0x40(%RBP),%RBX |
(356) 0x41fc4f NOP |
(360) 0x41fc50 VMOVUPD (%RDX,%RDI,8),%YMM0 |
(360) 0x41fc55 VADDPD (%R10,%RDI,8),%YMM0,%YMM0 |
(360) 0x41fc5b VMOVUPD %YMM0,(%RDX,%RDI,8) |
(360) 0x41fc60 VMOVUPD (%R11,%RDI,8),%YMM0 |
(360) 0x41fc66 VFMSUB213PD (%RBX,%RDI,8),%YMM6,%YMM0 |
(360) 0x41fc6c VADDPD (%R8,%RDI,8),%YMM0,%YMM0 |
(360) 0x41fc72 VMOVUPD %YMM0,(%R8,%RDI,8) |
(360) 0x41fc78 ADD $0x4,%RDI |
(360) 0x41fc7c CMP %RCX,%RDI |
(360) 0x41fc7f JLE 41fc50 |
(356) 0x41fc81 JMP 41fd1d |
0x41fc86 NOPW %CS:(%RAX,%RAX,1) |
(356) 0x41fc90 XOR %ECX,%ECX |
(356) 0x41fc92 VMOVSD 0xd6f86(%RIP),%XMM1 |
(356) 0x41fc9a MOV -0x50(%RBP),%RSI |
(356) 0x41fc9e MOV -0x48(%RBP),%RDI |
(356) 0x41fca2 MOV -0x38(%RBP),%R9 |
(356) 0x41fca6 MOV -0x40(%RBP),%R10 |
(356) 0x41fcaa NOPW (%RAX,%RAX,1) |
(357) 0x41fcb0 VMOVSD (%RDX,%RCX,8),%XMM0 |
(357) 0x41fcb5 VADDSD (%RDI,%RCX,8),%XMM0,%XMM0 |
(357) 0x41fcba VMOVSD %XMM0,(%RDX,%RCX,8) |
(357) 0x41fcbf VMOVSD (%R9,%RCX,8),%XMM0 |
(357) 0x41fcc5 VFMSUB213SD (%R10,%RCX,8),%XMM1,%XMM0 |
(357) 0x41fccb VADDSD (%R8,%RCX,8),%XMM0,%XMM0 |
(357) 0x41fcd1 VMOVSD %XMM0,(%R8,%RCX,8) |
(357) 0x41fcd7 INC %RCX |
(357) 0x41fcda CMP %RCX,%RSI |
(357) 0x41fcdd JNE 41fcb0 |
(356) 0x41fcdf JMP 41fd22 |
(356) 0x41fce1 XOR %R9D,%R9D |
(356) 0x41fce4 MOV -0x48(%RBP),%R10 |
(356) 0x41fce8 MOV -0x38(%RBP),%R11 |
(356) 0x41fcec MOV -0x40(%RBP),%RBX |
(359) 0x41fcf0 VMOVSD (%RDX,%R9,8),%XMM0 |
(359) 0x41fcf6 VADDSD (%R10,%R9,8),%XMM0,%XMM0 |
(359) 0x41fcfc VMOVSD %XMM0,(%RDX,%R9,8) |
(359) 0x41fd02 VMOVSD (%R11,%R9,8),%XMM0 |
(359) 0x41fd08 VFMSUB213SD (%RBX,%R9,8),%XMM1,%XMM0 |
(359) 0x41fd0e VADDSD (%R8,%R9,8),%XMM0,%XMM0 |
(359) 0x41fd14 VMOVSD %XMM0,(%R8,%R9,8) |
(359) 0x41fd1a INC %R9 |
(359) 0x41fd1d CMP %R9,%RSI |
(359) 0x41fd20 JNE 41fcf0 |
(356) 0x41fd22 MOV -0xa8(%RBP),%RCX |
(356) 0x41fd29 ADD -0x80(%RBP),%RCX |
(356) 0x41fd2d JNE 41fd40 |
(356) 0x41fd2f XOR %EDX,%EDX |
(356) 0x41fd31 MOV -0x38(%RBP),%RCX |
(356) 0x41fd35 JMP 41fe1b |
0x41fd3a NOPW (%RAX,%RAX,1) |
(356) 0x41fd40 MOV %RSI,%R8 |
(356) 0x41fd43 AND $-0x2,%R8 |
(356) 0x41fd47 LEA 0x8(%RAX),%R9 |
(356) 0x41fd4b LEA 0x8(%R14),%R10 |
(356) 0x41fd4f MOV -0x60(%RBP),%RCX |
(356) 0x41fd53 LEA (%RAX,%RCX,8),%R11 |
(356) 0x41fd57 ADD $0x8,%R11 |
(356) 0x41fd5b MOV -0x58(%RBP),%RDX |
(356) 0x41fd5f LEA (%R14,%RDX,8),%R15 |
(356) 0x41fd63 ADD $0x8,%R15 |
(356) 0x41fd67 SAL $0x4,%RCX |
(356) 0x41fd6b LEA (%RAX,%RCX,1),%RBX |
(356) 0x41fd6f ADD $0x8,%RBX |
(356) 0x41fd73 MOV %RDX,%RCX |
(356) 0x41fd76 SAL $0x4,%RCX |
(356) 0x41fd7a LEA (%R14,%RCX,1),%R12 |
(356) 0x41fd7e ADD $0x8,%R12 |
(356) 0x41fd82 XOR %EDX,%EDX |
(356) 0x41fd84 MOV -0x38(%RBP),%RCX |
(356) 0x41fd88 NOPL (%RAX,%RAX,1) |
(358) 0x41fd90 VMOVSD (%RCX,%RDX,8),%XMM0 |
(358) 0x41fd95 VMOVSD -0x8(%R9,%RDX,8),%XMM1 |
(358) 0x41fd9c VFNMADD213SD -0x8(%R10,%RDX,8),%XMM0,%XMM1 |
(358) 0x41fda3 VMOVSD %XMM1,-0x8(%R10,%RDX,8) |
(358) 0x41fdaa VMOVSD -0x8(%R11,%RDX,8),%XMM1 |
(358) 0x41fdb1 VFNMADD213SD -0x8(%R15,%RDX,8),%XMM0,%XMM1 |
(358) 0x41fdb8 VMOVSD %XMM1,-0x8(%R15,%RDX,8) |
(358) 0x41fdbf VMOVSD -0x8(%RBX,%RDX,8),%XMM1 |
(358) 0x41fdc5 VFNMADD213SD -0x8(%R12,%RDX,8),%XMM0,%XMM1 |
(358) 0x41fdcc VMOVSD %XMM1,-0x8(%R12,%RDX,8) |
(358) 0x41fdd3 VMOVSD 0x8(%RCX,%RDX,8),%XMM0 |
(358) 0x41fdd9 VMOVSD (%R9,%RDX,8),%XMM1 |
(358) 0x41fddf VFNMADD213SD (%R10,%RDX,8),%XMM0,%XMM1 |
(358) 0x41fde5 VMOVSD %XMM1,(%R10,%RDX,8) |
(358) 0x41fdeb VMOVSD (%R11,%RDX,8),%XMM1 |
(358) 0x41fdf1 VFNMADD213SD (%R15,%RDX,8),%XMM0,%XMM1 |
(358) 0x41fdf7 VMOVSD %XMM1,(%R15,%RDX,8) |
(358) 0x41fdfd VMOVSD (%RBX,%RDX,8),%XMM1 |
(358) 0x41fe02 VFNMADD213SD (%R12,%RDX,8),%XMM0,%XMM1 |
(358) 0x41fe08 VMOVSD %XMM1,(%R12,%RDX,8) |
(358) 0x41fe0e ADD $0x2,%RDX |
(358) 0x41fe12 CMP %RDX,%R8 |
(358) 0x41fe15 JNE 41fd90 |
(356) 0x41fe1b MOV -0x50(%RBP),%RSI |
(356) 0x41fe1f TEST $0x1,%SIL |
(356) 0x41fe23 MOV -0x70(%RBP),%R13 |
(356) 0x41fe27 MOV -0xc0(%RBP),%R9 |
(356) 0x41fe2e MOV -0x48(%RBP),%R15 |
(356) 0x41fe32 MOV -0xb8(%RBP),%R12 |
(356) 0x41fe39 MOV %RCX,%R11 |
(356) 0x41fe3c JE 41f6c0 |
(356) 0x41fe42 VMOVSD (%R11,%RDX,8),%XMM0 |
(356) 0x41fe48 VMOVSD (%RAX,%RDX,8),%XMM1 |
(356) 0x41fe4d VFNMADD213SD (%R14,%RDX,8),%XMM0,%XMM1 |
(356) 0x41fe53 VMOVSD %XMM1,(%R14,%RDX,8) |
(356) 0x41fe59 MOV -0x60(%RBP),%RDI |
(356) 0x41fe5d LEA (%RDI,%RDI,1),%RCX |
(356) 0x41fe61 ADD %RDX,%RDI |
(356) 0x41fe64 VMOVSD (%RAX,%RDI,8),%XMM1 |
(356) 0x41fe69 MOV -0x58(%RBP),%R8 |
(356) 0x41fe6d LEA (%R8,%R8,1),%RDI |
(356) 0x41fe71 ADD %RDX,%R8 |
(356) 0x41fe74 VFNMADD213SD (%R14,%R8,8),%XMM0,%XMM1 |
(356) 0x41fe7a VMOVSD %XMM1,(%R14,%R8,8) |
(356) 0x41fe80 ADD %RDX,%RCX |
(356) 0x41fe83 VMOVSD (%RAX,%RCX,8),%XMM1 |
(356) 0x41fe88 ADD %RDX,%RDI |
(356) 0x41fe8b VFNMADD213SD (%R14,%RDI,8),%XMM0,%XMM1 |
(356) 0x41fe91 VMOVSD %XMM1,(%R14,%RDI,8) |
(356) 0x41fe97 JMP 41f6c0 |
0x41fe9c MOVQ $0,0x10(%R13) |
0x41fea4 MOV 0x90(%R13),%RAX |
0x41feab TEST %RAX,%RAX |
0x41feae JE 41ff5e |
0x41feb4 MOV 0xd8(%R13),%RCX |
0x41febb MOV 0x100(%R13),%RDX |
0x41fec2 MOVSXD 0xf0(%R13),%RSI |
0x41fec9 MOV -0x90(%RBP),%RDI |
0x41fed0 MOV 0x18(%RDI),%RDI |
0x41fed4 MOV 0x128(%R13),%R8 |
0x41fedb MOV -0x98(%RBP),%R9 |
0x41fee2 MOV 0x18(%R9),%R9 |
0x41fee6 ADD $0x10,%RDI |
0x41feea LEA (%RDX,%RSI,8),%R10 |
0x41feee SAL $0x4,%RSI |
0x41fef2 ADD %RDX,%RSI |
0x41fef5 VXORPD %XMM0,%XMM0,%XMM0 |
0x41fef9 XOR %R11D,%R11D |
0x41fefc NOPL (%RAX) |
(354) 0x41ff00 VADDSD (%RCX,%R11,8),%XMM0,%XMM0 |
(354) 0x41ff06 VMOVSD %XMM0,0x10(%R13) |
(354) 0x41ff0c VMOVSD (%RDX,%R11,8),%XMM0 |
(354) 0x41ff12 VMOVHPD (%R10,%R11,8),%XMM0,%XMM0 |
(354) 0x41ff18 VADDPD -0x10(%RDI),%XMM0,%XMM0 |
(354) 0x41ff1d VMOVSD (%RDI),%XMM1 |
(354) 0x41ff21 VADDSD (%RSI,%R11,8),%XMM1,%XMM1 |
(354) 0x41ff27 VMOVUPD %XMM0,-0x10(%RDI) |
(354) 0x41ff2c VMOVSD %XMM1,(%RDI) |
(354) 0x41ff30 VMOVSD (%R9,%R11,8),%XMM0 |
(354) 0x41ff36 VADDSD (%R8,%R11,8),%XMM0,%XMM0 |
(354) 0x41ff3c VMOVSD %XMM0,(%R9,%R11,8) |
(354) 0x41ff42 VMOVSD 0x10(%R13),%XMM0 |
(354) 0x41ff48 INC %R11 |
(354) 0x41ff4b ADD $0x18,%RDI |
(354) 0x41ff4f CMP %R11,%RAX |
(354) 0x41ff52 JNE 41ff00 |
0x41ff54 VMULSD 0xd6c94(%RIP),%XMM0,%XMM0 |
0x41ff5c JMP 41ff66 |
0x41ff5e VMOVSD 0xd7ea2(%RIP),%XMM0 |
0x41ff66 VMOVSD %XMM0,0x10(%R13) |
0x41ff6c ADD $0x98,%RSP |
0x41ff73 POP %RBX |
0x41ff74 POP %R12 |
0x41ff76 POP %R13 |
0x41ff78 POP %R14 |
0x41ff7a POP %R15 |
0x41ff7c POP %RBP |
0x41ff7d VZEROUPPER |
0x41ff80 RET |
0x41ff81 NOPW %CS:(%RAX,%RAX,1) |
0x41ff8b NOPL (%RAX,%RAX,1) |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►99.68+ | miniqmcreference::TwoBodyJastr[...] | TwoBodyJastrowRef.h:411 | exec |
○ | qmcplusplus::WaveFunction::eva[...] | WaveFunction.cpp:175 | exec |
○ | main.extracted.113 | miniqmc.cpp:397 | exec |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Path / |
Source file and lines | TwoBodyJastrowRef.h:268-432 |
Module | exec |
nb instructions | 73 |
nb uops | 75 |
loop length | 354 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 1 |
used zmm registers | 0 |
nb stack references | 5 |
micro-operation queue | 12.50 cycles |
front end | 12.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 2.50 | 2.40 | 7.33 | 7.33 | 7.00 | 2.40 | 2.50 | 7.00 | 7.00 | 7.00 | 2.20 | 7.33 |
cycles | 2.50 | 2.40 | 7.33 | 7.33 | 7.00 | 2.40 | 2.50 | 7.00 | 7.00 | 7.00 | 2.20 | 7.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 12.29 |
Stall cycles | 0.00 |
Front-end | 12.50 |
Dispatch | 7.33 |
Overall L1 | 12.50 |
all | 6% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 14% |
all | 16% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 50% |
all | 9% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 22% |
all | 12% |
load | 12% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 14% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 18% |
all | 12% |
load | 12% |
store | 11% |
mul | 12% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 13% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x98,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
TEST %R8B,%R8B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41fe9c <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x8ec> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RSI,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x248(%R13),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 460cd0 <_ZNK11qmcplusplus11ParticleSet14getDistTableAAEi> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa0(%R13),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R9,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41fe9c <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x8ec> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD 0xd87d7(%RIP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD 0xd7606(%RIP),%YMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
MOV %R9,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R13,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 41f64d <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x9d> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOVQ $0,0x10(%R13) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x90(%R13),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41ff5e <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x9ae> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xd8(%R13),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x100(%R13),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVSXD 0xf0(%R13),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x90(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RDI),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x128(%R13),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x98(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%R9),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD $0x10,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA (%RDX,%RSI,8),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAL $0x4,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
ADD %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R11D,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMULSD 0xd6c94(%RIP),%XMM0,%XMM0 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
JMP 41ff66 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x9b6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
VMOVSD 0xd7ea2(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD %XMM0,0x10(%R13) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $0x98,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | TwoBodyJastrowRef.h:268-432 |
Module | exec |
nb instructions | 73 |
nb uops | 75 |
loop length | 354 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 1 |
used zmm registers | 0 |
nb stack references | 5 |
micro-operation queue | 12.50 cycles |
front end | 12.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 2.50 | 2.40 | 7.33 | 7.33 | 7.00 | 2.40 | 2.50 | 7.00 | 7.00 | 7.00 | 2.20 | 7.33 |
cycles | 2.50 | 2.40 | 7.33 | 7.33 | 7.00 | 2.40 | 2.50 | 7.00 | 7.00 | 7.00 | 2.20 | 7.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 12.29 |
Stall cycles | 0.00 |
Front-end | 12.50 |
Dispatch | 7.33 |
Overall L1 | 12.50 |
all | 6% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 14% |
all | 16% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 50% |
all | 9% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 22% |
all | 12% |
load | 12% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 14% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 18% |
all | 12% |
load | 12% |
store | 11% |
mul | 12% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 13% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x98,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
TEST %R8B,%R8B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41fe9c <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x8ec> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RSI,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x248(%R13),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 460cd0 <_ZNK11qmcplusplus11ParticleSet14getDistTableAAEi> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa0(%R13),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R9,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41fe9c <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x8ec> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD 0xd87d7(%RIP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD 0xd7606(%RIP),%YMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
MOV %R9,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R13,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 41f64d <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x9d> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOVQ $0,0x10(%R13) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x90(%R13),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41ff5e <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x9ae> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xd8(%R13),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x100(%R13),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVSXD 0xf0(%R13),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x90(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RDI),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x128(%R13),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x98(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%R9),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD $0x10,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA (%RDX,%RSI,8),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAL $0x4,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
ADD %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R11D,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMULSD 0xd6c94(%RIP),%XMM0,%XMM0 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
JMP 41ff66 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x9b6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
VMOVSD 0xd7ea2(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD %XMM0,0x10(%R13) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $0x98,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼miniqmcreference::TwoBodyJastrowRef | 0.11 | 0.13 |
○Loop 354 - TwoBodyJastrowRef.h:423-427 - exec | 0 | 0 |
▼Loop 355 - TwoBodyJastrowRef.h:268-420 - exec– | 0 | 0 |
▼Loop 356 - TwoBodyJastrowRef.h:268-420 - exec– | 0 | 0 |
○Loop 358 - TwoBodyJastrowRef.h:393-398 - exec | 0.03 | 0.03 |
○Loop 364 - TwoBodyJastrowRef.h:381-382 - exec | 0.02 | 0.02 |
○Loop 362 - TwoBodyJastrowRef.h:381-382 - exec | 0.02 | 0.02 |
○Loop 366 - TwoBodyJastrowRef.h:381-382 - exec | 0.02 | 0.02 |
○Loop 360 - TwoBodyJastrowRef.h:388-391 - exec | 0.01 | 0.01 |
○Loop 368 - TwoBodyJastrowRef.h:375-376 - exec | 0.01 | 0.01 |
○Loop 361 - TwoBodyJastrowRef.h:381-382 - exec | 0 | 0 |
○Loop 365 - TwoBodyJastrowRef.h:381-382 - exec | 0 | 0 |
○Loop 359 - TwoBodyJastrowRef.h:388-391 - exec | 0 | 0 |
○Loop 357 - TwoBodyJastrowRef.h:388-391 - exec | 0 | 0 |
○Loop 363 - TwoBodyJastrowRef.h:381-382 - exec | 0 | 0 |
○Loop 369 - stl_numeric.h:126-127 - exec | 0 | 0 |
○Loop 367 - TwoBodyJastrowRef.h:375-376 - exec | 0 | 0 |
○Loop 370 - stl_numeric.h:126-127 - exec | 0 | 0 |
○Loop 371 - TwoBodyJastrowRef.h:269-274 - exec | 0 | 0 |