Function: miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evaluateGL(qmcp ... | Module: exec | Source: TwoBodyJastrowRef.h:268-432 [...] | Coverage: 0.13% |
---|
Function: miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evaluateGL(qmcp ... | Module: exec | Source: TwoBodyJastrowRef.h:268-432 [...] | Coverage: 0.13% |
---|
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/shared_ptr_base.h: 1308 - 1308 |
-------------------------------------------------------------------------------- |
1308: { return _M_ptr; } |
/scratch_na/users/xoserete/qaas_runs/171-284-5201/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/OhmmsVector.h: 223 - 249 |
-------------------------------------------------------------------------------- |
223: return X[i]; |
[...] |
229: return X[i]; |
[...] |
249: inline const_pointer data() const { return X; } |
/scratch_na/users/xoserete/qaas_runs/171-284-5201/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/Jastrow/TwoBodyJastrowRef.h: 268 - 432 |
-------------------------------------------------------------------------------- |
268: const int igt = P.GroupID[iat] * NumGroups; |
269: for (int jg = 0; jg < NumGroups; ++jg) |
270: { |
271: const FuncType& f2(*F[igt + jg]); |
272: int iStart = P.first(jg); |
273: int iEnd = std::min(jelmax, P.last(jg)); |
274: f2.evaluateVGL(iat, iStart, iEnd, dist, u, du, d2u, DistCompressed.data(), DistIndice.data()); |
[...] |
360: const auto& d_table = P.getDistTableAA(myTableID); |
361: for (int ig = 0; ig < NumGroups; ++ig) |
362: { |
363: const int igt = ig * NumGroups; |
364: for (int iat = P.first(ig), last = P.last(ig); iat < last; ++iat) |
365: { |
366: computeU3(P, iat, d_table.getDistRow(iat).data(), cur_u.data(), cur_du.data(), cur_d2u.data(), true); |
367: Uat[iat] = std::accumulate(cur_u.begin(), cur_u.begin() + iat, valT()); |
[...] |
375: for (int jat = 0; jat < iat; ++jat) |
376: lap += d2u[jat] + lapfac * du[jat]; |
377: for (int idim = 0; idim < OHMMS_DIM; ++idim) |
378: { |
379: const valT* restrict dX = displ.data(idim); |
380: valT s = valT(); |
381: for (int jat = 0; jat < iat; ++jat) |
382: s += du[jat] * dX[jat]; |
383: grad[idim] = s; |
384: } |
385: dUat(iat) = grad; |
386: d2Uat[iat] = -lap; |
387: // add the contribution from the upper triangle |
388: for (int jat = 0; jat < iat; jat++) |
389: { |
390: Uat[jat] += u[jat]; |
391: d2Uat[jat] -= d2u[jat] + lapfac * du[jat]; |
392: } |
393: for (int idim = 0; idim < OHMMS_DIM; ++idim) |
394: { |
395: valT* restrict save_g = dUat.data(idim); |
396: const valT* restrict dX = displ.data(idim); |
397: for (int jat = 0; jat < iat; jat++) |
398: save_g[jat] -= du[jat] * dX[jat]; |
[...] |
419: { |
420: if (fromscratch) |
421: recompute(P); |
422: LogValue = valT(0); |
423: for (int iat = 0; iat < N; ++iat) |
424: { |
425: LogValue += Uat[iat]; |
426: G[iat] += dUat[iat]; |
427: L[iat] += d2Uat[iat]; |
428: } |
429: |
430: constexpr valT mhalf(-0.5); |
431: LogValue = mhalf * LogValue; |
432: } |
/scratch_na/users/xoserete/qaas_runs/171-284-5201/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/VectorSoAContainer.h: 231 - 273 |
-------------------------------------------------------------------------------- |
231: inline const AoSElement_t operator[](size_t i) const { return AoSElement_t(myData + i, nGhosts); } |
[...] |
244: *(_base + M * i) = rhs[i]; |
[...] |
263: inline Accessor operator()(size_t i) { return Accessor(myData + i, nGhosts); } |
[...] |
273: inline const T* restrict data(size_t i) const { return myData + i * nGhosts; } |
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/stl_numeric.h: 126 - 127 |
-------------------------------------------------------------------------------- |
126: for (; __first != __last; ++__first) |
127: __init = __init + *__first; |
/scratch_na/users/xoserete/qaas_runs/171-284-5201/intel/miniqmc/build/miniqmc/src/Numerics/PETE/OperatorTags.h: 94 - 94 |
-------------------------------------------------------------------------------- |
94: (const_cast<T1&>(a) += b); |
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/stl_algobase.h: 200 - 754 |
-------------------------------------------------------------------------------- |
200: if (__b < __a) |
[...] |
752: for (__decltype(__n + 0) __niter = __n; |
753: __niter > 0; --__niter, (void) ++__first) |
754: *__first = __tmp; |
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/stl_iterator.h: 784 - 887 |
-------------------------------------------------------------------------------- |
784: : _M_current(__i) { } |
[...] |
887: { return __lhs.base() != __rhs.base(); } |
/scratch_na/users/xoserete/qaas_runs/171-284-5201/intel/miniqmc/build/miniqmc/src/Particle/ParticleSet.h: 313 - 316 |
-------------------------------------------------------------------------------- |
313: inline int first(int igroup) const { return (*group_offsets_)[igroup]; } |
314: |
315: ///return the last index of a group i |
316: inline int last(int igroup) const { return (*group_offsets_)[igroup + 1]; } |
/scratch_na/users/xoserete/qaas_runs/171-284-5201/intel/miniqmc/build/miniqmc/src/Particle/DistanceTable.h: 268 - 268 |
-------------------------------------------------------------------------------- |
268: const DistRow& getDistRow(int iel) const { return distances_[iel]; } |
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/stl_vector.h: 951 - 1056 |
-------------------------------------------------------------------------------- |
951: return *(this->_M_impl._M_start + __n); |
[...] |
1056: { return _M_data_ptr(this->_M_impl._M_start); } |
0x41a040 PUSH %RBP |
0x41a041 MOV %RSP,%RBP |
0x41a044 PUSH %R15 |
0x41a046 PUSH %R14 |
0x41a048 PUSH %R13 |
0x41a04a PUSH %R12 |
0x41a04c PUSH %RBX |
0x41a04d SUB $0x98,%RSP |
0x41a054 MOV %RCX,-0xa0(%RBP) |
0x41a05b MOV %RDX,-0x98(%RBP) |
0x41a062 MOV %RDI,%R13 |
0x41a065 TEST %R8B,%R8B |
0x41a068 JE 41a939 |
0x41a06e MOV %RSI,%R14 |
0x41a071 MOV 0x248(%R13),%ESI |
0x41a078 MOV %R14,%RDI |
0x41a07b CALL 453d20 <_ZNK11qmcplusplus11ParticleSet14getDistTableAAEi> |
0x41a080 MOV %RAX,-0x90(%RBP) |
0x41a087 MOV 0xa0(%R13),%R9 |
0x41a08e TEST %R9,%R9 |
0x41a091 JE 41a939 |
0x41a097 XOR %ECX,%ECX |
0x41a099 VMOVSD 0xd1fd7(%RIP),%XMM5 |
0x41a0a1 VBROADCASTSD 0xd0dfe(%RIP),%YMM6 |
0x41a0aa MOV %R9,%R12 |
0x41a0ad MOV %R13,-0x78(%RBP) |
0x41a0b1 MOV %R14,-0x68(%RBP) |
0x41a0b5 JMP 41a0dd |
0x41a0b7 NOPW (%RAX,%RAX,1) |
(283) 0x41a0c0 MOV %R12,%RAX |
(283) 0x41a0c3 MOV -0xa8(%RBP),%RCX |
(283) 0x41a0ca INC %RCX |
(283) 0x41a0cd MOV %RAX,%R12 |
(283) 0x41a0d0 CMP %RCX,%RAX |
(283) 0x41a0d3 MOV -0x68(%RBP),%R14 |
(283) 0x41a0d7 JBE 41a939 |
(283) 0x41a0dd MOV 0x268(%R14),%RAX |
(283) 0x41a0e4 MOV 0x18(%RAX),%RAX |
(283) 0x41a0e8 MOVSXD (%RAX,%RCX,4),%RSI |
(283) 0x41a0ec MOV %RCX,-0xa8(%RBP) |
(283) 0x41a0f3 MOVSXD 0x4(%RAX,%RCX,4),%RAX |
(283) 0x41a0f8 MOV %RAX,-0xb8(%RBP) |
(283) 0x41a0ff CMP %EAX,%ESI |
(283) 0x41a101 JGE 41a0c0 |
(283) 0x41a103 MOV 0x140(%R13),%R15 |
(283) 0x41a10a MOV 0x158(%R13),%R11 |
(283) 0x41a111 MOV 0x170(%R13),%RAX |
(283) 0x41a118 MOV %RAX,-0x40(%RBP) |
(283) 0x41a11c LEA -0x1(%RSI),%RAX |
(283) 0x41a120 MOV %RAX,-0xb0(%RBP) |
(283) 0x41a127 MOV $0x1fffffffffffffff,%RAX |
(283) 0x41a131 ADD %RSI,%RAX |
(283) 0x41a134 MOV %RAX,-0x80(%RBP) |
(283) 0x41a138 MOVQ $0,-0x88(%RBP) |
(283) 0x41a143 JMP 41a16e |
0x41a145 NOPW %CS:(%RAX,%RAX,1) |
(284) 0x41a150 INC %RSI |
(284) 0x41a153 INCQ -0x88(%RBP) |
(284) 0x41a15a INCQ -0x80(%RBP) |
(284) 0x41a15e MOV %R9,%RAX |
(284) 0x41a161 CMP -0xb8(%RBP),%RSI |
(284) 0x41a168 JE 41a0c3 |
(284) 0x41a16e MOV %R11,-0x38(%RBP) |
(284) 0x41a172 MOV -0x90(%RBP),%RAX |
(284) 0x41a179 MOV 0x48(%RAX),%RAX |
(284) 0x41a17d LEA (%RSI,%RSI,4),%RCX |
(284) 0x41a181 MOV %RCX,-0x60(%RBP) |
(284) 0x41a185 MOV 0x18(%RAX,%RCX,8),%R8 |
(284) 0x41a18a TEST %RSI,%RSI |
(284) 0x41a18d MOV %RSI,-0x50(%RBP) |
(284) 0x41a191 JLE 41a1ea |
(284) 0x41a193 MOV %ESI,%EBX |
(284) 0x41a195 SAL $0x3,%RBX |
(284) 0x41a199 MOV %R15,%RDI |
(284) 0x41a19c XOR %ESI,%ESI |
(284) 0x41a19e MOV %RBX,%RDX |
(284) 0x41a1a1 MOV %R9,%R14 |
(284) 0x41a1a4 MOV %R8,%R13 |
(284) 0x41a1a7 VZEROUPPER |
(284) 0x41a1aa CALL 4dc0f0 <_intel_fast_memset> |
(284) 0x41a1af MOV -0x38(%RBP),%RDI |
(284) 0x41a1b3 XOR %ESI,%ESI |
(284) 0x41a1b5 MOV %RBX,%RDX |
(284) 0x41a1b8 CALL 4dc0f0 <_intel_fast_memset> |
(284) 0x41a1bd MOV -0x40(%RBP),%RDI |
(284) 0x41a1c1 XOR %ESI,%ESI |
(284) 0x41a1c3 MOV %RBX,%RDX |
(284) 0x41a1c6 CALL 4dc0f0 <_intel_fast_memset> |
(284) 0x41a1cb MOV %R13,%R8 |
(284) 0x41a1ce MOV -0x78(%RBP),%R13 |
(284) 0x41a1d2 MOV -0x50(%RBP),%RSI |
(284) 0x41a1d6 MOV %R14,%R9 |
(284) 0x41a1d9 VBROADCASTSD 0xd0cc6(%RIP),%YMM6 |
(284) 0x41a1e2 VMOVSD 0xd1e8e(%RIP),%XMM5 |
(284) 0x41a1ea TEST %R12,%R12 |
(284) 0x41a1ed JE 41a2b0 |
(284) 0x41a1f3 MOV -0x68(%RBP),%RAX |
(284) 0x41a1f7 MOV 0x18(%RAX),%RAX |
(284) 0x41a1fb IMUL (%RAX,%RSI,4),%R12D |
(284) 0x41a200 MOV %R13,%RBX |
(284) 0x41a203 MOV %R15,-0x48(%RBP) |
(284) 0x41a207 MOVSXD %R12D,%RAX |
(284) 0x41a20a SAL $0x3,%RAX |
(284) 0x41a20e MOV %RAX,-0x58(%RBP) |
(284) 0x41a212 MOV $0x1,%R12D |
(284) 0x41a218 MOV -0x38(%RBP),%R14 |
(284) 0x41a21c MOV -0x40(%RBP),%R13 |
(299) 0x41a220 MOV 0x200(%RBX),%RAX |
(299) 0x41a227 ADD -0x58(%RBP),%RAX |
(299) 0x41a22b MOV -0x8(%RAX,%R12,8),%RDI |
(299) 0x41a230 MOV -0x68(%RBP),%RAX |
(299) 0x41a234 MOV 0x268(%RAX),%RAX |
(299) 0x41a23b MOV 0x18(%RAX),%RAX |
(299) 0x41a23f MOV -0x4(%RAX,%R12,4),%EDX |
(299) 0x41a244 MOVSXD (%RAX,%R12,4),%RAX |
(299) 0x41a248 CMP %RAX,%RSI |
(299) 0x41a24b MOV %ESI,%ECX |
(299) 0x41a24d CMOVG %EAX,%ECX |
(299) 0x41a250 MOV %R8,%R15 |
(299) 0x41a253 MOV -0x48(%RBP),%R9 |
(299) 0x41a257 PUSHQ 0x1e8(%RBX) |
(299) 0x41a25d PUSHQ 0x1d0(%RBX) |
(299) 0x41a263 PUSH %R13 |
(299) 0x41a265 PUSH %R14 |
(299) 0x41a267 VZEROUPPER |
(299) 0x41a26a CALL 4170d0 <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi> |
(299) 0x41a26f MOV %R15,%R8 |
(299) 0x41a272 MOV -0x50(%RBP),%RSI |
(299) 0x41a276 ADD $0x20,%RSP |
(299) 0x41a27a MOV %R12D,%EAX |
(299) 0x41a27d MOV 0xa0(%RBX),%R9 |
(299) 0x41a284 INC %R12 |
(299) 0x41a287 CMP %RAX,%R9 |
(299) 0x41a28a JA 41a220 |
(284) 0x41a28c MOV 0x140(%RBX),%R15 |
(284) 0x41a293 MOV %R9,%R12 |
(284) 0x41a296 MOV %RBX,%R13 |
(284) 0x41a299 VMOVSD 0xd1dd7(%RIP),%XMM5 |
(284) 0x41a2a1 VBROADCASTSD 0xd0bfe(%RIP),%YMM6 |
(284) 0x41a2aa JMP 41a2b3 |
0x41a2ac NOPL (%RAX) |
(284) 0x41a2b0 XOR %R12D,%R12D |
(284) 0x41a2b3 VXORPD %XMM0,%XMM0,%XMM0 |
(284) 0x41a2b7 VXORPD %XMM1,%XMM1,%XMM1 |
(284) 0x41a2bb MOV $0x1fffffffffffffff,%RAX |
(284) 0x41a2c5 TEST %RAX,%RSI |
(284) 0x41a2c8 JE 41a33e |
(284) 0x41a2ca LEA (%RSI,%RAX,1),%RCX |
(284) 0x41a2ce AND %RAX,%RCX |
(284) 0x41a2d1 INC %RCX |
(284) 0x41a2d4 MOV %RCX,%RAX |
(284) 0x41a2d7 MOV $0x3ffffffffffffffc,%RDX |
(284) 0x41a2e1 AND %RDX,%RAX |
(284) 0x41a2e4 JE 41a320 |
(284) 0x41a2e6 VXORPD %XMM1,%XMM1,%XMM1 |
(284) 0x41a2ea XOR %EDX,%EDX |
(284) 0x41a2ec NOPL (%RAX) |
(298) 0x41a2f0 VADDPD (%R15,%RDX,8),%YMM1,%YMM1 |
(298) 0x41a2f6 ADD $0x4,%RDX |
(298) 0x41a2fa CMP %RAX,%RDX |
(298) 0x41a2fd JB 41a2f0 |
(284) 0x41a2ff VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(284) 0x41a305 VADDPD %XMM2,%XMM1,%XMM1 |
(284) 0x41a309 VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(284) 0x41a30e VADDSD %XMM2,%XMM1,%XMM1 |
(284) 0x41a312 CMP %RAX,%RCX |
(284) 0x41a315 JNE 41a322 |
(284) 0x41a317 JMP 41a33e |
0x41a319 NOPL (%RAX) |
(284) 0x41a320 XOR %EAX,%EAX |
(284) 0x41a322 MOV $0x3d,%CL |
(284) 0x41a324 BZHI %RCX,-0x80(%RBP),%RCX |
(284) 0x41a32a INC %RCX |
(284) 0x41a32d NOPL (%RAX) |
(297) 0x41a330 VADDSD (%R15,%RAX,8),%XMM1,%XMM1 |
(297) 0x41a336 INC %RAX |
(297) 0x41a339 CMP %RAX,%RCX |
(297) 0x41a33c JNE 41a330 |
(284) 0x41a33e MOV 0xd8(%R13),%RDX |
(284) 0x41a345 VMOVSD %XMM1,(%RDX,%RSI,8) |
(284) 0x41a34a MOV 0x158(%R13),%R11 |
(284) 0x41a351 MOV 0x170(%R13),%R10 |
(284) 0x41a358 MOV -0x90(%RBP),%RAX |
(284) 0x41a35f MOV 0x60(%RAX),%RAX |
(284) 0x41a363 TEST %RSI,%RSI |
(284) 0x41a366 JLE 41a3e4 |
(284) 0x41a368 MOV %RSI,%RCX |
(284) 0x41a36b AND $-0x4,%RCX |
(284) 0x41a36f JE 41a3c0 |
(284) 0x41a371 LEA -0x1(%RCX),%R8 |
(284) 0x41a375 VXORPD %XMM0,%XMM0,%XMM0 |
(284) 0x41a379 XOR %EDI,%EDI |
(284) 0x41a37b VBROADCASTSD 0xd1cf4(%RIP),%YMM1 |
(284) 0x41a384 NOPW %CS:(%RAX,%RAX,1) |
(296) 0x41a390 VADDPD (%R10,%RDI,8),%YMM0,%YMM0 |
(296) 0x41a396 VFMADD231PD (%R11,%RDI,8),%YMM1,%YMM0 |
(296) 0x41a39c ADD $0x4,%RDI |
(296) 0x41a3a0 CMP %R8,%RDI |
(296) 0x41a3a3 JLE 41a390 |
(284) 0x41a3a5 VEXTRACTF128 $0x1,%YMM0,%XMM1 |
(284) 0x41a3ab VADDPD %XMM1,%XMM0,%XMM0 |
(284) 0x41a3af VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(284) 0x41a3b4 VADDSD %XMM1,%XMM0,%XMM0 |
(284) 0x41a3b8 JMP 41a3df |
0x41a3ba NOPW (%RAX,%RAX,1) |
(284) 0x41a3c0 VXORPD %XMM0,%XMM0,%XMM0 |
(284) 0x41a3c4 XOR %ECX,%ECX |
(284) 0x41a3c6 NOPW %CS:(%RAX,%RAX,1) |
(295) 0x41a3d0 VADDSD (%R10,%RCX,8),%XMM0,%XMM0 |
(295) 0x41a3d6 VFMADD231SD (%R11,%RCX,8),%XMM5,%XMM0 |
(295) 0x41a3dc INC %RCX |
(295) 0x41a3df CMP %RCX,%RSI |
(295) 0x41a3e2 JNE 41a3d0 |
(284) 0x41a3e4 MOV -0x60(%RBP),%RCX |
(284) 0x41a3e8 MOV 0x8(%RAX,%RCX,8),%R14 |
(284) 0x41a3ed MOV 0x18(%RAX,%RCX,8),%RAX |
(284) 0x41a3f2 VXORPD %XMM1,%XMM1,%XMM1 |
(284) 0x41a3f6 VXORPD %XMM2,%XMM2,%XMM2 |
(284) 0x41a3fa TEST %RSI,%RSI |
(284) 0x41a3fd JLE 41a474 |
(284) 0x41a3ff MOV %RSI,%R8 |
(284) 0x41a402 AND $-0x4,%R8 |
(284) 0x41a406 JE 41a450 |
(284) 0x41a408 LEA -0x1(%R8),%RCX |
(284) 0x41a40c VXORPD %XMM2,%XMM2,%XMM2 |
(284) 0x41a410 XOR %EDI,%EDI |
(284) 0x41a412 NOPW %CS:(%RAX,%RAX,1) |
(294) 0x41a420 VMOVUPD (%RAX,%RDI,8),%YMM3 |
(294) 0x41a425 VFMADD231PD (%R11,%RDI,8),%YMM3,%YMM2 |
(294) 0x41a42b ADD $0x4,%RDI |
(294) 0x41a42f CMP %RCX,%RDI |
(294) 0x41a432 JLE 41a420 |
(284) 0x41a434 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(284) 0x41a43a VADDPD %XMM3,%XMM2,%XMM2 |
(284) 0x41a43e VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(284) 0x41a443 VADDSD %XMM3,%XMM2,%XMM2 |
(284) 0x41a447 JMP 41a46f |
0x41a449 NOPL (%RAX) |
(284) 0x41a450 XOR %R8D,%R8D |
(284) 0x41a453 NOPW %CS:(%RAX,%RAX,1) |
(293) 0x41a460 VMOVSD (%RAX,%R8,8),%XMM3 |
(293) 0x41a466 VFMADD231SD (%R11,%R8,8),%XMM3,%XMM2 |
(293) 0x41a46c INC %R8 |
(293) 0x41a46f CMP %R8,%RSI |
(293) 0x41a472 JNE 41a460 |
(284) 0x41a474 MOV %R10,-0x40(%RBP) |
(284) 0x41a478 TEST %RSI,%RSI |
(284) 0x41a47b JLE 41a4f4 |
(284) 0x41a47d MOV %RSI,%R10 |
(284) 0x41a480 AND $-0x4,%R10 |
(284) 0x41a484 JE 41a4d0 |
(284) 0x41a486 LEA -0x1(%R10),%RCX |
(284) 0x41a48a LEA (%RAX,%R14,8),%RDI |
(284) 0x41a48e VXORPD %XMM1,%XMM1,%XMM1 |
(284) 0x41a492 XOR %R8D,%R8D |
(284) 0x41a495 NOPW %CS:(%RAX,%RAX,1) |
(292) 0x41a4a0 VMOVUPD (%RDI,%R8,8),%YMM3 |
(292) 0x41a4a6 VFMADD231PD (%R11,%R8,8),%YMM3,%YMM1 |
(292) 0x41a4ac ADD $0x4,%R8 |
(292) 0x41a4b0 CMP %RCX,%R8 |
(292) 0x41a4b3 JLE 41a4a0 |
(284) 0x41a4b5 VEXTRACTF128 $0x1,%YMM1,%XMM3 |
(284) 0x41a4bb VADDPD %XMM3,%XMM1,%XMM1 |
(284) 0x41a4bf VSHUFPD $0x1,%XMM1,%XMM1,%XMM3 |
(284) 0x41a4c4 VADDSD %XMM3,%XMM1,%XMM1 |
(284) 0x41a4c8 CMP %R10,%RSI |
(284) 0x41a4cb JNE 41a4d7 |
(284) 0x41a4cd JMP 41a4f4 |
0x41a4cf NOP |
(284) 0x41a4d0 VXORPD %XMM1,%XMM1,%XMM1 |
(284) 0x41a4d4 XOR %R10D,%R10D |
(284) 0x41a4d7 LEA (%RAX,%R14,8),%RCX |
(284) 0x41a4db NOPL (%RAX,%RAX,1) |
(291) 0x41a4e0 VMOVSD (%RCX,%R10,8),%XMM3 |
(291) 0x41a4e6 VFMADD231SD (%R11,%R10,8),%XMM3,%XMM1 |
(291) 0x41a4ec INC %R10 |
(291) 0x41a4ef CMP %R10,%RSI |
(291) 0x41a4f2 JNE 41a4e0 |
(284) 0x41a4f4 TEST %RSI,%RSI |
(284) 0x41a4f7 JLE 41a550 |
(284) 0x41a4f9 MOV %RSI,%R10 |
(284) 0x41a4fc AND $-0x4,%R10 |
(284) 0x41a500 JE 41a560 |
(284) 0x41a502 LEA -0x1(%R10),%RCX |
(284) 0x41a506 MOV %R14,%RDI |
(284) 0x41a509 SAL $0x4,%RDI |
(284) 0x41a50d ADD %RAX,%RDI |
(284) 0x41a510 VXORPD %XMM3,%XMM3,%XMM3 |
(284) 0x41a514 XOR %R8D,%R8D |
(284) 0x41a517 NOPW (%RAX,%RAX,1) |
(290) 0x41a520 VMOVUPD (%RDI,%R8,8),%YMM4 |
(290) 0x41a526 VFMADD231PD (%R11,%R8,8),%YMM4,%YMM3 |
(290) 0x41a52c ADD $0x4,%R8 |
(290) 0x41a530 CMP %RCX,%R8 |
(290) 0x41a533 JLE 41a520 |
(284) 0x41a535 VEXTRACTF128 $0x1,%YMM3,%XMM4 |
(284) 0x41a53b VADDPD %XMM4,%XMM3,%XMM3 |
(284) 0x41a53f VSHUFPD $0x1,%XMM3,%XMM3,%XMM4 |
(284) 0x41a544 VADDSD %XMM4,%XMM3,%XMM3 |
(284) 0x41a548 CMP %R10,%RSI |
(284) 0x41a54b JNE 41a567 |
(284) 0x41a54d JMP 41a594 |
0x41a54f NOP |
(284) 0x41a550 VXORPD %XMM3,%XMM3,%XMM3 |
(284) 0x41a554 JMP 41a594 |
0x41a556 NOPW %CS:(%RAX,%RAX,1) |
(284) 0x41a560 VXORPD %XMM3,%XMM3,%XMM3 |
(284) 0x41a564 XOR %R10D,%R10D |
(284) 0x41a567 MOV %R14,%RCX |
(284) 0x41a56a SAL $0x4,%RCX |
(284) 0x41a56e ADD %RAX,%RCX |
(284) 0x41a571 NOPW %CS:(%RAX,%RAX,1) |
(289) 0x41a580 VMOVSD (%RCX,%R10,8),%XMM4 |
(289) 0x41a586 VFMADD231SD (%R11,%R10,8),%XMM4,%XMM3 |
(289) 0x41a58c INC %R10 |
(289) 0x41a58f CMP %R10,%RSI |
(289) 0x41a592 JNE 41a580 |
(284) 0x41a594 MOV %R14,-0x58(%RBP) |
(284) 0x41a598 MOV 0xf0(%R13),%RDI |
(284) 0x41a59f MOV 0x100(%R13),%R14 |
(284) 0x41a5a6 LEA (%RSI,%RDI,1),%RCX |
(284) 0x41a5aa VMOVSD %XMM2,(%R14,%RSI,8) |
(284) 0x41a5b0 VMOVSD %XMM1,(%R14,%RCX,8) |
(284) 0x41a5b6 LEA (%RSI,%RDI,2),%RCX |
(284) 0x41a5ba VMOVSD %XMM3,(%R14,%RCX,8) |
(284) 0x41a5c0 VXORPD 0xd0988(%RIP),%XMM0,%XMM0 |
(284) 0x41a5c8 MOV 0x128(%R13),%R8 |
(284) 0x41a5cf VMOVLPD %XMM0,(%R8,%RSI,8) |
(284) 0x41a5d5 TEST %RSI,%RSI |
(284) 0x41a5d8 JLE 41a150 |
(284) 0x41a5de MOV %RDI,-0x70(%RBP) |
(284) 0x41a5e2 MOV %R12,-0xc0(%RBP) |
(284) 0x41a5e9 MOV %R9,-0x60(%RBP) |
(284) 0x41a5ed LEA -0x1(%RSI),%R9 |
(284) 0x41a5f1 MOV %R11,%R13 |
(284) 0x41a5f4 LEA (%RDX,%R9,8),%R11 |
(284) 0x41a5f8 CMP %R8,%R11 |
(284) 0x41a5fb SETAEB -0x2d(%RBP) |
(284) 0x41a5ff LEA (%R8,%R9,8),%RDI |
(284) 0x41a603 CMP %RDX,%RDI |
(284) 0x41a606 SETAE %CL |
(284) 0x41a609 CMP %R15,%R11 |
(284) 0x41a60c MOV %R15,%RSI |
(284) 0x41a60f SETB %R15B |
(284) 0x41a613 LEA (%RSI,%R9,8),%R10 |
(284) 0x41a617 CMP %RDX,%R10 |
(284) 0x41a61a SETBB -0x2c(%RBP) |
(284) 0x41a61e CMP %R8,%R10 |
(284) 0x41a621 SETB %R12B |
(284) 0x41a625 MOV %RSI,-0x48(%RBP) |
(284) 0x41a629 CMP %RSI,%RDI |
(284) 0x41a62c SETBB -0x2b(%RBP) |
(284) 0x41a630 CMP %R13,%R11 |
(284) 0x41a633 SETB %R10B |
(284) 0x41a637 LEA (,%R9,8),%RBX |
(284) 0x41a63f ADD %R13,%RBX |
(284) 0x41a642 CMP %RDX,%RBX |
(284) 0x41a645 SETBB -0x2a(%RBP) |
(284) 0x41a649 MOV -0x40(%RBP),%RSI |
(284) 0x41a64d CMP %RSI,%R11 |
(284) 0x41a650 SETB %R11B |
(284) 0x41a654 LEA (%RSI,%R9,8),%R9 |
(284) 0x41a658 CMP %RDX,%R9 |
(284) 0x41a65b SETBB -0x29(%RBP) |
(284) 0x41a65f CMP %R8,%RBX |
(284) 0x41a662 SETB %BL |
(284) 0x41a665 MOV %R13,-0x38(%RBP) |
(284) 0x41a669 CMP %R13,%RDI |
(284) 0x41a66c SETB %R13B |
(284) 0x41a670 CMP %R8,%R9 |
(284) 0x41a673 SETB %R9B |
(284) 0x41a677 CMP %RSI,%RDI |
(284) 0x41a67a SETB %SIL |
(284) 0x41a67e TEST %CL,-0x2d(%RBP) |
(284) 0x41a681 JNE 41a720 |
(284) 0x41a687 OR -0x2c(%RBP),%R15B |
(284) 0x41a68b JE 41a720 |
(284) 0x41a691 OR -0x2b(%RBP),%R12B |
(284) 0x41a695 JE 41a720 |
(284) 0x41a69b OR -0x2a(%RBP),%R10B |
(284) 0x41a69f JE 41a720 |
(284) 0x41a6a1 OR -0x29(%RBP),%R11B |
(284) 0x41a6a5 JE 41a720 |
(284) 0x41a6a7 OR %R13B,%BL |
(284) 0x41a6aa JE 41a720 |
(284) 0x41a6ac OR %SIL,%R9B |
(284) 0x41a6af JE 41a720 |
(284) 0x41a6b1 MOV -0x50(%RBP),%RSI |
(284) 0x41a6b5 MOV %RSI,%R9 |
(284) 0x41a6b8 AND $-0x4,%R9 |
(284) 0x41a6bc VMOVSD 0xd07e4(%RIP),%XMM1 |
(284) 0x41a6c4 JE 41a771 |
(284) 0x41a6ca LEA -0x1(%R9),%RCX |
(284) 0x41a6ce XOR %EDI,%EDI |
(284) 0x41a6d0 MOV -0x48(%RBP),%R10 |
(284) 0x41a6d4 MOV -0x38(%RBP),%R11 |
(284) 0x41a6d8 MOV -0x40(%RBP),%RBX |
(284) 0x41a6dc NOPL (%RAX) |
(288) 0x41a6e0 VMOVUPD (%RDX,%RDI,8),%YMM0 |
(288) 0x41a6e5 VADDPD (%R10,%RDI,8),%YMM0,%YMM0 |
(288) 0x41a6eb VMOVUPD %YMM0,(%RDX,%RDI,8) |
(288) 0x41a6f0 VMOVUPD (%R11,%RDI,8),%YMM0 |
(288) 0x41a6f6 VFMSUB213PD (%RBX,%RDI,8),%YMM6,%YMM0 |
(288) 0x41a6fc VADDPD (%R8,%RDI,8),%YMM0,%YMM0 |
(288) 0x41a702 VMOVUPD %YMM0,(%R8,%RDI,8) |
(288) 0x41a708 ADD $0x4,%RDI |
(288) 0x41a70c CMP %RCX,%RDI |
(288) 0x41a70f JLE 41a6e0 |
(284) 0x41a711 JMP 41a7ad |
0x41a716 NOPW %CS:(%RAX,%RAX,1) |
(284) 0x41a720 XOR %ECX,%ECX |
(284) 0x41a722 VMOVSD 0xd077e(%RIP),%XMM1 |
(284) 0x41a72a MOV -0x50(%RBP),%RSI |
(284) 0x41a72e MOV -0x48(%RBP),%RDI |
(284) 0x41a732 MOV -0x38(%RBP),%R9 |
(284) 0x41a736 MOV -0x40(%RBP),%R10 |
(284) 0x41a73a NOPW (%RAX,%RAX,1) |
(285) 0x41a740 VMOVSD (%RDX,%RCX,8),%XMM0 |
(285) 0x41a745 VADDSD (%RDI,%RCX,8),%XMM0,%XMM0 |
(285) 0x41a74a VMOVSD %XMM0,(%RDX,%RCX,8) |
(285) 0x41a74f VMOVSD (%R9,%RCX,8),%XMM0 |
(285) 0x41a755 VFMSUB213SD (%R10,%RCX,8),%XMM1,%XMM0 |
(285) 0x41a75b VADDSD (%R8,%RCX,8),%XMM0,%XMM0 |
(285) 0x41a761 VMOVSD %XMM0,(%R8,%RCX,8) |
(285) 0x41a767 INC %RCX |
(285) 0x41a76a CMP %RCX,%RSI |
(285) 0x41a76d JNE 41a740 |
(284) 0x41a76f JMP 41a7b2 |
(284) 0x41a771 XOR %R9D,%R9D |
(284) 0x41a774 MOV -0x48(%RBP),%R10 |
(284) 0x41a778 MOV -0x38(%RBP),%R11 |
(284) 0x41a77c MOV -0x40(%RBP),%RBX |
(287) 0x41a780 VMOVSD (%RDX,%R9,8),%XMM0 |
(287) 0x41a786 VADDSD (%R10,%R9,8),%XMM0,%XMM0 |
(287) 0x41a78c VMOVSD %XMM0,(%RDX,%R9,8) |
(287) 0x41a792 VMOVSD (%R11,%R9,8),%XMM0 |
(287) 0x41a798 VFMSUB213SD (%RBX,%R9,8),%XMM1,%XMM0 |
(287) 0x41a79e VADDSD (%R8,%R9,8),%XMM0,%XMM0 |
(287) 0x41a7a4 VMOVSD %XMM0,(%R8,%R9,8) |
(287) 0x41a7aa INC %R9 |
(287) 0x41a7ad CMP %R9,%RSI |
(287) 0x41a7b0 JNE 41a780 |
(284) 0x41a7b2 MOV -0xb0(%RBP),%RCX |
(284) 0x41a7b9 ADD -0x88(%RBP),%RCX |
(284) 0x41a7c0 JNE 41a7e0 |
(284) 0x41a7c2 XOR %EDX,%EDX |
(284) 0x41a7c4 MOV -0x38(%RBP),%RCX |
(284) 0x41a7c8 MOV -0x70(%RBP),%RDI |
(284) 0x41a7cc JMP 41a8bb |
0x41a7d1 NOPW %CS:(%RAX,%RAX,1) |
(284) 0x41a7e0 MOV %RSI,%R8 |
(284) 0x41a7e3 AND $-0x2,%R8 |
(284) 0x41a7e7 LEA 0x8(%RAX),%R9 |
(284) 0x41a7eb LEA 0x8(%R14),%R10 |
(284) 0x41a7ef MOV -0x58(%RBP),%RCX |
(284) 0x41a7f3 LEA (%RAX,%RCX,8),%R11 |
(284) 0x41a7f7 ADD $0x8,%R11 |
(284) 0x41a7fb MOV -0x70(%RBP),%RDI |
(284) 0x41a7ff LEA (%R14,%RDI,8),%R15 |
(284) 0x41a803 ADD $0x8,%R15 |
(284) 0x41a807 SAL $0x4,%RCX |
(284) 0x41a80b LEA (%RAX,%RCX,1),%RBX |
(284) 0x41a80f ADD $0x8,%RBX |
(284) 0x41a813 MOV %RDI,%RCX |
(284) 0x41a816 SAL $0x4,%RCX |
(284) 0x41a81a LEA (%R14,%RCX,1),%R12 |
(284) 0x41a81e ADD $0x8,%R12 |
(284) 0x41a822 XOR %EDX,%EDX |
(284) 0x41a824 MOV -0x38(%RBP),%RCX |
(284) 0x41a828 NOPL (%RAX,%RAX,1) |
(286) 0x41a830 VMOVSD (%RCX,%RDX,8),%XMM0 |
(286) 0x41a835 VMOVSD -0x8(%R9,%RDX,8),%XMM1 |
(286) 0x41a83c VFNMADD213SD -0x8(%R10,%RDX,8),%XMM0,%XMM1 |
(286) 0x41a843 VMOVSD %XMM1,-0x8(%R10,%RDX,8) |
(286) 0x41a84a VMOVSD -0x8(%R11,%RDX,8),%XMM1 |
(286) 0x41a851 VFNMADD213SD -0x8(%R15,%RDX,8),%XMM0,%XMM1 |
(286) 0x41a858 VMOVSD %XMM1,-0x8(%R15,%RDX,8) |
(286) 0x41a85f VMOVSD -0x8(%RBX,%RDX,8),%XMM1 |
(286) 0x41a865 VFNMADD213SD -0x8(%R12,%RDX,8),%XMM0,%XMM1 |
(286) 0x41a86c VMOVSD %XMM1,-0x8(%R12,%RDX,8) |
(286) 0x41a873 VMOVSD 0x8(%RCX,%RDX,8),%XMM0 |
(286) 0x41a879 VMOVSD (%R9,%RDX,8),%XMM1 |
(286) 0x41a87f VFNMADD213SD (%R10,%RDX,8),%XMM0,%XMM1 |
(286) 0x41a885 VMOVSD %XMM1,(%R10,%RDX,8) |
(286) 0x41a88b VMOVSD (%R11,%RDX,8),%XMM1 |
(286) 0x41a891 VFNMADD213SD (%R15,%RDX,8),%XMM0,%XMM1 |
(286) 0x41a897 VMOVSD %XMM1,(%R15,%RDX,8) |
(286) 0x41a89d VMOVSD (%RBX,%RDX,8),%XMM1 |
(286) 0x41a8a2 VFNMADD213SD (%R12,%RDX,8),%XMM0,%XMM1 |
(286) 0x41a8a8 VMOVSD %XMM1,(%R12,%RDX,8) |
(286) 0x41a8ae ADD $0x2,%RDX |
(286) 0x41a8b2 CMP %RDX,%R8 |
(286) 0x41a8b5 JNE 41a830 |
(284) 0x41a8bb MOV -0x50(%RBP),%RSI |
(284) 0x41a8bf TEST $0x1,%SIL |
(284) 0x41a8c3 MOV -0x78(%RBP),%R13 |
(284) 0x41a8c7 MOV -0x60(%RBP),%R9 |
(284) 0x41a8cb MOV -0x48(%RBP),%R15 |
(284) 0x41a8cf MOV -0xc0(%RBP),%R12 |
(284) 0x41a8d6 MOV %RCX,%R11 |
(284) 0x41a8d9 JE 41a150 |
(284) 0x41a8df LEA (%RDI,%RDI,1),%RCX |
(284) 0x41a8e3 VMOVSD (%R11,%RDX,8),%XMM0 |
(284) 0x41a8e9 VMOVSD (%RAX,%RDX,8),%XMM1 |
(284) 0x41a8ee VFNMADD213SD (%R14,%RDX,8),%XMM0,%XMM1 |
(284) 0x41a8f4 VMOVSD %XMM1,(%R14,%RDX,8) |
(284) 0x41a8fa MOV -0x58(%RBP),%R8 |
(284) 0x41a8fe MOV %RDI,%R10 |
(284) 0x41a901 LEA (%R8,%R8,1),%RDI |
(284) 0x41a905 ADD %RDX,%R8 |
(284) 0x41a908 VMOVSD (%RAX,%R8,8),%XMM1 |
(284) 0x41a90e ADD %RDX,%R10 |
(284) 0x41a911 VFNMADD213SD (%R14,%R10,8),%XMM0,%XMM1 |
(284) 0x41a917 VMOVSD %XMM1,(%R14,%R10,8) |
(284) 0x41a91d ADD %RDX,%RDI |
(284) 0x41a920 VMOVSD (%RAX,%RDI,8),%XMM1 |
(284) 0x41a925 ADD %RDX,%RCX |
(284) 0x41a928 VFNMADD213SD (%R14,%RCX,8),%XMM0,%XMM1 |
(284) 0x41a92e VMOVSD %XMM1,(%R14,%RCX,8) |
(284) 0x41a934 JMP 41a150 |
0x41a939 MOVQ $0,0x10(%R13) |
0x41a941 MOV 0x90(%R13),%RAX |
0x41a948 TEST %RAX,%RAX |
0x41a94b JE 41aa04 |
0x41a951 MOV 0xd8(%R13),%RCX |
0x41a958 MOV 0x100(%R13),%RDX |
0x41a95f MOVSXD 0xf0(%R13),%RSI |
0x41a966 MOV -0x98(%RBP),%RDI |
0x41a96d MOV 0x18(%RDI),%RDI |
0x41a971 MOV 0x128(%R13),%R8 |
0x41a978 MOV -0xa0(%RBP),%R9 |
0x41a97f MOV 0x18(%R9),%R9 |
0x41a983 ADD $0x10,%RDI |
0x41a987 LEA (%RDX,%RSI,8),%R10 |
0x41a98b SAL $0x4,%RSI |
0x41a98f ADD %RDX,%RSI |
0x41a992 XOR %R11D,%R11D |
0x41a995 NOPW %CS:(%RAX,%RAX,1) |
(282) 0x41a9a0 VMOVSD 0x10(%R13),%XMM0 |
(282) 0x41a9a6 VADDSD (%RCX,%R11,8),%XMM0,%XMM0 |
(282) 0x41a9ac VMOVSD %XMM0,0x10(%R13) |
(282) 0x41a9b2 VMOVSD (%RDX,%R11,8),%XMM0 |
(282) 0x41a9b8 VMOVHPD (%R10,%R11,8),%XMM0,%XMM0 |
(282) 0x41a9be VADDPD -0x10(%RDI),%XMM0,%XMM0 |
(282) 0x41a9c3 VMOVSD (%RDI),%XMM1 |
(282) 0x41a9c7 VADDSD (%RSI,%R11,8),%XMM1,%XMM1 |
(282) 0x41a9cd VMOVUPD %XMM0,-0x10(%RDI) |
(282) 0x41a9d2 VMOVSD %XMM1,(%RDI) |
(282) 0x41a9d6 VMOVSD (%R9,%R11,8),%XMM0 |
(282) 0x41a9dc VADDSD (%R8,%R11,8),%XMM0,%XMM0 |
(282) 0x41a9e2 VMOVSD %XMM0,(%R9,%R11,8) |
(282) 0x41a9e8 INC %R11 |
(282) 0x41a9eb ADD $0x18,%RDI |
(282) 0x41a9ef CMP %R11,%RAX |
(282) 0x41a9f2 JNE 41a9a0 |
0x41a9f4 VMOVSD 0x10(%R13),%XMM0 |
0x41a9fa VMULSD 0xd0476(%RIP),%XMM0,%XMM0 |
0x41aa02 JMP 41aa0c |
0x41aa04 VMOVSD 0xd168c(%RIP),%XMM0 |
0x41aa0c VMOVSD %XMM0,0x10(%R13) |
0x41aa12 ADD $0x98,%RSP |
0x41aa19 POP %RBX |
0x41aa1a POP %R12 |
0x41aa1c POP %R13 |
0x41aa1e POP %R14 |
0x41aa20 POP %R15 |
0x41aa22 POP %RBP |
0x41aa23 VZEROUPPER |
0x41aa26 RET |
0x41aa27 NOPW (%RAX,%RAX,1) |
Path / |
Source file and lines | TwoBodyJastrowRef.h:268-432 |
Module | exec |
nb instructions | 72 |
nb uops | 74 |
loop length | 363 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 1 |
used zmm registers | 0 |
nb stack references | 5 |
micro-operation queue | 12.33 cycles |
front end | 12.33 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 2.50 | 2.40 | 7.67 | 7.67 | 7.00 | 2.40 | 2.50 | 7.00 | 7.00 | 7.00 | 2.20 | 7.67 |
cycles | 2.50 | 2.40 | 7.67 | 7.67 | 7.00 | 2.40 | 2.50 | 7.00 | 7.00 | 7.00 | 2.20 | 7.67 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 12.13 |
Stall cycles | 0.00 |
Front-end | 12.33 |
Dispatch | 7.67 |
Overall L1 | 12.33 |
all | 6% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 14% |
all | 0% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 4% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 12% |
load | 12% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 12% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 12% |
load | 12% |
store | 11% |
mul | 12% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x98,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
TEST %R8B,%R8B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41a939 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x8f9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RSI,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x248(%R13),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 453d20 <_ZNK11qmcplusplus11ParticleSet14getDistTableAAEi> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa0(%R13),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R9,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41a939 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x8f9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD 0xd1fd7(%RIP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD 0xd0dfe(%RIP),%YMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
MOV %R9,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R13,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 41a0dd <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x9d> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOVQ $0,0x10(%R13) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x90(%R13),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41aa04 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x9c4> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xd8(%R13),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x100(%R13),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVSXD 0xf0(%R13),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x98(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RDI),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x128(%R13),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xa0(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%R9),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD $0x10,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA (%RDX,%RSI,8),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAL $0x4,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
ADD %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R11D,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD 0x10(%R13),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD 0xd0476(%RIP),%XMM0,%XMM0 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
JMP 41aa0c <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x9cc> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
VMOVSD 0xd168c(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD %XMM0,0x10(%R13) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $0x98,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | TwoBodyJastrowRef.h:268-432 |
Module | exec |
nb instructions | 72 |
nb uops | 74 |
loop length | 363 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 1 |
used zmm registers | 0 |
nb stack references | 5 |
micro-operation queue | 12.33 cycles |
front end | 12.33 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 2.50 | 2.40 | 7.67 | 7.67 | 7.00 | 2.40 | 2.50 | 7.00 | 7.00 | 7.00 | 2.20 | 7.67 |
cycles | 2.50 | 2.40 | 7.67 | 7.67 | 7.00 | 2.40 | 2.50 | 7.00 | 7.00 | 7.00 | 2.20 | 7.67 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 12.13 |
Stall cycles | 0.00 |
Front-end | 12.33 |
Dispatch | 7.67 |
Overall L1 | 12.33 |
all | 6% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 14% |
all | 0% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 4% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 12% |
load | 12% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 12% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 12% |
load | 12% |
store | 11% |
mul | 12% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x98,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
TEST %R8B,%R8B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41a939 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x8f9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RSI,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x248(%R13),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 453d20 <_ZNK11qmcplusplus11ParticleSet14getDistTableAAEi> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa0(%R13),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R9,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41a939 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x8f9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD 0xd1fd7(%RIP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD 0xd0dfe(%RIP),%YMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
MOV %R9,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R13,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 41a0dd <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x9d> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOVQ $0,0x10(%R13) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x90(%R13),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41aa04 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x9c4> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xd8(%R13),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x100(%R13),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVSXD 0xf0(%R13),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x98(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RDI),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x128(%R13),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xa0(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%R9),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD $0x10,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA (%RDX,%RSI,8),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAL $0x4,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
ADD %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R11D,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD 0x10(%R13),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD 0xd0476(%RIP),%XMM0,%XMM0 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
JMP 41aa0c <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x9cc> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
VMOVSD 0xd168c(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD %XMM0,0x10(%R13) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $0x98,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼miniqmcreference::TwoBodyJastrowRef | 0.13 | 0.14 |
○Loop 282 - TwoBodyJastrowRef.h:423-427 - exec | 0 | 0 |
▼Loop 283 - TwoBodyJastrowRef.h:268-420 - exec– | 0 | 0 |
▼Loop 284 - TwoBodyJastrowRef.h:268-420 - exec– | 0 | 0 |
○Loop 286 - TwoBodyJastrowRef.h:393-398 - exec | 0.04 | 0.04 |
○Loop 294 - TwoBodyJastrowRef.h:381-382 - exec | 0.02 | 0.02 |
○Loop 292 - TwoBodyJastrowRef.h:381-382 - exec | 0.02 | 0.02 |
○Loop 296 - TwoBodyJastrowRef.h:375-376 - exec | 0.02 | 0.02 |
○Loop 290 - TwoBodyJastrowRef.h:381-382 - exec | 0.02 | 0.02 |
○Loop 288 - TwoBodyJastrowRef.h:388-391 - exec | 0.01 | 0.01 |
○Loop 295 - TwoBodyJastrowRef.h:375-376 - exec | 0 | 0 |
○Loop 287 - TwoBodyJastrowRef.h:388-391 - exec | 0 | 0 |
○Loop 298 - stl_numeric.h:126-127 - exec | 0 | 0.01 |
○Loop 293 - TwoBodyJastrowRef.h:381-382 - exec | 0 | 0 |
○Loop 291 - TwoBodyJastrowRef.h:381-382 - exec | 0 | 0 |
○Loop 289 - TwoBodyJastrowRef.h:381-382 - exec | 0 | 0 |
○Loop 297 - stl_numeric.h:126-127 - exec | 0 | 0 |
○Loop 299 - TwoBodyJastrowRef.h:269-274 - exec | 0 | 0 |
○Loop 285 - TwoBodyJastrowRef.h:388-391 - exec | 0 | 0 |