Function: _ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLER ... | Module: exec | Source: TwoBodyJastrowRef.h:268-432 [...] | Coverage: 0.1% |
---|
Function: _ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLER ... | Module: exec | Source: TwoBodyJastrowRef.h:268-432 [...] | Coverage: 0.1% |
---|
/home/eoseret/qaas_runs_CPU_9468/171-145-9236/intel/miniqmc/build/miniqmc/src/Particle/DistanceTable.h: 268 - 268 |
-------------------------------------------------------------------------------- |
268: const DistRow& getDistRow(int iel) const { return distances_[iel]; } |
/home/eoseret/qaas_runs_CPU_9468/171-145-9236/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/Jastrow/TwoBodyJastrowRef.h: 268 - 432 |
-------------------------------------------------------------------------------- |
268: const int igt = P.GroupID[iat] * NumGroups; |
269: for (int jg = 0; jg < NumGroups; ++jg) |
270: { |
271: const FuncType& f2(*F[igt + jg]); |
272: int iStart = P.first(jg); |
273: int iEnd = std::min(jelmax, P.last(jg)); |
274: f2.evaluateVGL(iat, iStart, iEnd, dist, u, du, d2u, DistCompressed.data(), DistIndice.data()); |
[...] |
360: const auto& d_table = P.getDistTableAA(myTableID); |
361: for (int ig = 0; ig < NumGroups; ++ig) |
362: { |
363: const int igt = ig * NumGroups; |
364: for (int iat = P.first(ig), last = P.last(ig); iat < last; ++iat) |
365: { |
366: computeU3(P, iat, d_table.getDistRow(iat).data(), cur_u.data(), cur_du.data(), cur_d2u.data(), true); |
367: Uat[iat] = std::accumulate(cur_u.begin(), cur_u.begin() + iat, valT()); |
[...] |
375: for (int jat = 0; jat < iat; ++jat) |
376: lap += d2u[jat] + lapfac * du[jat]; |
377: for (int idim = 0; idim < OHMMS_DIM; ++idim) |
378: { |
379: const valT* restrict dX = displ.data(idim); |
380: valT s = valT(); |
381: for (int jat = 0; jat < iat; ++jat) |
382: s += du[jat] * dX[jat]; |
383: grad[idim] = s; |
384: } |
385: dUat(iat) = grad; |
386: d2Uat[iat] = -lap; |
387: // add the contribution from the upper triangle |
388: for (int jat = 0; jat < iat; jat++) |
389: { |
390: Uat[jat] += u[jat]; |
391: d2Uat[jat] -= d2u[jat] + lapfac * du[jat]; |
392: } |
393: for (int idim = 0; idim < OHMMS_DIM; ++idim) |
394: { |
395: valT* restrict save_g = dUat.data(idim); |
396: const valT* restrict dX = displ.data(idim); |
397: for (int jat = 0; jat < iat; jat++) |
398: save_g[jat] -= du[jat] * dX[jat]; |
[...] |
419: { |
420: if (fromscratch) |
421: recompute(P); |
422: LogValue = valT(0); |
423: for (int iat = 0; iat < N; ++iat) |
424: { |
425: LogValue += Uat[iat]; |
426: G[iat] += dUat[iat]; |
427: L[iat] += d2Uat[iat]; |
428: } |
429: |
430: constexpr valT mhalf(-0.5); |
431: LogValue = mhalf * LogValue; |
432: } |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/stl_numeric.h: 140 - 141 |
-------------------------------------------------------------------------------- |
140: for (; __first != __last; ++__first) |
141: __init = _GLIBCXX_MOVE_IF_20(__init) + *__first; |
/home/eoseret/qaas_runs_CPU_9468/171-145-9236/intel/miniqmc/build/miniqmc/src/Particle/ParticleSet.h: 313 - 316 |
-------------------------------------------------------------------------------- |
313: inline int first(int igroup) const { return (*group_offsets_)[igroup]; } |
314: |
315: ///return the last index of a group i |
316: inline int last(int igroup) const { return (*group_offsets_)[igroup + 1]; } |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/shared_ptr_base.h: 1296 - 1296 |
-------------------------------------------------------------------------------- |
1296: { return _M_ptr; } |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/stl_vector.h: 1064 - 1169 |
-------------------------------------------------------------------------------- |
1064: return *(this->_M_impl._M_start + __n); |
[...] |
1169: { return _M_data_ptr(this->_M_impl._M_start); } |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/stl_algobase.h: 235 - 1115 |
-------------------------------------------------------------------------------- |
235: if (__b < __a) |
[...] |
924: *__first = __tmp; |
[...] |
1115: if (__n <= 0) |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/stl_iterator.h: 1028 - 1182 |
-------------------------------------------------------------------------------- |
1028: : _M_current(__i) { } |
[...] |
1182: { return __lhs.base() != __rhs.base(); } |
/home/eoseret/qaas_runs_CPU_9468/171-145-9236/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/OhmmsVector.h: 223 - 249 |
-------------------------------------------------------------------------------- |
223: return X[i]; |
[...] |
229: return X[i]; |
[...] |
249: inline const_pointer data() const { return X; } |
/home/eoseret/qaas_runs_CPU_9468/171-145-9236/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/VectorSoAContainer.h: 231 - 273 |
-------------------------------------------------------------------------------- |
231: inline const AoSElement_t operator[](size_t i) const { return AoSElement_t(myData + i, nGhosts); } |
[...] |
244: *(_base + M * i) = rhs[i]; |
[...] |
263: inline Accessor operator()(size_t i) { return Accessor(myData + i, nGhosts); } |
[...] |
273: inline const T* restrict data(size_t i) const { return myData + i * nGhosts; } |
/home/eoseret/qaas_runs_CPU_9468/171-145-9236/intel/miniqmc/build/miniqmc/src/Numerics/PETE/OperatorTags.h: 94 - 94 |
-------------------------------------------------------------------------------- |
94: (const_cast<T1&>(a) += b); |
0x41feb0 PUSH %RBP |
0x41feb1 MOV %RSP,%RBP |
0x41feb4 PUSH %R15 |
0x41feb6 PUSH %R14 |
0x41feb8 PUSH %R13 |
0x41feba PUSH %R12 |
0x41febc PUSH %RBX |
0x41febd SUB $0x78,%RSP |
0x41fec1 MOV %RCX,-0x98(%RBP) |
0x41fec8 MOV %RDX,-0x90(%RBP) |
0x41fecf MOV %RDI,-0x38(%RBP) |
0x41fed3 TEST %R8B,%R8B |
0x41fed6 JE 4206aa |
0x41fedc MOV %RSI,%RBX |
0x41fedf MOV -0x38(%RBP),%R14 |
0x41fee3 MOV 0x248(%R14),%ESI |
0x41feea MOV %RBX,%RDI |
0x41feed CALL 4617f0 <_ZNK11qmcplusplus11ParticleSet14getDistTableAAEi> |
0x41fef2 MOV %RAX,-0x88(%RBP) |
0x41fef9 MOV 0xa0(%R14),%R10 |
0x41ff00 TEST %R10,%R10 |
0x41ff03 JE 4206aa |
0x41ff09 XOR %ECX,%ECX |
0x41ff0b VMOVSD 0xd63a5(%RIP),%XMM5 |
0x41ff13 VBROADCASTSD 0xd639c(%RIP),%YMM6 |
0x41ff1c VMOVSD 0xd5144(%RIP),%XMM7 |
0x41ff24 VBROADCASTSD 0xd513b(%RIP),%YMM8 |
0x41ff2d MOV %R10,%RAX |
0x41ff30 MOV %R10,-0x40(%RBP) |
0x41ff34 MOV %RBX,-0x70(%RBP) |
0x41ff38 JMP 41ff62 |
0x41ff3a NOPW (%RAX,%RAX,1) |
(357) 0x41ff40 MOV -0x40(%RBP),%RAX |
(357) 0x41ff44 MOV -0xa0(%RBP),%RCX |
(357) 0x41ff4b INC %RCX |
(357) 0x41ff4e MOV %RAX,%RDX |
(357) 0x41ff51 MOV %RAX,-0x40(%RBP) |
(357) 0x41ff55 CMP %RCX,%RAX |
(357) 0x41ff58 MOV -0x70(%RBP),%RBX |
(357) 0x41ff5c JBE 4206aa |
(357) 0x41ff62 MOV 0x268(%RBX),%RAX |
(357) 0x41ff69 MOV 0x18(%RAX),%RAX |
(357) 0x41ff6d MOVSXD (%RAX,%RCX,4),%R13 |
(357) 0x41ff71 MOV 0x4(%RAX,%RCX,4),%EAX |
(357) 0x41ff75 CMP %EAX,%R13D |
(357) 0x41ff78 MOV %RCX,-0xa0(%RBP) |
(357) 0x41ff7f JGE 41ff40 |
(357) 0x41ff81 MOV %EAX,-0x74(%RBP) |
(357) 0x41ff84 MOV -0x38(%RBP),%RAX |
(357) 0x41ff88 MOV 0x140(%RAX),%R14 |
(357) 0x41ff8f MOV 0x158(%RAX),%RBX |
(357) 0x41ff96 MOV 0x170(%RAX),%R11 |
(357) 0x41ff9d MOV $0x1fffffffffffffff,%RAX |
(357) 0x41ffa7 ADD %R13,%RAX |
(357) 0x41ffaa MOV %RAX,-0x80(%RBP) |
(357) 0x41ffae JMP 41ffc0 |
(358) 0x41ffb0 INC %R13 |
(358) 0x41ffb3 INCQ -0x80(%RBP) |
(358) 0x41ffb7 MOV %R10,%RAX |
(358) 0x41ffba CMP %R13D,-0x74(%RBP) |
(358) 0x41ffbe JE 41ff44 |
(358) 0x41ffc0 MOV %R11,-0x48(%RBP) |
(358) 0x41ffc4 MOV %RBX,-0x50(%RBP) |
(358) 0x41ffc8 MOV -0x88(%RBP),%RAX |
(358) 0x41ffcf MOV 0x48(%RAX),%RAX |
(358) 0x41ffd3 LEA (,%R13,4),%RCX |
(358) 0x41ffdb ADD %R13,%RCX |
(358) 0x41ffde MOV %RCX,-0x60(%RBP) |
(358) 0x41ffe2 MOV 0x18(%RAX,%RCX,8),%R8 |
(358) 0x41ffe7 TEST %R13,%R13 |
(358) 0x41ffea JLE 42004d |
(358) 0x41ffec MOV %R13D,%R12D |
(358) 0x41ffef SAL $0x3,%R12 |
(358) 0x41fff3 MOV %R14,%RDI |
(358) 0x41fff6 XOR %ESI,%ESI |
(358) 0x41fff8 MOV %R12,%RDX |
(358) 0x41fffb MOV %R10,%RBX |
(358) 0x41fffe MOV %R8,%R15 |
(358) 0x420001 VZEROUPPER |
(358) 0x420004 CALL 4e5850 <_intel_fast_memset> |
(358) 0x420009 MOV -0x50(%RBP),%RDI |
(358) 0x42000d XOR %ESI,%ESI |
(358) 0x42000f MOV %R12,%RDX |
(358) 0x420012 CALL 4e5850 <_intel_fast_memset> |
(358) 0x420017 MOV -0x48(%RBP),%RDI |
(358) 0x42001b XOR %ESI,%ESI |
(358) 0x42001d MOV %R12,%RDX |
(358) 0x420020 CALL 4e5850 <_intel_fast_memset> |
(358) 0x420025 MOV %R15,%R8 |
(358) 0x420028 MOV %RBX,%R10 |
(358) 0x42002b VBROADCASTSD 0xd5034(%RIP),%YMM8 |
(358) 0x420034 VMOVSD 0xd502c(%RIP),%XMM7 |
(358) 0x42003c VBROADCASTSD 0xd6273(%RIP),%YMM6 |
(358) 0x420045 VMOVSD 0xd626b(%RIP),%XMM5 |
(358) 0x42004d MOV -0x40(%RBP),%RCX |
(358) 0x420051 TEST %RCX,%RCX |
(358) 0x420054 JE 420130 |
(358) 0x42005a MOV %R14,-0x58(%RBP) |
(358) 0x42005e MOV -0x70(%RBP),%RAX |
(358) 0x420062 MOV 0x18(%RAX),%RAX |
(358) 0x420066 IMUL (%RAX,%R13,4),%ECX |
(358) 0x42006b MOVSXD %ECX,%RAX |
(358) 0x42006e SAL $0x3,%RAX |
(358) 0x420072 MOV %RAX,-0x40(%RBP) |
(358) 0x420076 MOV -0x38(%RBP),%R15 |
(358) 0x42007a MOV $0x1,%R12D |
(358) 0x420080 MOV -0x48(%RBP),%RBX |
(358) 0x420084 NOPW %CS:(%RAX,%RAX,1) |
(373) 0x420090 MOV 0x200(%R15),%RAX |
(373) 0x420097 ADD -0x40(%RBP),%RAX |
(373) 0x42009b MOV -0x8(%RAX,%R12,8),%RDI |
(373) 0x4200a0 MOV -0x70(%RBP),%RAX |
(373) 0x4200a4 MOV 0x268(%RAX),%RAX |
(373) 0x4200ab MOV 0x18(%RAX),%RAX |
(373) 0x4200af MOV -0x4(%RAX,%R12,4),%EDX |
(373) 0x4200b4 MOVSXD (%RAX,%R12,4),%RAX |
(373) 0x4200b8 CMP %RAX,%R13 |
(373) 0x4200bb MOV %R13D,%ECX |
(373) 0x4200be CMOVG %EAX,%ECX |
(373) 0x4200c1 MOV %R13D,%ESI |
(373) 0x4200c4 MOV %R8,%R14 |
(373) 0x4200c7 MOV -0x58(%RBP),%R9 |
(373) 0x4200cb PUSHQ 0x1e8(%R15) |
(373) 0x4200d2 PUSHQ 0x1d0(%R15) |
(373) 0x4200d9 PUSH %RBX |
(373) 0x4200da PUSHQ -0x50(%RBP) |
(373) 0x4200dd VZEROUPPER |
(373) 0x4200e0 CALL 41cee0 <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi> |
(373) 0x4200e5 MOV %R14,%R8 |
(373) 0x4200e8 ADD $0x20,%RSP |
(373) 0x4200ec MOV %R12D,%EAX |
(373) 0x4200ef MOV 0xa0(%R15),%R10 |
(373) 0x4200f6 INC %R12 |
(373) 0x4200f9 CMP %RAX,%R10 |
(373) 0x4200fc JA 420090 |
(358) 0x4200fe MOV 0x140(%R15),%R14 |
(358) 0x420105 MOV %R10,%RAX |
(358) 0x420108 MOV %R10,-0x40(%RBP) |
(358) 0x42010c VMOVSD 0xd61a4(%RIP),%XMM5 |
(358) 0x420114 VBROADCASTSD 0xd619b(%RIP),%YMM6 |
(358) 0x42011d VMOVSD 0xd4f43(%RIP),%XMM7 |
(358) 0x420125 VBROADCASTSD 0xd4f3a(%RIP),%YMM8 |
(358) 0x42012e JMP 420138 |
(358) 0x420130 MOVQ $0,-0x40(%RBP) |
(358) 0x420138 VXORPD %XMM0,%XMM0,%XMM0 |
(358) 0x42013c VXORPD %XMM1,%XMM1,%XMM1 |
(358) 0x420140 MOV $0x1fffffffffffffff,%RAX |
(358) 0x42014a TEST %RAX,%R13 |
(358) 0x42014d JE 4201ce |
(358) 0x42014f LEA (%RAX,%R13,1),%RCX |
(358) 0x420153 AND %RAX,%RCX |
(358) 0x420156 INC %RCX |
(358) 0x420159 MOV %RCX,%RAX |
(358) 0x42015c MOV $0x3ffffffffffffffc,%RDX |
(358) 0x420166 AND %RDX,%RAX |
(358) 0x420169 JE 4201b0 |
(358) 0x42016b VXORPD %XMM1,%XMM1,%XMM1 |
(358) 0x42016f XOR %EDX,%EDX |
(358) 0x420171 NOPW %CS:(%RAX,%RAX,1) |
(372) 0x420180 VADDPD (%R14,%RDX,8),%YMM1,%YMM1 |
(372) 0x420186 ADD $0x4,%RDX |
(372) 0x42018a CMP %RAX,%RDX |
(372) 0x42018d JB 420180 |
(358) 0x42018f VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(358) 0x420195 VADDPD %XMM2,%XMM1,%XMM1 |
(358) 0x420199 VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(358) 0x42019e VADDSD %XMM2,%XMM1,%XMM1 |
(358) 0x4201a2 CMP %RAX,%RCX |
(358) 0x4201a5 JNE 4201b2 |
(358) 0x4201a7 JMP 4201ce |
0x4201a9 NOPL (%RAX) |
(358) 0x4201b0 XOR %EAX,%EAX |
(358) 0x4201b2 MOV $0x3d,%CL |
(358) 0x4201b4 BZHI %RCX,-0x80(%RBP),%RCX |
(358) 0x4201ba INC %RCX |
(358) 0x4201bd NOPL (%RAX) |
(371) 0x4201c0 VADDSD (%R14,%RAX,8),%XMM1,%XMM1 |
(371) 0x4201c6 INC %RAX |
(371) 0x4201c9 CMP %RAX,%RCX |
(371) 0x4201cc JNE 4201c0 |
(358) 0x4201ce MOV -0x38(%RBP),%RCX |
(358) 0x4201d2 MOV 0xd8(%RCX),%RAX |
(358) 0x4201d9 VMOVSD %XMM1,(%RAX,%R13,8) |
(358) 0x4201df MOV 0x158(%RCX),%RBX |
(358) 0x4201e6 MOV 0x170(%RCX),%R11 |
(358) 0x4201ed MOV -0x88(%RBP),%RCX |
(358) 0x4201f4 MOV 0x60(%RCX),%RDX |
(358) 0x4201f8 TEST %R13,%R13 |
(358) 0x4201fb JLE 420250 |
(358) 0x4201fd MOV %R13,%RCX |
(358) 0x420200 AND $-0x4,%RCX |
(358) 0x420204 JE 420240 |
(358) 0x420206 LEA -0x1(%RCX),%RSI |
(358) 0x42020a VXORPD %XMM0,%XMM0,%XMM0 |
(358) 0x42020e XOR %EDI,%EDI |
(370) 0x420210 VADDPD (%R11,%RDI,8),%YMM0,%YMM0 |
(370) 0x420216 VFMADD231PD (%RBX,%RDI,8),%YMM6,%YMM0 |
(370) 0x42021c ADD $0x4,%RDI |
(370) 0x420220 CMP %RSI,%RDI |
(370) 0x420223 JLE 420210 |
(358) 0x420225 VEXTRACTF128 $0x1,%YMM0,%XMM1 |
(358) 0x42022b VADDPD %XMM1,%XMM0,%XMM0 |
(358) 0x42022f VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(358) 0x420234 VADDSD %XMM1,%XMM0,%XMM0 |
(358) 0x420238 JMP 420690 |
0x42023d NOPL (%RAX) |
(358) 0x420240 VXORPD %XMM0,%XMM0,%XMM0 |
(358) 0x420244 XOR %ECX,%ECX |
(358) 0x420246 JMP 420699 |
0x42024b NOPL (%RAX,%RAX,1) |
(358) 0x420250 MOV -0x60(%RBP),%RSI |
(358) 0x420254 MOV 0x8(%RDX,%RSI,8),%RCX |
(358) 0x420259 MOV 0x18(%RDX,%RSI,8),%RDX |
(358) 0x42025e VXORPD %XMM1,%XMM1,%XMM1 |
(358) 0x420262 VXORPD %XMM2,%XMM2,%XMM2 |
(358) 0x420266 TEST %R13,%R13 |
(358) 0x420269 JLE 4202d3 |
(358) 0x42026b MOV %R13,%RSI |
(358) 0x42026e AND $-0x4,%RSI |
(358) 0x420272 JE 4202b0 |
(358) 0x420274 LEA -0x1(%RSI),%RDI |
(358) 0x420278 VXORPD %XMM2,%XMM2,%XMM2 |
(358) 0x42027c XOR %R8D,%R8D |
(358) 0x42027f NOP |
(368) 0x420280 VMOVUPD (%RDX,%R8,8),%YMM3 |
(368) 0x420286 VFMADD231PD (%RBX,%R8,8),%YMM3,%YMM2 |
(368) 0x42028c ADD $0x4,%R8 |
(368) 0x420290 CMP %RDI,%R8 |
(368) 0x420293 JLE 420280 |
(358) 0x420295 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(358) 0x42029b VADDPD %XMM3,%XMM2,%XMM2 |
(358) 0x42029f VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(358) 0x4202a4 VADDSD %XMM3,%XMM2,%XMM2 |
(358) 0x4202a8 JMP 4202ce |
0x4202aa NOPW (%RAX,%RAX,1) |
(358) 0x4202b0 XOR %ESI,%ESI |
(358) 0x4202b2 NOPW %CS:(%RAX,%RAX,1) |
(367) 0x4202c0 VMOVSD (%RDX,%RSI,8),%XMM3 |
(367) 0x4202c5 VFMADD231SD (%RBX,%RSI,8),%XMM3,%XMM2 |
(367) 0x4202cb INC %RSI |
(367) 0x4202ce CMP %RSI,%R13 |
(367) 0x4202d1 JNE 4202c0 |
(358) 0x4202d3 TEST %R13,%R13 |
(358) 0x4202d6 JLE 420343 |
(358) 0x4202d8 MOV %R13,%RSI |
(358) 0x4202db AND $-0x4,%RSI |
(358) 0x4202df JE 420320 |
(358) 0x4202e1 LEA -0x1(%RSI),%RDI |
(358) 0x4202e5 LEA (%RDX,%RCX,8),%R8 |
(358) 0x4202e9 VXORPD %XMM1,%XMM1,%XMM1 |
(358) 0x4202ed XOR %R9D,%R9D |
(366) 0x4202f0 VMOVUPD (%R8,%R9,8),%YMM3 |
(366) 0x4202f6 VFMADD231PD (%RBX,%R9,8),%YMM3,%YMM1 |
(366) 0x4202fc ADD $0x4,%R9 |
(366) 0x420300 CMP %RDI,%R9 |
(366) 0x420303 JLE 4202f0 |
(358) 0x420305 VEXTRACTF128 $0x1,%YMM1,%XMM3 |
(358) 0x42030b VADDPD %XMM3,%XMM1,%XMM1 |
(358) 0x42030f VSHUFPD $0x1,%XMM1,%XMM1,%XMM3 |
(358) 0x420314 VADDSD %XMM3,%XMM1,%XMM1 |
(358) 0x420318 CMP %RSI,%R13 |
(358) 0x42031b JNE 420326 |
(358) 0x42031d JMP 420343 |
0x42031f NOP |
(358) 0x420320 VXORPD %XMM1,%XMM1,%XMM1 |
(358) 0x420324 XOR %ESI,%ESI |
(358) 0x420326 LEA (%RDX,%RCX,8),%RDI |
(358) 0x42032a NOPW (%RAX,%RAX,1) |
(365) 0x420330 VMOVSD (%RDI,%RSI,8),%XMM3 |
(365) 0x420335 VFMADD231SD (%RBX,%RSI,8),%XMM3,%XMM1 |
(365) 0x42033b INC %RSI |
(365) 0x42033e CMP %RSI,%R13 |
(365) 0x420341 JNE 420330 |
(358) 0x420343 TEST %R13,%R13 |
(358) 0x420346 JLE 4203a0 |
(358) 0x420348 MOV %R13,%RSI |
(358) 0x42034b AND $-0x4,%RSI |
(358) 0x42034f JE 4203b0 |
(358) 0x420351 LEA -0x1(%RSI),%RDI |
(358) 0x420355 MOV %RCX,%R8 |
(358) 0x420358 SAL $0x4,%R8 |
(358) 0x42035c ADD %RDX,%R8 |
(358) 0x42035f VXORPD %XMM3,%XMM3,%XMM3 |
(358) 0x420363 XOR %R9D,%R9D |
(358) 0x420366 NOPW %CS:(%RAX,%RAX,1) |
(364) 0x420370 VMOVUPD (%R8,%R9,8),%YMM4 |
(364) 0x420376 VFMADD231PD (%RBX,%R9,8),%YMM4,%YMM3 |
(364) 0x42037c ADD $0x4,%R9 |
(364) 0x420380 CMP %RDI,%R9 |
(364) 0x420383 JLE 420370 |
(358) 0x420385 VEXTRACTF128 $0x1,%YMM3,%XMM4 |
(358) 0x42038b VADDPD %XMM4,%XMM3,%XMM3 |
(358) 0x42038f VSHUFPD $0x1,%XMM3,%XMM3,%XMM4 |
(358) 0x420394 VADDSD %XMM4,%XMM3,%XMM3 |
(358) 0x420398 CMP %RSI,%R13 |
(358) 0x42039b JNE 4203b6 |
(358) 0x42039d JMP 4203d3 |
0x42039f NOP |
(358) 0x4203a0 VXORPD %XMM3,%XMM3,%XMM3 |
(358) 0x4203a4 JMP 4203d3 |
0x4203a6 NOPW %CS:(%RAX,%RAX,1) |
(358) 0x4203b0 VXORPD %XMM3,%XMM3,%XMM3 |
(358) 0x4203b4 XOR %ESI,%ESI |
(358) 0x4203b6 MOV %RCX,%RDI |
(358) 0x4203b9 SAL $0x4,%RDI |
(358) 0x4203bd ADD %RDX,%RDI |
(363) 0x4203c0 VMOVSD (%RDI,%RSI,8),%XMM4 |
(363) 0x4203c5 VFMADD231SD (%RBX,%RSI,8),%XMM4,%XMM3 |
(363) 0x4203cb INC %RSI |
(363) 0x4203ce CMP %RSI,%R13 |
(363) 0x4203d1 JNE 4203c0 |
(358) 0x4203d3 MOV -0x38(%RBP),%R9 |
(358) 0x4203d7 MOV 0xf0(%R9),%RSI |
(358) 0x4203de MOV 0x100(%R9),%RDI |
(358) 0x4203e5 LEA (%RSI,%R13,1),%R8 |
(358) 0x4203e9 VMOVSD %XMM2,(%RDI,%R13,8) |
(358) 0x4203ef VMOVSD %XMM1,(%RDI,%R8,8) |
(358) 0x4203f5 LEA (%R13,%RSI,2),%R8 |
(358) 0x4203fa VMOVSD %XMM3,(%RDI,%R8,8) |
(358) 0x420400 VXORPD 0xd4c98(%RIP),%XMM0,%XMM0 |
(358) 0x420408 MOV 0x128(%R9),%R8 |
(358) 0x42040f VMOVLPD %XMM0,(%R8,%R13,8) |
(358) 0x420415 TEST %R13,%R13 |
(358) 0x420418 JLE 41ffb0 |
(358) 0x42041e MOV %R10,-0x68(%RBP) |
(358) 0x420422 LEA (%RAX,%R13,8),%R9 |
(358) 0x420426 ADD $-0x8,%R9 |
(358) 0x42042a CMP %R8,%R9 |
(358) 0x42042d SETAEB -0x30(%RBP) |
(358) 0x420431 LEA (%R8,%R13,8),%R12 |
(358) 0x420435 ADD $-0x8,%R12 |
(358) 0x420439 CMP %RAX,%R12 |
(358) 0x42043c SETAEB -0x2f(%RBP) |
(358) 0x420440 CMP %R14,%R9 |
(358) 0x420443 SETB %R15B |
(358) 0x420447 LEA (%R14,%R13,8),%R10 |
(358) 0x42044b ADD $-0x8,%R10 |
(358) 0x42044f CMP %RAX,%R10 |
(358) 0x420452 SETBB -0x2e(%RBP) |
(358) 0x420456 CMP %R8,%R10 |
(358) 0x420459 SETB %R10B |
(358) 0x42045d MOV %R14,-0x58(%RBP) |
(358) 0x420461 CMP %R14,%R12 |
(358) 0x420464 SETBB -0x2d(%RBP) |
(358) 0x420468 CMP %RBX,%R9 |
(358) 0x42046b SETBB -0x2c(%RBP) |
(358) 0x42046f LEA (%RBX,%R13,8),%R14 |
(358) 0x420473 ADD $-0x8,%R14 |
(358) 0x420477 CMP %RAX,%R14 |
(358) 0x42047a SETBB -0x2b(%RBP) |
(358) 0x42047e CMP %R11,%R9 |
(358) 0x420481 SETBB -0x2a(%RBP) |
(358) 0x420485 MOV %R13,-0x60(%RBP) |
(358) 0x420489 LEA (%R11,%R13,8),%R9 |
(358) 0x42048d ADD $-0x8,%R9 |
(358) 0x420491 CMP %RAX,%R9 |
(358) 0x420494 SETBB -0x29(%RBP) |
(358) 0x420498 CMP %R8,%R14 |
(358) 0x42049b SETB %R13B |
(358) 0x42049f MOV %RBX,-0x50(%RBP) |
(358) 0x4204a3 CMP %RBX,%R12 |
(358) 0x4204a6 SETB %BL |
(358) 0x4204a9 CMP %R8,%R9 |
(358) 0x4204ac SETB %R9B |
(358) 0x4204b0 MOV %R11,-0x48(%RBP) |
(358) 0x4204b4 CMP %R11,%R12 |
(358) 0x4204b7 SETB %R11B |
(358) 0x4204bb MOVZX -0x2f(%RBP),%R14D |
(358) 0x4204c0 TEST %R14B,-0x30(%RBP) |
(358) 0x4204c4 JNE 420580 |
(358) 0x4204ca OR -0x2e(%RBP),%R15B |
(358) 0x4204ce JE 420580 |
(358) 0x4204d4 OR -0x2d(%RBP),%R10B |
(358) 0x4204d8 JE 420580 |
(358) 0x4204de MOVZX -0x2b(%RBP),%R10D |
(358) 0x4204e3 OR %R10B,-0x2c(%RBP) |
(358) 0x4204e7 JE 420580 |
(358) 0x4204ed MOVZX -0x29(%RBP),%R10D |
(358) 0x4204f2 OR %R10B,-0x2a(%RBP) |
(358) 0x4204f6 JE 420580 |
(358) 0x4204fc OR %BL,%R13B |
(358) 0x4204ff JE 420580 |
(358) 0x420505 OR %R11B,%R9B |
(358) 0x420508 JE 420580 |
(358) 0x42050a MOV -0x60(%RBP),%R13 |
(358) 0x42050e MOV %R13,%R9 |
(358) 0x420511 AND $-0x4,%R9 |
(358) 0x420515 JE 4205d4 |
(358) 0x42051b LEA -0x1(%R9),%R10 |
(358) 0x42051f XOR %R11D,%R11D |
(358) 0x420522 MOV -0x58(%RBP),%R14 |
(358) 0x420526 MOV -0x50(%RBP),%RBX |
(358) 0x42052a MOV -0x48(%RBP),%R15 |
(358) 0x42052e XCHG %AX,%AX |
(362) 0x420530 VMOVUPD (%RAX,%R11,8),%YMM0 |
(362) 0x420536 VADDPD (%R14,%R11,8),%YMM0,%YMM0 |
(362) 0x42053c VMOVUPD %YMM0,(%RAX,%R11,8) |
(362) 0x420542 VMOVUPD (%RBX,%R11,8),%YMM0 |
(362) 0x420548 VFMSUB213PD (%R15,%R11,8),%YMM8,%YMM0 |
(362) 0x42054e VADDPD (%R8,%R11,8),%YMM0,%YMM0 |
(362) 0x420554 VMOVUPD %YMM0,(%R8,%R11,8) |
(362) 0x42055a ADD $0x4,%R11 |
(362) 0x42055e CMP %R10,%R11 |
(362) 0x420561 JLE 420530 |
(358) 0x420563 CMP %R9,%R13 |
(358) 0x420566 MOV -0x68(%RBP),%R10 |
(358) 0x42056a MOV %R15,%R11 |
(358) 0x42056d JNE 4205f0 |
(358) 0x420573 JMP 420622 |
0x420578 NOPL (%RAX,%RAX,1) |
(358) 0x420580 XOR %R9D,%R9D |
(358) 0x420583 MOV -0x68(%RBP),%R10 |
(358) 0x420587 MOV -0x60(%RBP),%R13 |
(358) 0x42058b MOV -0x58(%RBP),%R14 |
(358) 0x42058f MOV -0x50(%RBP),%RBX |
(358) 0x420593 MOV -0x48(%RBP),%R11 |
(358) 0x420597 NOPW (%RAX,%RAX,1) |
(359) 0x4205a0 VMOVSD (%RAX,%R9,8),%XMM0 |
(359) 0x4205a6 VADDSD (%R14,%R9,8),%XMM0,%XMM0 |
(359) 0x4205ac VMOVSD %XMM0,(%RAX,%R9,8) |
(359) 0x4205b2 VMOVSD (%RBX,%R9,8),%XMM0 |
(359) 0x4205b8 VFMSUB213SD (%R11,%R9,8),%XMM7,%XMM0 |
(359) 0x4205be VADDSD (%R8,%R9,8),%XMM0,%XMM0 |
(359) 0x4205c4 VMOVSD %XMM0,(%R8,%R9,8) |
(359) 0x4205ca INC %R9 |
(359) 0x4205cd CMP %R9,%R13 |
(359) 0x4205d0 JNE 4205a0 |
(358) 0x4205d2 JMP 420622 |
(358) 0x4205d4 XOR %R9D,%R9D |
(358) 0x4205d7 MOV -0x68(%RBP),%R10 |
(358) 0x4205db MOV -0x58(%RBP),%R14 |
(358) 0x4205df MOV -0x50(%RBP),%RBX |
(358) 0x4205e3 MOV -0x48(%RBP),%R11 |
(358) 0x4205e7 NOPW (%RAX,%RAX,1) |
(361) 0x4205f0 VMOVSD (%RAX,%R9,8),%XMM0 |
(361) 0x4205f6 VADDSD (%R14,%R9,8),%XMM0,%XMM0 |
(361) 0x4205fc VMOVSD %XMM0,(%RAX,%R9,8) |
(361) 0x420602 VMOVSD (%RBX,%R9,8),%XMM0 |
(361) 0x420608 VFMSUB213SD (%R11,%R9,8),%XMM7,%XMM0 |
(361) 0x42060e VADDSD (%R8,%R9,8),%XMM0,%XMM0 |
(361) 0x420614 VMOVSD %XMM0,(%R8,%R9,8) |
(361) 0x42061a INC %R9 |
(361) 0x42061d CMP %R9,%R13 |
(361) 0x420620 JNE 4205f0 |
(358) 0x420622 LEA (%RDI,%RSI,8),%RAX |
(358) 0x420626 SAL $0x4,%RSI |
(358) 0x42062a ADD %RDI,%RSI |
(358) 0x42062d LEA (%RDX,%RCX,8),%R8 |
(358) 0x420631 SAL $0x4,%RCX |
(358) 0x420635 ADD %RDX,%RCX |
(358) 0x420638 XOR %R9D,%R9D |
(358) 0x42063b NOPL (%RAX,%RAX,1) |
(360) 0x420640 VMOVSD (%RBX,%R9,8),%XMM0 |
(360) 0x420646 VMOVSD (%RDX,%R9,8),%XMM1 |
(360) 0x42064c VFNMADD213SD (%RDI,%R9,8),%XMM0,%XMM1 |
(360) 0x420652 VMOVSD %XMM1,(%RDI,%R9,8) |
(360) 0x420658 VMOVSD (%R8,%R9,8),%XMM1 |
(360) 0x42065e VFNMADD213SD (%RAX,%R9,8),%XMM0,%XMM1 |
(360) 0x420664 VMOVSD %XMM1,(%RAX,%R9,8) |
(360) 0x42066a VMOVSD (%RCX,%R9,8),%XMM1 |
(360) 0x420670 VFNMADD213SD (%RSI,%R9,8),%XMM0,%XMM1 |
(360) 0x420676 VMOVSD %XMM1,(%RSI,%R9,8) |
(360) 0x42067c INC %R9 |
(360) 0x42067f CMP %R9,%R13 |
(360) 0x420682 JNE 420640 |
(358) 0x420684 JMP 41ffb0 |
0x420689 NOPL (%RAX) |
(369) 0x420690 CMP %RCX,%R13 |
(369) 0x420693 JE 420250 |
(369) 0x420699 VADDSD (%R11,%RCX,8),%XMM0,%XMM0 |
(369) 0x42069f VFMADD231SD (%RBX,%RCX,8),%XMM5,%XMM0 |
(369) 0x4206a5 INC %RCX |
(369) 0x4206a8 JMP 420690 |
0x4206aa MOV -0x38(%RBP),%RAX |
0x4206ae MOVQ $0,0x10(%RAX) |
0x4206b6 MOV 0x90(%RAX),%RAX |
0x4206bd TEST %RAX,%RAX |
0x4206c0 JE 42077c |
0x4206c6 MOV -0x38(%RBP),%R8 |
0x4206ca MOV 0xd8(%R8),%RCX |
0x4206d1 MOV 0xf0(%R8),%RDX |
0x4206d8 MOV 0x100(%R8),%RSI |
0x4206df MOV -0x90(%RBP),%RDI |
0x4206e6 MOV 0x18(%RDI),%RDI |
0x4206ea MOV 0x128(%R8),%R8 |
0x4206f1 MOV -0x98(%RBP),%R9 |
0x4206f8 MOV 0x18(%R9),%R9 |
0x4206fc SAL $0x20,%RDX |
0x420700 ADD $0x10,%RDI |
0x420704 MOV %RDX,%R10 |
0x420707 SAR $0x1c,%R10 |
0x42070b ADD %RSI,%R10 |
0x42070e SAR $0x1d,%RDX |
0x420712 ADD %RSI,%RDX |
0x420715 VXORPD %XMM0,%XMM0,%XMM0 |
0x420719 XOR %R11D,%R11D |
0x42071c MOV -0x38(%RBP),%RBX |
(356) 0x420720 VADDSD (%RCX,%R11,8),%XMM0,%XMM0 |
(356) 0x420726 VMOVSD %XMM0,0x10(%RBX) |
(356) 0x42072b VMOVSD (%RSI,%R11,8),%XMM0 |
(356) 0x420731 VMOVHPD (%RDX,%R11,8),%XMM0,%XMM0 |
(356) 0x420737 VADDPD -0x10(%RDI),%XMM0,%XMM0 |
(356) 0x42073c VMOVSD (%RDI),%XMM1 |
(356) 0x420740 VADDSD (%R10,%R11,8),%XMM1,%XMM1 |
(356) 0x420746 VMOVUPD %XMM0,-0x10(%RDI) |
(356) 0x42074b VMOVSD %XMM1,(%RDI) |
(356) 0x42074f VMOVSD (%R9,%R11,8),%XMM0 |
(356) 0x420755 VADDSD (%R8,%R11,8),%XMM0,%XMM0 |
(356) 0x42075b VMOVSD %XMM0,(%R9,%R11,8) |
(356) 0x420761 VMOVSD 0x10(%RBX),%XMM0 |
(356) 0x420766 INC %R11 |
(356) 0x420769 ADD $0x18,%RDI |
(356) 0x42076d CMP %R11,%RAX |
(356) 0x420770 JNE 420720 |
0x420772 VMULSD 0xd48b6(%RIP),%XMM0,%XMM0 |
0x42077a JMP 420784 |
0x42077c VMOVSD 0xd5b54(%RIP),%XMM0 |
0x420784 MOV -0x38(%RBP),%RAX |
0x420788 VMOVSD %XMM0,0x10(%RAX) |
0x42078d ADD $0x78,%RSP |
0x420791 POP %RBX |
0x420792 POP %R12 |
0x420794 POP %R13 |
0x420796 POP %R14 |
0x420798 POP %R15 |
0x42079a POP %RBP |
0x42079b VZEROUPPER |
0x42079e RET |
0x42079f NOP |
Path / |
Source file and lines | TwoBodyJastrowRef.h:268-432 |
Module | exec |
nb instructions | 80 |
nb uops | 82 |
loop length | 356 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 2 |
used zmm registers | 0 |
nb stack references | 6 |
micro-operation queue | 13.67 cycles |
front end | 13.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 3.50 | 2.00 | 9.67 | 9.67 | 7.50 | 2.00 | 3.50 | 7.50 | 7.50 | 7.50 | 2.00 | 9.67 |
cycles | 3.50 | 2.00 | 9.67 | 9.67 | 7.50 | 2.00 | 3.50 | 7.50 | 7.50 | 7.50 | 2.00 | 9.67 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 13.47-13.49 |
Stall cycles | 0.00 |
Front-end | 13.67 |
Dispatch | 9.67 |
Overall L1 | 13.67 |
all | 4% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 10% |
all | 12% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 33% |
all | 6% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
all | 12% |
load | 11% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 14% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 16% |
all | 12% |
load | 11% |
store | 11% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 13% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x78,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %R8B,%R8B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 4206aa <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x7fa> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RSI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x38(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x248(%R14),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4617f0 <_ZNK11qmcplusplus11ParticleSet14getDistTableAAEi> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa0(%R14),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R10,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 4206aa <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x7fa> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD 0xd63a5(%RIP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD 0xd639c(%RIP),%YMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVSD 0xd5144(%RIP),%XMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD 0xd513b(%RIP),%YMM8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
MOV %R10,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R10,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 41ff62 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xb2> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,0x10(%RAX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x90(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 42077c <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x8cc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x38(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xd8(%R8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xf0(%R8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x100(%R8),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x90(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RDI),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x128(%R8),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x98(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%R9),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SAL $0x20,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
ADD $0x10,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SAR $0x1c,%R10 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
ADD %RSI,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SAR $0x1d,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
ADD %RSI,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R11D,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x38(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD 0xd48b6(%RIP),%XMM0,%XMM0 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
JMP 420784 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x8d4> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
VMOVSD 0xd5b54(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD %XMM0,0x10(%RAX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $0x78,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | TwoBodyJastrowRef.h:268-432 |
Module | exec |
nb instructions | 80 |
nb uops | 82 |
loop length | 356 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 2 |
used zmm registers | 0 |
nb stack references | 6 |
micro-operation queue | 13.67 cycles |
front end | 13.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 3.50 | 2.00 | 9.67 | 9.67 | 7.50 | 2.00 | 3.50 | 7.50 | 7.50 | 7.50 | 2.00 | 9.67 |
cycles | 3.50 | 2.00 | 9.67 | 9.67 | 7.50 | 2.00 | 3.50 | 7.50 | 7.50 | 7.50 | 2.00 | 9.67 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 13.47-13.49 |
Stall cycles | 0.00 |
Front-end | 13.67 |
Dispatch | 9.67 |
Overall L1 | 13.67 |
all | 4% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 10% |
all | 12% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 33% |
all | 6% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
all | 12% |
load | 11% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 14% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 16% |
all | 12% |
load | 11% |
store | 11% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 13% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x78,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %R8B,%R8B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 4206aa <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x7fa> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RSI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x38(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x248(%R14),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4617f0 <_ZNK11qmcplusplus11ParticleSet14getDistTableAAEi> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa0(%R14),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R10,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 4206aa <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x7fa> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD 0xd63a5(%RIP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD 0xd639c(%RIP),%YMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVSD 0xd5144(%RIP),%XMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD 0xd513b(%RIP),%YMM8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
MOV %R10,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R10,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 41ff62 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xb2> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,0x10(%RAX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x90(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 42077c <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x8cc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x38(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xd8(%R8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xf0(%R8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x100(%R8),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x90(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RDI),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x128(%R8),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x98(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%R9),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SAL $0x20,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
ADD $0x10,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SAR $0x1c,%R10 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
ADD %RSI,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SAR $0x1d,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
ADD %RSI,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R11D,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x38(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD 0xd48b6(%RIP),%XMM0,%XMM0 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
JMP 420784 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x8d4> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
VMOVSD 0xd5b54(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD %XMM0,0x10(%RAX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $0x78,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb– | 0.1 | 0.11 |
○Loop 356 - TwoBodyJastrowRef.h:422-427 - exec | 0 | 0 |
▼Loop 357 - TwoBodyJastrowRef.h:268-420 - exec– | 0 | 0 |
▼Loop 358 - TwoBodyJastrowRef.h:268-420 - exec– | 0 | 0 |
○Loop 360 - TwoBodyJastrowRef.h:393-398 - exec | 0.03 | 0.03 |
○Loop 368 - TwoBodyJastrowRef.h:381-382 - exec | 0.02 | 0.02 |
○Loop 370 - TwoBodyJastrowRef.h:375-376 - exec | 0.01 | 0.01 |
○Loop 364 - TwoBodyJastrowRef.h:381-382 - exec | 0.01 | 0.01 |
○Loop 366 - TwoBodyJastrowRef.h:381-382 - exec | 0.01 | 0.01 |
○Loop 362 - TwoBodyJastrowRef.h:388-391 - exec | 0.01 | 0.01 |
○Loop 365 - TwoBodyJastrowRef.h:381-382 - exec | 0 | 0 |
○Loop 361 - TwoBodyJastrowRef.h:388-391 - exec | 0 | 0 |
○Loop 359 - TwoBodyJastrowRef.h:388-391 - exec | 0 | 0 |
○Loop 363 - TwoBodyJastrowRef.h:381-382 - exec | 0 | 0 |
○Loop 372 - stl_numeric.h:140-141 - exec | 0 | 0 |
○Loop 367 - TwoBodyJastrowRef.h:381-382 - exec | 0 | 0 |
○Loop 373 - TwoBodyJastrowRef.h:269-274 - exec | 0 | 0 |
○Loop 369 - TwoBodyJastrowRef.h:375-393 - exec | 0 | 0 |
○Loop 371 - stl_numeric.h:140-141 - exec | 0 | 0 |