Function: miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evaluateGL(qmcp ... | Module: exec | Source: TwoBodyJastrowRef.h:268-432 [...] | Coverage: 0.1% |
---|
Function: miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evaluateGL(qmcp ... | Module: exec | Source: TwoBodyJastrowRef.h:268-432 [...] | Coverage: 0.1% |
---|
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/shared_ptr_base.h: 1308 - 1308 |
-------------------------------------------------------------------------------- |
1308: { return _M_ptr; } |
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/VectorSoAContainer.h: 231 - 273 |
-------------------------------------------------------------------------------- |
231: inline const AoSElement_t operator[](size_t i) const { return AoSElement_t(myData + i, nGhosts); } |
[...] |
244: *(_base + M * i) = rhs[i]; |
[...] |
263: inline Accessor operator()(size_t i) { return Accessor(myData + i, nGhosts); } |
[...] |
273: inline const T* restrict data(size_t i) const { return myData + i * nGhosts; } |
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/OhmmsVector.h: 223 - 249 |
-------------------------------------------------------------------------------- |
223: return X[i]; |
[...] |
229: return X[i]; |
[...] |
249: inline const_pointer data() const { return X; } |
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/stl_numeric.h: 126 - 127 |
-------------------------------------------------------------------------------- |
126: for (; __first != __last; ++__first) |
127: __init = __init + *__first; |
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/stl_algobase.h: 752 - 754 |
-------------------------------------------------------------------------------- |
752: for (__decltype(__n + 0) __niter = __n; |
753: __niter > 0; --__niter, (void) ++__first) |
754: *__first = __tmp; |
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/stl_iterator.h: 784 - 887 |
-------------------------------------------------------------------------------- |
784: : _M_current(__i) { } |
[...] |
887: { return __lhs.base() != __rhs.base(); } |
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/Jastrow/TwoBodyJastrowRef.h: 268 - 432 |
-------------------------------------------------------------------------------- |
268: const int igt = P.GroupID[iat] * NumGroups; |
269: for (int jg = 0; jg < NumGroups; ++jg) |
270: { |
271: const FuncType& f2(*F[igt + jg]); |
272: int iStart = P.first(jg); |
273: int iEnd = std::min(jelmax, P.last(jg)); |
274: f2.evaluateVGL(iat, iStart, iEnd, dist, u, du, d2u, DistCompressed.data(), DistIndice.data()); |
[...] |
360: const auto& d_table = P.getDistTableAA(myTableID); |
361: for (int ig = 0; ig < NumGroups; ++ig) |
362: { |
363: const int igt = ig * NumGroups; |
364: for (int iat = P.first(ig), last = P.last(ig); iat < last; ++iat) |
365: { |
366: computeU3(P, iat, d_table.getDistRow(iat).data(), cur_u.data(), cur_du.data(), cur_d2u.data(), true); |
367: Uat[iat] = std::accumulate(cur_u.begin(), cur_u.begin() + iat, valT()); |
[...] |
375: for (int jat = 0; jat < iat; ++jat) |
376: lap += d2u[jat] + lapfac * du[jat]; |
377: for (int idim = 0; idim < OHMMS_DIM; ++idim) |
378: { |
379: const valT* restrict dX = displ.data(idim); |
380: valT s = valT(); |
381: for (int jat = 0; jat < iat; ++jat) |
382: s += du[jat] * dX[jat]; |
383: grad[idim] = s; |
384: } |
385: dUat(iat) = grad; |
386: d2Uat[iat] = -lap; |
387: // add the contribution from the upper triangle |
388: for (int jat = 0; jat < iat; jat++) |
389: { |
390: Uat[jat] += u[jat]; |
391: d2Uat[jat] -= d2u[jat] + lapfac * du[jat]; |
[...] |
397: for (int jat = 0; jat < iat; jat++) |
398: save_g[jat] -= du[jat] * dX[jat]; |
[...] |
419: { |
420: if (fromscratch) |
421: recompute(P); |
422: LogValue = valT(0); |
423: for (int iat = 0; iat < N; ++iat) |
424: { |
425: LogValue += Uat[iat]; |
426: G[iat] += dUat[iat]; |
427: L[iat] += d2Uat[iat]; |
428: } |
429: |
430: constexpr valT mhalf(-0.5); |
431: LogValue = mhalf * LogValue; |
432: } |
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/Particle/DistanceTable.h: 268 - 268 |
-------------------------------------------------------------------------------- |
268: const DistRow& getDistRow(int iel) const { return distances_[iel]; } |
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/Numerics/PETE/OperatorTags.h: 94 - 94 |
-------------------------------------------------------------------------------- |
94: (const_cast<T1&>(a) += b); |
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/TinyVector.h: 145 - 169 |
-------------------------------------------------------------------------------- |
145: X[i] = base[i * offset]; |
[...] |
169: inline Type_t& operator[](unsigned int i) { return X[i]; } |
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/stl_vector.h: 951 - 1056 |
-------------------------------------------------------------------------------- |
951: return *(this->_M_impl._M_start + __n); |
[...] |
1056: { return _M_data_ptr(this->_M_impl._M_start); } |
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/Particle/ParticleSet.h: 313 - 316 |
-------------------------------------------------------------------------------- |
313: inline int first(int igroup) const { return (*group_offsets_)[igroup]; } |
314: |
315: ///return the last index of a group i |
316: inline int last(int igroup) const { return (*group_offsets_)[igroup + 1]; } |
0x41fbb0 PUSH %RBP |
0x41fbb1 MOV %RSP,%RBP |
0x41fbb4 PUSH %R15 |
0x41fbb6 PUSH %R14 |
0x41fbb8 PUSH %R13 |
0x41fbba PUSH %R12 |
0x41fbbc PUSH %RBX |
0x41fbbd AND $-0x20,%RSP |
0x41fbc1 SUB $0x160,%RSP |
0x41fbc8 MOV %RCX,0x88(%RSP) |
0x41fbd0 MOV %RDX,0x80(%RSP) |
0x41fbd8 MOV %RSI,0x58(%RSP) |
0x41fbdd MOV %RDI,0x20(%RSP) |
0x41fbe2 TEST %R8B,%R8B |
0x41fbe5 JE 420665 |
0x41fbeb MOV 0x20(%RSP),%RBX |
0x41fbf0 MOV 0x248(%RBX),%ESI |
0x41fbf6 MOV 0x58(%RSP),%RDI |
0x41fbfb CALL 460080 <_ZNK11qmcplusplus11ParticleSet14getDistTableAAEi> |
0x41fc00 MOV %RAX,0x78(%RSP) |
0x41fc05 MOV 0xa0(%RBX),%R10 |
0x41fc0c TEST %R10,%R10 |
0x41fc0f JE 420665 |
0x41fc15 XOR %ECX,%ECX |
0x41fc17 VMOVSD 0xdc789(%RIP),%XMM6 |
0x41fc1f MOV %R10,%R11 |
0x41fc22 JMP 41fc4a |
0x41fc24 NOPW %CS:(%RAX,%RAX,1) |
(368) 0x41fc30 MOV %R11,%RAX |
(368) 0x41fc33 MOV 0x90(%RSP),%RCX |
(368) 0x41fc3b INC %RCX |
(368) 0x41fc3e MOV %RAX,%R11 |
(368) 0x41fc41 CMP %RCX,%RAX |
(368) 0x41fc44 JBE 420665 |
(368) 0x41fc4a MOV 0x58(%RSP),%RAX |
(368) 0x41fc4f MOV 0x268(%RAX),%RAX |
(368) 0x41fc56 MOV 0x18(%RAX),%RAX |
(368) 0x41fc5a MOVSXD (%RAX,%RCX,4),%RSI |
(368) 0x41fc5e MOV %RCX,0x90(%RSP) |
(368) 0x41fc66 MOVSXD 0x4(%RAX,%RCX,4),%RAX |
(368) 0x41fc6b MOV %RAX,0x98(%RSP) |
(368) 0x41fc73 CMP %EAX,%ESI |
(368) 0x41fc75 JGE 41fc30 |
(368) 0x41fc77 MOV 0x20(%RSP),%RAX |
(368) 0x41fc7c MOV 0x140(%RAX),%R15 |
(368) 0x41fc83 MOV 0x158(%RAX),%R13 |
(368) 0x41fc8a MOV 0x170(%RAX),%R8 |
(368) 0x41fc91 MOV $0x1fffffffffffffff,%RAX |
(368) 0x41fc9b LEA (%RSI,%RAX,1),%RBX |
(368) 0x41fc9f JMP 41fcc7 |
0x41fca1 NOPW %CS:(%RAX,%RAX,1) |
(370) 0x41fcb0 INC %RSI |
(370) 0x41fcb3 INC %RBX |
(370) 0x41fcb6 MOV %R10,%RAX |
(370) 0x41fcb9 CMP 0x98(%RSP),%RSI |
(370) 0x41fcc1 JE 41fc33 |
(370) 0x41fcc7 MOV %R8,0x28(%RSP) |
(370) 0x41fccc MOV %R13,0x30(%RSP) |
(370) 0x41fcd1 MOV 0x78(%RSP),%RAX |
(370) 0x41fcd6 MOV 0x48(%RAX),%RAX |
(370) 0x41fcda LEA (%RSI,%RSI,4),%RCX |
(370) 0x41fcde MOV %RCX,0x38(%RSP) |
(370) 0x41fce3 MOV 0x18(%RAX,%RCX,8),%R8 |
(370) 0x41fce8 TEST %RSI,%RSI |
(370) 0x41fceb MOV %RSI,0x60(%RSP) |
(370) 0x41fcf0 MOV %RBX,0x40(%RSP) |
(370) 0x41fcf5 JLE 41fd4f |
(370) 0x41fcf7 MOV %ESI,%EBX |
(370) 0x41fcf9 SAL $0x3,%RBX |
(370) 0x41fcfd MOV %R15,%RDI |
(370) 0x41fd00 XOR %ESI,%ESI |
(370) 0x41fd02 MOV %RBX,%RDX |
(370) 0x41fd05 MOV %R10,%R14 |
(370) 0x41fd08 MOV %R11,%R13 |
(370) 0x41fd0b MOV %R8,%R12 |
(370) 0x41fd0e VZEROUPPER |
(370) 0x41fd11 CALL 4ec910 <_intel_fast_memset> |
(370) 0x41fd16 MOV 0x30(%RSP),%RDI |
(370) 0x41fd1b XOR %ESI,%ESI |
(370) 0x41fd1d MOV %RBX,%RDX |
(370) 0x41fd20 CALL 4ec910 <_intel_fast_memset> |
(370) 0x41fd25 MOV 0x28(%RSP),%RDI |
(370) 0x41fd2a XOR %ESI,%ESI |
(370) 0x41fd2c MOV %RBX,%RDX |
(370) 0x41fd2f MOV 0x40(%RSP),%RBX |
(370) 0x41fd34 CALL 4ec910 <_intel_fast_memset> |
(370) 0x41fd39 MOV %R12,%R8 |
(370) 0x41fd3c MOV %R13,%R11 |
(370) 0x41fd3f MOV 0x60(%RSP),%RSI |
(370) 0x41fd44 MOV %R14,%R10 |
(370) 0x41fd47 VMOVSD 0xdc659(%RIP),%XMM6 |
(370) 0x41fd4f TEST %R11,%R11 |
(370) 0x41fd52 JE 41fe20 |
(370) 0x41fd58 MOV 0x58(%RSP),%RAX |
(370) 0x41fd5d MOV 0x18(%RAX),%RAX |
(370) 0x41fd61 IMUL (%RAX,%RSI,4),%R11D |
(370) 0x41fd66 MOVSXD %R11D,%RAX |
(370) 0x41fd69 SAL $0x3,%RAX |
(370) 0x41fd6d MOV %RAX,0x48(%RSP) |
(370) 0x41fd72 MOV %R15,0x50(%RSP) |
(370) 0x41fd77 MOV 0x20(%RSP),%R14 |
(370) 0x41fd7c MOV $0x1,%R12D |
(370) 0x41fd82 MOV 0x30(%RSP),%R13 |
(370) 0x41fd87 MOV 0x28(%RSP),%R15 |
(370) 0x41fd8c NOPL (%RAX) |
(388) 0x41fd90 MOV 0x200(%R14),%RAX |
(388) 0x41fd97 ADD 0x48(%RSP),%RAX |
(388) 0x41fd9c MOV -0x8(%RAX,%R12,8),%RDI |
(388) 0x41fda1 MOV 0x58(%RSP),%RAX |
(388) 0x41fda6 MOV 0x268(%RAX),%RAX |
(388) 0x41fdad MOV 0x18(%RAX),%RAX |
(388) 0x41fdb1 MOV -0x4(%RAX,%R12,4),%EDX |
(388) 0x41fdb6 MOV (%RAX,%R12,4),%ECX |
(388) 0x41fdba CMP %ESI,%ECX |
(388) 0x41fdbc CMOVGE %ESI,%ECX |
(388) 0x41fdbf MOV %R8,%RBX |
(388) 0x41fdc2 MOV 0x50(%RSP),%R9 |
(388) 0x41fdc7 PUSHQ 0x1e8(%R14) |
(388) 0x41fdce PUSHQ 0x1d0(%R14) |
(388) 0x41fdd5 PUSH %R15 |
(388) 0x41fdd7 PUSH %R13 |
(388) 0x41fdd9 VZEROUPPER |
(388) 0x41fddc CALL 41cbf0 <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi> |
(388) 0x41fde1 MOV %RBX,%R8 |
(388) 0x41fde4 MOV 0x80(%RSP),%RSI |
(388) 0x41fdec ADD $0x20,%RSP |
(388) 0x41fdf0 MOV %R12D,%EAX |
(388) 0x41fdf3 MOV 0xa0(%R14),%R10 |
(388) 0x41fdfa INC %R12 |
(388) 0x41fdfd CMP %RAX,%R10 |
(388) 0x41fe00 JA 41fd90 |
(370) 0x41fe02 MOV 0x140(%R14),%R15 |
(370) 0x41fe09 MOV %R10,%R11 |
(370) 0x41fe0c VMOVSD 0xdc594(%RIP),%XMM6 |
(370) 0x41fe14 MOV 0x40(%RSP),%RBX |
(370) 0x41fe19 JMP 41fe23 |
0x41fe1b NOPL (%RAX,%RAX,1) |
(370) 0x41fe20 XOR %R11D,%R11D |
(370) 0x41fe23 VXORPD %XMM0,%XMM0,%XMM0 |
(370) 0x41fe27 VXORPD %XMM1,%XMM1,%XMM1 |
(370) 0x41fe2b MOV $0x1fffffffffffffff,%RAX |
(370) 0x41fe35 TEST %RAX,%RSI |
(370) 0x41fe38 JE 41feae |
(370) 0x41fe3a LEA (%RSI,%RAX,1),%RCX |
(370) 0x41fe3e AND %RAX,%RCX |
(370) 0x41fe41 INC %RCX |
(370) 0x41fe44 MOV %RCX,%RAX |
(370) 0x41fe47 MOV $0x3ffffffffffffffc,%RDX |
(370) 0x41fe51 AND %RDX,%RAX |
(370) 0x41fe54 JE 41fe90 |
(370) 0x41fe56 VXORPD %XMM1,%XMM1,%XMM1 |
(370) 0x41fe5a XOR %EDX,%EDX |
(370) 0x41fe5c NOPL (%RAX) |
(387) 0x41fe60 VADDPD (%R15,%RDX,8),%YMM1,%YMM1 |
(387) 0x41fe66 ADD $0x4,%RDX |
(387) 0x41fe6a CMP %RAX,%RDX |
(387) 0x41fe6d JB 41fe60 |
(370) 0x41fe6f VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(370) 0x41fe75 VADDPD %XMM2,%XMM1,%XMM1 |
(370) 0x41fe79 VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(370) 0x41fe7e VADDSD %XMM2,%XMM1,%XMM1 |
(370) 0x41fe82 CMP %RAX,%RCX |
(370) 0x41fe85 JNE 41fe92 |
(370) 0x41fe87 JMP 41feae |
0x41fe89 NOPL (%RAX) |
(370) 0x41fe90 XOR %EAX,%EAX |
(370) 0x41fe92 MOV $0x3d,%CL |
(370) 0x41fe94 BZHI %RCX,%RBX,%RCX |
(370) 0x41fe99 INC %RCX |
(370) 0x41fe9c NOPL (%RAX) |
(386) 0x41fea0 VADDSD (%R15,%RAX,8),%XMM1,%XMM1 |
(386) 0x41fea6 INC %RAX |
(386) 0x41fea9 CMP %RAX,%RCX |
(386) 0x41feac JNE 41fea0 |
(370) 0x41feae MOV 0x20(%RSP),%RAX |
(370) 0x41feb3 MOV 0xd8(%RAX),%RDX |
(370) 0x41feba VMOVSD %XMM1,(%RDX,%RSI,8) |
(370) 0x41febf MOV 0x158(%RAX),%R14 |
(370) 0x41fec6 MOV 0x170(%RAX),%R9 |
(370) 0x41fecd MOV 0x78(%RSP),%RAX |
(370) 0x41fed2 MOV 0x60(%RAX),%RAX |
(370) 0x41fed6 TEST %RSI,%RSI |
(370) 0x41fed9 JLE 41ff54 |
(370) 0x41fedb MOV %RSI,%RCX |
(370) 0x41fede AND $-0x4,%RCX |
(370) 0x41fee2 JE 41ff30 |
(370) 0x41fee4 LEA -0x1(%RCX),%R8 |
(370) 0x41fee8 VXORPD %XMM0,%XMM0,%XMM0 |
(370) 0x41feec XOR %EDI,%EDI |
(370) 0x41feee VBROADCASTSD 0xdc4b1(%RIP),%YMM1 |
(370) 0x41fef7 NOPW (%RAX,%RAX,1) |
(385) 0x41ff00 VADDPD (%R9,%RDI,8),%YMM0,%YMM0 |
(385) 0x41ff06 VFMADD231PD (%R14,%RDI,8),%YMM1,%YMM0 |
(385) 0x41ff0c ADD $0x4,%RDI |
(385) 0x41ff10 CMP %R8,%RDI |
(385) 0x41ff13 JLE 41ff00 |
(370) 0x41ff15 VEXTRACTF128 $0x1,%YMM0,%XMM1 |
(370) 0x41ff1b VADDPD %XMM1,%XMM0,%XMM0 |
(370) 0x41ff1f VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(370) 0x41ff24 VADDSD %XMM1,%XMM0,%XMM0 |
(370) 0x41ff28 JMP 41ff4f |
0x41ff2a NOPW (%RAX,%RAX,1) |
(370) 0x41ff30 VXORPD %XMM0,%XMM0,%XMM0 |
(370) 0x41ff34 XOR %ECX,%ECX |
(370) 0x41ff36 NOPW %CS:(%RAX,%RAX,1) |
(384) 0x41ff40 VADDSD (%R9,%RCX,8),%XMM0,%XMM0 |
(384) 0x41ff46 VFMADD231SD (%R14,%RCX,8),%XMM6,%XMM0 |
(384) 0x41ff4c INC %RCX |
(384) 0x41ff4f CMP %RCX,%RSI |
(384) 0x41ff52 JNE 41ff40 |
(370) 0x41ff54 MOV 0x38(%RSP),%RCX |
(370) 0x41ff59 MOV 0x8(%RAX,%RCX,8),%R12 |
(370) 0x41ff5e MOV 0x18(%RAX,%RCX,8),%RAX |
(370) 0x41ff63 VXORPD %XMM2,%XMM2,%XMM2 |
(370) 0x41ff67 VXORPD %XMM1,%XMM1,%XMM1 |
(370) 0x41ff6b TEST %RSI,%RSI |
(370) 0x41ff6e JLE 41ffe4 |
(370) 0x41ff70 MOV %RSI,%R8 |
(370) 0x41ff73 AND $-0x4,%R8 |
(370) 0x41ff77 JE 41ffc0 |
(370) 0x41ff79 LEA -0x1(%R8),%RCX |
(370) 0x41ff7d VXORPD %XMM1,%XMM1,%XMM1 |
(370) 0x41ff81 XOR %EDI,%EDI |
(370) 0x41ff83 NOPW %CS:(%RAX,%RAX,1) |
(383) 0x41ff90 VMOVUPD (%RAX,%RDI,8),%YMM3 |
(383) 0x41ff95 VFMADD231PD (%R14,%RDI,8),%YMM3,%YMM1 |
(383) 0x41ff9b ADD $0x4,%RDI |
(383) 0x41ff9f CMP %RCX,%RDI |
(383) 0x41ffa2 JLE 41ff90 |
(370) 0x41ffa4 VEXTRACTF128 $0x1,%YMM1,%XMM3 |
(370) 0x41ffaa VADDPD %XMM3,%XMM1,%XMM1 |
(370) 0x41ffae VSHUFPD $0x1,%XMM1,%XMM1,%XMM3 |
(370) 0x41ffb3 VADDSD %XMM3,%XMM1,%XMM1 |
(370) 0x41ffb7 JMP 41ffdf |
0x41ffb9 NOPL (%RAX) |
(370) 0x41ffc0 XOR %R8D,%R8D |
(370) 0x41ffc3 NOPW %CS:(%RAX,%RAX,1) |
(382) 0x41ffd0 VMOVSD (%RAX,%R8,8),%XMM3 |
(382) 0x41ffd6 VFMADD231SD (%R14,%R8,8),%XMM3,%XMM1 |
(382) 0x41ffdc INC %R8 |
(382) 0x41ffdf CMP %R8,%RSI |
(382) 0x41ffe2 JNE 41ffd0 |
(370) 0x41ffe4 MOV %R9,0x28(%RSP) |
(370) 0x41ffe9 TEST %RSI,%RSI |
(370) 0x41ffec JLE 420064 |
(370) 0x41ffee MOV %RSI,%R9 |
(370) 0x41fff1 AND $-0x4,%R9 |
(370) 0x41fff5 JE 420040 |
(370) 0x41fff7 LEA -0x1(%R9),%RCX |
(370) 0x41fffb LEA (%RAX,%R12,8),%RDI |
(370) 0x41ffff VXORPD %XMM2,%XMM2,%XMM2 |
(370) 0x420003 XOR %R8D,%R8D |
(370) 0x420006 NOPW %CS:(%RAX,%RAX,1) |
(381) 0x420010 VMOVUPD (%RDI,%R8,8),%YMM3 |
(381) 0x420016 VFMADD231PD (%R14,%R8,8),%YMM3,%YMM2 |
(381) 0x42001c ADD $0x4,%R8 |
(381) 0x420020 CMP %RCX,%R8 |
(381) 0x420023 JLE 420010 |
(370) 0x420025 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(370) 0x42002b VADDPD %XMM3,%XMM2,%XMM2 |
(370) 0x42002f VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(370) 0x420034 VADDSD %XMM3,%XMM2,%XMM2 |
(370) 0x420038 CMP %R9,%RSI |
(370) 0x42003b JNE 420047 |
(370) 0x42003d JMP 420064 |
0x42003f NOP |
(370) 0x420040 VXORPD %XMM2,%XMM2,%XMM2 |
(370) 0x420044 XOR %R9D,%R9D |
(370) 0x420047 LEA (%RAX,%R12,8),%RCX |
(370) 0x42004b NOPL (%RAX,%RAX,1) |
(380) 0x420050 VMOVSD (%RCX,%R9,8),%XMM3 |
(380) 0x420056 VFMADD231SD (%R14,%R9,8),%XMM3,%XMM2 |
(380) 0x42005c INC %R9 |
(380) 0x42005f CMP %R9,%RSI |
(380) 0x420062 JNE 420050 |
(370) 0x420064 TEST %RSI,%RSI |
(370) 0x420067 MOV %R10,0x48(%RSP) |
(370) 0x42006c MOV %R11,0x70(%RSP) |
(370) 0x420071 JLE 4200d0 |
(370) 0x420073 MOV %RSI,%R9 |
(370) 0x420076 AND $-0x4,%R9 |
(370) 0x42007a JE 4200e0 |
(370) 0x42007c LEA -0x1(%R9),%RCX |
(370) 0x420080 MOV %R12,%RDI |
(370) 0x420083 SAL $0x4,%RDI |
(370) 0x420087 ADD %RAX,%RDI |
(370) 0x42008a VXORPD %XMM3,%XMM3,%XMM3 |
(370) 0x42008e XOR %R8D,%R8D |
(370) 0x420091 NOPW %CS:(%RAX,%RAX,1) |
(379) 0x4200a0 VMOVUPD (%RDI,%R8,8),%YMM4 |
(379) 0x4200a6 VFMADD231PD (%R14,%R8,8),%YMM4,%YMM3 |
(379) 0x4200ac ADD $0x4,%R8 |
(379) 0x4200b0 CMP %RCX,%R8 |
(379) 0x4200b3 JLE 4200a0 |
(370) 0x4200b5 VEXTRACTF128 $0x1,%YMM3,%XMM4 |
(370) 0x4200bb VADDPD %XMM4,%XMM3,%XMM3 |
(370) 0x4200bf VSHUFPD $0x1,%XMM3,%XMM3,%XMM4 |
(370) 0x4200c4 VADDSD %XMM4,%XMM3,%XMM3 |
(370) 0x4200c8 CMP %R9,%RSI |
(370) 0x4200cb JNE 4200e7 |
(370) 0x4200cd JMP 420114 |
0x4200cf NOP |
(370) 0x4200d0 VXORPD %XMM3,%XMM3,%XMM3 |
(370) 0x4200d4 JMP 420114 |
0x4200d6 NOPW %CS:(%RAX,%RAX,1) |
(370) 0x4200e0 VXORPD %XMM3,%XMM3,%XMM3 |
(370) 0x4200e4 XOR %R9D,%R9D |
(370) 0x4200e7 MOV %R12,%RCX |
(370) 0x4200ea SAL $0x4,%RCX |
(370) 0x4200ee ADD %RAX,%RCX |
(370) 0x4200f1 NOPW %CS:(%RAX,%RAX,1) |
(378) 0x420100 VMOVSD (%RCX,%R9,8),%XMM4 |
(378) 0x420106 VFMADD231SD (%R14,%R9,8),%XMM4,%XMM3 |
(378) 0x42010c INC %R9 |
(378) 0x42010f CMP %R9,%RSI |
(378) 0x420112 JNE 420100 |
(370) 0x420114 MOV %R14,0x30(%RSP) |
(370) 0x420119 VPUNPCKLQDQ %XMM2,%XMM1,%XMM1 |
(370) 0x42011d MOV 0x20(%RSP),%RDI |
(370) 0x420122 MOV 0xf0(%RDI),%R8 |
(370) 0x420129 MOV 0x100(%RDI),%R14 |
(370) 0x420130 VMOVQ %R8,%XMM2 |
(370) 0x420135 VPSLLDQ $0x8,%XMM2,%XMM2 |
(370) 0x42013a VPBROADCASTQ %R14,%XMM4 |
(370) 0x420140 VPBROADCASTQ %RSI,%XMM5 |
(370) 0x420146 VPADDQ %XMM2,%XMM5,%XMM2 |
(370) 0x42014a VPSLLQ $0x3,%XMM2,%XMM2 |
(370) 0x42014f VPADDQ %XMM2,%XMM4,%XMM2 |
(370) 0x420153 VMOVQ %XMM2,%RCX |
(370) 0x420158 VMOVLPD %XMM1,(%RCX) |
(370) 0x42015c VPEXTRQ $0x1,%XMM2,%RCX |
(370) 0x420162 VMOVHPD %XMM1,(%RCX) |
(370) 0x420166 MOV %R8,0x38(%RSP) |
(370) 0x42016b LEA (%RSI,%R8,2),%RCX |
(370) 0x42016f VMOVSD %XMM3,(%R14,%RCX,8) |
(370) 0x420175 VXORPD 0xdb0c1(%RIP){1to2},%XMM0,%XMM0 |
(370) 0x42017f MOV 0x128(%RDI),%R8 |
(370) 0x420186 VMOVLPD %XMM0,(%R8,%RSI,8) |
(370) 0x42018c TEST %RSI,%RSI |
(370) 0x42018f JLE 420310 |
(370) 0x420195 MOV %R12,0x68(%RSP) |
(370) 0x42019a LEA -0x1(%RSI),%R9 |
(370) 0x42019e LEA (%RDX,%R9,8),%R11 |
(370) 0x4201a2 CMP %R8,%R11 |
(370) 0x4201a5 SETAEB 0x1f(%RSP) |
(370) 0x4201aa LEA (%R8,%R9,8),%RDI |
(370) 0x4201ae CMP %RDX,%RDI |
(370) 0x4201b1 SETAE %R13B |
(370) 0x4201b5 CMP %R15,%R11 |
(370) 0x4201b8 MOV %R15,%RSI |
(370) 0x4201bb SETB %R15B |
(370) 0x4201bf LEA (%RSI,%R9,8),%R10 |
(370) 0x4201c3 CMP %RDX,%R10 |
(370) 0x4201c6 SETBB 0x1e(%RSP) |
(370) 0x4201cb CMP %R8,%R10 |
(370) 0x4201ce SETB %R12B |
(370) 0x4201d2 MOV %RSI,0x50(%RSP) |
(370) 0x4201d7 CMP %RSI,%RDI |
(370) 0x4201da SETBB 0x1d(%RSP) |
(370) 0x4201df MOV 0x30(%RSP),%RSI |
(370) 0x4201e4 CMP %RSI,%R11 |
(370) 0x4201e7 SETB %R10B |
(370) 0x4201eb LEA (%RSI,%R9,8),%RBX |
(370) 0x4201ef CMP %RDX,%RBX |
(370) 0x4201f2 SETBB 0x1c(%RSP) |
(370) 0x4201f7 MOV 0x28(%RSP),%RCX |
(370) 0x4201fc CMP %RCX,%R11 |
(370) 0x4201ff SETB %R11B |
(370) 0x420203 LEA (%RCX,%R9,8),%R9 |
(370) 0x420207 CMP %RDX,%R9 |
(370) 0x42020a SETBB 0x1b(%RSP) |
(370) 0x42020f CMP %R8,%RBX |
(370) 0x420212 SETB %BL |
(370) 0x420215 CMP %RSI,%RDI |
(370) 0x420218 SETB %SIL |
(370) 0x42021c CMP %R8,%R9 |
(370) 0x42021f SETB %R9B |
(370) 0x420223 CMP %RCX,%RDI |
(370) 0x420226 SETB %CL |
(370) 0x420229 TEST %R13B,0x1f(%RSP) |
(370) 0x42022e JNE 420340 |
(370) 0x420234 OR 0x1e(%RSP),%R15B |
(370) 0x420239 JE 420340 |
(370) 0x42023f OR 0x1d(%RSP),%R12B |
(370) 0x420244 JE 420340 |
(370) 0x42024a OR 0x1c(%RSP),%R10B |
(370) 0x42024f JE 420340 |
(370) 0x420255 OR 0x1b(%RSP),%R11B |
(370) 0x42025a JE 420340 |
(370) 0x420260 OR %SIL,%BL |
(370) 0x420263 JE 420340 |
(370) 0x420269 OR %CL,%R9B |
(370) 0x42026c JE 420340 |
(370) 0x420272 MOV 0x60(%RSP),%RSI |
(370) 0x420277 MOV %RSI,%R9 |
(370) 0x42027a AND $-0x4,%R9 |
(370) 0x42027e MOV 0x48(%RSP),%R10 |
(370) 0x420283 MOV 0x70(%RSP),%R11 |
(370) 0x420288 MOV 0x40(%RSP),%RBX |
(370) 0x42028d JE 420407 |
(370) 0x420293 LEA -0x1(%R9),%RCX |
(370) 0x420297 XOR %EDI,%EDI |
(370) 0x420299 VBROADCASTSD 0xdafce(%RIP),%YMM1 |
(370) 0x4202a2 MOV 0x50(%RSP),%R15 |
(370) 0x4202a7 MOV 0x30(%RSP),%R13 |
(370) 0x4202ac MOV 0x28(%RSP),%R12 |
(370) 0x4202b1 NOPW %CS:(%RAX,%RAX,1) |
(377) 0x4202c0 VMOVUPD (%RDX,%RDI,8),%YMM0 |
(377) 0x4202c5 VADDPD (%R15,%RDI,8),%YMM0,%YMM0 |
(377) 0x4202cb VMOVUPD %YMM0,(%RDX,%RDI,8) |
(377) 0x4202d0 VMOVUPD (%R13,%RDI,8),%YMM0 |
(377) 0x4202d7 VFMSUB213PD (%R12,%RDI,8),%YMM1,%YMM0 |
(377) 0x4202dd VADDPD (%R8,%RDI,8),%YMM0,%YMM0 |
(377) 0x4202e3 VMOVUPD %YMM0,(%R8,%RDI,8) |
(377) 0x4202e9 ADD $0x4,%RDI |
(377) 0x4202ed CMP %RCX,%RDI |
(377) 0x4202f0 JLE 4202c0 |
(370) 0x4202f2 CMP %R9,%RSI |
(370) 0x4202f5 MOV 0x68(%RSP),%R12 |
(370) 0x4202fa JE 4203a6 |
(370) 0x420300 JMP 420419 |
0x420305 NOPW %CS:(%RAX,%RAX,1) |
(370) 0x420310 MOV 0x48(%RSP),%R10 |
(370) 0x420315 MOV 0x70(%RSP),%R11 |
(370) 0x42031a MOV 0x40(%RSP),%RBX |
(370) 0x42031f MOV 0x30(%RSP),%R13 |
(370) 0x420324 TEST %RSI,%RSI |
(370) 0x420327 MOV 0x28(%RSP),%R8 |
(370) 0x42032c JG 4203b4 |
(370) 0x420332 JMP 41fcb0 |
0x420337 NOPW (%RAX,%RAX,1) |
(370) 0x420340 XOR %ECX,%ECX |
(370) 0x420342 VMOVSD 0xdaf26(%RIP),%XMM1 |
(370) 0x42034a MOV 0x48(%RSP),%R10 |
(370) 0x42034f MOV 0x60(%RSP),%RSI |
(370) 0x420354 MOV 0x50(%RSP),%R15 |
(370) 0x420359 MOV 0x70(%RSP),%R11 |
(370) 0x42035e MOV 0x40(%RSP),%RBX |
(370) 0x420363 MOV 0x30(%RSP),%R13 |
(370) 0x420368 MOV 0x28(%RSP),%RDI |
(370) 0x42036d NOPL (%RAX) |
(376) 0x420370 VMOVSD (%RDX,%RCX,8),%XMM0 |
(376) 0x420375 VADDSD (%R15,%RCX,8),%XMM0,%XMM0 |
(376) 0x42037b VMOVSD %XMM0,(%RDX,%RCX,8) |
(376) 0x420380 VMOVSD (%R13,%RCX,8),%XMM0 |
(376) 0x420387 VFMSUB213SD (%RDI,%RCX,8),%XMM1,%XMM0 |
(376) 0x42038d VADDSD (%R8,%RCX,8),%XMM0,%XMM0 |
(376) 0x420393 VMOVSD %XMM0,(%R8,%RCX,8) |
(376) 0x420399 INC %RCX |
(376) 0x42039c CMP %RCX,%RSI |
(376) 0x42039f JNE 420370 |
(370) 0x4203a1 MOV 0x68(%RSP),%R12 |
(370) 0x4203a6 TEST %RSI,%RSI |
(370) 0x4203a9 MOV 0x28(%RSP),%R8 |
(370) 0x4203ae JLE 41fcb0 |
(370) 0x4203b4 MOV %RSI,%RDX |
(370) 0x4203b7 AND $-0x4,%RDX |
(370) 0x4203bb JE 420400 |
(370) 0x4203bd LEA -0x1(%RDX),%RCX |
(370) 0x4203c1 XOR %EDI,%EDI |
(370) 0x4203c3 NOPW %CS:(%RAX,%RAX,1) |
(375) 0x4203d0 VMOVUPD (%RAX,%RDI,8),%YMM0 |
(375) 0x4203d5 VMOVUPD (%R13,%RDI,8),%YMM1 |
(375) 0x4203dc VFNMADD213PD (%R14,%RDI,8),%YMM0,%YMM1 |
(375) 0x4203e2 VMOVUPD %YMM1,(%R14,%RDI,8) |
(375) 0x4203e8 ADD $0x4,%RDI |
(375) 0x4203ec CMP %RCX,%RDI |
(375) 0x4203ef JLE 4203d0 |
(370) 0x4203f1 JMP 42052b |
0x4203f6 NOPW %CS:(%RAX,%RAX,1) |
(370) 0x420400 XOR %EDX,%EDX |
(370) 0x420402 JMP 420510 |
(370) 0x420407 XOR %R9D,%R9D |
(370) 0x42040a MOV 0x50(%RSP),%R15 |
(370) 0x42040f MOV 0x30(%RSP),%R13 |
(370) 0x420414 MOV 0x68(%RSP),%R12 |
(370) 0x420419 MOV %RSI,%RCX |
(370) 0x42041c SUB %R9,%RCX |
(370) 0x42041f VPBROADCASTQ %RCX,%YMM0 |
(370) 0x420425 VPCMPNLEUQ 0xdc0b0(%RIP),%YMM0,%K1 |
(370) 0x420430 VMOVUPD (%RDX,%R9,8),%YMM0{%K1}{z} |
(370) 0x420437 VMOVUPD 0xa0(%RSP),%YMM2 |
(370) 0x420440 VMOVAPD %YMM0,%YMM2{%K1} |
(370) 0x420446 VMOVUPD (%R15,%R9,8),%YMM0{%K1}{z} |
(370) 0x42044d VMOVUPD 0xc0(%RSP),%YMM1 |
(370) 0x420456 VMOVAPD %YMM0,%YMM1{%K1} |
(370) 0x42045c VMOVUPD %YMM1,0xc0(%RSP) |
(370) 0x420465 VMOVUPD %YMM2,0xa0(%RSP) |
(370) 0x42046e VADDPD %YMM1,%YMM2,%YMM0 |
(370) 0x420472 VMOVUPD %YMM0,(%RDX,%R9,8){%K1} |
(370) 0x420479 VMOVUPD (%R13,%R9,8),%YMM0{%K1}{z} |
(370) 0x420481 VMOVUPD 0xe0(%RSP),%YMM2 |
(370) 0x42048a VMOVAPD %YMM0,%YMM2{%K1} |
(370) 0x420490 MOV 0x28(%RSP),%RCX |
(370) 0x420495 VMOVUPD (%RCX,%R9,8),%YMM0{%K1}{z} |
(370) 0x42049c VMOVUPD 0x100(%RSP),%YMM1 |
(370) 0x4204a5 VMOVAPD %YMM0,%YMM1{%K1} |
(370) 0x4204ab VMOVUPD %YMM1,0x100(%RSP) |
(370) 0x4204b4 VMOVAPD %YMM1,%YMM0 |
(370) 0x4204b8 VMOVUPD %YMM2,0xe0(%RSP) |
(370) 0x4204c1 VFMSUB231PD 0xdada5(%RIP){1to4},%YMM2,%YMM0 |
(370) 0x4204cb VMOVUPD (%R8,%R9,8),%YMM1{%K1}{z} |
(370) 0x4204d2 VMOVUPD 0x120(%RSP),%YMM2 |
(370) 0x4204db VMOVAPD %YMM1,%YMM2{%K1} |
(370) 0x4204e1 VMOVUPD %YMM2,0x120(%RSP) |
(370) 0x4204ea VADDPD %YMM0,%YMM2,%YMM0 |
(370) 0x4204ee VMOVUPD %YMM0,(%R8,%R9,8){%K1} |
(370) 0x4204f5 TEST %RSI,%RSI |
(370) 0x4204f8 MOV 0x28(%RSP),%R8 |
(370) 0x4204fd JG 4203b4 |
(370) 0x420503 JMP 41fcb0 |
0x420508 NOPL (%RAX,%RAX,1) |
(369) 0x420510 VMOVSD (%RAX,%RDX,8),%XMM0 |
(369) 0x420515 VMOVSD (%R13,%RDX,8),%XMM1 |
(369) 0x42051c VFNMADD213SD (%R14,%RDX,8),%XMM0,%XMM1 |
(369) 0x420522 VMOVSD %XMM1,(%R14,%RDX,8) |
(369) 0x420528 INC %RDX |
(369) 0x42052b CMP %RDX,%RSI |
(369) 0x42052e JNE 420510 |
(370) 0x420530 TEST %RSI,%RSI |
(370) 0x420533 JLE 41fcb0 |
(370) 0x420539 MOV %RSI,%RDX |
(370) 0x42053c AND $-0x4,%RDX |
(370) 0x420540 JE 42058e |
(370) 0x420542 LEA -0x1(%RDX),%RCX |
(370) 0x420546 MOV 0x38(%RSP),%RDI |
(370) 0x42054b LEA (%R14,%RDI,8),%RDI |
(370) 0x42054f LEA (%RAX,%R12,8),%R8 |
(370) 0x420553 XOR %R9D,%R9D |
(370) 0x420556 NOPW %CS:(%RAX,%RAX,1) |
(374) 0x420560 VMOVUPD (%R8,%R9,8),%YMM0 |
(374) 0x420566 VMOVUPD (%R13,%R9,8),%YMM1 |
(374) 0x42056d VFNMADD213PD (%RDI,%R9,8),%YMM0,%YMM1 |
(374) 0x420573 VMOVUPD %YMM1,(%RDI,%R9,8) |
(374) 0x420579 ADD $0x4,%R9 |
(374) 0x42057d CMP %RCX,%R9 |
(374) 0x420580 JLE 420560 |
(370) 0x420582 CMP %RDX,%RSI |
(370) 0x420585 MOV 0x28(%RSP),%R8 |
(370) 0x42058a JNE 420590 |
(370) 0x42058c JMP 4205bf |
(370) 0x42058e XOR %EDX,%EDX |
(370) 0x420590 MOV 0x38(%RSP),%RCX |
(370) 0x420595 LEA (%R14,%RCX,8),%RCX |
(370) 0x420599 LEA (%RAX,%R12,8),%RDI |
(370) 0x42059d NOPL (%RAX) |
(371) 0x4205a0 VMOVSD (%RDI,%RDX,8),%XMM0 |
(371) 0x4205a5 VMOVSD (%R13,%RDX,8),%XMM1 |
(371) 0x4205ac VFNMADD213SD (%RCX,%RDX,8),%XMM0,%XMM1 |
(371) 0x4205b2 VMOVSD %XMM1,(%RCX,%RDX,8) |
(371) 0x4205b7 INC %RDX |
(371) 0x4205ba CMP %RDX,%RSI |
(371) 0x4205bd JNE 4205a0 |
(370) 0x4205bf TEST %RSI,%RSI |
(370) 0x4205c2 JLE 41fcb0 |
(370) 0x4205c8 MOV %RSI,%RDX |
(370) 0x4205cb AND $-0x4,%RDX |
(370) 0x4205cf JE 420622 |
(370) 0x4205d1 LEA -0x1(%RDX),%RCX |
(370) 0x4205d5 MOV 0x38(%RSP),%RDI |
(370) 0x4205da SAL $0x4,%RDI |
(370) 0x4205de ADD %R14,%RDI |
(370) 0x4205e1 MOV %R12,%R8 |
(370) 0x4205e4 SAL $0x4,%R8 |
(370) 0x4205e8 ADD %RAX,%R8 |
(370) 0x4205eb XOR %R9D,%R9D |
(370) 0x4205ee XCHG %AX,%AX |
(373) 0x4205f0 VMOVUPD (%R8,%R9,8),%YMM0 |
(373) 0x4205f6 VMOVUPD (%R13,%R9,8),%YMM1 |
(373) 0x4205fd VFNMADD213PD (%RDI,%R9,8),%YMM0,%YMM1 |
(373) 0x420603 VMOVUPD %YMM1,(%RDI,%R9,8) |
(373) 0x420609 ADD $0x4,%R9 |
(373) 0x42060d CMP %RCX,%R9 |
(373) 0x420610 JLE 4205f0 |
(370) 0x420612 CMP %RDX,%RSI |
(370) 0x420615 MOV 0x28(%RSP),%R8 |
(370) 0x42061a JE 41fcb0 |
(370) 0x420620 JMP 420624 |
(370) 0x420622 XOR %EDX,%EDX |
(370) 0x420624 MOV 0x38(%RSP),%RCX |
(370) 0x420629 SAL $0x4,%RCX |
(370) 0x42062d ADD %RCX,%R14 |
(370) 0x420630 SAL $0x4,%R12 |
(370) 0x420634 ADD %R12,%RAX |
(370) 0x420637 NOPW (%RAX,%RAX,1) |
(372) 0x420640 VMOVSD (%RAX,%RDX,8),%XMM0 |
(372) 0x420645 VMOVSD (%R13,%RDX,8),%XMM1 |
(372) 0x42064c VFNMADD213SD (%R14,%RDX,8),%XMM0,%XMM1 |
(372) 0x420652 VMOVSD %XMM1,(%R14,%RDX,8) |
(372) 0x420658 INC %RDX |
(372) 0x42065b CMP %RDX,%RSI |
(372) 0x42065e JNE 420640 |
(370) 0x420660 JMP 41fcb0 |
0x420665 MOV 0x20(%RSP),%RAX |
0x42066a MOVQ $0,0x10(%RAX) |
0x420672 MOV 0x90(%RAX),%R10 |
0x420679 TEST %R10,%R10 |
0x42067c JE 4206cd |
0x42067e MOV 0x20(%RSP),%RCX |
0x420683 MOV 0xd8(%RCX),%R9 |
0x42068a MOV 0x100(%RCX),%RDX |
0x420691 MOVSXD 0xf0(%RCX),%RDI |
0x420698 MOV 0x80(%RSP),%RAX |
0x4206a0 MOV 0x18(%RAX),%RSI |
0x4206a4 MOV 0x128(%RCX),%RAX |
0x4206ab MOV 0x88(%RSP),%RCX |
0x4206b3 MOV 0x18(%RCX),%RCX |
0x4206b7 LEA (%RDI,%RDI,1),%R8 |
0x4206bb CMP $0x1,%R10 |
0x4206bf JNE 4206da |
0x4206c1 VXORPD %XMM0,%XMM0,%XMM0 |
0x4206c5 XOR %R11D,%R11D |
0x4206c8 JMP 4207ba |
0x4206cd VMOVSD 0xdab6b(%RIP),%XMM0 |
0x4206d5 JMP 420826 |
0x4206da MOV %R10,%RBX |
0x4206dd AND $-0x2,%RBX |
0x4206e1 LEA 0x8(%RDX,%RDI,8),%R14 |
0x4206e6 LEA 0x8(%RDX,%R8,8),%R15 |
0x4206eb LEA 0x28(%RSI),%R12 |
0x4206ef VXORPD %XMM0,%XMM0,%XMM0 |
0x4206f3 XOR %R11D,%R11D |
0x4206f6 MOV 0x20(%RSP),%R13 |
0x4206fb NOPL (%RAX,%RAX,1) |
(367) 0x420700 VADDSD (%R9,%R11,8),%XMM0,%XMM0 |
(367) 0x420706 VMOVSD %XMM0,0x10(%R13) |
(367) 0x42070c VMOVSD (%RDX,%R11,8),%XMM0 |
(367) 0x420712 VMOVHPD -0x8(%R14,%R11,8),%XMM0,%XMM0 |
(367) 0x420719 VADDPD -0x28(%R12),%XMM0,%XMM0 |
(367) 0x420720 VMOVSD -0x18(%R12),%XMM1 |
(367) 0x420727 VADDSD -0x8(%R15,%R11,8),%XMM1,%XMM1 |
(367) 0x42072e VMOVUPD %XMM0,-0x28(%R12) |
(367) 0x420735 VMOVSD %XMM1,-0x18(%R12) |
(367) 0x42073c VMOVSD (%RCX,%R11,8),%XMM0 |
(367) 0x420742 VADDSD (%RAX,%R11,8),%XMM0,%XMM0 |
(367) 0x420748 VMOVSD %XMM0,(%RCX,%R11,8) |
(367) 0x42074e VMOVSD 0x8(%R9,%R11,8),%XMM0 |
(367) 0x420755 VADDSD 0x10(%R13),%XMM0,%XMM0 |
(367) 0x42075b VMOVSD %XMM0,0x10(%R13) |
(367) 0x420761 VMOVSD 0x8(%RDX,%R11,8),%XMM0 |
(367) 0x420768 VMOVHPD (%R14,%R11,8),%XMM0,%XMM0 |
(367) 0x42076e VADDPD -0x10(%R12),%XMM0,%XMM0 |
(367) 0x420775 VMOVSD (%R12),%XMM1 |
(367) 0x42077b VADDSD (%R15,%R11,8),%XMM1,%XMM1 |
(367) 0x420781 VMOVUPD %XMM0,-0x10(%R12) |
(367) 0x420788 VMOVSD %XMM1,(%R12) |
(367) 0x42078e VMOVSD 0x8(%RCX,%R11,8),%XMM0 |
(367) 0x420795 VADDSD 0x8(%RAX,%R11,8),%XMM0,%XMM0 |
(367) 0x42079c VMOVSD %XMM0,0x8(%RCX,%R11,8) |
(367) 0x4207a3 VMOVSD 0x10(%R13),%XMM0 |
(367) 0x4207a9 ADD $0x2,%R11 |
(367) 0x4207ad ADD $0x30,%R12 |
(367) 0x4207b1 CMP %R11,%RBX |
(367) 0x4207b4 JNE 420700 |
0x4207ba TEST $0x1,%R10B |
0x4207be JE 42081e |
0x4207c0 VADDSD (%R9,%R11,8),%XMM0,%XMM0 |
0x4207c6 MOV 0x20(%RSP),%R10 |
0x4207cb VMOVSD %XMM0,0x10(%R10) |
0x4207d1 ADD %R11,%RDI |
0x4207d4 ADD %R11,%R8 |
0x4207d7 LEA (%R11,%R11,2),%R9 |
0x4207db VMOVSD (%RDX,%R11,8),%XMM0 |
0x4207e1 VMOVHPD (%RDX,%RDI,8),%XMM0,%XMM0 |
0x4207e6 VADDPD (%RSI,%R9,8),%XMM0,%XMM0 |
0x4207ec VMOVSD 0x10(%RSI,%R9,8),%XMM1 |
0x4207f3 VADDSD (%RDX,%R8,8),%XMM1,%XMM1 |
0x4207f9 VMOVUPD %XMM0,(%RSI,%R9,8) |
0x4207ff VMOVSD %XMM1,0x10(%RSI,%R9,8) |
0x420806 VMOVSD (%RCX,%R11,8),%XMM0 |
0x42080c VADDSD (%RAX,%R11,8),%XMM0,%XMM0 |
0x420812 VMOVSD %XMM0,(%RCX,%R11,8) |
0x420818 VMOVSD 0x10(%R10),%XMM0 |
0x42081e VMULSD 0xdaa0a(%RIP),%XMM0,%XMM0 |
0x420826 MOV 0x20(%RSP),%RAX |
0x42082b VMOVSD %XMM0,0x10(%RAX) |
0x420830 LEA -0x28(%RBP),%RSP |
0x420834 POP %RBX |
0x420835 POP %R12 |
0x420837 POP %R13 |
0x420839 POP %R14 |
0x42083b POP %R15 |
0x42083d POP %RBP |
0x42083e VZEROUPPER |
0x420841 RET |
0x420842 NOPW %CS:(%RAX,%RAX,1) |
0x42084c NOPL (%RAX) |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►99.69+ | miniqmcreference::TwoBodyJastr[...] | TwoBodyJastrowRef.h:411 | exec |
○ | qmcplusplus::WaveFunction::eva[...] | WaveFunction.cpp:175 | exec |
○ | main.extracted.113 | miniqmc.cpp:397 | exec |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Path / |
Source file and lines | TwoBodyJastrowRef.h:268-432 |
Module | exec |
nb instructions | 104 |
nb uops | 106 |
loop length | 523 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 6 |
ADD-SUB / MUL ratio | 4.00 |
micro-operation queue | 18.50 cycles |
front end | 18.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 4.90 | 4.90 | 12.33 | 12.33 | 9.00 | 4.70 | 4.70 | 9.00 | 9.00 | 9.00 | 4.80 | 12.33 |
cycles | 4.90 | 4.90 | 12.33 | 12.33 | 9.00 | 4.70 | 4.70 | 9.00 | 9.00 | 9.00 | 4.80 | 12.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 18.39-18.47 |
Stall cycles | 0.00 |
Front-end | 18.50 |
Dispatch | 12.33 |
Overall L1 | 18.50 |
all | 9% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 25% |
all | 21% |
load | 8% |
store | 20% |
mul | 0% |
add-sub | 25% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 100% |
all | 16% |
load | 7% |
store | 9% |
mul | 0% |
add-sub | 25% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 50% |
all | 13% |
load | 12% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 15% |
all | 15% |
load | 13% |
store | 15% |
mul | 12% |
add-sub | 15% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 25% |
all | 14% |
load | 13% |
store | 13% |
mul | 12% |
add-sub | 15% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 18% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x160,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %R8B,%R8B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 420665 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xab5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x20(%RSP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x248(%RBX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x58(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 460080 <_ZNK11qmcplusplus11ParticleSet14getDistTableAAEi> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa0(%RBX),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R10,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 420665 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xab5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD 0xdc789(%RIP),%XMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R10,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 41fc4a <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x9a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x20(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,0x10(%RAX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x90(%RAX),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R10,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 4206cd <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xb1d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x20(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xd8(%RCX),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x100(%RCX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVSXD 0xf0(%RCX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x80(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RAX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x128(%RCX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x88(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RCX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RDI,%RDI,1),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP $0x1,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4206da <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xb2a> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R11D,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4207ba <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xc0a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
VMOVSD 0xdab6b(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 420826 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xc76> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R10,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x2,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
LEA 0x8(%RDX,%RDI,8),%R14 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA 0x8(%RDX,%R8,8),%R15 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA 0x28(%RSI),%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R11D,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x20(%RSP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST $0x1,%R10B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 42081e <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xc6e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VADDSD (%R9,%R11,8),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
MOV 0x20(%RSP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD %XMM0,0x10(%R10) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %R11,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %R11,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA (%R11,%R11,2),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD (%RDX,%R11,8),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVHPD (%RDX,%RDI,8),%XMM0,%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4-12 | 1 |
VADDPD (%RSI,%R9,8),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD 0x10(%RSI,%R9,8),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RDX,%R8,8),%XMM1,%XMM1 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVUPD %XMM0,(%RSI,%R9,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD %XMM1,0x10(%RSI,%R9,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD (%RCX,%R11,8),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RAX,%R11,8),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM0,(%RCX,%R11,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD 0x10(%R10),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD 0xdaa0a(%RIP),%XMM0,%XMM0 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
MOV 0x20(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD %XMM0,0x10(%RAX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | TwoBodyJastrowRef.h:268-432 |
Module | exec |
nb instructions | 104 |
nb uops | 106 |
loop length | 523 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 6 |
ADD-SUB / MUL ratio | 4.00 |
micro-operation queue | 18.50 cycles |
front end | 18.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 4.90 | 4.90 | 12.33 | 12.33 | 9.00 | 4.70 | 4.70 | 9.00 | 9.00 | 9.00 | 4.80 | 12.33 |
cycles | 4.90 | 4.90 | 12.33 | 12.33 | 9.00 | 4.70 | 4.70 | 9.00 | 9.00 | 9.00 | 4.80 | 12.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 18.39-18.47 |
Stall cycles | 0.00 |
Front-end | 18.50 |
Dispatch | 12.33 |
Overall L1 | 18.50 |
all | 9% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 25% |
all | 21% |
load | 8% |
store | 20% |
mul | 0% |
add-sub | 25% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 100% |
all | 16% |
load | 7% |
store | 9% |
mul | 0% |
add-sub | 25% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 50% |
all | 13% |
load | 12% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 15% |
all | 15% |
load | 13% |
store | 15% |
mul | 12% |
add-sub | 15% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 25% |
all | 14% |
load | 13% |
store | 13% |
mul | 12% |
add-sub | 15% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 18% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x160,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %R8B,%R8B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 420665 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xab5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x20(%RSP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x248(%RBX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x58(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 460080 <_ZNK11qmcplusplus11ParticleSet14getDistTableAAEi> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa0(%RBX),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R10,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 420665 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xab5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD 0xdc789(%RIP),%XMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R10,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 41fc4a <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x9a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x20(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,0x10(%RAX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x90(%RAX),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R10,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 4206cd <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xb1d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x20(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xd8(%RCX),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x100(%RCX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVSXD 0xf0(%RCX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x80(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RAX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x128(%RCX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x88(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RCX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RDI,%RDI,1),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP $0x1,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4206da <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xb2a> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R11D,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4207ba <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xc0a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
VMOVSD 0xdab6b(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 420826 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xc76> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R10,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x2,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
LEA 0x8(%RDX,%RDI,8),%R14 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA 0x8(%RDX,%R8,8),%R15 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA 0x28(%RSI),%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R11D,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x20(%RSP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST $0x1,%R10B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 42081e <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xc6e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VADDSD (%R9,%R11,8),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
MOV 0x20(%RSP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD %XMM0,0x10(%R10) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %R11,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %R11,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA (%R11,%R11,2),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD (%RDX,%R11,8),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVHPD (%RDX,%RDI,8),%XMM0,%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4-12 | 1 |
VADDPD (%RSI,%R9,8),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD 0x10(%RSI,%R9,8),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RDX,%R8,8),%XMM1,%XMM1 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVUPD %XMM0,(%RSI,%R9,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD %XMM1,0x10(%RSI,%R9,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD (%RCX,%R11,8),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RAX,%R11,8),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM0,(%RCX,%R11,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD 0x10(%R10),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD 0xdaa0a(%RIP),%XMM0,%XMM0 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
MOV 0x20(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD %XMM0,0x10(%RAX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼miniqmcreference::TwoBodyJastrowRef | 0.1 | 0.12 |
○Loop 367 - TwoBodyJastrowRef.h:423-427 - exec | 0 | 0 |
▼Loop 368 - TwoBodyJastrowRef.h:268-420 - exec– | 0 | 0 |
▼Loop 370 - stl_algobase.h:752-754 - exec– | 0 | 0 |
○Loop 383 - TwoBodyJastrowRef.h:381-382 - exec | 0.02 | 0.02 |
○Loop 379 - TwoBodyJastrowRef.h:381-382 - exec | 0.02 | 0.02 |
○Loop 381 - TwoBodyJastrowRef.h:381-382 - exec | 0.02 | 0.02 |
○Loop 377 - TwoBodyJastrowRef.h:388-391 - exec | 0.01 | 0.01 |
○Loop 385 - TwoBodyJastrowRef.h:375-376 - exec | 0.01 | 0.01 |
○Loop 375 - TwoBodyJastrowRef.h:397-398 - exec | 0.01 | 0.01 |
○Loop 374 - TwoBodyJastrowRef.h:397-398 - exec | 0.01 | 0.01 |
○Loop 373 - TwoBodyJastrowRef.h:397-398 - exec | 0.01 | 0.01 |
○Loop 378 - TwoBodyJastrowRef.h:381-382 - exec | 0 | 0 |
○Loop 380 - TwoBodyJastrowRef.h:381-382 - exec | 0 | 0 |
○Loop 387 - stl_numeric.h:126-127 - exec | 0 | 0 |
○Loop 369 - TwoBodyJastrowRef.h:397-398 - exec | 0 | 0 |
○Loop 386 - stl_numeric.h:126-127 - exec | 0 | 0 |
○Loop 376 - TwoBodyJastrowRef.h:388-391 - exec | 0 | 0 |
○Loop 382 - TwoBodyJastrowRef.h:381-382 - exec | 0 | 0 |
○Loop 371 - TwoBodyJastrowRef.h:397-398 - exec | 0 | 0 |
○Loop 384 - TwoBodyJastrowRef.h:375-376 - exec | 0 | 0 |
○Loop 372 - TwoBodyJastrowRef.h:397-398 - exec | 0 | 0 |
○Loop 388 - TwoBodyJastrowRef.h:269-274 - exec | 0 | 0 |