Function: miniqmcreference::OneBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evaluateGL(qmcp ... | Module: exec | Source: OneBodyJastrowRef.h:108-194 [...] | Coverage: 0.02% |
---|
Function: miniqmcreference::OneBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evaluateGL(qmcp ... | Module: exec | Source: OneBodyJastrowRef.h:108-194 [...] | Coverage: 0.02% |
---|
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/VectorSoAContainer.h: 273 - 273 |
-------------------------------------------------------------------------------- |
273: inline const T* restrict data(size_t i) const { return myData + i * nGhosts; } |
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/TinyVectorOps.h: 49 - 49 |
-------------------------------------------------------------------------------- |
49: for (unsigned d = 0; d < D; ++d) |
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/OhmmsVector.h: 223 - 249 |
-------------------------------------------------------------------------------- |
223: return X[i]; |
[...] |
242: inline iterator begin() { return X; } |
[...] |
249: inline const_pointer data() const { return X; } |
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/Jastrow/OneBodyJastrowRef.h: 108 - 194 |
-------------------------------------------------------------------------------- |
108: const auto& d_ie = P.getDistTableAB(myTableID); |
109: for (int iat = 0; iat < Nelec; ++iat) |
110: { |
111: computeU3(P, iat, d_ie.getDistRow(iat).data()); |
112: Vat[iat] = std::accumulate(U.begin(), U.begin() + Nions, valT()); |
113: Lap[iat] = accumulateGL(dU.data(), d2U.data(), d_ie.getDisplRow(iat), Grad[iat]); |
[...] |
165: { |
166: if (fromscratch) |
167: recompute(P); |
168: |
169: for (size_t iat = 0; iat < Nelec; ++iat) |
170: G[iat] += Grad[iat]; |
171: for (size_t iat = 0; iat < Nelec; ++iat) |
172: L[iat] -= Lap[iat]; |
173: LogValue = -std::accumulate(Vat.begin(), Vat.begin() + Nelec, valT()); |
174: } |
[...] |
186: for (int jat = 0; jat < Nions; ++jat) |
187: lap += d2u[jat] + lapfac * du[jat]; |
188: for (int idim = 0; idim < OHMMS_DIM; ++idim) |
189: { |
190: const valT* restrict dX = displ.data(idim); |
191: valT s = valT(); |
192: for (int jat = 0; jat < Nions; ++jat) |
193: s += du[jat] * dX[jat]; |
194: grad[idim] = s; |
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/stl_numeric.h: 126 - 127 |
-------------------------------------------------------------------------------- |
126: for (; __first != __last; ++__first) |
127: __init = __init + *__first; |
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/stl_iterator.h: 784 - 887 |
-------------------------------------------------------------------------------- |
784: : _M_current(__i) { } |
[...] |
887: { return __lhs.base() != __rhs.base(); } |
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/Numerics/PETE/OperatorTags.h: 94 - 94 |
-------------------------------------------------------------------------------- |
94: (const_cast<T1&>(a) += b); |
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/TinyVector.h: 169 - 170 |
-------------------------------------------------------------------------------- |
169: inline Type_t& operator[](unsigned int i) { return X[i]; } |
170: inline const Type_t& operator[](unsigned int i) const { return X[i]; } |
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/stl_vector.h: 951 - 1056 |
-------------------------------------------------------------------------------- |
951: return *(this->_M_impl._M_start + __n); |
[...] |
1056: { return _M_data_ptr(this->_M_impl._M_start); } |
0x41ab10 PUSH %RBP |
0x41ab11 MOV %RSP,%RBP |
0x41ab14 PUSH %R15 |
0x41ab16 PUSH %R14 |
0x41ab18 PUSH %R13 |
0x41ab1a PUSH %R12 |
0x41ab1c PUSH %RBX |
0x41ab1d SUB $0x18,%RSP |
0x41ab21 MOV %RCX,%R14 |
0x41ab24 MOV %RDX,%R15 |
0x41ab27 MOV %RDI,%RBX |
0x41ab2a TEST %R8B,%R8B |
0x41ab2d JE 41af32 |
0x41ab33 MOV %RSI,%R12 |
0x41ab36 MOV 0xa8(%RBX),%ESI |
0x41ab3c MOV %R12,%RDI |
0x41ab3f CALL 4600b0 <_ZNK11qmcplusplus11ParticleSet14getDistTableABEi> |
0x41ab44 MOV 0x94(%RBX),%R8D |
0x41ab4b TEST %R8D,%R8D |
0x41ab4e JLE 41af39 |
0x41ab54 MOV %RAX,%R13 |
0x41ab57 MOV %R12,-0x40(%RBP) |
0x41ab5b MOV %R15,-0x30(%RBP) |
0x41ab5f MOV %R14,-0x38(%RBP) |
0x41ab63 MOV $0x1fffffffffffffff,%R15 |
0x41ab6d XOR %R14D,%R14D |
0x41ab70 JMP 41abba |
0x41ab72 NOPW %CS:(%RAX,%RAX,1) |
(290) 0x41ab80 LEA (%R14,%R14,2),%RAX |
(290) 0x41ab84 VXORPD %XMM0,%XMM0,%XMM0 |
(290) 0x41ab88 VMOVUPD %XMM0,(%RDX,%RAX,8) |
(290) 0x41ab8d MOVQ $0,0x10(%RDX,%RAX,8) |
(290) 0x41ab96 VXORPD %XMM0,%XMM0,%XMM0 |
(290) 0x41ab9a MOV 0x1b8(%RBX),%RAX |
(290) 0x41aba1 VMOVSD %XMM0,(%RAX,%R14,8) |
(290) 0x41aba7 INC %R14 |
(290) 0x41abaa MOVSXD 0x94(%RBX),%R8 |
(290) 0x41abb1 CMP %R8,%R14 |
(290) 0x41abb4 JGE 41af47 |
(290) 0x41abba MOV 0x48(%R13),%RAX |
(290) 0x41abbe LEA (%R14,%R14,4),%R12 |
(290) 0x41abc2 MOV 0x18(%RAX,%R12,8),%RCX |
(290) 0x41abc7 MOV %RBX,%RDI |
(290) 0x41abca MOV -0x40(%RBP),%RSI |
(290) 0x41abce MOV %R14D,%EDX |
(290) 0x41abd1 VZEROUPPER |
(290) 0x41abd4 CALL 41ca60 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE9computeU3ERNS1_11ParticleSetEiPKd> |
(290) 0x41abd9 MOVSXD 0x90(%RBX),%RAX |
(290) 0x41abe0 TEST %R15,%RAX |
(290) 0x41abe3 JE 41ac50 |
(290) 0x41abe5 MOV 0x100(%RBX),%RCX |
(290) 0x41abec LEA (%RAX,%R15,1),%RDX |
(290) 0x41abf0 AND %R15,%RDX |
(290) 0x41abf3 INC %RDX |
(290) 0x41abf6 MOV %RDX,%RSI |
(290) 0x41abf9 MOV $0x3ffffffffffffffc,%RDI |
(290) 0x41ac03 AND %RDI,%RSI |
(290) 0x41ac06 VMOVSD 0xe179a(%RIP),%XMM2 |
(290) 0x41ac0e VBROADCASTSD 0xe1791(%RIP),%YMM3 |
(290) 0x41ac17 JE 41ac70 |
(290) 0x41ac19 VXORPD %XMM0,%XMM0,%XMM0 |
(290) 0x41ac1d XOR %EDI,%EDI |
(290) 0x41ac1f NOP |
(302) 0x41ac20 VADDPD (%RCX,%RDI,8),%YMM0,%YMM0 |
(302) 0x41ac25 ADD $0x4,%RDI |
(302) 0x41ac29 CMP %RSI,%RDI |
(302) 0x41ac2c JB 41ac20 |
(290) 0x41ac2e VEXTRACTF128 $0x1,%YMM0,%XMM1 |
(290) 0x41ac34 VADDPD %XMM1,%XMM0,%XMM0 |
(290) 0x41ac38 VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(290) 0x41ac3d VADDSD %XMM1,%XMM0,%XMM0 |
(290) 0x41ac41 JMP 41af28 |
0x41ac46 NOPW %CS:(%RAX,%RAX,1) |
(290) 0x41ac50 VXORPD %XMM0,%XMM0,%XMM0 |
(290) 0x41ac54 VMOVSD 0xe174c(%RIP),%XMM2 |
(290) 0x41ac5c VBROADCASTSD 0xe1743(%RIP),%YMM3 |
(290) 0x41ac65 JMP 41ac80 |
0x41ac67 NOPW (%RAX,%RAX,1) |
(290) 0x41ac70 VXORPD %XMM0,%XMM0,%XMM0 |
(290) 0x41ac74 XOR %ESI,%ESI |
(290) 0x41ac76 JMP 41af20 |
0x41ac7b NOPL (%RAX,%RAX,1) |
(290) 0x41ac80 MOV 0xf0(%RBX),%RCX |
(290) 0x41ac87 VMOVSD %XMM0,(%RCX,%R14,8) |
(290) 0x41ac8d MOV 0x190(%RBX),%RDX |
(290) 0x41ac94 TEST %EAX,%EAX |
(290) 0x41ac96 JLE 41ab80 |
(290) 0x41ac9c MOV 0x118(%RBX),%RCX |
(290) 0x41aca3 MOV 0x130(%RBX),%RDI |
(290) 0x41acaa MOV %RAX,%RSI |
(290) 0x41acad AND $-0x4,%RSI |
(290) 0x41acb1 JE 41ad00 |
(290) 0x41acb3 VXORPD %XMM0,%XMM0,%XMM0 |
(290) 0x41acb7 XOR %R8D,%R8D |
(290) 0x41acba NOPW (%RAX,%RAX,1) |
(300) 0x41acc0 VADDPD (%RDI,%R8,8),%YMM0,%YMM0 |
(300) 0x41acc6 VFMADD231PD (%RCX,%R8,8),%YMM3,%YMM0 |
(300) 0x41accc ADD $0x4,%R8 |
(300) 0x41acd0 CMP %RSI,%R8 |
(300) 0x41acd3 JL 41acc0 |
(290) 0x41acd5 VEXTRACTF128 $0x1,%YMM0,%XMM1 |
(290) 0x41acdb VADDPD %XMM1,%XMM0,%XMM0 |
(290) 0x41acdf VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(290) 0x41ace4 VADDSD %XMM1,%XMM0,%XMM0 |
(290) 0x41ace8 MOV %RSI,%R8 |
(290) 0x41aceb CMP %RAX,%RSI |
(290) 0x41acee JNE 41ad10 |
(290) 0x41acf0 JMP 41ad24 |
0x41acf2 NOPW %CS:(%RAX,%RAX,1) |
(290) 0x41ad00 VXORPD %XMM0,%XMM0,%XMM0 |
(290) 0x41ad04 XOR %R8D,%R8D |
(290) 0x41ad07 NOPW (%RAX,%RAX,1) |
(291) 0x41ad10 VADDSD (%RDI,%R8,8),%XMM0,%XMM0 |
(291) 0x41ad16 VFMADD231SD (%RCX,%R8,8),%XMM2,%XMM0 |
(291) 0x41ad1c INC %R8 |
(291) 0x41ad1f CMP %R8,%RAX |
(291) 0x41ad22 JNE 41ad10 |
(290) 0x41ad24 MOV 0x60(%R13),%RDI |
(290) 0x41ad28 MOV 0x8(%RDI,%R12,8),%R8 |
(290) 0x41ad2d MOV 0x18(%RDI,%R12,8),%RDI |
(290) 0x41ad32 MOV %R8,%R9 |
(290) 0x41ad35 SAR $0x3f,%R9 |
(290) 0x41ad39 ANDN %R8,%R9,%R9 |
(290) 0x41ad3e TEST %R8,%R8 |
(290) 0x41ad41 LEA (%RAX,%R9,2),%R9 |
(290) 0x41ad45 LEA -0x8(%RDI,%R9,8),%R12 |
(290) 0x41ad4a LEA (%R14,%R14,2),%R9 |
(290) 0x41ad4e LEA (%RDX,%R9,8),%R10 |
(290) 0x41ad52 MOV $0,%R11D |
(290) 0x41ad58 CMOVS %R8,%R11 |
(290) 0x41ad5c CMP %R10,%R12 |
(290) 0x41ad5f JB 41adc0 |
(290) 0x41ad61 SAL $0x4,%R11 |
(290) 0x41ad65 ADD %RDI,%R11 |
(290) 0x41ad68 LEA 0x10(%RDX,%R9,8),%R12 |
(290) 0x41ad6d CMP %R11,%R12 |
(290) 0x41ad70 JB 41adc0 |
(290) 0x41ad72 SAL $0x3,%R8 |
(290) 0x41ad76 XOR %EDX,%EDX |
(290) 0x41ad78 NOPL (%RAX,%RAX,1) |
(299) 0x41ad80 VXORPD %XMM1,%XMM1,%XMM1 |
(299) 0x41ad84 XOR %ESI,%ESI |
(299) 0x41ad86 NOPW %CS:(%RAX,%RAX,1) |
(298) 0x41ad90 VMOVSD (%RDI,%RSI,8),%XMM2 |
(298) 0x41ad95 VFMADD231SD (%RCX,%RSI,8),%XMM2,%XMM1 |
(298) 0x41ad9b INC %RSI |
(298) 0x41ad9e CMP %RSI,%RAX |
(298) 0x41ada1 JNE 41ad90 |
(299) 0x41ada3 VMOVSD %XMM1,(%R10,%RDX,8) |
(299) 0x41ada9 LEA 0x1(%RDX),%RSI |
(299) 0x41adad ADD %R8,%RDI |
(299) 0x41adb0 CMP $0x2,%RDX |
(299) 0x41adb4 MOV %RSI,%RDX |
(299) 0x41adb7 JNE 41ad80 |
(290) 0x41adb9 JMP 41ab9a |
0x41adbe XCHG %AX,%AX |
(290) 0x41adc0 TEST %RSI,%RSI |
(290) 0x41adc3 JE 41ae02 |
(290) 0x41adc5 VXORPD %XMM1,%XMM1,%XMM1 |
(290) 0x41adc9 XOR %R10D,%R10D |
(290) 0x41adcc NOPL (%RAX) |
(297) 0x41add0 VMOVUPD (%RDI,%R10,8),%YMM2 |
(297) 0x41add6 VFMADD231PD (%RCX,%R10,8),%YMM2,%YMM1 |
(297) 0x41addc ADD $0x4,%R10 |
(297) 0x41ade0 CMP %RSI,%R10 |
(297) 0x41ade3 JL 41add0 |
(290) 0x41ade5 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(290) 0x41adeb VADDPD %XMM2,%XMM1,%XMM1 |
(290) 0x41adef VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(290) 0x41adf4 VADDSD %XMM2,%XMM1,%XMM1 |
(290) 0x41adf8 MOV %RSI,%R10 |
(290) 0x41adfb CMP %RAX,%RSI |
(290) 0x41adfe JNE 41ae10 |
(290) 0x41ae00 JMP 41ae24 |
(290) 0x41ae02 VXORPD %XMM1,%XMM1,%XMM1 |
(290) 0x41ae06 XOR %R10D,%R10D |
(290) 0x41ae09 NOPL (%RAX) |
(292) 0x41ae10 VMOVSD (%RDI,%R10,8),%XMM2 |
(292) 0x41ae16 VFMADD231SD (%RCX,%R10,8),%XMM2,%XMM1 |
(292) 0x41ae1c INC %R10 |
(292) 0x41ae1f CMP %R10,%RAX |
(292) 0x41ae22 JNE 41ae10 |
(290) 0x41ae24 VMOVSD %XMM1,(%RDX,%R9,8) |
(290) 0x41ae2a TEST %RSI,%RSI |
(290) 0x41ae2d JE 41ae72 |
(290) 0x41ae2f LEA (%RDI,%R8,8),%R10 |
(290) 0x41ae33 VXORPD %XMM1,%XMM1,%XMM1 |
(290) 0x41ae37 XOR %R11D,%R11D |
(290) 0x41ae3a NOPW (%RAX,%RAX,1) |
(296) 0x41ae40 VMOVUPD (%R10,%R11,8),%YMM2 |
(296) 0x41ae46 VFMADD231PD (%RCX,%R11,8),%YMM2,%YMM1 |
(296) 0x41ae4c ADD $0x4,%R11 |
(296) 0x41ae50 CMP %RSI,%R11 |
(296) 0x41ae53 JL 41ae40 |
(290) 0x41ae55 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(290) 0x41ae5b VADDPD %XMM2,%XMM1,%XMM1 |
(290) 0x41ae5f VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(290) 0x41ae64 VADDSD %XMM2,%XMM1,%XMM1 |
(290) 0x41ae68 MOV %RSI,%R10 |
(290) 0x41ae6b CMP %RAX,%RSI |
(290) 0x41ae6e JNE 41ae79 |
(290) 0x41ae70 JMP 41ae94 |
(290) 0x41ae72 VXORPD %XMM1,%XMM1,%XMM1 |
(290) 0x41ae76 XOR %R10D,%R10D |
(290) 0x41ae79 LEA (%RDI,%R8,8),%R11 |
(290) 0x41ae7d NOPL (%RAX) |
(293) 0x41ae80 VMOVSD (%R11,%R10,8),%XMM2 |
(293) 0x41ae86 VFMADD231SD (%RCX,%R10,8),%XMM2,%XMM1 |
(293) 0x41ae8c INC %R10 |
(293) 0x41ae8f CMP %R10,%RAX |
(293) 0x41ae92 JNE 41ae80 |
(290) 0x41ae94 VMOVSD %XMM1,0x8(%RDX,%R9,8) |
(290) 0x41ae9b TEST %RSI,%RSI |
(290) 0x41ae9e JE 41aeef |
(290) 0x41aea0 MOV %R8,%R10 |
(290) 0x41aea3 SAL $0x4,%R10 |
(290) 0x41aea7 ADD %RDI,%R10 |
(290) 0x41aeaa VXORPD %XMM1,%XMM1,%XMM1 |
(290) 0x41aeae XOR %R11D,%R11D |
(290) 0x41aeb1 NOPW %CS:(%RAX,%RAX,1) |
(295) 0x41aec0 VMOVUPD (%R10,%R11,8),%YMM2 |
(295) 0x41aec6 VFMADD231PD (%RCX,%R11,8),%YMM2,%YMM1 |
(295) 0x41aecc ADD $0x4,%R11 |
(295) 0x41aed0 CMP %RSI,%R11 |
(295) 0x41aed3 JL 41aec0 |
(290) 0x41aed5 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(290) 0x41aedb VADDPD %XMM2,%XMM1,%XMM1 |
(290) 0x41aedf VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(290) 0x41aee4 VADDSD %XMM2,%XMM1,%XMM1 |
(290) 0x41aee8 CMP %RAX,%RSI |
(290) 0x41aeeb JNE 41aef5 |
(290) 0x41aeed JMP 41af13 |
(290) 0x41aeef VXORPD %XMM1,%XMM1,%XMM1 |
(290) 0x41aef3 XOR %ESI,%ESI |
(290) 0x41aef5 SAL $0x4,%R8 |
(290) 0x41aef9 ADD %R8,%RDI |
(290) 0x41aefc NOPL (%RAX) |
(294) 0x41af00 VMOVSD (%RDI,%RSI,8),%XMM2 |
(294) 0x41af05 VFMADD231SD (%RCX,%RSI,8),%XMM2,%XMM1 |
(294) 0x41af0b INC %RSI |
(294) 0x41af0e CMP %RSI,%RAX |
(294) 0x41af11 JNE 41af00 |
(290) 0x41af13 VMOVSD %XMM1,0x10(%RDX,%R9,8) |
(290) 0x41af1a JMP 41ab9a |
0x41af1f NOP |
(301) 0x41af20 VADDSD (%RCX,%RSI,8),%XMM0,%XMM0 |
(301) 0x41af25 INC %RSI |
(301) 0x41af28 CMP %RSI,%RDX |
(301) 0x41af2b JNE 41af20 |
(290) 0x41af2d JMP 41ac80 |
0x41af32 MOV 0x94(%RBX),%R8D |
0x41af39 VXORPD %XMM0,%XMM0,%XMM0 |
0x41af3d TEST %R8D,%R8D |
0x41af40 JNE 41af5c |
0x41af42 JMP 41b226 |
0x41af47 MOV -0x38(%RBP),%R14 |
0x41af4b MOV -0x30(%RBP),%R15 |
0x41af4f VXORPD %XMM0,%XMM0,%XMM0 |
0x41af53 TEST %R8D,%R8D |
0x41af56 JE 41b226 |
0x41af5c MOVSXD %R8D,%RAX |
0x41af5f MOV 0x190(%RBX),%RDX |
0x41af66 MOV 0x18(%R15),%RSI |
0x41af6a LEA -0x1(%RAX),%RCX |
0x41af6e LEA -0x8(,%RAX,8),%RDI |
0x41af76 LEA (%RDI,%RDI,2),%RDI |
0x41af7a LEA 0x10(%RSI,%RDI,1),%R9 |
0x41af7f CMP %RDX,%R9 |
0x41af82 JB 41afd4 |
0x41af84 LEA 0x10(%RDX,%RDI,1),%RDI |
0x41af89 CMP %RSI,%RDI |
0x41af8c JB 41afd4 |
0x41af8e XOR %EDI,%EDI |
(289) 0x41af90 XOR %R8D,%R8D |
(289) 0x41af93 NOPW %CS:(%RAX,%RAX,1) |
(288) 0x41afa0 VMOVSD (%RSI,%R8,8),%XMM1 |
(288) 0x41afa6 VADDSD (%RDX,%R8,8),%XMM1,%XMM1 |
(288) 0x41afac VMOVSD %XMM1,(%RSI,%R8,8) |
(288) 0x41afb2 INC %R8 |
(288) 0x41afb5 CMP $0x3,%R8 |
(288) 0x41afb9 JNE 41afa0 |
(289) 0x41afbb LEA 0x1(%RDI),%R8 |
(289) 0x41afbf ADD $0x18,%RDX |
(289) 0x41afc3 ADD $0x18,%RSI |
(289) 0x41afc7 CMP %RCX,%RDI |
(289) 0x41afca MOV %R8,%RDI |
(289) 0x41afcd JNE 41af90 |
0x41afcf JMP 41b110 |
0x41afd4 MOV %R8D,%EDI |
0x41afd7 AND $0x3,%EDI |
0x41afda CMP $0x4,%R8D |
0x41afde JAE 41afe8 |
0x41afe0 XOR %R8D,%R8D |
0x41afe3 JMP 41b0b6 |
0x41afe8 MOV %RAX,%R9 |
0x41afeb AND $-0x4,%R9 |
0x41afef MOV $0x58,%R10D |
0x41aff5 XOR %R8D,%R8D |
0x41aff8 NOPL (%RAX,%RAX,1) |
(281) 0x41b000 VMOVUPD -0x58(%RSI,%R10,1),%XMM1 |
(281) 0x41b007 VADDPD -0x58(%RDX,%R10,1),%XMM1,%XMM1 |
(281) 0x41b00e VMOVUPD %XMM1,-0x58(%RSI,%R10,1) |
(281) 0x41b015 VMOVSD -0x48(%RSI,%R10,1),%XMM1 |
(281) 0x41b01c VADDSD -0x48(%RDX,%R10,1),%XMM1,%XMM1 |
(281) 0x41b023 VMOVSD %XMM1,-0x48(%RSI,%R10,1) |
(281) 0x41b02a VMOVUPD -0x40(%RSI,%R10,1),%XMM1 |
(281) 0x41b031 VADDPD -0x40(%RDX,%R10,1),%XMM1,%XMM1 |
(281) 0x41b038 VMOVUPD %XMM1,-0x40(%RSI,%R10,1) |
(281) 0x41b03f VMOVSD -0x30(%RSI,%R10,1),%XMM1 |
(281) 0x41b046 VADDSD -0x30(%RDX,%R10,1),%XMM1,%XMM1 |
(281) 0x41b04d VMOVSD %XMM1,-0x30(%RSI,%R10,1) |
(281) 0x41b054 VMOVUPD -0x28(%RSI,%R10,1),%XMM1 |
(281) 0x41b05b VADDPD -0x28(%RDX,%R10,1),%XMM1,%XMM1 |
(281) 0x41b062 VMOVUPD %XMM1,-0x28(%RSI,%R10,1) |
(281) 0x41b069 VMOVSD -0x18(%RSI,%R10,1),%XMM1 |
(281) 0x41b070 VADDSD -0x18(%RDX,%R10,1),%XMM1,%XMM1 |
(281) 0x41b077 VMOVSD %XMM1,-0x18(%RSI,%R10,1) |
(281) 0x41b07e VMOVUPD -0x10(%RSI,%R10,1),%XMM1 |
(281) 0x41b085 VADDPD -0x10(%RDX,%R10,1),%XMM1,%XMM1 |
(281) 0x41b08c VMOVUPD %XMM1,-0x10(%RSI,%R10,1) |
(281) 0x41b093 VMOVSD (%RSI,%R10,1),%XMM1 |
(281) 0x41b099 VADDSD (%RDX,%R10,1),%XMM1,%XMM1 |
(281) 0x41b09f VMOVSD %XMM1,(%RSI,%R10,1) |
(281) 0x41b0a5 ADD $0x4,%R8 |
(281) 0x41b0a9 ADD $0x60,%R10 |
(281) 0x41b0ad CMP %R8,%R9 |
(281) 0x41b0b0 JNE 41b000 |
0x41b0b6 TEST %RDI,%RDI |
0x41b0b9 JE 41b110 |
0x41b0bb LEA (%R8,%R8,2),%R8 |
0x41b0bf LEA 0x10(%RDX,%R8,8),%RDX |
0x41b0c4 LEA 0x10(%RSI,%R8,8),%RSI |
0x41b0c9 SAL $0x3,%EDI |
0x41b0cc LEA (%RDI,%RDI,2),%RDI |
0x41b0d0 XOR %R8D,%R8D |
0x41b0d3 NOPW %CS:(%RAX,%RAX,1) |
(287) 0x41b0e0 VMOVUPD -0x10(%RSI,%R8,1),%XMM1 |
(287) 0x41b0e7 VADDPD -0x10(%RDX,%R8,1),%XMM1,%XMM1 |
(287) 0x41b0ee VMOVUPD %XMM1,-0x10(%RSI,%R8,1) |
(287) 0x41b0f5 VMOVSD (%RSI,%R8,1),%XMM1 |
(287) 0x41b0fb VADDSD (%RDX,%R8,1),%XMM1,%XMM1 |
(287) 0x41b101 VMOVSD %XMM1,(%RSI,%R8,1) |
(287) 0x41b107 ADD $0x18,%R8 |
(287) 0x41b10b CMP %R8,%RDI |
(287) 0x41b10e JNE 41b0e0 |
0x41b110 MOV 0x1b8(%RBX),%RDX |
0x41b117 MOV 0x18(%R14),%RSI |
0x41b11b LEA (%RSI,%RCX,8),%RDI |
0x41b11f CMP %RDX,%RDI |
0x41b122 JB 41b149 |
0x41b124 LEA (%RDX,%RCX,8),%RCX |
0x41b128 CMP %RSI,%RCX |
0x41b12b JB 41b149 |
0x41b12d XOR %ECX,%ECX |
0x41b12f NOP |
(286) 0x41b130 VMOVSD (%RSI,%RCX,8),%XMM1 |
(286) 0x41b135 VSUBSD (%RDX,%RCX,8),%XMM1,%XMM1 |
(286) 0x41b13a VMOVSD %XMM1,(%RSI,%RCX,8) |
(286) 0x41b13f INC %RCX |
(286) 0x41b142 CMP %RCX,%RAX |
(286) 0x41b145 JNE 41b130 |
0x41b147 JMP 41b1a7 |
0x41b149 MOV %RAX,%RCX |
0x41b14c AND $-0x4,%RCX |
0x41b150 JE 41b182 |
0x41b152 LEA -0x1(%RCX),%RDI |
0x41b156 XOR %R8D,%R8D |
0x41b159 NOPL (%RAX) |
(285) 0x41b160 VMOVUPD (%RSI,%R8,8),%YMM1 |
(285) 0x41b166 VSUBPD (%RDX,%R8,8),%YMM1,%YMM1 |
(285) 0x41b16c VMOVUPD %YMM1,(%RSI,%R8,8) |
(285) 0x41b172 ADD $0x4,%R8 |
(285) 0x41b176 CMP %RDI,%R8 |
(285) 0x41b179 JBE 41b160 |
0x41b17b CMP %RAX,%RCX |
0x41b17e JNE 41b190 |
0x41b180 JMP 41b1a7 |
0x41b182 XOR %ECX,%ECX |
0x41b184 NOPW %CS:(%RAX,%RAX,1) |
(282) 0x41b190 VMOVSD (%RSI,%RCX,8),%XMM1 |
(282) 0x41b195 VSUBSD (%RDX,%RCX,8),%XMM1,%XMM1 |
(282) 0x41b19a VMOVSD %XMM1,(%RSI,%RCX,8) |
(282) 0x41b19f INC %RCX |
(282) 0x41b1a2 CMP %RCX,%RAX |
(282) 0x41b1a5 JNE 41b190 |
0x41b1a7 LEA (,%RAX,8),%RCX |
0x41b1af TEST %RCX,%RCX |
0x41b1b2 JE 41b226 |
0x41b1b4 MOV $0x1fffffffffffffff,%RDX |
0x41b1be MOV 0xf0(%RBX),%RCX |
0x41b1c5 ADD %RDX,%RAX |
0x41b1c8 AND %RDX,%RAX |
0x41b1cb INC %RAX |
0x41b1ce MOV $0x3ffffffffffffffc,%RDX |
0x41b1d8 AND %RAX,%RDX |
0x41b1db JE 41b213 |
0x41b1dd VXORPD %XMM0,%XMM0,%XMM0 |
0x41b1e1 XOR %ESI,%ESI |
0x41b1e3 NOPW %CS:(%RAX,%RAX,1) |
(284) 0x41b1f0 VADDPD (%RCX,%RSI,8),%YMM0,%YMM0 |
(284) 0x41b1f5 ADD $0x4,%RSI |
(284) 0x41b1f9 CMP %RDX,%RSI |
(284) 0x41b1fc JB 41b1f0 |
0x41b1fe VEXTRACTF128 $0x1,%YMM0,%XMM1 |
0x41b204 VADDPD %XMM1,%XMM0,%XMM0 |
0x41b208 VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
0x41b20d VADDSD %XMM1,%XMM0,%XMM0 |
0x41b211 JMP 41b221 |
0x41b213 XOR %EDX,%EDX |
0x41b215 VXORPD %XMM0,%XMM0,%XMM0 |
(283) 0x41b219 VADDSD (%RCX,%RDX,8),%XMM0,%XMM0 |
(283) 0x41b21e INC %RDX |
(283) 0x41b221 CMP %RDX,%RAX |
(283) 0x41b224 JNE 41b219 |
0x41b226 VXORPD 0xe0010(%RIP){1to2},%XMM0,%XMM0 |
0x41b230 VMOVLPD %XMM0,0x10(%RBX) |
0x41b235 ADD $0x18,%RSP |
0x41b239 POP %RBX |
0x41b23a POP %R12 |
0x41b23c POP %R13 |
0x41b23e POP %R14 |
0x41b240 POP %R15 |
0x41b242 POP %RBP |
0x41b243 VZEROUPPER |
0x41b246 RET |
0x41b247 NOPW (%RAX,%RAX,1) |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►97.45+ | miniqmcreference::OneBodyJastr[...] | OneBodyJastrowRef.h:122 | exec |
○ | qmcplusplus::WaveFunction::eva[...] | WaveFunction.cpp:175 | exec |
○ | main.extracted.113 | miniqmc.cpp:397 | exec |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so | |
►2.55+ | qmcplusplus::WaveFunction::eva[...] | stl_vector.h:933 | exec |
○ | main.extracted.110 | miniqmc.cpp:467 | exec |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Path / |
Source file and lines | OneBodyJastrowRef.h:108-194 |
Module | exec |
nb instructions | 133 |
nb uops | 135 |
loop length | 558 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 1 |
used zmm registers | 0 |
nb stack references | 3 |
micro-operation queue | 22.50 cycles |
front end | 22.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 9.60 | 9.67 | 6.00 | 6.00 | 5.50 | 9.53 | 9.60 | 5.50 | 5.50 | 5.50 | 9.60 | 6.00 |
cycles | 9.60 | 9.67 | 6.00 | 6.00 | 5.50 | 9.53 | 9.60 | 5.50 | 5.50 | 5.50 | 9.60 | 6.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 22.35-22.34 |
Stall cycles | 0.00 |
Front-end | 22.50 |
Dispatch | 9.67 |
Overall L1 | 22.50 |
all | 5% |
load | NA (no load vectorizable/vectorized instructions) |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 5% |
all | 80% |
load | 100% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 50% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 100% |
all | 30% |
load | 100% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 50% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 33% |
all | 11% |
load | NA (no load vectorizable/vectorized instructions) |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 22% |
load | 25% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 18% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 25% |
all | 15% |
load | 25% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 18% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x18,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
TEST %R8B,%R8B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41af32 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x422> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RSI,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0xa8(%RBX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4600b0 <_ZNK11qmcplusplus11ParticleSet14getDistTableABEi> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x94(%RBX),%R8D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R8D,%R8D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 41af39 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x429> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R12,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x1fffffffffffffff,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
XOR %R14D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 41abba <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xaa> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x94(%RBX),%R8D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %R8D,%R8D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 41af5c <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x44c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 41b226 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x716> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x38(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %R8D,%R8D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41b226 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x716> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVSXD %R8D,%RAX | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
MOV 0x190(%RBX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%R15),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x1(%RAX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x8(,%RAX,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RDI,%RDI,2),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x10(%RSI,%RDI,1),%R9 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %RDX,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 41afd4 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x4c4> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA 0x10(%RDX,%RDI,1),%RDI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %RSI,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 41afd4 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x4c4> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 41b110 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x600> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R8D,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $0x3,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP $0x4,%R8D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 41afe8 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x4d8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 41b0b6 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x5a6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %RAX,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV $0x58,%R10D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %RDI,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41b110 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x600> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R8,%R8,2),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x10(%RDX,%R8,8),%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA 0x10(%RSI,%R8,8),%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
SAL $0x3,%EDI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
LEA (%RDI,%RDI,2),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x1b8(%RBX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%R14),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RSI,%RCX,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDX,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 41b149 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x639> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%RDX,%RCX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RSI,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 41b149 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x639> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 41b1a7 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x697> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 41b182 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x672> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RCX),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 41b190 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x680> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 41b1a7 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x697> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (,%RAX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %RCX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41b226 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x716> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x1fffffffffffffff,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
MOV 0xf0(%RBX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
AND %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
INC %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0x3ffffffffffffffc,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
AND %RAX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 41b213 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x703> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VEXTRACTF128 $0x1,%YMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VADDPD %XMM1,%XMM0,%XMM0 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VADDSD %XMM1,%XMM0,%XMM0 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
JMP 41b221 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x711> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD 0xe0010(%RIP){1to2},%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVLPD %XMM0,0x10(%RBX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 4-12 | 0.50 |
ADD $0x18,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | OneBodyJastrowRef.h:108-194 |
Module | exec |
nb instructions | 133 |
nb uops | 135 |
loop length | 558 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 1 |
used zmm registers | 0 |
nb stack references | 3 |
micro-operation queue | 22.50 cycles |
front end | 22.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 9.60 | 9.67 | 6.00 | 6.00 | 5.50 | 9.53 | 9.60 | 5.50 | 5.50 | 5.50 | 9.60 | 6.00 |
cycles | 9.60 | 9.67 | 6.00 | 6.00 | 5.50 | 9.53 | 9.60 | 5.50 | 5.50 | 5.50 | 9.60 | 6.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 22.35-22.34 |
Stall cycles | 0.00 |
Front-end | 22.50 |
Dispatch | 9.67 |
Overall L1 | 22.50 |
all | 5% |
load | NA (no load vectorizable/vectorized instructions) |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 5% |
all | 80% |
load | 100% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 50% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 100% |
all | 30% |
load | 100% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 50% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 33% |
all | 11% |
load | NA (no load vectorizable/vectorized instructions) |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 22% |
load | 25% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 18% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 25% |
all | 15% |
load | 25% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 18% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x18,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
TEST %R8B,%R8B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41af32 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x422> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RSI,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0xa8(%RBX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4600b0 <_ZNK11qmcplusplus11ParticleSet14getDistTableABEi> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x94(%RBX),%R8D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R8D,%R8D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 41af39 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x429> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R12,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x1fffffffffffffff,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
XOR %R14D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 41abba <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xaa> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x94(%RBX),%R8D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %R8D,%R8D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 41af5c <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x44c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 41b226 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x716> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x38(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %R8D,%R8D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41b226 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x716> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVSXD %R8D,%RAX | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
MOV 0x190(%RBX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%R15),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x1(%RAX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x8(,%RAX,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RDI,%RDI,2),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x10(%RSI,%RDI,1),%R9 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %RDX,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 41afd4 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x4c4> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA 0x10(%RDX,%RDI,1),%RDI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %RSI,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 41afd4 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x4c4> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 41b110 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x600> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R8D,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $0x3,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP $0x4,%R8D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 41afe8 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x4d8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 41b0b6 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x5a6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %RAX,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV $0x58,%R10D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %RDI,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41b110 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x600> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R8,%R8,2),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x10(%RDX,%R8,8),%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA 0x10(%RSI,%R8,8),%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
SAL $0x3,%EDI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
LEA (%RDI,%RDI,2),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x1b8(%RBX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%R14),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RSI,%RCX,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDX,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 41b149 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x639> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%RDX,%RCX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RSI,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 41b149 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x639> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 41b1a7 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x697> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 41b182 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x672> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RCX),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 41b190 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x680> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 41b1a7 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x697> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (,%RAX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %RCX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41b226 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x716> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x1fffffffffffffff,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
MOV 0xf0(%RBX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
AND %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
INC %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0x3ffffffffffffffc,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
AND %RAX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 41b213 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x703> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VEXTRACTF128 $0x1,%YMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VADDPD %XMM1,%XMM0,%XMM0 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VADDSD %XMM1,%XMM0,%XMM0 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
JMP 41b221 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x711> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD 0xe0010(%RIP){1to2},%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVLPD %XMM0,0x10(%RBX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 4-12 | 0.50 |
ADD $0x18,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼miniqmcreference::OneBodyJastrowRef | 0.02 | 0.02 |
○Loop 287 - OneBodyJastrowRef.h:169-169 - exec | 0 | 0 |
○Loop 281 - OneBodyJastrowRef.h:169-169 - exec | 0 | 0 |
○Loop 284 - stl_numeric.h:126-127 - exec | 0 | 0 |
▼Loop 289 - OneBodyJastrowRef.h:169-169 - exec– | 0 | 0 |
○Loop 288 - TinyVectorOps.h:49-49 - exec | 0 | 0 |
○Loop 285 - OneBodyJastrowRef.h:171-172 - exec | 0 | 0 |
○Loop 286 - OneBodyJastrowRef.h:171-172 - exec | 0 | 0 |
○Loop 282 - OneBodyJastrowRef.h:171-172 - exec | 0 | 0 |
○Loop 283 - OneBodyJastrowRef.h:0-0 - exec | 0 | 0 |
▼Loop 290 - OneBodyJastrowRef.h:109-194 - exec– | 0 | 0 |
○Loop 297 - OneBodyJastrowRef.h:192-193 - exec | 0.01 | 0.01 |
○Loop 300 - OneBodyJastrowRef.h:186-187 - exec | 0 | 0 |
○Loop 302 - stl_numeric.h:126-127 - exec | 0 | 0 |
○Loop 301 - OneBodyJastrowRef.h:0-0 - exec | 0 | 0 |
○Loop 296 - OneBodyJastrowRef.h:192-193 - exec | 0 | 0 |
○Loop 295 - OneBodyJastrowRef.h:192-193 - exec | 0 | 0.01 |
○Loop 293 - OneBodyJastrowRef.h:192-193 - exec | 0 | 0 |
○Loop 294 - OneBodyJastrowRef.h:192-193 - exec | 0 | 0 |
○Loop 292 - OneBodyJastrowRef.h:192-193 - exec | 0 | 0 |
▼Loop 299 - OneBodyJastrowRef.h:188-194 - exec– | 0 | 0 |
○Loop 298 - OneBodyJastrowRef.h:192-193 - exec | 0 | 0 |
○Loop 291 - OneBodyJastrowRef.h:186-187 - exec | 0 | 0 |