Function: _ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLER ... | Module: exec | Source: OneBodyJastrowRef.h:108-194 [...] | Coverage: 0.01% |
---|
Function: _ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLER ... | Module: exec | Source: OneBodyJastrowRef.h:108-194 [...] | Coverage: 0.01% |
---|
/home/eoseret/qaas_runs_CPU_9468/171-145-9236/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/Jastrow/OneBodyJastrowRef.h: 108 - 194 |
-------------------------------------------------------------------------------- |
108: const auto& d_ie = P.getDistTableAB(myTableID); |
109: for (int iat = 0; iat < Nelec; ++iat) |
110: { |
111: computeU3(P, iat, d_ie.getDistRow(iat).data()); |
112: Vat[iat] = std::accumulate(U.begin(), U.begin() + Nions, valT()); |
113: Lap[iat] = accumulateGL(dU.data(), d2U.data(), d_ie.getDisplRow(iat), Grad[iat]); |
[...] |
165: { |
166: if (fromscratch) |
167: recompute(P); |
168: |
169: for (size_t iat = 0; iat < Nelec; ++iat) |
170: G[iat] += Grad[iat]; |
171: for (size_t iat = 0; iat < Nelec; ++iat) |
172: L[iat] -= Lap[iat]; |
173: LogValue = -std::accumulate(Vat.begin(), Vat.begin() + Nelec, valT()); |
174: } |
[...] |
186: for (int jat = 0; jat < Nions; ++jat) |
187: lap += d2u[jat] + lapfac * du[jat]; |
188: for (int idim = 0; idim < OHMMS_DIM; ++idim) |
189: { |
190: const valT* restrict dX = displ.data(idim); |
191: valT s = valT(); |
192: for (int jat = 0; jat < Nions; ++jat) |
193: s += du[jat] * dX[jat]; |
194: grad[idim] = s; |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/stl_numeric.h: 140 - 141 |
-------------------------------------------------------------------------------- |
140: for (; __first != __last; ++__first) |
141: __init = _GLIBCXX_MOVE_IF_20(__init) + *__first; |
/home/eoseret/qaas_runs_CPU_9468/171-145-9236/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/TinyVectorOps.h: 49 - 49 |
-------------------------------------------------------------------------------- |
49: for (unsigned d = 0; d < D; ++d) |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/stl_vector.h: 1064 - 1169 |
-------------------------------------------------------------------------------- |
1064: return *(this->_M_impl._M_start + __n); |
[...] |
1169: { return _M_data_ptr(this->_M_impl._M_start); } |
/home/eoseret/qaas_runs_CPU_9468/171-145-9236/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/TinyVector.h: 169 - 170 |
-------------------------------------------------------------------------------- |
169: inline Type_t& operator[](unsigned int i) { return X[i]; } |
170: inline const Type_t& operator[](unsigned int i) const { return X[i]; } |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/stl_iterator.h: 1028 - 1182 |
-------------------------------------------------------------------------------- |
1028: : _M_current(__i) { } |
[...] |
1182: { return __lhs.base() != __rhs.base(); } |
/home/eoseret/qaas_runs_CPU_9468/171-145-9236/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/OhmmsVector.h: 223 - 249 |
-------------------------------------------------------------------------------- |
223: return X[i]; |
[...] |
242: inline iterator begin() { return X; } |
[...] |
249: inline const_pointer data() const { return X; } |
/home/eoseret/qaas_runs_CPU_9468/171-145-9236/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/VectorSoAContainer.h: 273 - 273 |
-------------------------------------------------------------------------------- |
273: inline const T* restrict data(size_t i) const { return myData + i * nGhosts; } |
/home/eoseret/qaas_runs_CPU_9468/171-145-9236/intel/miniqmc/build/miniqmc/src/Numerics/PETE/OperatorTags.h: 94 - 94 |
-------------------------------------------------------------------------------- |
94: (const_cast<T1&>(a) += b); |
0x41aa80 PUSH %RBP |
0x41aa81 MOV %RSP,%RBP |
0x41aa84 PUSH %R15 |
0x41aa86 PUSH %R14 |
0x41aa88 PUSH %R13 |
0x41aa8a PUSH %R12 |
0x41aa8c PUSH %RBX |
0x41aa8d SUB $0x18,%RSP |
0x41aa91 MOV %RCX,%R14 |
0x41aa94 MOV %RDX,%R15 |
0x41aa97 MOV %RDI,%RBX |
0x41aa9a TEST %R8B,%R8B |
0x41aa9d JE 41ae9f |
0x41aaa3 MOV %RSI,%R12 |
0x41aaa6 MOV 0xa8(%RBX),%ESI |
0x41aaac MOV %R12,%RDI |
0x41aaaf CALL 461820 <_ZNK11qmcplusplus11ParticleSet14getDistTableABEi> |
0x41aab4 MOV %RAX,%R13 |
0x41aab7 MOV 0x94(%RBX),%EAX |
0x41aabd TEST %EAX,%EAX |
0x41aabf JLE 41aea5 |
0x41aac5 MOV %R12,-0x40(%RBP) |
0x41aac9 MOV %R15,-0x30(%RBP) |
0x41aacd MOV %R14,-0x38(%RBP) |
0x41aad1 MOV $0x1fffffffffffffff,%R15 |
0x41aadb XOR %R14D,%R14D |
0x41aade JMP 41ab1a |
(275) 0x41aae0 LEA (%R14,%R14,2),%RAX |
(275) 0x41aae4 VXORPD %XMM0,%XMM0,%XMM0 |
(275) 0x41aae8 VMOVUPD %XMM0,(%RDX,%RAX,8) |
(275) 0x41aaed MOVQ $0,0x10(%RDX,%RAX,8) |
(275) 0x41aaf6 VXORPD %XMM0,%XMM0,%XMM0 |
(275) 0x41aafa MOV 0x1b8(%RBX),%RAX |
(275) 0x41ab01 VMOVSD %XMM0,(%RAX,%R14,8) |
(275) 0x41ab07 INC %R14 |
(275) 0x41ab0a MOVSXD 0x94(%RBX),%RAX |
(275) 0x41ab11 CMP %RAX,%R14 |
(275) 0x41ab14 JGE 41aeb2 |
(275) 0x41ab1a MOV 0x48(%R13),%RAX |
(275) 0x41ab1e LEA (%R14,%R14,4),%R12 |
(275) 0x41ab22 MOV 0x18(%RAX,%R12,8),%RCX |
(275) 0x41ab27 MOV %RBX,%RDI |
(275) 0x41ab2a MOV -0x40(%RBP),%RSI |
(275) 0x41ab2e MOV %R14D,%EDX |
(275) 0x41ab31 VZEROUPPER |
(275) 0x41ab34 CALL 41cd50 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE9computeU3ERNS1_11ParticleSetEiPKd> |
(275) 0x41ab39 MOVSXD 0x90(%RBX),%RAX |
(275) 0x41ab40 TEST %R15,%RAX |
(275) 0x41ab43 JE 41abb0 |
(275) 0x41ab45 MOV 0x100(%RBX),%RCX |
(275) 0x41ab4c LEA (%RAX,%R15,1),%RDX |
(275) 0x41ab50 AND %R15,%RDX |
(275) 0x41ab53 INC %RDX |
(275) 0x41ab56 MOV %RDX,%RSI |
(275) 0x41ab59 MOV $0x3ffffffffffffffc,%RDI |
(275) 0x41ab63 AND %RDI,%RSI |
(275) 0x41ab66 JE 41abd0 |
(275) 0x41ab68 VXORPD %XMM0,%XMM0,%XMM0 |
(275) 0x41ab6c XOR %EDI,%EDI |
(275) 0x41ab6e XCHG %AX,%AX |
(287) 0x41ab70 VADDPD (%RCX,%RDI,8),%YMM0,%YMM0 |
(287) 0x41ab75 ADD $0x4,%RDI |
(287) 0x41ab79 CMP %RSI,%RDI |
(287) 0x41ab7c JB 41ab70 |
(275) 0x41ab7e VEXTRACTF128 $0x1,%YMM0,%XMM1 |
(275) 0x41ab84 VADDPD %XMM1,%XMM0,%XMM0 |
(275) 0x41ab88 VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(275) 0x41ab8d VADDSD %XMM1,%XMM0,%XMM0 |
(275) 0x41ab91 CMP %RSI,%RDX |
(275) 0x41ab94 VMOVSD 0xdb71c(%RIP),%XMM2 |
(275) 0x41ab9c VBROADCASTSD 0xdb713(%RIP),%YMM1 |
(275) 0x41aba5 JNE 41abf0 |
(275) 0x41aba7 JMP 41abfd |
0x41aba9 NOPL (%RAX) |
(275) 0x41abb0 VXORPD %XMM0,%XMM0,%XMM0 |
(275) 0x41abb4 VMOVSD 0xdb6fc(%RIP),%XMM2 |
(275) 0x41abbc VBROADCASTSD 0xdb6f3(%RIP),%YMM1 |
(275) 0x41abc5 JMP 41abfd |
0x41abc7 NOPW (%RAX,%RAX,1) |
(275) 0x41abd0 VXORPD %XMM0,%XMM0,%XMM0 |
(275) 0x41abd4 XOR %ESI,%ESI |
(275) 0x41abd6 VMOVSD 0xdb6da(%RIP),%XMM2 |
(275) 0x41abde VBROADCASTSD 0xdb6d1(%RIP),%YMM1 |
(275) 0x41abe7 NOPW (%RAX,%RAX,1) |
(286) 0x41abf0 VADDSD (%RCX,%RSI,8),%XMM0,%XMM0 |
(286) 0x41abf5 INC %RSI |
(286) 0x41abf8 CMP %RSI,%RDX |
(286) 0x41abfb JNE 41abf0 |
(275) 0x41abfd MOV 0xf0(%RBX),%RCX |
(275) 0x41ac04 VMOVSD %XMM0,(%RCX,%R14,8) |
(275) 0x41ac0a MOV 0x190(%RBX),%RDX |
(275) 0x41ac11 TEST %EAX,%EAX |
(275) 0x41ac13 JLE 41aae0 |
(275) 0x41ac19 MOV 0x118(%RBX),%RCX |
(275) 0x41ac20 MOV 0x130(%RBX),%RDI |
(275) 0x41ac27 MOV %RAX,%RSI |
(275) 0x41ac2a AND $-0x4,%RSI |
(275) 0x41ac2e JE 41ac80 |
(275) 0x41ac30 VXORPD %XMM0,%XMM0,%XMM0 |
(275) 0x41ac34 XOR %R8D,%R8D |
(275) 0x41ac37 NOPW (%RAX,%RAX,1) |
(285) 0x41ac40 VADDPD (%RDI,%R8,8),%YMM0,%YMM0 |
(285) 0x41ac46 VFMADD231PD (%RCX,%R8,8),%YMM1,%YMM0 |
(285) 0x41ac4c ADD $0x4,%R8 |
(285) 0x41ac50 CMP %RSI,%R8 |
(285) 0x41ac53 JL 41ac40 |
(275) 0x41ac55 VEXTRACTF128 $0x1,%YMM0,%XMM1 |
(275) 0x41ac5b VADDPD %XMM1,%XMM0,%XMM0 |
(275) 0x41ac5f VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(275) 0x41ac64 VADDSD %XMM1,%XMM0,%XMM0 |
(275) 0x41ac68 MOV %RSI,%R8 |
(275) 0x41ac6b CMP %RAX,%RSI |
(275) 0x41ac6e JNE 41ac90 |
(275) 0x41ac70 JMP 41aca4 |
0x41ac72 NOPW %CS:(%RAX,%RAX,1) |
(275) 0x41ac80 VXORPD %XMM0,%XMM0,%XMM0 |
(275) 0x41ac84 XOR %R8D,%R8D |
(275) 0x41ac87 NOPW (%RAX,%RAX,1) |
(276) 0x41ac90 VADDSD (%RDI,%R8,8),%XMM0,%XMM0 |
(276) 0x41ac96 VFMADD231SD (%RCX,%R8,8),%XMM2,%XMM0 |
(276) 0x41ac9c INC %R8 |
(276) 0x41ac9f CMP %R8,%RAX |
(276) 0x41aca2 JNE 41ac90 |
(275) 0x41aca4 MOV 0x60(%R13),%RDI |
(275) 0x41aca8 MOV 0x8(%RDI,%R12,8),%R8 |
(275) 0x41acad MOV 0x18(%RDI,%R12,8),%RDI |
(275) 0x41acb2 MOV %R8,%R9 |
(275) 0x41acb5 SAR $0x3f,%R9 |
(275) 0x41acb9 ANDN %R8,%R9,%R9 |
(275) 0x41acbe TEST %R8,%R8 |
(275) 0x41acc1 LEA (%RAX,%R9,2),%R9 |
(275) 0x41acc5 LEA -0x8(%RDI,%R9,8),%R12 |
(275) 0x41acca LEA (%R14,%R14,2),%R9 |
(275) 0x41acce LEA (%RDX,%R9,8),%R10 |
(275) 0x41acd2 MOV $0,%R11D |
(275) 0x41acd8 CMOVS %R8,%R11 |
(275) 0x41acdc CMP %R10,%R12 |
(275) 0x41acdf JB 41ad40 |
(275) 0x41ace1 SAL $0x4,%R11 |
(275) 0x41ace5 ADD %RDI,%R11 |
(275) 0x41ace8 LEA (%RDX,%R9,8),%R12 |
(275) 0x41acec ADD $0x10,%R12 |
(275) 0x41acf0 CMP %R11,%R12 |
(275) 0x41acf3 JB 41ad40 |
(275) 0x41acf5 SAL $0x3,%R8 |
(275) 0x41acf9 XOR %EDX,%EDX |
(275) 0x41acfb NOPL (%RAX,%RAX,1) |
(284) 0x41ad00 VXORPD %XMM1,%XMM1,%XMM1 |
(284) 0x41ad04 XOR %ESI,%ESI |
(284) 0x41ad06 NOPW %CS:(%RAX,%RAX,1) |
(283) 0x41ad10 VMOVSD (%RDI,%RSI,8),%XMM2 |
(283) 0x41ad15 VFMADD231SD (%RCX,%RSI,8),%XMM2,%XMM1 |
(283) 0x41ad1b INC %RSI |
(283) 0x41ad1e CMP %RSI,%RAX |
(283) 0x41ad21 JNE 41ad10 |
(284) 0x41ad23 VMOVSD %XMM1,(%R10,%RDX,8) |
(284) 0x41ad29 ADD %R8,%RDI |
(284) 0x41ad2c CMP $0x2,%RDX |
(284) 0x41ad30 LEA 0x1(%RDX),%RDX |
(284) 0x41ad34 JNE 41ad00 |
(275) 0x41ad36 JMP 41aafa |
0x41ad3b NOPL (%RAX,%RAX,1) |
(275) 0x41ad40 TEST %RSI,%RSI |
(275) 0x41ad43 JE 41ad82 |
(275) 0x41ad45 VXORPD %XMM1,%XMM1,%XMM1 |
(275) 0x41ad49 XOR %R10D,%R10D |
(275) 0x41ad4c NOPL (%RAX) |
(282) 0x41ad50 VMOVUPD (%RDI,%R10,8),%YMM2 |
(282) 0x41ad56 VFMADD231PD (%RCX,%R10,8),%YMM2,%YMM1 |
(282) 0x41ad5c ADD $0x4,%R10 |
(282) 0x41ad60 CMP %RSI,%R10 |
(282) 0x41ad63 JL 41ad50 |
(275) 0x41ad65 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(275) 0x41ad6b VADDPD %XMM2,%XMM1,%XMM1 |
(275) 0x41ad6f VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(275) 0x41ad74 VADDSD %XMM2,%XMM1,%XMM1 |
(275) 0x41ad78 MOV %RSI,%R10 |
(275) 0x41ad7b CMP %RAX,%RSI |
(275) 0x41ad7e JNE 41ad90 |
(275) 0x41ad80 JMP 41ada4 |
(275) 0x41ad82 VXORPD %XMM1,%XMM1,%XMM1 |
(275) 0x41ad86 XOR %R10D,%R10D |
(275) 0x41ad89 NOPL (%RAX) |
(277) 0x41ad90 VMOVSD (%RDI,%R10,8),%XMM2 |
(277) 0x41ad96 VFMADD231SD (%RCX,%R10,8),%XMM2,%XMM1 |
(277) 0x41ad9c INC %R10 |
(277) 0x41ad9f CMP %R10,%RAX |
(277) 0x41ada2 JNE 41ad90 |
(275) 0x41ada4 VMOVSD %XMM1,(%RDX,%R9,8) |
(275) 0x41adaa TEST %RSI,%RSI |
(275) 0x41adad JE 41adf2 |
(275) 0x41adaf LEA (%RDI,%R8,8),%R10 |
(275) 0x41adb3 VXORPD %XMM1,%XMM1,%XMM1 |
(275) 0x41adb7 XOR %R11D,%R11D |
(275) 0x41adba NOPW (%RAX,%RAX,1) |
(281) 0x41adc0 VMOVUPD (%R10,%R11,8),%YMM2 |
(281) 0x41adc6 VFMADD231PD (%RCX,%R11,8),%YMM2,%YMM1 |
(281) 0x41adcc ADD $0x4,%R11 |
(281) 0x41add0 CMP %RSI,%R11 |
(281) 0x41add3 JL 41adc0 |
(275) 0x41add5 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(275) 0x41addb VADDPD %XMM2,%XMM1,%XMM1 |
(275) 0x41addf VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(275) 0x41ade4 VADDSD %XMM2,%XMM1,%XMM1 |
(275) 0x41ade8 MOV %RSI,%R10 |
(275) 0x41adeb CMP %RAX,%RSI |
(275) 0x41adee JNE 41adf9 |
(275) 0x41adf0 JMP 41ae14 |
(275) 0x41adf2 VXORPD %XMM1,%XMM1,%XMM1 |
(275) 0x41adf6 XOR %R10D,%R10D |
(275) 0x41adf9 LEA (%RDI,%R8,8),%R11 |
(275) 0x41adfd NOPL (%RAX) |
(278) 0x41ae00 VMOVSD (%R11,%R10,8),%XMM2 |
(278) 0x41ae06 VFMADD231SD (%RCX,%R10,8),%XMM2,%XMM1 |
(278) 0x41ae0c INC %R10 |
(278) 0x41ae0f CMP %R10,%RAX |
(278) 0x41ae12 JNE 41ae00 |
(275) 0x41ae14 VMOVSD %XMM1,0x8(%RDX,%R9,8) |
(275) 0x41ae1b TEST %RSI,%RSI |
(275) 0x41ae1e JE 41ae6f |
(275) 0x41ae20 MOV %R8,%R10 |
(275) 0x41ae23 SAL $0x4,%R10 |
(275) 0x41ae27 ADD %RDI,%R10 |
(275) 0x41ae2a VXORPD %XMM1,%XMM1,%XMM1 |
(275) 0x41ae2e XOR %R11D,%R11D |
(275) 0x41ae31 NOPW %CS:(%RAX,%RAX,1) |
(280) 0x41ae40 VMOVUPD (%R10,%R11,8),%YMM2 |
(280) 0x41ae46 VFMADD231PD (%RCX,%R11,8),%YMM2,%YMM1 |
(280) 0x41ae4c ADD $0x4,%R11 |
(280) 0x41ae50 CMP %RSI,%R11 |
(280) 0x41ae53 JL 41ae40 |
(275) 0x41ae55 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(275) 0x41ae5b VADDPD %XMM2,%XMM1,%XMM1 |
(275) 0x41ae5f VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(275) 0x41ae64 VADDSD %XMM2,%XMM1,%XMM1 |
(275) 0x41ae68 CMP %RAX,%RSI |
(275) 0x41ae6b JNE 41ae75 |
(275) 0x41ae6d JMP 41ae93 |
(275) 0x41ae6f VXORPD %XMM1,%XMM1,%XMM1 |
(275) 0x41ae73 XOR %ESI,%ESI |
(275) 0x41ae75 SAL $0x4,%R8 |
(275) 0x41ae79 ADD %R8,%RDI |
(275) 0x41ae7c NOPL (%RAX) |
(279) 0x41ae80 VMOVSD (%RDI,%RSI,8),%XMM2 |
(279) 0x41ae85 VFMADD231SD (%RCX,%RSI,8),%XMM2,%XMM1 |
(279) 0x41ae8b INC %RSI |
(279) 0x41ae8e CMP %RSI,%RAX |
(279) 0x41ae91 JNE 41ae80 |
(275) 0x41ae93 VMOVSD %XMM1,0x10(%RDX,%R9,8) |
(275) 0x41ae9a JMP 41aafa |
0x41ae9f MOV 0x94(%RBX),%EAX |
0x41aea5 VXORPD %XMM0,%XMM0,%XMM0 |
0x41aea9 TEST %EAX,%EAX |
0x41aeab JNE 41aec6 |
0x41aead JMP 41b116 |
0x41aeb2 MOV -0x38(%RBP),%R14 |
0x41aeb6 MOV -0x30(%RBP),%R15 |
0x41aeba VXORPD %XMM0,%XMM0,%XMM0 |
0x41aebe TEST %EAX,%EAX |
0x41aec0 JE 41b116 |
0x41aec6 CLTQ |
0x41aec8 MOV 0x190(%RBX),%RDX |
0x41aecf MOV 0x18(%R15),%RSI |
0x41aed3 LEA -0x1(%RAX),%RCX |
0x41aed7 LEA -0x8(,%RAX,8),%RDI |
0x41aedf LEA (%RDI,%RDI,2),%RDI |
0x41aee3 LEA (%RSI,%RDI,1),%R8 |
0x41aee7 ADD $0x10,%R8 |
0x41aeeb CMP %RDX,%R8 |
0x41aeee JB 41af41 |
0x41aef0 ADD %RDX,%RDI |
0x41aef3 ADD $0x10,%RDI |
0x41aef7 CMP %RSI,%RDI |
0x41aefa JB 41af41 |
0x41aefc XOR %EDI,%EDI |
0x41aefe XCHG %AX,%AX |
(274) 0x41af00 XOR %R8D,%R8D |
(274) 0x41af03 NOPW %CS:(%RAX,%RAX,1) |
(273) 0x41af10 VMOVSD (%RSI,%R8,8),%XMM1 |
(273) 0x41af16 VADDSD (%RDX,%R8,8),%XMM1,%XMM1 |
(273) 0x41af1c VMOVSD %XMM1,(%RSI,%R8,8) |
(273) 0x41af22 INC %R8 |
(273) 0x41af25 CMP $0x3,%R8 |
(273) 0x41af29 JNE 41af10 |
(274) 0x41af2b ADD $0x18,%RDX |
(274) 0x41af2f ADD $0x18,%RSI |
(274) 0x41af33 CMP %RCX,%RDI |
(274) 0x41af36 LEA 0x1(%RDI),%RDI |
(274) 0x41af3a JNE 41af00 |
0x41af3c JMP 41afeb |
0x41af41 TEST %RCX,%RCX |
0x41af44 JE 41b062 |
0x41af4a MOV %RAX,%R8 |
0x41af4d AND $-0x2,%R8 |
0x41af51 MOV $0x28,%R9D |
0x41af57 XOR %EDI,%EDI |
0x41af59 NOPL (%RAX) |
(272) 0x41af60 VMOVUPD -0x28(%RSI,%R9,1),%XMM1 |
(272) 0x41af67 VADDPD -0x28(%RDX,%R9,1),%XMM1,%XMM1 |
(272) 0x41af6e VMOVUPD %XMM1,-0x28(%RSI,%R9,1) |
(272) 0x41af75 VMOVSD -0x18(%RSI,%R9,1),%XMM1 |
(272) 0x41af7c VADDSD -0x18(%RDX,%R9,1),%XMM1,%XMM1 |
(272) 0x41af83 VMOVSD %XMM1,-0x18(%RSI,%R9,1) |
(272) 0x41af8a VMOVUPD -0x10(%RSI,%R9,1),%XMM1 |
(272) 0x41af91 VADDPD -0x10(%RDX,%R9,1),%XMM1,%XMM1 |
(272) 0x41af98 VMOVUPD %XMM1,-0x10(%RSI,%R9,1) |
(272) 0x41af9f VMOVSD (%RSI,%R9,1),%XMM1 |
(272) 0x41afa5 VADDSD (%RDX,%R9,1),%XMM1,%XMM1 |
(272) 0x41afab VMOVSD %XMM1,(%RSI,%R9,1) |
(272) 0x41afb1 ADD $0x2,%RDI |
(272) 0x41afb5 ADD $0x30,%R9 |
(272) 0x41afb9 CMP %RDI,%R8 |
(272) 0x41afbc JNE 41af60 |
0x41afbe TEST $0x1,%AL |
0x41afc0 JE 41afeb |
0x41afc2 SAL $0x3,%RDI |
0x41afc6 LEA (%RDI,%RDI,2),%RDI |
0x41afca VMOVUPD (%RSI,%RDI,1),%XMM1 |
0x41afcf VADDPD (%RDX,%RDI,1),%XMM1,%XMM1 |
0x41afd4 VMOVUPD %XMM1,(%RSI,%RDI,1) |
0x41afd9 VMOVSD 0x10(%RSI,%RDI,1),%XMM1 |
0x41afdf VADDSD 0x10(%RDX,%RDI,1),%XMM1,%XMM1 |
0x41afe5 VMOVSD %XMM1,0x10(%RSI,%RDI,1) |
0x41afeb MOV 0x1b8(%RBX),%RDX |
0x41aff2 MOV 0x18(%R14),%RSI |
0x41aff6 LEA (%RSI,%RCX,8),%RDI |
0x41affa CMP %RDX,%RDI |
0x41affd JB 41b029 |
0x41afff LEA (%RDX,%RCX,8),%RCX |
0x41b003 CMP %RSI,%RCX |
0x41b006 JB 41b029 |
0x41b008 XOR %ECX,%ECX |
0x41b00a NOPW (%RAX,%RAX,1) |
(271) 0x41b010 VMOVSD (%RSI,%RCX,8),%XMM1 |
(271) 0x41b015 VSUBSD (%RDX,%RCX,8),%XMM1,%XMM1 |
(271) 0x41b01a VMOVSD %XMM1,(%RSI,%RCX,8) |
(271) 0x41b01f INC %RCX |
(271) 0x41b022 CMP %RCX,%RAX |
(271) 0x41b025 JNE 41b010 |
0x41b027 JMP 41b097 |
0x41b029 MOV %RAX,%RCX |
0x41b02c AND $-0x4,%RCX |
0x41b030 JE 41b071 |
0x41b032 LEA -0x1(%RCX),%RDI |
0x41b036 XOR %R8D,%R8D |
0x41b039 NOPL (%RAX) |
(270) 0x41b040 VMOVUPD (%RSI,%R8,8),%YMM1 |
(270) 0x41b046 VSUBPD (%RDX,%R8,8),%YMM1,%YMM1 |
(270) 0x41b04c VMOVUPD %YMM1,(%RSI,%R8,8) |
(270) 0x41b052 ADD $0x4,%R8 |
(270) 0x41b056 CMP %RDI,%R8 |
(270) 0x41b059 JBE 41b040 |
0x41b05b CMP %RAX,%RCX |
0x41b05e JNE 41b080 |
0x41b060 JMP 41b097 |
0x41b062 XOR %EDI,%EDI |
0x41b064 TEST $0x1,%AL |
0x41b066 JNE 41afc2 |
0x41b06c JMP 41afeb |
0x41b071 XOR %ECX,%ECX |
0x41b073 NOPW %CS:(%RAX,%RAX,1) |
(267) 0x41b080 VMOVSD (%RSI,%RCX,8),%XMM1 |
(267) 0x41b085 VSUBSD (%RDX,%RCX,8),%XMM1,%XMM1 |
(267) 0x41b08a VMOVSD %XMM1,(%RSI,%RCX,8) |
(267) 0x41b08f INC %RCX |
(267) 0x41b092 CMP %RCX,%RAX |
(267) 0x41b095 JNE 41b080 |
0x41b097 LEA (,%RAX,8),%RCX |
0x41b09f TEST %RCX,%RCX |
0x41b0a2 JE 41b116 |
0x41b0a4 MOV $0x1fffffffffffffff,%RDX |
0x41b0ae MOV 0xf0(%RBX),%RCX |
0x41b0b5 ADD %RDX,%RAX |
0x41b0b8 AND %RDX,%RAX |
0x41b0bb INC %RAX |
0x41b0be MOV $0x3ffffffffffffffc,%RDX |
0x41b0c8 AND %RAX,%RDX |
0x41b0cb JE 41b103 |
0x41b0cd VXORPD %XMM0,%XMM0,%XMM0 |
0x41b0d1 XOR %ESI,%ESI |
0x41b0d3 NOPW %CS:(%RAX,%RAX,1) |
(269) 0x41b0e0 VADDPD (%RCX,%RSI,8),%YMM0,%YMM0 |
(269) 0x41b0e5 ADD $0x4,%RSI |
(269) 0x41b0e9 CMP %RDX,%RSI |
(269) 0x41b0ec JB 41b0e0 |
0x41b0ee VEXTRACTF128 $0x1,%YMM0,%XMM1 |
0x41b0f4 VADDPD %XMM1,%XMM0,%XMM0 |
0x41b0f8 VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
0x41b0fd VADDSD %XMM1,%XMM0,%XMM0 |
0x41b101 JMP 41b111 |
0x41b103 XOR %EDX,%EDX |
0x41b105 VXORPD %XMM0,%XMM0,%XMM0 |
(268) 0x41b109 VADDSD (%RCX,%RDX,8),%XMM0,%XMM0 |
(268) 0x41b10e INC %RDX |
(268) 0x41b111 CMP %RDX,%RAX |
(268) 0x41b114 JNE 41b109 |
0x41b116 VXORPD 0xd9f82(%RIP),%XMM0,%XMM0 |
0x41b11e VMOVLPD %XMM0,0x10(%RBX) |
0x41b123 ADD $0x18,%RSP |
0x41b127 POP %RBX |
0x41b128 POP %R12 |
0x41b12a POP %R13 |
0x41b12c POP %R14 |
0x41b12e POP %R15 |
0x41b130 POP %RBP |
0x41b131 VZEROUPPER |
0x41b134 RET |
0x41b135 NOPW %CS:(%RAX,%RAX,1) |
0x41b13f NOP |
Path / |
Source file and lines | OneBodyJastrowRef.h:108-194 |
Module | exec |
nb instructions | 135 |
nb uops | 137 |
loop length | 550 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 1 |
used zmm registers | 0 |
nb stack references | 3 |
micro-operation queue | 23.17 cycles |
front end | 23.17 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 9.70 | 9.57 | 7.33 | 7.33 | 6.50 | 9.63 | 9.50 | 6.50 | 6.50 | 6.50 | 9.60 | 7.33 |
cycles | 9.70 | 9.57 | 7.33 | 7.33 | 6.50 | 9.63 | 9.50 | 6.50 | 6.50 | 6.50 | 9.60 | 7.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 23.00 |
Stall cycles | 0.00 |
Front-end | 23.17 |
Dispatch | 9.70 |
Overall L1 | 23.17 |
all | 4% |
load | NA (no load vectorizable/vectorized instructions) |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 5% |
all | 68% |
load | 60% |
store | 33% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 50% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 100% |
all | 31% |
load | 60% |
store | 16% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 40% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 32% |
all | 11% |
load | NA (no load vectorizable/vectorized instructions) |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 21% |
load | 20% |
store | 16% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 18% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 25% |
all | 15% |
load | 20% |
store | 14% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 17% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x18,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
TEST %R8B,%R8B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41ae9f <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x41f> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RSI,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0xa8(%RBX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 461820 <_ZNK11qmcplusplus11ParticleSet14getDistTableABEi> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x94(%RBX),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %EAX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 41aea5 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x425> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x1fffffffffffffff,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
XOR %R14D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 41ab1a <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x9a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x94(%RBX),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %EAX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 41aec6 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x446> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 41b116 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x696> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x38(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %EAX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41b116 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x696> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CLTQ | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV 0x190(%RBX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%R15),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x1(%RAX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x8(,%RAX,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RDI,%RDI,2),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RSI,%RDI,1),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD $0x10,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RDX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 41af41 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x4c1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD %RDX,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD $0x10,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RSI,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 41af41 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x4c1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 41afeb <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x56b> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
TEST %RCX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41b062 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x5e2> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x2,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV $0x28,%R9D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST $0x1,%AL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41afeb <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x56b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SAL $0x3,%RDI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
LEA (%RDI,%RDI,2),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVUPD (%RSI,%RDI,1),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VADDPD (%RDX,%RDI,1),%XMM1,%XMM1 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVUPD %XMM1,(%RSI,%RDI,1) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x10(%RSI,%RDI,1),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD 0x10(%RDX,%RDI,1),%XMM1,%XMM1 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM1,0x10(%RSI,%RDI,1) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x1b8(%RBX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%R14),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RSI,%RCX,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDX,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 41b029 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x5a9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%RDX,%RCX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RSI,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 41b029 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x5a9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 41b097 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x617> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 41b071 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x5f1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RCX),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 41b080 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x600> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 41b097 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x617> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST $0x1,%AL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 41afc2 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x542> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 41afeb <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x56b> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (,%RAX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %RCX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41b116 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x696> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x1fffffffffffffff,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
MOV 0xf0(%RBX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
AND %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
INC %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0x3ffffffffffffffc,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
AND %RAX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 41b103 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x683> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VEXTRACTF128 $0x1,%YMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VADDPD %XMM1,%XMM0,%XMM0 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VADDSD %XMM1,%XMM0,%XMM0 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
JMP 41b111 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x691> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD 0xd9f82(%RIP),%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVLPD %XMM0,0x10(%RBX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 4-12 | 0.50 |
ADD $0x18,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | OneBodyJastrowRef.h:108-194 |
Module | exec |
nb instructions | 135 |
nb uops | 137 |
loop length | 550 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 1 |
used zmm registers | 0 |
nb stack references | 3 |
micro-operation queue | 23.17 cycles |
front end | 23.17 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 9.70 | 9.57 | 7.33 | 7.33 | 6.50 | 9.63 | 9.50 | 6.50 | 6.50 | 6.50 | 9.60 | 7.33 |
cycles | 9.70 | 9.57 | 7.33 | 7.33 | 6.50 | 9.63 | 9.50 | 6.50 | 6.50 | 6.50 | 9.60 | 7.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 23.00 |
Stall cycles | 0.00 |
Front-end | 23.17 |
Dispatch | 9.70 |
Overall L1 | 23.17 |
all | 4% |
load | NA (no load vectorizable/vectorized instructions) |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 5% |
all | 68% |
load | 60% |
store | 33% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 50% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 100% |
all | 31% |
load | 60% |
store | 16% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 40% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 32% |
all | 11% |
load | NA (no load vectorizable/vectorized instructions) |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 21% |
load | 20% |
store | 16% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 18% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 25% |
all | 15% |
load | 20% |
store | 14% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 17% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x18,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
TEST %R8B,%R8B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41ae9f <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x41f> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RSI,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0xa8(%RBX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 461820 <_ZNK11qmcplusplus11ParticleSet14getDistTableABEi> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x94(%RBX),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %EAX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 41aea5 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x425> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x1fffffffffffffff,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
XOR %R14D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 41ab1a <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x9a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x94(%RBX),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %EAX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 41aec6 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x446> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 41b116 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x696> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x38(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %EAX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41b116 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x696> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CLTQ | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV 0x190(%RBX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%R15),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x1(%RAX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x8(,%RAX,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RDI,%RDI,2),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RSI,%RDI,1),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD $0x10,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RDX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 41af41 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x4c1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD %RDX,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD $0x10,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RSI,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 41af41 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x4c1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 41afeb <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x56b> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
TEST %RCX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41b062 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x5e2> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x2,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV $0x28,%R9D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST $0x1,%AL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41afeb <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x56b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SAL $0x3,%RDI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
LEA (%RDI,%RDI,2),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVUPD (%RSI,%RDI,1),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VADDPD (%RDX,%RDI,1),%XMM1,%XMM1 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVUPD %XMM1,(%RSI,%RDI,1) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x10(%RSI,%RDI,1),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD 0x10(%RDX,%RDI,1),%XMM1,%XMM1 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM1,0x10(%RSI,%RDI,1) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x1b8(%RBX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%R14),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RSI,%RCX,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDX,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 41b029 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x5a9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%RDX,%RCX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RSI,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 41b029 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x5a9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 41b097 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x617> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 41b071 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x5f1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RCX),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 41b080 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x600> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 41b097 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x617> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST $0x1,%AL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 41afc2 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x542> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 41afeb <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x56b> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (,%RAX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %RCX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41b116 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x696> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x1fffffffffffffff,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
MOV 0xf0(%RBX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
AND %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
INC %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0x3ffffffffffffffc,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
AND %RAX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 41b103 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x683> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VEXTRACTF128 $0x1,%YMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VADDPD %XMM1,%XMM0,%XMM0 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VADDSD %XMM1,%XMM0,%XMM0 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
JMP 41b111 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x691> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD 0xd9f82(%RIP),%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVLPD %XMM0,0x10(%RBX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 4-12 | 0.50 |
ADD $0x18,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb– | 0.01 | 0.01 |
○Loop 270 - OneBodyJastrowRef.h:171-172 - exec | 0 | 0 |
▼Loop 274 - OneBodyJastrowRef.h:169-169 - exec– | 0 | 0 |
○Loop 273 - TinyVectorOps.h:49-49 - exec | 0 | 0 |
▼Loop 275 - OneBodyJastrowRef.h:109-194 - exec– | 0 | 0 |
○Loop 287 - stl_numeric.h:140-141 - exec | 0 | 0 |
○Loop 279 - OneBodyJastrowRef.h:192-193 - exec | 0 | 0 |
▼Loop 284 - OneBodyJastrowRef.h:188-194 - exec– | 0 | 0 |
○Loop 283 - OneBodyJastrowRef.h:192-193 - exec | 0 | 0 |
○Loop 277 - OneBodyJastrowRef.h:192-193 - exec | 0 | 0 |
○Loop 280 - OneBodyJastrowRef.h:192-193 - exec | 0 | 0 |
○Loop 281 - OneBodyJastrowRef.h:192-193 - exec | 0 | 0 |
○Loop 282 - OneBodyJastrowRef.h:192-193 - exec | 0 | 0 |
○Loop 285 - OneBodyJastrowRef.h:186-187 - exec | 0 | 0 |
○Loop 276 - OneBodyJastrowRef.h:186-187 - exec | 0 | 0 |
○Loop 286 - stl_numeric.h:140-141 - exec | 0 | 0 |
○Loop 278 - OneBodyJastrowRef.h:192-193 - exec | 0 | 0 |
○Loop 272 - OneBodyJastrowRef.h:169-169 - exec | 0 | 0 |
○Loop 267 - OneBodyJastrowRef.h:171-172 - exec | 0 | 0 |
○Loop 268 - OneBodyJastrowRef.h:0-0 - exec | 0 | 0 |
○Loop 269 - stl_numeric.h:140-141 - exec | 0 | 0 |
○Loop 271 - OneBodyJastrowRef.h:171-172 - exec | 0 | 0 |