Function: miniqmcreference::OneBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evaluateGL(qmcp ... | Module: exec | Source: OneBodyJastrowRef.h:108-194 [...] | Coverage: 0.02% |
---|
Function: miniqmcreference::OneBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evaluateGL(qmcp ... | Module: exec | Source: OneBodyJastrowRef.h:108-194 [...] | Coverage: 0.02% |
---|
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/VectorSoAContainer.h: 273 - 273 |
-------------------------------------------------------------------------------- |
273: inline const T* restrict data(size_t i) const { return myData + i * nGhosts; } |
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/TinyVectorOps.h: 49 - 49 |
-------------------------------------------------------------------------------- |
49: for (unsigned d = 0; d < D; ++d) |
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/OhmmsVector.h: 223 - 249 |
-------------------------------------------------------------------------------- |
223: return X[i]; |
[...] |
242: inline iterator begin() { return X; } |
[...] |
249: inline const_pointer data() const { return X; } |
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/Jastrow/OneBodyJastrowRef.h: 108 - 194 |
-------------------------------------------------------------------------------- |
108: const auto& d_ie = P.getDistTableAB(myTableID); |
109: for (int iat = 0; iat < Nelec; ++iat) |
110: { |
111: computeU3(P, iat, d_ie.getDistRow(iat).data()); |
112: Vat[iat] = std::accumulate(U.begin(), U.begin() + Nions, valT()); |
113: Lap[iat] = accumulateGL(dU.data(), d2U.data(), d_ie.getDisplRow(iat), Grad[iat]); |
[...] |
165: { |
166: if (fromscratch) |
167: recompute(P); |
168: |
169: for (size_t iat = 0; iat < Nelec; ++iat) |
170: G[iat] += Grad[iat]; |
171: for (size_t iat = 0; iat < Nelec; ++iat) |
172: L[iat] -= Lap[iat]; |
173: LogValue = -std::accumulate(Vat.begin(), Vat.begin() + Nelec, valT()); |
174: } |
[...] |
186: for (int jat = 0; jat < Nions; ++jat) |
187: lap += d2u[jat] + lapfac * du[jat]; |
188: for (int idim = 0; idim < OHMMS_DIM; ++idim) |
189: { |
190: const valT* restrict dX = displ.data(idim); |
191: valT s = valT(); |
192: for (int jat = 0; jat < Nions; ++jat) |
193: s += du[jat] * dX[jat]; |
194: grad[idim] = s; |
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/stl_numeric.h: 126 - 127 |
-------------------------------------------------------------------------------- |
126: for (; __first != __last; ++__first) |
127: __init = __init + *__first; |
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/stl_iterator.h: 784 - 887 |
-------------------------------------------------------------------------------- |
784: : _M_current(__i) { } |
[...] |
887: { return __lhs.base() != __rhs.base(); } |
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/Numerics/PETE/OperatorTags.h: 94 - 94 |
-------------------------------------------------------------------------------- |
94: (const_cast<T1&>(a) += b); |
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/TinyVector.h: 169 - 170 |
-------------------------------------------------------------------------------- |
169: inline Type_t& operator[](unsigned int i) { return X[i]; } |
170: inline const Type_t& operator[](unsigned int i) const { return X[i]; } |
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/stl_vector.h: 951 - 1056 |
-------------------------------------------------------------------------------- |
951: return *(this->_M_impl._M_start + __n); |
[...] |
1056: { return _M_data_ptr(this->_M_impl._M_start); } |
0x41a420 PUSH %RBP |
0x41a421 MOV %RSP,%RBP |
0x41a424 PUSH %R15 |
0x41a426 PUSH %R14 |
0x41a428 PUSH %R13 |
0x41a42a PUSH %R12 |
0x41a42c PUSH %RBX |
0x41a42d SUB $0x18,%RSP |
0x41a431 MOV %RCX,%R14 |
0x41a434 MOV %RDX,%R15 |
0x41a437 MOV %RDI,%RBX |
0x41a43a TEST %R8B,%R8B |
0x41a43d JE 41a832 |
0x41a443 MOV %RSI,%R12 |
0x41a446 MOV 0xa8(%RBX),%ESI |
0x41a44c MOV %R12,%RDI |
0x41a44f CALL 460d00 <_ZNK11qmcplusplus11ParticleSet14getDistTableABEi> |
0x41a454 MOV %RAX,%R13 |
0x41a457 MOV 0x94(%RBX),%EAX |
0x41a45d TEST %EAX,%EAX |
0x41a45f JLE 41a838 |
0x41a465 MOV %R12,-0x40(%RBP) |
0x41a469 MOV %R15,-0x30(%RBP) |
0x41a46d MOV %R14,-0x38(%RBP) |
0x41a471 MOV $0x1fffffffffffffff,%R15 |
0x41a47b XOR %R14D,%R14D |
0x41a47e JMP 41a4ba |
(273) 0x41a480 LEA (%R14,%R14,2),%RAX |
(273) 0x41a484 VXORPD %XMM0,%XMM0,%XMM0 |
(273) 0x41a488 VMOVUPD %XMM0,(%RDX,%RAX,8) |
(273) 0x41a48d MOVQ $0,0x10(%RDX,%RAX,8) |
(273) 0x41a496 VXORPD %XMM0,%XMM0,%XMM0 |
(273) 0x41a49a MOV 0x1b8(%RBX),%RAX |
(273) 0x41a4a1 VMOVSD %XMM0,(%RAX,%R14,8) |
(273) 0x41a4a7 INC %R14 |
(273) 0x41a4aa MOVSXD 0x94(%RBX),%RAX |
(273) 0x41a4b1 CMP %RAX,%R14 |
(273) 0x41a4b4 JGE 41a845 |
(273) 0x41a4ba MOV 0x48(%R13),%RAX |
(273) 0x41a4be LEA (%R14,%R14,4),%R12 |
(273) 0x41a4c2 MOV 0x18(%RAX,%R12,8),%RCX |
(273) 0x41a4c7 MOV %RBX,%RDI |
(273) 0x41a4ca MOV -0x40(%RBP),%RSI |
(273) 0x41a4ce MOV %R14D,%EDX |
(273) 0x41a4d1 VZEROUPPER |
(273) 0x41a4d4 CALL 41c400 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE9computeU3ERNS1_11ParticleSetEiPKd> |
(273) 0x41a4d9 MOVSXD 0x90(%RBX),%RAX |
(273) 0x41a4e0 TEST %R15,%RAX |
(273) 0x41a4e3 JE 41a550 |
(273) 0x41a4e5 MOV 0x100(%RBX),%RCX |
(273) 0x41a4ec LEA (%RAX,%R15,1),%RDX |
(273) 0x41a4f0 AND %R15,%RDX |
(273) 0x41a4f3 INC %RDX |
(273) 0x41a4f6 MOV %RDX,%RSI |
(273) 0x41a4f9 MOV $0x3ffffffffffffffc,%RDI |
(273) 0x41a503 AND %RDI,%RSI |
(273) 0x41a506 VMOVSD 0xdd8da(%RIP),%XMM2 |
(273) 0x41a50e VBROADCASTSD 0xdd8d1(%RIP),%YMM3 |
(273) 0x41a517 JE 41a570 |
(273) 0x41a519 VXORPD %XMM0,%XMM0,%XMM0 |
(273) 0x41a51d XOR %EDI,%EDI |
(273) 0x41a51f NOP |
(285) 0x41a520 VADDPD (%RCX,%RDI,8),%YMM0,%YMM0 |
(285) 0x41a525 ADD $0x4,%RDI |
(285) 0x41a529 CMP %RSI,%RDI |
(285) 0x41a52c JB 41a520 |
(273) 0x41a52e VEXTRACTF128 $0x1,%YMM0,%XMM1 |
(273) 0x41a534 VADDPD %XMM1,%XMM0,%XMM0 |
(273) 0x41a538 VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(273) 0x41a53d VADDSD %XMM1,%XMM0,%XMM0 |
(273) 0x41a541 JMP 41a828 |
0x41a546 NOPW %CS:(%RAX,%RAX,1) |
(273) 0x41a550 VXORPD %XMM0,%XMM0,%XMM0 |
(273) 0x41a554 VMOVSD 0xdd88c(%RIP),%XMM2 |
(273) 0x41a55c VBROADCASTSD 0xdd883(%RIP),%YMM3 |
(273) 0x41a565 JMP 41a580 |
0x41a567 NOPW (%RAX,%RAX,1) |
(273) 0x41a570 VXORPD %XMM0,%XMM0,%XMM0 |
(273) 0x41a574 XOR %ESI,%ESI |
(273) 0x41a576 JMP 41a820 |
0x41a57b NOPL (%RAX,%RAX,1) |
(273) 0x41a580 MOV 0xf0(%RBX),%RCX |
(273) 0x41a587 VMOVSD %XMM0,(%RCX,%R14,8) |
(273) 0x41a58d MOV 0x190(%RBX),%RDX |
(273) 0x41a594 TEST %EAX,%EAX |
(273) 0x41a596 JLE 41a480 |
(273) 0x41a59c MOV 0x118(%RBX),%RCX |
(273) 0x41a5a3 MOV 0x130(%RBX),%RDI |
(273) 0x41a5aa MOV %RAX,%RSI |
(273) 0x41a5ad AND $-0x4,%RSI |
(273) 0x41a5b1 JE 41a600 |
(273) 0x41a5b3 VXORPD %XMM0,%XMM0,%XMM0 |
(273) 0x41a5b7 XOR %R8D,%R8D |
(273) 0x41a5ba NOPW (%RAX,%RAX,1) |
(283) 0x41a5c0 VADDPD (%RDI,%R8,8),%YMM0,%YMM0 |
(283) 0x41a5c6 VFMADD231PD (%RCX,%R8,8),%YMM3,%YMM0 |
(283) 0x41a5cc ADD $0x4,%R8 |
(283) 0x41a5d0 CMP %RSI,%R8 |
(283) 0x41a5d3 JL 41a5c0 |
(273) 0x41a5d5 VEXTRACTF128 $0x1,%YMM0,%XMM1 |
(273) 0x41a5db VADDPD %XMM1,%XMM0,%XMM0 |
(273) 0x41a5df VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(273) 0x41a5e4 VADDSD %XMM1,%XMM0,%XMM0 |
(273) 0x41a5e8 MOV %RSI,%R8 |
(273) 0x41a5eb CMP %RAX,%RSI |
(273) 0x41a5ee JNE 41a610 |
(273) 0x41a5f0 JMP 41a624 |
0x41a5f2 NOPW %CS:(%RAX,%RAX,1) |
(273) 0x41a600 VXORPD %XMM0,%XMM0,%XMM0 |
(273) 0x41a604 XOR %R8D,%R8D |
(273) 0x41a607 NOPW (%RAX,%RAX,1) |
(274) 0x41a610 VADDSD (%RDI,%R8,8),%XMM0,%XMM0 |
(274) 0x41a616 VFMADD231SD (%RCX,%R8,8),%XMM2,%XMM0 |
(274) 0x41a61c INC %R8 |
(274) 0x41a61f CMP %R8,%RAX |
(274) 0x41a622 JNE 41a610 |
(273) 0x41a624 MOV 0x60(%R13),%RDI |
(273) 0x41a628 MOV 0x8(%RDI,%R12,8),%R8 |
(273) 0x41a62d MOV 0x18(%RDI,%R12,8),%RDI |
(273) 0x41a632 MOV %R8,%R9 |
(273) 0x41a635 SAR $0x3f,%R9 |
(273) 0x41a639 ANDN %R8,%R9,%R9 |
(273) 0x41a63e TEST %R8,%R8 |
(273) 0x41a641 LEA (%RAX,%R9,2),%R9 |
(273) 0x41a645 LEA -0x8(%RDI,%R9,8),%R12 |
(273) 0x41a64a LEA (%R14,%R14,2),%R9 |
(273) 0x41a64e LEA (%RDX,%R9,8),%R10 |
(273) 0x41a652 MOV $0,%R11D |
(273) 0x41a658 CMOVS %R8,%R11 |
(273) 0x41a65c CMP %R10,%R12 |
(273) 0x41a65f JB 41a6c0 |
(273) 0x41a661 SAL $0x4,%R11 |
(273) 0x41a665 ADD %RDI,%R11 |
(273) 0x41a668 LEA (%RDX,%R9,8),%R12 |
(273) 0x41a66c ADD $0x10,%R12 |
(273) 0x41a670 CMP %R11,%R12 |
(273) 0x41a673 JB 41a6c0 |
(273) 0x41a675 SAL $0x3,%R8 |
(273) 0x41a679 XOR %EDX,%EDX |
(273) 0x41a67b NOPL (%RAX,%RAX,1) |
(282) 0x41a680 VXORPD %XMM1,%XMM1,%XMM1 |
(282) 0x41a684 XOR %ESI,%ESI |
(282) 0x41a686 NOPW %CS:(%RAX,%RAX,1) |
(281) 0x41a690 VMOVSD (%RDI,%RSI,8),%XMM2 |
(281) 0x41a695 VFMADD231SD (%RCX,%RSI,8),%XMM2,%XMM1 |
(281) 0x41a69b INC %RSI |
(281) 0x41a69e CMP %RSI,%RAX |
(281) 0x41a6a1 JNE 41a690 |
(282) 0x41a6a3 VMOVSD %XMM1,(%R10,%RDX,8) |
(282) 0x41a6a9 ADD %R8,%RDI |
(282) 0x41a6ac CMP $0x2,%RDX |
(282) 0x41a6b0 LEA 0x1(%RDX),%RDX |
(282) 0x41a6b4 JNE 41a680 |
(273) 0x41a6b6 JMP 41a49a |
0x41a6bb NOPL (%RAX,%RAX,1) |
(273) 0x41a6c0 TEST %RSI,%RSI |
(273) 0x41a6c3 JE 41a702 |
(273) 0x41a6c5 VXORPD %XMM1,%XMM1,%XMM1 |
(273) 0x41a6c9 XOR %R10D,%R10D |
(273) 0x41a6cc NOPL (%RAX) |
(280) 0x41a6d0 VMOVUPD (%RDI,%R10,8),%YMM2 |
(280) 0x41a6d6 VFMADD231PD (%RCX,%R10,8),%YMM2,%YMM1 |
(280) 0x41a6dc ADD $0x4,%R10 |
(280) 0x41a6e0 CMP %RSI,%R10 |
(280) 0x41a6e3 JL 41a6d0 |
(273) 0x41a6e5 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(273) 0x41a6eb VADDPD %XMM2,%XMM1,%XMM1 |
(273) 0x41a6ef VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(273) 0x41a6f4 VADDSD %XMM2,%XMM1,%XMM1 |
(273) 0x41a6f8 MOV %RSI,%R10 |
(273) 0x41a6fb CMP %RAX,%RSI |
(273) 0x41a6fe JNE 41a710 |
(273) 0x41a700 JMP 41a724 |
(273) 0x41a702 VXORPD %XMM1,%XMM1,%XMM1 |
(273) 0x41a706 XOR %R10D,%R10D |
(273) 0x41a709 NOPL (%RAX) |
(275) 0x41a710 VMOVSD (%RDI,%R10,8),%XMM2 |
(275) 0x41a716 VFMADD231SD (%RCX,%R10,8),%XMM2,%XMM1 |
(275) 0x41a71c INC %R10 |
(275) 0x41a71f CMP %R10,%RAX |
(275) 0x41a722 JNE 41a710 |
(273) 0x41a724 VMOVSD %XMM1,(%RDX,%R9,8) |
(273) 0x41a72a TEST %RSI,%RSI |
(273) 0x41a72d JE 41a772 |
(273) 0x41a72f LEA (%RDI,%R8,8),%R10 |
(273) 0x41a733 VXORPD %XMM1,%XMM1,%XMM1 |
(273) 0x41a737 XOR %R11D,%R11D |
(273) 0x41a73a NOPW (%RAX,%RAX,1) |
(279) 0x41a740 VMOVUPD (%R10,%R11,8),%YMM2 |
(279) 0x41a746 VFMADD231PD (%RCX,%R11,8),%YMM2,%YMM1 |
(279) 0x41a74c ADD $0x4,%R11 |
(279) 0x41a750 CMP %RSI,%R11 |
(279) 0x41a753 JL 41a740 |
(273) 0x41a755 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(273) 0x41a75b VADDPD %XMM2,%XMM1,%XMM1 |
(273) 0x41a75f VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(273) 0x41a764 VADDSD %XMM2,%XMM1,%XMM1 |
(273) 0x41a768 MOV %RSI,%R10 |
(273) 0x41a76b CMP %RAX,%RSI |
(273) 0x41a76e JNE 41a779 |
(273) 0x41a770 JMP 41a794 |
(273) 0x41a772 VXORPD %XMM1,%XMM1,%XMM1 |
(273) 0x41a776 XOR %R10D,%R10D |
(273) 0x41a779 LEA (%RDI,%R8,8),%R11 |
(273) 0x41a77d NOPL (%RAX) |
(276) 0x41a780 VMOVSD (%R11,%R10,8),%XMM2 |
(276) 0x41a786 VFMADD231SD (%RCX,%R10,8),%XMM2,%XMM1 |
(276) 0x41a78c INC %R10 |
(276) 0x41a78f CMP %R10,%RAX |
(276) 0x41a792 JNE 41a780 |
(273) 0x41a794 VMOVSD %XMM1,0x8(%RDX,%R9,8) |
(273) 0x41a79b TEST %RSI,%RSI |
(273) 0x41a79e JE 41a7ef |
(273) 0x41a7a0 MOV %R8,%R10 |
(273) 0x41a7a3 SAL $0x4,%R10 |
(273) 0x41a7a7 ADD %RDI,%R10 |
(273) 0x41a7aa VXORPD %XMM1,%XMM1,%XMM1 |
(273) 0x41a7ae XOR %R11D,%R11D |
(273) 0x41a7b1 NOPW %CS:(%RAX,%RAX,1) |
(278) 0x41a7c0 VMOVUPD (%R10,%R11,8),%YMM2 |
(278) 0x41a7c6 VFMADD231PD (%RCX,%R11,8),%YMM2,%YMM1 |
(278) 0x41a7cc ADD $0x4,%R11 |
(278) 0x41a7d0 CMP %RSI,%R11 |
(278) 0x41a7d3 JL 41a7c0 |
(273) 0x41a7d5 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(273) 0x41a7db VADDPD %XMM2,%XMM1,%XMM1 |
(273) 0x41a7df VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(273) 0x41a7e4 VADDSD %XMM2,%XMM1,%XMM1 |
(273) 0x41a7e8 CMP %RAX,%RSI |
(273) 0x41a7eb JNE 41a7f5 |
(273) 0x41a7ed JMP 41a813 |
(273) 0x41a7ef VXORPD %XMM1,%XMM1,%XMM1 |
(273) 0x41a7f3 XOR %ESI,%ESI |
(273) 0x41a7f5 SAL $0x4,%R8 |
(273) 0x41a7f9 ADD %R8,%RDI |
(273) 0x41a7fc NOPL (%RAX) |
(277) 0x41a800 VMOVSD (%RDI,%RSI,8),%XMM2 |
(277) 0x41a805 VFMADD231SD (%RCX,%RSI,8),%XMM2,%XMM1 |
(277) 0x41a80b INC %RSI |
(277) 0x41a80e CMP %RSI,%RAX |
(277) 0x41a811 JNE 41a800 |
(273) 0x41a813 VMOVSD %XMM1,0x10(%RDX,%R9,8) |
(273) 0x41a81a JMP 41a49a |
0x41a81f NOP |
(284) 0x41a820 VADDSD (%RCX,%RSI,8),%XMM0,%XMM0 |
(284) 0x41a825 INC %RSI |
(284) 0x41a828 CMP %RSI,%RDX |
(284) 0x41a82b JNE 41a820 |
(273) 0x41a82d JMP 41a580 |
0x41a832 MOV 0x94(%RBX),%EAX |
0x41a838 VXORPD %XMM0,%XMM0,%XMM0 |
0x41a83c TEST %EAX,%EAX |
0x41a83e JNE 41a859 |
0x41a840 JMP 41aab6 |
0x41a845 MOV -0x38(%RBP),%R14 |
0x41a849 MOV -0x30(%RBP),%R15 |
0x41a84d VXORPD %XMM0,%XMM0,%XMM0 |
0x41a851 TEST %EAX,%EAX |
0x41a853 JE 41aab6 |
0x41a859 CLTQ |
0x41a85b MOV 0x190(%RBX),%RDX |
0x41a862 MOV 0x18(%R15),%RSI |
0x41a866 LEA -0x1(%RAX),%RCX |
0x41a86a LEA -0x8(,%RAX,8),%RDI |
0x41a872 LEA (%RDI,%RDI,2),%RDI |
0x41a876 LEA (%RSI,%RDI,1),%R8 |
0x41a87a ADD $0x10,%R8 |
0x41a87e CMP %RDX,%R8 |
0x41a881 JB 41a8e1 |
0x41a883 ADD %RDX,%RDI |
0x41a886 ADD $0x10,%RDI |
0x41a88a CMP %RSI,%RDI |
0x41a88d JB 41a8e1 |
0x41a88f XOR %EDI,%EDI |
0x41a891 NOPW %CS:(%RAX,%RAX,1) |
(272) 0x41a8a0 XOR %R8D,%R8D |
(272) 0x41a8a3 NOPW %CS:(%RAX,%RAX,1) |
(271) 0x41a8b0 VMOVSD (%RSI,%R8,8),%XMM1 |
(271) 0x41a8b6 VADDSD (%RDX,%R8,8),%XMM1,%XMM1 |
(271) 0x41a8bc VMOVSD %XMM1,(%RSI,%R8,8) |
(271) 0x41a8c2 INC %R8 |
(271) 0x41a8c5 CMP $0x3,%R8 |
(271) 0x41a8c9 JNE 41a8b0 |
(272) 0x41a8cb ADD $0x18,%RDX |
(272) 0x41a8cf ADD $0x18,%RSI |
(272) 0x41a8d3 CMP %RCX,%RDI |
(272) 0x41a8d6 LEA 0x1(%RDI),%RDI |
(272) 0x41a8da JNE 41a8a0 |
0x41a8dc JMP 41a98b |
0x41a8e1 TEST %RCX,%RCX |
0x41a8e4 JE 41aa02 |
0x41a8ea MOV %RAX,%R8 |
0x41a8ed AND $-0x2,%R8 |
0x41a8f1 MOV $0x28,%R9D |
0x41a8f7 XOR %EDI,%EDI |
0x41a8f9 NOPL (%RAX) |
(270) 0x41a900 VMOVUPD -0x28(%RSI,%R9,1),%XMM1 |
(270) 0x41a907 VADDPD -0x28(%RDX,%R9,1),%XMM1,%XMM1 |
(270) 0x41a90e VMOVUPD %XMM1,-0x28(%RSI,%R9,1) |
(270) 0x41a915 VMOVSD -0x18(%RSI,%R9,1),%XMM1 |
(270) 0x41a91c VADDSD -0x18(%RDX,%R9,1),%XMM1,%XMM1 |
(270) 0x41a923 VMOVSD %XMM1,-0x18(%RSI,%R9,1) |
(270) 0x41a92a VMOVUPD -0x10(%RSI,%R9,1),%XMM1 |
(270) 0x41a931 VADDPD -0x10(%RDX,%R9,1),%XMM1,%XMM1 |
(270) 0x41a938 VMOVUPD %XMM1,-0x10(%RSI,%R9,1) |
(270) 0x41a93f VMOVSD (%RSI,%R9,1),%XMM1 |
(270) 0x41a945 VADDSD (%RDX,%R9,1),%XMM1,%XMM1 |
(270) 0x41a94b VMOVSD %XMM1,(%RSI,%R9,1) |
(270) 0x41a951 ADD $0x2,%RDI |
(270) 0x41a955 ADD $0x30,%R9 |
(270) 0x41a959 CMP %RDI,%R8 |
(270) 0x41a95c JNE 41a900 |
0x41a95e TEST $0x1,%AL |
0x41a960 JE 41a98b |
0x41a962 SAL $0x3,%RDI |
0x41a966 LEA (%RDI,%RDI,2),%RDI |
0x41a96a VMOVUPD (%RSI,%RDI,1),%XMM1 |
0x41a96f VADDPD (%RDX,%RDI,1),%XMM1,%XMM1 |
0x41a974 VMOVUPD %XMM1,(%RSI,%RDI,1) |
0x41a979 VMOVSD 0x10(%RSI,%RDI,1),%XMM1 |
0x41a97f VADDSD 0x10(%RDX,%RDI,1),%XMM1,%XMM1 |
0x41a985 VMOVSD %XMM1,0x10(%RSI,%RDI,1) |
0x41a98b MOV 0x1b8(%RBX),%RDX |
0x41a992 MOV 0x18(%R14),%RSI |
0x41a996 LEA (%RSI,%RCX,8),%RDI |
0x41a99a CMP %RDX,%RDI |
0x41a99d JB 41a9c9 |
0x41a99f LEA (%RDX,%RCX,8),%RCX |
0x41a9a3 CMP %RSI,%RCX |
0x41a9a6 JB 41a9c9 |
0x41a9a8 XOR %ECX,%ECX |
0x41a9aa NOPW (%RAX,%RAX,1) |
(269) 0x41a9b0 VMOVSD (%RSI,%RCX,8),%XMM1 |
(269) 0x41a9b5 VSUBSD (%RDX,%RCX,8),%XMM1,%XMM1 |
(269) 0x41a9ba VMOVSD %XMM1,(%RSI,%RCX,8) |
(269) 0x41a9bf INC %RCX |
(269) 0x41a9c2 CMP %RCX,%RAX |
(269) 0x41a9c5 JNE 41a9b0 |
0x41a9c7 JMP 41aa37 |
0x41a9c9 MOV %RAX,%RCX |
0x41a9cc AND $-0x4,%RCX |
0x41a9d0 JE 41aa11 |
0x41a9d2 LEA -0x1(%RCX),%RDI |
0x41a9d6 XOR %R8D,%R8D |
0x41a9d9 NOPL (%RAX) |
(268) 0x41a9e0 VMOVUPD (%RSI,%R8,8),%YMM1 |
(268) 0x41a9e6 VSUBPD (%RDX,%R8,8),%YMM1,%YMM1 |
(268) 0x41a9ec VMOVUPD %YMM1,(%RSI,%R8,8) |
(268) 0x41a9f2 ADD $0x4,%R8 |
(268) 0x41a9f6 CMP %RDI,%R8 |
(268) 0x41a9f9 JBE 41a9e0 |
0x41a9fb CMP %RAX,%RCX |
0x41a9fe JNE 41aa20 |
0x41aa00 JMP 41aa37 |
0x41aa02 XOR %EDI,%EDI |
0x41aa04 TEST $0x1,%AL |
0x41aa06 JNE 41a962 |
0x41aa0c JMP 41a98b |
0x41aa11 XOR %ECX,%ECX |
0x41aa13 NOPW %CS:(%RAX,%RAX,1) |
(265) 0x41aa20 VMOVSD (%RSI,%RCX,8),%XMM1 |
(265) 0x41aa25 VSUBSD (%RDX,%RCX,8),%XMM1,%XMM1 |
(265) 0x41aa2a VMOVSD %XMM1,(%RSI,%RCX,8) |
(265) 0x41aa2f INC %RCX |
(265) 0x41aa32 CMP %RCX,%RAX |
(265) 0x41aa35 JNE 41aa20 |
0x41aa37 LEA (,%RAX,8),%RCX |
0x41aa3f TEST %RCX,%RCX |
0x41aa42 JE 41aab6 |
0x41aa44 MOV $0x1fffffffffffffff,%RDX |
0x41aa4e MOV 0xf0(%RBX),%RCX |
0x41aa55 ADD %RDX,%RAX |
0x41aa58 AND %RDX,%RAX |
0x41aa5b INC %RAX |
0x41aa5e MOV $0x3ffffffffffffffc,%RDX |
0x41aa68 AND %RAX,%RDX |
0x41aa6b JE 41aaa3 |
0x41aa6d VXORPD %XMM0,%XMM0,%XMM0 |
0x41aa71 XOR %ESI,%ESI |
0x41aa73 NOPW %CS:(%RAX,%RAX,1) |
(267) 0x41aa80 VADDPD (%RCX,%RSI,8),%YMM0,%YMM0 |
(267) 0x41aa85 ADD $0x4,%RSI |
(267) 0x41aa89 CMP %RDX,%RSI |
(267) 0x41aa8c JB 41aa80 |
0x41aa8e VEXTRACTF128 $0x1,%YMM0,%XMM1 |
0x41aa94 VADDPD %XMM1,%XMM0,%XMM0 |
0x41aa98 VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
0x41aa9d VADDSD %XMM1,%XMM0,%XMM0 |
0x41aaa1 JMP 41aab1 |
0x41aaa3 XOR %EDX,%EDX |
0x41aaa5 VXORPD %XMM0,%XMM0,%XMM0 |
(266) 0x41aaa9 VADDSD (%RCX,%RDX,8),%XMM0,%XMM0 |
(266) 0x41aaae INC %RDX |
(266) 0x41aab1 CMP %RDX,%RAX |
(266) 0x41aab4 JNE 41aaa9 |
0x41aab6 VXORPD 0xdc1a2(%RIP),%XMM0,%XMM0 |
0x41aabe VMOVLPD %XMM0,0x10(%RBX) |
0x41aac3 ADD $0x18,%RSP |
0x41aac7 POP %RBX |
0x41aac8 POP %R12 |
0x41aaca POP %R13 |
0x41aacc POP %R14 |
0x41aace POP %R15 |
0x41aad0 POP %RBP |
0x41aad1 VZEROUPPER |
0x41aad4 RET |
0x41aad5 NOPW %CS:(%RAX,%RAX,1) |
0x41aadf NOP |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►97.67+ | miniqmcreference::OneBodyJastr[...] | OneBodyJastrowRef.h:122 | exec |
○ | qmcplusplus::WaveFunction::eva[...] | WaveFunction.cpp:175 | exec |
○ | main.extracted.113 | miniqmc.cpp:397 | exec |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so | |
►2.33+ | qmcplusplus::WaveFunction::eva[...] | stl_vector.h:933 | exec |
○ | main.extracted.110 | miniqmc.cpp:467 | exec |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Path / |
Source file and lines | OneBodyJastrowRef.h:108-194 |
Module | exec |
nb instructions | 137 |
nb uops | 139 |
loop length | 572 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 1 |
used zmm registers | 0 |
nb stack references | 3 |
micro-operation queue | 23.50 cycles |
front end | 23.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 9.70 | 9.57 | 7.33 | 7.33 | 6.50 | 9.63 | 9.50 | 6.50 | 6.50 | 6.50 | 9.60 | 7.33 |
cycles | 9.70 | 9.57 | 7.33 | 7.33 | 6.50 | 9.63 | 9.50 | 6.50 | 6.50 | 6.50 | 9.60 | 7.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 23.34 |
Stall cycles | 0.00 |
Front-end | 23.50 |
Dispatch | 9.70 |
Overall L1 | 23.50 |
all | 4% |
load | NA (no load vectorizable/vectorized instructions) |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 5% |
all | 68% |
load | 60% |
store | 33% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 50% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 100% |
all | 31% |
load | 60% |
store | 16% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 40% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 32% |
all | 11% |
load | NA (no load vectorizable/vectorized instructions) |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 21% |
load | 20% |
store | 16% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 18% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 25% |
all | 15% |
load | 20% |
store | 14% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 17% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x18,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
TEST %R8B,%R8B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41a832 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x412> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RSI,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0xa8(%RBX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 460d00 <_ZNK11qmcplusplus11ParticleSet14getDistTableABEi> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x94(%RBX),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %EAX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 41a838 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x418> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x1fffffffffffffff,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
XOR %R14D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 41a4ba <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x9a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x94(%RBX),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %EAX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 41a859 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x439> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 41aab6 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x696> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x38(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %EAX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41aab6 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x696> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CLTQ | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV 0x190(%RBX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%R15),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x1(%RAX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x8(,%RAX,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RDI,%RDI,2),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RSI,%RDI,1),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD $0x10,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RDX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 41a8e1 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x4c1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD %RDX,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD $0x10,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RSI,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 41a8e1 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x4c1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 41a98b <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x56b> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
TEST %RCX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41aa02 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x5e2> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x2,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV $0x28,%R9D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST $0x1,%AL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41a98b <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x56b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SAL $0x3,%RDI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
LEA (%RDI,%RDI,2),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVUPD (%RSI,%RDI,1),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VADDPD (%RDX,%RDI,1),%XMM1,%XMM1 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVUPD %XMM1,(%RSI,%RDI,1) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x10(%RSI,%RDI,1),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD 0x10(%RDX,%RDI,1),%XMM1,%XMM1 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM1,0x10(%RSI,%RDI,1) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x1b8(%RBX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%R14),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RSI,%RCX,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDX,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 41a9c9 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x5a9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%RDX,%RCX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RSI,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 41a9c9 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x5a9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 41aa37 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x617> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 41aa11 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x5f1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RCX),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 41aa20 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x600> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 41aa37 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x617> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST $0x1,%AL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 41a962 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x542> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 41a98b <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x56b> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (,%RAX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %RCX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41aab6 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x696> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x1fffffffffffffff,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
MOV 0xf0(%RBX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
AND %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
INC %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0x3ffffffffffffffc,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
AND %RAX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 41aaa3 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x683> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VEXTRACTF128 $0x1,%YMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VADDPD %XMM1,%XMM0,%XMM0 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VADDSD %XMM1,%XMM0,%XMM0 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
JMP 41aab1 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x691> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD 0xdc1a2(%RIP),%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVLPD %XMM0,0x10(%RBX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 4-12 | 0.50 |
ADD $0x18,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | OneBodyJastrowRef.h:108-194 |
Module | exec |
nb instructions | 137 |
nb uops | 139 |
loop length | 572 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 1 |
used zmm registers | 0 |
nb stack references | 3 |
micro-operation queue | 23.50 cycles |
front end | 23.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 9.70 | 9.57 | 7.33 | 7.33 | 6.50 | 9.63 | 9.50 | 6.50 | 6.50 | 6.50 | 9.60 | 7.33 |
cycles | 9.70 | 9.57 | 7.33 | 7.33 | 6.50 | 9.63 | 9.50 | 6.50 | 6.50 | 6.50 | 9.60 | 7.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 23.34 |
Stall cycles | 0.00 |
Front-end | 23.50 |
Dispatch | 9.70 |
Overall L1 | 23.50 |
all | 4% |
load | NA (no load vectorizable/vectorized instructions) |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 5% |
all | 68% |
load | 60% |
store | 33% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 50% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 100% |
all | 31% |
load | 60% |
store | 16% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 40% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 32% |
all | 11% |
load | NA (no load vectorizable/vectorized instructions) |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 21% |
load | 20% |
store | 16% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 18% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 25% |
all | 15% |
load | 20% |
store | 14% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 17% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x18,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
TEST %R8B,%R8B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41a832 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x412> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RSI,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0xa8(%RBX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 460d00 <_ZNK11qmcplusplus11ParticleSet14getDistTableABEi> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x94(%RBX),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %EAX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 41a838 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x418> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x1fffffffffffffff,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
XOR %R14D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 41a4ba <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x9a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x94(%RBX),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %EAX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 41a859 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x439> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 41aab6 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x696> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x38(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %EAX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41aab6 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x696> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CLTQ | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV 0x190(%RBX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%R15),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x1(%RAX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x8(,%RAX,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RDI,%RDI,2),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RSI,%RDI,1),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD $0x10,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RDX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 41a8e1 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x4c1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD %RDX,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD $0x10,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RSI,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 41a8e1 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x4c1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 41a98b <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x56b> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
TEST %RCX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41aa02 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x5e2> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x2,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV $0x28,%R9D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST $0x1,%AL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41a98b <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x56b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SAL $0x3,%RDI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
LEA (%RDI,%RDI,2),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVUPD (%RSI,%RDI,1),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VADDPD (%RDX,%RDI,1),%XMM1,%XMM1 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVUPD %XMM1,(%RSI,%RDI,1) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x10(%RSI,%RDI,1),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD 0x10(%RDX,%RDI,1),%XMM1,%XMM1 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM1,0x10(%RSI,%RDI,1) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x1b8(%RBX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%R14),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RSI,%RCX,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDX,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 41a9c9 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x5a9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%RDX,%RCX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RSI,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 41a9c9 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x5a9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 41aa37 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x617> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 41aa11 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x5f1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RCX),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 41aa20 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x600> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 41aa37 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x617> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST $0x1,%AL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 41a962 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x542> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 41a98b <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x56b> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (,%RAX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %RCX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 41aab6 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x696> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x1fffffffffffffff,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
MOV 0xf0(%RBX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
AND %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
INC %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0x3ffffffffffffffc,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
AND %RAX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 41aaa3 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x683> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VEXTRACTF128 $0x1,%YMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VADDPD %XMM1,%XMM0,%XMM0 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VADDSD %XMM1,%XMM0,%XMM0 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
JMP 41aab1 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x691> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD 0xdc1a2(%RIP),%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVLPD %XMM0,0x10(%RBX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 4-12 | 0.50 |
ADD $0x18,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼miniqmcreference::OneBodyJastrowRef | 0.02 | 0.02 |
○Loop 266 - OneBodyJastrowRef.h:0-0 - exec | 0 | 0 |
○Loop 265 - OneBodyJastrowRef.h:171-172 - exec | 0 | 0 |
▼Loop 273 - OneBodyJastrowRef.h:109-194 - exec– | 0 | 0 |
○Loop 280 - OneBodyJastrowRef.h:192-193 - exec | 0.01 | 0.01 |
○Loop 278 - OneBodyJastrowRef.h:192-193 - exec | 0 | 0 |
○Loop 284 - OneBodyJastrowRef.h:0-0 - exec | 0 | 0 |
○Loop 279 - OneBodyJastrowRef.h:192-193 - exec | 0 | 0 |
○Loop 283 - OneBodyJastrowRef.h:186-187 - exec | 0 | 0 |
○Loop 277 - OneBodyJastrowRef.h:192-193 - exec | 0 | 0 |
▼Loop 282 - OneBodyJastrowRef.h:188-194 - exec– | 0 | 0 |
○Loop 281 - OneBodyJastrowRef.h:192-193 - exec | 0 | 0 |
○Loop 285 - stl_numeric.h:126-127 - exec | 0 | 0 |
○Loop 276 - OneBodyJastrowRef.h:192-193 - exec | 0 | 0 |
○Loop 275 - OneBodyJastrowRef.h:192-193 - exec | 0 | 0 |
○Loop 274 - OneBodyJastrowRef.h:186-187 - exec | 0 | 0 |
▼Loop 272 - OneBodyJastrowRef.h:169-169 - exec– | 0 | 0 |
○Loop 271 - TinyVectorOps.h:49-49 - exec | 0 | 0 |
○Loop 267 - stl_numeric.h:126-127 - exec | 0 | 0 |
○Loop 268 - OneBodyJastrowRef.h:171-172 - exec | 0 | 0 |
○Loop 269 - OneBodyJastrowRef.h:171-172 - exec | 0 | 0 |
○Loop 270 - OneBodyJastrowRef.h:169-169 - exec | 0 | 0 |