Function: _ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE9computeU3ERNS ... | Module: libqmcwfs.so | Source: OneBodyJastrowRef.h:205-241 [...] | Coverage: 0.01% |
---|
Function: _ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE9computeU3ERNS ... | Module: libqmcwfs.so | Source: OneBodyJastrowRef.h:205-241 [...] | Coverage: 0.01% |
---|
/home/eoseret/qaas_runs_CPU_9468/171-145-9236/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/Jastrow/OneBodyJastrowRef.h: 205 - 241 |
-------------------------------------------------------------------------------- |
205: inline void computeU3(ParticleSet& P, int iat, const valT* dist) |
206: { |
207: if (NumGroups > 0) |
[...] |
214: for (int jg = 0; jg < NumGroups; ++jg) |
215: { |
216: if (F[jg] == nullptr) |
217: continue; |
218: F[jg]->evaluateVGL(-1, |
[...] |
231: for (int c = 0; c < Nions; ++c) |
232: { |
233: int gid = Ions.GroupID[c]; |
234: if (F[gid] != nullptr) |
235: { |
236: U[c] = F[gid]->evaluate(dist[c], dU[c], d2U[c]); |
237: dU[c] /= dist[c]; |
238: } |
239: } |
240: } |
241: } |
/cluster/comp/gcc/13.2.0/include/c++/13.2.0/bits/shared_ptr_base.h: 1666 - 1666 |
-------------------------------------------------------------------------------- |
1666: { return _M_ptr; } |
/cluster/comp/gcc/13.2.0/include/c++/13.2.0/bits/stl_vector.h: 1123 - 1258 |
-------------------------------------------------------------------------------- |
1123: operator[](size_type __n) _GLIBCXX_NOEXCEPT |
1124: { |
1125: __glibcxx_requires_subscript(__n); |
1126: return *(this->_M_impl._M_start + __n); |
[...] |
1258: { return _M_data_ptr(this->_M_impl._M_start); } |
/cluster/comp/gcc/13.2.0/include/c++/13.2.0/bits/stl_algobase.h: 931 - 1128 |
-------------------------------------------------------------------------------- |
931: *__first = __tmp; |
[...] |
1123: if (__n <= 0) |
1124: return __first; |
1125: |
1126: __glibcxx_requires_can_increment(__first, __n); |
1127: |
1128: std::__fill_a(__first, __first + __n, __value); |
/home/eoseret/qaas_runs_CPU_9468/171-145-9236/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/OhmmsVector.h: 223 - 229 |
-------------------------------------------------------------------------------- |
223: return X[i]; |
[...] |
229: return X[i]; |
/home/eoseret/qaas_runs_CPU_9468/171-145-9236/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/Jastrow/BsplineFunctor.h: 188 - 217 |
-------------------------------------------------------------------------------- |
188: if (r >= cutoff_radius) |
189: { |
190: dudr = d2udr2 = 0.0; |
191: return 0.0; |
192: } |
193: r *= DeltaRInv; |
194: real_type ipart, t; |
195: t = std::modf(r, &ipart); |
196: int i = (int)ipart; |
197: real_type tp[4]; |
198: tp[0] = t * t * t; |
199: tp[1] = t * t; |
200: tp[2] = t; |
201: tp[3] = 1.0; |
202: // clang-format off |
203: d2udr2 = DeltaRInv * DeltaRInv * |
204: (SplineCoefs[i+0]*(d2A[ 0]*tp[0] + d2A[ 1]*tp[1] + d2A[ 2]*tp[2] + d2A[ 3]*tp[3])+ |
205: SplineCoefs[i+1]*(d2A[ 4]*tp[0] + d2A[ 5]*tp[1] + d2A[ 6]*tp[2] + d2A[ 7]*tp[3])+ |
206: SplineCoefs[i+2]*(d2A[ 8]*tp[0] + d2A[ 9]*tp[1] + d2A[10]*tp[2] + d2A[11]*tp[3])+ |
207: SplineCoefs[i+3]*(d2A[12]*tp[0] + d2A[13]*tp[1] + d2A[14]*tp[2] + d2A[15]*tp[3])); |
208: dudr = DeltaRInv * |
209: (SplineCoefs[i+0]*(dA[ 0]*tp[0] + dA[ 1]*tp[1] + dA[ 2]*tp[2] + dA[ 3]*tp[3])+ |
210: SplineCoefs[i+1]*(dA[ 4]*tp[0] + dA[ 5]*tp[1] + dA[ 6]*tp[2] + dA[ 7]*tp[3])+ |
211: SplineCoefs[i+2]*(dA[ 8]*tp[0] + dA[ 9]*tp[1] + dA[10]*tp[2] + dA[11]*tp[3])+ |
212: SplineCoefs[i+3]*(dA[12]*tp[0] + dA[13]*tp[1] + dA[14]*tp[2] + dA[15]*tp[3])); |
213: return |
214: (SplineCoefs[i+0]*(A[ 0]*tp[0] + A[ 1]*tp[1] + A[ 2]*tp[2] + A[ 3]*tp[3])+ |
215: SplineCoefs[i+1]*(A[ 4]*tp[0] + A[ 5]*tp[1] + A[ 6]*tp[2] + A[ 7]*tp[3])+ |
216: SplineCoefs[i+2]*(A[ 8]*tp[0] + A[ 9]*tp[1] + A[10]*tp[2] + A[11]*tp[3])+ |
217: SplineCoefs[i+3]*(A[12]*tp[0] + A[13]*tp[1] + A[14]*tp[2] + A[15]*tp[3])); |
0x38a90 LEA 0x8(%RSP),%R10 |
0x38a95 AND $-0x20,%RSP |
0x38a99 PUSHQ -0x8(%R10) |
0x38a9d PUSH %RBP |
0x38a9e MOV %RSP,%RBP |
0x38aa1 PUSH %R15 |
0x38aa3 PUSH %R14 |
0x38aa5 PUSH %R13 |
0x38aa7 PUSH %R12 |
0x38aa9 MOV %RDI,%R12 |
0x38aac PUSH %R10 |
0x38aae PUSH %RBX |
0x38aaf SUB $0x60,%RSP |
0x38ab3 MOV 0x98(%RDI),%EAX |
0x38ab9 MOV %RCX,-0x48(%RBP) |
0x38abd MOVSXD 0x90(%RDI),%RBX |
0x38ac4 TEST %EAX,%EAX |
0x38ac6 JLE 38b98 |
0x38acc MOV 0x100(%RDI),%RDI |
0x38ad3 MOV 0x130(%R12),%R14 |
0x38adb MOV 0x118(%R12),%R15 |
0x38ae3 MOV %RDI,-0x50(%RBP) |
0x38ae7 TEST %EBX,%EBX |
0x38ae9 JLE 38b13 |
0x38aeb SAL $0x3,%RBX |
0x38aef XOR %ESI,%ESI |
0x38af1 MOV %RBX,%RDX |
0x38af4 CALL 80e0 <memset@plt> |
0x38af9 MOV %RBX,%RDX |
0x38afc XOR %ESI,%ESI |
0x38afe MOV %R15,%RDI |
0x38b01 CALL 80e0 <memset@plt> |
0x38b06 MOV %RBX,%RDX |
0x38b09 XOR %ESI,%ESI |
0x38b0b MOV %R14,%RDI |
0x38b0e CALL 80e0 <memset@plt> |
0x38b13 MOV 0x1c8(%R12),%RBX |
0x38b1b XOR %R13D,%R13D |
0x38b1e XCHG %AX,%AX |
(360) 0x38b20 MOV (%RBX,%R13,8),%RDI |
(360) 0x38b24 TEST %RDI,%RDI |
(360) 0x38b27 JE 38b6f |
(360) 0x38b29 MOV 0xa0(%R12),%R8 |
(360) 0x38b31 MOV $-0x1,%ESI |
(360) 0x38b36 MOV 0x268(%R8),%R9 |
(360) 0x38b3d MOV -0x48(%RBP),%R8 |
(360) 0x38b41 MOV 0x18(%R9),%R11 |
(360) 0x38b45 MOV -0x50(%RBP),%R9 |
(360) 0x38b49 MOV 0x4(%R11,%R13,4),%ECX |
(360) 0x38b4e MOV (%R11,%R13,4),%EDX |
(360) 0x38b52 PUSHQ 0x160(%R12) |
(360) 0x38b5a PUSHQ 0x148(%R12) |
(360) 0x38b62 PUSH %R14 |
(360) 0x38b64 PUSH %R15 |
(360) 0x38b66 CALL 37710 <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi> |
(360) 0x38b6b ADD $0x20,%RSP |
(360) 0x38b6f INC %R13 |
(360) 0x38b72 CMP %R13D,0x98(%R12) |
(360) 0x38b7a JG 38b20 |
0x38b7c LEA -0x30(%RBP),%RSP |
0x38b80 POP %RBX |
0x38b81 POP %R10 |
0x38b83 POP %R12 |
0x38b85 POP %R13 |
0x38b87 POP %R14 |
0x38b89 POP %R15 |
0x38b8b POP %RBP |
0x38b8c LEA -0x8(%R10),%RSP |
0x38b90 RET |
0x38b91 NOPL (%RAX) |
0x38b98 TEST %EBX,%EBX |
0x38b9a JLE 38b7c |
0x38b9c MOV 0xa0(%RDI),%RDX |
0x38ba3 LEA -0x38(%RBP),%RCX |
0x38ba7 MOVSXD %EBX,%R15 |
0x38baa XOR %R13D,%R13D |
0x38bad MOV %RCX,-0x78(%RBP) |
0x38bb1 MOV 0x1c8(%RDI),%R14 |
0x38bb8 MOV 0x18(%RDX),%RSI |
0x38bbc JMP 38bf9 |
0x38bbe XCHG %AX,%AX |
(359) 0x38bc0 MOVQ $0,(%R8) |
(359) 0x38bc7 VXORPD %XMM3,%XMM3,%XMM3 |
(359) 0x38bcb MOVQ $0,(%RAX) |
(359) 0x38bd2 MOV 0x100(%R12),%RCX |
(359) 0x38bda MOV -0x48(%RBP),%RDI |
(359) 0x38bde VMOVSD %XMM3,(%RCX,%RDX,1) |
(359) 0x38be3 VMOVSD (%RAX),%XMM0 |
(359) 0x38be7 VDIVSD (%RDI,%R13,8),%XMM0,%XMM4 |
(359) 0x38bed VMOVSD %XMM4,(%RAX) |
(359) 0x38bf1 INC %R13 |
(359) 0x38bf4 CMP %R13,%R15 |
(359) 0x38bf7 JE 38b7c |
(359) 0x38bf9 MOVSXD (%RSI,%R13,4),%RDI |
(359) 0x38bfd MOV (%R14,%RDI,8),%RBX |
(359) 0x38c01 TEST %RBX,%RBX |
(359) 0x38c04 JE 38bf1 |
(359) 0x38c06 MOV 0x130(%R12),%R8 |
(359) 0x38c0e MOV 0x118(%R12),%RAX |
(359) 0x38c16 LEA (,%R13,8),%RDX |
(359) 0x38c1e MOV -0x48(%RBP),%R9 |
(359) 0x38c22 ADD %RDX,%R8 |
(359) 0x38c25 ADD %RDX,%RAX |
(359) 0x38c28 VMOVSD (%R9,%R13,8),%XMM0 |
(359) 0x38c2e VCOMISD 0x8(%RBX),%XMM0 |
(359) 0x38c33 JAE 38bc0 |
(359) 0x38c35 VMOVSD 0x238(%RBX),%XMM4 |
(359) 0x38c3d MOV -0x78(%RBP),%RDI |
(359) 0x38c41 MOV %RSI,-0x70(%RBP) |
(359) 0x38c45 MOV %RAX,-0x68(%RBP) |
(359) 0x38c49 VMULSD %XMM4,%XMM0,%XMM0 |
(359) 0x38c4d MOV %RDX,-0x58(%RBP) |
(359) 0x38c51 VMOVSD %XMM4,-0x50(%RBP) |
(359) 0x38c56 MOV %R8,-0x60(%RBP) |
(359) 0x38c5a CALL 8230 <modf@plt> |
(359) 0x38c5f VCVTTSD2SI -0x38(%RBP),%ESI |
(359) 0x38c64 MOV -0x60(%RBP),%RAX |
(359) 0x38c68 VMULSD %XMM0,%XMM0,%XMM5 |
(359) 0x38c6c VMOVSD 0x120(%RBX),%XMM14 |
(359) 0x38c74 VBROADCASTSD %XMM0,%YMM2 |
(359) 0x38c79 VMOVSD 0x118(%RBX),%XMM7 |
(359) 0x38c81 VMOVSD 0x178(%RBX),%XMM11 |
(359) 0x38c89 MOV 0x218(%RBX),%R10 |
(359) 0x38c90 VMOVHPD 0x140(%RBX),%XMM14,%XMM15 |
(359) 0x38c98 VMOVHPD 0x138(%RBX),%XMM7,%XMM8 |
(359) 0x38ca0 VMOVSD 0x130(%RBX),%XMM14 |
(359) 0x38ca8 VMOVHPD 0x158(%RBX),%XMM11,%XMM12 |
(359) 0x38cb0 MOVSXD %ESI,%R11 |
(359) 0x38cb3 VINSERTF128 $0x1,%XMM8,%YMM12,%YMM13 |
(359) 0x38cb9 VMOVSD 0x188(%RBX),%XMM8 |
(359) 0x38cc1 VPERMPD $0x4b,(%R10,%R11,8),%YMM10 |
(359) 0x38cc8 VMULSD %XMM5,%XMM0,%XMM6 |
(359) 0x38ccc VMOVSD 0x180(%RBX),%XMM0 |
(359) 0x38cd4 VBROADCASTSD %XMM5,%YMM3 |
(359) 0x38cd9 VMOVHPD 0x168(%RBX),%XMM8,%XMM11 |
(359) 0x38ce1 VMOVHPD 0x160(%RBX),%XMM0,%XMM4 |
(359) 0x38ce9 VMOVSD 0x190(%RBX),%XMM0 |
(359) 0x38cf1 VINSERTF128 $0x1,%XMM15,%YMM4,%YMM1 |
(359) 0x38cf7 VMOVHPD 0x150(%RBX),%XMM14,%XMM15 |
(359) 0x38cff VMULPD %YMM3,%YMM1,%YMM5 |
(359) 0x38d03 VMOVHPD 0x170(%RBX),%XMM0,%XMM4 |
(359) 0x38d0b VBROADCASTSD %XMM6,%YMM9 |
(359) 0x38d10 VMOVSD 0x128(%RBX),%XMM6 |
(359) 0x38d18 VINSERTF128 $0x1,%XMM15,%YMM4,%YMM1 |
(359) 0x38d1e VMOVHPD 0x148(%RBX),%XMM6,%XMM7 |
(359) 0x38d26 VINSERTF128 $0x1,%XMM7,%YMM11,%YMM12 |
(359) 0x38d2c VMOVSD -0x50(%RBP),%XMM11 |
(359) 0x38d31 VFMADD132PD %YMM2,%YMM1,%YMM12 |
(359) 0x38d36 VFMADD132PD %YMM9,%YMM5,%YMM13 |
(359) 0x38d3b VADDPD %YMM12,%YMM13,%YMM13 |
(359) 0x38d40 VMULSD %XMM11,%XMM11,%XMM12 |
(359) 0x38d45 VMULPD %YMM10,%YMM13,%YMM10 |
(359) 0x38d4a VEXTRACTF128 $0x1,%YMM10,%XMM5 |
(359) 0x38d50 VADDPD %XMM10,%XMM5,%XMM6 |
(359) 0x38d55 VUNPCKHPD %XMM6,%XMM6,%XMM7 |
(359) 0x38d59 VADDPD %XMM6,%XMM7,%XMM8 |
(359) 0x38d5d VMULSD %XMM8,%XMM12,%XMM14 |
(359) 0x38d62 VMOVSD %XMM14,(%RAX) |
(359) 0x38d66 VMOVSD 0xa0(%RBX),%XMM5 |
(359) 0x38d6e VMOVSD 0x100(%RBX),%XMM7 |
(359) 0x38d76 VMOVSD 0x98(%RBX),%XMM0 |
(359) 0x38d7e VMOVSD 0xf8(%RBX),%XMM4 |
(359) 0x38d86 VMOVHPD 0xc0(%RBX),%XMM5,%XMM6 |
(359) 0x38d8e VMOVHPD 0xe0(%RBX),%XMM7,%XMM8 |
(359) 0x38d96 VMOVSD 0xa8(%RBX),%XMM14 |
(359) 0x38d9e VPERMPD $0x4b,(%R10,%R11,8),%YMM15 |
(359) 0x38da5 VINSERTF128 $0x1,%XMM6,%YMM8,%YMM11 |
(359) 0x38dab VMOVHPD 0xd8(%RBX),%XMM4,%XMM13 |
(359) 0x38db3 VMOVHPD 0xb8(%RBX),%XMM0,%XMM1 |
(359) 0x38dbb VMULPD %YMM3,%YMM11,%YMM12 |
(359) 0x38dbf VINSERTF128 $0x1,%XMM1,%YMM13,%YMM10 |
(359) 0x38dc5 VMOVHPD 0xc8(%RBX),%XMM14,%XMM1 |
(359) 0x38dcd MOV -0x68(%RBP),%RAX |
(359) 0x38dd1 VMOVSD 0x108(%RBX),%XMM0 |
(359) 0x38dd9 VMOVSD 0xb0(%RBX),%XMM5 |
(359) 0x38de1 VMOVSD 0x110(%RBX),%XMM6 |
(359) 0x38de9 MOV -0x70(%RBP),%RSI |
(359) 0x38ded VMOVHPD 0xe8(%RBX),%XMM0,%XMM4 |
(359) 0x38df5 VMOVHPD 0xd0(%RBX),%XMM5,%XMM7 |
(359) 0x38dfd MOV -0x58(%RBP),%RDX |
(359) 0x38e01 VMOVHPD 0xf0(%RBX),%XMM6,%XMM8 |
(359) 0x38e09 VINSERTF128 $0x1,%XMM1,%YMM4,%YMM13 |
(359) 0x38e0f VINSERTF128 $0x1,%XMM7,%YMM8,%YMM11 |
(359) 0x38e15 VFMADD132PD %YMM9,%YMM12,%YMM10 |
(359) 0x38e1a VFMADD132PD %YMM2,%YMM11,%YMM13 |
(359) 0x38e1f VADDPD %YMM10,%YMM13,%YMM10 |
(359) 0x38e24 VMULPD %YMM15,%YMM10,%YMM15 |
(359) 0x38e29 VEXTRACTF128 $0x1,%YMM15,%XMM12 |
(359) 0x38e2f VADDPD %XMM15,%XMM12,%XMM14 |
(359) 0x38e34 VUNPCKHPD %XMM14,%XMM14,%XMM1 |
(359) 0x38e39 VADDPD %XMM14,%XMM1,%XMM0 |
(359) 0x38e3e VMULSD 0x238(%RBX),%XMM0,%XMM4 |
(359) 0x38e46 VMOVSD %XMM4,(%RAX) |
(359) 0x38e4a VMOVSD 0x20(%RBX),%XMM10 |
(359) 0x38e4f VMOVSD 0x18(%RBX),%XMM5 |
(359) 0x38e54 VMOVSD 0x80(%RBX),%XMM12 |
(359) 0x38e5c VMOVSD 0x78(%RBX),%XMM6 |
(359) 0x38e61 VMOVHPD 0x40(%RBX),%XMM10,%XMM15 |
(359) 0x38e66 VMOVHPD 0x38(%RBX),%XMM5,%XMM7 |
(359) 0x38e6b VMOVSD 0x28(%RBX),%XMM0 |
(359) 0x38e70 VMOVSD 0x88(%RBX),%XMM5 |
(359) 0x38e78 VMOVHPD 0x60(%RBX),%XMM12,%XMM14 |
(359) 0x38e7d VMOVHPD 0x58(%RBX),%XMM6,%XMM8 |
(359) 0x38e82 VMOVSD 0x90(%RBX),%XMM10 |
(359) 0x38e8a VMOVSD 0x30(%RBX),%XMM6 |
(359) 0x38e8f VINSERTF128 $0x1,%XMM15,%YMM14,%YMM1 |
(359) 0x38e95 VINSERTF128 $0x1,%XMM7,%YMM8,%YMM11 |
(359) 0x38e9b VMOVHPD 0x48(%RBX),%XMM0,%XMM4 |
(359) 0x38ea0 VMULPD %YMM3,%YMM1,%YMM3 |
(359) 0x38ea4 VMOVHPD 0x68(%RBX),%XMM5,%XMM7 |
(359) 0x38ea9 VMOVHPD 0x70(%RBX),%XMM10,%XMM15 |
(359) 0x38eae VINSERTF128 $0x1,%XMM4,%YMM7,%YMM8 |
(359) 0x38eb4 VPERMPD $0x4b,(%R10,%R11,8),%YMM13 |
(359) 0x38ebb VFMADD132PD %YMM11,%YMM3,%YMM9 |
(359) 0x38ec0 VMOVHPD 0x50(%RBX),%XMM6,%XMM11 |
(359) 0x38ec5 VINSERTF128 $0x1,%XMM11,%YMM15,%YMM12 |
(359) 0x38ecb VFMADD231PD %YMM8,%YMM2,%YMM12 |
(359) 0x38ed0 VADDPD %YMM9,%YMM12,%YMM2 |
(359) 0x38ed5 VMULPD %YMM13,%YMM2,%YMM9 |
(359) 0x38eda VEXTRACTF128 $0x1,%YMM9,%XMM13 |
(359) 0x38ee0 VADDPD %XMM9,%XMM13,%XMM14 |
(359) 0x38ee5 VUNPCKHPD %XMM14,%XMM14,%XMM1 |
(359) 0x38eea VADDPD %XMM14,%XMM1,%XMM3 |
(359) 0x38eef VZEROUPPER |
(359) 0x38ef2 JMP 38bd2 |
0x38ef7 NOP |
0x38ef8 NOPL (%RAX,%RAX,1) |
Path / |
Source file and lines | OneBodyJastrowRef.h:205-241 |
Module | libqmcwfs.so |
nb instructions | 63 |
nb uops | 67 |
loop length | 221 |
used x86 registers | 13 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 6 |
micro-operation queue | 11.17 cycles |
front end | 11.17 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 2.50 | 1.73 | 6.00 | 6.00 | 7.00 | 1.73 | 2.50 | 7.00 | 7.00 | 7.00 | 1.53 | 6.00 |
cycles | 2.50 | 1.73 | 6.00 | 6.00 | 7.00 | 1.73 | 2.50 | 7.00 | 7.00 | 7.00 | 1.53 | 6.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 10.79-10.86 |
Stall cycles | 0.00 |
Front-end | 11.17 |
Dispatch | 7.00 |
Overall L1 | 11.17 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 9% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 7% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
LEA 0x8(%RSP),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
PUSHQ -0x8(%R10) | 2 | 0 | 0 | 0.33 | 0.33 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0.33 | 5-12 | 0.62 |
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RDI,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R10 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x60,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x98(%RDI),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVSXD 0x90(%RDI),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %EAX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 38b98 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE9computeU3ERNS1_11ParticleSetEiPKd+0x108> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x100(%RDI),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x130(%R12),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x118(%R12),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDI,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %EBX,%EBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 38b13 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE9computeU3ERNS1_11ParticleSetEiPKd+0x83> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SAL $0x3,%RBX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RBX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 80e0 <memset@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RBX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 80e0 <memset@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RBX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 80e0 <memset@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x1c8(%R12),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
XOR %R13D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x30(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
LEA -0x8(%R10),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %EBX,%EBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 38b7c <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE9computeU3ERNS1_11ParticleSetEiPKd+0xec> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xa0(%RDI),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x38(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOVSXD %EBX,%R15 | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
XOR %R13D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RCX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x1c8(%RDI),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RDX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 38bf9 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE9computeU3ERNS1_11ParticleSetEiPKd+0x169> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | OneBodyJastrowRef.h:205-241 |
Module | libqmcwfs.so |
nb instructions | 63 |
nb uops | 67 |
loop length | 221 |
used x86 registers | 13 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 6 |
micro-operation queue | 11.17 cycles |
front end | 11.17 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 2.50 | 1.73 | 6.00 | 6.00 | 7.00 | 1.73 | 2.50 | 7.00 | 7.00 | 7.00 | 1.53 | 6.00 |
cycles | 2.50 | 1.73 | 6.00 | 6.00 | 7.00 | 1.73 | 2.50 | 7.00 | 7.00 | 7.00 | 1.53 | 6.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 10.79-10.86 |
Stall cycles | 0.00 |
Front-end | 11.17 |
Dispatch | 7.00 |
Overall L1 | 11.17 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 9% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 7% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
LEA 0x8(%RSP),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
PUSHQ -0x8(%R10) | 2 | 0 | 0 | 0.33 | 0.33 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0.33 | 5-12 | 0.62 |
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RDI,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R10 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x60,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x98(%RDI),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVSXD 0x90(%RDI),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %EAX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 38b98 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE9computeU3ERNS1_11ParticleSetEiPKd+0x108> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x100(%RDI),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x130(%R12),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x118(%R12),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDI,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %EBX,%EBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 38b13 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE9computeU3ERNS1_11ParticleSetEiPKd+0x83> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SAL $0x3,%RBX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RBX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 80e0 <memset@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RBX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 80e0 <memset@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RBX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 80e0 <memset@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x1c8(%R12),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
XOR %R13D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x30(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
LEA -0x8(%R10),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %EBX,%EBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 38b7c <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE9computeU3ERNS1_11ParticleSetEiPKd+0xec> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xa0(%RDI),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x38(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOVSXD %EBX,%R15 | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
XOR %R13D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RCX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x1c8(%RDI),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RDX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 38bf9 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE9computeU3ERNS1_11ParticleSetEiPKd+0x169> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE9computeU3ERNS1_11ParticleSetEiPKd– | 0.01 | 0.01 |
○Loop 359 - BsplineFunctor.h:188-217 - libqmcwfs.so | 0 | 0 |
○Loop 360 - OneBodyJastrowRef.h:214-218 - libqmcwfs.so | 0 | 0 |