Loop Id: 389 | Module: exec | Source: TwoBodyJastrowRef.h:107-132 [...] | Coverage: 0.01% |
---|
Loop Id: 389 | Module: exec | Source: TwoBodyJastrowRef.h:107-132 [...] | Coverage: 0.01% |
---|
0x4208a0 VXORPD %XMM0,%XMM0,%XMM0 |
0x4208a4 VMOVUPD 0x60(%RSP),%YMM24 |
0x4208ac VMOVUPD 0x80(%RSP),%YMM25 |
0x4208b4 VMOVUPD 0xe0(%RSP),%YMM27 |
0x4208bc VMOVUPD 0xc0(%RSP),%YMM30 |
0x4208c4 VMOVUPD 0xa0(%RSP),%YMM31 |
0x4208cc VMOVUPD %YMM31,0xa0(%RSP) |
0x4208d4 VMOVUPD %YMM30,0xc0(%RSP) |
0x4208dc VMOVUPD %YMM27,0xe0(%RSP) |
0x4208e4 VMOVUPD %YMM25,0x80(%RSP) |
0x4208ec VMOVUPD %YMM24,0x60(%RSP) |
0x4208f4 VMOVSD 0x38(%RSP),%XMM1 |
0x4208fa VSUBSD %XMM0,%XMM1,%XMM0 |
0x4208fe VZEROUPPER |
0x420901 CALL 4db2b0 <exp> |
0x420906 MOV 0x30(%RSP),%RCX |
0x42090b MOV (%RCX),%RAX |
0x42090e MOV 0x10(%RSP),%RDX |
0x420913 VMOVSD %XMM0,(%RAX,%RDX,8) |
0x420918 INC %RDX |
0x42091b MOV 0x8(%RCX),%RCX |
0x42091f SUB %RAX,%RCX |
0x420922 SAR $0x3,%RCX |
0x420926 MOV %RDX,0x10(%RSP) |
0x42092b CMP %RDX,%RCX |
0x42092e MOV 0x28(%RSP),%RDI |
0x420933 MOV 0x18(%RSP),%RCX |
0x420938 JBE 42100e |
0x42093e CMPB $0,0x298(%RDI) |
0x420945 JE 42101d |
0x42094b MOVSXD 0x2a0(%RDI),%RBX |
0x420952 MOV 0xd8(%RCX),%RAX |
0x420959 VMOVSD (%RAX,%RBX,8),%XMM0 |
0x42095e VMOVSD %XMM0,0x38(%RSP) |
0x420964 MOV 0x290(%RDI),%R14 |
0x42096b MOV 0x248(%RCX),%ESI |
0x420971 VZEROUPPER |
0x420974 CALL 4600b0 <_ZNK11qmcplusplus11ParticleSet14getDistTableABEi> |
0x420979 MOV 0x18(%RSP),%RDI |
0x42097e MOV 0xa0(%RDI),%RCX |
0x420985 TEST %RCX,%RCX |
0x420988 JE 4208a0 |
0x42098e MOV 0x48(%RAX),%RAX |
0x420992 MOV 0x10(%RSP),%RDX |
0x420997 LEA (%RDX,%RDX,4),%RDX |
0x42099b MOV 0x18(%RAX,%RDX,8),%RAX |
0x4209a0 MOV %RAX,0x20(%RSP) |
0x4209a5 MOV 0x18(%R14),%RDX |
0x4209a9 MOV (%RDX,%RBX,4),%ESI |
0x4209ac IMUL %ECX,%ESI |
0x4209af MOV 0x1d0(%RDI),%RDX |
0x4209b6 MOV 0x200(%RDI),%RAX |
0x4209bd MOV %RAX,0x58(%RSP) |
0x4209c2 MOVSXD %ESI,%RAX |
0x4209c5 MOV %RAX,0x50(%RSP) |
0x4209ca DEC %RCX |
0x4209cd VPBROADCASTD %EBX,%YMM1 |
0x4209d3 VXORPD %XMM0,%XMM0,%XMM0 |
0x4209d7 XOR %R8D,%R8D |
0x4209da VMOVDQU64 0xdbb1c(%RIP),%YMM28 |
0x4209e4 VMOVDQU64 0xdbb32(%RIP),%YMM29 |
0x4209ee VMOVUPD 0x60(%RSP),%YMM24 |
0x4209f6 VMOVUPD 0x80(%RSP),%YMM25 |
0x4209fe VMOVUPD 0xe0(%RSP),%YMM27 |
0x420a06 VMOVUPD 0xc0(%RSP),%YMM30 |
0x420a0e VMOVUPD 0xa0(%RSP),%YMM31 |
0x420a16 MOV %R14,0x48(%RSP) |
0x420a1b MOV %RCX,0x40(%RSP) |
0x420a20 JMP 420a4c |
(390) 0x420a30 VXORPD %XMM18,%XMM18,%XMM18 |
(390) 0x420a36 VADDSD %XMM0,%XMM18,%XMM0 |
(390) 0x420a3c LEA 0x1(%R8),%RAX |
(390) 0x420a40 CMP %RCX,%R8 |
(390) 0x420a43 MOV %RAX,%R8 |
(390) 0x420a46 JE 4208cc |
(390) 0x420a4c MOV 0x268(%R14),%RSI |
(390) 0x420a53 MOV 0x18(%RSI),%RSI |
(390) 0x420a57 MOV (%RSI,%R8,4),%R13 |
(390) 0x420a5b MOV %R13,%RSI |
(390) 0x420a5e SHR $0x20,%RSI |
(390) 0x420a62 SUB %R13D,%ESI |
(390) 0x420a65 TEST %ESI,%ESI |
(390) 0x420a67 JLE 420a30 |
(390) 0x420a69 MOV 0x50(%RSP),%RAX |
(390) 0x420a6e LEA (%R8,%RAX,1),%RDI |
(390) 0x420a72 MOV 0x58(%RSP),%RAX |
(390) 0x420a77 MOV (%RAX,%RDI,8),%R9 |
(390) 0x420a7b VMOVSD 0x8(%R9),%XMM2 |
(390) 0x420a81 MOV %ESI,%R15D |
(390) 0x420a84 MOV %R15,%R11 |
(390) 0x420a87 MOVSXD %R13D,%R12 |
(390) 0x420a8a MOV $-0x10,%EAX |
(390) 0x420a8f AND %RAX,%R11 |
(390) 0x420a92 JE 420e00 |
(390) 0x420a98 MOV %RBX,%RCX |
(390) 0x420a9b VMOVQ %R13,%XMM3 |
(390) 0x420aa0 VBROADCASTSD %XMM2,%YMM4 |
(390) 0x420aa5 MOV 0x20(%RSP),%RAX |
(390) 0x420aaa LEA (%RAX,%R12,8),%RBX |
(390) 0x420aae XOR %R10D,%R10D |
(390) 0x420ab1 XOR %ESI,%ESI |
(390) 0x420ab3 NOPW %CS:(%RAX,%RAX,1) |
(393) 0x420ac0 VMOVUPD (%RBX,%RSI,8),%YMM5 |
(393) 0x420ac5 VMOVUPD 0x20(%RBX,%RSI,8),%YMM6 |
(393) 0x420acb VMOVUPD 0x40(%RBX,%RSI,8),%YMM7 |
(393) 0x420ad1 VMOVUPD 0x60(%RBX,%RSI,8),%YMM8 |
(393) 0x420ad7 VMOVD %ESI,%XMM9 |
(393) 0x420adb VPADDD %XMM3,%XMM9,%XMM9 |
(393) 0x420adf VPBROADCASTD %XMM9,%YMM9 |
(393) 0x420ae4 VPADDD %YMM28,%YMM9,%YMM10 |
(393) 0x420aea VPADDD %YMM29,%YMM9,%YMM9 |
(393) 0x420af0 VPCMPNEQD %YMM1,%YMM9,%K0 |
(393) 0x420af7 VPCMPNEQD %YMM1,%YMM10,%K2 |
(393) 0x420afe VCMPPD $0x1,%YMM4,%YMM5,%K5 |
(393) 0x420b05 VCMPPD $0x1,%YMM4,%YMM6,%K1 |
(393) 0x420b0c KMOVW %K1,0x60(%RSP) |
(393) 0x420b12 KSHIFTLB $0x4,%K1,%K3 |
(393) 0x420b18 KORB %K3,%K5,%K3 |
(393) 0x420b1c VCMPPD $0x1,%YMM4,%YMM7,%K6 |
(393) 0x420b23 VCMPPD $0x1,%YMM4,%YMM8,%K4 |
(393) 0x420b2a MOVSXD %R10D,%R10 |
(393) 0x420b2d LEA (%RDX,%R10,8),%RDI |
(393) 0x420b31 KANDB %K0,%K3,%K7 |
(393) 0x420b35 KMOVB %K7,%EAX |
(393) 0x420b39 KANDW %K2,%K6,%K7 |
(393) 0x420b3d POPCNT %EAX,%EAX |
(393) 0x420b41 VCOMPRESSPD %YMM7,(%RDI,%RAX,8){%K7} |
(393) 0x420b48 KANDW %K0,%K5,%K5 |
(393) 0x420b4c VCOMPRESSPD %YMM5,(%RDX,%R10,8){%K5} |
(393) 0x420b53 KSHIFTLB $0x4,%K4,%K1 |
(393) 0x420b59 KORB %K1,%K6,%K1 |
(393) 0x420b5d KMOVB %K7,0xe(%RSP) |
(393) 0x420b63 KSHIFTRB $0x4,%K2,%K6 |
(393) 0x420b69 KANDW %K6,%K4,%K4 |
(393) 0x420b6d LEA (%RDI,%RAX,8),%RAX |
(393) 0x420b71 MOVZX 0xe(%RSP),%R14D |
(393) 0x420b77 POPCNT %R14D,%R14D |
(393) 0x420b7c VCOMPRESSPD %YMM8,(%RAX,%R14,8){%K4} |
(393) 0x420b83 KUNPCKBW %K3,%K1,%K1 |
(393) 0x420b87 KMOVB %K5,0xf(%RSP) |
(393) 0x420b8d KUNPCKBW %K0,%K2,%K2 |
(393) 0x420b91 KSHIFTRB $0x4,%K0,%K0 |
(393) 0x420b97 KMOVW 0x60(%RSP),%K3 |
(393) 0x420b9d KANDW %K0,%K3,%K3 |
(393) 0x420ba1 MOVZX 0xf(%RSP),%EAX |
(393) 0x420ba6 POPCNT %EAX,%EAX |
(393) 0x420baa VCOMPRESSPD %YMM6,(%RDI,%RAX,8){%K3} |
(393) 0x420bb1 KANDW %K2,%K1,%K0 |
(393) 0x420bb5 KMOVW %K0,%EAX |
(393) 0x420bb9 POPCNT %EAX,%EAX |
(393) 0x420bbd ADD %EAX,%R10D |
(393) 0x420bc0 ADD $0x10,%RSI |
(393) 0x420bc4 CMP %R11,%RSI |
(393) 0x420bc7 JB 420ac0 |
(390) 0x420bcd CMP %R15,%R11 |
(390) 0x420bd0 MOV %RCX,%RBX |
(390) 0x420bd3 MOV 0x48(%RSP),%R14 |
(390) 0x420bd8 MOV 0x40(%RSP),%RCX |
(390) 0x420bdd JNE 420e06 |
(390) 0x420be3 TEST %R10D,%R10D |
(390) 0x420be6 JLE 420a30 |
(390) 0x420bec VMOVSD 0x238(%R9),%XMM3 |
(390) 0x420bf5 MOV 0x218(%R9),%R11 |
(390) 0x420bfc VMOVSD 0x18(%R9),%XMM18 |
(390) 0x420c03 VMOVSD 0x20(%R9),%XMM2 |
(390) 0x420c09 VMOVSD 0x28(%R9),%XMM6 |
(390) 0x420c0f VMOVSD 0x30(%R9),%XMM5 |
(390) 0x420c15 VMOVSD 0x38(%R9),%XMM17 |
(390) 0x420c1c VMOVSD 0x40(%R9),%XMM11 |
(390) 0x420c22 VMOVSD 0x48(%R9),%XMM13 |
(390) 0x420c28 VMOVSD 0x50(%R9),%XMM15 |
(390) 0x420c2e VMOVSD 0x58(%R9),%XMM7 |
(390) 0x420c34 VMOVSD 0x60(%R9),%XMM4 |
(390) 0x420c3a VMOVSD 0x68(%R9),%XMM10 |
(390) 0x420c40 VMOVSD 0x70(%R9),%XMM9 |
(390) 0x420c46 VMOVSD 0x78(%R9),%XMM12 |
(390) 0x420c4c VMOVSD 0x80(%R9),%XMM8 |
(390) 0x420c55 VMOVSD 0x88(%R9),%XMM14 |
(390) 0x420c5e VMOVSD 0x90(%R9),%XMM16 |
(390) 0x420c65 MOV %R10D,%R10D |
(390) 0x420c68 MOV %R10,%R9 |
(390) 0x420c6b MOV $-0x4,%EAX |
(390) 0x420c70 AND %RAX,%R9 |
(390) 0x420c73 JE 420e4b |
(390) 0x420c79 VMOVUPD %YMM25,0x80(%RSP) |
(390) 0x420c81 VMOVUPD %YMM24,0x60(%RSP) |
(390) 0x420c89 VBROADCASTSD %XMM3,%YMM19 |
(390) 0x420c8f VBROADCASTSD %XMM18,%YMM3 |
(390) 0x420c95 VBROADCASTSD %XMM2,%YMM2 |
(390) 0x420c9a VBROADCASTSD %XMM6,%YMM6 |
(390) 0x420c9f VBROADCASTSD %XMM5,%YMM5 |
(390) 0x420ca4 VPBROADCASTQ %R11,%YMM20 |
(390) 0x420caa VBROADCASTSD %XMM17,%YMM17 |
(390) 0x420cb0 VBROADCASTSD %XMM11,%YMM11 |
(390) 0x420cb5 VBROADCASTSD %XMM13,%YMM13 |
(390) 0x420cba VBROADCASTSD %XMM15,%YMM15 |
(390) 0x420cbf VBROADCASTSD %XMM7,%YMM7 |
(390) 0x420cc4 VBROADCASTSD %XMM4,%YMM4 |
(390) 0x420cc9 VBROADCASTSD %XMM10,%YMM10 |
(390) 0x420cce VBROADCASTSD %XMM9,%YMM9 |
(390) 0x420cd3 VBROADCASTSD %XMM12,%YMM12 |
(390) 0x420cd8 VBROADCASTSD %XMM8,%YMM8 |
(390) 0x420cdd VBROADCASTSD %XMM14,%YMM14 |
(390) 0x420ce2 VBROADCASTSD %XMM16,%YMM16 |
(390) 0x420ce8 VXORPD %XMM18,%XMM18,%XMM18 |
(390) 0x420cee XOR %ESI,%ESI |
(391) 0x420cf0 VMULPD (%RDX,%RSI,8),%YMM19,%YMM21 |
(391) 0x420cf7 VCVTTPD2DQ %YMM21,%XMM22 |
(391) 0x420cfd KXNORW %K0,%K0,%K1 |
(391) 0x420d01 VXORPD %XMM23,%XMM23,%XMM23 |
(391) 0x420d07 VGATHERDPD (%R11,%XMM22,8),%YMM23{%K1} |
(391) 0x420d0e KXNORW %K0,%K0,%K1 |
(391) 0x420d12 VXORPD %XMM24,%XMM24,%XMM24 |
(391) 0x420d18 VGATHERDPD 0x8(%R11,%XMM22,8),%YMM24{%K1} |
(391) 0x420d20 KXNORW %K0,%K0,%K1 |
(391) 0x420d24 VXORPD %XMM25,%XMM25,%XMM25 |
(391) 0x420d2a VGATHERDPD 0x10(%R11,%XMM22,8),%YMM25{%K1} |
(391) 0x420d32 VRNDSCALEPD $0xb,%YMM21,%YMM26 |
(391) 0x420d39 VSUBPD %YMM26,%YMM21,%YMM21 |
(391) 0x420d3f KXNORW %K0,%K0,%K1 |
(391) 0x420d43 VXORPD %XMM26,%XMM26,%XMM26 |
(391) 0x420d49 VGATHERDPD 0x18(%R11,%XMM22,8),%YMM26{%K1} |
(391) 0x420d51 VMOVAPD %YMM21,%YMM22 |
(391) 0x420d57 VFMADD213PD %YMM2,%YMM3,%YMM22 |
(391) 0x420d5d VFMADD213PD %YMM6,%YMM21,%YMM22 |
(391) 0x420d63 VFMADD213PD %YMM5,%YMM21,%YMM22 |
(391) 0x420d69 VFMADD213PD %YMM18,%YMM23,%YMM22 |
(391) 0x420d6f VMOVAPD %YMM21,%YMM18 |
(391) 0x420d75 VFMADD213PD %YMM11,%YMM17,%YMM18 |
(391) 0x420d7b VFMADD213PD %YMM13,%YMM21,%YMM18 |
(391) 0x420d81 VFMADD213PD %YMM15,%YMM21,%YMM18 |
(391) 0x420d87 VFMADD213PD %YMM22,%YMM24,%YMM18 |
(391) 0x420d8d VMOVAPD %YMM21,%YMM22 |
(391) 0x420d93 VFMADD213PD %YMM4,%YMM7,%YMM22 |
(391) 0x420d99 VFMADD213PD %YMM10,%YMM21,%YMM22 |
(391) 0x420d9f VFMADD213PD %YMM9,%YMM21,%YMM22 |
(391) 0x420da5 VFMADD213PD %YMM18,%YMM25,%YMM22 |
(391) 0x420dab VMOVAPD %YMM21,%YMM18 |
(391) 0x420db1 VFMADD213PD %YMM8,%YMM12,%YMM18 |
(391) 0x420db7 VFMADD213PD %YMM14,%YMM21,%YMM18 |
(391) 0x420dbd VFMADD213PD %YMM16,%YMM21,%YMM18 |
(391) 0x420dc3 VFMADD213PD %YMM22,%YMM26,%YMM18 |
(391) 0x420dc9 ADD $0x4,%RSI |
(391) 0x420dcd CMP %R9,%RSI |
(391) 0x420dd0 JB 420cf0 |
(390) 0x420dd6 VEXTRACTF32X4 $0x1,%YMM18,%XMM21 |
(390) 0x420ddd VADDPD %XMM21,%XMM18,%XMM18 |
(390) 0x420de3 VSHUFPD $0x1,%XMM18,%XMM18,%XMM21 |
(390) 0x420dea VADDSD %XMM21,%XMM18,%XMM18 |
(390) 0x420df0 CMP %R10,%R9 |
(390) 0x420df3 JNE 420ebb |
(390) 0x420df9 JMP 420a36 |
(390) 0x420e00 XOR %R10D,%R10D |
(390) 0x420e03 XOR %R11D,%R11D |
(390) 0x420e06 MOV %EBX,%ESI |
(390) 0x420e08 SUB %R13D,%ESI |
(390) 0x420e0b MOV 0x20(%RSP),%RAX |
(390) 0x420e10 LEA (%RAX,%R12,8),%RDI |
(390) 0x420e14 JMP 420e2c |
(392) 0x420e20 INC %R11 |
(392) 0x420e23 CMP %R11,%R15 |
(392) 0x420e26 JE 420be3 |
(392) 0x420e2c VMOVSD (%RDI,%R11,8),%XMM3 |
(392) 0x420e32 VUCOMISD %XMM3,%XMM2 |
(392) 0x420e36 JBE 420e20 |
(392) 0x420e38 CMP %R11D,%ESI |
(392) 0x420e3b JE 420e20 |
(392) 0x420e3d MOVSXD %R10D,%R10 |
(392) 0x420e40 VMOVSD %XMM3,(%RDX,%R10,8) |
(392) 0x420e46 INC %R10D |
(392) 0x420e49 JMP 420e20 |
(390) 0x420e4b VPBROADCASTQ %R10,%YMM21 |
(390) 0x420e51 VBROADCASTSD %XMM3,%YMM19 |
(390) 0x420e57 VBROADCASTSD %XMM18,%YMM3 |
(390) 0x420e5d VBROADCASTSD %XMM2,%YMM2 |
(390) 0x420e62 VBROADCASTSD %XMM6,%YMM6 |
(390) 0x420e67 VBROADCASTSD %XMM5,%YMM5 |
(390) 0x420e6c VPBROADCASTQ %R11,%YMM20 |
(390) 0x420e72 VBROADCASTSD %XMM17,%YMM17 |
(390) 0x420e78 VBROADCASTSD %XMM11,%YMM11 |
(390) 0x420e7d VBROADCASTSD %XMM13,%YMM13 |
(390) 0x420e82 VBROADCASTSD %XMM15,%YMM15 |
(390) 0x420e87 VBROADCASTSD %XMM7,%YMM7 |
(390) 0x420e8c VBROADCASTSD %XMM4,%YMM4 |
(390) 0x420e91 VBROADCASTSD %XMM10,%YMM10 |
(390) 0x420e96 VBROADCASTSD %XMM9,%YMM9 |
(390) 0x420e9b VBROADCASTSD %XMM12,%YMM12 |
(390) 0x420ea0 VBROADCASTSD %XMM8,%YMM8 |
(390) 0x420ea5 VBROADCASTSD %XMM14,%YMM14 |
(390) 0x420eaa VBROADCASTSD %XMM16,%YMM16 |
(390) 0x420eb0 VXORPD %XMM18,%XMM18,%XMM18 |
(390) 0x420eb6 XOR %R9D,%R9D |
(390) 0x420eb9 JMP 420ed1 |
(390) 0x420ebb VPBROADCASTQ %R10,%YMM21 |
(390) 0x420ec1 VMOVUPD 0x60(%RSP),%YMM24 |
(390) 0x420ec9 VMOVUPD 0x80(%RSP),%YMM25 |
(390) 0x420ed1 VPBROADCASTQ %R9,%YMM22 |
(390) 0x420ed7 VPSUBQ %YMM22,%YMM21,%YMM21 |
(390) 0x420edd VPCMPNLEUQ 0xdb5f8(%RIP),%YMM21,%K1 |
(390) 0x420ee8 VMOVUPD (%RDX,%R9,8),%YMM21{%K1}{z} |
(390) 0x420eef VMOVAPD %YMM21,%YMM31{%K1} |
(390) 0x420ef5 VMULPD %YMM31,%YMM19,%YMM19 |
(390) 0x420efb VCVTTPD2DQ %YMM19,%XMM21 |
(390) 0x420f01 VPMOVSXDQ %XMM21,%YMM21 |
(390) 0x420f07 VPSLLQ $0x3,%YMM21,%YMM21 |
(390) 0x420f0e VPADDQ %YMM21,%YMM20,%YMM20 |
(390) 0x420f14 KMOVQ %K1,%K2 |
(390) 0x420f19 VPXORD %XMM21,%XMM21,%XMM21 |
(390) 0x420f1f VGATHERQPD (,%YMM20,1),%YMM21{%K2} |
(390) 0x420f2a VRNDSCALEPD $0xb,%YMM19,%YMM22 |
(390) 0x420f31 KMOVQ %K1,%K2 |
(390) 0x420f36 VXORPD %XMM23,%XMM23,%XMM23 |
(390) 0x420f3c VGATHERQPD 0x8(,%YMM20,1),%YMM23{%K2} |
(390) 0x420f47 VSUBPD %YMM22,%YMM19,%YMM19 |
(390) 0x420f4d VMOVAPD %YMM21,%YMM30{%K1} |
(390) 0x420f53 VMOVAPD %YMM23,%YMM27{%K1} |
(390) 0x420f59 VFMADD231PD %YMM17,%YMM19,%YMM11 |
(390) 0x420f5f KMOVQ %K1,%K2 |
(390) 0x420f64 VXORPD %XMM17,%XMM17,%XMM17 |
(390) 0x420f6a VGATHERQPD 0x10(,%YMM20,1),%YMM17{%K2} |
(390) 0x420f75 VFMADD213PD %YMM13,%YMM19,%YMM11 |
(390) 0x420f7b VFMADD213PD %YMM15,%YMM19,%YMM11 |
(390) 0x420f81 VMULPD %YMM27,%YMM11,%YMM11 |
(390) 0x420f87 VMOVAPD %YMM17,%YMM25{%K1} |
(390) 0x420f8d KMOVQ %K1,%K2 |
(390) 0x420f92 VXORPD %XMM13,%XMM13,%XMM13 |
(390) 0x420f97 VGATHERQPD 0x18(,%YMM20,1),%YMM13{%K2} |
(390) 0x420fa2 VFMADD231PD %YMM12,%YMM19,%YMM8 |
(390) 0x420fa8 VFMADD213PD %YMM14,%YMM19,%YMM8 |
(390) 0x420fae VFMADD213PD %YMM16,%YMM19,%YMM8 |
(390) 0x420fb4 VMOVAPD %YMM13,%YMM24{%K1} |
(390) 0x420fba VFMADD231PD %YMM3,%YMM19,%YMM2 |
(390) 0x420fc0 VFMADD213PD %YMM6,%YMM19,%YMM2 |
(390) 0x420fc6 VFMADD213PD %YMM5,%YMM19,%YMM2 |
(390) 0x420fcc VFMADD213PD %YMM11,%YMM30,%YMM2 |
(390) 0x420fd2 VFMADD231PD %YMM7,%YMM19,%YMM4 |
(390) 0x420fd8 VFMADD213PD %YMM10,%YMM19,%YMM4 |
(390) 0x420fde VFMADD213PD %YMM9,%YMM19,%YMM4 |
(390) 0x420fe4 VFMADD213PD %YMM2,%YMM25,%YMM4 |
(390) 0x420fea VFMADD231PD %YMM8,%YMM24,%YMM4{%K1}{z} |
(390) 0x420ff0 VEXTRACTF128 $0x1,%YMM4,%XMM2 |
(390) 0x420ff6 VADDPD %XMM2,%XMM4,%XMM2 |
(390) 0x420ffa VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(390) 0x420fff VADDSD %XMM3,%XMM2,%XMM2 |
(390) 0x421003 VADDSD %XMM2,%XMM18,%XMM18 |
(390) 0x421009 JMP 420a36 |
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/refwrap.h: 313 - 313 |
-------------------------------------------------------------------------------- |
313: { return *_M_data; } |
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/shared_ptr_base.h: 1308 - 1308 |
-------------------------------------------------------------------------------- |
1308: { return _M_ptr; } |
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/OhmmsVector.h: 223 - 249 |
-------------------------------------------------------------------------------- |
223: return X[i]; |
[...] |
229: return X[i]; |
[...] |
249: inline const_pointer data() const { return X; } |
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/optional: 897 - 1213 |
-------------------------------------------------------------------------------- |
897: { return this->_M_payload._M_engaged; } |
[...] |
1213: return this->_M_is_engaged() |
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/Jastrow/BsplineFunctor.h: 229 - 260 |
-------------------------------------------------------------------------------- |
229: const real_type* restrict distArray = _distArray + iStart; |
[...] |
236: for (int jat = 0; jat < iLimit; jat++) |
237: { |
238: real_type r = distArray[jat]; |
239: // pick the distances smaller than the cutoff and avoid the reference atom |
240: if (r < cutoff_radius && iStart + jat != iat) |
241: distArrayCompressed[iCount++] = distArray[jat]; |
242: } |
243: |
244: real_type d = 0.0; |
245: //#pragma omp simd reduction(+:d) |
246: for (int jat = 0; jat < iCount; jat++) |
247: { |
248: real_type r = distArrayCompressed[jat]; |
249: r *= DeltaRInv; |
250: int i = (int)r; |
251: real_type t = r - real_type(i); |
252: real_type tp0 = t * t * t; |
253: real_type tp1 = t * t; |
254: real_type tp2 = t; |
255: |
256: real_type d1 = SplineCoefs[i + 0] * (A[0] * tp0 + A[1] * tp1 + A[2] * tp2 + A[3]); |
257: real_type d2 = SplineCoefs[i + 1] * (A[4] * tp0 + A[5] * tp1 + A[6] * tp2 + A[7]); |
258: real_type d3 = SplineCoefs[i + 2] * (A[8] * tp0 + A[9] * tp1 + A[10] * tp2 + A[11]); |
259: real_type d4 = SplineCoefs[i + 3] * (A[12] * tp0 + A[13] * tp1 + A[14] * tp2 + A[15]); |
260: d += (d1 + d2 + d3 + d4); |
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/Jastrow/TwoBodyJastrowRef.h: 107 - 132 |
-------------------------------------------------------------------------------- |
107: for (int k = 0; k < ratios.size(); ++k) |
108: ratios[k] = std::exp(Uat[VP.refPtcl] - computeU(VP.getRefPS(), VP.refPtcl, VP.getDistTableAB(myTableID).getDistRow(k).data())); |
[...] |
126: const int igt = P.GroupID[iat] * NumGroups; |
127: for (int jg = 0; jg < NumGroups; ++jg) |
128: { |
129: const FuncType& f2(*F[igt + jg]); |
130: int iStart = P.first(jg); |
131: int iEnd = P.last(jg); |
132: curUat += f2.evaluateV(iat, iStart, iEnd, dist, DistCompressed.data()); |
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/stl_vector.h: 806 - 1056 |
-------------------------------------------------------------------------------- |
806: { return size_type(this->_M_impl._M_finish - this->_M_impl._M_start); } |
[...] |
933: return *(this->_M_impl._M_start + __n); |
[...] |
951: return *(this->_M_impl._M_start + __n); |
[...] |
1056: { return _M_data_ptr(this->_M_impl._M_start); } |
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/Particle/ParticleSet.h: 313 - 316 |
-------------------------------------------------------------------------------- |
313: inline int first(int igroup) const { return (*group_offsets_)[igroup]; } |
314: |
315: ///return the last index of a group i |
316: inline int last(int igroup) const { return (*group_offsets_)[igroup + 1]; } |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►100.00+ | qmcplusplus::WaveFunction::eva[...] | stl_vector.h:806 | exec |
○ | qmcplusplus::NonLocalPP<double[...] | NonLocalPP.hpp:135 | exec |
○ | main.extracted.110 | NewTimer.h:249 | exec |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Path / |
Metric | Value |
---|---|
CQA speedup if no scalar integer | 1.78 |
CQA speedup if FP arith vectorized | 1.72 |
CQA speedup if fully vectorized | 5.48 |
CQA speedup if no inter-iteration dependency | NA |
CQA speedup if next bottleneck killed | 1.07 |
Bottlenecks | micro-operation queue, |
Function | miniqmcreference::TwoBodyJastrowRef |
Source | refwrap.h:313-313,OhmmsVector.h:223-223,OhmmsVector.h:229-229,OhmmsVector.h:249-249,optional:897-897,optional:1213-1213,TwoBodyJastrowRef.h:107-108,TwoBodyJastrowRef.h:126-127,stl_vector.h:806-806,stl_vector.h:933-933,stl_vector.h:951-951,stl_vector.h:1056-1056 |
Source loop unroll info | NA |
Source loop unroll confidence level | NA |
Unroll/vectorization loop type | NA |
Unroll factor | NA |
CQA cycles | 12.17 |
CQA cycles if no scalar integer | 6.83 |
CQA cycles if FP arith vectorized | 7.08 |
CQA cycles if fully vectorized | 2.22 |
Front-end cycles | 12.17 |
DIV/SQRT cycles | 0.00 |
P0 cycles | 2.40 |
P1 cycles | 2.50 |
P2 cycles | 11.33 |
P3 cycles | 11.33 |
P4 cycles | 7.50 |
P5 cycles | 2.30 |
P6 cycles | 2.40 |
P7 cycles | 7.50 |
P8 cycles | 7.50 |
P9 cycles | 7.50 |
P10 cycles | 2.40 |
P11 cycles | 11.33 |
Inter-iter dependencies cycles | NA |
FE+BE cycles (UFS) | 14.23 |
Stall cycles (UFS) | 2.52 |
Nb insns | 69.00 |
Nb uops | 73.00 |
Nb loads | 34.00 |
Nb stores | 13.00 |
Nb stack references | 15.00 |
FLOP/cycle | 0.08 |
Nb FLOP add-sub | 1.00 |
Nb FLOP mul | 0.00 |
Nb FLOP fma | 0.00 |
Nb FLOP div | 0.00 |
Nb FLOP rcp | 0.00 |
Nb FLOP sqrt | 0.00 |
Nb FLOP rsqrt | 0.00 |
Bytes/cycle | 62.88 |
Bytes prefetched | 0.00 |
Bytes loaded | 541.00 |
Bytes stored | 224.00 |
Stride 0 | NA |
Stride 1 | NA |
Stride n | NA |
Stride unknown | NA |
Stride indirect | NA |
Vectorization ratio all | 52.50 |
Vectorization ratio load | 70.59 |
Vectorization ratio store | 38.46 |
Vectorization ratio mul | 0.00 |
Vectorization ratio add_sub | 0.00 |
Vectorization ratio fma | NA |
Vectorization ratio div_sqrt | NA |
Vectorization ratio other | 44.44 |
Vector-efficiency ratio all | 28.63 |
Vector-efficiency ratio load | 37.59 |
Vector-efficiency ratio store | 26.92 |
Vector-efficiency ratio mul | 6.25 |
Vector-efficiency ratio add_sub | 12.50 |
Vector-efficiency ratio fma | NA |
Vector-efficiency ratio div_sqrt | NA |
Vector-efficiency ratio other | 15.45 |
Metric | Value |
---|---|
CQA speedup if no scalar integer | 1.78 |
CQA speedup if FP arith vectorized | 1.72 |
CQA speedup if fully vectorized | 5.48 |
CQA speedup if no inter-iteration dependency | NA |
CQA speedup if next bottleneck killed | 1.07 |
Bottlenecks | micro-operation queue, |
Function | miniqmcreference::TwoBodyJastrowRef |
Source | refwrap.h:313-313,OhmmsVector.h:223-223,OhmmsVector.h:229-229,OhmmsVector.h:249-249,optional:897-897,optional:1213-1213,TwoBodyJastrowRef.h:107-108,TwoBodyJastrowRef.h:126-127,stl_vector.h:806-806,stl_vector.h:933-933,stl_vector.h:951-951,stl_vector.h:1056-1056 |
Source loop unroll info | NA |
Source loop unroll confidence level | NA |
Unroll/vectorization loop type | NA |
Unroll factor | NA |
CQA cycles | 12.17 |
CQA cycles if no scalar integer | 6.83 |
CQA cycles if FP arith vectorized | 7.08 |
CQA cycles if fully vectorized | 2.22 |
Front-end cycles | 12.17 |
DIV/SQRT cycles | 0.00 |
P0 cycles | 2.40 |
P1 cycles | 2.50 |
P2 cycles | 11.33 |
P3 cycles | 11.33 |
P4 cycles | 7.50 |
P5 cycles | 2.30 |
P6 cycles | 2.40 |
P7 cycles | 7.50 |
P8 cycles | 7.50 |
P9 cycles | 7.50 |
P10 cycles | 2.40 |
P11 cycles | 11.33 |
Inter-iter dependencies cycles | NA |
FE+BE cycles (UFS) | 14.23 |
Stall cycles (UFS) | 2.52 |
Nb insns | 69.00 |
Nb uops | 73.00 |
Nb loads | 34.00 |
Nb stores | 13.00 |
Nb stack references | 15.00 |
FLOP/cycle | 0.08 |
Nb FLOP add-sub | 1.00 |
Nb FLOP mul | 0.00 |
Nb FLOP fma | 0.00 |
Nb FLOP div | 0.00 |
Nb FLOP rcp | 0.00 |
Nb FLOP sqrt | 0.00 |
Nb FLOP rsqrt | 0.00 |
Bytes/cycle | 62.88 |
Bytes prefetched | 0.00 |
Bytes loaded | 541.00 |
Bytes stored | 224.00 |
Stride 0 | NA |
Stride 1 | NA |
Stride n | NA |
Stride unknown | NA |
Stride indirect | NA |
Vectorization ratio all | 52.50 |
Vectorization ratio load | 70.59 |
Vectorization ratio store | 38.46 |
Vectorization ratio mul | 0.00 |
Vectorization ratio add_sub | 0.00 |
Vectorization ratio fma | NA |
Vectorization ratio div_sqrt | NA |
Vectorization ratio other | 44.44 |
Vector-efficiency ratio all | 28.63 |
Vector-efficiency ratio load | 37.59 |
Vector-efficiency ratio store | 26.92 |
Vector-efficiency ratio mul | 6.25 |
Vector-efficiency ratio add_sub | 12.50 |
Vector-efficiency ratio fma | NA |
Vector-efficiency ratio div_sqrt | NA |
Vector-efficiency ratio other | 15.45 |
Path / |
Function | miniqmcreference::TwoBodyJastrowRef |
Source file and lines | TwoBodyJastrowRef.h:107-132 |
Module | exec |
nb instructions | 69 |
nb uops | 73 |
loop length | 386 |
used x86 registers | 9 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 8 |
used zmm registers | 0 |
nb stack references | 15 |
micro-operation queue | 12.17 cycles |
front end | 12.17 cycles |
| | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 2.40 | 2.50 | 11.33 | 11.33 | 7.50 | 2.30 | 2.40 | 7.50 | 7.50 | 7.50 | 2.40 | 11.33 |
cycles | 2.40 | 2.50 | 11.33 | 11.33 | 7.50 | 2.30 | 2.40 | 7.50 | 7.50 | 7.50 | 2.40 | 11.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 14.23 |
Stall cycles | 2.52 |
LM full (events) | 6.08 |
Front-end | 12.17 |
Dispatch | 11.33 |
Overall L1 | 12.17 |
all | 22% |
load | 40% |
store | 0% |
mul | 0% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 28% |
all | 77% |
load | 83% |
store | 71% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 100% |
all | 52% |
load | 70% |
store | 38% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 44% |
all | 15% |
load | 22% |
store | 12% |
mul | 6% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 39% |
load | 43% |
store | 39% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 25% |
all | 28% |
load | 37% |
store | 26% |
mul | 6% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVUPD 0x60(%RSP),%YMM24 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x80(%RSP),%YMM25 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0xe0(%RSP),%YMM27 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0xc0(%RSP),%YMM30 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0xa0(%RSP),%YMM31 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD %YMM31,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM30,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM27,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM25,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM24,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x38(%RSP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VSUBSD %XMM0,%XMM1,%XMM0 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4db2b0 <exp> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x30(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD %XMM0,(%RAX,%RDX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
INC %RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x8(%RCX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SAR $0x3,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RDX,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %RDX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x28(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JBE 42100e <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0x7be> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMPB $0,0x298(%RDI) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 42101d <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0x7cd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVSXD 0x2a0(%RDI),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xd8(%RCX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD (%RAX,%RBX,8),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD %XMM0,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x290(%RDI),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x248(%RCX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4600b0 <_ZNK11qmcplusplus11ParticleSet14getDistTableABEi> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x18(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa0(%RDI),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RCX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 4208a0 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0x50> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x48(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RDX,%RDX,4),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x18(%RAX,%RDX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x18(%R14),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDX,%RBX,4),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
IMUL %ECX,%ESI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0x1d0(%RDI),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x200(%RDI),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVSXD %ESI,%RAX | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
MOV %RAX,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
DEC %RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VPBROADCASTD %EBX,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDQU64 0xdbb1c(%RIP),%YMM28 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVDQU64 0xdbb32(%RIP),%YMM29 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x60(%RSP),%YMM24 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x80(%RSP),%YMM25 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0xe0(%RSP),%YMM27 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0xc0(%RSP),%YMM30 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0xa0(%RSP),%YMM31 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV %R14,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 420a4c <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0x1fc> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
Function | miniqmcreference::TwoBodyJastrowRef |
Source file and lines | TwoBodyJastrowRef.h:107-132 |
Module | exec |
nb instructions | 69 |
nb uops | 73 |
loop length | 386 |
used x86 registers | 9 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 8 |
used zmm registers | 0 |
nb stack references | 15 |
micro-operation queue | 12.17 cycles |
front end | 12.17 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 2.40 | 2.50 | 11.33 | 11.33 | 7.50 | 2.30 | 2.40 | 7.50 | 7.50 | 7.50 | 2.40 | 11.33 |
cycles | 2.40 | 2.50 | 11.33 | 11.33 | 7.50 | 2.30 | 2.40 | 7.50 | 7.50 | 7.50 | 2.40 | 11.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 14.23 |
Stall cycles | 2.52 |
LM full (events) | 6.08 |
Front-end | 12.17 |
Dispatch | 11.33 |
Overall L1 | 12.17 |
all | 22% |
load | 40% |
store | 0% |
mul | 0% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 28% |
all | 77% |
load | 83% |
store | 71% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 100% |
all | 52% |
load | 70% |
store | 38% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 44% |
all | 15% |
load | 22% |
store | 12% |
mul | 6% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 39% |
load | 43% |
store | 39% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 25% |
all | 28% |
load | 37% |
store | 26% |
mul | 6% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVUPD 0x60(%RSP),%YMM24 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x80(%RSP),%YMM25 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0xe0(%RSP),%YMM27 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0xc0(%RSP),%YMM30 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0xa0(%RSP),%YMM31 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD %YMM31,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM30,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM27,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM25,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM24,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x38(%RSP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VSUBSD %XMM0,%XMM1,%XMM0 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4db2b0 <exp> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x30(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD %XMM0,(%RAX,%RDX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
INC %RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x8(%RCX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SAR $0x3,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RDX,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %RDX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x28(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JBE 42100e <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0x7be> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMPB $0,0x298(%RDI) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 42101d <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0x7cd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVSXD 0x2a0(%RDI),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xd8(%RCX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD (%RAX,%RBX,8),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD %XMM0,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x290(%RDI),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x248(%RCX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4600b0 <_ZNK11qmcplusplus11ParticleSet14getDistTableABEi> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x18(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa0(%RDI),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RCX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 4208a0 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0x50> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x48(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RDX,%RDX,4),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x18(%RAX,%RDX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x18(%R14),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDX,%RBX,4),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
IMUL %ECX,%ESI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0x1d0(%RDI),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x200(%RDI),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVSXD %ESI,%RAX | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
MOV %RAX,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
DEC %RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VPBROADCASTD %EBX,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDQU64 0xdbb1c(%RIP),%YMM28 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVDQU64 0xdbb32(%RIP),%YMM29 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x60(%RSP),%YMM24 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x80(%RSP),%YMM25 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0xe0(%RSP),%YMM27 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0xc0(%RSP),%YMM30 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0xa0(%RSP),%YMM31 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV %R14,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 420a4c <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0x1fc> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |