Loop Id: 286 | Module: exec | Source: OneBodyJastrowRef.h:134-155 [...] | Coverage: 0.01% |
---|
Loop Id: 286 | Module: exec | Source: OneBodyJastrowRef.h:134-155 [...] | Coverage: 0.01% |
---|
0x41ab61 VXORPD %XMM8,%XMM8,%XMM8 |
0x41ab66 NOPW %CS:(%RAX,%RAX,1) |
0x41ab70 VMOVSD 0x40(%RSP),%XMM0 |
0x41ab76 VSUBSD %XMM8,%XMM0,%XMM0 |
0x41ab7b VZEROUPPER |
0x41ab7e CALL 4d6610 <exp> |
0x41ab83 MOV 0x38(%RSP),%RCX |
0x41ab88 MOV (%RCX),%RAX |
0x41ab8b MOV 0x48(%RSP),%RBX |
0x41ab90 VMOVSD %XMM0,(%RAX,%RBX,8) |
0x41ab95 INC %RBX |
0x41ab98 MOV 0x8(%RCX),%RCX |
0x41ab9c SUB %RAX,%RCX |
0x41ab9f SAR $0x3,%RCX |
0x41aba3 CMP %RBX,%RCX |
0x41aba6 MOV 0x28(%RSP),%R14 |
0x41abab JBE 41b47c |
0x41abb1 MOV 0x30(%RSP),%RDI |
0x41abb6 MOVSXD 0x2a0(%RDI),%RAX |
0x41abbd MOV 0xf0(%R14),%RCX |
0x41abc4 VMOVSD (%RCX,%RAX,8),%XMM0 |
0x41abc9 VMOVSD %XMM0,0x40(%RSP) |
0x41abcf MOV 0xa8(%R14),%ESI |
0x41abd6 VZEROUPPER |
0x41abd9 CALL 460d00 <_ZNK11qmcplusplus11ParticleSet14getDistTableABEi> |
0x41abde MOV 0x48(%RAX),%RAX |
0x41abe2 LEA (%RBX,%RBX,4),%RCX |
0x41abe6 MOV 0x18(%RAX,%RCX,8),%RDI |
0x41abeb MOV 0x98(%R14),%EAX |
0x41abf2 TEST %EAX,%EAX |
0x41abf4 MOV %RBX,0x48(%RSP) |
0x41abf9 JLE 41b360 |
0x41abff MOV 0x1c8(%R14),%RCX |
0x41ac06 MOV 0xa0(%R14),%RDX |
0x41ac0d MOV 0x148(%R14),%RSI |
0x41ac14 DEC %RAX |
0x41ac17 MOV %RDI,0x8(%RSP) |
0x41ac1c ADD $0x38,%RDI |
0x41ac20 MOV %RDI,0x50(%RSP) |
0x41ac25 VXORPD %XMM8,%XMM8,%XMM8 |
0x41ac2a XOR %R8D,%R8D |
0x41ac2d JMP 41ac44 |
(288) 0x41ac30 LEA 0x1(%R8),%RDI |
(288) 0x41ac34 VADDSD %XMM0,%XMM8,%XMM8 |
(288) 0x41ac38 CMP %RAX,%R8 |
(288) 0x41ac3b MOV %RDI,%R8 |
(288) 0x41ac3e JE 41ab70 |
(288) 0x41ac44 MOV (%RCX,%R8,8),%R9 |
(288) 0x41ac48 TEST %R9,%R9 |
(288) 0x41ac4b JE 41b100 |
(288) 0x41ac51 MOV 0x268(%RDX),%RDI |
(288) 0x41ac58 MOV 0x18(%RDI),%RDI |
(288) 0x41ac5c MOVSXD (%RDI,%R8,4),%R11 |
(288) 0x41ac60 MOV 0x4(%RDI,%R8,4),%EDI |
(288) 0x41ac65 SUB %R11D,%EDI |
(288) 0x41ac68 VXORPD %XMM0,%XMM0,%XMM0 |
(288) 0x41ac6c TEST %EDI,%EDI |
(288) 0x41ac6e JLE 41ac30 |
(288) 0x41ac70 MOV %R11D,%R12D |
(288) 0x41ac73 VMOVSD 0x8(%R9),%XMM1 |
(288) 0x41ac79 MOV %EDI,%R15D |
(288) 0x41ac7c XOR %R10D,%R10D |
(288) 0x41ac7f CMP $0x8,%EDI |
(288) 0x41ac82 JAE 41b115 |
(288) 0x41ac88 MOV %R15D,%EDI |
(288) 0x41ac8b AND $-0x8,%EDI |
(288) 0x41ac8e CMP %R15,%RDI |
(288) 0x41ac91 JNE 41b245 |
(288) 0x41ac97 TEST %R10D,%R10D |
(288) 0x41ac9a JLE 41ac30 |
(288) 0x41ac9c VMOVSD %XMM8,(%RSP) |
(288) 0x41aca1 VMOVSD 0x238(%R9),%XMM9 |
(288) 0x41acaa MOV 0x218(%R9),%R11 |
(288) 0x41acb1 VMOVSD 0x18(%R9),%XMM0 |
(288) 0x41acb7 VMOVUPS %XMM0,0x10(%RSP) |
(288) 0x41acbd VMOVSD 0x20(%R9),%XMM4 |
(288) 0x41acc3 VMOVSD 0x28(%R9),%XMM2 |
(288) 0x41acc9 VMOVSD 0x30(%R9),%XMM3 |
(288) 0x41accf VMOVSD 0x38(%R9),%XMM6 |
(288) 0x41acd5 VMOVSD 0x40(%R9),%XMM7 |
(288) 0x41acdb VMOVSD 0x48(%R9),%XMM14 |
(288) 0x41ace1 VMOVSD 0x50(%R9),%XMM13 |
(288) 0x41ace7 VMOVSD 0x58(%R9),%XMM10 |
(288) 0x41aced VMOVSD 0x60(%R9),%XMM12 |
(288) 0x41acf3 VMOVSD 0x68(%R9),%XMM1 |
(288) 0x41acf9 VMOVSD 0x70(%R9),%XMM15 |
(288) 0x41acff VMOVSD 0x78(%R9),%XMM11 |
(288) 0x41ad05 VMOVSD 0x80(%R9),%XMM0 |
(288) 0x41ad0e VMOVSD 0x88(%R9),%XMM8 |
(288) 0x41ad17 MOV %R10D,%R10D |
(288) 0x41ad1a MOV %R10,%RBX |
(288) 0x41ad1d VMOVSD 0x90(%R9),%XMM5 |
(288) 0x41ad26 MOV $-0x4,%EDI |
(288) 0x41ad2b AND %RDI,%RBX |
(288) 0x41ad2e VMOVUPD %XMM0,0x150(%RSP) |
(288) 0x41ad37 VMOVUPD %XMM8,0x140(%RSP) |
(288) 0x41ad40 VMOVUPD %XMM5,0x130(%RSP) |
(288) 0x41ad49 JE 41b28a |
(288) 0x41ad4f VMOVUPD %XMM9,0x120(%RSP) |
(288) 0x41ad58 VBROADCASTSD %XMM9,%YMM9 |
(288) 0x41ad5d VMOVUPD %YMM9,0x300(%RSP) |
(288) 0x41ad66 VBROADCASTSD 0x10(%RSP),%YMM9 |
(288) 0x41ad6d VMOVUPS %YMM9,0x2e0(%RSP) |
(288) 0x41ad76 VMOVUPD %XMM4,0x100(%RSP) |
(288) 0x41ad7f VBROADCASTSD %XMM4,%YMM4 |
(288) 0x41ad84 VMOVUPD %YMM4,0x2c0(%RSP) |
(288) 0x41ad8d VMOVUPD %XMM2,0xb0(%RSP) |
(288) 0x41ad96 VBROADCASTSD %XMM2,%YMM2 |
(288) 0x41ad9b VMOVUPD %YMM2,0x2a0(%RSP) |
(288) 0x41ada4 VMOVUPD %XMM3,0xd0(%RSP) |
(288) 0x41adad VBROADCASTSD %XMM3,%YMM2 |
(288) 0x41adb2 VMOVUPD %YMM2,0x280(%RSP) |
(288) 0x41adbb VMOVUPD %XMM6,0x110(%RSP) |
(288) 0x41adc4 VBROADCASTSD %XMM6,%YMM2 |
(288) 0x41adc9 VMOVUPD %YMM2,0x260(%RSP) |
(288) 0x41add2 VMOVUPD %XMM7,0xf0(%RSP) |
(288) 0x41addb VBROADCASTSD %XMM7,%YMM2 |
(288) 0x41ade0 VMOVUPD %YMM2,0x240(%RSP) |
(288) 0x41ade9 VMOVUPD %XMM14,0x80(%RSP) |
(288) 0x41adf2 VBROADCASTSD %XMM14,%YMM2 |
(288) 0x41adf7 VMOVUPD %YMM2,0x220(%RSP) |
(288) 0x41ae00 VMOVUPD %XMM13,0x90(%RSP) |
(288) 0x41ae09 VBROADCASTSD %XMM13,%YMM2 |
(288) 0x41ae0e VMOVUPD %YMM2,0x200(%RSP) |
(288) 0x41ae17 VMOVUPD %XMM10,0xe0(%RSP) |
(288) 0x41ae20 VBROADCASTSD %XMM10,%YMM2 |
(288) 0x41ae25 VMOVUPD %YMM2,0x1e0(%RSP) |
(288) 0x41ae2e VMOVUPD %XMM12,0xa0(%RSP) |
(288) 0x41ae37 VBROADCASTSD %XMM12,%YMM2 |
(288) 0x41ae3c VMOVUPD %YMM2,0x1c0(%RSP) |
(288) 0x41ae45 VMOVUPD %XMM1,0x60(%RSP) |
(288) 0x41ae4b VBROADCASTSD %XMM1,%YMM14 |
(288) 0x41ae50 VMOVUPD %XMM15,0x70(%RSP) |
(288) 0x41ae56 VBROADCASTSD %XMM15,%YMM15 |
(288) 0x41ae5b VMOVUPD %XMM11,0xc0(%RSP) |
(288) 0x41ae64 VBROADCASTSD %XMM11,%YMM4 |
(288) 0x41ae69 VBROADCASTSD %XMM0,%YMM3 |
(288) 0x41ae6e VBROADCASTSD %XMM8,%YMM1 |
(288) 0x41ae73 XOR %EDI,%EDI |
(288) 0x41ae75 VBROADCASTSD %XMM5,%YMM0 |
(288) 0x41ae7a VXORPD %XMM2,%XMM2,%XMM2 |
(288) 0x41ae7e VMOVDQU 0x1a0(%RSP),%YMM11 |
(288) 0x41ae87 VMOVDQU 0x180(%RSP),%YMM13 |
(288) 0x41ae90 VMOVDQU 0x160(%RSP),%YMM12 |
(288) 0x41ae99 NOPL (%RAX) |
(290) 0x41aea0 VMOVUPD 0x300(%RSP),%YMM5 |
(290) 0x41aea9 VMULPD (%RSI,%RDI,8),%YMM5,%YMM5 |
(290) 0x41aeae VCVTTPD2DQ %YMM5,%XMM6 |
(290) 0x41aeb2 VROUNDPD $0xb,%YMM5,%YMM7 |
(290) 0x41aeb8 VSUBPD %YMM7,%YMM5,%YMM5 |
(290) 0x41aebc VPMOVSXDQ %XMM6,%YMM6 |
(290) 0x41aec1 VPSLLQ $0x3,%YMM6,%YMM6 |
(290) 0x41aec6 VMOVQ %R11,%XMM7 |
(290) 0x41aecb VPBROADCASTQ %XMM7,%YMM7 |
(290) 0x41aed0 VPADDQ %YMM6,%YMM7,%YMM6 |
(290) 0x41aed4 VMOVQ %XMM6,%R9 |
(290) 0x41aed9 VEXTRACTI128 $0x1,%YMM6,%XMM7 |
(290) 0x41aedf VMOVQ %XMM7,%R14 |
(290) 0x41aee4 VPEXTRQ $0x1,%XMM6,%R15 |
(290) 0x41aeea VPEXTRQ $0x1,%XMM7,%R12 |
(290) 0x41aef0 VMOVSD (%R9),%XMM7 |
(290) 0x41aef5 VMOVSD (%R14),%XMM8 |
(290) 0x41aefa VPADDQ %YMM6,%YMM12,%YMM9 |
(290) 0x41aefe VMOVQ %XMM9,%R9 |
(290) 0x41af03 VMOVHPD (%R15),%XMM7,%XMM7 |
(290) 0x41af08 VPEXTRQ $0x1,%XMM9,%R14 |
(290) 0x41af0e VMOVHPD (%R12),%XMM8,%XMM8 |
(290) 0x41af14 VEXTRACTI128 $0x1,%YMM9,%XMM9 |
(290) 0x41af1a VPEXTRQ $0x1,%XMM9,%R15 |
(290) 0x41af20 VINSERTF128 $0x1,%XMM8,%YMM7,%YMM7 |
(290) 0x41af26 VMOVQ %XMM9,%R12 |
(290) 0x41af2b VMOVSD (%R9),%XMM8 |
(290) 0x41af30 VPADDQ %YMM6,%YMM13,%YMM9 |
(290) 0x41af34 VMOVSD (%R12),%XMM10 |
(290) 0x41af3a VPEXTRQ $0x1,%XMM9,%R9 |
(290) 0x41af40 VMOVHPD (%R14),%XMM8,%XMM8 |
(290) 0x41af45 VMOVQ %XMM9,%R14 |
(290) 0x41af4a VEXTRACTI128 $0x1,%YMM9,%XMM9 |
(290) 0x41af50 VMOVHPD (%R15),%XMM10,%XMM10 |
(290) 0x41af55 VMOVQ %XMM9,%R15 |
(290) 0x41af5a VPEXTRQ $0x1,%XMM9,%R12 |
(290) 0x41af60 VINSERTF128 $0x1,%XMM10,%YMM8,%YMM8 |
(290) 0x41af66 VMOVSD (%R15),%XMM9 |
(290) 0x41af6b VMOVSD (%R14),%XMM10 |
(290) 0x41af70 VMOVHPD (%R12),%XMM9,%XMM9 |
(290) 0x41af76 VMOVHPD (%R9),%XMM10,%XMM10 |
(290) 0x41af7b VINSERTF128 $0x1,%XMM9,%YMM10,%YMM9 |
(290) 0x41af81 VPADDQ %YMM6,%YMM11,%YMM6 |
(290) 0x41af85 VMOVQ %XMM6,%R15 |
(290) 0x41af8a VPEXTRQ $0x1,%XMM6,%R14 |
(290) 0x41af90 VEXTRACTI128 $0x1,%YMM6,%XMM6 |
(290) 0x41af96 VMOVQ %XMM6,%R12 |
(290) 0x41af9b VPEXTRQ $0x1,%XMM6,%R9 |
(290) 0x41afa1 VMOVUPD 0x2e0(%RSP),%YMM6 |
(290) 0x41afaa VFMADD213PD 0x2c0(%RSP),%YMM5,%YMM6 |
(290) 0x41afb4 VFMADD213PD 0x2a0(%RSP),%YMM5,%YMM6 |
(290) 0x41afbe VFMADD213PD 0x280(%RSP),%YMM5,%YMM6 |
(290) 0x41afc8 VFMADD213PD %YMM2,%YMM7,%YMM6 |
(290) 0x41afcd VMOVUPD 0x260(%RSP),%YMM2 |
(290) 0x41afd6 VMOVSD (%R12),%XMM7 |
(290) 0x41afdc VFMADD213PD 0x240(%RSP),%YMM5,%YMM2 |
(290) 0x41afe6 VFMADD213PD 0x220(%RSP),%YMM5,%YMM2 |
(290) 0x41aff0 VFMADD213PD 0x200(%RSP),%YMM5,%YMM2 |
(290) 0x41affa VFMADD213PD %YMM6,%YMM8,%YMM2 |
(290) 0x41afff VMOVSD (%R15),%XMM6 |
(290) 0x41b004 VMOVUPD 0x1e0(%RSP),%YMM8 |
(290) 0x41b00d VFMADD213PD 0x1c0(%RSP),%YMM5,%YMM8 |
(290) 0x41b017 VMOVHPD (%R14),%XMM6,%XMM6 |
(290) 0x41b01c VFMADD213PD %YMM14,%YMM5,%YMM8 |
(290) 0x41b021 VFMADD213PD %YMM15,%YMM5,%YMM8 |
(290) 0x41b026 VMOVHPD (%R9),%XMM7,%XMM7 |
(290) 0x41b02b VFMADD213PD %YMM2,%YMM9,%YMM8 |
(290) 0x41b030 VINSERTF128 $0x1,%XMM7,%YMM6,%YMM6 |
(290) 0x41b036 VMOVAPD %YMM4,%YMM2 |
(290) 0x41b03a VFMADD213PD %YMM3,%YMM5,%YMM2 |
(290) 0x41b03f VFMADD213PD %YMM1,%YMM5,%YMM2 |
(290) 0x41b044 VFMADD213PD %YMM0,%YMM5,%YMM2 |
(290) 0x41b049 VFMADD213PD %YMM8,%YMM6,%YMM2 |
(290) 0x41b04e ADD $0x4,%RDI |
(290) 0x41b052 CMP %RBX,%RDI |
(290) 0x41b055 JB 41aea0 |
(288) 0x41b05b VEXTRACTF128 $0x1,%YMM2,%XMM0 |
(288) 0x41b061 VADDPD %XMM0,%XMM2,%XMM0 |
(288) 0x41b065 VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(288) 0x41b06a VADDSD %XMM1,%XMM0,%XMM0 |
(288) 0x41b06e CMP %R10,%RBX |
(288) 0x41b071 VMOVSD (%RSP),%XMM8 |
(288) 0x41b076 VMOVUPD 0x120(%RSP),%XMM9 |
(288) 0x41b07f VMOVUPD 0x10(%RSP),%XMM5 |
(288) 0x41b085 VMOVUPD 0x110(%RSP),%XMM6 |
(288) 0x41b08e VMOVUPD 0x100(%RSP),%XMM4 |
(288) 0x41b097 VMOVUPD 0xf0(%RSP),%XMM7 |
(288) 0x41b0a0 VMOVUPD 0xe0(%RSP),%XMM10 |
(288) 0x41b0a9 VMOVUPD 0xd0(%RSP),%XMM3 |
(288) 0x41b0b2 VMOVUPD 0xc0(%RSP),%XMM11 |
(288) 0x41b0bb VMOVUPD 0xb0(%RSP),%XMM2 |
(288) 0x41b0c4 VMOVUPD 0xa0(%RSP),%XMM12 |
(288) 0x41b0cd VMOVUPD 0x90(%RSP),%XMM13 |
(288) 0x41b0d6 VMOVUPD 0x80(%RSP),%XMM14 |
(288) 0x41b0df VMOVUPD 0x70(%RSP),%XMM15 |
(288) 0x41b0e5 VMOVUPD 0x60(%RSP),%XMM1 |
(288) 0x41b0eb JE 41ac30 |
(288) 0x41b0f1 JMP 41b29b |
(288) 0x41b100 LEA 0x1(%R8),%RDI |
(288) 0x41b104 CMP %RAX,%R8 |
(288) 0x41b107 MOV %RDI,%R8 |
(288) 0x41b10a JNE 41ac44 |
0x41b110 JMP 41ab70 |
(288) 0x41b115 MOV 0x50(%RSP),%RDI |
(288) 0x41b11a LEA (%RDI,%R11,8),%RDI |
(288) 0x41b11e MOV %R15D,%EBX |
(288) 0x41b121 AND $-0x8,%EBX |
(288) 0x41b124 XOR %R13D,%R13D |
(288) 0x41b127 XOR %R10D,%R10D |
(288) 0x41b12a JMP 41b13d |
(292) 0x41b130 ADD $0x8,%R13 |
(292) 0x41b134 CMP %R13,%RBX |
(292) 0x41b137 JE 41ac88 |
(292) 0x41b13d VMOVSD -0x38(%RDI,%R13,8),%XMM2 |
(292) 0x41b144 LEA (%R12,%R13,1),%R14 |
(292) 0x41b148 VUCOMISD %XMM2,%XMM1 |
(292) 0x41b14c JBE 41b160 |
(292) 0x41b14e CMP $-0x1,%R14D |
(292) 0x41b152 JE 41b160 |
(292) 0x41b154 MOVSXD %R10D,%R10 |
(292) 0x41b157 VMOVSD %XMM2,(%RSI,%R10,8) |
(292) 0x41b15d INC %R10D |
(292) 0x41b160 VMOVSD -0x30(%RDI,%R13,8),%XMM2 |
(292) 0x41b167 VUCOMISD %XMM2,%XMM1 |
(292) 0x41b16b JBE 41b17f |
(292) 0x41b16d CMP $-0x2,%R14D |
(292) 0x41b171 JE 41b17f |
(292) 0x41b173 MOVSXD %R10D,%R10 |
(292) 0x41b176 VMOVSD %XMM2,(%RSI,%R10,8) |
(292) 0x41b17c INC %R10D |
(292) 0x41b17f VMOVSD -0x28(%RDI,%R13,8),%XMM2 |
(292) 0x41b186 VUCOMISD %XMM2,%XMM1 |
(292) 0x41b18a JBE 41b19e |
(292) 0x41b18c CMP $-0x3,%R14D |
(292) 0x41b190 JE 41b19e |
(292) 0x41b192 MOVSXD %R10D,%R10 |
(292) 0x41b195 VMOVSD %XMM2,(%RSI,%R10,8) |
(292) 0x41b19b INC %R10D |
(292) 0x41b19e VMOVSD -0x20(%RDI,%R13,8),%XMM2 |
(292) 0x41b1a5 VUCOMISD %XMM2,%XMM1 |
(292) 0x41b1a9 JBE 41b1bd |
(292) 0x41b1ab CMP $-0x4,%R14D |
(292) 0x41b1af JE 41b1bd |
(292) 0x41b1b1 MOVSXD %R10D,%R10 |
(292) 0x41b1b4 VMOVSD %XMM2,(%RSI,%R10,8) |
(292) 0x41b1ba INC %R10D |
(292) 0x41b1bd VMOVSD -0x18(%RDI,%R13,8),%XMM2 |
(292) 0x41b1c4 VUCOMISD %XMM2,%XMM1 |
(292) 0x41b1c8 JBE 41b1dc |
(292) 0x41b1ca CMP $-0x5,%R14D |
(292) 0x41b1ce JE 41b1dc |
(292) 0x41b1d0 MOVSXD %R10D,%R10 |
(292) 0x41b1d3 VMOVSD %XMM2,(%RSI,%R10,8) |
(292) 0x41b1d9 INC %R10D |
(292) 0x41b1dc VMOVSD -0x10(%RDI,%R13,8),%XMM2 |
(292) 0x41b1e3 VUCOMISD %XMM2,%XMM1 |
(292) 0x41b1e7 JBE 41b1fb |
(292) 0x41b1e9 CMP $-0x6,%R14D |
(292) 0x41b1ed JE 41b1fb |
(292) 0x41b1ef MOVSXD %R10D,%R10 |
(292) 0x41b1f2 VMOVSD %XMM2,(%RSI,%R10,8) |
(292) 0x41b1f8 INC %R10D |
(292) 0x41b1fb VMOVSD -0x8(%RDI,%R13,8),%XMM2 |
(292) 0x41b202 VUCOMISD %XMM2,%XMM1 |
(292) 0x41b206 JBE 41b21a |
(292) 0x41b208 CMP $-0x7,%R14D |
(292) 0x41b20c JE 41b21a |
(292) 0x41b20e MOVSXD %R10D,%R10 |
(292) 0x41b211 VMOVSD %XMM2,(%RSI,%R10,8) |
(292) 0x41b217 INC %R10D |
(292) 0x41b21a VMOVSD (%RDI,%R13,8),%XMM2 |
(292) 0x41b220 VUCOMISD %XMM2,%XMM1 |
(292) 0x41b224 JBE 41b130 |
(292) 0x41b22a CMP $-0x8,%R14D |
(292) 0x41b22e JE 41b130 |
(292) 0x41b234 MOVSXD %R10D,%R10 |
(292) 0x41b237 VMOVSD %XMM2,(%RSI,%R10,8) |
(292) 0x41b23d INC %R10D |
(292) 0x41b240 JMP 41b130 |
(288) 0x41b245 MOVSXD %R12D,%RBX |
(288) 0x41b248 NOT %R11D |
(288) 0x41b24b MOV 0x8(%RSP),%R14 |
(288) 0x41b250 LEA (%R14,%RBX,8),%RBX |
(288) 0x41b254 JMP 41b26c |
(291) 0x41b260 INC %RDI |
(291) 0x41b263 CMP %RDI,%R15 |
(291) 0x41b266 JE 41ac97 |
(291) 0x41b26c VMOVSD (%RBX,%RDI,8),%XMM2 |
(291) 0x41b271 VUCOMISD %XMM2,%XMM1 |
(291) 0x41b275 JBE 41b260 |
(291) 0x41b277 CMP %EDI,%R11D |
(291) 0x41b27a JE 41b260 |
(291) 0x41b27c MOVSXD %R10D,%R10 |
(291) 0x41b27f VMOVSD %XMM2,(%RSI,%R10,8) |
(291) 0x41b285 INC %R10D |
(291) 0x41b288 JMP 41b260 |
(288) 0x41b28a VXORPD %XMM0,%XMM0,%XMM0 |
(288) 0x41b28e XOR %EBX,%EBX |
(288) 0x41b290 VMOVSD (%RSP),%XMM8 |
(288) 0x41b295 VMOVUPD 0x10(%RSP),%XMM5 |
(288) 0x41b29b VUNPCKLPD 0x140(%RSP),%XMM1,%XMM1 |
(288) 0x41b2a4 VUNPCKLPD %XMM14,%XMM2,%XMM2 |
(288) 0x41b2a9 VINSERTF128 $0x1,%XMM1,%YMM2,%YMM1 |
(288) 0x41b2af VUNPCKLPD 0x130(%RSP),%XMM15,%XMM2 |
(288) 0x41b2b8 VUNPCKLPD %XMM13,%XMM3,%XMM3 |
(288) 0x41b2bd VINSERTF128 $0x1,%XMM2,%YMM3,%YMM2 |
(288) 0x41b2c3 VUNPCKLPD 0x150(%RSP),%XMM12,%XMM3 |
(288) 0x41b2cc VUNPCKLPD %XMM7,%XMM4,%XMM4 |
(288) 0x41b2d0 VINSERTF128 $0x1,%XMM3,%YMM4,%YMM3 |
(288) 0x41b2d6 VUNPCKLPD %XMM11,%XMM10,%XMM4 |
(288) 0x41b2db VUNPCKLPD %XMM6,%XMM5,%XMM5 |
(288) 0x41b2df VINSERTF128 $0x1,%XMM4,%YMM5,%YMM4 |
(288) 0x41b2e5 NOPW %CS:(%RAX,%RAX,1) |
(289) 0x41b2f0 VMULSD (%RSI,%RBX,8),%XMM9,%XMM5 |
(289) 0x41b2f5 VROUNDSD $0xb,%XMM5,%XMM5,%XMM6 |
(289) 0x41b2fb VCVTTSD2SI %XMM5,%EDI |
(289) 0x41b2ff VSUBSD %XMM6,%XMM5,%XMM5 |
(289) 0x41b303 VMULSD %XMM5,%XMM5,%XMM6 |
(289) 0x41b307 MOVSXD %EDI,%RDI |
(289) 0x41b30a VMULSD %XMM5,%XMM6,%XMM7 |
(289) 0x41b30e VBROADCASTSD %XMM6,%YMM6 |
(289) 0x41b313 VBROADCASTSD %XMM5,%YMM5 |
(289) 0x41b318 VFMADD213PD %YMM2,%YMM1,%YMM5 |
(289) 0x41b31d VBROADCASTSD %XMM7,%YMM7 |
(289) 0x41b322 VFMADD231PD %YMM6,%YMM3,%YMM5 |
(289) 0x41b327 VFMADD231PD %YMM7,%YMM4,%YMM5 |
(289) 0x41b32c VMULPD (%R11,%RDI,8),%YMM5,%YMM5 |
(289) 0x41b332 VEXTRACTF128 $0x1,%YMM5,%XMM6 |
(289) 0x41b338 VADDPD %XMM6,%XMM5,%XMM5 |
(289) 0x41b33c VSHUFPD $0x1,%XMM5,%XMM5,%XMM6 |
(289) 0x41b341 VADDSD %XMM6,%XMM5,%XMM5 |
(289) 0x41b345 VADDSD %XMM5,%XMM0,%XMM0 |
(289) 0x41b349 INC %RBX |
(289) 0x41b34c CMP %RBX,%R10 |
(289) 0x41b34f JNE 41b2f0 |
(288) 0x41b351 JMP 41ac30 |
0x41b360 MOV 0x90(%R14),%EBX |
0x41b367 TEST %EBX,%EBX |
0x41b369 JLE 41ab61 |
0x41b36f MOV %RDI,0x8(%RSP) |
0x41b374 MOV 0xa0(%R14),%RAX |
0x41b37b MOV 0x1c8(%R14),%R14 |
0x41b382 MOV 0x18(%RAX),%R15 |
0x41b386 VXORPD %XMM8,%XMM8,%XMM8 |
0x41b38b XOR %R12D,%R12D |
0x41b38e JMP 41b3a0 |
(287) 0x41b390 VADDSD %XMM1,%XMM8,%XMM8 |
(287) 0x41b394 INC %R12 |
(287) 0x41b397 CMP %R12,%RBX |
(287) 0x41b39a JE 41ab70 |
(287) 0x41b3a0 MOVSXD (%R15,%R12,4),%RAX |
(287) 0x41b3a4 MOV (%R14,%RAX,8),%R13 |
(287) 0x41b3a8 TEST %R13,%R13 |
(287) 0x41b3ab JE 41b394 |
(287) 0x41b3ad MOV 0x8(%RSP),%RAX |
(287) 0x41b3b2 VMOVSD (%RAX,%R12,8),%XMM0 |
(287) 0x41b3b8 VMOVSD 0x8(%R13),%XMM2 |
(287) 0x41b3be VXORPD %XMM1,%XMM1,%XMM1 |
(287) 0x41b3c2 VUCOMISD %XMM0,%XMM2 |
(287) 0x41b3c6 JBE 41b390 |
(287) 0x41b3c8 VMULSD 0x238(%R13),%XMM0,%XMM0 |
(287) 0x41b3d1 LEA 0x58(%RSP),%RDI |
(287) 0x41b3d6 VMOVSD %XMM8,(%RSP) |
(287) 0x41b3db CALL 4d66a0 <modf> |
(287) 0x41b3e0 VMOVSD (%RSP),%XMM8 |
(287) 0x41b3e5 VCVTTSD2SI 0x58(%RSP),%EAX |
(287) 0x41b3eb CLTQ |
(287) 0x41b3ed VMOVSD 0x20(%R13),%XMM1 |
(287) 0x41b3f3 VFMADD231SD 0x18(%R13),%XMM0,%XMM1 |
(287) 0x41b3f9 VFMADD213SD 0x28(%R13),%XMM0,%XMM1 |
(287) 0x41b3ff VFMADD213SD 0x30(%R13),%XMM0,%XMM1 |
(287) 0x41b405 MOV 0x218(%R13),%RCX |
(287) 0x41b40c VMULSD (%RCX,%RAX,8),%XMM1,%XMM1 |
(287) 0x41b411 VMOVSD 0x40(%R13),%XMM2 |
(287) 0x41b417 VFMADD231SD 0x38(%R13),%XMM0,%XMM2 |
(287) 0x41b41d VFMADD213SD 0x48(%R13),%XMM0,%XMM2 |
(287) 0x41b423 VFMADD213SD 0x50(%R13),%XMM0,%XMM2 |
(287) 0x41b429 VFMADD132SD 0x8(%RCX,%RAX,8),%XMM1,%XMM2 |
(287) 0x41b430 VMOVSD 0x60(%R13),%XMM3 |
(287) 0x41b436 VFMADD231SD 0x58(%R13),%XMM0,%XMM3 |
(287) 0x41b43c VFMADD213SD 0x68(%R13),%XMM0,%XMM3 |
(287) 0x41b442 VFMADD213SD 0x70(%R13),%XMM0,%XMM3 |
(287) 0x41b448 VFMADD132SD 0x10(%RCX,%RAX,8),%XMM2,%XMM3 |
(287) 0x41b44f VMOVSD 0x80(%R13),%XMM1 |
(287) 0x41b458 VFMADD231SD 0x78(%R13),%XMM0,%XMM1 |
(287) 0x41b45e VFMADD213SD 0x88(%R13),%XMM0,%XMM1 |
(287) 0x41b467 VFMADD213SD 0x90(%R13),%XMM0,%XMM1 |
(287) 0x41b470 VFMADD132SD 0x18(%RCX,%RAX,8),%XMM3,%XMM1 |
(287) 0x41b477 JMP 41b390 |
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/shared_ptr_base.h: 1308 - 1308 |
-------------------------------------------------------------------------------- |
1308: { return _M_ptr; } |
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/OhmmsVector.h: 223 - 249 |
-------------------------------------------------------------------------------- |
223: return X[i]; |
[...] |
229: return X[i]; |
[...] |
249: inline const_pointer data() const { return X; } |
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/Jastrow/OneBodyJastrowRef.h: 134 - 155 |
-------------------------------------------------------------------------------- |
134: for (int k = 0; k < ratios.size(); ++k) |
135: ratios[k] = std::exp(Vat[VP.refPtcl] - computeU(VP.getDistTableAB(myTableID).getDistRow(k).data())); |
[...] |
141: if (NumGroups > 0) |
142: { |
143: for (int jg = 0; jg < NumGroups; ++jg) |
144: { |
145: if (F[jg] != nullptr) |
146: curVat += F[jg]->evaluateV(-1, Ions.first(jg), Ions.last(jg), dist, DistCompressed.data()); |
147: } |
148: } |
149: else |
150: { |
151: for (int c = 0; c < Nions; ++c) |
152: { |
153: int gid = Ions.GroupID[c]; |
154: if (F[gid] != nullptr) |
155: curVat += F[gid]->evaluate(dist[c]); |
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/Jastrow/BsplineFunctor.h: 166 - 260 |
-------------------------------------------------------------------------------- |
166: if (r >= cutoff_radius) |
167: return 0.0; |
168: r *= DeltaRInv; |
169: real_type ipart, t; |
170: t = std::modf(r, &ipart); |
171: int i = (int)ipart; |
[...] |
179: (SplineCoefs[i+0]*(A[ 0]*tp[0] + A[ 1]*tp[1] + A[ 2]*tp[2] + A[ 3]*tp[3])+ |
180: SplineCoefs[i+1]*(A[ 4]*tp[0] + A[ 5]*tp[1] + A[ 6]*tp[2] + A[ 7]*tp[3])+ |
181: SplineCoefs[i+2]*(A[ 8]*tp[0] + A[ 9]*tp[1] + A[10]*tp[2] + A[11]*tp[3])+ |
[...] |
229: const real_type* restrict distArray = _distArray + iStart; |
[...] |
236: for (int jat = 0; jat < iLimit; jat++) |
237: { |
238: real_type r = distArray[jat]; |
239: // pick the distances smaller than the cutoff and avoid the reference atom |
240: if (r < cutoff_radius && iStart + jat != iat) |
241: distArrayCompressed[iCount++] = distArray[jat]; |
242: } |
243: |
244: real_type d = 0.0; |
245: //#pragma omp simd reduction(+:d) |
246: for (int jat = 0; jat < iCount; jat++) |
247: { |
248: real_type r = distArrayCompressed[jat]; |
249: r *= DeltaRInv; |
250: int i = (int)r; |
251: real_type t = r - real_type(i); |
252: real_type tp0 = t * t * t; |
253: real_type tp1 = t * t; |
254: real_type tp2 = t; |
255: |
256: real_type d1 = SplineCoefs[i + 0] * (A[0] * tp0 + A[1] * tp1 + A[2] * tp2 + A[3]); |
257: real_type d2 = SplineCoefs[i + 1] * (A[4] * tp0 + A[5] * tp1 + A[6] * tp2 + A[7]); |
258: real_type d3 = SplineCoefs[i + 2] * (A[8] * tp0 + A[9] * tp1 + A[10] * tp2 + A[11]); |
259: real_type d4 = SplineCoefs[i + 3] * (A[12] * tp0 + A[13] * tp1 + A[14] * tp2 + A[15]); |
260: d += (d1 + d2 + d3 + d4); |
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/stl_vector.h: 806 - 1056 |
-------------------------------------------------------------------------------- |
806: { return size_type(this->_M_impl._M_finish - this->_M_impl._M_start); } |
[...] |
933: return *(this->_M_impl._M_start + __n); |
[...] |
951: return *(this->_M_impl._M_start + __n); |
[...] |
1056: { return _M_data_ptr(this->_M_impl._M_start); } |
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/Particle/ParticleSet.h: 313 - 316 |
-------------------------------------------------------------------------------- |
313: inline int first(int igroup) const { return (*group_offsets_)[igroup]; } |
314: |
315: ///return the last index of a group i |
316: inline int last(int igroup) const { return (*group_offsets_)[igroup + 1]; } |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►100.00+ | qmcplusplus::WaveFunction::eva[...] | stl_vector.h:806 | exec |
○ | qmcplusplus::NonLocalPP<double[...] | NonLocalPP.hpp:135 | exec |
○ | main.extracted.110 | NewTimer.h:249 | exec |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Path / |
Metric | Value |
---|---|
CQA speedup if no scalar integer | 3.17 |
CQA speedup if FP arith vectorized | 2.57 |
CQA speedup if fully vectorized | 11.78 |
CQA speedup if no inter-iteration dependency | NA |
CQA speedup if next bottleneck killed | 1.36 |
Bottlenecks | micro-operation queue |
Function | miniqmcreference::OneBodyJastrowRef |
Source | OhmmsVector.h:223-223,OhmmsVector.h:229-229,OhmmsVector.h:249-249,OneBodyJastrowRef.h:134-135,OneBodyJastrowRef.h:141-143,OneBodyJastrowRef.h:146-146,OneBodyJastrowRef.h:151-153,stl_vector.h:806-806,stl_vector.h:933-933,stl_vector.h:951-951,stl_vector.h:1056-1056 |
Source loop unroll info | NA |
Source loop unroll confidence level | NA |
Unroll/vectorization loop type | NA |
Unroll factor | NA |
CQA cycles | 9.50 |
CQA cycles if no scalar integer | 3.00 |
CQA cycles if FP arith vectorized | 3.70 |
CQA cycles if fully vectorized | 0.81 |
Front-end cycles | 9.50 |
DIV/SQRT cycles | 2.00 |
P0 cycles | 1.70 |
P1 cycles | 7.00 |
P2 cycles | 7.00 |
P3 cycles | 4.00 |
P4 cycles | 1.70 |
P5 cycles | 2.00 |
P6 cycles | 4.00 |
P7 cycles | 4.00 |
P8 cycles | 4.00 |
P9 cycles | 1.60 |
P10 cycles | 7.00 |
P11 cycles | 0.00 |
Inter-iter dependencies cycles | NA |
FE+BE cycles (UFS) | 9.59 |
Stall cycles (UFS) | 0.52 |
Nb insns | 53.00 |
Nb uops | 57.00 |
Nb loads | 21.00 |
Nb stores | 6.00 |
Nb stack references | 7.00 |
FLOP/cycle | 0.11 |
Nb FLOP add-sub | 1.00 |
Nb FLOP mul | 0.00 |
Nb FLOP fma | 0.00 |
Nb FLOP div | 0.00 |
Nb FLOP rcp | 0.00 |
Nb FLOP sqrt | 0.00 |
Nb FLOP rsqrt | 0.00 |
Bytes/cycle | 21.05 |
Bytes prefetched | 0.00 |
Bytes loaded | 152.00 |
Bytes stored | 48.00 |
Stride 0 | NA |
Stride 1 | NA |
Stride n | NA |
Stride unknown | NA |
Stride indirect | NA |
Vectorization ratio all | 22.73 |
Vectorization ratio load | 0.00 |
Vectorization ratio store | 0.00 |
Vectorization ratio mul | NA |
Vectorization ratio add_sub | 0.00 |
Vectorization ratio fma | NA |
Vectorization ratio div_sqrt | NA |
Vectorization ratio other | 55.56 |
Vector-efficiency ratio all | 14.20 |
Vector-efficiency ratio load | 11.46 |
Vector-efficiency ratio store | 12.50 |
Vector-efficiency ratio mul | NA |
Vector-efficiency ratio add_sub | 12.50 |
Vector-efficiency ratio fma | NA |
Vector-efficiency ratio div_sqrt | NA |
Vector-efficiency ratio other | 17.36 |
Metric | Value |
---|---|
CQA speedup if no scalar integer | 3.17 |
CQA speedup if FP arith vectorized | 2.57 |
CQA speedup if fully vectorized | 11.78 |
CQA speedup if no inter-iteration dependency | NA |
CQA speedup if next bottleneck killed | 1.36 |
Bottlenecks | micro-operation queue |
Function | miniqmcreference::OneBodyJastrowRef |
Source | OhmmsVector.h:223-223,OhmmsVector.h:229-229,OhmmsVector.h:249-249,OneBodyJastrowRef.h:134-135,OneBodyJastrowRef.h:141-143,OneBodyJastrowRef.h:146-146,OneBodyJastrowRef.h:151-153,stl_vector.h:806-806,stl_vector.h:933-933,stl_vector.h:951-951,stl_vector.h:1056-1056 |
Source loop unroll info | NA |
Source loop unroll confidence level | NA |
Unroll/vectorization loop type | NA |
Unroll factor | NA |
CQA cycles | 9.50 |
CQA cycles if no scalar integer | 3.00 |
CQA cycles if FP arith vectorized | 3.70 |
CQA cycles if fully vectorized | 0.81 |
Front-end cycles | 9.50 |
DIV/SQRT cycles | 2.00 |
P0 cycles | 1.70 |
P1 cycles | 7.00 |
P2 cycles | 7.00 |
P3 cycles | 4.00 |
P4 cycles | 1.70 |
P5 cycles | 2.00 |
P6 cycles | 4.00 |
P7 cycles | 4.00 |
P8 cycles | 4.00 |
P9 cycles | 1.60 |
P10 cycles | 7.00 |
P11 cycles | 0.00 |
Inter-iter dependencies cycles | NA |
FE+BE cycles (UFS) | 9.59 |
Stall cycles (UFS) | 0.52 |
Nb insns | 53.00 |
Nb uops | 57.00 |
Nb loads | 21.00 |
Nb stores | 6.00 |
Nb stack references | 7.00 |
FLOP/cycle | 0.11 |
Nb FLOP add-sub | 1.00 |
Nb FLOP mul | 0.00 |
Nb FLOP fma | 0.00 |
Nb FLOP div | 0.00 |
Nb FLOP rcp | 0.00 |
Nb FLOP sqrt | 0.00 |
Nb FLOP rsqrt | 0.00 |
Bytes/cycle | 21.05 |
Bytes prefetched | 0.00 |
Bytes loaded | 152.00 |
Bytes stored | 48.00 |
Stride 0 | NA |
Stride 1 | NA |
Stride n | NA |
Stride unknown | NA |
Stride indirect | NA |
Vectorization ratio all | 22.73 |
Vectorization ratio load | 0.00 |
Vectorization ratio store | 0.00 |
Vectorization ratio mul | NA |
Vectorization ratio add_sub | 0.00 |
Vectorization ratio fma | NA |
Vectorization ratio div_sqrt | NA |
Vectorization ratio other | 55.56 |
Vector-efficiency ratio all | 14.20 |
Vector-efficiency ratio load | 11.46 |
Vector-efficiency ratio store | 12.50 |
Vector-efficiency ratio mul | NA |
Vector-efficiency ratio add_sub | 12.50 |
Vector-efficiency ratio fma | NA |
Vector-efficiency ratio div_sqrt | NA |
Vector-efficiency ratio other | 17.36 |
Path / |
Function | miniqmcreference::OneBodyJastrowRef |
Source file and lines | OneBodyJastrowRef.h:134-155 |
Module | exec |
nb instructions | 53 |
nb uops | 57 |
loop length | 259 |
used x86 registers | 11 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 7 |
micro-operation queue | 9.50 cycles |
front end | 9.50 cycles |
Port | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 2.00 | 1.70 | 7.00 | 7.00 | 4.00 | 1.70 | 2.00 | 4.00 | 4.00 | 4.00 | 1.60 | 7.00 |
cycles | 2.00 | 1.70 | 7.00 | 7.00 | 4.00 | 1.70 | 2.00 | 4.00 | 4.00 | 4.00 | 1.60 | 7.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 9.59 |
Stall cycles | 0.52 |
LM full (events) | 1.38 |
Front-end | 9.50 |
Dispatch | 7.00 |
Overall L1 | 9.50 |
all | 14% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 33% |
all | 37% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 100% |
all | 22% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 55% |
all | 12% |
load | 10% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 13% |
all | 17% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 25% |
all | 14% |
load | 11% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 17% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
VXORPD %XMM8,%XMM8,%XMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD 0x40(%RSP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VSUBSD %XMM8,%XMM0,%XMM0 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4d6610 <exp> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x38(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RSP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD %XMM0,(%RAX,%RBX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
INC %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x8(%RCX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SAR $0x3,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
CMP %RBX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x28(%RSP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JBE 41b47c <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0x98c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x30(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVSXD 0x2a0(%RDI),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xf0(%R14),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD (%RCX,%RAX,8),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD %XMM0,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa8(%R14),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 460d00 <_ZNK11qmcplusplus11ParticleSet14getDistTableABEi> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x48(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RBX,%RBX,4),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x18(%RAX,%RCX,8),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x98(%R14),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %EAX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV %RBX,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JLE 41b360 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0x870> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x1c8(%R14),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa0(%R14),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x148(%R14),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
DEC %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,0x8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $0x38,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VXORPD %XMM8,%XMM8,%XMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 41ac44 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0x154> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
JMP 41ab70 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0x80> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV 0x90(%R14),%EBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %EBX,%EBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 41ab61 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0x71> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RDI,0x8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa0(%R14),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x1c8(%R14),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RAX),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VXORPD %XMM8,%XMM8,%XMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R12D,%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 41b3a0 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0x8b0> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
Function | miniqmcreference::OneBodyJastrowRef |
Source file and lines | OneBodyJastrowRef.h:134-155 |
Module | exec |
nb instructions | 53 |
nb uops | 57 |
loop length | 259 |
used x86 registers | 11 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 7 |
micro-operation queue | 9.50 cycles |
front end | 9.50 cycles |
Port | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 2.00 | 1.70 | 7.00 | 7.00 | 4.00 | 1.70 | 2.00 | 4.00 | 4.00 | 4.00 | 1.60 | 7.00 |
cycles | 2.00 | 1.70 | 7.00 | 7.00 | 4.00 | 1.70 | 2.00 | 4.00 | 4.00 | 4.00 | 1.60 | 7.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 9.59 |
Stall cycles | 0.52 |
LM full (events) | 1.38 |
Front-end | 9.50 |
Dispatch | 7.00 |
Overall L1 | 9.50 |
all | 14% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 33% |
all | 37% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 100% |
all | 22% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 55% |
all | 12% |
load | 10% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 13% |
all | 17% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 25% |
all | 14% |
load | 11% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 17% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
VXORPD %XMM8,%XMM8,%XMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD 0x40(%RSP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VSUBSD %XMM8,%XMM0,%XMM0 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4d6610 <exp> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x38(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RSP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD %XMM0,(%RAX,%RBX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
INC %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x8(%RCX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SAR $0x3,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
CMP %RBX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x28(%RSP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JBE 41b47c <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0x98c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x30(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVSXD 0x2a0(%RDI),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xf0(%R14),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD (%RCX,%RAX,8),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD %XMM0,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa8(%R14),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 460d00 <_ZNK11qmcplusplus11ParticleSet14getDistTableABEi> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x48(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RBX,%RBX,4),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x18(%RAX,%RCX,8),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x98(%R14),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %EAX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV %RBX,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JLE 41b360 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0x870> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x1c8(%R14),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa0(%R14),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x148(%R14),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
DEC %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,0x8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $0x38,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VXORPD %XMM8,%XMM8,%XMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 41ac44 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0x154> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
JMP 41ab70 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0x80> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV 0x90(%R14),%EBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %EBX,%EBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 41ab61 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0x71> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RDI,0x8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa0(%R14),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x1c8(%R14),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RAX),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VXORPD %XMM8,%XMM8,%XMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R12D,%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 41b3a0 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0x8b0> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |