Loop Id: 755 | Module: exec | Source: MultiBsplineRef.hpp:227-262 [...] | Coverage: 0.03% |
---|
Loop Id: 755 | Module: exec | Source: MultiBsplineRef.hpp:227-262 [...] | Coverage: 0.03% |
---|
0x435780 MOV %R13,%R9 |
0x435783 MOV 0x380(%RSP),%RAX |
0x43578b ADD %RAX,%R14 |
0x43578e ADD %RAX,%R12 |
0x435791 MOV 0x68(%RSP),%R15 |
0x435796 ADD %RAX,%R15 |
0x435799 MOV 0x70(%RSP),%RCX |
0x43579e ADD %RAX,%RCX |
0x4357a1 ADD %RAX,0x1c8(%RSP) |
0x4357a9 ADD %RAX,0x1d0(%RSP) |
0x4357b1 ADD %RAX,0x1d8(%RSP) |
0x4357b9 ADD %RAX,0x1e0(%RSP) |
0x4357c1 MOV 0x198(%RSP),%RAX |
0x4357c9 ADD %RAX,0x1a0(%RSP) |
0x4357d1 ADD %RAX,0x1a8(%RSP) |
0x4357d9 ADD %RAX,0x1b0(%RSP) |
0x4357e1 ADD %RAX,0x1b8(%RSP) |
0x4357e9 MOV 0x3a8(%RSP),%RAX |
0x4357f1 CMP $0x3,%RAX |
0x4357f5 LEA 0x1(%RAX),%RAX |
0x4357f9 MOV 0x3a0(%RSP),%RDI |
0x435801 MOV %RSI,%R13 |
0x435804 JE 4355f0 |
0x43580a MOV %R15,0x68(%RSP) |
0x43580f MOV %RCX,0x70(%RSP) |
0x435814 VMOVSD 0x5e0(%RSP,%RAX,8),%XMM0 |
0x43581d VMULSD 0x398(%RSP),%XMM0,%XMM2 |
0x435826 VMOVUPD %XMM2,0xf0(%RSP) |
0x43582f VMOVSD 0x390(%RSP),%XMM2 |
0x435838 VMULSD %XMM2,%XMM0,%XMM1 |
0x43583c VMOVUPD %XMM1,0x140(%RSP) |
0x435845 VMOVSD 0x388(%RSP),%XMM4 |
0x43584e VMULSD %XMM4,%XMM0,%XMM0 |
0x435852 VMOVUPD %XMM0,0x20(%RSP) |
0x435858 VMOVSD 0x540(%RSP,%RAX,8),%XMM0 |
0x435861 VMULSD %XMM2,%XMM0,%XMM10 |
0x435865 VMULSD %XMM4,%XMM0,%XMM0 |
0x435869 VMOVUPD %XMM0,0x130(%RSP) |
0x435872 VMULSD 0x500(%RSP,%RAX,8),%XMM4,%XMM0 |
0x43587b VMOVUPD %XMM0,0xe0(%RSP) |
0x435884 CMP $0x81,%R13D |
0x43588b VMOVUPD %XMM10,0x470(%RSP) |
0x435894 MOV %RAX,0x3a8(%RSP) |
0x43589c JB 4363e0 |
0x4358a2 TEST %R13D,%R13D |
0x4358a5 MOV %R13,%RSI |
0x4358a8 MOV %R9,%R13 |
0x4358ab MOV 0x60(%RSP),%RDI |
0x4358b0 JLE 435780 |
0x4358b6 VBROADCASTSD 0xf0(%RSP),%YMM7 |
0x4358c0 VBROADCASTSD %XMM10,%YMM1 |
0x4358c5 VMOVUPD %YMM1,0x780(%RSP) |
0x4358ce VBROADCASTSD 0x140(%RSP),%YMM10 |
0x4358d8 VBROADCASTSD 0xe0(%RSP),%YMM1 |
0x4358e2 VMOVUPS %YMM1,0x760(%RSP) |
0x4358eb VBROADCASTSD 0x130(%RSP),%YMM2 |
0x4358f5 VBROADCASTSD 0x20(%RSP),%YMM1 |
0x4358fc MOV 0x8(%RSP),%RAX |
0x435901 MOV %RAX,0x280(%RSP) |
0x435909 MOV 0x188(%RSP),%RAX |
0x435911 MOV %RAX,0x278(%RSP) |
0x435919 MOV 0x180(%RSP),%RAX |
0x435921 MOV %RAX,0x270(%RSP) |
0x435929 MOV 0x178(%RSP),%RAX |
0x435931 MOV %RAX,0x268(%RSP) |
0x435939 MOV 0x170(%RSP),%RAX |
0x435941 MOV %RAX,0x260(%RSP) |
0x435949 MOV %R8,%RCX |
0x43594c MOV 0x50(%RSP),%R15 |
0x435951 MOV %R11,0x238(%RSP) |
0x435959 MOV 0x58(%RSP),%RAX |
0x43595e MOV %RAX,0x230(%RSP) |
0x435966 MOV %RBX,0x228(%RSP) |
0x43596e MOV %R10,0x220(%RSP) |
0x435976 MOV %RDX,0x218(%RSP) |
0x43597e MOV 0x190(%RSP),%RAX |
0x435986 MOV %RAX,0x210(%RSP) |
0x43598e MOV %R13,0xa8(%RSP) |
0x435996 MOV 0x1b8(%RSP),%RAX |
0x43599e MOV %RAX,0x258(%RSP) |
0x4359a6 MOV 0x1b0(%RSP),%RAX |
0x4359ae MOV %RAX,0x250(%RSP) |
0x4359b6 MOV 0x1a8(%RSP),%RAX |
0x4359be MOV %RAX,0x248(%RSP) |
0x4359c6 MOV 0x1a0(%RSP),%RAX |
0x4359ce MOV %RAX,0x240(%RSP) |
0x4359d6 MOV 0x378(%RSP),%RAX |
0x4359de MOV 0x70(%RSP),%RDX |
0x4359e3 MOV %RDX,0x208(%RSP) |
0x4359eb MOV 0x68(%RSP),%RDX |
0x4359f0 MOV %RDX,0x200(%RSP) |
0x4359f8 MOV %R12,0x1f8(%RSP) |
0x435a00 MOV %R14,0x1f0(%RSP) |
0x435a08 MOV %RDI,0xa0(%RSP) |
0x435a10 XOR %R9D,%R9D |
0x435a13 MOV %R12,0x3c0(%RSP) |
0x435a1b MOV %R14,0x3b8(%RSP) |
0x435a23 VMOVUPD %YMM7,0x820(%RSP) |
0x435a2c VMOVUPD %YMM2,0x800(%RSP) |
0x435a35 VMOVUPD %YMM1,0x7e0(%RSP) |
0x435a3e VMOVUPS %YMM10,0x7a0(%RSP) |
0x435a47 JMP 435be8 |
(760) 0x435a50 ADDQ $0x200,0xa0(%RSP) |
(760) 0x435a5c ADDQ $0x200,0x1f0(%RSP) |
(760) 0x435a68 ADDQ $0x200,0x1f8(%RSP) |
(760) 0x435a74 ADDQ $0x200,0x200(%RSP) |
(760) 0x435a80 ADDQ $0x200,0x208(%RSP) |
(760) 0x435a8c MOV 0x3d0(%RSP),%RDX |
(760) 0x435a94 ADD $-0x40,%RDX |
(760) 0x435a98 ADDQ $0x40,0x240(%RSP) |
(760) 0x435aa1 ADDQ $0x40,0x248(%RSP) |
(760) 0x435aaa ADDQ $0x40,0x250(%RSP) |
(760) 0x435ab3 ADDQ $0x40,0x258(%RSP) |
(760) 0x435abc ADDQ $0x200,0xa8(%RSP) |
(760) 0x435ac8 ADDQ $0x200,0x210(%RSP) |
(760) 0x435ad4 ADDQ $0x200,0x218(%RSP) |
(760) 0x435ae0 ADDQ $0x200,0x220(%RSP) |
(760) 0x435aec ADDQ $0x200,0x228(%RSP) |
(760) 0x435af8 ADDQ $0x200,0x230(%RSP) |
(760) 0x435b04 ADDQ $0x200,0x238(%RSP) |
(760) 0x435b10 MOV 0x288(%RSP),%R15 |
(760) 0x435b18 ADD $0x200,%R15 |
(760) 0x435b1f MOV 0xb0(%RSP),%RCX |
(760) 0x435b27 ADD $0x200,%RCX |
(760) 0x435b2e ADDQ $0x40,0x260(%RSP) |
(760) 0x435b37 ADDQ $0x40,0x268(%RSP) |
(760) 0x435b40 ADDQ $0x40,0x270(%RSP) |
(760) 0x435b49 ADDQ $0x40,0x278(%RSP) |
(760) 0x435b52 ADDQ $0x40,0x280(%RSP) |
(760) 0x435b5b MOV 0x3c8(%RSP),%RAX |
(760) 0x435b63 CMP 0x3b0(%RSP),%RAX |
(760) 0x435b6b LEA 0x1(%RAX),%R9 |
(760) 0x435b6f MOV %RDX,%RAX |
(760) 0x435b72 MOV 0x98(%RSP),%RSI |
(760) 0x435b7a MOV 0x18(%RSP),%R13 |
(760) 0x435b7f MOV 0x10(%RSP),%R8 |
(760) 0x435b84 VMOVUPD 0xd0(%RSP),%XMM6 |
(760) 0x435b8d MOV 0x1e8(%RSP),%RBX |
(760) 0x435b95 MOV 0x90(%RSP),%RDX |
(760) 0x435b9d VMOVUPD 0x7c0(%RSP),%YMM12 |
(760) 0x435ba6 MOV 0x88(%RSP),%R10 |
(760) 0x435bae MOV 0x38(%RSP),%R11 |
(760) 0x435bb3 VMOVAPD %XMM7,%XMM13 |
(760) 0x435bb7 MOV 0x3c0(%RSP),%R12 |
(760) 0x435bbf MOV 0x3b8(%RSP),%R14 |
(760) 0x435bc7 VMOVUPD 0x820(%RSP),%YMM7 |
(760) 0x435bd0 VMOVUPD 0x800(%RSP),%YMM2 |
(760) 0x435bd9 VMOVUPD 0x7e0(%RSP),%YMM1 |
(760) 0x435be2 JE 435780 |
(760) 0x435be8 MOV %R15,0x288(%RSP) |
(760) 0x435bf0 MOV %RCX,0xb0(%RSP) |
(760) 0x435bf8 CMP $0x3f,%RAX |
(760) 0x435bfc MOV $0x3f,%ECX |
(760) 0x435c01 MOV %RAX,0x3d0(%RSP) |
(760) 0x435c09 CMOVL %RAX,%RCX |
(760) 0x435c0d MOV %R9,%R11 |
(760) 0x435c10 SAL $0x6,%R11 |
(760) 0x435c14 NOT %R11 |
(760) 0x435c17 ADD %RSI,%R11 |
(760) 0x435c1a CMP $0x40,%R11 |
(760) 0x435c1e MOV $0x3f,%EAX |
(760) 0x435c23 CMOVGE %RAX,%R11 |
(760) 0x435c27 INC %R11 |
(760) 0x435c2a MOV %R11,%R10 |
(760) 0x435c2d AND $-0x4,%R10 |
(760) 0x435c31 MOV %R9,0x3c8(%RSP) |
(760) 0x435c39 MOV %RCX,0x100(%RSP) |
(760) 0x435c41 MOV %R10,0xc0(%RSP) |
(760) 0x435c49 MOV %R11,0xb8(%RSP) |
(760) 0x435c51 JE 435e30 |
(760) 0x435c57 LEA -0x1(%R10),%RAX |
(760) 0x435c5b XOR %ECX,%ECX |
(760) 0x435c5d VMOVUPD 0x620(%RSP),%YMM10 |
(760) 0x435c66 VMOVAPD %YMM12,%YMM15 |
(760) 0x435c6b VMOVUPD 0x7a0(%RSP),%YMM9 |
(760) 0x435c74 VMOVUPD 0x780(%RSP),%YMM8 |
(760) 0x435c7d VMOVAPD %YMM2,%YMM6 |
(760) 0x435c81 VMOVUPD 0x760(%RSP),%YMM11 |
(760) 0x435c8a MOV 0x208(%RSP),%RDX |
(760) 0x435c92 MOV 0x200(%RSP),%RSI |
(760) 0x435c9a MOV 0x1f8(%RSP),%RDI |
(760) 0x435ca2 MOV 0x1f0(%RSP),%R8 |
(760) 0x435caa MOV 0xa0(%RSP),%R9 |
(760) 0x435cb2 NOPW %CS:(%RAX,%RAX,1) |
(762) 0x435cc0 VMOVUPD (%RDX,%RCX,8),%YMM14 |
(762) 0x435cc5 VMOVUPD (%RSI,%RCX,8),%YMM2 |
(762) 0x435cca VMOVUPD (%RDI,%RCX,8),%YMM13 |
(762) 0x435ccf VMOVUPD (%R8,%RCX,8),%YMM0 |
(762) 0x435cd5 VMULPD 0x740(%RSP),%YMM14,%YMM12 |
(762) 0x435cde VFMADD231PD %YMM3,%YMM2,%YMM12 |
(762) 0x435ce3 VFMADD231PD 0x6a0(%RSP),%YMM13,%YMM12 |
(762) 0x435ced VFMADD231PD 0x680(%RSP),%YMM0,%YMM12 |
(762) 0x435cf7 VMULPD %YMM7,%YMM12,%YMM4 |
(762) 0x435cfb VMOVUPD %YMM4,0x1848(%RSP,%RCX,8) |
(762) 0x435d04 VMULPD 0x660(%RSP),%YMM14,%YMM4 |
(762) 0x435d0d VMULPD 0x720(%RSP),%YMM2,%YMM5 |
(762) 0x435d16 VFMADD231PD 0x6e0(%RSP),%YMM0,%YMM5 |
(762) 0x435d20 VFMADD231PD 0x700(%RSP),%YMM13,%YMM4 |
(762) 0x435d2a VFMADD231PD %YMM5,%YMM10,%YMM4 |
(762) 0x435d2f VMULPD %YMM12,%YMM8,%YMM5 |
(762) 0x435d34 VMOVUPD %YMM5,0x1648(%RSP,%RCX,8) |
(762) 0x435d3d VMULPD %YMM4,%YMM9,%YMM5 |
(762) 0x435d41 VMOVUPD %YMM5,0x1448(%RSP,%RCX,8) |
(762) 0x435d4a VMULPD 0x640(%RSP),%YMM14,%YMM5 |
(762) 0x435d53 VFMADD231PD %YMM2,%YMM15,%YMM5 |
(762) 0x435d58 VMULPD %YMM12,%YMM11,%YMM2 |
(762) 0x435d5d VMOVUPD %YMM2,0x1248(%RSP,%RCX,8) |
(762) 0x435d66 VFMADD231PD 0x6c0(%RSP),%YMM13,%YMM5 |
(762) 0x435d70 VMULPD %YMM6,%YMM4,%YMM2 |
(762) 0x435d74 VMOVUPD %YMM2,0x1048(%RSP,%RCX,8) |
(762) 0x435d7d VFMADD231PD %YMM0,%YMM10,%YMM5 |
(762) 0x435d82 VMULPD %YMM1,%YMM5,%YMM0 |
(762) 0x435d86 VMOVUPD %YMM0,0xe48(%RSP,%RCX,8) |
(762) 0x435d8f VMULPD %YMM9,%YMM12,%YMM0 |
(762) 0x435d94 VMOVUPD %YMM0,0xc48(%RSP,%RCX,8) |
(762) 0x435d9d VMULPD %YMM6,%YMM12,%YMM0 |
(762) 0x435da1 VMOVUPD %YMM0,0xa48(%RSP,%RCX,8) |
(762) 0x435daa VMULPD %YMM1,%YMM4,%YMM0 |
(762) 0x435dae VMOVUPD %YMM0,0x848(%RSP,%RCX,8) |
(762) 0x435db7 VFMADD213PD (%R9,%RCX,8),%YMM1,%YMM12 |
(762) 0x435dbd VMOVUPD %YMM12,(%R9,%RCX,8) |
(762) 0x435dc3 ADD $0x4,%RCX |
(762) 0x435dc7 CMP %RAX,%RCX |
(762) 0x435dca JLE 435cc0 |
(760) 0x435dd0 MOV %R10,%RSI |
(760) 0x435dd3 CMP %R10,%R11 |
(760) 0x435dd6 VMOVUPD 0x4e0(%RSP),%YMM8 |
(760) 0x435ddf VMOVUPD 0x4c0(%RSP),%YMM14 |
(760) 0x435de8 VMOVUPD 0x2a0(%RSP),%XMM15 |
(760) 0x435df1 VMOVUPD 0x4a0(%RSP),%YMM7 |
(760) 0x435dfa VMOVUPD 0x290(%RSP),%XMM11 |
(760) 0x435e03 VMOVUPD 0xd0(%RSP),%XMM10 |
(760) 0x435e0c VMOVUPD 0x140(%RSP),%XMM1 |
(760) 0x435e15 VMOVUPD 0x130(%RSP),%XMM6 |
(760) 0x435e1e VMOVUPD 0x2b0(%RSP),%XMM3 |
(760) 0x435e27 JNE 435e7a |
(760) 0x435e29 JMP 43606d |
(760) 0x435e30 XOR %ESI,%ESI |
(760) 0x435e32 VMOVUPD 0x2b0(%RSP),%XMM3 |
(760) 0x435e3b VMOVAPD %XMM13,%XMM11 |
(760) 0x435e40 VMOVUPD 0x4e0(%RSP),%YMM8 |
(760) 0x435e49 VMOVUPD 0x4c0(%RSP),%YMM14 |
(760) 0x435e52 VMOVUPD 0x2a0(%RSP),%XMM15 |
(760) 0x435e5b VMOVAPD %XMM6,%XMM10 |
(760) 0x435e5f VMOVUPD 0x4a0(%RSP),%YMM7 |
(760) 0x435e68 VMOVUPD 0x140(%RSP),%XMM1 |
(760) 0x435e71 VMOVUPD 0x130(%RSP),%XMM6 |
(760) 0x435e7a MOV 0x100(%RSP),%R8 |
(760) 0x435e82 SUB %RSI,%R8 |
(760) 0x435e85 INC %R8 |
(760) 0x435e88 MOV 0xa0(%RSP),%RAX |
(760) 0x435e90 LEA (%RAX,%RSI,8),%R9 |
(760) 0x435e94 LEA (%RSP,%RSI,8),%RAX |
(760) 0x435e98 ADD $0x848,%RAX |
(760) 0x435e9e MOV %RAX,0x2c0(%RSP) |
(760) 0x435ea6 LEA 0xa48(%RSP,%RSI,8),%RAX |
(760) 0x435eae MOV %RAX,0x3e0(%RSP) |
(760) 0x435eb6 LEA 0xc48(%RSP,%RSI,8),%RAX |
(760) 0x435ebe MOV %RAX,0xc8(%RSP) |
(760) 0x435ec6 LEA 0xe48(%RSP,%RSI,8),%R10 |
(760) 0x435ece LEA 0x1048(%RSP,%RSI,8),%RCX |
(760) 0x435ed6 LEA 0x1248(%RSP,%RSI,8),%RDX |
(760) 0x435ede LEA 0x1448(%RSP,%RSI,8),%R14 |
(760) 0x435ee6 MOV 0x240(%RSP),%RAX |
(760) 0x435eee LEA (%RSI,%RAX,1),%RAX |
(760) 0x435ef2 MOV 0x80(%RSP),%R11 |
(760) 0x435efa LEA (%R11,%RAX,8),%R13 |
(760) 0x435efe MOV 0x248(%RSP),%RAX |
(760) 0x435f06 ADD %RSI,%RAX |
(760) 0x435f09 LEA (%R11,%RAX,8),%RBX |
(760) 0x435f0d MOV 0x250(%RSP),%RAX |
(760) 0x435f15 ADD %RSI,%RAX |
(760) 0x435f18 LEA (%R11,%RAX,8),%R12 |
(760) 0x435f1c LEA (%RSP,%RSI,8),%RDI |
(760) 0x435f20 ADD $0x1648,%RDI |
(760) 0x435f27 LEA (%RSP,%RSI,8),%RAX |
(760) 0x435f2b ADD $0x1848,%RAX |
(760) 0x435f31 ADD 0x258(%RSP),%RSI |
(760) 0x435f39 LEA (%R11,%RSI,8),%R11 |
(760) 0x435f3d XOR %ESI,%ESI |
(760) 0x435f3f NOP |
(758) 0x435f40 VMOVSD (%R11,%RSI,8),%XMM2 |
(758) 0x435f46 VMOVSD (%R12,%RSI,8),%XMM0 |
(758) 0x435f4c VMOVSD (%R13,%RSI,8),%XMM13 |
(758) 0x435f53 VMOVSD (%RBX,%RSI,8),%XMM4 |
(758) 0x435f58 VUNPCKLPD %XMM4,%XMM0,%XMM5 |
(758) 0x435f5c VMULPD %XMM5,%XMM8,%XMM5 |
(758) 0x435f60 VSHUFPD $0x1,%XMM5,%XMM5,%XMM12 |
(758) 0x435f65 VFMADD231SD %XMM2,%XMM3,%XMM5 |
(758) 0x435f6a VFMADD231SD %XMM11,%XMM13,%XMM12 |
(758) 0x435f6f VADDSD %XMM5,%XMM12,%XMM12 |
(758) 0x435f73 VUNPCKLPD %XMM0,%XMM2,%XMM5 |
(758) 0x435f77 VMULPD %XMM5,%XMM14,%XMM5 |
(758) 0x435f7b VMOVAPD %XMM3,%XMM9 |
(758) 0x435f7f VMOVAPD %YMM7,%YMM3 |
(758) 0x435f83 VMOVAPD %XMM11,%XMM7 |
(758) 0x435f87 VMOVAPD %YMM14,%YMM11 |
(758) 0x435f8c VUNPCKLPD %XMM13,%XMM4,%XMM14 |
(758) 0x435f91 VFMADD132PD 0x5d0(%RSP),%XMM5,%XMM14 |
(758) 0x435f9b VMULSD 0xf0(%RSP),%XMM12,%XMM5 |
(758) 0x435fa4 VMOVSD %XMM5,(%RAX,%RSI,8) |
(758) 0x435fa9 VMULSD 0x470(%RSP),%XMM12,%XMM5 |
(758) 0x435fb2 VMOVSD %XMM5,(%RDI,%RSI,8) |
(758) 0x435fb7 VSHUFPD $0x1,%XMM14,%XMM14,%XMM5 |
(758) 0x435fbd VFMADD213SD %XMM14,%XMM10,%XMM5 |
(758) 0x435fc2 VMULSD %XMM1,%XMM5,%XMM14 |
(758) 0x435fc6 VMOVSD %XMM14,(%R14,%RSI,8) |
(758) 0x435fcc VMULSD 0xe0(%RSP),%XMM12,%XMM14 |
(758) 0x435fd5 VMOVSD %XMM14,(%RDX,%RSI,8) |
(758) 0x435fda VMOVAPD %YMM11,%YMM14 |
(758) 0x435fdf VMOVAPD %XMM7,%XMM11 |
(758) 0x435fe3 VMOVAPD %YMM3,%YMM7 |
(758) 0x435fe7 VMOVAPD %XMM9,%XMM3 |
(758) 0x435feb VUNPCKLPD %XMM4,%XMM2,%XMM2 |
(758) 0x435fef VMULSD %XMM6,%XMM5,%XMM4 |
(758) 0x435ff3 VMOVSD %XMM4,(%RCX,%RSI,8) |
(758) 0x435ff8 VMULPD %XMM7,%XMM2,%XMM2 |
(758) 0x435ffc VFMADD213SD %XMM2,%XMM15,%XMM0 |
(758) 0x436001 VSHUFPD $0x1,%XMM2,%XMM2,%XMM2 |
(758) 0x436006 VFMADD231SD %XMM13,%XMM10,%XMM2 |
(758) 0x43600b VADDSD %XMM0,%XMM2,%XMM0 |
(758) 0x43600f VMOVUPD 0x20(%RSP),%XMM2 |
(758) 0x436015 VMULSD %XMM2,%XMM0,%XMM0 |
(758) 0x436019 VMOVSD %XMM0,(%R10,%RSI,8) |
(758) 0x43601f VMULSD %XMM1,%XMM12,%XMM0 |
(758) 0x436023 MOV 0xc8(%RSP),%R15 |
(758) 0x43602b VMOVSD %XMM0,(%R15,%RSI,8) |
(758) 0x436031 VMULSD %XMM6,%XMM12,%XMM0 |
(758) 0x436035 MOV 0x3e0(%RSP),%R15 |
(758) 0x43603d VMOVSD %XMM0,(%R15,%RSI,8) |
(758) 0x436043 VMULSD %XMM2,%XMM5,%XMM0 |
(758) 0x436047 MOV 0x2c0(%RSP),%R15 |
(758) 0x43604f VMOVSD %XMM0,(%R15,%RSI,8) |
(758) 0x436055 VFMADD213SD (%R9,%RSI,8),%XMM2,%XMM12 |
(758) 0x43605b VMOVSD %XMM12,(%R9,%RSI,8) |
(758) 0x436061 INC %RSI |
(758) 0x436064 CMP %RSI,%R8 |
(758) 0x436067 JNE 435f40 |
(760) 0x43606d MOV 0xc0(%RSP),%R12 |
(760) 0x436075 TEST %R12,%R12 |
(760) 0x436078 JE 4361c0 |
(760) 0x43607e LEA -0x1(%R12),%RAX |
(760) 0x436083 XOR %ECX,%ECX |
(760) 0x436085 VMOVUPD 0x290(%RSP),%XMM7 |
(760) 0x43608e VMOVUPD 0x480(%RSP),%YMM3 |
(760) 0x436097 MOV 0xb0(%RSP),%RDX |
(760) 0x43609f MOV 0x288(%RSP),%RSI |
(760) 0x4360a7 MOV 0x238(%RSP),%RDI |
(760) 0x4360af MOV 0x230(%RSP),%R8 |
(760) 0x4360b7 MOV 0x228(%RSP),%R9 |
(760) 0x4360bf MOV 0x220(%RSP),%R10 |
(760) 0x4360c7 MOV 0x218(%RSP),%R11 |
(760) 0x4360cf MOV 0x210(%RSP),%RBX |
(760) 0x4360d7 MOV 0xa8(%RSP),%R14 |
(760) 0x4360df NOP |
(761) 0x4360e0 VMOVUPD 0x1848(%RSP,%RCX,8),%YMM0 |
(761) 0x4360e9 VMOVUPD 0x1648(%RSP,%RCX,8),%YMM2 |
(761) 0x4360f2 VMOVUPD 0x1448(%RSP,%RCX,8),%YMM4 |
(761) 0x4360fb VMOVUPD 0x1248(%RSP,%RCX,8),%YMM5 |
(761) 0x436104 VMOVUPD 0x1048(%RSP,%RCX,8),%YMM12 |
(761) 0x43610d VMOVUPD 0xe48(%RSP,%RCX,8),%YMM13 |
(761) 0x436116 VMOVUPD 0xc48(%RSP,%RCX,8),%YMM14 |
(761) 0x43611f VMOVUPD 0xa48(%RSP,%RCX,8),%YMM6 |
(761) 0x436128 VMOVUPD 0x848(%RSP,%RCX,8),%YMM8 |
(761) 0x436131 VADDPD (%RDX,%RCX,8),%YMM0,%YMM0 |
(761) 0x436136 VMOVUPD %YMM0,(%RDX,%RCX,8) |
(761) 0x43613b VADDPD (%RSI,%RCX,8),%YMM2,%YMM0 |
(761) 0x436140 VMOVUPD %YMM0,(%RSI,%RCX,8) |
(761) 0x436145 VADDPD (%R8,%RCX,8),%YMM4,%YMM0 |
(761) 0x43614b VMOVUPD %YMM0,(%R8,%RCX,8) |
(761) 0x436151 VADDPD (%R10,%RCX,8),%YMM5,%YMM0 |
(761) 0x436157 VMOVUPD %YMM0,(%R10,%RCX,8) |
(761) 0x43615d VADDPD (%R11,%RCX,8),%YMM12,%YMM0 |
(761) 0x436163 VMOVUPD %YMM0,(%R11,%RCX,8) |
(761) 0x436169 VADDPD (%RBX,%RCX,8),%YMM13,%YMM0 |
(761) 0x43616e VMOVUPD %YMM0,(%RBX,%RCX,8) |
(761) 0x436173 VADDPD (%R14,%RCX,8),%YMM14,%YMM0 |
(761) 0x436179 VMOVUPD %YMM0,(%R14,%RCX,8) |
(761) 0x43617f VADDPD (%RDI,%RCX,8),%YMM6,%YMM0 |
(761) 0x436184 VMOVUPD %YMM0,(%RDI,%RCX,8) |
(761) 0x436189 VADDPD (%R9,%RCX,8),%YMM8,%YMM0 |
(761) 0x43618f VMOVUPD %YMM0,(%R9,%RCX,8) |
(761) 0x436195 ADD $0x4,%RCX |
(761) 0x436199 CMP %RAX,%RCX |
(761) 0x43619c JLE 4360e0 |
(760) 0x4361a2 CMP %R12,0xb8(%RSP) |
(760) 0x4361aa MOV 0x100(%RSP),%RAX |
(760) 0x4361b2 JE 435a50 |
(760) 0x4361b8 JMP 4361dd |
(760) 0x4361c0 XOR %R12D,%R12D |
(760) 0x4361c3 VMOVUPD 0x290(%RSP),%XMM7 |
(760) 0x4361cc VMOVUPD 0x480(%RSP),%YMM3 |
(760) 0x4361d5 MOV 0x100(%RSP),%RAX |
(760) 0x4361dd SUB %R12,%RAX |
(760) 0x4361e0 INC %RAX |
(760) 0x4361e3 MOV %RAX,0x100(%RSP) |
(760) 0x4361eb MOV 0xa8(%RSP),%RAX |
(760) 0x4361f3 LEA (%RAX,%R12,8),%RAX |
(760) 0x4361f7 MOV 0x260(%RSP),%RCX |
(760) 0x4361ff ADD %R12,%RCX |
(760) 0x436202 MOV 0x10(%RSP),%R11 |
(760) 0x436207 LEA (%R11,%RCX,8),%RCX |
(760) 0x43620b MOV 0x268(%RSP),%RDX |
(760) 0x436213 LEA (%R12,%RDX,1),%RDX |
(760) 0x436217 LEA (%R11,%RDX,8),%RDX |
(760) 0x43621b MOV 0x270(%RSP),%RSI |
(760) 0x436223 LEA (%R12,%RSI,1),%RSI |
(760) 0x436227 LEA (%R11,%RSI,8),%RSI |
(760) 0x43622b MOV 0x278(%RSP),%RDI |
(760) 0x436233 LEA (%R12,%RDI,1),%R8 |
(760) 0x436237 MOV 0x18(%RSP),%R9 |
(760) 0x43623c LEA (%R9,%R8,8),%RDI |
(760) 0x436240 LEA (%R11,%R8,8),%R8 |
(760) 0x436244 MOV 0x280(%RSP),%R10 |
(760) 0x43624c LEA (%R12,%R10,1),%R10 |
(760) 0x436250 LEA (%R9,%R10,8),%R9 |
(760) 0x436254 LEA (%R11,%R10,8),%R10 |
(760) 0x436258 MOV 0xb0(%RSP),%R11 |
(760) 0x436260 LEA (%R11,%R12,8),%R11 |
(760) 0x436264 LEA 0x848(%RSP,%R12,8),%RBX |
(760) 0x43626c MOV %RBX,0x2c0(%RSP) |
(760) 0x436274 LEA 0xa48(%RSP,%R12,8),%RBX |
(760) 0x43627c MOV %RBX,0x3e0(%RSP) |
(760) 0x436284 LEA 0xc48(%RSP,%R12,8),%RBX |
(760) 0x43628c MOV %RBX,0xc8(%RSP) |
(760) 0x436294 LEA 0xe48(%RSP,%R12,8),%RBX |
(760) 0x43629c MOV %RBX,0xc0(%RSP) |
(760) 0x4362a4 LEA 0x1048(%RSP,%R12,8),%RBX |
(760) 0x4362ac MOV %RBX,0xb8(%RSP) |
(760) 0x4362b4 LEA 0x1248(%RSP,%R12,8),%RBX |
(760) 0x4362bc MOV %RBX,0x3d8(%RSP) |
(760) 0x4362c4 LEA (%RSP,%R12,8),%R14 |
(760) 0x4362c8 ADD $0x1448,%R14 |
(760) 0x4362cf LEA (%RSP,%R12,8),%R15 |
(760) 0x4362d3 ADD $0x1648,%R15 |
(760) 0x4362da LEA (%RSP,%R12,8),%R12 |
(760) 0x4362de ADD $0x1848,%R12 |
(760) 0x4362e5 XOR %R13D,%R13D |
(760) 0x4362e8 NOPL (%RAX,%RAX,1) |
(759) 0x4362f0 VMOVSD (%R12,%R13,8),%XMM0 |
(759) 0x4362f6 VMOVSD (%R15,%R13,8),%XMM2 |
(759) 0x4362fc VMOVSD (%R14,%R13,8),%XMM4 |
(759) 0x436302 MOV 0x3d8(%RSP),%RBX |
(759) 0x43630a VMOVSD (%RBX,%R13,8),%XMM5 |
(759) 0x436310 MOV 0xb8(%RSP),%RBX |
(759) 0x436318 VMOVSD (%RBX,%R13,8),%XMM6 |
(759) 0x43631e MOV 0xc0(%RSP),%RBX |
(759) 0x436326 VMOVSD (%RBX,%R13,8),%XMM8 |
(759) 0x43632c MOV 0xc8(%RSP),%RBX |
(759) 0x436334 VMOVSD (%RBX,%R13,8),%XMM12 |
(759) 0x43633a MOV 0x3e0(%RSP),%RBX |
(759) 0x436342 VMOVSD (%RBX,%R13,8),%XMM13 |
(759) 0x436348 MOV 0x2c0(%RSP),%RBX |
(759) 0x436350 VMOVSD (%RBX,%R13,8),%XMM14 |
(759) 0x436356 VADDSD (%R11,%R13,8),%XMM0,%XMM0 |
(759) 0x43635c VMOVSD %XMM0,(%R11,%R13,8) |
(759) 0x436362 VADDSD (%R10,%R13,8),%XMM2,%XMM0 |
(759) 0x436368 VMOVSD %XMM0,(%R10,%R13,8) |
(759) 0x43636e VADDSD (%R8,%R13,8),%XMM4,%XMM0 |
(759) 0x436374 VMOVSD %XMM0,(%R8,%R13,8) |
(759) 0x43637a VADDSD (%RSI,%R13,8),%XMM5,%XMM0 |
(759) 0x436380 VMOVSD %XMM0,(%RSI,%R13,8) |
(759) 0x436386 VADDSD (%RDX,%R13,8),%XMM6,%XMM0 |
(759) 0x43638c VMOVSD %XMM0,(%RDX,%R13,8) |
(759) 0x436392 VADDSD (%RCX,%R13,8),%XMM8,%XMM0 |
(759) 0x436398 VMOVSD %XMM0,(%RCX,%R13,8) |
(759) 0x43639e VADDSD (%RAX,%R13,8),%XMM12,%XMM0 |
(759) 0x4363a4 VMOVSD %XMM0,(%RAX,%R13,8) |
(759) 0x4363aa VADDSD (%R9,%R13,8),%XMM13,%XMM0 |
(759) 0x4363b0 VMOVSD %XMM0,(%R9,%R13,8) |
(759) 0x4363b6 VADDSD (%RDI,%R13,8),%XMM14,%XMM0 |
(759) 0x4363bc VMOVSD %XMM0,(%RDI,%R13,8) |
(759) 0x4363c2 INC %R13 |
(759) 0x4363c5 CMP %R13,0x100(%RSP) |
(759) 0x4363cd JNE 4362f0 |
(760) 0x4363d3 JMP 435a50 |
0x4363e0 TEST %R13D,%R13D |
0x4363e3 MOV %R13,%RSI |
0x4363e6 MOV %R9,%R13 |
0x4363e9 JLE 435780 |
0x4363ef CMPQ $0,0x78(%RSP) |
0x4363f5 JE 43662b |
0x4363fb VBROADCASTSD 0xf0(%RSP),%YMM0 |
0x436405 VMOVUPS %YMM0,0x100(%RSP) |
0x43640e VBROADCASTSD %XMM10,%YMM0 |
0x436413 VMOVUPD %YMM0,0x2c0(%RSP) |
0x43641c VBROADCASTSD 0x140(%RSP),%YMM7 |
0x436426 VBROADCASTSD 0xe0(%RSP),%YMM0 |
0x436430 VMOVUPS %YMM0,0x3e0(%RSP) |
0x436439 VMOVUPD 0x620(%RSP),%YMM15 |
0x436442 VBROADCASTSD 0x130(%RSP),%YMM10 |
0x43644c VBROADCASTSD 0x20(%RSP),%YMM11 |
0x436453 XOR %EAX,%EAX |
0x436455 VMOVUPD 0x6a0(%RSP),%YMM13 |
0x43645e VMOVUPD 0x640(%RSP),%YMM3 |
0x436467 VMOVAPD %YMM12,%YMM1 |
0x43646b VMOVUPD 0x680(%RSP),%YMM14 |
0x436474 VMOVUPD 0x660(%RSP),%YMM9 |
0x43647d MOV 0x1c0(%RSP),%R15 |
0x436485 MOV %R14,%RSI |
0x436488 MOV %R12,%R14 |
0x43648b MOV 0x70(%RSP),%R12 |
0x436490 MOV 0x68(%RSP),%R13 |
0x436495 MOV 0x60(%RSP),%RDI |
0x43649a NOPW (%RAX,%RAX,1) |
(757) 0x4364a0 VMOVUPD (%R12,%RAX,8),%YMM0 |
(757) 0x4364a6 VMOVUPD (%R13,%RAX,8),%YMM2 |
(757) 0x4364ad VMOVUPD (%R14,%RAX,8),%YMM12 |
(757) 0x4364b3 VMOVUPD (%RSI,%RAX,8),%YMM8 |
(757) 0x4364b8 VMULPD %YMM0,%YMM9,%YMM5 |
(757) 0x4364bc VMULPD 0x720(%RSP),%YMM2,%YMM4 |
(757) 0x4364c5 VFMADD231PD 0x6e0(%RSP),%YMM8,%YMM4 |
(757) 0x4364cf VFMADD231PD 0x700(%RSP),%YMM12,%YMM5 |
(757) 0x4364d9 VFMADD231PD %YMM4,%YMM15,%YMM5 |
(757) 0x4364de VMULPD 0x740(%RSP),%YMM0,%YMM6 |
(757) 0x4364e7 VFMADD231PD 0x480(%RSP),%YMM2,%YMM6 |
(757) 0x4364f1 VFMADD231PD %YMM13,%YMM12,%YMM6 |
(757) 0x4364f6 VFMADD231PD %YMM8,%YMM14,%YMM6 |
(757) 0x4364fb VMULPD %YMM3,%YMM0,%YMM0 |
(757) 0x4364ff VFMADD231PD %YMM2,%YMM1,%YMM0 |
(757) 0x436504 LEA (%R8,%RAX,8),%RCX |
(757) 0x436508 VMOVUPD (%R8,%RAX,8),%YMM2 |
(757) 0x43650e VFMADD231PD 0x100(%RSP),%YMM6,%YMM2 |
(757) 0x436518 VMOVUPD %YMM2,(%R8,%RAX,8) |
(757) 0x43651e VMOVUPD (%R15,%RCX,1),%YMM2 |
(757) 0x436524 VFMADD231PD 0x2c0(%RSP),%YMM6,%YMM2 |
(757) 0x43652e VMOVUPD %YMM2,(%R15,%RCX,1) |
(757) 0x436534 VFMADD231PD 0x6c0(%RSP),%YMM12,%YMM0 |
(757) 0x43653e LEA (%RCX,%R15,1),%RCX |
(757) 0x436542 VMOVUPD (%R15,%RCX,1),%YMM2 |
(757) 0x436548 VFMADD231PD %YMM7,%YMM5,%YMM2 |
(757) 0x43654d VMOVUPD %YMM2,(%R15,%RCX,1) |
(757) 0x436553 LEA (%RCX,%R15,1),%RCX |
(757) 0x436557 VMOVUPD (%R15,%RCX,1),%YMM2 |
(757) 0x43655d VFMADD231PD 0x3e0(%RSP),%YMM6,%YMM2 |
(757) 0x436567 VMOVUPD %YMM2,(%R15,%RCX,1) |
(757) 0x43656d LEA (%RCX,%R15,1),%RCX |
(757) 0x436571 VMOVUPD (%R15,%RCX,1),%YMM2 |
(757) 0x436577 VFMADD231PD %YMM10,%YMM5,%YMM2 |
(757) 0x43657c VMOVUPD %YMM2,(%R15,%RCX,1) |
(757) 0x436582 VFMADD231PD %YMM8,%YMM15,%YMM0 |
(757) 0x436587 LEA (%RCX,%R15,1),%RCX |
(757) 0x43658b VFMADD213PD (%R15,%RCX,1),%YMM11,%YMM0 |
(757) 0x436591 VMOVUPD %YMM0,(%R15,%RCX,1) |
(757) 0x436597 MOV 0x78(%RSP),%RCX |
(757) 0x43659c VMOVUPD (%R9,%RAX,8),%YMM0 |
(757) 0x4365a2 VFMADD231PD %YMM7,%YMM6,%YMM0 |
(757) 0x4365a7 VMOVUPD %YMM0,(%R9,%RAX,8) |
(757) 0x4365ad VMOVUPD (%R11,%RAX,8),%YMM0 |
(757) 0x4365b3 VFMADD231PD %YMM10,%YMM6,%YMM0 |
(757) 0x4365b8 VMOVUPD %YMM0,(%R11,%RAX,8) |
(757) 0x4365be VFMADD213PD (%RBX,%RAX,8),%YMM11,%YMM5 |
(757) 0x4365c4 VMOVUPD %YMM5,(%RBX,%RAX,8) |
(757) 0x4365c9 VFMADD213PD (%RDI,%RAX,8),%YMM11,%YMM6 |
(757) 0x4365cf VMOVUPD %YMM6,(%RDI,%RAX,8) |
(757) 0x4365d4 ADD $0x4,%RAX |
(757) 0x4365d8 CMP %RCX,%RAX |
(757) 0x4365db JL 4364a0 |
0x4365e1 MOV %RCX,%RAX |
0x4365e4 MOV %RSI,%R15 |
0x4365e7 MOV 0x98(%RSP),%RSI |
0x4365ef CMP %RSI,%RCX |
0x4365f2 VMOVUPD 0xd0(%RSP),%XMM6 |
0x4365fb VMOVAPD %YMM1,%YMM12 |
0x4365ff VMOVUPD 0x480(%RSP),%YMM3 |
0x436608 VMOVUPD 0x290(%RSP),%XMM13 |
0x436611 MOV %R14,%R12 |
0x436614 MOV %R15,%R14 |
0x436617 VMOVUPD 0x470(%RSP),%XMM10 |
0x436620 MOV %R9,%R13 |
0x436623 JE 435780 |
0x436629 JMP 436635 |
0x43662b XOR %EAX,%EAX |
0x43662d MOV %R9,%R13 |
0x436630 MOV 0x60(%RSP),%RDI |
0x436635 MOV 0x1c0(%RSP),%R15 |
0x43663d VMOVUPD 0x140(%RSP),%XMM1 |
0x436646 NOPW %CS:(%RAX,%RAX,1) |
(756) 0x436650 MOV 0x1e0(%RSP),%RCX |
(756) 0x436658 VMOVSD (%RCX,%RAX,8),%XMM0 |
(756) 0x43665d MOV 0x1d8(%RSP),%RCX |
(756) 0x436665 VMOVSD (%RCX,%RAX,8),%XMM2 |
(756) 0x43666a MOV 0x1d0(%RSP),%RCX |
(756) 0x436672 VMOVSD (%RCX,%RAX,8),%XMM8 |
(756) 0x436677 MOV 0x1c8(%RSP),%RCX |
(756) 0x43667f VMOVSD (%RCX,%RAX,8),%XMM7 |
(756) 0x436684 VMULSD 0x4c0(%RSP),%XMM0,%XMM5 |
(756) 0x43668d VMULSD 0x5b0(%RSP),%XMM2,%XMM4 |
(756) 0x436696 VFMADD231SD 0x460(%RSP),%XMM7,%XMM4 |
(756) 0x4366a0 VFMADD231SD 0x450(%RSP),%XMM8,%XMM5 |
(756) 0x4366aa VFMADD231SD %XMM4,%XMM6,%XMM5 |
(756) 0x4366af VMULSD 0x2b0(%RSP),%XMM0,%XMM6 |
(756) 0x4366b8 VFMADD231SD 0x4e0(%RSP),%XMM2,%XMM6 |
(756) 0x4366c2 VFMADD231SD 0x5c0(%RSP),%XMM8,%XMM6 |
(756) 0x4366cc VFMADD231SD %XMM7,%XMM13,%XMM6 |
(756) 0x4366d1 VMULSD 0x4a0(%RSP),%XMM0,%XMM0 |
(756) 0x4366da VFMADD231SD 0x2a0(%RSP),%XMM2,%XMM0 |
(756) 0x4366e4 LEA (%R8,%RAX,8),%RCX |
(756) 0x4366e8 VMOVSD (%R8,%RAX,8),%XMM2 |
(756) 0x4366ee VFMADD231SD 0xf0(%RSP),%XMM6,%XMM2 |
(756) 0x4366f8 VMOVSD %XMM2,(%R8,%RAX,8) |
(756) 0x4366fe VMOVSD (%R15,%RCX,1),%XMM2 |
(756) 0x436704 VFMADD231SD %XMM6,%XMM10,%XMM2 |
(756) 0x436709 VMOVSD %XMM2,(%R15,%RCX,1) |
(756) 0x43670f VFMADD231SD 0x5a0(%RSP),%XMM8,%XMM0 |
(756) 0x436719 LEA (%RCX,%R15,1),%RCX |
(756) 0x43671d VMOVSD (%R15,%RCX,1),%XMM2 |
(756) 0x436723 VFMADD231SD %XMM1,%XMM5,%XMM2 |
(756) 0x436728 VMOVSD %XMM2,(%R15,%RCX,1) |
(756) 0x43672e LEA (%RCX,%R15,1),%RCX |
(756) 0x436732 VMOVSD (%R15,%RCX,1),%XMM2 |
(756) 0x436738 VFMADD231SD 0xe0(%RSP),%XMM6,%XMM2 |
(756) 0x436742 VMOVSD %XMM2,(%R15,%RCX,1) |
(756) 0x436748 LEA (%RCX,%R15,1),%RCX |
(756) 0x43674c VMOVSD (%R15,%RCX,1),%XMM2 |
(756) 0x436752 VMOVUPD 0x130(%RSP),%XMM4 |
(756) 0x43675b VFMADD231SD %XMM4,%XMM5,%XMM2 |
(756) 0x436760 VMOVSD %XMM2,(%R15,%RCX,1) |
(756) 0x436766 VFMADD231SD 0xd0(%RSP),%XMM7,%XMM0 |
(756) 0x436770 LEA (%RCX,%R15,1),%RCX |
(756) 0x436774 VMOVUPD 0x20(%RSP),%XMM2 |
(756) 0x43677a VFMADD213SD (%R15,%RCX,1),%XMM2,%XMM0 |
(756) 0x436780 VMOVSD %XMM0,(%R15,%RCX,1) |
(756) 0x436786 VMOVSD (%R13,%RAX,8),%XMM0 |
(756) 0x43678d VFMADD231SD %XMM1,%XMM6,%XMM0 |
(756) 0x436792 VMOVSD %XMM0,(%R13,%RAX,8) |
(756) 0x436799 VMOVSD (%R11,%RAX,8),%XMM0 |
(756) 0x43679f VFMADD231SD %XMM4,%XMM6,%XMM0 |
(756) 0x4367a4 VMOVSD %XMM0,(%R11,%RAX,8) |
(756) 0x4367aa VFMADD213SD (%RBX,%RAX,8),%XMM2,%XMM5 |
(756) 0x4367b0 VMOVSD %XMM5,(%RBX,%RAX,8) |
(756) 0x4367b5 VFMADD213SD (%RDI,%RAX,8),%XMM2,%XMM6 |
(756) 0x4367bb VMOVSD %XMM6,(%RDI,%RAX,8) |
(756) 0x4367c0 VMOVUPD 0xd0(%RSP),%XMM6 |
(756) 0x4367c9 INC %RAX |
(756) 0x4367cc CMP %RAX,%RSI |
(756) 0x4367cf JNE 436650 |
0x4367d5 JMP 435780 |
/scratch_na/users/xoserete/qaas_runs/171-284-5201/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/TinyVector.h: 61 - 61 |
-------------------------------------------------------------------------------- |
61: for (size_t d = 0; d < D; ++d) |
/scratch_na/users/xoserete/qaas_runs/171-284-5201/intel/miniqmc/build/miniqmc/src/Numerics/Spline2/MultiBsplineRef.hpp: 227 - 262 |
-------------------------------------------------------------------------------- |
227: for (int j = 0; j < 4; j++) |
[...] |
234: const T pre20 = d2a[i] * b[j]; |
235: const T pre10 = da[i] * b[j]; |
236: const T pre00 = a[i] * b[j]; |
237: const T pre11 = da[i] * db[j]; |
238: const T pre01 = a[i] * db[j]; |
239: const T pre02 = a[i] * d2b[j]; |
240: |
241: const int iSplitPoint = num_splines; |
242: for (int n = 0; n < iSplitPoint; n++) |
243: { |
244: T coefsv = coefs[n]; |
245: T coefsvzs = coefszs[n]; |
246: T coefsv2zs = coefs2zs[n]; |
247: T coefsv3zs = coefs3zs[n]; |
248: |
249: T sum0 = c[0] * coefsv + c[1] * coefsvzs + c[2] * coefsv2zs + c[3] * coefsv3zs; |
250: T sum1 = dc[0] * coefsv + dc[1] * coefsvzs + dc[2] * coefsv2zs + dc[3] * coefsv3zs; |
251: T sum2 = d2c[0] * coefsv + d2c[1] * coefsvzs + d2c[2] * coefsv2zs + d2c[3] * coefsv3zs; |
252: |
253: hxx[n] += pre20 * sum0; |
254: hxy[n] += pre11 * sum0; |
255: hxz[n] += pre10 * sum1; |
256: hyy[n] += pre02 * sum0; |
257: hyz[n] += pre01 * sum1; |
258: hzz[n] += pre00 * sum2; |
259: gx[n] += pre10 * sum0; |
260: gy[n] += pre01 * sum0; |
261: gz[n] += pre00 * sum1; |
262: vals[n] += pre00 * sum0; |
Path / |
Metric | Value |
---|---|
CQA speedup if no scalar integer | 2.52 |
CQA speedup if FP arith vectorized | 1.10 |
CQA speedup if fully vectorized | 5.24 |
CQA speedup if no inter-iteration dependency | NA |
CQA speedup if next bottleneck killed | 1.10 |
Bottlenecks | micro-operation queue, |
Function | miniqmcreference::einspline_spo_ref |
Source | TinyVector.h:61-61,MultiBsplineRef.hpp:227-227,MultiBsplineRef.hpp:234-239,MultiBsplineRef.hpp:242-242,MultiBsplineRef.hpp:253-258 |
Source loop unroll info | NA |
Source loop unroll confidence level | NA |
Unroll/vectorization loop type | NA |
Unroll factor | NA |
CQA cycles | 26.83 |
CQA cycles if no scalar integer | 10.67 |
CQA cycles if FP arith vectorized | 24.50 |
CQA cycles if fully vectorized | 5.13 |
Front-end cycles | 26.83 |
DIV/SQRT cycles | 0.00 |
P0 cycles | 6.50 |
P1 cycles | 6.40 |
P2 cycles | 21.33 |
P3 cycles | 21.33 |
P4 cycles | 24.50 |
P5 cycles | 6.40 |
P6 cycles | 6.30 |
P7 cycles | 24.50 |
P8 cycles | 24.50 |
P9 cycles | 24.50 |
P10 cycles | 6.40 |
P11 cycles | 21.33 |
Inter-iter dependencies cycles | NA |
FE+BE cycles (UFS) | 28.67 |
Stall cycles (UFS) | 0.00 |
Nb insns | 152.00 |
Nb uops | 160.00 |
Nb loads | 64.00 |
Nb stores | 49.00 |
Nb stack references | 76.00 |
FLOP/cycle | 0.22 |
Nb FLOP add-sub | 0.00 |
Nb FLOP mul | 6.00 |
Nb FLOP fma | 0.00 |
Nb FLOP div | 0.00 |
Nb FLOP rcp | 0.00 |
Nb FLOP sqrt | 0.00 |
Nb FLOP rsqrt | 0.00 |
Bytes/cycle | 50.09 |
Bytes prefetched | 0.00 |
Bytes loaded | 688.00 |
Bytes stored | 656.00 |
Stride 0 | NA |
Stride 1 | NA |
Stride n | NA |
Stride unknown | NA |
Stride indirect | NA |
Vectorization ratio all | 23.68 |
Vectorization ratio load | 21.28 |
Vectorization ratio store | 30.61 |
Vectorization ratio mul | 0.00 |
Vectorization ratio add_sub | 0.00 |
Vectorization ratio fma | NA |
Vectorization ratio div_sqrt | NA |
Vectorization ratio other | 6.67 |
Vector-efficiency ratio all | 18.97 |
Vector-efficiency ratio load | 18.35 |
Vector-efficiency ratio store | 20.92 |
Vector-efficiency ratio mul | 12.50 |
Vector-efficiency ratio add_sub | 12.50 |
Vector-efficiency ratio fma | NA |
Vector-efficiency ratio div_sqrt | NA |
Vector-efficiency ratio other | 14.17 |
Metric | Value |
---|---|
CQA speedup if no scalar integer | 2.52 |
CQA speedup if FP arith vectorized | 1.10 |
CQA speedup if fully vectorized | 5.24 |
CQA speedup if no inter-iteration dependency | NA |
CQA speedup if next bottleneck killed | 1.10 |
Bottlenecks | micro-operation queue, |
Function | miniqmcreference::einspline_spo_ref |
Source | TinyVector.h:61-61,MultiBsplineRef.hpp:227-227,MultiBsplineRef.hpp:234-239,MultiBsplineRef.hpp:242-242,MultiBsplineRef.hpp:253-258 |
Source loop unroll info | NA |
Source loop unroll confidence level | NA |
Unroll/vectorization loop type | NA |
Unroll factor | NA |
CQA cycles | 26.83 |
CQA cycles if no scalar integer | 10.67 |
CQA cycles if FP arith vectorized | 24.50 |
CQA cycles if fully vectorized | 5.13 |
Front-end cycles | 26.83 |
DIV/SQRT cycles | 0.00 |
P0 cycles | 6.50 |
P1 cycles | 6.40 |
P2 cycles | 21.33 |
P3 cycles | 21.33 |
P4 cycles | 24.50 |
P5 cycles | 6.40 |
P6 cycles | 6.30 |
P7 cycles | 24.50 |
P8 cycles | 24.50 |
P9 cycles | 24.50 |
P10 cycles | 6.40 |
P11 cycles | 21.33 |
Inter-iter dependencies cycles | NA |
FE+BE cycles (UFS) | 28.67 |
Stall cycles (UFS) | 0.00 |
Nb insns | 152.00 |
Nb uops | 160.00 |
Nb loads | 64.00 |
Nb stores | 49.00 |
Nb stack references | 76.00 |
FLOP/cycle | 0.22 |
Nb FLOP add-sub | 0.00 |
Nb FLOP mul | 6.00 |
Nb FLOP fma | 0.00 |
Nb FLOP div | 0.00 |
Nb FLOP rcp | 0.00 |
Nb FLOP sqrt | 0.00 |
Nb FLOP rsqrt | 0.00 |
Bytes/cycle | 50.09 |
Bytes prefetched | 0.00 |
Bytes loaded | 688.00 |
Bytes stored | 656.00 |
Stride 0 | NA |
Stride 1 | NA |
Stride n | NA |
Stride unknown | NA |
Stride indirect | NA |
Vectorization ratio all | 23.68 |
Vectorization ratio load | 21.28 |
Vectorization ratio store | 30.61 |
Vectorization ratio mul | 0.00 |
Vectorization ratio add_sub | 0.00 |
Vectorization ratio fma | NA |
Vectorization ratio div_sqrt | NA |
Vectorization ratio other | 6.67 |
Vector-efficiency ratio all | 18.97 |
Vector-efficiency ratio load | 18.35 |
Vector-efficiency ratio store | 20.92 |
Vector-efficiency ratio mul | 12.50 |
Vector-efficiency ratio add_sub | 12.50 |
Vector-efficiency ratio fma | NA |
Vector-efficiency ratio div_sqrt | NA |
Vector-efficiency ratio other | 14.17 |
Path / |
Function | miniqmcreference::einspline_spo_ref |
Source file and lines | MultiBsplineRef.hpp:227-262 |
Module | exec |
nb instructions | 152 |
nb uops | 160 |
loop length | 1024 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 7 |
used ymm registers | 12 |
used zmm registers | 0 |
nb stack references | 76 |
micro-operation queue | 26.83 cycles |
front end | 26.83 cycles |
| | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 6.50 | 6.40 | 21.33 | 21.33 | 24.50 | 6.40 | 6.30 | 24.50 | 24.50 | 24.50 | 6.40 | 21.33 |
cycles | 6.50 | 6.40 | 21.33 | 21.33 | 24.50 | 6.40 | 6.30 | 24.50 | 24.50 | 24.50 | 6.40 | 21.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 28.67 |
Stall cycles | 0.00 |
Front-end | 26.83 |
Dispatch | 24.50 |
Overall L1 | 26.83 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 0% |
all | 55% |
load | 38% |
store | 100% |
mul | 0% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
all | 23% |
load | 21% |
store | 30% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 6% |
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 10% |
all | 28% |
load | 23% |
store | 40% |
mul | 12% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 17% |
all | 18% |
load | 18% |
store | 20% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
MOV %R13,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x380(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RAX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x68(%RSP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x70(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,0x1c8(%RSP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
ADD %RAX,0x1d0(%RSP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
ADD %RAX,0x1d8(%RSP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
ADD %RAX,0x1e0(%RSP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
MOV 0x198(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RAX,0x1a0(%RSP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
ADD %RAX,0x1a8(%RSP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
ADD %RAX,0x1b0(%RSP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
ADD %RAX,0x1b8(%RSP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
MOV 0x3a8(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x3,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA 0x1(%RAX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x3a0(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RSI,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JE 4355f0 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0xb70> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R15,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD 0x5e0(%RSP,%RAX,8),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD 0x398(%RSP),%XMM0,%XMM2 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VMOVUPD %XMM2,0xf0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x390(%RSP),%XMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD %XMM2,%XMM0,%XMM1 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVUPD %XMM1,0x140(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x388(%RSP),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD %XMM4,%XMM0,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVUPD %XMM0,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x540(%RSP,%RAX,8),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD %XMM2,%XMM0,%XMM10 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULSD %XMM4,%XMM0,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVUPD %XMM0,0x130(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMULSD 0x500(%RSP,%RAX,8),%XMM4,%XMM0 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VMOVUPD %XMM0,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
CMP $0x81,%R13D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VMOVUPD %XMM10,0x470(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV %RAX,0x3a8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JB 4363e0 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0x1960> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
TEST %R13D,%R13D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV %R13,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x60(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 435780 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0xd00> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VBROADCASTSD 0xf0(%RSP),%YMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD %XMM10,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM1,0x780(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0x140(%RSP),%YMM10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0xe0(%RSP),%YMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM1,0x760(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0x130(%RSP),%YMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0x20(%RSP),%YMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
MOV 0x8(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x280(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x188(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x278(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x180(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x270(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x178(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x268(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x170(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x260(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x50(%RSP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R11,0x238(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x58(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x230(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,0x228(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,0x220(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,0x218(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x190(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x210(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x1b8(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x258(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x1b0(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x250(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x1a8(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x248(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x1a0(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x240(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x378(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x70(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x208(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x68(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x200(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R12,0x1f8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,0x1f0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R12,0x3c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,0x3b8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVUPD %YMM7,0x820(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM2,0x800(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM1,0x7e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPS %YMM10,0x7a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
JMP 435be8 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0x1168> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
TEST %R13D,%R13D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV %R13,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JLE 435780 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0xd00> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMPQ $0,0x78(%RSP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 43662b <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0x1bab> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VBROADCASTSD 0xf0(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x100(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM10,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x2c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0x140(%RSP),%YMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0xe0(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x3e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD 0x620(%RSP),%YMM15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VBROADCASTSD 0x130(%RSP),%YMM10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0x20(%RSP),%YMM11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVUPD 0x6a0(%RSP),%YMM13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x640(%RSP),%YMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVAPD %YMM12,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.17 |
VMOVUPD 0x680(%RSP),%YMM14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x660(%RSP),%YMM9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV 0x1c0(%RSP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R12,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x70(%RSP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x68(%RSP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x60(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RCX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RSI,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x98(%RSP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RSI,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VMOVUPD 0xd0(%RSP),%XMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVAPD %YMM1,%YMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.17 |
VMOVUPD 0x480(%RSP),%YMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x290(%RSP),%XMM13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV %R14,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R15,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VMOVUPD 0x470(%RSP),%XMM10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV %R9,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JE 435780 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0xd00> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 436635 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0x1bb5> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R9,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x60(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x1c0(%RSP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPD 0x140(%RSP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 435780 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0xd00> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
Function | miniqmcreference::einspline_spo_ref |
Source file and lines | MultiBsplineRef.hpp:227-262 |
Module | exec |
nb instructions | 152 |
nb uops | 160 |
loop length | 1024 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 7 |
used ymm registers | 12 |
used zmm registers | 0 |
nb stack references | 76 |
micro-operation queue | 26.83 cycles |
front end | 26.83 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 6.50 | 6.40 | 21.33 | 21.33 | 24.50 | 6.40 | 6.30 | 24.50 | 24.50 | 24.50 | 6.40 | 21.33 |
cycles | 6.50 | 6.40 | 21.33 | 21.33 | 24.50 | 6.40 | 6.30 | 24.50 | 24.50 | 24.50 | 6.40 | 21.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 28.67 |
Stall cycles | 0.00 |
Front-end | 26.83 |
Dispatch | 24.50 |
Overall L1 | 26.83 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 0% |
all | 55% |
load | 38% |
store | 100% |
mul | 0% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
all | 23% |
load | 21% |
store | 30% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 6% |
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 10% |
all | 28% |
load | 23% |
store | 40% |
mul | 12% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 17% |
all | 18% |
load | 18% |
store | 20% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
MOV %R13,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x380(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RAX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x68(%RSP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x70(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,0x1c8(%RSP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
ADD %RAX,0x1d0(%RSP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
ADD %RAX,0x1d8(%RSP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
ADD %RAX,0x1e0(%RSP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
MOV 0x198(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RAX,0x1a0(%RSP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
ADD %RAX,0x1a8(%RSP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
ADD %RAX,0x1b0(%RSP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
ADD %RAX,0x1b8(%RSP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
MOV 0x3a8(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x3,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA 0x1(%RAX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x3a0(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RSI,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JE 4355f0 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0xb70> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R15,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD 0x5e0(%RSP,%RAX,8),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD 0x398(%RSP),%XMM0,%XMM2 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VMOVUPD %XMM2,0xf0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x390(%RSP),%XMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD %XMM2,%XMM0,%XMM1 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVUPD %XMM1,0x140(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x388(%RSP),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD %XMM4,%XMM0,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVUPD %XMM0,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x540(%RSP,%RAX,8),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD %XMM2,%XMM0,%XMM10 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULSD %XMM4,%XMM0,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVUPD %XMM0,0x130(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMULSD 0x500(%RSP,%RAX,8),%XMM4,%XMM0 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VMOVUPD %XMM0,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
CMP $0x81,%R13D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VMOVUPD %XMM10,0x470(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV %RAX,0x3a8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JB 4363e0 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0x1960> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
TEST %R13D,%R13D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV %R13,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x60(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 435780 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0xd00> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VBROADCASTSD 0xf0(%RSP),%YMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD %XMM10,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM1,0x780(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0x140(%RSP),%YMM10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0xe0(%RSP),%YMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM1,0x760(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0x130(%RSP),%YMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0x20(%RSP),%YMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
MOV 0x8(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x280(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x188(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x278(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x180(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x270(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x178(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x268(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x170(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x260(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x50(%RSP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R11,0x238(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x58(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x230(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,0x228(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,0x220(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,0x218(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x190(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x210(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x1b8(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x258(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x1b0(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x250(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x1a8(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x248(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x1a0(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x240(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x378(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x70(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x208(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x68(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x200(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R12,0x1f8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,0x1f0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R12,0x3c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,0x3b8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVUPD %YMM7,0x820(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM2,0x800(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM1,0x7e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPS %YMM10,0x7a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
JMP 435be8 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0x1168> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
TEST %R13D,%R13D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV %R13,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JLE 435780 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0xd00> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMPQ $0,0x78(%RSP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 43662b <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0x1bab> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VBROADCASTSD 0xf0(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x100(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM10,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x2c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0x140(%RSP),%YMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0xe0(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x3e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD 0x620(%RSP),%YMM15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VBROADCASTSD 0x130(%RSP),%YMM10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0x20(%RSP),%YMM11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVUPD 0x6a0(%RSP),%YMM13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x640(%RSP),%YMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVAPD %YMM12,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.17 |
VMOVUPD 0x680(%RSP),%YMM14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x660(%RSP),%YMM9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV 0x1c0(%RSP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R12,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x70(%RSP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x68(%RSP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x60(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RCX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RSI,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x98(%RSP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RSI,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VMOVUPD 0xd0(%RSP),%XMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVAPD %YMM1,%YMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.17 |
VMOVUPD 0x480(%RSP),%YMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x290(%RSP),%XMM13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV %R14,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R15,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VMOVUPD 0x470(%RSP),%XMM10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV %R9,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JE 435780 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0xd00> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 436635 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0x1bb5> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R9,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x60(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x1c0(%RSP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPD 0x140(%RSP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 435780 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0xd00> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |