Loop Id: 853 | Module: exec | Source: MultiBsplineRef.hpp:227-262 [...] | Coverage: 0.03% |
---|
Loop Id: 853 | Module: exec | Source: MultiBsplineRef.hpp:227-262 [...] | Coverage: 0.03% |
---|
0x43c310 MOV 0x3d8(%RSP),%RAX |
0x43c318 ADD %RAX,%R14 |
0x43c31b ADD %RAX,%R13 |
0x43c31e ADD %RAX,%R12 |
0x43c321 MOV 0x80(%RSP),%R15 |
0x43c329 ADD %RAX,%R15 |
0x43c32c ADD %RAX,0x1a8(%RSP) |
0x43c334 ADD %RAX,0x1b0(%RSP) |
0x43c33c ADD %RAX,0x1b8(%RSP) |
0x43c344 ADD %RAX,0x1c0(%RSP) |
0x43c34c MOV 0x170(%RSP),%RAX |
0x43c354 ADD %RAX,0x178(%RSP) |
0x43c35c ADD %RAX,0x180(%RSP) |
0x43c364 ADD %RAX,0x188(%RSP) |
0x43c36c ADD %RAX,0x190(%RSP) |
0x43c374 MOV 0x400(%RSP),%RCX |
0x43c37c CMP $0x3,%RCX |
0x43c380 LEA 0x1(%RCX),%RCX |
0x43c384 MOV 0x40(%RSP),%R11 |
0x43c389 MOV 0x3f8(%RSP),%RAX |
0x43c391 JE 43c170 |
0x43c397 MOV %R15,0x80(%RSP) |
0x43c39f VMOVSD 0x620(%RSP,%RCX,8),%XMM0 |
0x43c3a8 VMULSD 0x3f0(%RSP),%XMM0,%XMM5 |
0x43c3b1 VMOVSD 0x3e8(%RSP),%XMM2 |
0x43c3ba VMULSD %XMM2,%XMM0,%XMM14 |
0x43c3be VMOVSD 0x3e0(%RSP),%XMM4 |
0x43c3c7 VMULSD %XMM4,%XMM0,%XMM1 |
0x43c3cb VMOVSD 0x580(%RSP,%RCX,8),%XMM0 |
0x43c3d4 VMULSD %XMM2,%XMM0,%XMM10 |
0x43c3d8 VMULSD %XMM4,%XMM0,%XMM0 |
0x43c3dc VMOVUPD %XMM0,0xf0(%RSP) |
0x43c3e5 VMULSD 0x540(%RSP,%RCX,8),%XMM4,%XMM0 |
0x43c3ee VMOVUPD %XMM0,0x50(%RSP) |
0x43c3f4 CMP $0x81,%R11D |
0x43c3fb VMOVAPD %XMM5,%XMM6 |
0x43c3ff VMOVUPD %XMM5,0x4b0(%RSP) |
0x43c408 VMOVUPD %XMM14,0x320(%RSP) |
0x43c411 VMOVUPD %XMM1,0x310(%RSP) |
0x43c41a VMOVUPD %XMM10,0x4a0(%RSP) |
0x43c423 MOV %RCX,0x400(%RSP) |
0x43c42b JB 43cf90 |
0x43c431 TEST %R11D,%R11D |
0x43c434 MOV 0x18(%RSP),%RBX |
0x43c439 MOV 0x88(%RSP),%RDI |
0x43c441 JLE 43c310 |
0x43c447 VBROADCASTSD %XMM6,%YMM0 |
0x43c44c VBROADCASTSD %XMM10,%YMM2 |
0x43c451 VMOVUPD %YMM2,0x7a0(%RSP) |
0x43c45a VBROADCASTSD %XMM14,%YMM10 |
0x43c45f VBROADCASTSD 0x50(%RSP),%YMM4 |
0x43c466 VBROADCASTSD 0xf0(%RSP),%YMM2 |
0x43c470 VBROADCASTSD %XMM1,%YMM5 |
0x43c475 MOV 0x3d0(%RSP),%RAX |
0x43c47d MOV %RAX,0x258(%RSP) |
0x43c485 MOV 0x150(%RSP),%RAX |
0x43c48d MOV %RAX,0x250(%RSP) |
0x43c495 MOV 0x148(%RSP),%RAX |
0x43c49d MOV %RAX,0x248(%RSP) |
0x43c4a5 MOV 0x140(%RSP),%RAX |
0x43c4ad MOV %RAX,0x240(%RSP) |
0x43c4b5 MOV 0x138(%RSP),%RAX |
0x43c4bd MOV %RAX,0x238(%RSP) |
0x43c4c5 MOV %R8,%RAX |
0x43c4c8 MOV 0x78(%RSP),%RCX |
0x43c4cd MOV %R10,%R15 |
0x43c4d0 MOV 0x168(%RSP),%R8 |
0x43c4d8 MOV %R8,0x210(%RSP) |
0x43c4e0 MOV %R9,0x208(%RSP) |
0x43c4e8 MOV %RDX,0x200(%RSP) |
0x43c4f0 MOV 0x158(%RSP),%RDX |
0x43c4f8 MOV %RDX,0x1f8(%RSP) |
0x43c500 MOV 0x160(%RSP),%RDX |
0x43c508 MOV %RDX,0x1f0(%RSP) |
0x43c510 MOV %RBX,0xa8(%RSP) |
0x43c518 MOV 0x190(%RSP),%RDX |
0x43c520 MOV %RDX,0x230(%RSP) |
0x43c528 MOV 0x188(%RSP),%RDX |
0x43c530 MOV %RDX,0x228(%RSP) |
0x43c538 MOV 0x180(%RSP),%RDX |
0x43c540 MOV %RDX,0x220(%RSP) |
0x43c548 MOV 0x178(%RSP),%RDX |
0x43c550 MOV %RDX,0x218(%RSP) |
0x43c558 MOV 0x1c8(%RSP),%RSI |
0x43c560 MOV 0x80(%RSP),%RDX |
0x43c568 MOV %RDX,0x1e8(%RSP) |
0x43c570 MOV %R12,0x1e0(%RSP) |
0x43c578 MOV %R13,0x1d8(%RSP) |
0x43c580 MOV %R14,0x1d0(%RSP) |
0x43c588 MOV %RDI,0xa0(%RSP) |
0x43c590 XOR %R11D,%R11D |
0x43c593 MOV %R12,0x420(%RSP) |
0x43c59b MOV %R13,0x418(%RSP) |
0x43c5a3 MOV %R14,0x410(%RSP) |
0x43c5ab VMOVUPD %YMM0,0x840(%RSP) |
0x43c5b4 VMOVUPD %YMM2,0x820(%RSP) |
0x43c5bd VMOVUPD %YMM4,0x800(%RSP) |
0x43c5c6 VMOVUPD %YMM5,0x7e0(%RSP) |
0x43c5cf VMOVUPD %YMM10,0x7c0(%RSP) |
0x43c5d8 JMP 43c76a |
(858) 0x43c5e0 ADDQ $0x200,0xa0(%RSP) |
(858) 0x43c5ec ADDQ $0x200,0x1d0(%RSP) |
(858) 0x43c5f8 ADDQ $0x200,0x1d8(%RSP) |
(858) 0x43c604 ADDQ $0x200,0x1e0(%RSP) |
(858) 0x43c610 ADDQ $0x200,0x1e8(%RSP) |
(858) 0x43c61c MOV 0x430(%RSP),%RSI |
(858) 0x43c624 ADD $-0x40,%RSI |
(858) 0x43c628 ADDQ $0x40,0x218(%RSP) |
(858) 0x43c631 ADDQ $0x40,0x220(%RSP) |
(858) 0x43c63a ADDQ $0x40,0x228(%RSP) |
(858) 0x43c643 ADDQ $0x40,0x230(%RSP) |
(858) 0x43c64c ADDQ $0x200,0xa8(%RSP) |
(858) 0x43c658 ADDQ $0x200,0x1f0(%RSP) |
(858) 0x43c664 ADDQ $0x200,0x1f8(%RSP) |
(858) 0x43c670 ADDQ $0x200,0x200(%RSP) |
(858) 0x43c67c ADDQ $0x200,0x208(%RSP) |
(858) 0x43c688 ADDQ $0x200,0x210(%RSP) |
(858) 0x43c694 MOV 0x260(%RSP),%R15 |
(858) 0x43c69c ADD $0x200,%R15 |
(858) 0x43c6a3 MOV 0x268(%RSP),%RCX |
(858) 0x43c6ab ADD $0x200,%RCX |
(858) 0x43c6b2 MOV 0xb0(%RSP),%RAX |
(858) 0x43c6ba ADD $0x200,%RAX |
(858) 0x43c6c0 ADDQ $0x40,0x238(%RSP) |
(858) 0x43c6c9 ADDQ $0x40,0x240(%RSP) |
(858) 0x43c6d2 ADDQ $0x40,0x248(%RSP) |
(858) 0x43c6db ADDQ $0x40,0x250(%RSP) |
(858) 0x43c6e4 ADDQ $0x40,0x258(%RSP) |
(858) 0x43c6ed MOV 0x428(%RSP),%R11 |
(858) 0x43c6f5 CMP 0x408(%RSP),%R11 |
(858) 0x43c6fd LEA 0x1(%R11),%R11 |
(858) 0x43c701 MOV 0x20(%RSP),%R8 |
(858) 0x43c706 VMOVUPD 0x100(%RSP),%XMM12 |
(858) 0x43c70f MOV 0x98(%RSP),%RDX |
(858) 0x43c717 MOV 0x90(%RSP),%R9 |
(858) 0x43c71f MOV 0x48(%RSP),%R10 |
(858) 0x43c724 VMOVAPD %XMM7,%XMM8 |
(858) 0x43c728 MOV 0x420(%RSP),%R12 |
(858) 0x43c730 MOV 0x418(%RSP),%R13 |
(858) 0x43c738 MOV 0x410(%RSP),%R14 |
(858) 0x43c740 VMOVUPD 0x840(%RSP),%YMM0 |
(858) 0x43c749 VMOVUPD 0x820(%RSP),%YMM2 |
(858) 0x43c752 VMOVUPD 0x800(%RSP),%YMM4 |
(858) 0x43c75b VMOVUPD 0x7e0(%RSP),%YMM5 |
(858) 0x43c764 JE 43c310 |
(858) 0x43c76a MOV %R15,0x260(%RSP) |
(858) 0x43c772 MOV %RCX,0x268(%RSP) |
(858) 0x43c77a MOV %RAX,0xb0(%RSP) |
(858) 0x43c782 CMP $0x3f,%RSI |
(858) 0x43c786 MOV $0x3f,%ECX |
(858) 0x43c78b CMOVL %RSI,%RCX |
(858) 0x43c78f MOV %R11,%RAX |
(858) 0x43c792 SAL $0x6,%RAX |
(858) 0x43c796 MOV 0x1c8(%RSP),%RBX |
(858) 0x43c79e SUB %RAX,%RBX |
(858) 0x43c7a1 CMP $0x40,%RBX |
(858) 0x43c7a5 MOV $0x3f,%EAX |
(858) 0x43c7aa CMOVGE %RAX,%RBX |
(858) 0x43c7ae INC %RBX |
(858) 0x43c7b1 MOV %RBX,%R10 |
(858) 0x43c7b4 AND $-0x4,%R10 |
(858) 0x43c7b8 MOV %RSI,0x430(%RSP) |
(858) 0x43c7c0 MOV %R11,0x428(%RSP) |
(858) 0x43c7c8 MOV %RCX,0xc0(%RSP) |
(858) 0x43c7d0 MOV %R10,0x110(%RSP) |
(858) 0x43c7d8 MOV %RBX,0xb8(%RSP) |
(858) 0x43c7e0 JE 43c9c0 |
(858) 0x43c7e6 LEA -0x1(%R10),%RAX |
(858) 0x43c7ea XOR %ECX,%ECX |
(858) 0x43c7ec VMOVUPD 0x660(%RSP),%YMM10 |
(858) 0x43c7f5 VMOVAPD %YMM0,%YMM8 |
(858) 0x43c7f9 VMOVUPD 0x7c0(%RSP),%YMM9 |
(858) 0x43c802 VMOVUPD 0x7a0(%RSP),%YMM7 |
(858) 0x43c80b VMOVAPD %YMM2,%YMM6 |
(858) 0x43c80f VMOVAPD %YMM4,%YMM1 |
(858) 0x43c813 VMOVAPD %YMM5,%YMM11 |
(858) 0x43c817 MOV 0x1e8(%RSP),%RDX |
(858) 0x43c81f MOV 0x1e0(%RSP),%RSI |
(858) 0x43c827 MOV 0x1d8(%RSP),%RDI |
(858) 0x43c82f MOV 0x1d0(%RSP),%R8 |
(858) 0x43c837 MOV 0xa0(%RSP),%R9 |
(858) 0x43c83f NOP |
(860) 0x43c840 VMOVUPD (%RDX,%RCX,8),%YMM14 |
(860) 0x43c845 VMOVUPD (%RSI,%RCX,8),%YMM2 |
(860) 0x43c84a VMOVUPD (%RDI,%RCX,8),%YMM13 |
(860) 0x43c84f VMOVUPD (%R8,%RCX,8),%YMM0 |
(860) 0x43c855 VMULPD %YMM15,%YMM14,%YMM12 |
(860) 0x43c85a VFMADD231PD %YMM3,%YMM2,%YMM12 |
(860) 0x43c85f VFMADD231PD 0x720(%RSP),%YMM13,%YMM12 |
(860) 0x43c869 VFMADD231PD 0x700(%RSP),%YMM0,%YMM12 |
(860) 0x43c873 VMULPD %YMM12,%YMM8,%YMM4 |
(860) 0x43c878 VMOVUPD %YMM4,0x1868(%RSP,%RCX,8) |
(860) 0x43c881 VMULPD 0x6e0(%RSP),%YMM14,%YMM4 |
(860) 0x43c88a VMULPD 0x6c0(%RSP),%YMM2,%YMM5 |
(860) 0x43c893 VFMADD231PD 0x760(%RSP),%YMM0,%YMM5 |
(860) 0x43c89d VFMADD231PD 0x780(%RSP),%YMM13,%YMM4 |
(860) 0x43c8a7 VFMADD231PD %YMM5,%YMM10,%YMM4 |
(860) 0x43c8ac VMULPD %YMM7,%YMM12,%YMM5 |
(860) 0x43c8b0 VMOVUPD %YMM5,0x1668(%RSP,%RCX,8) |
(860) 0x43c8b9 VMULPD %YMM4,%YMM9,%YMM5 |
(860) 0x43c8bd VMOVUPD %YMM5,0x1468(%RSP,%RCX,8) |
(860) 0x43c8c6 VMULPD 0x680(%RSP),%YMM14,%YMM5 |
(860) 0x43c8cf VFMADD231PD 0x6a0(%RSP),%YMM2,%YMM5 |
(860) 0x43c8d9 VMULPD %YMM1,%YMM12,%YMM2 |
(860) 0x43c8dd VMOVUPD %YMM2,0x1268(%RSP,%RCX,8) |
(860) 0x43c8e6 VFMADD231PD 0x740(%RSP),%YMM13,%YMM5 |
(860) 0x43c8f0 VMULPD %YMM6,%YMM4,%YMM2 |
(860) 0x43c8f4 VMOVUPD %YMM2,0x1068(%RSP,%RCX,8) |
(860) 0x43c8fd VFMADD231PD %YMM0,%YMM10,%YMM5 |
(860) 0x43c902 VMULPD %YMM5,%YMM11,%YMM0 |
(860) 0x43c906 VMOVUPD %YMM0,0xe68(%RSP,%RCX,8) |
(860) 0x43c90f VMULPD %YMM9,%YMM12,%YMM0 |
(860) 0x43c914 VMOVUPD %YMM0,0xc68(%RSP,%RCX,8) |
(860) 0x43c91d VMULPD %YMM6,%YMM12,%YMM0 |
(860) 0x43c921 VMOVUPD %YMM0,0xa68(%RSP,%RCX,8) |
(860) 0x43c92a VMULPD %YMM4,%YMM11,%YMM0 |
(860) 0x43c92e VMOVUPD %YMM0,0x868(%RSP,%RCX,8) |
(860) 0x43c937 VFMADD213PD (%R9,%RCX,8),%YMM11,%YMM12 |
(860) 0x43c93d VMOVUPD %YMM12,(%R9,%RCX,8) |
(860) 0x43c943 ADD $0x4,%RCX |
(860) 0x43c947 CMP %RAX,%RCX |
(860) 0x43c94a JLE 43c840 |
(858) 0x43c950 MOV %R10,%RDI |
(858) 0x43c953 CMP %R10,%RBX |
(858) 0x43c956 VMOVUPD 0x2e0(%RSP),%YMM10 |
(858) 0x43c95f VMOVUPD 0x520(%RSP),%YMM14 |
(858) 0x43c968 VMOVUPD 0x280(%RSP),%XMM4 |
(858) 0x43c971 VMOVUPD 0x500(%RSP),%YMM9 |
(858) 0x43c97a VMOVUPD 0x270(%RSP),%XMM7 |
(858) 0x43c983 VMOVUPD 0x100(%RSP),%XMM8 |
(858) 0x43c98c VMOVUPD 0x320(%RSP),%XMM1 |
(858) 0x43c995 VMOVUPD 0x310(%RSP),%XMM6 |
(858) 0x43c99e VMOVUPD 0xf0(%RSP),%XMM11 |
(858) 0x43c9a7 VMOVUPD 0x290(%RSP),%XMM15 |
(858) 0x43c9b0 JNE 43ca17 |
(858) 0x43c9b2 JMP 43cc06 |
(858) 0x43c9c0 XOR %EDI,%EDI |
(858) 0x43c9c2 VMOVUPD 0x290(%RSP),%XMM15 |
(858) 0x43c9cb VMOVAPD %XMM8,%XMM7 |
(858) 0x43c9cf VMOVUPD 0x2e0(%RSP),%YMM10 |
(858) 0x43c9d8 VMOVUPD 0x520(%RSP),%YMM14 |
(858) 0x43c9e1 VMOVUPD 0x280(%RSP),%XMM4 |
(858) 0x43c9ea VMOVUPD 0x500(%RSP),%YMM9 |
(858) 0x43c9f3 VMOVUPD 0x100(%RSP),%XMM8 |
(858) 0x43c9fc VMOVUPD 0x320(%RSP),%XMM1 |
(858) 0x43ca05 VMOVUPD 0x310(%RSP),%XMM6 |
(858) 0x43ca0e VMOVUPD 0xf0(%RSP),%XMM11 |
(858) 0x43ca17 MOV 0xc0(%RSP),%R8 |
(858) 0x43ca1f SUB %RDI,%R8 |
(858) 0x43ca22 INC %R8 |
(858) 0x43ca25 MOV 0xa0(%RSP),%RAX |
(858) 0x43ca2d LEA (%RAX,%RDI,8),%RSI |
(858) 0x43ca31 LEA (%RSP,%RDI,8),%RAX |
(858) 0x43ca35 ADD $0x868,%RAX |
(858) 0x43ca3b MOV %RAX,0x2c0(%RSP) |
(858) 0x43ca43 LEA 0xa68(%RSP,%RDI,8),%RAX |
(858) 0x43ca4b MOV %RAX,0x2a0(%RSP) |
(858) 0x43ca53 LEA 0xc68(%RSP,%RDI,8),%RAX |
(858) 0x43ca5b MOV %RAX,0x30(%RSP) |
(858) 0x43ca60 LEA 0xe68(%RSP,%RDI,8),%R10 |
(858) 0x43ca68 LEA 0x1068(%RSP,%RDI,8),%RCX |
(858) 0x43ca70 LEA 0x1268(%RSP,%RDI,8),%R9 |
(858) 0x43ca78 LEA 0x1468(%RSP,%RDI,8),%R14 |
(858) 0x43ca80 MOV 0x218(%RSP),%RAX |
(858) 0x43ca88 LEA (%RDI,%RAX,1),%RAX |
(858) 0x43ca8c MOV 0x198(%RSP),%R11 |
(858) 0x43ca94 LEA (%R11,%RAX,8),%R13 |
(858) 0x43ca98 MOV 0x220(%RSP),%RAX |
(858) 0x43caa0 ADD %RDI,%RAX |
(858) 0x43caa3 LEA (%R11,%RAX,8),%RBX |
(858) 0x43caa7 MOV 0x228(%RSP),%RAX |
(858) 0x43caaf ADD %RDI,%RAX |
(858) 0x43cab2 LEA (%R11,%RAX,8),%R12 |
(858) 0x43cab6 LEA (%RSP,%RDI,8),%R15 |
(858) 0x43caba ADD $0x1668,%R15 |
(858) 0x43cac1 LEA (%RSP,%RDI,8),%RAX |
(858) 0x43cac5 ADD $0x1868,%RAX |
(858) 0x43cacb ADD 0x230(%RSP),%RDI |
(858) 0x43cad3 LEA (%R11,%RDI,8),%RDI |
(858) 0x43cad7 XOR %R11D,%R11D |
(858) 0x43cada NOPW (%RAX,%RAX,1) |
(856) 0x43cae0 VMOVSD (%RDI,%R11,8),%XMM2 |
(856) 0x43cae6 VMOVSD (%R12,%R11,8),%XMM0 |
(856) 0x43caec VMOVSD (%R13,%R11,8),%XMM13 |
(856) 0x43caf3 VMOVAPD %XMM4,%XMM3 |
(856) 0x43caf7 VMOVSD (%RBX,%R11,8),%XMM4 |
(856) 0x43cafd VUNPCKLPD %XMM4,%XMM0,%XMM5 |
(856) 0x43cb01 VMULPD %XMM5,%XMM10,%XMM5 |
(856) 0x43cb05 VSHUFPD $0x1,%XMM5,%XMM5,%XMM12 |
(856) 0x43cb0a VFMADD231SD %XMM2,%XMM15,%XMM5 |
(856) 0x43cb0f VFMADD231SD %XMM7,%XMM13,%XMM12 |
(856) 0x43cb14 VADDSD %XMM5,%XMM12,%XMM12 |
(856) 0x43cb18 VUNPCKLPD %XMM0,%XMM2,%XMM5 |
(856) 0x43cb1c VMULPD %XMM5,%XMM14,%XMM5 |
(856) 0x43cb20 VMOVAPD %XMM7,%XMM10 |
(856) 0x43cb24 VMOVAPD %YMM14,%YMM7 |
(856) 0x43cb28 VUNPCKLPD %XMM13,%XMM4,%XMM14 |
(856) 0x43cb2d VFMADD132PD 0x610(%RSP),%XMM5,%XMM14 |
(856) 0x43cb37 VMULSD 0x4b0(%RSP),%XMM12,%XMM5 |
(856) 0x43cb40 VMOVSD %XMM5,(%RAX,%R11,8) |
(856) 0x43cb46 VMULSD 0x4a0(%RSP),%XMM12,%XMM5 |
(856) 0x43cb4f VMOVSD %XMM5,(%R15,%R11,8) |
(856) 0x43cb55 VSHUFPD $0x1,%XMM14,%XMM14,%XMM5 |
(856) 0x43cb5b VFMADD213SD %XMM14,%XMM8,%XMM5 |
(856) 0x43cb60 VMULSD %XMM1,%XMM5,%XMM14 |
(856) 0x43cb64 VMOVSD %XMM14,(%R14,%R11,8) |
(856) 0x43cb6a VMULSD 0x50(%RSP),%XMM12,%XMM14 |
(856) 0x43cb70 VMOVSD %XMM14,(%R9,%R11,8) |
(856) 0x43cb76 VMOVAPD %YMM7,%YMM14 |
(856) 0x43cb7a VMOVAPD %XMM10,%XMM7 |
(856) 0x43cb7e VUNPCKLPD %XMM4,%XMM2,%XMM2 |
(856) 0x43cb82 VMULSD %XMM5,%XMM11,%XMM4 |
(856) 0x43cb86 VMOVSD %XMM4,(%RCX,%R11,8) |
(856) 0x43cb8c VMOVAPD %XMM3,%XMM4 |
(856) 0x43cb90 VMULPD %XMM2,%XMM9,%XMM2 |
(856) 0x43cb94 VFMADD213SD %XMM2,%XMM3,%XMM0 |
(856) 0x43cb99 VSHUFPD $0x1,%XMM2,%XMM2,%XMM2 |
(856) 0x43cb9e VFMADD231SD %XMM13,%XMM8,%XMM2 |
(856) 0x43cba3 VADDSD %XMM0,%XMM2,%XMM0 |
(856) 0x43cba7 VMULSD %XMM6,%XMM0,%XMM0 |
(856) 0x43cbab VMOVSD %XMM0,(%R10,%R11,8) |
(856) 0x43cbb1 VMULSD %XMM1,%XMM12,%XMM0 |
(856) 0x43cbb5 MOV 0x30(%RSP),%RDX |
(856) 0x43cbba VMOVSD %XMM0,(%RDX,%R11,8) |
(856) 0x43cbc0 VMULSD %XMM11,%XMM12,%XMM0 |
(856) 0x43cbc5 MOV 0x2a0(%RSP),%RDX |
(856) 0x43cbcd VMOVSD %XMM0,(%RDX,%R11,8) |
(856) 0x43cbd3 VMULSD %XMM6,%XMM5,%XMM0 |
(856) 0x43cbd7 MOV 0x2c0(%RSP),%RDX |
(856) 0x43cbdf VMOVSD %XMM0,(%RDX,%R11,8) |
(856) 0x43cbe5 VFMADD213SD (%RSI,%R11,8),%XMM6,%XMM12 |
(856) 0x43cbeb VMOVSD %XMM12,(%RSI,%R11,8) |
(856) 0x43cbf1 VMOVUPD 0x2e0(%RSP),%YMM10 |
(856) 0x43cbfa INC %R11 |
(856) 0x43cbfd CMP %R11,%R8 |
(856) 0x43cc00 JNE 43cae0 |
(858) 0x43cc06 MOV 0x110(%RSP),%R12 |
(858) 0x43cc0e TEST %R12,%R12 |
(858) 0x43cc11 JE 43cd70 |
(858) 0x43cc17 LEA -0x1(%R12),%RAX |
(858) 0x43cc1c XOR %ECX,%ECX |
(858) 0x43cc1e VMOVUPD 0x270(%RSP),%XMM7 |
(858) 0x43cc27 VMOVUPD 0x4e0(%RSP),%YMM15 |
(858) 0x43cc30 VMOVUPD 0x4c0(%RSP),%YMM3 |
(858) 0x43cc39 MOV 0xb0(%RSP),%RDX |
(858) 0x43cc41 MOV 0x268(%RSP),%RSI |
(858) 0x43cc49 MOV 0x260(%RSP),%RDI |
(858) 0x43cc51 MOV 0x210(%RSP),%R8 |
(858) 0x43cc59 MOV 0x208(%RSP),%R9 |
(858) 0x43cc61 MOV 0x200(%RSP),%R10 |
(858) 0x43cc69 MOV 0x1f8(%RSP),%R11 |
(858) 0x43cc71 MOV 0x1f0(%RSP),%RBX |
(858) 0x43cc79 MOV 0xa8(%RSP),%R14 |
(858) 0x43cc81 NOPW %CS:(%RAX,%RAX,1) |
(859) 0x43cc90 VMOVUPD 0x1868(%RSP,%RCX,8),%YMM0 |
(859) 0x43cc99 VMOVUPD 0x1668(%RSP,%RCX,8),%YMM2 |
(859) 0x43cca2 VMOVUPD 0x1468(%RSP,%RCX,8),%YMM4 |
(859) 0x43ccab VMOVUPD 0x1268(%RSP,%RCX,8),%YMM5 |
(859) 0x43ccb4 VMOVUPD 0x1068(%RSP,%RCX,8),%YMM12 |
(859) 0x43ccbd VMOVUPD 0xe68(%RSP,%RCX,8),%YMM13 |
(859) 0x43ccc6 VMOVUPD 0xc68(%RSP,%RCX,8),%YMM14 |
(859) 0x43cccf VMOVUPD 0xa68(%RSP,%RCX,8),%YMM6 |
(859) 0x43ccd8 VMOVUPD 0x868(%RSP,%RCX,8),%YMM8 |
(859) 0x43cce1 VADDPD (%RDX,%RCX,8),%YMM0,%YMM0 |
(859) 0x43cce6 VMOVUPD %YMM0,(%RDX,%RCX,8) |
(859) 0x43cceb VADDPD (%RSI,%RCX,8),%YMM2,%YMM0 |
(859) 0x43ccf0 VMOVUPD %YMM0,(%RSI,%RCX,8) |
(859) 0x43ccf5 VADDPD (%R8,%RCX,8),%YMM4,%YMM0 |
(859) 0x43ccfb VMOVUPD %YMM0,(%R8,%RCX,8) |
(859) 0x43cd01 VADDPD (%R10,%RCX,8),%YMM5,%YMM0 |
(859) 0x43cd07 VMOVUPD %YMM0,(%R10,%RCX,8) |
(859) 0x43cd0d VADDPD (%R11,%RCX,8),%YMM12,%YMM0 |
(859) 0x43cd13 VMOVUPD %YMM0,(%R11,%RCX,8) |
(859) 0x43cd19 VADDPD (%RBX,%RCX,8),%YMM13,%YMM0 |
(859) 0x43cd1e VMOVUPD %YMM0,(%RBX,%RCX,8) |
(859) 0x43cd23 VADDPD (%R14,%RCX,8),%YMM14,%YMM0 |
(859) 0x43cd29 VMOVUPD %YMM0,(%R14,%RCX,8) |
(859) 0x43cd2f VADDPD (%RDI,%RCX,8),%YMM6,%YMM0 |
(859) 0x43cd34 VMOVUPD %YMM0,(%RDI,%RCX,8) |
(859) 0x43cd39 VADDPD (%R9,%RCX,8),%YMM8,%YMM0 |
(859) 0x43cd3f VMOVUPD %YMM0,(%R9,%RCX,8) |
(859) 0x43cd45 ADD $0x4,%RCX |
(859) 0x43cd49 CMP %RAX,%RCX |
(859) 0x43cd4c JLE 43cc90 |
(858) 0x43cd52 CMP %R12,0xb8(%RSP) |
(858) 0x43cd5a MOV 0xc0(%RSP),%RAX |
(858) 0x43cd62 JE 43c5e0 |
(858) 0x43cd68 JMP 43cd96 |
(858) 0x43cd70 XOR %R12D,%R12D |
(858) 0x43cd73 VMOVUPD 0x270(%RSP),%XMM7 |
(858) 0x43cd7c VMOVUPD 0x4e0(%RSP),%YMM15 |
(858) 0x43cd85 VMOVUPD 0x4c0(%RSP),%YMM3 |
(858) 0x43cd8e MOV 0xc0(%RSP),%RAX |
(858) 0x43cd96 SUB %R12,%RAX |
(858) 0x43cd99 INC %RAX |
(858) 0x43cd9c MOV %RAX,0xc0(%RSP) |
(858) 0x43cda4 MOV 0xa8(%RSP),%RAX |
(858) 0x43cdac LEA (%RAX,%R12,8),%RAX |
(858) 0x43cdb0 MOV 0x238(%RSP),%RCX |
(858) 0x43cdb8 ADD %R12,%RCX |
(858) 0x43cdbb MOV 0x20(%RSP),%R11 |
(858) 0x43cdc0 LEA (%R11,%RCX,8),%RCX |
(858) 0x43cdc4 MOV 0x240(%RSP),%RDX |
(858) 0x43cdcc LEA (%R12,%RDX,1),%RDX |
(858) 0x43cdd0 LEA (%R11,%RDX,8),%RDX |
(858) 0x43cdd4 MOV 0x248(%RSP),%RSI |
(858) 0x43cddc LEA (%R12,%RSI,1),%RSI |
(858) 0x43cde0 LEA (%R11,%RSI,8),%RSI |
(858) 0x43cde4 MOV 0x250(%RSP),%RDI |
(858) 0x43cdec LEA (%R12,%RDI,1),%R8 |
(858) 0x43cdf0 MOV 0x18(%RSP),%R9 |
(858) 0x43cdf5 LEA (%R9,%R8,8),%RDI |
(858) 0x43cdf9 LEA (%R11,%R8,8),%R8 |
(858) 0x43cdfd MOV 0x258(%RSP),%R10 |
(858) 0x43ce05 LEA (%R12,%R10,1),%R10 |
(858) 0x43ce09 LEA (%R9,%R10,8),%R9 |
(858) 0x43ce0d LEA (%R11,%R10,8),%R10 |
(858) 0x43ce11 MOV 0xb0(%RSP),%R11 |
(858) 0x43ce19 LEA (%R11,%R12,8),%R11 |
(858) 0x43ce1d LEA 0x868(%RSP,%R12,8),%RBX |
(858) 0x43ce25 MOV %RBX,0x2c0(%RSP) |
(858) 0x43ce2d LEA 0xa68(%RSP,%R12,8),%RBX |
(858) 0x43ce35 MOV %RBX,0x2a0(%RSP) |
(858) 0x43ce3d LEA 0xc68(%RSP,%R12,8),%RBX |
(858) 0x43ce45 MOV %RBX,0x30(%RSP) |
(858) 0x43ce4a LEA 0xe68(%RSP,%R12,8),%RBX |
(858) 0x43ce52 MOV %RBX,0x110(%RSP) |
(858) 0x43ce5a LEA 0x1068(%RSP,%R12,8),%RBX |
(858) 0x43ce62 MOV %RBX,0xb8(%RSP) |
(858) 0x43ce6a LEA 0x1268(%RSP,%R12,8),%RBX |
(858) 0x43ce72 MOV %RBX,0x438(%RSP) |
(858) 0x43ce7a LEA (%RSP,%R12,8),%R14 |
(858) 0x43ce7e ADD $0x1468,%R14 |
(858) 0x43ce85 LEA (%RSP,%R12,8),%R15 |
(858) 0x43ce89 ADD $0x1668,%R15 |
(858) 0x43ce90 LEA (%RSP,%R12,8),%R12 |
(858) 0x43ce94 ADD $0x1868,%R12 |
(858) 0x43ce9b XOR %R13D,%R13D |
(858) 0x43ce9e XCHG %AX,%AX |
(857) 0x43cea0 VMOVSD (%R12,%R13,8),%XMM0 |
(857) 0x43cea6 VMOVSD (%R15,%R13,8),%XMM2 |
(857) 0x43ceac VMOVSD (%R14,%R13,8),%XMM4 |
(857) 0x43ceb2 MOV 0x438(%RSP),%RBX |
(857) 0x43ceba VMOVSD (%RBX,%R13,8),%XMM5 |
(857) 0x43cec0 MOV 0xb8(%RSP),%RBX |
(857) 0x43cec8 VMOVSD (%RBX,%R13,8),%XMM6 |
(857) 0x43cece MOV 0x110(%RSP),%RBX |
(857) 0x43ced6 VMOVSD (%RBX,%R13,8),%XMM8 |
(857) 0x43cedc MOV 0x30(%RSP),%RBX |
(857) 0x43cee1 VMOVSD (%RBX,%R13,8),%XMM12 |
(857) 0x43cee7 MOV 0x2a0(%RSP),%RBX |
(857) 0x43ceef VMOVSD (%RBX,%R13,8),%XMM13 |
(857) 0x43cef5 MOV 0x2c0(%RSP),%RBX |
(857) 0x43cefd VMOVSD (%RBX,%R13,8),%XMM14 |
(857) 0x43cf03 VADDSD (%R11,%R13,8),%XMM0,%XMM0 |
(857) 0x43cf09 VMOVSD %XMM0,(%R11,%R13,8) |
(857) 0x43cf0f VADDSD (%R10,%R13,8),%XMM2,%XMM0 |
(857) 0x43cf15 VMOVSD %XMM0,(%R10,%R13,8) |
(857) 0x43cf1b VADDSD (%R8,%R13,8),%XMM4,%XMM0 |
(857) 0x43cf21 VMOVSD %XMM0,(%R8,%R13,8) |
(857) 0x43cf27 VADDSD (%RSI,%R13,8),%XMM5,%XMM0 |
(857) 0x43cf2d VMOVSD %XMM0,(%RSI,%R13,8) |
(857) 0x43cf33 VADDSD (%RDX,%R13,8),%XMM6,%XMM0 |
(857) 0x43cf39 VMOVSD %XMM0,(%RDX,%R13,8) |
(857) 0x43cf3f VADDSD (%RCX,%R13,8),%XMM8,%XMM0 |
(857) 0x43cf45 VMOVSD %XMM0,(%RCX,%R13,8) |
(857) 0x43cf4b VADDSD (%RAX,%R13,8),%XMM12,%XMM0 |
(857) 0x43cf51 VMOVSD %XMM0,(%RAX,%R13,8) |
(857) 0x43cf57 VADDSD (%R9,%R13,8),%XMM13,%XMM0 |
(857) 0x43cf5d VMOVSD %XMM0,(%R9,%R13,8) |
(857) 0x43cf63 VADDSD (%RDI,%R13,8),%XMM14,%XMM0 |
(857) 0x43cf69 VMOVSD %XMM0,(%RDI,%R13,8) |
(857) 0x43cf6f INC %R13 |
(857) 0x43cf72 CMP %R13,0xc0(%RSP) |
(857) 0x43cf7a JNE 43cea0 |
(858) 0x43cf80 JMP 43c5e0 |
0x43cf90 TEST %R11D,%R11D |
0x43cf93 MOV 0x18(%RSP),%RBX |
0x43cf98 MOV 0x88(%RSP),%RDI |
0x43cfa0 JLE 43c310 |
0x43cfa6 CMPQ $0,0x38(%RSP) |
0x43cfac JE 43d1ec |
0x43cfb2 VBROADCASTSD %XMM6,%YMM0 |
0x43cfb7 VMOVUPD %YMM0,0xc0(%RSP) |
0x43cfc0 VBROADCASTSD %XMM10,%YMM0 |
0x43cfc5 VMOVUPD %YMM0,0x2c0(%RSP) |
0x43cfce VBROADCASTSD %XMM14,%YMM7 |
0x43cfd3 VBROADCASTSD 0x50(%RSP),%YMM0 |
0x43cfda VMOVUPS %YMM0,0x2a0(%RSP) |
0x43cfe3 VMOVUPD 0x660(%RSP),%YMM3 |
0x43cfec VBROADCASTSD 0xf0(%RSP),%YMM10 |
0x43cff6 VBROADCASTSD %XMM1,%YMM11 |
0x43cffb XOR %EAX,%EAX |
0x43cffd VMOVUPD 0x720(%RSP),%YMM12 |
0x43d006 VMOVUPD 0x700(%RSP),%YMM13 |
0x43d00f VMOVUPD 0x6e0(%RSP),%YMM14 |
0x43d018 VMOVUPD 0x680(%RSP),%YMM15 |
0x43d021 VMOVUPD 0x6a0(%RSP),%YMM1 |
0x43d02a VMOVUPD 0x6c0(%RSP),%YMM9 |
0x43d033 MOV 0x1a0(%RSP),%R15 |
0x43d03b MOV %R14,%RSI |
0x43d03e MOV %R13,%R14 |
0x43d041 MOV %R12,%R13 |
0x43d044 MOV 0x80(%RSP),%R12 |
0x43d04c NOPL (%RAX) |
(855) 0x43d050 VMOVUPD (%R12,%RAX,8),%YMM2 |
(855) 0x43d056 VMOVUPD (%R13,%RAX,8),%YMM4 |
(855) 0x43d05d VMOVUPD (%R14,%RAX,8),%YMM0 |
(855) 0x43d063 VMOVUPD (%RSI,%RAX,8),%YMM8 |
(855) 0x43d068 VMULPD %YMM2,%YMM14,%YMM5 |
(855) 0x43d06c VMULPD %YMM4,%YMM9,%YMM6 |
(855) 0x43d070 VFMADD231PD 0x760(%RSP),%YMM8,%YMM6 |
(855) 0x43d07a VFMADD231PD 0x780(%RSP),%YMM0,%YMM5 |
(855) 0x43d084 VFMADD231PD %YMM6,%YMM3,%YMM5 |
(855) 0x43d089 VMULPD 0x4e0(%RSP),%YMM2,%YMM6 |
(855) 0x43d092 VFMADD231PD 0x4c0(%RSP),%YMM4,%YMM6 |
(855) 0x43d09c VFMADD231PD %YMM12,%YMM0,%YMM6 |
(855) 0x43d0a1 VFMADD231PD %YMM8,%YMM13,%YMM6 |
(855) 0x43d0a6 VMULPD %YMM2,%YMM15,%YMM2 |
(855) 0x43d0aa VFMADD231PD %YMM4,%YMM1,%YMM2 |
(855) 0x43d0af LEA (%R8,%RAX,8),%RCX |
(855) 0x43d0b3 VMOVUPD (%R8,%RAX,8),%YMM4 |
(855) 0x43d0b9 VFMADD231PD 0xc0(%RSP),%YMM6,%YMM4 |
(855) 0x43d0c3 VMOVUPD %YMM4,(%R8,%RAX,8) |
(855) 0x43d0c9 VMOVUPD (%R15,%RCX,1),%YMM4 |
(855) 0x43d0cf VFMADD231PD 0x2c0(%RSP),%YMM6,%YMM4 |
(855) 0x43d0d9 VMOVUPD %YMM4,(%R15,%RCX,1) |
(855) 0x43d0df VFMADD231PD 0x740(%RSP),%YMM0,%YMM2 |
(855) 0x43d0e9 LEA (%RCX,%R15,1),%RCX |
(855) 0x43d0ed VMOVUPD (%R15,%RCX,1),%YMM0 |
(855) 0x43d0f3 VFMADD231PD %YMM7,%YMM5,%YMM0 |
(855) 0x43d0f8 VMOVUPD %YMM0,(%R15,%RCX,1) |
(855) 0x43d0fe LEA (%RCX,%R15,1),%RCX |
(855) 0x43d102 VMOVUPD (%R15,%RCX,1),%YMM0 |
(855) 0x43d108 VFMADD231PD 0x2a0(%RSP),%YMM6,%YMM0 |
(855) 0x43d112 VMOVUPD %YMM0,(%R15,%RCX,1) |
(855) 0x43d118 LEA (%RCX,%R15,1),%RCX |
(855) 0x43d11c VMOVUPD (%R15,%RCX,1),%YMM0 |
(855) 0x43d122 VFMADD231PD %YMM10,%YMM5,%YMM0 |
(855) 0x43d127 VMOVUPD %YMM0,(%R15,%RCX,1) |
(855) 0x43d12d VFMADD231PD %YMM8,%YMM3,%YMM2 |
(855) 0x43d132 LEA (%RCX,%R15,1),%RCX |
(855) 0x43d136 VFMADD213PD (%R15,%RCX,1),%YMM11,%YMM2 |
(855) 0x43d13c VMOVUPD %YMM2,(%R15,%RCX,1) |
(855) 0x43d142 MOV 0x38(%RSP),%RCX |
(855) 0x43d147 VMOVUPD (%RBX,%RAX,8),%YMM0 |
(855) 0x43d14c VFMADD231PD %YMM7,%YMM6,%YMM0 |
(855) 0x43d151 VMOVUPD %YMM0,(%RBX,%RAX,8) |
(855) 0x43d156 VMOVUPD (%R10,%RAX,8),%YMM0 |
(855) 0x43d15c VFMADD231PD %YMM10,%YMM6,%YMM0 |
(855) 0x43d161 VMOVUPD %YMM0,(%R10,%RAX,8) |
(855) 0x43d167 VFMADD213PD (%R9,%RAX,8),%YMM11,%YMM5 |
(855) 0x43d16d VMOVUPD %YMM5,(%R9,%RAX,8) |
(855) 0x43d173 VFMADD213PD (%RDI,%RAX,8),%YMM11,%YMM6 |
(855) 0x43d179 VMOVUPD %YMM6,(%RDI,%RAX,8) |
(855) 0x43d17e ADD $0x4,%RAX |
(855) 0x43d182 CMP %RCX,%RAX |
(855) 0x43d185 JL 43d050 |
0x43d18b MOV %RCX,%RAX |
0x43d18e CMP 0x40(%RSP),%RCX |
0x43d193 VMOVUPD 0x100(%RSP),%XMM12 |
0x43d19c VMOVUPD 0x4e0(%RSP),%YMM15 |
0x43d1a5 VMOVUPD 0x4c0(%RSP),%YMM3 |
0x43d1ae VMOVUPD 0x270(%RSP),%XMM8 |
0x43d1b7 MOV %R13,%R12 |
0x43d1ba MOV %R14,%R13 |
0x43d1bd MOV %RSI,%R14 |
0x43d1c0 VMOVUPD 0x4b0(%RSP),%XMM9 |
0x43d1c9 VMOVUPD 0x320(%RSP),%XMM14 |
0x43d1d2 VMOVUPD 0x310(%RSP),%XMM1 |
0x43d1db VMOVUPD 0x4a0(%RSP),%XMM10 |
0x43d1e4 JE 43c310 |
0x43d1ea JMP 43d1f2 |
0x43d1ec XOR %EAX,%EAX |
0x43d1ee VMOVAPD %XMM6,%XMM9 |
0x43d1f2 MOV 0x1a0(%RSP),%R15 |
0x43d1fa MOV 0x88(%RSP),%RDI |
0x43d202 MOV 0x18(%RSP),%RBX |
0x43d207 NOPW (%RAX,%RAX,1) |
(854) 0x43d210 MOV 0x1c0(%RSP),%RCX |
(854) 0x43d218 VMOVSD (%RCX,%RAX,8),%XMM2 |
(854) 0x43d21d MOV 0x1b8(%RSP),%RCX |
(854) 0x43d225 VMOVSD (%RCX,%RAX,8),%XMM4 |
(854) 0x43d22a MOV 0x1b0(%RSP),%RCX |
(854) 0x43d232 VMOVSD (%RCX,%RAX,8),%XMM0 |
(854) 0x43d237 MOV 0x1a8(%RSP),%RCX |
(854) 0x43d23f VMOVSD (%RCX,%RAX,8),%XMM7 |
(854) 0x43d244 VMULSD 0x520(%RSP),%XMM2,%XMM5 |
(854) 0x43d24d VMULSD 0x5f0(%RSP),%XMM4,%XMM6 |
(854) 0x43d256 VFMADD231SD 0x490(%RSP),%XMM7,%XMM6 |
(854) 0x43d260 VFMADD231SD 0x480(%RSP),%XMM0,%XMM5 |
(854) 0x43d26a VFMADD231SD %XMM6,%XMM12,%XMM5 |
(854) 0x43d26f VMULSD 0x290(%RSP),%XMM2,%XMM6 |
(854) 0x43d278 VFMADD231SD 0x2e0(%RSP),%XMM4,%XMM6 |
(854) 0x43d282 VFMADD231SD 0x600(%RSP),%XMM0,%XMM6 |
(854) 0x43d28c VFMADD231SD %XMM7,%XMM8,%XMM6 |
(854) 0x43d291 VMULSD 0x500(%RSP),%XMM2,%XMM2 |
(854) 0x43d29a VFMADD231SD 0x280(%RSP),%XMM4,%XMM2 |
(854) 0x43d2a4 LEA (%R8,%RAX,8),%RCX |
(854) 0x43d2a8 VMOVSD (%R8,%RAX,8),%XMM4 |
(854) 0x43d2ae VFMADD231SD %XMM6,%XMM9,%XMM4 |
(854) 0x43d2b3 VMOVSD %XMM4,(%R8,%RAX,8) |
(854) 0x43d2b9 VMOVSD (%R15,%RCX,1),%XMM4 |
(854) 0x43d2bf VFMADD231SD %XMM6,%XMM10,%XMM4 |
(854) 0x43d2c4 VMOVSD %XMM4,(%R15,%RCX,1) |
(854) 0x43d2ca VFMADD231SD 0x5e0(%RSP),%XMM0,%XMM2 |
(854) 0x43d2d4 LEA (%RCX,%R15,1),%RCX |
(854) 0x43d2d8 VMOVSD (%R15,%RCX,1),%XMM0 |
(854) 0x43d2de VFMADD231SD %XMM14,%XMM5,%XMM0 |
(854) 0x43d2e3 VMOVSD %XMM0,(%R15,%RCX,1) |
(854) 0x43d2e9 LEA (%RCX,%R15,1),%RCX |
(854) 0x43d2ed VMOVSD (%R15,%RCX,1),%XMM0 |
(854) 0x43d2f3 VFMADD231SD 0x50(%RSP),%XMM6,%XMM0 |
(854) 0x43d2fa VMOVSD %XMM0,(%R15,%RCX,1) |
(854) 0x43d300 LEA (%RCX,%R15,1),%RCX |
(854) 0x43d304 VMOVSD (%R15,%RCX,1),%XMM0 |
(854) 0x43d30a VMOVUPD 0xf0(%RSP),%XMM4 |
(854) 0x43d313 VFMADD231SD %XMM4,%XMM5,%XMM0 |
(854) 0x43d318 VMOVSD %XMM0,(%R15,%RCX,1) |
(854) 0x43d31e VFMADD231SD %XMM7,%XMM12,%XMM2 |
(854) 0x43d323 LEA (%RCX,%R15,1),%RCX |
(854) 0x43d327 VFMADD213SD (%R15,%RCX,1),%XMM1,%XMM2 |
(854) 0x43d32d VMOVSD %XMM2,(%R15,%RCX,1) |
(854) 0x43d333 VMOVSD (%RBX,%RAX,8),%XMM0 |
(854) 0x43d338 VFMADD231SD %XMM14,%XMM6,%XMM0 |
(854) 0x43d33d VMOVSD %XMM0,(%RBX,%RAX,8) |
(854) 0x43d342 VMOVSD (%R10,%RAX,8),%XMM0 |
(854) 0x43d348 VFMADD231SD %XMM4,%XMM6,%XMM0 |
(854) 0x43d34d VMOVSD %XMM0,(%R10,%RAX,8) |
(854) 0x43d353 VFMADD213SD (%R9,%RAX,8),%XMM1,%XMM5 |
(854) 0x43d359 VMOVSD %XMM5,(%R9,%RAX,8) |
(854) 0x43d35f VFMADD213SD (%RDI,%RAX,8),%XMM1,%XMM6 |
(854) 0x43d365 VMOVSD %XMM6,(%RDI,%RAX,8) |
(854) 0x43d36a INC %RAX |
(854) 0x43d36d CMP %RAX,0x40(%RSP) |
(854) 0x43d372 JNE 43d210 |
0x43d378 JMP 43c310 |
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/TinyVector.h: 61 - 61 |
-------------------------------------------------------------------------------- |
61: for (size_t d = 0; d < D; ++d) |
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/Numerics/Spline2/MultiBsplineRef.hpp: 227 - 262 |
-------------------------------------------------------------------------------- |
227: for (int j = 0; j < 4; j++) |
[...] |
234: const T pre20 = d2a[i] * b[j]; |
235: const T pre10 = da[i] * b[j]; |
236: const T pre00 = a[i] * b[j]; |
237: const T pre11 = da[i] * db[j]; |
238: const T pre01 = a[i] * db[j]; |
239: const T pre02 = a[i] * d2b[j]; |
240: |
241: const int iSplitPoint = num_splines; |
242: for (int n = 0; n < iSplitPoint; n++) |
243: { |
244: T coefsv = coefs[n]; |
245: T coefsvzs = coefszs[n]; |
246: T coefsv2zs = coefs2zs[n]; |
247: T coefsv3zs = coefs3zs[n]; |
248: |
249: T sum0 = c[0] * coefsv + c[1] * coefsvzs + c[2] * coefsv2zs + c[3] * coefsv3zs; |
250: T sum1 = dc[0] * coefsv + dc[1] * coefsvzs + dc[2] * coefsv2zs + dc[3] * coefsv3zs; |
251: T sum2 = d2c[0] * coefsv + d2c[1] * coefsvzs + d2c[2] * coefsv2zs + d2c[3] * coefsv3zs; |
252: |
253: hxx[n] += pre20 * sum0; |
254: hxy[n] += pre11 * sum0; |
255: hxz[n] += pre10 * sum1; |
256: hyy[n] += pre02 * sum0; |
257: hyz[n] += pre01 * sum1; |
258: hzz[n] += pre00 * sum2; |
259: gx[n] += pre10 * sum0; |
260: gy[n] += pre01 * sum0; |
261: gz[n] += pre00 * sum1; |
262: vals[n] += pre00 * sum0; |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►87.78+ | miniqmcreference::DiracDetermi[...] | DiracDeterminantRef.cpp:100 | exec |
○ | qmcplusplus::WaveFunction::rat[...] | WaveFunction.cpp:196 | exec |
○ | main.extracted.110 | refwrap.h:313 | exec |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so | |
►7.07+ | qmcplusplus::SPOSet::evaluate_[...] | OhmmsVector.h:144 | exec |
○ | miniqmcreference::DiracDetermi[...] | DiracDeterminantRef.cpp:263 | exec |
○ | miniqmcreference::DiracDetermi[...] | DiracDeterminantRef.cpp:238 | exec |
○ | qmcplusplus::WaveFunction::eva[...] | WaveFunction.cpp:170 | exec |
○ | main.extracted.113 | miniqmc.cpp:397 | exec |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so | |
►5.15+ | qmcplusplus::SPOSet::evaluate_[...] | OhmmsVector.h:144 | exec |
○ | miniqmcreference::DiracDetermi[...] | DiracDeterminantRef.cpp:263 | exec |
○ | miniqmcreference::DiracDetermi[...] | DiracDeterminantRef.cpp:238 | exec |
○ | qmcplusplus::WaveFunction::eva[...] | WaveFunction.cpp:171 | exec |
○ | main.extracted.113 | miniqmc.cpp:397 | exec |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Path / |
Metric | Value |
---|---|
CQA speedup if no scalar integer | 2.46 |
CQA speedup if FP arith vectorized | 1.11 |
CQA speedup if fully vectorized | 5.27 |
CQA speedup if no inter-iteration dependency | NA |
CQA speedup if next bottleneck killed | 1.11 |
Bottlenecks | micro-operation queue |
Function | miniqmcreference::einspline_spo_ref |
Source | TinyVector.h:61-61,MultiBsplineRef.hpp:227-227,MultiBsplineRef.hpp:234-239,MultiBsplineRef.hpp:242-242,MultiBsplineRef.hpp:253-258 |
Source loop unroll info | NA |
Source loop unroll confidence level | NA |
Unroll/vectorization loop type | NA |
Unroll factor | NA |
CQA cycles | 26.67 |
CQA cycles if no scalar integer | 10.83 |
CQA cycles if FP arith vectorized | 24.00 |
CQA cycles if fully vectorized | 5.06 |
Front-end cycles | 26.67 |
DIV/SQRT cycles | 7.50 |
P0 cycles | 7.60 |
P1 cycles | 21.67 |
P2 cycles | 21.67 |
P3 cycles | 24.00 |
P4 cycles | 8.00 |
P5 cycles | 7.50 |
P6 cycles | 24.00 |
P7 cycles | 24.00 |
P8 cycles | 24.00 |
P9 cycles | 7.40 |
P10 cycles | 21.67 |
P11 cycles | 0.00 |
Inter-iter dependencies cycles | NA |
FE+BE cycles (UFS) | 28.22 |
Stall cycles (UFS) | 0.00 |
Nb insns | 151.00 |
Nb uops | 159.00 |
Nb loads | 65.00 |
Nb stores | 48.00 |
Nb stack references | 80.00 |
FLOP/cycle | 0.22 |
Nb FLOP add-sub | 0.00 |
Nb FLOP mul | 6.00 |
Nb FLOP fma | 0.00 |
Nb FLOP div | 0.00 |
Nb FLOP rcp | 0.00 |
Nb FLOP sqrt | 0.00 |
Nb FLOP rsqrt | 0.00 |
Bytes/cycle | 53.70 |
Bytes prefetched | 0.00 |
Bytes loaded | 784.00 |
Bytes stored | 648.00 |
Stride 0 | NA |
Stride 1 | NA |
Stride n | NA |
Stride unknown | NA |
Stride indirect | NA |
Vectorization ratio all | 25.81 |
Vectorization ratio load | 27.78 |
Vectorization ratio store | 31.25 |
Vectorization ratio mul | 0.00 |
Vectorization ratio add_sub | 0.00 |
Vectorization ratio fma | NA |
Vectorization ratio div_sqrt | NA |
Vectorization ratio other | 7.41 |
Vector-efficiency ratio all | 19.15 |
Vector-efficiency ratio load | 20.14 |
Vector-efficiency ratio store | 21.09 |
Vector-efficiency ratio mul | 12.50 |
Vector-efficiency ratio add_sub | 12.50 |
Vector-efficiency ratio fma | NA |
Vector-efficiency ratio div_sqrt | NA |
Vector-efficiency ratio other | 12.50 |
Metric | Value |
---|---|
CQA speedup if no scalar integer | 2.46 |
CQA speedup if FP arith vectorized | 1.11 |
CQA speedup if fully vectorized | 5.27 |
CQA speedup if no inter-iteration dependency | NA |
CQA speedup if next bottleneck killed | 1.11 |
Bottlenecks | micro-operation queue |
Function | miniqmcreference::einspline_spo_ref |
Source | TinyVector.h:61-61,MultiBsplineRef.hpp:227-227,MultiBsplineRef.hpp:234-239,MultiBsplineRef.hpp:242-242,MultiBsplineRef.hpp:253-258 |
Source loop unroll info | NA |
Source loop unroll confidence level | NA |
Unroll/vectorization loop type | NA |
Unroll factor | NA |
CQA cycles | 26.67 |
CQA cycles if no scalar integer | 10.83 |
CQA cycles if FP arith vectorized | 24.00 |
CQA cycles if fully vectorized | 5.06 |
Front-end cycles | 26.67 |
DIV/SQRT cycles | 7.50 |
P0 cycles | 7.60 |
P1 cycles | 21.67 |
P2 cycles | 21.67 |
P3 cycles | 24.00 |
P4 cycles | 8.00 |
P5 cycles | 7.50 |
P6 cycles | 24.00 |
P7 cycles | 24.00 |
P8 cycles | 24.00 |
P9 cycles | 7.40 |
P10 cycles | 21.67 |
P11 cycles | 0.00 |
Inter-iter dependencies cycles | NA |
FE+BE cycles (UFS) | 28.22 |
Stall cycles (UFS) | 0.00 |
Nb insns | 151.00 |
Nb uops | 159.00 |
Nb loads | 65.00 |
Nb stores | 48.00 |
Nb stack references | 80.00 |
FLOP/cycle | 0.22 |
Nb FLOP add-sub | 0.00 |
Nb FLOP mul | 6.00 |
Nb FLOP fma | 0.00 |
Nb FLOP div | 0.00 |
Nb FLOP rcp | 0.00 |
Nb FLOP sqrt | 0.00 |
Nb FLOP rsqrt | 0.00 |
Bytes/cycle | 53.70 |
Bytes prefetched | 0.00 |
Bytes loaded | 784.00 |
Bytes stored | 648.00 |
Stride 0 | NA |
Stride 1 | NA |
Stride n | NA |
Stride unknown | NA |
Stride indirect | NA |
Vectorization ratio all | 25.81 |
Vectorization ratio load | 27.78 |
Vectorization ratio store | 31.25 |
Vectorization ratio mul | 0.00 |
Vectorization ratio add_sub | 0.00 |
Vectorization ratio fma | NA |
Vectorization ratio div_sqrt | NA |
Vectorization ratio other | 7.41 |
Vector-efficiency ratio all | 19.15 |
Vector-efficiency ratio load | 20.14 |
Vector-efficiency ratio store | 21.09 |
Vector-efficiency ratio mul | 12.50 |
Vector-efficiency ratio add_sub | 12.50 |
Vector-efficiency ratio fma | NA |
Vector-efficiency ratio div_sqrt | NA |
Vector-efficiency ratio other | 12.50 |
Path / |
Function | miniqmcreference::einspline_spo_ref |
Source file and lines | MultiBsplineRef.hpp:227-262 |
Module | exec |
nb instructions | 151 |
nb uops | 159 |
loop length | 1047 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 11 |
used ymm registers | 14 |
used zmm registers | 0 |
nb stack references | 80 |
micro-operation queue | 26.67 cycles |
front end | 26.67 cycles |
Metric | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 7.50 | 7.60 | 21.67 | 21.67 | 24.00 | 8.00 | 7.50 | 24.00 | 24.00 | 24.00 | 7.40 | 21.67 |
cycles | 7.50 | 7.60 | 21.67 | 21.67 | 24.00 | 8.00 | 7.50 | 24.00 | 24.00 | 24.00 | 7.40 | 21.67 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 28.22 |
Stall cycles | 0.00 |
Front-end | 26.67 |
Dispatch | 24.00 |
Overall L1 | 26.67 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 0% |
all | 59% |
load | 60% |
store | 100% |
mul | 0% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
all | 25% |
load | 27% |
store | 31% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 7% |
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 10% |
all | 28% |
load | 29% |
store | 40% |
mul | 12% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
all | 19% |
load | 20% |
store | 21% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
MOV 0x3d8(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RAX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x80(%RSP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,0x1a8(%RSP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
ADD %RAX,0x1b0(%RSP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
ADD %RAX,0x1b8(%RSP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
ADD %RAX,0x1c0(%RSP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
MOV 0x170(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RAX,0x178(%RSP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
ADD %RAX,0x180(%RSP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
ADD %RAX,0x188(%RSP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
ADD %RAX,0x190(%RSP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
MOV 0x400(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x3,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA 0x1(%RCX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x40(%RSP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x3f8(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JE 43c170 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0xb60> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R15,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD 0x620(%RSP,%RCX,8),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD 0x3f0(%RSP),%XMM0,%XMM5 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VMOVSD 0x3e8(%RSP),%XMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD %XMM2,%XMM0,%XMM14 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD 0x3e0(%RSP),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD %XMM4,%XMM0,%XMM1 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD 0x580(%RSP,%RCX,8),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD %XMM2,%XMM0,%XMM10 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULSD %XMM4,%XMM0,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVUPD %XMM0,0xf0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMULSD 0x540(%RSP,%RCX,8),%XMM4,%XMM0 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VMOVUPD %XMM0,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
CMP $0x81,%R11D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VMOVAPD %XMM5,%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.17 |
VMOVUPD %XMM5,0x4b0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM14,0x320(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM1,0x310(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM10,0x4a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV %RCX,0x400(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JB 43cf90 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0x1980> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
TEST %R11D,%R11D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV 0x18(%RSP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x88(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 43c310 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0xd00> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VBROADCASTSD %XMM6,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM10,%YMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM2,0x7a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM14,%YMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VBROADCASTSD 0x50(%RSP),%YMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0xf0(%RSP),%YMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD %XMM1,%YMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0x3d0(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x258(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x150(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x250(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x148(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x248(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x140(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x240(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x138(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x238(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x78(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R10,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x168(%RSP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R8,0x210(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,0x208(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,0x200(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x158(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x1f8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x160(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x1f0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x190(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x230(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x188(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x228(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x180(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x220(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x178(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x218(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x1c8(%RSP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x80(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x1e8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R12,0x1e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,0x1d8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,0x1d0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %R11D,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R12,0x420(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,0x418(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,0x410(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVUPD %YMM0,0x840(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM2,0x820(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM4,0x800(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM5,0x7e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM10,0x7c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
JMP 43c76a <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0x115a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
TEST %R11D,%R11D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV 0x18(%RSP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x88(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 43c310 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0xd00> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMPQ $0,0x38(%RSP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 43d1ec <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0x1bdc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VBROADCASTSD %XMM6,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM10,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x2c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM14,%YMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VBROADCASTSD 0x50(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x2a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD 0x660(%RSP),%YMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VBROADCASTSD 0xf0(%RSP),%YMM10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD %XMM1,%YMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVUPD 0x720(%RSP),%YMM12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x700(%RSP),%YMM13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x6e0(%RSP),%YMM14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x680(%RSP),%YMM15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x6a0(%RSP),%YMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x6c0(%RSP),%YMM9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV 0x1a0(%RSP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R13,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R12,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x80(%RSP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RCX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP 0x40(%RSP),%RCX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
VMOVUPD 0x100(%RSP),%XMM12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x4e0(%RSP),%YMM15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x4c0(%RSP),%YMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x270(%RSP),%XMM8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV %R13,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R14,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RSI,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VMOVUPD 0x4b0(%RSP),%XMM9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x320(%RSP),%XMM14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x310(%RSP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x4a0(%RSP),%XMM10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
JE 43c310 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0xd00> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 43d1f2 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0x1be2> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVAPD %XMM6,%XMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.17 |
MOV 0x1a0(%RSP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x88(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RSP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 43c310 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0xd00> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
Function | miniqmcreference::einspline_spo_ref |
Source file and lines | MultiBsplineRef.hpp:227-262 |
Module | exec |
nb instructions | 151 |
nb uops | 159 |
loop length | 1047 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 11 |
used ymm registers | 14 |
used zmm registers | 0 |
nb stack references | 80 |
micro-operation queue | 26.67 cycles |
front end | 26.67 cycles |
Metric | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 7.50 | 7.60 | 21.67 | 21.67 | 24.00 | 8.00 | 7.50 | 24.00 | 24.00 | 24.00 | 7.40 | 21.67 |
cycles | 7.50 | 7.60 | 21.67 | 21.67 | 24.00 | 8.00 | 7.50 | 24.00 | 24.00 | 24.00 | 7.40 | 21.67 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 28.22 |
Stall cycles | 0.00 |
Front-end | 26.67 |
Dispatch | 24.00 |
Overall L1 | 26.67 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 0% |
all | 59% |
load | 60% |
store | 100% |
mul | 0% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
all | 25% |
load | 27% |
store | 31% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 7% |
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 10% |
all | 28% |
load | 29% |
store | 40% |
mul | 12% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
all | 19% |
load | 20% |
store | 21% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
MOV 0x3d8(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RAX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x80(%RSP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,0x1a8(%RSP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
ADD %RAX,0x1b0(%RSP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
ADD %RAX,0x1b8(%RSP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
ADD %RAX,0x1c0(%RSP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
MOV 0x170(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RAX,0x178(%RSP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
ADD %RAX,0x180(%RSP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
ADD %RAX,0x188(%RSP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
ADD %RAX,0x190(%RSP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
MOV 0x400(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x3,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA 0x1(%RCX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x40(%RSP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x3f8(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JE 43c170 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0xb60> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R15,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD 0x620(%RSP,%RCX,8),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD 0x3f0(%RSP),%XMM0,%XMM5 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VMOVSD 0x3e8(%RSP),%XMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD %XMM2,%XMM0,%XMM14 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD 0x3e0(%RSP),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD %XMM4,%XMM0,%XMM1 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD 0x580(%RSP,%RCX,8),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD %XMM2,%XMM0,%XMM10 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULSD %XMM4,%XMM0,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVUPD %XMM0,0xf0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMULSD 0x540(%RSP,%RCX,8),%XMM4,%XMM0 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VMOVUPD %XMM0,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
CMP $0x81,%R11D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VMOVAPD %XMM5,%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.17 |
VMOVUPD %XMM5,0x4b0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM14,0x320(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM1,0x310(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM10,0x4a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV %RCX,0x400(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JB 43cf90 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0x1980> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
TEST %R11D,%R11D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV 0x18(%RSP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x88(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 43c310 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0xd00> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VBROADCASTSD %XMM6,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM10,%YMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM2,0x7a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM14,%YMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VBROADCASTSD 0x50(%RSP),%YMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0xf0(%RSP),%YMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD %XMM1,%YMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0x3d0(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x258(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x150(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x250(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x148(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x248(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x140(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x240(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x138(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x238(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x78(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R10,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x168(%RSP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R8,0x210(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,0x208(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,0x200(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x158(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x1f8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x160(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x1f0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x190(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x230(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x188(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x228(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x180(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x220(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x178(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x218(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x1c8(%RSP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x80(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x1e8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R12,0x1e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,0x1d8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,0x1d0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %R11D,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R12,0x420(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,0x418(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,0x410(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVUPD %YMM0,0x840(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM2,0x820(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM4,0x800(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM5,0x7e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM10,0x7c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
JMP 43c76a <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0x115a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
TEST %R11D,%R11D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV 0x18(%RSP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x88(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 43c310 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0xd00> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMPQ $0,0x38(%RSP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 43d1ec <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0x1bdc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VBROADCASTSD %XMM6,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM10,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x2c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM14,%YMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VBROADCASTSD 0x50(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x2a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD 0x660(%RSP),%YMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VBROADCASTSD 0xf0(%RSP),%YMM10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD %XMM1,%YMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVUPD 0x720(%RSP),%YMM12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x700(%RSP),%YMM13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x6e0(%RSP),%YMM14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x680(%RSP),%YMM15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x6a0(%RSP),%YMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x6c0(%RSP),%YMM9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV 0x1a0(%RSP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R13,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R12,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x80(%RSP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RCX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP 0x40(%RSP),%RCX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
VMOVUPD 0x100(%RSP),%XMM12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x4e0(%RSP),%YMM15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x4c0(%RSP),%YMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x270(%RSP),%XMM8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV %R13,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R14,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RSI,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VMOVUPD 0x4b0(%RSP),%XMM9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x320(%RSP),%XMM14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x310(%RSP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x4a0(%RSP),%XMM10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
JE 43c310 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0xd00> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 43d1f2 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0x1be2> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVAPD %XMM6,%XMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.17 |
MOV 0x1a0(%RSP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x88(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RSP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 43c310 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0xd00> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |