Loop Id: 1617 | Module: libparcsr_ls.so | Source: par_lr_interp.c:1221-1675 [...] | Coverage: 0.04% |
---|
Loop Id: 1617 | Module: libparcsr_ls.so | Source: par_lr_interp.c:1221-1675 [...] | Coverage: 0.04% |
---|
0x5b1a0 MOV -0x90(%RBP),%RCX |
0x5b1a7 MOV (%RCX),%RCX |
0x5b1aa VMOVSD (%RCX,%RAX,8),%XMM5 |
0x5b1af MOV -0x50(%RBP),%RDX |
0x5b1b3 VADDSD (%RDX,%R9,8),%XMM5,%XMM5 |
0x5b1b9 VMOVSD %XMM5,(%RCX,%RAX,8) |
0x5b1be INC %R9 |
0x5b1c1 CMP %R12,%R9 |
0x5b1c4 JE 5b94c |
0x5b1ca MOV -0xb0(%RBP),%RAX |
0x5b1d1 MOV (%RAX,%R9,8),%R11 |
0x5b1d5 MOV (%R13,%R11,8),%RAX |
0x5b1da CMP %RDI,%RAX |
0x5b1dd JGE 5b1a0 |
0x5b1df CMP -0x80(%RBP),%RAX |
0x5b1e3 JNE 5b370 |
0x5b1e9 MOV -0x188(%RBP),%RCX |
0x5b1f0 MOV (%RCX,%R11,8),%R15 |
0x5b1f4 VPXOR %XMM5,%XMM5,%XMM5 |
0x5b1f8 XOR %EAX,%EAX |
0x5b1fa MOV -0x50(%RBP),%RDX |
0x5b1fe VUCOMISD (%RDX,%R15,8),%XMM5 |
0x5b204 MOV 0x8(%RCX,%R11,8),%RCX |
0x5b209 SETBE %AL |
0x5b20c LEA -0x1(%RAX,%RAX,1),%RAX |
0x5b211 MOV %RAX,-0x70(%RBP) |
0x5b215 LEA 0x1(%R15),%R10 |
0x5b219 CMP %RCX,%R10 |
0x5b21c MOV %R15,-0x68(%RBP) |
0x5b220 JGE 5b248 |
0x5b222 VCVTSI2SDQ -0x70(%RBP),%XMM9,%XMM6 |
0x5b228 NOT %R15 |
0x5b22b ADD %RCX,%R15 |
0x5b22e CMP $0x4,%R15 |
0x5b232 JAE 5b3c3 |
0x5b238 MOV %R15,%RAX |
0x5b23b AND $-0x4,%RAX |
0x5b23f CMP %R15,%RAX |
0x5b242 JNE 5b4d4 |
0x5b248 MOV -0xd8(%RBP),%RAX |
0x5b24f MOV (%RAX),%RAX |
0x5b252 MOV %RAX,-0xc8(%RBP) |
0x5b259 CMP $0x2,%RAX |
0x5b25d JL 5b2b0 |
0x5b25f MOV -0x168(%RBP),%RAX |
0x5b266 MOV (%RAX,%R11,8),%R12 |
0x5b26a MOV 0x8(%RAX,%R11,8),%R15 |
0x5b26f MOV %R15,%RAX |
0x5b272 SUB %R12,%RAX |
0x5b275 JLE 5b2b0 |
0x5b277 VCVTSI2SDQ -0x70(%RBP),%XMM9,%XMM6 |
0x5b27d CMP $0x4,%RAX |
0x5b281 MOV %RAX,-0xc0(%RBP) |
0x5b288 JAE 5b533 |
0x5b28e MOV -0xc0(%RBP),%RDX |
0x5b295 MOV %RDX,%RAX |
0x5b298 AND $-0x4,%RAX |
0x5b29c CMP %RDX,%RAX |
0x5b29f JNE 5b628 |
0x5b2a5 NOPW %CS:(%RAX,%RAX,1) |
0x5b2b0 VUCOMISD %XMM0,%XMM5 |
0x5b2b4 MOV -0x50(%RBP),%RAX |
0x5b2b8 VMOVSD (%RAX,%R9,8),%XMM6 |
0x5b2be JE 5b3b0 |
0x5b2c4 VDIVSD %XMM5,%XMM6,%XMM5 |
0x5b2c8 CMP %RCX,%R10 |
0x5b2cb MOV %R8,%R15 |
0x5b2ce MOV -0xa0(%RBP),%R12 |
0x5b2d5 JGE 5b67f |
0x5b2db VCVTSI2SDQ -0x70(%RBP),%XMM9,%XMM6 |
0x5b2e1 MOV -0x68(%RBP),%RDX |
0x5b2e5 MOV %EDX,%EAX |
0x5b2e7 NOT %EAX |
0x5b2e9 ADD %ECX,%EAX |
0x5b2eb TEST $0x1,%AL |
0x5b2ed JE 5b676 |
0x5b2f3 MOV -0xb0(%RBP),%RAX |
0x5b2fa MOV 0x8(%RAX,%RDX,8),%RAX |
0x5b2ff MOV (%R13,%RAX,8),%RDX |
0x5b304 CMP %RDI,%RDX |
0x5b307 JL 5b338 |
0x5b309 MOV -0x50(%RBP),%R10 |
0x5b30d MOV -0x68(%RBP),%RBX |
0x5b311 VMOVSD 0x8(%R10,%RBX,8),%XMM7 |
0x5b318 VMULSD %XMM6,%XMM7,%XMM8 |
0x5b31c VUCOMISD %XMM0,%XMM8 |
0x5b320 JAE 5b338 |
0x5b322 MOV -0x90(%RBP),%R10 |
0x5b329 MOV (%R10),%R10 |
0x5b32c VFMADD213SD (%R10,%RDX,8),%XMM5,%XMM7 |
0x5b332 VMOVSD %XMM7,(%R10,%RDX,8) |
0x5b338 CMP %R15,%RAX |
0x5b33b JNE 5b66e |
0x5b341 MOV -0x50(%RBP),%RAX |
0x5b345 MOV -0x68(%RBP),%RDX |
0x5b349 VMOVSD 0x8(%RAX,%RDX,8),%XMM7 |
0x5b34f VMULSD %XMM6,%XMM7,%XMM8 |
0x5b353 VFMADD213SD %XMM4,%XMM5,%XMM7 |
0x5b358 VCMPSD $0x1,%XMM0,%XMM8,%K1 |
0x5b35f VMOVSD %XMM7,%XMM4,%XMM4{%K1} |
0x5b365 JMP 5b672 |
0x5b370 MOV -0x100(%RBP),%RAX |
0x5b377 CMPQ $-0x3,(%RAX,%R11,8) |
0x5b37c JE 5b1be |
0x5b382 CMPQ $0x1,-0x180(%RBP) |
0x5b38a JE 5b3a1 |
0x5b38c MOV -0x178(%RBP),%RCX |
0x5b393 MOV (%RCX,%R15,8),%RAX |
0x5b397 CMP (%RCX,%R11,8),%RAX |
0x5b39b JNE 5b1be |
0x5b3a1 MOV -0x50(%RBP),%RAX |
0x5b3a5 VADDSD (%RAX,%R9,8),%XMM4,%XMM4 |
0x5b3ab JMP 5b1be |
0x5b3b0 VADDSD %XMM4,%XMM6,%XMM4 |
0x5b3b4 MOV %R8,%R15 |
0x5b3b7 MOV -0xa0(%RBP),%R12 |
0x5b3be JMP 5b1be |
0x5b3c3 MOV %R15,%R12 |
0x5b3c6 SHR $0x2,%R12 |
0x5b3ca MOV -0x68(%RBP),%RAX |
0x5b3ce LEA 0x20(,%RAX,8),%RAX |
0x5b3d6 JMP 5b40b |
(1624) 0x5b3e0 MOV -0x50(%RBP),%RDX |
(1624) 0x5b3e4 VMOVSD (%RDX,%RAX,1),%XMM7 |
(1624) 0x5b3e9 VMULSD %XMM6,%XMM7,%XMM8 |
(1624) 0x5b3ed VADDSD %XMM5,%XMM7,%XMM7 |
(1624) 0x5b3f1 VCMPSD $0x1,%XMM0,%XMM8,%K1 |
(1624) 0x5b3f8 VMOVSD %XMM7,%XMM5,%XMM5{%K1} |
(1624) 0x5b3fe ADD $0x20,%RAX |
(1624) 0x5b402 DEC %R12 |
(1624) 0x5b405 JE 5b238 |
(1624) 0x5b40b MOV -0xb0(%RBP),%RDX |
(1624) 0x5b412 MOV -0x18(%RDX,%RAX,1),%RDX |
(1624) 0x5b417 CMP %R8,%RDX |
(1624) 0x5b41a JE 5b423 |
(1624) 0x5b41c CMP %RDI,(%R13,%RDX,8) |
(1624) 0x5b421 JL 5b442 |
(1624) 0x5b423 MOV -0x50(%RBP),%RDX |
(1624) 0x5b427 VMOVSD -0x18(%RDX,%RAX,1),%XMM7 |
(1624) 0x5b42d VMULSD %XMM6,%XMM7,%XMM8 |
(1624) 0x5b431 VADDSD %XMM5,%XMM7,%XMM7 |
(1624) 0x5b435 VCMPSD $0x1,%XMM0,%XMM8,%K1 |
(1624) 0x5b43c VMOVSD %XMM7,%XMM5,%XMM5{%K1} |
(1624) 0x5b442 MOV -0xb0(%RBP),%RDX |
(1624) 0x5b449 MOV -0x10(%RDX,%RAX,1),%RDX |
(1624) 0x5b44e CMP %R8,%RDX |
(1624) 0x5b451 JE 5b45a |
(1624) 0x5b453 CMP %RDI,(%R13,%RDX,8) |
(1624) 0x5b458 JL 5b479 |
(1624) 0x5b45a MOV -0x50(%RBP),%RDX |
(1624) 0x5b45e VMOVSD -0x10(%RDX,%RAX,1),%XMM7 |
(1624) 0x5b464 VMULSD %XMM6,%XMM7,%XMM8 |
(1624) 0x5b468 VADDSD %XMM5,%XMM7,%XMM7 |
(1624) 0x5b46c VCMPSD $0x1,%XMM0,%XMM8,%K1 |
(1624) 0x5b473 VMOVSD %XMM7,%XMM5,%XMM5{%K1} |
(1624) 0x5b479 MOV -0xb0(%RBP),%RDX |
(1624) 0x5b480 MOV -0x8(%RDX,%RAX,1),%RDX |
(1624) 0x5b485 CMP %R8,%RDX |
(1624) 0x5b488 JE 5b491 |
(1624) 0x5b48a CMP %RDI,(%R13,%RDX,8) |
(1624) 0x5b48f JL 5b4b0 |
(1624) 0x5b491 MOV -0x50(%RBP),%RDX |
(1624) 0x5b495 VMOVSD -0x8(%RDX,%RAX,1),%XMM7 |
(1624) 0x5b49b VMULSD %XMM6,%XMM7,%XMM8 |
(1624) 0x5b49f VADDSD %XMM5,%XMM7,%XMM7 |
(1624) 0x5b4a3 VCMPSD $0x1,%XMM0,%XMM8,%K1 |
(1624) 0x5b4aa VMOVSD %XMM7,%XMM5,%XMM5{%K1} |
(1624) 0x5b4b0 MOV -0xb0(%RBP),%RDX |
(1624) 0x5b4b7 MOV (%RDX,%RAX,1),%RDX |
(1624) 0x5b4bb CMP %R8,%RDX |
(1624) 0x5b4be JE 5b3e0 |
(1624) 0x5b4c4 CMP %RDI,(%R13,%RDX,8) |
(1624) 0x5b4c9 JL 5b3fe |
(1624) 0x5b4cf JMP 5b3e0 |
0x5b4d4 MOV -0x68(%RBP),%RDX |
0x5b4d8 LEA 0x1(%RDX,%RAX,1),%RAX |
0x5b4dd MOV %R8,%R15 |
0x5b4e0 JMP 5b51a |
(1623) 0x5b4f0 MOV -0x50(%RBP),%RDX |
(1623) 0x5b4f4 VMOVSD (%RDX,%RAX,8),%XMM7 |
(1623) 0x5b4f9 VMULSD %XMM6,%XMM7,%XMM8 |
(1623) 0x5b4fd VADDSD %XMM5,%XMM7,%XMM7 |
(1623) 0x5b501 VCMPSD $0x1,%XMM0,%XMM8,%K1 |
(1623) 0x5b508 VMOVSD %XMM7,%XMM5,%XMM5{%K1} |
(1623) 0x5b50e INC %RAX |
(1623) 0x5b511 CMP %RAX,%RCX |
(1623) 0x5b514 JE 5b248 |
(1623) 0x5b51a MOV -0xb0(%RBP),%RDX |
(1623) 0x5b521 MOV (%RDX,%RAX,8),%RDX |
(1623) 0x5b525 CMP %R15,%RDX |
(1623) 0x5b528 JE 5b4f0 |
(1623) 0x5b52a CMP %RDI,(%R13,%RDX,8) |
(1623) 0x5b52f JL 5b50e |
(1623) 0x5b531 JMP 5b4f0 |
0x5b533 SHR $0x2,%RAX |
0x5b537 LEA 0x18(,%R12,8),%RDX |
0x5b53f JMP 5b55d |
(1622) 0x5b550 ADD $0x20,%RDX |
(1622) 0x5b554 DEC %RAX |
(1622) 0x5b557 JE 5b28e |
(1622) 0x5b55d MOV -0x98(%RBP),%RBX |
(1622) 0x5b564 MOV -0x18(%RBX,%RDX,1),%RBX |
(1622) 0x5b569 CMP %RSI,(%R14,%RBX,8) |
(1622) 0x5b56d JL 5b58e |
(1622) 0x5b56f MOV -0x60(%RBP),%RBX |
(1622) 0x5b573 VMOVSD -0x18(%RBX,%RDX,1),%XMM7 |
(1622) 0x5b579 VMULSD %XMM6,%XMM7,%XMM8 |
(1622) 0x5b57d VADDSD %XMM5,%XMM7,%XMM7 |
(1622) 0x5b581 VCMPSD $0x1,%XMM0,%XMM8,%K1 |
(1622) 0x5b588 VMOVSD %XMM7,%XMM5,%XMM5{%K1} |
(1622) 0x5b58e MOV -0x98(%RBP),%RBX |
(1622) 0x5b595 MOV -0x10(%RBX,%RDX,1),%RBX |
(1622) 0x5b59a CMP %RSI,(%R14,%RBX,8) |
(1622) 0x5b59e JL 5b5bf |
(1622) 0x5b5a0 MOV -0x60(%RBP),%RBX |
(1622) 0x5b5a4 VMOVSD -0x10(%RBX,%RDX,1),%XMM7 |
(1622) 0x5b5aa VMULSD %XMM6,%XMM7,%XMM8 |
(1622) 0x5b5ae VADDSD %XMM5,%XMM7,%XMM7 |
(1622) 0x5b5b2 VCMPSD $0x1,%XMM0,%XMM8,%K1 |
(1622) 0x5b5b9 VMOVSD %XMM7,%XMM5,%XMM5{%K1} |
(1622) 0x5b5bf MOV -0x98(%RBP),%RBX |
(1622) 0x5b5c6 MOV -0x8(%RBX,%RDX,1),%RBX |
(1622) 0x5b5cb CMP %RSI,(%R14,%RBX,8) |
(1622) 0x5b5cf JL 5b5f0 |
(1622) 0x5b5d1 MOV -0x60(%RBP),%RBX |
(1622) 0x5b5d5 VMOVSD -0x8(%RBX,%RDX,1),%XMM7 |
(1622) 0x5b5db VMULSD %XMM6,%XMM7,%XMM8 |
(1622) 0x5b5df VADDSD %XMM5,%XMM7,%XMM7 |
(1622) 0x5b5e3 VCMPSD $0x1,%XMM0,%XMM8,%K1 |
(1622) 0x5b5ea VMOVSD %XMM7,%XMM5,%XMM5{%K1} |
(1622) 0x5b5f0 MOV -0x98(%RBP),%RBX |
(1622) 0x5b5f7 MOV (%RBX,%RDX,1),%RBX |
(1622) 0x5b5fb CMP %RSI,(%R14,%RBX,8) |
(1622) 0x5b5ff JL 5b550 |
(1622) 0x5b605 MOV -0x60(%RBP),%RBX |
(1622) 0x5b609 VMOVSD (%RBX,%RDX,1),%XMM7 |
(1622) 0x5b60e VMULSD %XMM6,%XMM7,%XMM8 |
(1622) 0x5b612 VADDSD %XMM5,%XMM7,%XMM7 |
(1622) 0x5b616 VCMPSD $0x1,%XMM0,%XMM8,%K1 |
(1622) 0x5b61d VMOVSD %XMM7,%XMM5,%XMM5{%K1} |
(1622) 0x5b623 JMP 5b550 |
0x5b628 ADD %RAX,%R12 |
0x5b62b JMP 5b63c |
(1621) 0x5b630 INC %R12 |
(1621) 0x5b633 CMP %R12,%R15 |
(1621) 0x5b636 JE 5b2b0 |
(1621) 0x5b63c MOV -0x98(%RBP),%RAX |
(1621) 0x5b643 MOV (%RAX,%R12,8),%RAX |
(1621) 0x5b647 CMP %RSI,(%R14,%RAX,8) |
(1621) 0x5b64b JL 5b630 |
(1621) 0x5b64d MOV -0x60(%RBP),%RAX |
(1621) 0x5b651 VMOVSD (%RAX,%R12,8),%XMM7 |
(1621) 0x5b657 VMULSD %XMM6,%XMM7,%XMM8 |
(1621) 0x5b65b VADDSD %XMM5,%XMM7,%XMM7 |
(1621) 0x5b65f VCMPSD $0x1,%XMM0,%XMM8,%K1 |
(1621) 0x5b666 VMOVSD %XMM7,%XMM5,%XMM5{%K1} |
(1621) 0x5b66c JMP 5b630 |
0x5b66e MOV -0x68(%RBP),%RDX |
0x5b672 LEA 0x2(%RDX),%R10 |
0x5b676 LEA -0x2(%RCX),%RAX |
0x5b67a CMP %RDX,%RAX |
0x5b67d JNE 5b6e9 |
0x5b67f CMPQ $0x2,-0xc8(%RBP) |
0x5b687 JL 5b1be |
0x5b68d MOV -0x168(%RBP),%RCX |
0x5b694 MOV (%RCX,%R11,8),%RAX |
0x5b698 MOV 0x8(%RCX,%R11,8),%RCX |
0x5b69d MOV %RCX,%R10 |
0x5b6a0 SUB %RAX,%R10 |
0x5b6a3 JLE 5b1be |
0x5b6a9 VCVTSI2SDQ -0x70(%RBP),%XMM9,%XMM6 |
0x5b6af CMP $0x4,%R10 |
0x5b6b3 JAE 5b7c9 |
0x5b6b9 MOV %R10,%RDX |
0x5b6bc AND $-0x4,%RDX |
0x5b6c0 CMP %R10,%RDX |
0x5b6c3 JNE 5b8f8 |
0x5b6c9 MOV %R8,%R15 |
0x5b6cc JMP 5b1be |
(1620) 0x5b6e0 ADD $0x2,%R10 |
(1620) 0x5b6e4 CMP %R10,%RCX |
(1620) 0x5b6e7 JE 5b67f |
(1620) 0x5b6e9 MOV -0xb0(%RBP),%RAX |
(1620) 0x5b6f0 MOV (%RAX,%R10,8),%RAX |
(1620) 0x5b6f4 MOV (%R13,%RAX,8),%RDX |
(1620) 0x5b6f9 CMP %RDI,%RDX |
(1620) 0x5b6fc JL 5b72e |
(1620) 0x5b6fe MOV -0x50(%RBP),%R15 |
(1620) 0x5b702 VMOVSD (%R15,%R10,8),%XMM7 |
(1620) 0x5b708 MOV %R8,%R15 |
(1620) 0x5b70b VMULSD %XMM6,%XMM7,%XMM8 |
(1620) 0x5b70f VUCOMISD %XMM0,%XMM8 |
(1620) 0x5b713 JAE 5b72e |
(1620) 0x5b715 MOV -0x90(%RBP),%R15 |
(1620) 0x5b71c MOV (%R15),%R15 |
(1620) 0x5b71f VFMADD213SD (%R15,%RDX,8),%XMM5,%XMM7 |
(1620) 0x5b725 VMOVSD %XMM7,(%R15,%RDX,8) |
(1620) 0x5b72b MOV %R8,%R15 |
(1620) 0x5b72e CMP %R15,%RAX |
(1620) 0x5b731 JNE 5b753 |
(1620) 0x5b733 MOV -0x50(%RBP),%RAX |
(1620) 0x5b737 VMOVSD (%RAX,%R10,8),%XMM7 |
(1620) 0x5b73d VMULSD %XMM6,%XMM7,%XMM8 |
(1620) 0x5b741 VFMADD213SD %XMM4,%XMM5,%XMM7 |
(1620) 0x5b746 VCMPSD $0x1,%XMM0,%XMM8,%K1 |
(1620) 0x5b74d VMOVSD %XMM7,%XMM4,%XMM4{%K1} |
(1620) 0x5b753 MOV -0xb0(%RBP),%RAX |
(1620) 0x5b75a MOV 0x8(%RAX,%R10,8),%RAX |
(1620) 0x5b75f MOV (%R13,%RAX,8),%RDX |
(1620) 0x5b764 CMP %RDI,%RDX |
(1620) 0x5b767 JL 5b79a |
(1620) 0x5b769 MOV -0x50(%RBP),%R15 |
(1620) 0x5b76d VMOVSD 0x8(%R15,%R10,8),%XMM7 |
(1620) 0x5b774 MOV %R8,%R15 |
(1620) 0x5b777 VMULSD %XMM6,%XMM7,%XMM8 |
(1620) 0x5b77b VUCOMISD %XMM0,%XMM8 |
(1620) 0x5b77f JAE 5b79a |
(1620) 0x5b781 MOV -0x90(%RBP),%R15 |
(1620) 0x5b788 MOV (%R15),%R15 |
(1620) 0x5b78b VFMADD213SD (%R15,%RDX,8),%XMM5,%XMM7 |
(1620) 0x5b791 VMOVSD %XMM7,(%R15,%RDX,8) |
(1620) 0x5b797 MOV %R8,%R15 |
(1620) 0x5b79a CMP %R15,%RAX |
(1620) 0x5b79d JNE 5b6e0 |
(1620) 0x5b7a3 MOV -0x50(%RBP),%RAX |
(1620) 0x5b7a7 VMOVSD 0x8(%RAX,%R10,8),%XMM7 |
(1620) 0x5b7ae VMULSD %XMM6,%XMM7,%XMM8 |
(1620) 0x5b7b2 VFMADD213SD %XMM4,%XMM5,%XMM7 |
(1620) 0x5b7b7 VCMPSD $0x1,%XMM0,%XMM8,%K1 |
(1620) 0x5b7be VMOVSD %XMM7,%XMM4,%XMM4{%K1} |
(1620) 0x5b7c4 JMP 5b6e0 |
0x5b7c9 MOV %R10,%RDX |
0x5b7cc SHR $0x2,%RDX |
0x5b7d0 LEA 0x18(,%RAX,8),%R11 |
0x5b7d8 JMP 5b7ed |
(1619) 0x5b7e0 ADD $0x20,%R11 |
(1619) 0x5b7e4 DEC %RDX |
(1619) 0x5b7e7 JE 5b6b9 |
(1619) 0x5b7ed MOV -0x98(%RBP),%RBX |
(1619) 0x5b7f4 MOV -0x18(%RBX,%R11,1),%RBX |
(1619) 0x5b7f9 MOV (%R14,%RBX,8),%R15 |
(1619) 0x5b7fd CMP %RSI,%R15 |
(1619) 0x5b800 JL 5b82d |
(1619) 0x5b802 MOV -0x60(%RBP),%RBX |
(1619) 0x5b806 VMOVSD -0x18(%RBX,%R11,1),%XMM7 |
(1619) 0x5b80d VMULSD %XMM6,%XMM7,%XMM8 |
(1619) 0x5b811 VUCOMISD %XMM0,%XMM8 |
(1619) 0x5b815 JAE 5b82d |
(1619) 0x5b817 MOV -0x88(%RBP),%RBX |
(1619) 0x5b81e MOV (%RBX),%RBX |
(1619) 0x5b821 VFMADD213SD (%RBX,%R15,8),%XMM5,%XMM7 |
(1619) 0x5b827 VMOVSD %XMM7,(%RBX,%R15,8) |
(1619) 0x5b82d MOV -0x98(%RBP),%RBX |
(1619) 0x5b834 MOV -0x10(%RBX,%R11,1),%RBX |
(1619) 0x5b839 MOV (%R14,%RBX,8),%R15 |
(1619) 0x5b83d CMP %RSI,%R15 |
(1619) 0x5b840 JL 5b86d |
(1619) 0x5b842 MOV -0x60(%RBP),%RBX |
(1619) 0x5b846 VMOVSD -0x10(%RBX,%R11,1),%XMM7 |
(1619) 0x5b84d VMULSD %XMM6,%XMM7,%XMM8 |
(1619) 0x5b851 VUCOMISD %XMM0,%XMM8 |
(1619) 0x5b855 JAE 5b86d |
(1619) 0x5b857 MOV -0x88(%RBP),%RBX |
(1619) 0x5b85e MOV (%RBX),%RBX |
(1619) 0x5b861 VFMADD213SD (%RBX,%R15,8),%XMM5,%XMM7 |
(1619) 0x5b867 VMOVSD %XMM7,(%RBX,%R15,8) |
(1619) 0x5b86d MOV -0x98(%RBP),%RBX |
(1619) 0x5b874 MOV -0x8(%RBX,%R11,1),%RBX |
(1619) 0x5b879 MOV (%R14,%RBX,8),%R15 |
(1619) 0x5b87d CMP %RSI,%R15 |
(1619) 0x5b880 JL 5b8ad |
(1619) 0x5b882 MOV -0x60(%RBP),%RBX |
(1619) 0x5b886 VMOVSD -0x8(%RBX,%R11,1),%XMM7 |
(1619) 0x5b88d VMULSD %XMM6,%XMM7,%XMM8 |
(1619) 0x5b891 VUCOMISD %XMM0,%XMM8 |
(1619) 0x5b895 JAE 5b8ad |
(1619) 0x5b897 MOV -0x88(%RBP),%RBX |
(1619) 0x5b89e MOV (%RBX),%RBX |
(1619) 0x5b8a1 VFMADD213SD (%RBX,%R15,8),%XMM5,%XMM7 |
(1619) 0x5b8a7 VMOVSD %XMM7,(%RBX,%R15,8) |
(1619) 0x5b8ad MOV -0x98(%RBP),%RBX |
(1619) 0x5b8b4 MOV (%RBX,%R11,1),%RBX |
(1619) 0x5b8b8 MOV (%R14,%RBX,8),%R15 |
(1619) 0x5b8bc CMP %RSI,%R15 |
(1619) 0x5b8bf JL 5b7e0 |
(1619) 0x5b8c5 MOV -0x60(%RBP),%RBX |
(1619) 0x5b8c9 VMOVSD (%RBX,%R11,1),%XMM7 |
(1619) 0x5b8cf VMULSD %XMM6,%XMM7,%XMM8 |
(1619) 0x5b8d3 VUCOMISD %XMM0,%XMM8 |
(1619) 0x5b8d7 JAE 5b7e0 |
(1619) 0x5b8dd MOV -0x88(%RBP),%RBX |
(1619) 0x5b8e4 MOV (%RBX),%RBX |
(1619) 0x5b8e7 VFMADD213SD (%RBX,%R15,8),%XMM5,%XMM7 |
(1619) 0x5b8ed VMOVSD %XMM7,(%RBX,%R15,8) |
(1619) 0x5b8f3 JMP 5b7e0 |
0x5b8f8 ADD %RDX,%RAX |
0x5b8fb MOV %R8,%R15 |
0x5b8fe JMP 5b90c |
(1618) 0x5b900 INC %RAX |
(1618) 0x5b903 CMP %RAX,%RCX |
(1618) 0x5b906 JE 5b1be |
(1618) 0x5b90c MOV -0x98(%RBP),%RDX |
(1618) 0x5b913 MOV (%RDX,%RAX,8),%RDX |
(1618) 0x5b917 MOV (%R14,%RDX,8),%RDX |
(1618) 0x5b91b CMP %RSI,%RDX |
(1618) 0x5b91e JL 5b900 |
(1618) 0x5b920 MOV -0x60(%RBP),%R10 |
(1618) 0x5b924 VMOVSD (%R10,%RAX,8),%XMM7 |
(1618) 0x5b92a VMULSD %XMM6,%XMM7,%XMM8 |
(1618) 0x5b92e VUCOMISD %XMM0,%XMM8 |
(1618) 0x5b932 JAE 5b900 |
(1618) 0x5b934 MOV -0x88(%RBP),%R10 |
(1618) 0x5b93b MOV (%R10),%R10 |
(1618) 0x5b93e VFMADD213SD (%R10,%RDX,8),%XMM5,%XMM7 |
(1618) 0x5b944 VMOVSD %XMM7,(%R10,%RDX,8) |
(1618) 0x5b94a JMP 5b900 |
/scratch_na/users/xoserete/qaas_runs/171-415-3872/intel/AMG/build/AMG/AMG/parcsr_ls/par_lr_interp.c: 1221 - 1675 |
-------------------------------------------------------------------------------- |
1221: if (n_fine) |
[...] |
1609: for (jj = A_diag_i[i]+1; jj < A_diag_i[i+1]; jj++) |
1610: { /* i1 is a c-point and strongly influences i, accumulate |
1611: * a_(i,i1) into interpolation weight */ |
1612: i1 = A_diag_j[jj]; |
1613: if (P_marker[i1] >= jj_begin_row) |
1614: { |
1615: P_diag_data[P_marker[i1]] += A_diag_data[jj]; |
1616: } |
1617: else if(P_marker[i1] == strong_f_marker) |
1618: { |
1619: sum = zero; |
1620: sgn = 1; |
1621: if(A_diag_data[A_diag_i[i1]] < 0) sgn = -1; |
1622: /* Loop over row of A for point i1 and calculate the sum |
1623: * of the connections to c-points that strongly influence i. */ |
1624: for(jj1 = A_diag_i[i1]+1; jj1 < A_diag_i[i1+1]; jj1++) |
1625: { |
1626: i2 = A_diag_j[jj1]; |
1627: if((P_marker[i2] >= jj_begin_row || i2 == i) && (sgn*A_diag_data[jj1]) < 0) |
1628: sum += A_diag_data[jj1]; |
1629: } |
1630: if(num_procs > 1) |
1631: { |
1632: for(jj1 = A_offd_i[i1]; jj1< A_offd_i[i1+1]; jj1++) |
1633: { |
1634: i2 = A_offd_j[jj1]; |
1635: if(P_marker_offd[i2] >= jj_begin_row_offd && |
1636: (sgn*A_offd_data[jj1]) < 0) |
1637: sum += A_offd_data[jj1]; |
1638: } |
1639: } |
1640: if(sum != 0) |
1641: { |
1642: distribute = A_diag_data[jj]/sum; |
1643: /* Loop over row of A for point i1 and do the distribution */ |
1644: for(jj1 = A_diag_i[i1]+1; jj1 < A_diag_i[i1+1]; jj1++) |
1645: { |
1646: i2 = A_diag_j[jj1]; |
1647: if(P_marker[i2] >= jj_begin_row && (sgn*A_diag_data[jj1]) < 0) |
1648: P_diag_data[P_marker[i2]] += |
1649: distribute*A_diag_data[jj1]; |
1650: if(i2 == i && (sgn*A_diag_data[jj1]) < 0) |
1651: diagonal += distribute*A_diag_data[jj1]; |
1652: } |
1653: if(num_procs > 1) |
1654: { |
1655: for(jj1 = A_offd_i[i1]; jj1 < A_offd_i[i1+1]; jj1++) |
1656: { |
1657: i2 = A_offd_j[jj1]; |
1658: if(P_marker_offd[i2] >= jj_begin_row_offd && |
1659: (sgn*A_offd_data[jj1]) < 0) |
1660: P_offd_data[P_marker_offd[i2]] += |
[...] |
1667: diagonal += A_diag_data[jj]; |
1668: } |
1669: } |
1670: /* neighbor i1 weakly influences i, accumulate a_(i,i1) into |
1671: * diagonal */ |
1672: else if (CF_marker[i1] != -3) |
1673: { |
1674: if(num_functions == 1 || dof_func[i] == dof_func[i1]) |
1675: diagonal += A_diag_data[jj]; |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►100.00+ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Path / |
Metric | Value |
---|---|
CQA speedup if no scalar integer | 1.82 |
CQA speedup if FP arith vectorized | 2.98 |
CQA speedup if fully vectorized | 8.00 |
CQA speedup if no inter-iteration dependency | NA |
CQA speedup if next bottleneck killed | 1.48 |
Bottlenecks | micro-operation queue |
Function | hypre_BoomerAMGBuildExtPIInterp.extracted |
Source | par_lr_interp.c:1221-1221,par_lr_interp.c:1609-1609,par_lr_interp.c:1612-1617,par_lr_interp.c:1621-1621,par_lr_interp.c:1624-1624,par_lr_interp.c:1627-1627,par_lr_interp.c:1630-1632,par_lr_interp.c:1635-1636,par_lr_interp.c:1640-1650,par_lr_interp.c:1653-1655,par_lr_interp.c:1659-1660,par_lr_interp.c:1667-1667,par_lr_interp.c:1672-1675 |
Source loop unroll info | NA |
Source loop unroll confidence level | NA |
Unroll/vectorization loop type | NA |
Unroll factor | NA |
CQA cycles | 27.67 |
CQA cycles if no scalar integer | 15.17 |
CQA cycles if FP arith vectorized | 9.28 |
CQA cycles if fully vectorized | 3.46 |
Front-end cycles | 27.67 |
DIV/SQRT cycles | 4.00 |
P0 cycles | 16.50 |
P1 cycles | 15.20 |
P2 cycles | 18.67 |
P3 cycles | 18.67 |
P4 cycles | 3.00 |
P5 cycles | 15.40 |
P6 cycles | 16.50 |
P7 cycles | 3.00 |
P8 cycles | 3.00 |
P9 cycles | 3.00 |
P10 cycles | 15.40 |
P11 cycles | 18.67 |
Inter-iter dependencies cycles | NA |
FE+BE cycles (UFS) | 27.94 - 28.00 |
Stall cycles (UFS) | 0.00 |
Nb insns | 160.00 |
Nb uops | 162.00 |
Nb loads | 56.00 |
Nb stores | 6.00 |
Nb stack references | 15.00 |
FLOP/cycle | 0.36 |
Nb FLOP add-sub | 3.00 |
Nb FLOP mul | 2.00 |
Nb FLOP fma | 2.00 |
Nb FLOP div | 1.00 |
Nb FLOP rcp | 0.00 |
Nb FLOP sqrt | 0.00 |
Nb FLOP rsqrt | 0.00 |
Bytes/cycle | 17.93 |
Bytes prefetched | 0.00 |
Bytes loaded | 448.00 |
Bytes stored | 48.00 |
Stride 0 | NA |
Stride 1 | NA |
Stride n | NA |
Stride unknown | NA |
Stride indirect | NA |
Vectorization ratio all | 2.13 |
Vectorization ratio load | 0.00 |
Vectorization ratio store | 0.00 |
Vectorization ratio mul | 0.00 |
Vectorization ratio add_sub | 0.00 |
Vectorization ratio fma | 0.00 |
Vectorization ratio div_sqrt | 0.00 |
Vectorization ratio other | 3.45 |
Vector-efficiency ratio all | 12.77 |
Vector-efficiency ratio load | 12.50 |
Vector-efficiency ratio store | 12.50 |
Vector-efficiency ratio mul | 12.50 |
Vector-efficiency ratio add_sub | 12.50 |
Vector-efficiency ratio fma | 12.50 |
Vector-efficiency ratio div_sqrt | 12.50 |
Vector-efficiency ratio other | 12.93 |
Metric | Value |
---|---|
CQA speedup if no scalar integer | 1.82 |
CQA speedup if FP arith vectorized | 2.98 |
CQA speedup if fully vectorized | 8.00 |
CQA speedup if no inter-iteration dependency | NA |
CQA speedup if next bottleneck killed | 1.48 |
Bottlenecks | micro-operation queue |
Function | hypre_BoomerAMGBuildExtPIInterp.extracted |
Source | par_lr_interp.c:1221-1221,par_lr_interp.c:1609-1609,par_lr_interp.c:1612-1617,par_lr_interp.c:1621-1621,par_lr_interp.c:1624-1624,par_lr_interp.c:1627-1627,par_lr_interp.c:1630-1632,par_lr_interp.c:1635-1636,par_lr_interp.c:1640-1650,par_lr_interp.c:1653-1655,par_lr_interp.c:1659-1660,par_lr_interp.c:1667-1667,par_lr_interp.c:1672-1675 |
Source loop unroll info | NA |
Source loop unroll confidence level | NA |
Unroll/vectorization loop type | NA |
Unroll factor | NA |
CQA cycles | 27.67 |
CQA cycles if no scalar integer | 15.17 |
CQA cycles if FP arith vectorized | 9.28 |
CQA cycles if fully vectorized | 3.46 |
Front-end cycles | 27.67 |
DIV/SQRT cycles | 4.00 |
P0 cycles | 16.50 |
P1 cycles | 15.20 |
P2 cycles | 18.67 |
P3 cycles | 18.67 |
P4 cycles | 3.00 |
P5 cycles | 15.40 |
P6 cycles | 16.50 |
P7 cycles | 3.00 |
P8 cycles | 3.00 |
P9 cycles | 3.00 |
P10 cycles | 15.40 |
P11 cycles | 18.67 |
Inter-iter dependencies cycles | NA |
FE+BE cycles (UFS) | 27.94 - 28.00 |
Stall cycles (UFS) | 0.00 |
Nb insns | 160.00 |
Nb uops | 162.00 |
Nb loads | 56.00 |
Nb stores | 6.00 |
Nb stack references | 15.00 |
FLOP/cycle | 0.36 |
Nb FLOP add-sub | 3.00 |
Nb FLOP mul | 2.00 |
Nb FLOP fma | 2.00 |
Nb FLOP div | 1.00 |
Nb FLOP rcp | 0.00 |
Nb FLOP sqrt | 0.00 |
Nb FLOP rsqrt | 0.00 |
Bytes/cycle | 17.93 |
Bytes prefetched | 0.00 |
Bytes loaded | 448.00 |
Bytes stored | 48.00 |
Stride 0 | NA |
Stride 1 | NA |
Stride n | NA |
Stride unknown | NA |
Stride indirect | NA |
Vectorization ratio all | 2.13 |
Vectorization ratio load | 0.00 |
Vectorization ratio store | 0.00 |
Vectorization ratio mul | 0.00 |
Vectorization ratio add_sub | 0.00 |
Vectorization ratio fma | 0.00 |
Vectorization ratio div_sqrt | 0.00 |
Vectorization ratio other | 3.45 |
Vector-efficiency ratio all | 12.77 |
Vector-efficiency ratio load | 12.50 |
Vector-efficiency ratio store | 12.50 |
Vector-efficiency ratio mul | 12.50 |
Vector-efficiency ratio add_sub | 12.50 |
Vector-efficiency ratio fma | 12.50 |
Vector-efficiency ratio div_sqrt | 12.50 |
Vector-efficiency ratio other | 12.93 |
Path / |
Function | hypre_BoomerAMGBuildExtPIInterp.extracted |
Source file and lines | par_lr_interp.c:1221-1675 |
Module | libparcsr_ls.so |
nb instructions | 160 |
nb uops | 162 |
loop length | 719 |
used x86 registers | 13 |
used mmx registers | 0 |
used xmm registers | 7 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 15 |
ADD-SUB / MUL ratio | 1.50 |
micro-operation queue | 27.67 cycles |
front end | 27.67 cycles |
| | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 16.50 | 15.20 | 18.67 | 18.67 | 3.00 | 15.40 | 16.50 | 3.00 | 3.00 | 3.00 | 15.40 | 18.67 |
cycles | 16.50 | 15.20 | 18.67 | 18.67 | 3.00 | 15.40 | 16.50 | 3.00 | 3.00 | 3.00 | 15.40 | 18.67 |
Cycles executing div or sqrt instructions | 4.00 |
FE+BE cycles | 27.94-28.00 |
Stall cycles | 0.00 |
Front-end | 27.67 |
Dispatch | 18.67 |
DIV/SQRT | 4.00 |
Overall L1 | 27.67 |
all | 3% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 4% |
all | 0% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | 0% |
div/sqrt | 0% |
other | 0% |
all | 2% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | 0% |
div/sqrt | 0% |
other | 3% |
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 13% |
all | 12% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | 12% |
div/sqrt | 12% |
other | 12% |
all | 12% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | 12% |
div/sqrt | 12% |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
MOV -0x90(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD (%RCX,%RAX,8),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x50(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RDX,%R9,8),%XMM5,%XMM5 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM5,(%RCX,%RAX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
INC %R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %R12,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JE 5b94c <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1c7c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xb0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX,%R9,8),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R13,%R11,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDI,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 5b1a0 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x14d0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP -0x80(%RBP),%RAX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JNE 5b370 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x16a0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x188(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX,%R11,8),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPXOR %XMM5,%XMM5,%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x50(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VUCOMISD (%RDX,%R15,8),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x8(%RCX,%R11,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SETBE %AL | 2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 1-2 | 1 |
LEA -0x1(%RAX,%RAX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x1(%R15),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RCX,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R15,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 5b248 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1578> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VCVTSI2SDQ -0x70(%RBP),%XMM9,%XMM6 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 0.50 |
NOT %R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RCX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMP $0x4,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 5b3c3 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x16f3> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %R15,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 5b4d4 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1804> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xd8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP $0x2,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 5b2b0 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x15e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x168(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX,%R11,8),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX,%R11,8),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 5b2b0 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x15e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VCVTSI2SDQ -0x70(%RBP),%XMM9,%XMM6 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 0.50 |
CMP $0x4,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JAE 5b533 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1863> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xc0(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 5b628 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1958> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD %XMM0,%XMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD (%RAX,%R9,8),%XMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JE 5b3b0 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x16e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VDIVSD %XMM5,%XMM6,%XMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 13-15 | 4 |
CMP %RCX,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R8,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0xa0(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JGE 5b67f <hypre_BoomerAMGBuildExtPIInterp.extracted+0x19af> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VCVTSI2SDQ -0x70(%RBP),%XMM9,%XMM6 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 0.50 |
MOV -0x68(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %EDX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %ECX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
TEST $0x1,%AL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 5b676 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x19a6> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xb0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX,%RDX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R13,%RAX,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDI,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 5b338 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1668> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x50(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x68(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x8(%R10,%RBX,8),%XMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD %XMM6,%XMM7,%XMM8 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VUCOMISD %XMM0,%XMM8 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JAE 5b338 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1668> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x90(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VFMADD213SD (%R10,%RDX,8),%XMM5,%XMM7 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VMOVSD %XMM7,(%R10,%RDX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %R15,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 5b66e <hypre_BoomerAMGBuildExtPIInterp.extracted+0x199e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x68(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x8(%RAX,%RDX,8),%XMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD %XMM6,%XMM7,%XMM8 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD213SD %XMM4,%XMM5,%XMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VCMPSD $0x1,%XMM0,%XMM8,%K1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVSD %XMM7,%XMM4,%XMM4{%K1} | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
JMP 5b672 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x19a2> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x100(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMPQ $-0x3,(%RAX,%R11,8) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 5b1be <hypre_BoomerAMGBuildExtPIInterp.extracted+0x14ee> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMPQ $0x1,-0x180(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 5b3a1 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x16d1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x178(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX,%R15,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP (%RCX,%R11,8),%RAX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JNE 5b1be <hypre_BoomerAMGBuildExtPIInterp.extracted+0x14ee> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RAX,%R9,8),%XMM4,%XMM4 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
JMP 5b1be <hypre_BoomerAMGBuildExtPIInterp.extracted+0x14ee> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
VADDSD %XMM4,%XMM6,%XMM4 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOV %R8,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0xa0(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 5b1be <hypre_BoomerAMGBuildExtPIInterp.extracted+0x14ee> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R15,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x2,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV -0x68(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x20(,%RAX,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 5b40b <hypre_BoomerAMGBuildExtPIInterp.extracted+0x173b> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV -0x68(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%RDX,%RAX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R8,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 5b51a <hypre_BoomerAMGBuildExtPIInterp.extracted+0x184a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
SHR $0x2,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
LEA 0x18(,%R12,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 5b55d <hypre_BoomerAMGBuildExtPIInterp.extracted+0x188d> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD %RAX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JMP 5b63c <hypre_BoomerAMGBuildExtPIInterp.extracted+0x196c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV -0x68(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x2(%RDX),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x2(%RCX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 5b6e9 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1a19> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMPQ $0x2,-0xc8(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JL 5b1be <hypre_BoomerAMGBuildExtPIInterp.extracted+0x14ee> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x168(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX,%R11,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RCX,%R11,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RAX,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 5b1be <hypre_BoomerAMGBuildExtPIInterp.extracted+0x14ee> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VCVTSI2SDQ -0x70(%RBP),%XMM9,%XMM6 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 0.50 |
CMP $0x4,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 5b7c9 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1af9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R10,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %R10,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 5b8f8 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1c28> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R8,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 5b1be <hypre_BoomerAMGBuildExtPIInterp.extracted+0x14ee> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R10,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x2,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
LEA 0x18(,%RAX,8),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 5b7ed <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1b1d> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R8,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 5b90c <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1c3c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
Function | hypre_BoomerAMGBuildExtPIInterp.extracted |
Source file and lines | par_lr_interp.c:1221-1675 |
Module | libparcsr_ls.so |
nb instructions | 160 |
nb uops | 162 |
loop length | 719 |
used x86 registers | 13 |
used mmx registers | 0 |
used xmm registers | 7 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 15 |
ADD-SUB / MUL ratio | 1.50 |
micro-operation queue | 27.67 cycles |
front end | 27.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 16.50 | 15.20 | 18.67 | 18.67 | 3.00 | 15.40 | 16.50 | 3.00 | 3.00 | 3.00 | 15.40 | 18.67 |
cycles | 16.50 | 15.20 | 18.67 | 18.67 | 3.00 | 15.40 | 16.50 | 3.00 | 3.00 | 3.00 | 15.40 | 18.67 |
Cycles executing div or sqrt instructions | 4.00 |
FE+BE cycles | 27.94-28.00 |
Stall cycles | 0.00 |
Front-end | 27.67 |
Dispatch | 18.67 |
DIV/SQRT | 4.00 |
Overall L1 | 27.67 |
all | 3% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 4% |
all | 0% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | 0% |
div/sqrt | 0% |
other | 0% |
all | 2% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | 0% |
div/sqrt | 0% |
other | 3% |
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 13% |
all | 12% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | 12% |
div/sqrt | 12% |
other | 12% |
all | 12% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | 12% |
div/sqrt | 12% |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
MOV -0x90(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD (%RCX,%RAX,8),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x50(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RDX,%R9,8),%XMM5,%XMM5 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM5,(%RCX,%RAX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
INC %R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %R12,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JE 5b94c <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1c7c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xb0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX,%R9,8),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R13,%R11,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDI,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 5b1a0 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x14d0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP -0x80(%RBP),%RAX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JNE 5b370 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x16a0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x188(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX,%R11,8),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPXOR %XMM5,%XMM5,%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x50(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VUCOMISD (%RDX,%R15,8),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x8(%RCX,%R11,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SETBE %AL | 2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 1-2 | 1 |
LEA -0x1(%RAX,%RAX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x1(%R15),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RCX,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R15,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 5b248 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1578> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VCVTSI2SDQ -0x70(%RBP),%XMM9,%XMM6 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 0.50 |
NOT %R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RCX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMP $0x4,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 5b3c3 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x16f3> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %R15,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 5b4d4 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1804> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xd8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP $0x2,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 5b2b0 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x15e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x168(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX,%R11,8),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX,%R11,8),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 5b2b0 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x15e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VCVTSI2SDQ -0x70(%RBP),%XMM9,%XMM6 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 0.50 |
CMP $0x4,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JAE 5b533 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1863> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xc0(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 5b628 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1958> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD %XMM0,%XMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD (%RAX,%R9,8),%XMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JE 5b3b0 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x16e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VDIVSD %XMM5,%XMM6,%XMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 13-15 | 4 |
CMP %RCX,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R8,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0xa0(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JGE 5b67f <hypre_BoomerAMGBuildExtPIInterp.extracted+0x19af> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VCVTSI2SDQ -0x70(%RBP),%XMM9,%XMM6 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 0.50 |
MOV -0x68(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %EDX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %ECX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
TEST $0x1,%AL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 5b676 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x19a6> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xb0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX,%RDX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R13,%RAX,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDI,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 5b338 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1668> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x50(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x68(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x8(%R10,%RBX,8),%XMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD %XMM6,%XMM7,%XMM8 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VUCOMISD %XMM0,%XMM8 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JAE 5b338 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1668> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x90(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VFMADD213SD (%R10,%RDX,8),%XMM5,%XMM7 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VMOVSD %XMM7,(%R10,%RDX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %R15,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 5b66e <hypre_BoomerAMGBuildExtPIInterp.extracted+0x199e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x68(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x8(%RAX,%RDX,8),%XMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD %XMM6,%XMM7,%XMM8 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD213SD %XMM4,%XMM5,%XMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VCMPSD $0x1,%XMM0,%XMM8,%K1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVSD %XMM7,%XMM4,%XMM4{%K1} | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
JMP 5b672 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x19a2> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x100(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMPQ $-0x3,(%RAX,%R11,8) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 5b1be <hypre_BoomerAMGBuildExtPIInterp.extracted+0x14ee> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMPQ $0x1,-0x180(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 5b3a1 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x16d1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x178(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX,%R15,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP (%RCX,%R11,8),%RAX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JNE 5b1be <hypre_BoomerAMGBuildExtPIInterp.extracted+0x14ee> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RAX,%R9,8),%XMM4,%XMM4 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
JMP 5b1be <hypre_BoomerAMGBuildExtPIInterp.extracted+0x14ee> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
VADDSD %XMM4,%XMM6,%XMM4 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOV %R8,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0xa0(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 5b1be <hypre_BoomerAMGBuildExtPIInterp.extracted+0x14ee> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R15,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x2,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV -0x68(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x20(,%RAX,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 5b40b <hypre_BoomerAMGBuildExtPIInterp.extracted+0x173b> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV -0x68(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%RDX,%RAX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R8,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 5b51a <hypre_BoomerAMGBuildExtPIInterp.extracted+0x184a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
SHR $0x2,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
LEA 0x18(,%R12,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 5b55d <hypre_BoomerAMGBuildExtPIInterp.extracted+0x188d> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD %RAX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JMP 5b63c <hypre_BoomerAMGBuildExtPIInterp.extracted+0x196c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV -0x68(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x2(%RDX),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x2(%RCX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 5b6e9 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1a19> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMPQ $0x2,-0xc8(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JL 5b1be <hypre_BoomerAMGBuildExtPIInterp.extracted+0x14ee> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x168(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX,%R11,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RCX,%R11,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RAX,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 5b1be <hypre_BoomerAMGBuildExtPIInterp.extracted+0x14ee> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VCVTSI2SDQ -0x70(%RBP),%XMM9,%XMM6 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 0.50 |
CMP $0x4,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 5b7c9 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1af9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R10,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %R10,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 5b8f8 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1c28> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R8,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 5b1be <hypre_BoomerAMGBuildExtPIInterp.extracted+0x14ee> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R10,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x2,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
LEA 0x18(,%RAX,8),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 5b7ed <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1b1d> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R8,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 5b90c <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1c3c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |