Function: void RAJA::internal::StatementExecutor<RAJA::statement::Collapse<RAJA::omp_parallel_collap ... | Module: exec | Source: Collapse.hpp:81-81 [...] | Coverage: 4.1% |
---|
Function: void RAJA::internal::StatementExecutor<RAJA::statement::Collapse<RAJA::omp_parallel_collap ... | Module: exec | Source: Collapse.hpp:81-81 [...] | Coverage: 4.1% |
---|
/scratch_na/users/xoserete/qaas_runs/171-291-3153/intel/Kripke/build/Kripke/tpl/raja/include/RAJA/util/View.hpp: 79 - 110 |
-------------------------------------------------------------------------------- |
79: : layout(V.layout), data(V.data) |
[...] |
110: return data[idx]; |
/scratch_na/users/xoserete/qaas_runs/171-291-3153/intel/Kripke/build/Kripke/tpl/raja/include/RAJA/index/RangeSegment.hpp: 120 - 120 |
-------------------------------------------------------------------------------- |
120: RAJA_HOST_DEVICE RAJA_INLINE ~TypedRangeSegment() {} |
/scratch_na/users/xoserete/qaas_runs/171-291-3153/intel/Kripke/build/Kripke/src/Kripke/Kernel/LPlusTimes.cpp: 57 - 57 |
-------------------------------------------------------------------------------- |
57: rhs(d,g,z) += ell_plus(d, nm) * phi_out(nm, g, z); |
/scratch_na/users/xoserete/qaas_runs/171-291-3153/intel/Kripke/build/Kripke/tpl/raja/include/RAJA/policy/loop/forall.hpp: 59 - 59 |
-------------------------------------------------------------------------------- |
59: for (decltype(distance_it) i = 0; i < distance_it; ++i) { |
/scratch_na/users/xoserete/qaas_runs/171-291-3153/intel/Kripke/build/Kripke/tpl/raja/include/RAJA/internal/Iterators.hpp: 55 - 177 |
-------------------------------------------------------------------------------- |
55: : val(rhs.val) |
[...] |
142: return val - rhs.val; |
[...] |
177: return value_type(val + rhs); |
/scratch_na/users/xoserete/qaas_runs/171-291-3153/intel/Kripke/build/Kripke/tpl/raja/include/RAJA/util/Layout.hpp: 55 - 55 |
-------------------------------------------------------------------------------- |
55: return a * b; |
/scratch_na/users/xoserete/qaas_runs/171-291-3153/intel/Kripke/build/Kripke/tpl/raja/include/RAJA/util/Operators.hpp: 307 - 307 |
-------------------------------------------------------------------------------- |
307: return Ret{lhs} + rhs; |
/scratch_na/users/xoserete/qaas_runs/171-291-3153/intel/Kripke/build/Kripke/tpl/raja/include/RAJA/policy/openmp/kernel/Collapse.hpp: 81 - 81 |
-------------------------------------------------------------------------------- |
81: #pragma omp parallel for private(i0, i1) firstprivate(privatizer) \ |
0x4a97a0 PUSH %RBP |
0x4a97a1 MOV %RSP,%RBP |
0x4a97a4 PUSH %R15 |
0x4a97a6 PUSH %R14 |
0x4a97a8 PUSH %R13 |
0x4a97aa PUSH %R12 |
0x4a97ac PUSH %RBX |
0x4a97ad AND $-0x20,%RSP |
0x4a97b1 SUB $0xe0,%RSP |
0x4a97b8 MOV 0x10(%RDI),%RAX |
0x4a97bc MOV (%RAX),%RBX |
0x4a97bf MOV 0x110(%RAX),%R13 |
0x4a97c6 MOV 0x10(%RAX),%RDX |
0x4a97ca MOV 0x18(%RAX),%RCX |
0x4a97ce MOV 0x20(%RAX),%RSI |
0x4a97d2 MOV 0x38(%RAX),%R8 |
0x4a97d6 MOV %RBX,0x8(%RSP) |
0x4a97db MOV 0x60(%RAX),%R9 |
0x4a97df MOV 0x68(%RAX),%R10 |
0x4a97e3 MOV %R13,0xd0(%RSP) |
0x4a97eb MOV 0xc0(%RAX),%R11 |
0x4a97f2 MOV 0xf0(%RAX),%R12 |
0x4a97f9 MOV %RDX,0x70(%RSP) |
0x4a97fe MOV 0x118(%RAX),%R14 |
0x4a9805 MOV 0x30(%RAX),%RBX |
0x4a9809 MOV %RCX,0x68(%RSP) |
0x4a980e MOV 0xa8(%RAX),%R15 |
0x4a9815 MOV %RSI,0x38(%RSP) |
0x4a981a MOV %R8,0x60(%RSP) |
0x4a981f MOV %R9,0x48(%RSP) |
0x4a9824 MOV %R10,0x40(%RSP) |
0x4a9829 MOV %R11,0x50(%RSP) |
0x4a982e MOV %R12,0x30(%RSP) |
0x4a9833 MOV %R14,0x58(%RSP) |
0x4a9838 MOV 0x158(%RAX),%R14 |
0x4a983f MOV (%RDI),%R13 |
0x4a9842 MOV 0x8(%RDI),%RAX |
0x4a9846 TEST %R13,%R13 |
0x4a9849 JLE 4a9ce7 |
0x4a984f MOV %RAX,0x78(%RSP) |
0x4a9854 TEST %RAX,%RAX |
0x4a9857 JLE 4a9ce7 |
0x4a985d CALL 4034d0 <omp_get_num_threads@plt> |
0x4a9862 MOVSXD %EAX,%R12 |
0x4a9865 CALL 403420 <omp_get_thread_num@plt> |
0x4a986a XOR %EDX,%EDX |
0x4a986c MOVSXD %EAX,%RDI |
0x4a986f MOV 0x78(%RSP),%RAX |
0x4a9874 IMUL %R13,%RAX |
0x4a9878 DIV %R12 |
0x4a987b MOV %RAX,%RCX |
0x4a987e CMP %RDX,%RDI |
0x4a9881 JB 4a9f0d |
0x4a9887 IMUL %RCX,%RDI |
0x4a988b LEA (%RDI,%RDX,1),%RAX |
0x4a988f LEA (%RCX,%RAX,1),%RSI |
0x4a9893 CMP %RSI,%RAX |
0x4a9896 JAE 4a9ce7 |
0x4a989c XOR %EDX,%EDX |
0x4a989e MOV 0x60(%RSP),%R12 |
0x4a98a3 MOV 0x70(%RSP),%R9 |
0x4a98a8 DIVQ 0x78(%RSP) |
0x4a98ad SUB %RBX,%R12 |
0x4a98b0 MOV %RAX,0x10(%RSP) |
0x4a98b5 MOV %RDX,%R8 |
0x4a98b8 CMP %R9,0x68(%RSP) |
0x4a98bd JLE 4a9ce7 |
0x4a98c3 TEST %R12,%R12 |
0x4a98c6 JLE 4a9ce7 |
0x4a98cc MOV 0xd0(%RSP),%R11 |
0x4a98d4 LEA -0x1(%RCX),%R10 |
0x4a98d8 MOV 0x10(%RSP),%RSI |
0x4a98dd MOV %R12,%RCX |
0x4a98e0 MOV 0x8(%RSP),%RDX |
0x4a98e5 MOV %R10,0x20(%RSP) |
0x4a98ea SHR $0x2,%RCX |
0x4a98ee MOV %R12,%RAX |
0x4a98f1 MOV %R11,%R13 |
0x4a98f4 MOV %R12,%R10 |
0x4a98f7 LEA -0x1(%R12),%RDI |
0x4a98fc SAL $0x5,%RCX |
0x4a9900 IMUL %R9,%R13 |
0x4a9904 MOV %R12,%R9 |
0x4a9907 AND $-0x4,%RAX |
0x4a990b ADD %RDX,%RSI |
0x4a990e AND $0x3,%R9D |
0x4a9912 AND $0x3,%R10D |
0x4a9916 MOV %RDI,0xa8(%RSP) |
0x4a991e SAL $0x3,%R11 |
0x4a9922 MOV %RCX,0xc8(%RSP) |
0x4a992a MOV %R13,0x18(%RSP) |
0x4a992f MOV %RAX,0x98(%RSP) |
0x4a9937 MOV %RSI,0x28(%RSP) |
0x4a993c MOV %R9,0xa0(%RSP) |
0x4a9944 MOV %R10,0x90(%RSP) |
0x4a994c MOV %R11,0xc0(%RSP) |
0x4a9954 XOR %R11D,%R11D |
0x4a9957 NOPW (%RAX,%RAX,1) |
(1892) 0x4a9960 MOV 0x38(%RSP),%R13 |
(1892) 0x4a9965 MOV 0x28(%RSP),%RCX |
(1892) 0x4a996a MOV %R8,0x88(%RSP) |
(1892) 0x4a9972 MOV 0x40(%RSP),%R10 |
(1892) 0x4a9977 MOV 0x48(%RSP),%RSI |
(1892) 0x4a997c MOV %R11,0x80(%RSP) |
(1892) 0x4a9984 LEA (%R8,%R13,1),%RDI |
(1892) 0x4a9988 MOV 0x50(%RSP),%RAX |
(1892) 0x4a998d MOV 0x70(%RSP),%RDX |
(1892) 0x4a9992 IMUL %RCX,%RSI |
(1892) 0x4a9996 MOV 0x30(%RSP),%R9 |
(1892) 0x4a999b IMUL %RDI,%R10 |
(1892) 0x4a999f IMUL %RCX,%RAX |
(1892) 0x4a99a3 ADD %RSI,%R10 |
(1892) 0x4a99a6 MOV 0x58(%RSP),%RSI |
(1892) 0x4a99ab LEA (%RAX,%RDX,1),%R13 |
(1892) 0x4a99af MOV 0x18(%RSP),%RDX |
(1892) 0x4a99b4 IMUL %RSI,%RDI |
(1892) 0x4a99b8 LEA (%R9,%R13,8),%RCX |
(1892) 0x4a99bc ADD %RDX,%RDI |
(1892) 0x4a99bf MOV 0x68(%RSP),%RDX |
(1892) 0x4a99c4 LEA (%RBX,%RDI,1),%R13 |
(1892) 0x4a99c8 ADD %RDX,%RAX |
(1892) 0x4a99cb LEA (%R14,%R13,8),%RSI |
(1892) 0x4a99cf MOV 0x60(%RSP),%R13 |
(1892) 0x4a99d4 LEA (%R9,%RAX,8),%RAX |
(1892) 0x4a99d8 LEA (%R10,%RBX,1),%R9 |
(1892) 0x4a99dc MOV %R9,0xb8(%RSP) |
(1892) 0x4a99e4 ADD %R10,%R13 |
(1892) 0x4a99e7 MOV %RAX,0xd8(%RSP) |
(1892) 0x4a99ef LEA (%R15,%R13,8),%R13 |
(1892) 0x4a99f3 LEA (%R15,%R9,8),%RAX |
(1892) 0x4a99f7 NOPW (%RAX,%RAX,1) |
(1891) 0x4a9a00 CMP $0x1,%R12 |
(1891) 0x4a9a04 JE 4a9eb0 |
(1891) 0x4a9a0a LEA 0x8(%RCX),%R9 |
(1891) 0x4a9a0e CMP %R9,%RAX |
(1891) 0x4a9a11 SETAE %R8B |
(1891) 0x4a9a15 CMP %R13,%RCX |
(1891) 0x4a9a18 SETAE %R11B |
(1891) 0x4a9a1c OR %R8B,%R11B |
(1891) 0x4a9a1f JE 4a9d00 |
(1891) 0x4a9a25 LEA 0x8(%RSI),%R8 |
(1891) 0x4a9a29 MOV %RAX,%RDX |
(1891) 0x4a9a2c SUB %R8,%RDX |
(1891) 0x4a9a2f CMP $0x10,%RDX |
(1891) 0x4a9a33 JBE 4a9d00 |
(1891) 0x4a9a39 CMPQ $0x2,0xa8(%RSP) |
(1891) 0x4a9a42 JBE 4a9eca |
(1891) 0x4a9a48 MOV 0xc8(%RSP),%R11 |
(1891) 0x4a9a50 VBROADCASTSD (%RCX),%YMM2 |
(1891) 0x4a9a55 XOR %EDX,%EDX |
(1891) 0x4a9a57 LEA -0x20(%R11),%R8 |
(1891) 0x4a9a5b SHR $0x5,%R8 |
(1891) 0x4a9a5f INC %R8 |
(1891) 0x4a9a62 AND $0x7,%R8D |
(1891) 0x4a9a66 JE 4a9b2c |
(1891) 0x4a9a6c CMP $0x1,%R8 |
(1891) 0x4a9a70 JE 4a9b0a |
(1891) 0x4a9a76 CMP $0x2,%R8 |
(1891) 0x4a9a7a JE 4a9af6 |
(1891) 0x4a9a7c CMP $0x3,%R8 |
(1891) 0x4a9a80 JE 4a9ae2 |
(1891) 0x4a9a82 CMP $0x4,%R8 |
(1891) 0x4a9a86 JE 4a9ace |
(1891) 0x4a9a88 CMP $0x5,%R8 |
(1891) 0x4a9a8c JE 4a9aba |
(1891) 0x4a9a8e CMP $0x6,%R8 |
(1891) 0x4a9a92 JE 4a9aa6 |
(1891) 0x4a9a94 VMOVUPD (%RSI),%YMM1 |
(1891) 0x4a9a98 VFMADD213PD (%RAX),%YMM2,%YMM1 |
(1891) 0x4a9a9d MOV $0x20,%EDX |
(1891) 0x4a9aa2 VMOVUPD %YMM1,(%RAX) |
(1891) 0x4a9aa6 VMOVUPD (%RSI,%RDX,1),%YMM3 |
(1891) 0x4a9aab VFMADD213PD (%RAX,%RDX,1),%YMM2,%YMM3 |
(1891) 0x4a9ab1 VMOVUPD %YMM3,(%RAX,%RDX,1) |
(1891) 0x4a9ab6 ADD $0x20,%RDX |
(1891) 0x4a9aba VMOVUPD (%RSI,%RDX,1),%YMM5 |
(1891) 0x4a9abf VFMADD213PD (%RAX,%RDX,1),%YMM2,%YMM5 |
(1891) 0x4a9ac5 VMOVUPD %YMM5,(%RAX,%RDX,1) |
(1891) 0x4a9aca ADD $0x20,%RDX |
(1891) 0x4a9ace VMOVUPD (%RSI,%RDX,1),%YMM6 |
(1891) 0x4a9ad3 VFMADD213PD (%RAX,%RDX,1),%YMM2,%YMM6 |
(1891) 0x4a9ad9 VMOVUPD %YMM6,(%RAX,%RDX,1) |
(1891) 0x4a9ade ADD $0x20,%RDX |
(1891) 0x4a9ae2 VMOVUPD (%RSI,%RDX,1),%YMM7 |
(1891) 0x4a9ae7 VFMADD213PD (%RAX,%RDX,1),%YMM2,%YMM7 |
(1891) 0x4a9aed VMOVUPD %YMM7,(%RAX,%RDX,1) |
(1891) 0x4a9af2 ADD $0x20,%RDX |
(1891) 0x4a9af6 VMOVUPD (%RSI,%RDX,1),%YMM8 |
(1891) 0x4a9afb VFMADD213PD (%RAX,%RDX,1),%YMM2,%YMM8 |
(1891) 0x4a9b01 VMOVUPD %YMM8,(%RAX,%RDX,1) |
(1891) 0x4a9b06 ADD $0x20,%RDX |
(1891) 0x4a9b0a VMOVUPD (%RSI,%RDX,1),%YMM9 |
(1891) 0x4a9b0f VFMADD213PD (%RAX,%RDX,1),%YMM2,%YMM9 |
(1891) 0x4a9b15 VMOVUPD %YMM9,(%RAX,%RDX,1) |
(1891) 0x4a9b1a ADD $0x20,%RDX |
(1891) 0x4a9b1e CMP %RDX,0xc8(%RSP) |
(1891) 0x4a9b26 JE 4a9bfa |
(1894) 0x4a9b2c VMOVUPD (%RSI,%RDX,1),%YMM10 |
(1894) 0x4a9b31 VFMADD213PD (%RAX,%RDX,1),%YMM2,%YMM10 |
(1894) 0x4a9b37 VMOVUPD %YMM10,(%RAX,%RDX,1) |
(1894) 0x4a9b3c VMOVUPD 0x20(%RDX,%RSI,1),%YMM11 |
(1894) 0x4a9b42 VFMADD213PD 0x20(%RAX,%RDX,1),%YMM2,%YMM11 |
(1894) 0x4a9b49 VMOVUPD %YMM11,0x20(%RAX,%RDX,1) |
(1894) 0x4a9b4f VMOVUPD 0x40(%RDX,%RSI,1),%YMM12 |
(1894) 0x4a9b55 VFMADD213PD 0x40(%RAX,%RDX,1),%YMM2,%YMM12 |
(1894) 0x4a9b5c VMOVUPD %YMM12,0x40(%RAX,%RDX,1) |
(1894) 0x4a9b62 VMOVUPD 0x60(%RDX,%RSI,1),%YMM13 |
(1894) 0x4a9b68 VFMADD213PD 0x60(%RAX,%RDX,1),%YMM2,%YMM13 |
(1894) 0x4a9b6f VMOVUPD %YMM13,0x60(%RAX,%RDX,1) |
(1894) 0x4a9b75 VMOVUPD 0x80(%RDX,%RSI,1),%YMM14 |
(1894) 0x4a9b7e VFMADD213PD 0x80(%RAX,%RDX,1),%YMM2,%YMM14 |
(1894) 0x4a9b88 VMOVUPD %YMM14,0x80(%RAX,%RDX,1) |
(1894) 0x4a9b91 VMOVUPD 0xa0(%RDX,%RSI,1),%YMM15 |
(1894) 0x4a9b9a VFMADD213PD 0xa0(%RAX,%RDX,1),%YMM2,%YMM15 |
(1894) 0x4a9ba4 VMOVUPD %YMM15,0xa0(%RAX,%RDX,1) |
(1894) 0x4a9bad VMOVUPD 0xc0(%RDX,%RSI,1),%YMM0 |
(1894) 0x4a9bb6 VFMADD213PD 0xc0(%RAX,%RDX,1),%YMM2,%YMM0 |
(1894) 0x4a9bc0 VMOVUPD %YMM0,0xc0(%RAX,%RDX,1) |
(1894) 0x4a9bc9 VMOVUPD 0xe0(%RDX,%RSI,1),%YMM4 |
(1894) 0x4a9bd2 VFMADD213PD 0xe0(%RAX,%RDX,1),%YMM2,%YMM4 |
(1894) 0x4a9bdc VMOVUPD %YMM4,0xe0(%RAX,%RDX,1) |
(1894) 0x4a9be5 ADD $0x100,%RDX |
(1894) 0x4a9bec CMP %RDX,0xc8(%RSP) |
(1894) 0x4a9bf4 JNE 4a9b2c |
(1891) 0x4a9bfa CMPQ $0,0xa0(%RSP) |
(1891) 0x4a9c03 JE 4a9c8d |
(1891) 0x4a9c09 MOV 0x90(%RSP),%R11 |
(1891) 0x4a9c11 MOV %R11,%RDX |
(1891) 0x4a9c14 CMP $0x1,%R11 |
(1891) 0x4a9c18 JE 4a9ee1 |
(1891) 0x4a9c1e MOV 0x98(%RSP),%R8 |
(1891) 0x4a9c26 MOV %R8,0xb0(%RSP) |
(1891) 0x4a9c2e MOV 0xb8(%RSP),%R11 |
(1891) 0x4a9c36 VMOVDDUP (%RCX),%XMM2 |
(1891) 0x4a9c3a ADD %R8,%R11 |
(1891) 0x4a9c3d ADD %RBX,%R8 |
(1891) 0x4a9c40 LEA (%R15,%R11,8),%R11 |
(1891) 0x4a9c44 ADD %RDI,%R8 |
(1891) 0x4a9c47 VMOVUPD (%R11),%XMM1 |
(1891) 0x4a9c4c VFMADD132PD (%R14,%R8,8),%XMM1,%XMM2 |
(1891) 0x4a9c52 VMOVUPD %XMM2,(%R11) |
(1891) 0x4a9c57 TEST $0x1,%DL |
(1891) 0x4a9c5a JE 4a9c8d |
(1891) 0x4a9c5c MOV 0xb0(%RSP),%R8 |
(1891) 0x4a9c64 AND $-0x2,%RDX |
(1891) 0x4a9c68 ADD %R8,%RDX |
(1891) 0x4a9c6b ADD %RBX,%RDX |
(1891) 0x4a9c6e VMOVSD (%RCX),%XMM3 |
(1891) 0x4a9c72 LEA (%R10,%RDX,1),%R11 |
(1891) 0x4a9c76 ADD %RDI,%RDX |
(1891) 0x4a9c79 LEA (%R15,%R11,8),%R8 |
(1891) 0x4a9c7d VMOVSD (%R8),%XMM5 |
(1891) 0x4a9c82 VFMADD132SD (%R14,%RDX,8),%XMM5,%XMM3 |
(1891) 0x4a9c88 VMOVSD %XMM3,(%R8) |
(1891) 0x4a9c8d MOV 0xc0(%RSP),%R8 |
(1891) 0x4a9c95 MOV %R9,%RCX |
(1891) 0x4a9c98 MOV 0xd8(%RSP),%R11 |
(1891) 0x4a9ca0 MOV 0xd0(%RSP),%R9 |
(1891) 0x4a9ca8 ADD %R8,%RSI |
(1891) 0x4a9cab ADD %R9,%RDI |
(1891) 0x4a9cae CMP %R11,%RCX |
(1891) 0x4a9cb1 JNE 4a9a00 |
(1892) 0x4a9cb7 MOV 0x88(%RSP),%R8 |
(1892) 0x4a9cbf MOV 0x80(%RSP),%R11 |
(1892) 0x4a9cc7 CMP %R11,0x20(%RSP) |
(1892) 0x4a9ccc JE 4a9ce4 |
(1892) 0x4a9cce INC %R8 |
(1892) 0x4a9cd1 CMP %R8,0x78(%RSP) |
(1892) 0x4a9cd6 JLE 4a9eee |
(1892) 0x4a9cdc INC %R11 |
(1892) 0x4a9cdf JMP 4a9960 |
0x4a9ce4 VZEROUPPER |
0x4a9ce7 LEA -0x28(%RBP),%RSP |
0x4a9ceb POP %RBX |
0x4a9cec POP %R12 |
0x4a9cee POP %R13 |
0x4a9cf0 POP %R14 |
0x4a9cf2 POP %R15 |
0x4a9cf4 POP %RBP |
0x4a9cf5 RET |
0x4a9cf6 NOPW %CS:(%RAX,%RAX,1) |
(1891) 0x4a9d00 MOV %R12,%R11 |
(1891) 0x4a9d03 XOR %EDX,%EDX |
(1891) 0x4a9d05 AND $0x7,%R11D |
(1891) 0x4a9d09 JE 4a9de4 |
(1891) 0x4a9d0f CMP $0x1,%R11 |
(1891) 0x4a9d13 JE 4a9dc4 |
(1891) 0x4a9d19 CMP $0x2,%R11 |
(1891) 0x4a9d1d JE 4a9dad |
(1891) 0x4a9d23 CMP $0x3,%R11 |
(1891) 0x4a9d27 JE 4a9d96 |
(1891) 0x4a9d29 CMP $0x4,%R11 |
(1891) 0x4a9d2d JE 4a9d7f |
(1891) 0x4a9d2f CMP $0x5,%R11 |
(1891) 0x4a9d33 JE 4a9d68 |
(1891) 0x4a9d35 CMP $0x6,%R11 |
(1891) 0x4a9d39 JE 4a9d51 |
(1891) 0x4a9d3b VMOVSD (%RSI),%XMM7 |
(1891) 0x4a9d3f VMOVSD (%RAX),%XMM6 |
(1891) 0x4a9d43 MOV $0x1,%EDX |
(1891) 0x4a9d48 VFMADD132SD (%RCX),%XMM6,%XMM7 |
(1891) 0x4a9d4d VMOVSD %XMM7,(%RAX) |
(1891) 0x4a9d51 VMOVSD (%RSI,%RDX,8),%XMM8 |
(1891) 0x4a9d56 VMOVSD (%RAX,%RDX,8),%XMM9 |
(1891) 0x4a9d5b VFMADD132SD (%RCX),%XMM9,%XMM8 |
(1891) 0x4a9d60 VMOVSD %XMM8,(%RAX,%RDX,8) |
(1891) 0x4a9d65 INC %RDX |
(1891) 0x4a9d68 VMOVSD (%RSI,%RDX,8),%XMM10 |
(1891) 0x4a9d6d VMOVSD (%RAX,%RDX,8),%XMM11 |
(1891) 0x4a9d72 VFMADD132SD (%RCX),%XMM11,%XMM10 |
(1891) 0x4a9d77 VMOVSD %XMM10,(%RAX,%RDX,8) |
(1891) 0x4a9d7c INC %RDX |
(1891) 0x4a9d7f VMOVSD (%RSI,%RDX,8),%XMM12 |
(1891) 0x4a9d84 VMOVSD (%RAX,%RDX,8),%XMM13 |
(1891) 0x4a9d89 VFMADD132SD (%RCX),%XMM13,%XMM12 |
(1891) 0x4a9d8e VMOVSD %XMM12,(%RAX,%RDX,8) |
(1891) 0x4a9d93 INC %RDX |
(1891) 0x4a9d96 VMOVSD (%RSI,%RDX,8),%XMM14 |
(1891) 0x4a9d9b VMOVSD (%RAX,%RDX,8),%XMM15 |
(1891) 0x4a9da0 VFMADD132SD (%RCX),%XMM15,%XMM14 |
(1891) 0x4a9da5 VMOVSD %XMM14,(%RAX,%RDX,8) |
(1891) 0x4a9daa INC %RDX |
(1891) 0x4a9dad VMOVSD (%RSI,%RDX,8),%XMM0 |
(1891) 0x4a9db2 VMOVSD (%RAX,%RDX,8),%XMM4 |
(1891) 0x4a9db7 VFMADD132SD (%RCX),%XMM4,%XMM0 |
(1891) 0x4a9dbc VMOVSD %XMM0,(%RAX,%RDX,8) |
(1891) 0x4a9dc1 INC %RDX |
(1891) 0x4a9dc4 VMOVSD (%RSI,%RDX,8),%XMM2 |
(1891) 0x4a9dc9 VMOVSD (%RAX,%RDX,8),%XMM1 |
(1891) 0x4a9dce VFMADD132SD (%RCX),%XMM1,%XMM2 |
(1891) 0x4a9dd3 VMOVSD %XMM2,(%RAX,%RDX,8) |
(1891) 0x4a9dd8 INC %RDX |
(1891) 0x4a9ddb CMP %RDX,%R12 |
(1891) 0x4a9dde JE 4a9c8d |
(1893) 0x4a9de4 VMOVSD (%RSI,%RDX,8),%XMM3 |
(1893) 0x4a9de9 VMOVSD (%RAX,%RDX,8),%XMM5 |
(1893) 0x4a9dee VFMADD132SD (%RCX),%XMM5,%XMM3 |
(1893) 0x4a9df3 VMOVSD 0x8(%RAX,%RDX,8),%XMM6 |
(1893) 0x4a9df9 VMOVSD 0x10(%RAX,%RDX,8),%XMM9 |
(1893) 0x4a9dff VMOVSD 0x18(%RAX,%RDX,8),%XMM11 |
(1893) 0x4a9e05 VMOVSD 0x20(%RAX,%RDX,8),%XMM13 |
(1893) 0x4a9e0b VMOVSD 0x28(%RAX,%RDX,8),%XMM15 |
(1893) 0x4a9e11 VMOVSD 0x30(%RAX,%RDX,8),%XMM4 |
(1893) 0x4a9e17 VMOVSD 0x38(%RAX,%RDX,8),%XMM1 |
(1893) 0x4a9e1d VMOVSD %XMM3,(%RAX,%RDX,8) |
(1893) 0x4a9e22 VMOVSD 0x8(%RSI,%RDX,8),%XMM7 |
(1893) 0x4a9e28 VFMADD132SD (%RCX),%XMM6,%XMM7 |
(1893) 0x4a9e2d VMOVSD %XMM7,0x8(%RAX,%RDX,8) |
(1893) 0x4a9e33 VMOVSD 0x10(%RSI,%RDX,8),%XMM8 |
(1893) 0x4a9e39 VFMADD132SD (%RCX),%XMM9,%XMM8 |
(1893) 0x4a9e3e VMOVSD %XMM8,0x10(%RAX,%RDX,8) |
(1893) 0x4a9e44 VMOVSD 0x18(%RSI,%RDX,8),%XMM10 |
(1893) 0x4a9e4a VFMADD132SD (%RCX),%XMM11,%XMM10 |
(1893) 0x4a9e4f VMOVSD %XMM10,0x18(%RAX,%RDX,8) |
(1893) 0x4a9e55 VMOVSD 0x20(%RSI,%RDX,8),%XMM12 |
(1893) 0x4a9e5b VFMADD132SD (%RCX),%XMM13,%XMM12 |
(1893) 0x4a9e60 VMOVSD %XMM12,0x20(%RAX,%RDX,8) |
(1893) 0x4a9e66 VMOVSD 0x28(%RSI,%RDX,8),%XMM14 |
(1893) 0x4a9e6c VFMADD132SD (%RCX),%XMM15,%XMM14 |
(1893) 0x4a9e71 VMOVSD %XMM14,0x28(%RAX,%RDX,8) |
(1893) 0x4a9e77 VMOVSD 0x30(%RSI,%RDX,8),%XMM0 |
(1893) 0x4a9e7d VFMADD132SD (%RCX),%XMM4,%XMM0 |
(1893) 0x4a9e82 VMOVSD %XMM0,0x30(%RAX,%RDX,8) |
(1893) 0x4a9e88 VMOVSD 0x38(%RSI,%RDX,8),%XMM2 |
(1893) 0x4a9e8e VFMADD132SD (%RCX),%XMM1,%XMM2 |
(1893) 0x4a9e93 VMOVSD %XMM2,0x38(%RAX,%RDX,8) |
(1893) 0x4a9e99 ADD $0x8,%RDX |
(1893) 0x4a9e9d CMP %RDX,%R12 |
(1893) 0x4a9ea0 JNE 4a9de4 |
(1891) 0x4a9ea6 JMP 4a9c8d |
0x4a9eab NOPL (%RAX,%RAX,1) |
(1891) 0x4a9eb0 VMOVSD (%RCX),%XMM0 |
(1891) 0x4a9eb4 VMOVSD (%RAX),%XMM4 |
(1891) 0x4a9eb8 LEA 0x8(%RCX),%R9 |
(1891) 0x4a9ebc VFMADD132SD (%RSI),%XMM4,%XMM0 |
(1891) 0x4a9ec1 VMOVSD %XMM0,(%RAX) |
(1891) 0x4a9ec5 JMP 4a9c8d |
(1891) 0x4a9eca MOVQ $0,0xb0(%RSP) |
(1891) 0x4a9ed6 MOV %R12,%RDX |
(1891) 0x4a9ed9 XOR %R8D,%R8D |
(1891) 0x4a9edc JMP 4a9c2e |
(1891) 0x4a9ee1 MOV 0x98(%RSP),%RDX |
(1891) 0x4a9ee9 JMP 4a9c6b |
(1892) 0x4a9eee INCQ 0x10(%RSP) |
(1892) 0x4a9ef3 MOV 0x8(%RSP),%RDI |
(1892) 0x4a9ef8 XOR %R8D,%R8D |
(1892) 0x4a9efb MOV 0x10(%RSP),%R10 |
(1892) 0x4a9f00 ADD %RDI,%R10 |
(1892) 0x4a9f03 MOV %R10,0x28(%RSP) |
(1892) 0x4a9f08 JMP 4a9cdc |
0x4a9f0d INC %RCX |
0x4a9f10 XOR %EDX,%EDX |
0x4a9f12 JMP 4a9887 |
0x4a9f17 NOPW (%RAX,%RAX,1) |
Path / |
Source file and lines | Collapse.hpp:81-81 |
Module | exec |
nb instructions | 113 |
nb uops | 124 |
loop length | 500 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 23 |
micro-operation queue | 20.67 cycles |
front end | 20.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 6.40 | 9.00 | 10.67 | 10.67 | 15.00 | 6.20 | 6.20 | 15.00 | 15.00 | 15.00 | 6.20 | 10.67 |
cycles | 6.40 | 12.27 | 10.67 | 10.67 | 15.00 | 6.20 | 6.20 | 15.00 | 15.00 | 15.00 | 6.20 | 10.67 |
Cycles executing div or sqrt instructions | 20.00 |
FE+BE cycles | 20.28-20.38 |
Stall cycles | 0.01-0.11 |
SB full (events) | 0.04-0.44 |
Front-end | 20.67 |
Dispatch | 15.00 |
DIV/SQRT | 20.00 |
Overall L1 | 20.67 |
all | 1% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 6% |
all | 12% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 12% |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0xe0,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x10(%RDI),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x110(%RAX),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RAX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RAX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RAX),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,0x8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x60(%RAX),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x68(%RAX),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,0xd0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc0(%RAX),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xf0(%RAX),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x118(%RAX),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RAX),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa8(%RAX),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RSI,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R12,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x158(%RAX),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDI),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RDI),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R13,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4a9ce7 <_ZN4RAJA8internal17StatementExecutorINS_9statement8CollapseINS_26omp_parallel_collapse_execEN4camp7int_seqIlJLl0ELl2EEEEJNS2_3ForILl1ENS_6policy4loop9loop_execEJNS8_ILl3ESB_JNS2_6LambdaILl0EJEEEEEEEEEEEEE4execIRNS0_8LoopDataINS5_4listIJSG_EEENS5_5tupleIJNS_4impl4SpanINS_9Iterators16numeric_iteratorIN6Kripke9DirectionElPSS_EESS_EENSO_INSQ_INSR_6MomentElPSW_EESW_EENSO_INSQ_INSR_5GroupElPS10_EES10_EENSO_INSQ_INSR_4ZoneElPS14_EES14_EEEEENSM_IJEEEJZNK14LPlusTimesSdomclINSR_11ArchLayoutTINSR_12ArchT_OpenMPENSR_11LayoutT_DGZEEEEEvT_NSR_6SdomIdERKNSR_4Core3SetES1L_S1L_S1L_RNS1I_5FieldIdJSW_S10_S14_EEERNS1M_IdJSS_S10_S14_EEERNS1M_IdJSS_SW_EEEEUlSS_SW_S10_S14_E_EEEEEvOS1G_._omp_fn.0+0x547> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4a9ce7 <_ZN4RAJA8internal17StatementExecutorINS_9statement8CollapseINS_26omp_parallel_collapse_execEN4camp7int_seqIlJLl0ELl2EEEEJNS2_3ForILl1ENS_6policy4loop9loop_execEJNS8_ILl3ESB_JNS2_6LambdaILl0EJEEEEEEEEEEEEE4execIRNS0_8LoopDataINS5_4listIJSG_EEENS5_5tupleIJNS_4impl4SpanINS_9Iterators16numeric_iteratorIN6Kripke9DirectionElPSS_EESS_EENSO_INSQ_INSR_6MomentElPSW_EESW_EENSO_INSQ_INSR_5GroupElPS10_EES10_EENSO_INSQ_INSR_4ZoneElPS14_EES14_EEEEENSM_IJEEEJZNK14LPlusTimesSdomclINSR_11ArchLayoutTINSR_12ArchT_OpenMPENSR_11LayoutT_DGZEEEEEvT_NSR_6SdomIdERKNSR_4Core3SetES1L_S1L_S1L_RNS1I_5FieldIdJSW_S10_S14_EEERNS1M_IdJSS_S10_S14_EEERNS1M_IdJSS_SW_EEEEUlSS_SW_S10_S14_E_EEEEEvOS1G_._omp_fn.0+0x547> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CALL 4034d0 <omp_get_num_threads@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOVSXD %EAX,%R12 | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
CALL 403420 <omp_get_thread_num@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOVSXD %EAX,%RDI | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
MOV 0x78(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
IMUL %R13,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
DIV %R12 | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RDX,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4a9f0d <_ZN4RAJA8internal17StatementExecutorINS_9statement8CollapseINS_26omp_parallel_collapse_execEN4camp7int_seqIlJLl0ELl2EEEEJNS2_3ForILl1ENS_6policy4loop9loop_execEJNS8_ILl3ESB_JNS2_6LambdaILl0EJEEEEEEEEEEEEE4execIRNS0_8LoopDataINS5_4listIJSG_EEENS5_5tupleIJNS_4impl4SpanINS_9Iterators16numeric_iteratorIN6Kripke9DirectionElPSS_EESS_EENSO_INSQ_INSR_6MomentElPSW_EESW_EENSO_INSQ_INSR_5GroupElPS10_EES10_EENSO_INSQ_INSR_4ZoneElPS14_EES14_EEEEENSM_IJEEEJZNK14LPlusTimesSdomclINSR_11ArchLayoutTINSR_12ArchT_OpenMPENSR_11LayoutT_DGZEEEEEvT_NSR_6SdomIdERKNSR_4Core3SetES1L_S1L_S1L_RNS1I_5FieldIdJSW_S10_S14_EEERNS1M_IdJSS_S10_S14_EEERNS1M_IdJSS_SW_EEEEUlSS_SW_S10_S14_E_EEEEEvOS1G_._omp_fn.0+0x76d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
IMUL %RCX,%RDI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%RDI,%RDX,1),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RCX,%RAX,1),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RSI,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 4a9ce7 <_ZN4RAJA8internal17StatementExecutorINS_9statement8CollapseINS_26omp_parallel_collapse_execEN4camp7int_seqIlJLl0ELl2EEEEJNS2_3ForILl1ENS_6policy4loop9loop_execEJNS8_ILl3ESB_JNS2_6LambdaILl0EJEEEEEEEEEEEEE4execIRNS0_8LoopDataINS5_4listIJSG_EEENS5_5tupleIJNS_4impl4SpanINS_9Iterators16numeric_iteratorIN6Kripke9DirectionElPSS_EESS_EENSO_INSQ_INSR_6MomentElPSW_EESW_EENSO_INSQ_INSR_5GroupElPS10_EES10_EENSO_INSQ_INSR_4ZoneElPS14_EES14_EEEEENSM_IJEEEJZNK14LPlusTimesSdomclINSR_11ArchLayoutTINSR_12ArchT_OpenMPENSR_11LayoutT_DGZEEEEEvT_NSR_6SdomIdERKNSR_4Core3SetES1L_S1L_S1L_RNS1I_5FieldIdJSW_S10_S14_EEERNS1M_IdJSS_S10_S14_EEERNS1M_IdJSS_SW_EEEEUlSS_SW_S10_S14_E_EEEEEvOS1G_._omp_fn.0+0x547> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x60(%RSP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x70(%RSP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
DIVQ 0x78(%RSP) | 5 | 0 | 3 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 11-16 | 10 |
SUB %RBX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %R9,0x68(%RSP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JLE 4a9ce7 <_ZN4RAJA8internal17StatementExecutorINS_9statement8CollapseINS_26omp_parallel_collapse_execEN4camp7int_seqIlJLl0ELl2EEEEJNS2_3ForILl1ENS_6policy4loop9loop_execEJNS8_ILl3ESB_JNS2_6LambdaILl0EJEEEEEEEEEEEEE4execIRNS0_8LoopDataINS5_4listIJSG_EEENS5_5tupleIJNS_4impl4SpanINS_9Iterators16numeric_iteratorIN6Kripke9DirectionElPSS_EESS_EENSO_INSQ_INSR_6MomentElPSW_EESW_EENSO_INSQ_INSR_5GroupElPS10_EES10_EENSO_INSQ_INSR_4ZoneElPS14_EES14_EEEEENSM_IJEEEJZNK14LPlusTimesSdomclINSR_11ArchLayoutTINSR_12ArchT_OpenMPENSR_11LayoutT_DGZEEEEEvT_NSR_6SdomIdERKNSR_4Core3SetES1L_S1L_S1L_RNS1I_5FieldIdJSW_S10_S14_EEERNS1M_IdJSS_S10_S14_EEERNS1M_IdJSS_SW_EEEEUlSS_SW_S10_S14_E_EEEEEvOS1G_._omp_fn.0+0x547> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4a9ce7 <_ZN4RAJA8internal17StatementExecutorINS_9statement8CollapseINS_26omp_parallel_collapse_execEN4camp7int_seqIlJLl0ELl2EEEEJNS2_3ForILl1ENS_6policy4loop9loop_execEJNS8_ILl3ESB_JNS2_6LambdaILl0EJEEEEEEEEEEEEE4execIRNS0_8LoopDataINS5_4listIJSG_EEENS5_5tupleIJNS_4impl4SpanINS_9Iterators16numeric_iteratorIN6Kripke9DirectionElPSS_EESS_EENSO_INSQ_INSR_6MomentElPSW_EESW_EENSO_INSQ_INSR_5GroupElPS10_EES10_EENSO_INSQ_INSR_4ZoneElPS14_EES14_EEEEENSM_IJEEEJZNK14LPlusTimesSdomclINSR_11ArchLayoutTINSR_12ArchT_OpenMPENSR_11LayoutT_DGZEEEEEvT_NSR_6SdomIdERKNSR_4Core3SetES1L_S1L_S1L_RNS1I_5FieldIdJSW_S10_S14_EEERNS1M_IdJSS_S10_S14_EEERNS1M_IdJSS_SW_EEEEUlSS_SW_S10_S14_E_EEEEEvOS1G_._omp_fn.0+0x547> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xd0(%RSP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x1(%RCX),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x10(%RSP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x8(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R10,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SHR $0x2,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R11,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R12,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x1(%R12),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAL $0x5,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
IMUL %R9,%R13 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R12,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
ADD %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
AND $0x3,%R9D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
AND $0x3,%R10D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %RDI,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SAL $0x3,%R11 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RCX,0xc8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %R11D,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
INC %RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4a9887 <_ZN4RAJA8internal17StatementExecutorINS_9statement8CollapseINS_26omp_parallel_collapse_execEN4camp7int_seqIlJLl0ELl2EEEEJNS2_3ForILl1ENS_6policy4loop9loop_execEJNS8_ILl3ESB_JNS2_6LambdaILl0EJEEEEEEEEEEEEE4execIRNS0_8LoopDataINS5_4listIJSG_EEENS5_5tupleIJNS_4impl4SpanINS_9Iterators16numeric_iteratorIN6Kripke9DirectionElPSS_EESS_EENSO_INSQ_INSR_6MomentElPSW_EESW_EENSO_INSQ_INSR_5GroupElPS10_EES10_EENSO_INSQ_INSR_4ZoneElPS14_EES14_EEEEENSM_IJEEEJZNK14LPlusTimesSdomclINSR_11ArchLayoutTINSR_12ArchT_OpenMPENSR_11LayoutT_DGZEEEEEvT_NSR_6SdomIdERKNSR_4Core3SetES1L_S1L_S1L_RNS1I_5FieldIdJSW_S10_S14_EEERNS1M_IdJSS_S10_S14_EEERNS1M_IdJSS_SW_EEEEUlSS_SW_S10_S14_E_EEEEEvOS1G_._omp_fn.0+0xe7> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | Collapse.hpp:81-81 |
Module | exec |
nb instructions | 113 |
nb uops | 124 |
loop length | 500 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 23 |
micro-operation queue | 20.67 cycles |
front end | 20.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 6.40 | 9.00 | 10.67 | 10.67 | 15.00 | 6.20 | 6.20 | 15.00 | 15.00 | 15.00 | 6.20 | 10.67 |
cycles | 6.40 | 12.27 | 10.67 | 10.67 | 15.00 | 6.20 | 6.20 | 15.00 | 15.00 | 15.00 | 6.20 | 10.67 |
Cycles executing div or sqrt instructions | 20.00 |
FE+BE cycles | 20.28-20.38 |
Stall cycles | 0.01-0.11 |
SB full (events) | 0.04-0.44 |
Front-end | 20.67 |
Dispatch | 15.00 |
DIV/SQRT | 20.00 |
Overall L1 | 20.67 |
all | 1% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 6% |
all | 12% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 12% |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0xe0,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x10(%RDI),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x110(%RAX),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RAX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RAX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RAX),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,0x8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x60(%RAX),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x68(%RAX),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,0xd0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc0(%RAX),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xf0(%RAX),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x118(%RAX),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RAX),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa8(%RAX),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RSI,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R12,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x158(%RAX),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDI),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RDI),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R13,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4a9ce7 <_ZN4RAJA8internal17StatementExecutorINS_9statement8CollapseINS_26omp_parallel_collapse_execEN4camp7int_seqIlJLl0ELl2EEEEJNS2_3ForILl1ENS_6policy4loop9loop_execEJNS8_ILl3ESB_JNS2_6LambdaILl0EJEEEEEEEEEEEEE4execIRNS0_8LoopDataINS5_4listIJSG_EEENS5_5tupleIJNS_4impl4SpanINS_9Iterators16numeric_iteratorIN6Kripke9DirectionElPSS_EESS_EENSO_INSQ_INSR_6MomentElPSW_EESW_EENSO_INSQ_INSR_5GroupElPS10_EES10_EENSO_INSQ_INSR_4ZoneElPS14_EES14_EEEEENSM_IJEEEJZNK14LPlusTimesSdomclINSR_11ArchLayoutTINSR_12ArchT_OpenMPENSR_11LayoutT_DGZEEEEEvT_NSR_6SdomIdERKNSR_4Core3SetES1L_S1L_S1L_RNS1I_5FieldIdJSW_S10_S14_EEERNS1M_IdJSS_S10_S14_EEERNS1M_IdJSS_SW_EEEEUlSS_SW_S10_S14_E_EEEEEvOS1G_._omp_fn.0+0x547> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4a9ce7 <_ZN4RAJA8internal17StatementExecutorINS_9statement8CollapseINS_26omp_parallel_collapse_execEN4camp7int_seqIlJLl0ELl2EEEEJNS2_3ForILl1ENS_6policy4loop9loop_execEJNS8_ILl3ESB_JNS2_6LambdaILl0EJEEEEEEEEEEEEE4execIRNS0_8LoopDataINS5_4listIJSG_EEENS5_5tupleIJNS_4impl4SpanINS_9Iterators16numeric_iteratorIN6Kripke9DirectionElPSS_EESS_EENSO_INSQ_INSR_6MomentElPSW_EESW_EENSO_INSQ_INSR_5GroupElPS10_EES10_EENSO_INSQ_INSR_4ZoneElPS14_EES14_EEEEENSM_IJEEEJZNK14LPlusTimesSdomclINSR_11ArchLayoutTINSR_12ArchT_OpenMPENSR_11LayoutT_DGZEEEEEvT_NSR_6SdomIdERKNSR_4Core3SetES1L_S1L_S1L_RNS1I_5FieldIdJSW_S10_S14_EEERNS1M_IdJSS_S10_S14_EEERNS1M_IdJSS_SW_EEEEUlSS_SW_S10_S14_E_EEEEEvOS1G_._omp_fn.0+0x547> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CALL 4034d0 <omp_get_num_threads@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOVSXD %EAX,%R12 | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
CALL 403420 <omp_get_thread_num@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOVSXD %EAX,%RDI | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
MOV 0x78(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
IMUL %R13,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
DIV %R12 | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RDX,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4a9f0d <_ZN4RAJA8internal17StatementExecutorINS_9statement8CollapseINS_26omp_parallel_collapse_execEN4camp7int_seqIlJLl0ELl2EEEEJNS2_3ForILl1ENS_6policy4loop9loop_execEJNS8_ILl3ESB_JNS2_6LambdaILl0EJEEEEEEEEEEEEE4execIRNS0_8LoopDataINS5_4listIJSG_EEENS5_5tupleIJNS_4impl4SpanINS_9Iterators16numeric_iteratorIN6Kripke9DirectionElPSS_EESS_EENSO_INSQ_INSR_6MomentElPSW_EESW_EENSO_INSQ_INSR_5GroupElPS10_EES10_EENSO_INSQ_INSR_4ZoneElPS14_EES14_EEEEENSM_IJEEEJZNK14LPlusTimesSdomclINSR_11ArchLayoutTINSR_12ArchT_OpenMPENSR_11LayoutT_DGZEEEEEvT_NSR_6SdomIdERKNSR_4Core3SetES1L_S1L_S1L_RNS1I_5FieldIdJSW_S10_S14_EEERNS1M_IdJSS_S10_S14_EEERNS1M_IdJSS_SW_EEEEUlSS_SW_S10_S14_E_EEEEEvOS1G_._omp_fn.0+0x76d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
IMUL %RCX,%RDI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%RDI,%RDX,1),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RCX,%RAX,1),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RSI,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 4a9ce7 <_ZN4RAJA8internal17StatementExecutorINS_9statement8CollapseINS_26omp_parallel_collapse_execEN4camp7int_seqIlJLl0ELl2EEEEJNS2_3ForILl1ENS_6policy4loop9loop_execEJNS8_ILl3ESB_JNS2_6LambdaILl0EJEEEEEEEEEEEEE4execIRNS0_8LoopDataINS5_4listIJSG_EEENS5_5tupleIJNS_4impl4SpanINS_9Iterators16numeric_iteratorIN6Kripke9DirectionElPSS_EESS_EENSO_INSQ_INSR_6MomentElPSW_EESW_EENSO_INSQ_INSR_5GroupElPS10_EES10_EENSO_INSQ_INSR_4ZoneElPS14_EES14_EEEEENSM_IJEEEJZNK14LPlusTimesSdomclINSR_11ArchLayoutTINSR_12ArchT_OpenMPENSR_11LayoutT_DGZEEEEEvT_NSR_6SdomIdERKNSR_4Core3SetES1L_S1L_S1L_RNS1I_5FieldIdJSW_S10_S14_EEERNS1M_IdJSS_S10_S14_EEERNS1M_IdJSS_SW_EEEEUlSS_SW_S10_S14_E_EEEEEvOS1G_._omp_fn.0+0x547> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x60(%RSP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x70(%RSP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
DIVQ 0x78(%RSP) | 5 | 0 | 3 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 11-16 | 10 |
SUB %RBX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %R9,0x68(%RSP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JLE 4a9ce7 <_ZN4RAJA8internal17StatementExecutorINS_9statement8CollapseINS_26omp_parallel_collapse_execEN4camp7int_seqIlJLl0ELl2EEEEJNS2_3ForILl1ENS_6policy4loop9loop_execEJNS8_ILl3ESB_JNS2_6LambdaILl0EJEEEEEEEEEEEEE4execIRNS0_8LoopDataINS5_4listIJSG_EEENS5_5tupleIJNS_4impl4SpanINS_9Iterators16numeric_iteratorIN6Kripke9DirectionElPSS_EESS_EENSO_INSQ_INSR_6MomentElPSW_EESW_EENSO_INSQ_INSR_5GroupElPS10_EES10_EENSO_INSQ_INSR_4ZoneElPS14_EES14_EEEEENSM_IJEEEJZNK14LPlusTimesSdomclINSR_11ArchLayoutTINSR_12ArchT_OpenMPENSR_11LayoutT_DGZEEEEEvT_NSR_6SdomIdERKNSR_4Core3SetES1L_S1L_S1L_RNS1I_5FieldIdJSW_S10_S14_EEERNS1M_IdJSS_S10_S14_EEERNS1M_IdJSS_SW_EEEEUlSS_SW_S10_S14_E_EEEEEvOS1G_._omp_fn.0+0x547> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4a9ce7 <_ZN4RAJA8internal17StatementExecutorINS_9statement8CollapseINS_26omp_parallel_collapse_execEN4camp7int_seqIlJLl0ELl2EEEEJNS2_3ForILl1ENS_6policy4loop9loop_execEJNS8_ILl3ESB_JNS2_6LambdaILl0EJEEEEEEEEEEEEE4execIRNS0_8LoopDataINS5_4listIJSG_EEENS5_5tupleIJNS_4impl4SpanINS_9Iterators16numeric_iteratorIN6Kripke9DirectionElPSS_EESS_EENSO_INSQ_INSR_6MomentElPSW_EESW_EENSO_INSQ_INSR_5GroupElPS10_EES10_EENSO_INSQ_INSR_4ZoneElPS14_EES14_EEEEENSM_IJEEEJZNK14LPlusTimesSdomclINSR_11ArchLayoutTINSR_12ArchT_OpenMPENSR_11LayoutT_DGZEEEEEvT_NSR_6SdomIdERKNSR_4Core3SetES1L_S1L_S1L_RNS1I_5FieldIdJSW_S10_S14_EEERNS1M_IdJSS_S10_S14_EEERNS1M_IdJSS_SW_EEEEUlSS_SW_S10_S14_E_EEEEEvOS1G_._omp_fn.0+0x547> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xd0(%RSP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x1(%RCX),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x10(%RSP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x8(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R10,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SHR $0x2,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R11,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R12,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x1(%R12),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAL $0x5,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
IMUL %R9,%R13 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R12,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
ADD %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
AND $0x3,%R9D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
AND $0x3,%R10D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %RDI,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SAL $0x3,%R11 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RCX,0xc8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %R11D,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
INC %RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4a9887 <_ZN4RAJA8internal17StatementExecutorINS_9statement8CollapseINS_26omp_parallel_collapse_execEN4camp7int_seqIlJLl0ELl2EEEEJNS2_3ForILl1ENS_6policy4loop9loop_execEJNS8_ILl3ESB_JNS2_6LambdaILl0EJEEEEEEEEEEEEE4execIRNS0_8LoopDataINS5_4listIJSG_EEENS5_5tupleIJNS_4impl4SpanINS_9Iterators16numeric_iteratorIN6Kripke9DirectionElPSS_EESS_EENSO_INSQ_INSR_6MomentElPSW_EESW_EENSO_INSQ_INSR_5GroupElPS10_EES10_EENSO_INSQ_INSR_4ZoneElPS14_EES14_EEEEENSM_IJEEEJZNK14LPlusTimesSdomclINSR_11ArchLayoutTINSR_12ArchT_OpenMPENSR_11LayoutT_DGZEEEEEvT_NSR_6SdomIdERKNSR_4Core3SetES1L_S1L_S1L_RNS1I_5FieldIdJSW_S10_S14_EEERNS1M_IdJSS_S10_S14_EEERNS1M_IdJSS_SW_EEEEUlSS_SW_S10_S14_E_EEEEEvOS1G_._omp_fn.0+0xe7> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼void RAJA::internal::StatementExecutor | 4.1 | 2.17 |
▼Loop 1892 - RangeSegment.hpp:120-120 - exec– | 0 | 0 |
▼Loop 1891 - forall.hpp:59-59 - exec– | 0 | 0.01 |
○Loop 1894 - forall.hpp:59-59 - exec | 4.1 | 2.04 |
○Loop 1893 - forall.hpp:59-59 - exec | 0 | 0 |