Loop Id: 851 | Module: libparcsr_ls.so | Source: par_multi_interp.c:1072-1125 | Coverage: 0.06% |
---|
Loop Id: 851 | Module: libparcsr_ls.so | Source: par_multi_interp.c:1072-1125 | Coverage: 0.06% |
---|
0x88890 MOV -0xb0(%RBP),%R13 |
0x88897 MOV -0x70(%RBP),%RCX |
0x8889b MOV -0xd0(%RBP),%R8 |
0x888a2 MOV (%R13,%RCX,8),%RDI |
0x888a7 LEA 0x8(,%RDI,8),%RDX |
0x888af MOV (%R8,%RDI,8),%R11 |
0x888b3 MOV %RDI,%RAX |
0x888b6 ADD %RDX,%R8 |
0x888b9 NOT %RAX |
0x888bc MOV %R8,-0x90(%RBP) |
0x888c3 MOV (%R8),%R8 |
0x888c6 MOV %R11,-0x38(%RBP) |
0x888ca CMP %R8,%R11 |
0x888cd JGE 88bf0 |
0x888d3 MOV %RDI,-0xe0(%RBP) |
0x888da MOV %RBX,%R13 |
0x888dd MOV -0x88(%RBP),%RDI |
0x888e4 MOV %RDX,-0xc0(%RBP) |
0x888eb JMP 88901 |
(854) 0x888f0 INCQ -0x38(%RBP) |
(854) 0x888f4 MOV -0x38(%RBP),%RDX |
(854) 0x888f8 CMP %R8,%RDX |
(854) 0x888fb JGE 88bd8 |
(854) 0x88901 MOV -0x40(%RBP),%RDX |
(854) 0x88905 MOV -0x38(%RBP),%RBX |
(854) 0x88909 MOV (%RDX,%RBX,8),%RCX |
(854) 0x8890d MOV -0x48(%RBP),%RDX |
(854) 0x88911 LEA (,%RCX,8),%R11 |
(854) 0x88919 CMP %R13,(%RDX,%RCX,8) |
(854) 0x8891d JNE 888f0 |
(854) 0x8891f MOV -0x80(%RBP),%R8 |
(854) 0x88923 MOV -0x60(%RBP),%RBX |
(854) 0x88927 MOV (%R8,%RCX,8),%R8 |
(854) 0x8892b MOV 0x8(%RBX,%R11,1),%RBX |
(854) 0x88930 ADD %R8,%RBX |
(854) 0x88933 CMP %RBX,%R8 |
(854) 0x88936 JGE 88a94 |
(854) 0x8893c MOV -0x8(%R10,%R14,1),%RDX |
(854) 0x88941 LEA (%RDX,%RBX,8),%RBX |
(854) 0x88945 LEA (%RDX,%R8,8),%R8 |
(854) 0x88949 MOV %RBX,-0x68(%RBP) |
(854) 0x8894d SUB %R8,%RBX |
(854) 0x88950 SUB $0x8,%RBX |
(854) 0x88954 SHR $0x3,%RBX |
(854) 0x88958 INC %RBX |
(854) 0x8895b AND $0x3,%EBX |
(854) 0x8895e JE 88a07 |
(854) 0x88964 CMP $0x1,%RBX |
(854) 0x88968 JE 889ce |
(854) 0x8896a CMP $0x2,%RBX |
(854) 0x8896e JE 8899f |
(854) 0x88970 MOV (%R8),%RDX |
(854) 0x88973 MOV %RDX,%RBX |
(854) 0x88976 LEA (%R12,%RDX,8),%RDX |
(854) 0x8897a MOV %RDX,-0x88(%RBP) |
(854) 0x88981 CMP %RAX,(%RDX) |
(854) 0x88984 JE 8899b |
(854) 0x88986 MOV (%R10,%R14,1),%RDX |
(854) 0x8898a MOV %RBX,(%RDX,%RSI,8) |
(854) 0x8898e MOV -0x88(%RBP),%RBX |
(854) 0x88995 INC %RSI |
(854) 0x88998 MOV %RAX,(%RBX) |
(854) 0x8899b ADD $0x8,%R8 |
(854) 0x8899f MOV (%R8),%RDX |
(854) 0x889a2 MOV %RDX,%RBX |
(854) 0x889a5 LEA (%R12,%RDX,8),%RDX |
(854) 0x889a9 MOV %RDX,-0x88(%RBP) |
(854) 0x889b0 CMP %RAX,(%RDX) |
(854) 0x889b3 JE 889ca |
(854) 0x889b5 MOV (%R10,%R14,1),%RDX |
(854) 0x889b9 MOV %RBX,(%RDX,%RSI,8) |
(854) 0x889bd MOV -0x88(%RBP),%RBX |
(854) 0x889c4 INC %RSI |
(854) 0x889c7 MOV %RAX,(%RBX) |
(854) 0x889ca ADD $0x8,%R8 |
(854) 0x889ce MOV (%R8),%RDX |
(854) 0x889d1 MOV %RDX,%RBX |
(854) 0x889d4 LEA (%R12,%RDX,8),%RDX |
(854) 0x889d8 MOV %RDX,-0x88(%RBP) |
(854) 0x889df CMP %RAX,(%RDX) |
(854) 0x889e2 JE 889f9 |
(854) 0x889e4 MOV (%R10,%R14,1),%RDX |
(854) 0x889e8 MOV %RBX,(%RDX,%RSI,8) |
(854) 0x889ec MOV -0x88(%RBP),%RBX |
(854) 0x889f3 INC %RSI |
(854) 0x889f6 MOV %RAX,(%RBX) |
(854) 0x889f9 ADD $0x8,%R8 |
(854) 0x889fd CMP %R8,-0x68(%RBP) |
(854) 0x88a01 JE 88a94 |
(854) 0x88a07 MOV %RCX,-0x88(%RBP) |
(854) 0x88a0e MOV %RDI,%RBX |
(856) 0x88a11 MOV (%R8),%RDI |
(856) 0x88a14 LEA (%R12,%RDI,8),%RDX |
(856) 0x88a18 CMP %RAX,(%RDX) |
(856) 0x88a1b JE 88a2b |
(856) 0x88a1d MOV (%R10,%R14,1),%RCX |
(856) 0x88a21 MOV %RDI,(%RCX,%RSI,8) |
(856) 0x88a25 INC %RSI |
(856) 0x88a28 MOV %RAX,(%RDX) |
(856) 0x88a2b LEA 0x8(%R8),%RDX |
(856) 0x88a2f MOV 0x8(%R8),%R8 |
(856) 0x88a33 LEA (%R12,%R8,8),%RDI |
(856) 0x88a37 CMP %RAX,(%RDI) |
(856) 0x88a3a JE 88a4a |
(856) 0x88a3c MOV (%R10,%R14,1),%RCX |
(856) 0x88a40 MOV %R8,(%RCX,%RSI,8) |
(856) 0x88a44 INC %RSI |
(856) 0x88a47 MOV %RAX,(%RDI) |
(856) 0x88a4a MOV 0x8(%RDX),%R8 |
(856) 0x88a4e LEA (%R12,%R8,8),%RDI |
(856) 0x88a52 CMP %RAX,(%RDI) |
(856) 0x88a55 JE 88a65 |
(856) 0x88a57 MOV (%R10,%R14,1),%RCX |
(856) 0x88a5b MOV %R8,(%RCX,%RSI,8) |
(856) 0x88a5f INC %RSI |
(856) 0x88a62 MOV %RAX,(%RDI) |
(856) 0x88a65 MOV 0x10(%RDX),%R8 |
(856) 0x88a69 LEA (%R12,%R8,8),%RDI |
(856) 0x88a6d CMP %RAX,(%RDI) |
(856) 0x88a70 JE 88a80 |
(856) 0x88a72 MOV (%R10,%R14,1),%RCX |
(856) 0x88a76 MOV %R8,(%RCX,%RSI,8) |
(856) 0x88a7a INC %RSI |
(856) 0x88a7d MOV %RAX,(%RDI) |
(856) 0x88a80 LEA 0x18(%RDX),%R8 |
(856) 0x88a84 CMP %R8,-0x68(%RBP) |
(856) 0x88a88 JNE 88a11 |
(854) 0x88a8a MOV -0x88(%RBP),%RCX |
(854) 0x88a91 MOV %RBX,%RDI |
(854) 0x88a94 MOV -0x78(%RBP),%RBX |
(854) 0x88a98 MOV -0x58(%RBP),%RDX |
(854) 0x88a9c MOV (%RBX,%RCX,8),%RCX |
(854) 0x88aa0 MOV 0x8(%RDX,%R11,1),%R8 |
(854) 0x88aa5 ADD %RCX,%R8 |
(854) 0x88aa8 CMP %R8,%RCX |
(854) 0x88aab JGE 88fd0 |
(854) 0x88ab1 MOV -0x8(%R9,%R14,1),%RBX |
(854) 0x88ab6 LEA (%RBX,%RCX,8),%RCX |
(854) 0x88aba LEA (%RBX,%R8,8),%RBX |
(854) 0x88abe MOV %RBX,%RDX |
(854) 0x88ac1 SUB %RCX,%RDX |
(854) 0x88ac4 SUB $0x8,%RDX |
(854) 0x88ac8 SHR $0x3,%RDX |
(854) 0x88acc INC %RDX |
(854) 0x88acf AND $0x3,%EDX |
(854) 0x88ad2 JE 88b3f |
(854) 0x88ad4 CMP $0x1,%RDX |
(854) 0x88ad8 JE 88b1c |
(854) 0x88ada CMP $0x2,%RDX |
(854) 0x88ade JE 88afe |
(854) 0x88ae0 MOV (%RCX),%R11 |
(854) 0x88ae3 LEA (%R15,%R11,8),%R8 |
(854) 0x88ae7 CMP %RAX,(%R8) |
(854) 0x88aea JE 88afa |
(854) 0x88aec MOV (%R9,%R14,1),%RDX |
(854) 0x88af0 MOV %R11,(%RDX,%RDI,8) |
(854) 0x88af4 INC %RDI |
(854) 0x88af7 MOV %RAX,(%R8) |
(854) 0x88afa ADD $0x8,%RCX |
(854) 0x88afe MOV (%RCX),%R11 |
(854) 0x88b01 LEA (%R15,%R11,8),%R8 |
(854) 0x88b05 CMP %RAX,(%R8) |
(854) 0x88b08 JE 88b18 |
(854) 0x88b0a MOV (%R9,%R14,1),%RDX |
(854) 0x88b0e MOV %R11,(%RDX,%RDI,8) |
(854) 0x88b12 INC %RDI |
(854) 0x88b15 MOV %RAX,(%R8) |
(854) 0x88b18 ADD $0x8,%RCX |
(854) 0x88b1c MOV (%RCX),%R11 |
(854) 0x88b1f LEA (%R15,%R11,8),%R8 |
(854) 0x88b23 CMP %RAX,(%R8) |
(854) 0x88b26 JE 88b36 |
(854) 0x88b28 MOV (%R9,%R14,1),%RDX |
(854) 0x88b2c MOV %R11,(%RDX,%RDI,8) |
(854) 0x88b30 INC %RDI |
(854) 0x88b33 MOV %RAX,(%R8) |
(854) 0x88b36 ADD $0x8,%RCX |
(854) 0x88b3a CMP %RBX,%RCX |
(854) 0x88b3d JE 88bb7 |
(855) 0x88b3f MOV (%RCX),%R8 |
(855) 0x88b42 LEA (%R15,%R8,8),%RDX |
(855) 0x88b46 CMP %RAX,(%RDX) |
(855) 0x88b49 JE 88b59 |
(855) 0x88b4b MOV (%R9,%R14,1),%R11 |
(855) 0x88b4f MOV %R8,(%R11,%RDI,8) |
(855) 0x88b53 INC %RDI |
(855) 0x88b56 MOV %RAX,(%RDX) |
(855) 0x88b59 MOV 0x8(%RCX),%R8 |
(855) 0x88b5d LEA 0x8(%RCX),%RDX |
(855) 0x88b61 LEA (%R15,%R8,8),%RCX |
(855) 0x88b65 CMP %RAX,(%RCX) |
(855) 0x88b68 JE 88b78 |
(855) 0x88b6a MOV (%R9,%R14,1),%R11 |
(855) 0x88b6e MOV %R8,(%R11,%RDI,8) |
(855) 0x88b72 INC %RDI |
(855) 0x88b75 MOV %RAX,(%RCX) |
(855) 0x88b78 MOV 0x8(%RDX),%R8 |
(855) 0x88b7c LEA (%R15,%R8,8),%RCX |
(855) 0x88b80 CMP %RAX,(%RCX) |
(855) 0x88b83 JE 88b93 |
(855) 0x88b85 MOV (%R9,%R14,1),%R11 |
(855) 0x88b89 MOV %R8,(%R11,%RDI,8) |
(855) 0x88b8d INC %RDI |
(855) 0x88b90 MOV %RAX,(%RCX) |
(855) 0x88b93 MOV 0x10(%RDX),%R8 |
(855) 0x88b97 LEA (%R15,%R8,8),%RCX |
(855) 0x88b9b CMP %RAX,(%RCX) |
(855) 0x88b9e JE 88bae |
(855) 0x88ba0 MOV (%R9,%R14,1),%R11 |
(855) 0x88ba4 MOV %R8,(%R11,%RDI,8) |
(855) 0x88ba8 INC %RDI |
(855) 0x88bab MOV %RAX,(%RCX) |
(855) 0x88bae LEA 0x18(%RDX),%RCX |
(855) 0x88bb2 CMP %RBX,%RCX |
(855) 0x88bb5 JNE 88b3f |
(854) 0x88bb7 INCQ -0x38(%RBP) |
(854) 0x88bbb MOV -0x90(%RBP),%RBX |
(854) 0x88bc2 MOV (%RBX),%R8 |
(854) 0x88bc5 MOV -0x38(%RBP),%RDX |
(854) 0x88bc9 CMP %R8,%RDX |
(854) 0x88bcc JL 88901 |
0x88bd2 NOPW (%RAX,%RAX,1) |
0x88bd8 MOV %RDI,-0x88(%RBP) |
0x88bdf MOV -0xc0(%RBP),%RDX |
0x88be6 MOV %R13,%RBX |
0x88be9 MOV -0xe0(%RBP),%RDI |
0x88bf0 MOV -0xc8(%RBP),%R11 |
0x88bf7 MOV (%R11,%RDI,8),%RAX |
0x88bfb ADD %RDX,%R11 |
0x88bfe NOT %RDI |
0x88c01 MOV (%R11),%RCX |
0x88c04 MOV %R11,-0xc0(%RBP) |
0x88c0b CMP %RAX,%RCX |
0x88c0e JLE 88eca |
0x88c14 MOV -0x88(%RBP),%R8 |
0x88c1b MOV -0xd8(%RBP),%R13 |
0x88c22 MOV %R9,-0x68(%RBP) |
0x88c26 MOV %R10,-0x90(%RBP) |
0x88c2d JMP 88c3c |
(852) 0x88c30 INC %RAX |
(852) 0x88c33 CMP %RCX,%RAX |
(852) 0x88c36 JGE 88eb8 |
(852) 0x88c3c MOV -0x50(%RBP),%R9 |
(852) 0x88c40 MOV (%R9,%RAX,8),%RDX |
(852) 0x88c44 LEA (,%RDX,8),%R11 |
(852) 0x88c4c CMP %RBX,(%R13,%RDX,8) |
(852) 0x88c51 JNE 88c30 |
(852) 0x88c53 MOV -0xa0(%RBP),%R10 |
(852) 0x88c5a MOV -0x98(%RBP),%R9 |
(852) 0x88c61 MOV (%R10,%RDX,8),%RDX |
(852) 0x88c65 MOV 0x8(%R9,%R11,1),%R11 |
(852) 0x88c6a ADD %RDX,%R11 |
(852) 0x88c6d CMP %R11,%RDX |
(852) 0x88c70 JGE 88c30 |
(852) 0x88c72 MOV -0xa8(%RBP),%RCX |
(852) 0x88c79 MOV (%RCX,%R14,1),%R10 |
(852) 0x88c7d LEA (%R10,%R11,8),%R9 |
(852) 0x88c81 LEA (%R10,%RDX,8),%RDX |
(852) 0x88c85 MOV %R9,-0x38(%RBP) |
(852) 0x88c89 SUB %RDX,%R9 |
(852) 0x88c8c SUB $0x8,%R9 |
(852) 0x88c90 SHR $0x3,%R9 |
(852) 0x88c94 INC %R9 |
(852) 0x88c97 AND $0x3,%R9D |
(852) 0x88c9b JE 88d3b |
(852) 0x88ca1 CMP $0x1,%R9 |
(852) 0x88ca5 JE 88d03 |
(852) 0x88ca7 CMP $0x2,%R9 |
(852) 0x88cab JE 88cd8 |
(852) 0x88cad MOV (%RDX),%RCX |
(852) 0x88cb0 TEST %RCX,%RCX |
(852) 0x88cb3 JS 88fe0 |
(852) 0x88cb9 LEA (%R15,%RCX,8),%R11 |
(852) 0x88cbd CMP %RDI,(%R11) |
(852) 0x88cc0 JE 88cd4 |
(852) 0x88cc2 MOV -0x68(%RBP),%R10 |
(852) 0x88cc6 MOV (%R10,%R14,1),%R9 |
(852) 0x88cca MOV %RCX,(%R9,%R8,8) |
(852) 0x88cce INC %R8 |
(852) 0x88cd1 MOV %RDI,(%R11) |
(852) 0x88cd4 ADD $0x8,%RDX |
(852) 0x88cd8 MOV (%RDX),%RCX |
(852) 0x88cdb TEST %RCX,%RCX |
(852) 0x88cde JS 88fa0 |
(852) 0x88ce4 LEA (%R15,%RCX,8),%R10 |
(852) 0x88ce8 CMP %RDI,(%R10) |
(852) 0x88ceb JE 88cff |
(852) 0x88ced MOV -0x68(%RBP),%R9 |
(852) 0x88cf1 MOV (%R9,%R14,1),%R11 |
(852) 0x88cf5 MOV %RCX,(%R11,%R8,8) |
(852) 0x88cf9 INC %R8 |
(852) 0x88cfc MOV %RDI,(%R10) |
(852) 0x88cff ADD $0x8,%RDX |
(852) 0x88d03 MOV (%RDX),%RCX |
(852) 0x88d06 TEST %RCX,%RCX |
(852) 0x88d09 JS 88f68 |
(852) 0x88d0f LEA (%R15,%RCX,8),%R11 |
(852) 0x88d13 CMP %RDI,(%R11) |
(852) 0x88d16 JE 88d2a |
(852) 0x88d18 MOV -0x68(%RBP),%R9 |
(852) 0x88d1c MOV (%R9,%R14,1),%R10 |
(852) 0x88d20 MOV %RCX,(%R10,%R8,8) |
(852) 0x88d24 INC %R8 |
(852) 0x88d27 MOV %RDI,(%R11) |
(852) 0x88d2a MOV -0x38(%RBP),%RCX |
(852) 0x88d2e ADD $0x8,%RDX |
(852) 0x88d32 CMP %RCX,%RDX |
(852) 0x88d35 JE 88e9d |
(852) 0x88d3b MOV -0x68(%RBP),%R9 |
(852) 0x88d3f MOV -0x90(%RBP),%R10 |
(852) 0x88d46 MOV %RAX,-0x88(%RBP) |
(852) 0x88d4d JMP 88dc0 |
(853) 0x88d50 LEA (%R15,%RDX,8),%R11 |
(853) 0x88d54 CMP %RDI,(%R11) |
(853) 0x88d57 JE 88d67 |
(853) 0x88d59 MOV (%R9,%R14,1),%RAX |
(853) 0x88d5d MOV %RDX,(%RAX,%R8,8) |
(853) 0x88d61 INC %R8 |
(853) 0x88d64 MOV %RDI,(%R11) |
(853) 0x88d67 MOV 0x8(%RCX),%RDX |
(853) 0x88d6b TEST %RDX,%RDX |
(853) 0x88d6e JS 88e25 |
(853) 0x88d74 LEA (%R15,%RDX,8),%R11 |
(853) 0x88d78 CMP %RDI,(%R11) |
(853) 0x88d7b JE 88d8b |
(853) 0x88d7d MOV (%R9,%R14,1),%RAX |
(853) 0x88d81 MOV %RDX,(%RAX,%R8,8) |
(853) 0x88d85 INC %R8 |
(853) 0x88d88 MOV %RDI,(%R11) |
(853) 0x88d8b MOV 0x10(%RCX),%RDX |
(853) 0x88d8f TEST %RDX,%RDX |
(853) 0x88d92 JS 88e56 |
(853) 0x88d98 LEA (%R15,%RDX,8),%R11 |
(853) 0x88d9c CMP %RDI,(%R11) |
(853) 0x88d9f JE 88daf |
(853) 0x88da1 MOV (%R9,%R14,1),%RAX |
(853) 0x88da5 MOV %RDX,(%RAX,%R8,8) |
(853) 0x88da9 INC %R8 |
(853) 0x88dac MOV %RDI,(%R11) |
(853) 0x88daf LEA 0x18(%RCX),%RDX |
(853) 0x88db3 MOV -0x38(%RBP),%RCX |
(853) 0x88db7 CMP %RCX,%RDX |
(853) 0x88dba JE 88e8b |
(853) 0x88dc0 MOV (%RDX),%RCX |
(853) 0x88dc3 TEST %RCX,%RCX |
(853) 0x88dc6 JS 88f38 |
(853) 0x88dcc LEA (%R15,%RCX,8),%R11 |
(853) 0x88dd0 CMP %RDI,(%R11) |
(853) 0x88dd3 JE 88de3 |
(853) 0x88dd5 MOV (%R9,%R14,1),%RAX |
(853) 0x88dd9 MOV %RCX,(%RAX,%R8,8) |
(853) 0x88ddd INC %R8 |
(853) 0x88de0 MOV %RDI,(%R11) |
(853) 0x88de3 LEA 0x8(%RDX),%RCX |
(853) 0x88de7 MOV 0x8(%RDX),%RDX |
(853) 0x88deb TEST %RDX,%RDX |
(853) 0x88dee JNS 88d50 |
(853) 0x88df4 MOV %RDX,%R11 |
(853) 0x88df7 NOT %R11 |
(853) 0x88dfa LEA (%R12,%R11,8),%R11 |
(853) 0x88dfe CMP %RDI,(%R11) |
(853) 0x88e01 JE 88d67 |
(853) 0x88e07 MOV (%R10,%R14,1),%RAX |
(853) 0x88e0b NOT %RDX |
(853) 0x88e0e MOV %RDX,(%RAX,%RSI,8) |
(853) 0x88e12 INC %RSI |
(853) 0x88e15 MOV %RDI,(%R11) |
(853) 0x88e18 MOV 0x8(%RCX),%RDX |
(853) 0x88e1c TEST %RDX,%RDX |
(853) 0x88e1f JNS 88d74 |
(853) 0x88e25 MOV %RDX,%R11 |
(853) 0x88e28 NOT %R11 |
(853) 0x88e2b LEA (%R12,%R11,8),%R11 |
(853) 0x88e2f CMP %RDI,(%R11) |
(853) 0x88e32 JE 88d8b |
(853) 0x88e38 MOV (%R10,%R14,1),%RAX |
(853) 0x88e3c NOT %RDX |
(853) 0x88e3f MOV %RDX,(%RAX,%RSI,8) |
(853) 0x88e43 INC %RSI |
(853) 0x88e46 MOV %RDI,(%R11) |
(853) 0x88e49 MOV 0x10(%RCX),%RDX |
(853) 0x88e4d TEST %RDX,%RDX |
(853) 0x88e50 JNS 88d98 |
(853) 0x88e56 MOV %RDX,%R11 |
(853) 0x88e59 NOT %R11 |
(853) 0x88e5c LEA (%R12,%R11,8),%R11 |
(853) 0x88e60 CMP %RDI,(%R11) |
(853) 0x88e63 JE 88daf |
(853) 0x88e69 MOV (%R10,%R14,1),%RAX |
(853) 0x88e6d NOT %RDX |
(853) 0x88e70 MOV %RDX,(%RAX,%RSI,8) |
(853) 0x88e74 LEA 0x18(%RCX),%RDX |
(853) 0x88e78 MOV -0x38(%RBP),%RCX |
(853) 0x88e7c INC %RSI |
(853) 0x88e7f MOV %RDI,(%R11) |
(853) 0x88e82 CMP %RCX,%RDX |
(853) 0x88e85 JNE 88dc0 |
(852) 0x88e8b MOV %R9,-0x68(%RBP) |
(852) 0x88e8f MOV -0x88(%RBP),%RAX |
(852) 0x88e96 MOV %R10,-0x90(%RBP) |
(852) 0x88e9d MOV -0xc0(%RBP),%R9 |
(852) 0x88ea4 INC %RAX |
(852) 0x88ea7 MOV (%R9),%RCX |
(852) 0x88eaa CMP %RCX,%RAX |
(852) 0x88ead JL 88c3c |
0x88eb3 NOPL (%RAX,%RAX,1) |
0x88eb8 MOV -0x68(%RBP),%R9 |
0x88ebc MOV -0x90(%RBP),%R10 |
0x88ec3 MOV %R8,-0x88(%RBP) |
0x88eca INCQ -0x70(%RBP) |
0x88ece MOV -0x70(%RBP),%RDI |
0x88ed2 CMP %RDI,-0xb8(%RBP) |
0x88ed9 JG 88890 |
(853) 0x88f38 MOV %RCX,%R11 |
(853) 0x88f3b NOT %R11 |
(853) 0x88f3e LEA (%R12,%R11,8),%R11 |
(853) 0x88f42 CMP %RDI,(%R11) |
(853) 0x88f45 JE 88de3 |
(853) 0x88f4b MOV (%R10,%R14,1),%RAX |
(853) 0x88f4f NOT %RCX |
(853) 0x88f52 MOV %RCX,(%RAX,%RSI,8) |
(853) 0x88f56 INC %RSI |
(853) 0x88f59 MOV %RDI,(%R11) |
(853) 0x88f5c JMP 88de3 |
(852) 0x88f68 MOV %RCX,%R11 |
(852) 0x88f6b NOT %R11 |
(852) 0x88f6e LEA (%R12,%R11,8),%R10 |
(852) 0x88f72 CMP %RDI,(%R10) |
(852) 0x88f75 JE 88d2a |
(852) 0x88f7b MOV -0x90(%RBP),%R9 |
(852) 0x88f82 NOT %RCX |
(852) 0x88f85 MOV (%R9,%R14,1),%R11 |
(852) 0x88f89 MOV %RCX,(%R11,%RSI,8) |
(852) 0x88f8d INC %RSI |
(852) 0x88f90 MOV %RDI,(%R10) |
(852) 0x88f93 JMP 88d2a |
(852) 0x88fa0 MOV %RCX,%R10 |
(852) 0x88fa3 NOT %R10 |
(852) 0x88fa6 LEA (%R12,%R10,8),%R11 |
(852) 0x88faa CMP %RDI,(%R11) |
(852) 0x88fad JE 88cff |
(852) 0x88fb3 MOV -0x90(%RBP),%R9 |
(852) 0x88fba NOT %RCX |
(852) 0x88fbd MOV (%R9,%R14,1),%R10 |
(852) 0x88fc1 MOV %RCX,(%R10,%RSI,8) |
(852) 0x88fc5 INC %RSI |
(852) 0x88fc8 MOV %RDI,(%R11) |
(852) 0x88fcb JMP 88cff |
(854) 0x88fd0 MOV -0x90(%RBP),%R11 |
(854) 0x88fd7 MOV (%R11),%R8 |
(854) 0x88fda JMP 888f0 |
(852) 0x88fe0 MOV %RCX,%R11 |
(852) 0x88fe3 NOT %R11 |
(852) 0x88fe6 LEA (%R12,%R11,8),%R10 |
(852) 0x88fea CMP %RDI,(%R10) |
(852) 0x88fed JE 88cd4 |
(852) 0x88ff3 MOV -0x90(%RBP),%R9 |
(852) 0x88ffa NOT %RCX |
(852) 0x88ffd MOV (%R9,%R14,1),%R11 |
(852) 0x89001 MOV %RCX,(%R11,%RSI,8) |
(852) 0x89005 INC %RSI |
(852) 0x89008 MOV %RDI,(%R10) |
(852) 0x8900b JMP 88cd4 |
/scratch_na/users/xoserete/qaas_runs/171-415-3872/intel/AMG/build/AMG/AMG/parcsr_ls/par_multi_interp.c: 1072 - 1125 |
-------------------------------------------------------------------------------- |
1072: for (i=thread_start; i < thread_stop; i++) |
1073: { |
1074: i1 = pass_array[i]; |
1075: for (j=S_diag_i[i1]; j < S_diag_i[i1+1]; j++) |
1076: { |
1077: j1 = S_diag_j[j]; |
1078: if (assigned[j1] == pass-1) |
1079: { |
1080: j_start = P_diag_start[j1]; |
1081: j_end = j_start+P_diag_i[j1+1]; |
1082: for (k=j_start; k < j_end; k++) |
1083: { |
1084: k1 = P_diag_pass[pass-1][k]; |
1085: if (P_marker[k1] != -i1-1) |
1086: { |
1087: P_diag_pass[pass][cnt_nz++] = k1; |
1088: P_marker[k1] = -i1-1; |
1089: } |
1090: } |
1091: j_start = P_offd_start[j1]; |
1092: j_end = j_start+P_offd_i[j1+1]; |
1093: for (k=j_start; k < j_end; k++) |
1094: { |
1095: k1 = P_offd_pass[pass-1][k]; |
1096: if (P_marker_offd[k1] != -i1-1) |
1097: { |
1098: P_offd_pass[pass][cnt_nz_offd++] = k1; |
1099: P_marker_offd[k1] = -i1-1; |
1100: } |
1101: } |
1102: } |
1103: } |
1104: for (j=S_offd_i[i1]; j < S_offd_i[i1+1]; j++) |
1105: { |
1106: j1 = S_offd_j[j]; |
1107: if (assigned_offd[j1] == pass-1) |
1108: { |
1109: j_start = Pext_start[j1]; |
1110: j_end = j_start+Pext_i[j1+1]; |
1111: for (k=j_start; k < j_end; k++) |
1112: { |
1113: k1 = Pext_pass[pass][k]; |
1114: if (k1 < 0) |
1115: { |
1116: if (P_marker[-k1-1] != -i1-1) |
1117: { |
1118: P_diag_pass[pass][cnt_nz++] = -k1-1; |
1119: P_marker[-k1-1] = -i1-1; |
1120: } |
1121: } |
1122: else if (P_marker_offd[k1] != -i1-1) |
1123: { |
1124: P_offd_pass[pass][cnt_nz_offd++] = k1; |
1125: P_marker_offd[k1] = -i1-1; |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
○98.02 | gomp_thread_start | team.c:130 | libgomp.so.1.0.0 |
○1.98 | GOMP_parallel | libgomp.h:985 | libgomp.so.1.0.0 |
Path / |
Metric | Value |
---|---|
CQA speedup if no scalar integer | 1.00 |
CQA speedup if FP arith vectorized | 1.00 |
CQA speedup if fully vectorized | 8.00 |
CQA speedup if no inter-iteration dependency | NA |
CQA speedup if next bottleneck killed | 1.21 |
Bottlenecks | micro-operation queue, |
Function | hypre_BoomerAMGBuildMultipass._omp_fn.5 |
Source | par_multi_interp.c:1072-1075,par_multi_interp.c:1104-1104,par_multi_interp.c:1122-1122 |
Source loop unroll info | NA |
Source loop unroll confidence level | NA |
Unroll/vectorization loop type | NA |
Unroll factor | NA |
CQA cycles | 7.67 |
CQA cycles if no scalar integer | 7.67 |
CQA cycles if FP arith vectorized | 7.67 |
CQA cycles if fully vectorized | 0.96 |
Front-end cycles | 7.67 |
DIV/SQRT cycles | 0.00 |
P0 cycles | 2.10 |
P1 cycles | 2.00 |
P2 cycles | 6.33 |
P3 cycles | 6.33 |
P4 cycles | 5.00 |
P5 cycles | 2.00 |
P6 cycles | 1.90 |
P7 cycles | 5.00 |
P8 cycles | 5.00 |
P9 cycles | 5.00 |
P10 cycles | 2.00 |
P11 cycles | 6.33 |
Inter-iter dependencies cycles | NA |
FE+BE cycles (UFS) | 7.86 |
Stall cycles (UFS) | 0.00 |
Nb insns | 45.00 |
Nb uops | 46.00 |
Nb loads | 19.00 |
Nb stores | 10.00 |
Nb stack references | 12.00 |
FLOP/cycle | 0.00 |
Nb FLOP add-sub | 0.00 |
Nb FLOP mul | 0.00 |
Nb FLOP fma | 0.00 |
Nb FLOP div | 0.00 |
Nb FLOP rcp | 0.00 |
Nb FLOP sqrt | 0.00 |
Nb FLOP rsqrt | 0.00 |
Bytes/cycle | 30.26 |
Bytes prefetched | 0.00 |
Bytes loaded | 152.00 |
Bytes stored | 80.00 |
Stride 0 | NA |
Stride 1 | NA |
Stride n | NA |
Stride unknown | NA |
Stride indirect | NA |
Vectorization ratio all | 0.00 |
Vectorization ratio load | 0.00 |
Vectorization ratio store | 0.00 |
Vectorization ratio mul | NA |
Vectorization ratio add_sub | NA |
Vectorization ratio fma | NA |
Vectorization ratio div_sqrt | NA |
Vectorization ratio other | 0.00 |
Vector-efficiency ratio all | 12.50 |
Vector-efficiency ratio load | 12.50 |
Vector-efficiency ratio store | 12.50 |
Vector-efficiency ratio mul | NA |
Vector-efficiency ratio add_sub | NA |
Vector-efficiency ratio fma | NA |
Vector-efficiency ratio div_sqrt | NA |
Vector-efficiency ratio other | 12.50 |
Metric | Value |
---|---|
CQA speedup if no scalar integer | 1.00 |
CQA speedup if FP arith vectorized | 1.00 |
CQA speedup if fully vectorized | 8.00 |
CQA speedup if no inter-iteration dependency | NA |
CQA speedup if next bottleneck killed | 1.21 |
Bottlenecks | micro-operation queue, |
Function | hypre_BoomerAMGBuildMultipass._omp_fn.5 |
Source | par_multi_interp.c:1072-1075,par_multi_interp.c:1104-1104,par_multi_interp.c:1122-1122 |
Source loop unroll info | NA |
Source loop unroll confidence level | NA |
Unroll/vectorization loop type | NA |
Unroll factor | NA |
CQA cycles | 7.67 |
CQA cycles if no scalar integer | 7.67 |
CQA cycles if FP arith vectorized | 7.67 |
CQA cycles if fully vectorized | 0.96 |
Front-end cycles | 7.67 |
DIV/SQRT cycles | 0.00 |
P0 cycles | 2.10 |
P1 cycles | 2.00 |
P2 cycles | 6.33 |
P3 cycles | 6.33 |
P4 cycles | 5.00 |
P5 cycles | 2.00 |
P6 cycles | 1.90 |
P7 cycles | 5.00 |
P8 cycles | 5.00 |
P9 cycles | 5.00 |
P10 cycles | 2.00 |
P11 cycles | 6.33 |
Inter-iter dependencies cycles | NA |
FE+BE cycles (UFS) | 7.86 |
Stall cycles (UFS) | 0.00 |
Nb insns | 45.00 |
Nb uops | 46.00 |
Nb loads | 19.00 |
Nb stores | 10.00 |
Nb stack references | 12.00 |
FLOP/cycle | 0.00 |
Nb FLOP add-sub | 0.00 |
Nb FLOP mul | 0.00 |
Nb FLOP fma | 0.00 |
Nb FLOP div | 0.00 |
Nb FLOP rcp | 0.00 |
Nb FLOP sqrt | 0.00 |
Nb FLOP rsqrt | 0.00 |
Bytes/cycle | 30.26 |
Bytes prefetched | 0.00 |
Bytes loaded | 152.00 |
Bytes stored | 80.00 |
Stride 0 | NA |
Stride 1 | NA |
Stride n | NA |
Stride unknown | NA |
Stride indirect | NA |
Vectorization ratio all | 0.00 |
Vectorization ratio load | 0.00 |
Vectorization ratio store | 0.00 |
Vectorization ratio mul | NA |
Vectorization ratio add_sub | NA |
Vectorization ratio fma | NA |
Vectorization ratio div_sqrt | NA |
Vectorization ratio other | 0.00 |
Vector-efficiency ratio all | 12.50 |
Vector-efficiency ratio load | 12.50 |
Vector-efficiency ratio store | 12.50 |
Vector-efficiency ratio mul | NA |
Vector-efficiency ratio add_sub | NA |
Vector-efficiency ratio fma | NA |
Vector-efficiency ratio div_sqrt | NA |
Vector-efficiency ratio other | 12.50 |
Path / |
Function | hypre_BoomerAMGBuildMultipass._omp_fn.5 |
Source file and lines | par_multi_interp.c:1072-1125 |
Module | libparcsr_ls.so |
nb instructions | 45 |
nb uops | 46 |
loop length | 230 |
used x86 registers | 11 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 12 |
micro-operation queue | 7.67 cycles |
front end | 7.67 cycles |
 | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 2.10 | 2.00 | 6.33 | 6.33 | 5.00 | 2.00 | 1.90 | 5.00 | 5.00 | 5.00 | 2.00 | 6.33 |
cycles | 2.10 | 2.00 | 6.33 | 6.33 | 5.00 | 2.00 | 1.90 | 5.00 | 5.00 | 5.00 | 2.00 | 6.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 7.86 |
Stall cycles | 0.00 |
Front-end | 7.67 |
Dispatch | 6.33 |
Overall L1 | 7.67 |
Vectorization ratios
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
Vector-efficiency ratios
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
MOV -0xb0(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x70(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xd0(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R13,%RCX,8),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x8(,%RDI,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV (%R8,%RDI,8),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDI,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
ADD %RDX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R8,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%R8),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R11,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %R8,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 88bf0 <hypre_BoomerAMGBuildMultipass._omp_fn.5+0x1120> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RDI,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x88(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 88901 <hypre_BoomerAMGBuildMultipass._omp_fn.5+0xe31> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xc0(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0xe0(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xc8(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R11,%RDI,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RDX,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOT %RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV (%R11),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R11,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 88eca <hypre_BoomerAMGBuildMultipass._omp_fn.5+0x13fa> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x88(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xd8(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 88c3c <hypre_BoomerAMGBuildMultipass._omp_fn.5+0x116c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x68(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x90(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R8,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
INCQ -0x70(%RBP) | 3 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
MOV -0x70(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDI,-0xb8(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JG 88890 <hypre_BoomerAMGBuildMultipass._omp_fn.5+0xdc0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
Function | hypre_BoomerAMGBuildMultipass._omp_fn.5 |
Source file and lines | par_multi_interp.c:1072-1125 |
Module | libparcsr_ls.so |
nb instructions | 45 |
nb uops | 46 |
loop length | 230 |
used x86 registers | 11 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 12 |
micro-operation queue | 7.67 cycles |
front end | 7.67 cycles |
 | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 2.10 | 2.00 | 6.33 | 6.33 | 5.00 | 2.00 | 1.90 | 5.00 | 5.00 | 5.00 | 2.00 | 6.33 |
cycles | 2.10 | 2.00 | 6.33 | 6.33 | 5.00 | 2.00 | 1.90 | 5.00 | 5.00 | 5.00 | 2.00 | 6.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 7.86 |
Stall cycles | 0.00 |
Front-end | 7.67 |
Dispatch | 6.33 |
Overall L1 | 7.67 |
Vectorization ratios
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
Vector-efficiency ratios
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
MOV -0xb0(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x70(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xd0(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R13,%RCX,8),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x8(,%RDI,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV (%R8,%RDI,8),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDI,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
ADD %RDX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R8,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%R8),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R11,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %R8,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 88bf0 <hypre_BoomerAMGBuildMultipass._omp_fn.5+0x1120> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RDI,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x88(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 88901 <hypre_BoomerAMGBuildMultipass._omp_fn.5+0xe31> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xc0(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0xe0(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xc8(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R11,%RDI,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RDX,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOT %RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV (%R11),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R11,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 88eca <hypre_BoomerAMGBuildMultipass._omp_fn.5+0x13fa> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x88(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xd8(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 88c3c <hypre_BoomerAMGBuildMultipass._omp_fn.5+0x116c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x68(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x90(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R8,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
INCQ -0x70(%RBP) | 3 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
MOV -0x70(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDI,-0xb8(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JG 88890 <hypre_BoomerAMGBuildMultipass._omp_fn.5+0xdc0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |