Function: _Z16initialise_chunkiR16global_variables.extracted.7 | Module: exec | Source: initialise_chunk.cpp:77-82 [...] | Coverage: 0.01% |
---|
Function: _Z16initialise_chunkiR16global_variables.extracted.7 | Module: exec | Source: initialise_chunk.cpp:77-82 [...] | Coverage: 0.01% |
---|
/home/eoseret/qaas_runs_CPU_9468/171-145-9336/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/context.h: 46 - 69 |
-------------------------------------------------------------------------------- |
46: T &operator[](size_t i) const { return data[i]; } |
[...] |
69: T &operator()(size_t i, size_t j) const { return data[i + j * sizeX]; } |
/home/eoseret/qaas_runs_CPU_9468/171-145-9336/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/initialise_chunk.cpp: 77 - 82 |
-------------------------------------------------------------------------------- |
77: #pragma omp parallel for simd collapse(2) |
78: for (int j = (0); j < (yrange1); j++) { |
79: for (int i = (0); i < (xrange1); i++) { |
80: field.volume(i, j) = dx * dy; |
81: field.xarea(i, j) = field.celldy[j]; |
82: field.yarea(i, j) = field.celldx[i]; |
0x42d040 PUSH %RBP |
0x42d041 MOV %RSP,%RBP |
0x42d044 PUSH %R15 |
0x42d046 PUSH %R14 |
0x42d048 PUSH %R13 |
0x42d04a PUSH %R12 |
0x42d04c PUSH %RBX |
0x42d04d SUB $0x68,%RSP |
0x42d051 MOVL $0,-0x30(%RBP) |
0x42d058 MOV %R9,%RBX |
0x42d05b MOV %R8,%R15 |
0x42d05e MOV %RCX,%R12 |
0x42d061 MOV %RDX,%R13 |
0x42d064 MOV (%RDI),%ESI |
0x42d066 MOVQ $0,-0x38(%RBP) |
0x42d06e MOVQ $0x1,-0x88(%RBP) |
0x42d079 SUB $0x8,%RSP |
0x42d07d LEA -0x88(%RBP),%RAX |
0x42d084 LEA -0x30(%RBP),%RCX |
0x42d088 LEA -0x38(%RBP),%R8 |
0x42d08c LEA 0x18(%RBP),%R9 |
0x42d090 MOV $0x481260,%EDI |
0x42d095 MOV %ESI,-0x2c(%RBP) |
0x42d098 MOV $0x22,%EDX |
0x42d09d PUSH $0x1 |
0x42d09f PUSH $0x1 |
0x42d0a1 PUSH %RAX |
0x42d0a2 CALL 4031e0 <__kmpc_for_static_init_8@plt> |
0x42d0a7 ADD $0x20,%RSP |
0x42d0ab MOV -0x38(%RBP),%RSI |
0x42d0af MOV 0x18(%RBP),%R9 |
0x42d0b3 CMP %R9,%RSI |
0x42d0b6 JA 42d45b |
0x42d0bc MOV %RBX,%R8 |
0x42d0bf VMOVQ %R13,%XMM0 |
0x42d0c4 VMOVQ %R12,%XMM1 |
0x42d0c9 VMULSD %XMM0,%XMM1,%XMM16 |
0x42d0cf MOV 0x2a0(%R15),%R12 |
0x42d0d6 MOV 0x290(%R15),%R10 |
0x42d0dd MOV 0x228(%R15),%RBX |
0x42d0e4 MOV 0x248(%R15),%R13 |
0x42d0eb MOV 0x2b8(%R15),%RDI |
0x42d0f2 MOV 0x2a8(%R15),%R11 |
0x42d0f9 MOV 0x2d0(%R15),%R14 |
0x42d100 MOV 0x2c0(%R15),%R15 |
0x42d107 LEA 0x1(%RSI),%RAX |
0x42d10b INC %R9 |
0x42d10e CMP %R9,%RAX |
0x42d111 CMOVG %RAX,%R9 |
0x42d115 MOV %R9,%RCX |
0x42d118 SUB %RSI,%RCX |
0x42d11b MOV %RCX,%RAX |
0x42d11e AND $-0x10,%RAX |
0x42d122 JE 42d479 |
0x42d128 MOV %RCX,-0x40(%RBP) |
0x42d12c MOV %R9,-0x68(%RBP) |
0x42d130 MOV %RAX,-0x48(%RBP) |
0x42d134 DEC %RAX |
0x42d137 MOV %RAX,-0x80(%RBP) |
0x42d13b MOV %R8,-0x70(%RBP) |
0x42d13f VPBROADCASTQ %R8,%YMM8 |
0x42d145 MOV %R10,-0x60(%RBP) |
0x42d149 VPBROADCASTQ %R10,%YMM17 |
0x42d14f VBROADCASTSD %XMM16,%YMM18 |
0x42d155 MOV %R11,-0x58(%RBP) |
0x42d159 VPBROADCASTQ %R11,%YMM19 |
0x42d15f MOV %R15,-0x50(%RBP) |
0x42d163 VPBROADCASTQ %R15,%YMM20 |
0x42d169 XOR %R15D,%R15D |
0x42d16c VMOVDQU64 0x393aa(%RIP),%YMM21 |
0x42d176 VMOVDQU64 0x393c0(%RIP),%YMM22 |
0x42d180 VMOVDQU64 0x374f6(%RIP),%YMM23 |
0x42d18a VMOVDQU64 0x3736c(%RIP),%YMM24 |
0x42d194 MOV %RSI,-0x78(%RBP) |
0x42d198 NOPL (%RAX,%RAX,1) |
(245) 0x42d1a0 LEA (%RSI,%R15,1),%RAX |
(245) 0x42d1a4 VPBROADCASTQ %RAX,%YMM0 |
(245) 0x42d1aa VPADDQ %YMM21,%YMM0,%YMM9 |
(245) 0x42d1b0 VPADDQ %YMM22,%YMM0,%YMM10 |
(245) 0x42d1b6 VPADDQ %YMM23,%YMM0,%YMM11 |
(245) 0x42d1bc VPADDQ %YMM24,%YMM0,%YMM12 |
(245) 0x42d1c2 VMOVDQA %YMM12,%YMM0 |
(245) 0x42d1c6 VMOVDQA %YMM8,%YMM1 |
(245) 0x42d1ca MOV $0x452610,%RAX |
(245) 0x42d1d1 MOV %R14,%RSI |
(245) 0x42d1d4 MOV %RDI,%R14 |
(245) 0x42d1d7 MOV %R13,%RDI |
(245) 0x42d1da MOV %RBX,%R13 |
(245) 0x42d1dd MOV %R12,%RBX |
(245) 0x42d1e0 MOV %RAX,%R12 |
(245) 0x42d1e3 CALL %RAX |
(245) 0x42d1e5 VMOVDQA %YMM0,%YMM13 |
(245) 0x42d1e9 VMOVDQA %YMM11,%YMM0 |
(245) 0x42d1ed VMOVDQA %YMM8,%YMM1 |
(245) 0x42d1f1 CALL %R12 |
(245) 0x42d1f4 VMOVDQA %YMM0,%YMM14 |
(245) 0x42d1f8 VMOVDQA %YMM10,%YMM0 |
(245) 0x42d1fc VMOVDQA %YMM8,%YMM1 |
(245) 0x42d200 CALL %R12 |
(245) 0x42d203 VMOVDQA %YMM0,%YMM15 |
(245) 0x42d207 VMOVDQA %YMM9,%YMM0 |
(245) 0x42d20b VMOVDQA %YMM8,%YMM1 |
(245) 0x42d20f CALL %R12 |
(245) 0x42d212 MOV %RBX,%R12 |
(245) 0x42d215 MOV %R13,%RBX |
(245) 0x42d218 MOV %RDI,%R13 |
(245) 0x42d21b MOV %R14,%RDI |
(245) 0x42d21e MOV %RSI,%R14 |
(245) 0x42d221 MOV -0x78(%RBP),%RSI |
(245) 0x42d225 VXORPS %XMM1,%XMM1,%XMM1 |
(245) 0x42d229 VPMULLQ %YMM8,%YMM0,%YMM1 |
(245) 0x42d22f VXORPS %XMM2,%XMM2,%XMM2 |
(245) 0x42d233 VPMULLQ %YMM8,%YMM15,%YMM2 |
(245) 0x42d239 VXORPS %XMM3,%XMM3,%XMM3 |
(245) 0x42d23d VPMULLQ %YMM8,%YMM14,%YMM3 |
(245) 0x42d243 VPMULLQ %YMM8,%YMM13,%YMM4 |
(245) 0x42d249 VPSLLQ $0x20,%YMM14,%YMM5 |
(245) 0x42d24f VPSRAQ $0x20,%YMM5,%YMM5 |
(245) 0x42d256 VPSLLQ $0x20,%YMM13,%YMM6 |
(245) 0x42d25c VPSRAQ $0x20,%YMM6,%YMM6 |
(245) 0x42d263 VPMULLQ %YMM6,%YMM17,%YMM7 |
(245) 0x42d269 VXORPS %XMM13,%XMM13,%XMM13 |
(245) 0x42d26e VPMULLQ %YMM5,%YMM17,%YMM13 |
(245) 0x42d274 VPSLLQ $0x20,%YMM15,%YMM14 |
(245) 0x42d27a VPSRAQ $0x20,%YMM14,%YMM14 |
(245) 0x42d281 VXORPS %XMM15,%XMM15,%XMM15 |
(245) 0x42d286 VPMULLQ %YMM14,%YMM17,%YMM15 |
(245) 0x42d28c VPSUBQ %YMM4,%YMM12,%YMM4 |
(245) 0x42d290 VPSLLQ $0x20,%YMM0,%YMM0 |
(245) 0x42d295 VPSRAQ $0x20,%YMM0,%YMM0 |
(245) 0x42d29c VXORPS %XMM12,%XMM12,%XMM12 |
(245) 0x42d2a1 VPMULLQ %YMM0,%YMM17,%YMM12 |
(245) 0x42d2a7 VPSUBQ %YMM3,%YMM11,%YMM3 |
(245) 0x42d2ab VPSUBQ %YMM2,%YMM10,%YMM2 |
(245) 0x42d2af VPSUBQ %YMM1,%YMM9,%YMM1 |
(245) 0x42d2b3 VPADDQ %YMM1,%YMM12,%YMM9 |
(245) 0x42d2b7 VPADDQ %YMM2,%YMM15,%YMM10 |
(245) 0x42d2bb VPADDQ %YMM3,%YMM13,%YMM11 |
(245) 0x42d2bf VPADDQ %YMM7,%YMM4,%YMM7 |
(245) 0x42d2c3 KXNORW %K0,%K0,%K1 |
(245) 0x42d2c7 VSCATTERQPD %YMM18,(%R12,%YMM7,8){%K1} |
(245) 0x42d2ce KXNORW %K0,%K0,%K1 |
(245) 0x42d2d2 VSCATTERQPD %YMM18,(%R12,%YMM11,8){%K1} |
(245) 0x42d2d9 KXNORW %K0,%K0,%K1 |
(245) 0x42d2dd VSCATTERQPD %YMM18,(%R12,%YMM10,8){%K1} |
(245) 0x42d2e4 KXNORW %K0,%K0,%K1 |
(245) 0x42d2e8 VSCATTERQPD %YMM18,(%R12,%YMM9,8){%K1} |
(245) 0x42d2ef KXNORW %K0,%K0,%K1 |
(245) 0x42d2f3 VXORPD %XMM7,%XMM7,%XMM7 |
(245) 0x42d2f7 VGATHERQPD (%R13,%YMM0,8),%YMM7{%K1} |
(245) 0x42d2ff KXNORW %K0,%K0,%K1 |
(245) 0x42d303 VXORPD %XMM9,%XMM9,%XMM9 |
(245) 0x42d308 VGATHERQPD (%R13,%YMM14,8),%YMM9{%K1} |
(245) 0x42d310 KXNORW %K0,%K0,%K1 |
(245) 0x42d314 VXORPD %XMM10,%XMM10,%XMM10 |
(245) 0x42d319 VGATHERQPD (%R13,%YMM5,8),%YMM10{%K1} |
(245) 0x42d321 KXNORW %K0,%K0,%K1 |
(245) 0x42d325 VXORPD %XMM11,%XMM11,%XMM11 |
(245) 0x42d32a VGATHERQPD (%R13,%YMM6,8),%YMM11{%K1} |
(245) 0x42d332 VXORPS %XMM12,%XMM12,%XMM12 |
(245) 0x42d337 VPMULLQ %YMM6,%YMM19,%YMM12 |
(245) 0x42d33d VXORPS %XMM13,%XMM13,%XMM13 |
(245) 0x42d342 VPMULLQ %YMM5,%YMM19,%YMM13 |
(245) 0x42d348 VXORPS %XMM15,%XMM15,%XMM15 |
(245) 0x42d34d VPMULLQ %YMM14,%YMM19,%YMM15 |
(245) 0x42d353 VPMULLQ %YMM0,%YMM19,%YMM25 |
(245) 0x42d359 VPADDQ %YMM25,%YMM1,%YMM25 |
(245) 0x42d35f VPADDQ %YMM2,%YMM15,%YMM15 |
(245) 0x42d363 VPADDQ %YMM3,%YMM13,%YMM13 |
(245) 0x42d367 VPADDQ %YMM4,%YMM12,%YMM12 |
(245) 0x42d36b KXNORW %K0,%K0,%K1 |
(245) 0x42d36f VSCATTERQPD %YMM11,(%RDI,%YMM12,8){%K1} |
(245) 0x42d376 KXNORW %K0,%K0,%K1 |
(245) 0x42d37a VSCATTERQPD %YMM10,(%RDI,%YMM13,8){%K1} |
(245) 0x42d381 KXNORW %K0,%K0,%K1 |
(245) 0x42d385 VSCATTERQPD %YMM9,(%RDI,%YMM15,8){%K1} |
(245) 0x42d38c KXNORW %K0,%K0,%K1 |
(245) 0x42d390 VSCATTERQPD %YMM7,(%RDI,%YMM25,8){%K1} |
(245) 0x42d397 KXNORW %K0,%K0,%K1 |
(245) 0x42d39b VXORPD %XMM7,%XMM7,%XMM7 |
(245) 0x42d39f VGATHERQPD (%RBX,%YMM1,8),%YMM7{%K1} |
(245) 0x42d3a6 KXNORW %K0,%K0,%K1 |
(245) 0x42d3aa VXORPD %XMM9,%XMM9,%XMM9 |
(245) 0x42d3af VGATHERQPD (%RBX,%YMM2,8),%YMM9{%K1} |
(245) 0x42d3b6 KXNORW %K0,%K0,%K1 |
(245) 0x42d3ba VXORPD %XMM10,%XMM10,%XMM10 |
(245) 0x42d3bf VGATHERQPD (%RBX,%YMM3,8),%YMM10{%K1} |
(245) 0x42d3c6 KXNORW %K0,%K0,%K1 |
(245) 0x42d3ca VXORPD %XMM11,%XMM11,%XMM11 |
(245) 0x42d3cf VGATHERQPD (%RBX,%YMM4,8),%YMM11{%K1} |
(245) 0x42d3d6 VPMULLQ %YMM6,%YMM20,%YMM6 |
(245) 0x42d3dc VPMULLQ %YMM5,%YMM20,%YMM5 |
(245) 0x42d3e2 VXORPS %XMM12,%XMM12,%XMM12 |
(245) 0x42d3e7 VPMULLQ %YMM14,%YMM20,%YMM12 |
(245) 0x42d3ed VPMULLQ %YMM0,%YMM20,%YMM0 |
(245) 0x42d3f3 VPADDQ %YMM0,%YMM1,%YMM0 |
(245) 0x42d3f7 VPADDQ %YMM2,%YMM12,%YMM1 |
(245) 0x42d3fb VPADDQ %YMM5,%YMM3,%YMM2 |
(245) 0x42d3ff VPADDQ %YMM6,%YMM4,%YMM3 |
(245) 0x42d403 KXNORW %K0,%K0,%K1 |
(245) 0x42d407 VSCATTERQPD %YMM11,(%R14,%YMM3,8){%K1} |
(245) 0x42d40e KXNORW %K0,%K0,%K1 |
(245) 0x42d412 VSCATTERQPD %YMM10,(%R14,%YMM2,8){%K1} |
(245) 0x42d419 KXNORW %K0,%K0,%K1 |
(245) 0x42d41d VSCATTERQPD %YMM9,(%R14,%YMM1,8){%K1} |
(245) 0x42d424 KXNORW %K0,%K0,%K1 |
(245) 0x42d428 VSCATTERQPD %YMM7,(%R14,%YMM0,8){%K1} |
(245) 0x42d42f ADD $0x10,%R15 |
(245) 0x42d433 CMP -0x80(%RBP),%R15 |
(245) 0x42d437 JBE 42d1a0 |
0x42d43d MOV -0x48(%RBP),%RAX |
0x42d441 CMP %RAX,-0x40(%RBP) |
0x42d445 MOV -0x70(%RBP),%R8 |
0x42d449 MOV -0x68(%RBP),%R9 |
0x42d44d MOV -0x60(%RBP),%R10 |
0x42d451 MOV -0x58(%RBP),%R11 |
0x42d455 MOV -0x50(%RBP),%R15 |
0x42d459 JNE 42d47b |
0x42d45b MOV $0x481280,%EDI |
0x42d460 MOV -0x2c(%RBP),%ESI |
0x42d463 ADD $0x68,%RSP |
0x42d467 POP %RBX |
0x42d468 POP %R12 |
0x42d46a POP %R13 |
0x42d46c POP %R14 |
0x42d46e POP %R15 |
0x42d470 POP %RBP |
0x42d471 VZEROUPPER |
0x42d474 JMP 403050 |
0x42d479 XOR %EAX,%EAX |
0x42d47b ADD %RAX,%RSI |
0x42d47e JMP 42d4cb |
(244) 0x42d480 MOV %RSI,%RAX |
(244) 0x42d483 CQTO |
(244) 0x42d485 IDIV %R8 |
(244) 0x42d488 CLTQ |
(244) 0x42d48a MOV %R10,%RCX |
(244) 0x42d48d IMUL %RAX,%RCX |
(244) 0x42d491 ADD %RDX,%RCX |
(244) 0x42d494 VMOVSD %XMM16,(%R12,%RCX,8) |
(244) 0x42d49b MOV %R11,%RCX |
(244) 0x42d49e IMUL %RAX,%RCX |
(244) 0x42d4a2 ADD %RDX,%RCX |
(244) 0x42d4a5 VMOVSD (%R13,%RAX,8),%XMM0 |
(244) 0x42d4ac VMOVSD %XMM0,(%RDI,%RCX,8) |
(244) 0x42d4b1 IMUL %R15,%RAX |
(244) 0x42d4b5 ADD %RDX,%RAX |
(244) 0x42d4b8 VMOVSD (%RBX,%RDX,8),%XMM0 |
(244) 0x42d4bd VMOVSD %XMM0,(%R14,%RAX,8) |
(244) 0x42d4c3 INC %RSI |
(244) 0x42d4c6 CMP %RSI,%R9 |
(244) 0x42d4c9 JE 42d45b |
(244) 0x42d4cb MOV %RSI,%RAX |
(244) 0x42d4ce OR %R8,%RAX |
(244) 0x42d4d1 SHR $0x20,%RAX |
(244) 0x42d4d5 JNE 42d480 |
(244) 0x42d4d7 MOV %ESI,%EAX |
(244) 0x42d4d9 XOR %EDX,%EDX |
(244) 0x42d4db DIV %R8D |
(244) 0x42d4de JMP 42d488 |
Path / |
Source file and lines | initialise_chunk.cpp:77-82 |
Module | exec |
nb instructions | 97 |
nb uops | 98 |
loop length | 419 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 9 |
used zmm registers | 0 |
nb stack references | 14 |
micro-operation queue | 16.33 cycles |
front end | 16.33 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 3.30 | 3.30 | 9.67 | 9.67 | 11.50 | 7.00 | 3.20 | 11.50 | 11.50 | 11.50 | 3.20 | 9.67 |
cycles | 3.30 | 3.30 | 9.67 | 9.67 | 11.50 | 7.00 | 3.20 | 11.50 | 11.50 | 11.50 | 3.20 | 9.67 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 16.09-16.10 |
Stall cycles | 0.00 |
Front-end | 16.33 |
Dispatch | 11.50 |
Overall L1 | 16.33 |
all | 9% |
load | 25% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 5% |
all | 0% |
load | NA (no load vectorizable/vectorized instructions) |
store | NA (no store vectorizable/vectorized instructions) |
mul | 0% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 9% |
load | 25% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 5% |
all | 15% |
load | 21% |
store | 10% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 12% |
load | NA (no load vectorizable/vectorized instructions) |
store | NA (no store vectorizable/vectorized instructions) |
mul | 12% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 14% |
load | 21% |
store | 10% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x68,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOVL $0,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R8,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVQ $0x1,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x88(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x30(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x38(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x18(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x481260,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,-0x2c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x22,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
CALL 4031e0 <__kmpc_for_static_init_8@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x20,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x38(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R9,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JA 42d45b <_Z16initialise_chunkiR16global_variables.extracted.7+0x41b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RBX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VMOVQ %R13,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VMOVQ %R12,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VMULSD %XMM0,%XMM1,%XMM16 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x2a0(%R15),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x290(%R15),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x228(%R15),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x248(%R15),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x2b8(%R15),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x2a8(%R15),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x2d0(%R15),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x2c0(%R15),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%RSI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
INC %R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %R9,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %RAX,%R9 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R9,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RSI,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x10,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 42d479 <_Z16initialise_chunkiR16global_variables.extracted.7+0x439> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RCX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
DEC %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ %R8,%YMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R10,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ %R10,%YMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM16,%YMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R11,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ %R11,%YMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R15,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ %R15,%YMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
XOR %R15D,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDQU64 0x393aa(%RIP),%YMM21 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVDQU64 0x393c0(%RIP),%YMM22 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVDQU64 0x374f6(%RIP),%YMM23 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVDQU64 0x3736c(%RIP),%YMM24 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV %RSI,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RAX,-0x40(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV -0x70(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x68(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x60(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x58(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x50(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 42d47b <_Z16initialise_chunkiR16global_variables.extracted.7+0x43b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x481280,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x2c(%RBP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD $0x68,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JMP 403050 <__kmpc_for_static_fini@plt> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JMP 42d4cb <_Z16initialise_chunkiR16global_variables.extracted.7+0x48b> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
Source file and lines | initialise_chunk.cpp:77-82 |
Module | exec |
nb instructions | 97 |
nb uops | 98 |
loop length | 419 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 9 |
used zmm registers | 0 |
nb stack references | 14 |
micro-operation queue | 16.33 cycles |
front end | 16.33 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 3.30 | 3.30 | 9.67 | 9.67 | 11.50 | 7.00 | 3.20 | 11.50 | 11.50 | 11.50 | 3.20 | 9.67 |
cycles | 3.30 | 3.30 | 9.67 | 9.67 | 11.50 | 7.00 | 3.20 | 11.50 | 11.50 | 11.50 | 3.20 | 9.67 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 16.09-16.10 |
Stall cycles | 0.00 |
Front-end | 16.33 |
Dispatch | 11.50 |
Overall L1 | 16.33 |
all | 9% |
load | 25% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 5% |
all | 0% |
load | NA (no load vectorizable/vectorized instructions) |
store | NA (no store vectorizable/vectorized instructions) |
mul | 0% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 9% |
load | 25% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 5% |
all | 15% |
load | 21% |
store | 10% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 12% |
load | NA (no load vectorizable/vectorized instructions) |
store | NA (no store vectorizable/vectorized instructions) |
mul | 12% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 14% |
load | 21% |
store | 10% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x68,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOVL $0,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R8,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVQ $0x1,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x88(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x30(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x38(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x18(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x481260,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,-0x2c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x22,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
CALL 4031e0 <__kmpc_for_static_init_8@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x20,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x38(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R9,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JA 42d45b <_Z16initialise_chunkiR16global_variables.extracted.7+0x41b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RBX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VMOVQ %R13,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VMOVQ %R12,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VMULSD %XMM0,%XMM1,%XMM16 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x2a0(%R15),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x290(%R15),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x228(%R15),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x248(%R15),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x2b8(%R15),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x2a8(%R15),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x2d0(%R15),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x2c0(%R15),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%RSI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
INC %R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %R9,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %RAX,%R9 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R9,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RSI,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x10,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 42d479 <_Z16initialise_chunkiR16global_variables.extracted.7+0x439> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RCX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
DEC %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ %R8,%YMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R10,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ %R10,%YMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM16,%YMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R11,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ %R11,%YMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R15,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ %R15,%YMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
XOR %R15D,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDQU64 0x393aa(%RIP),%YMM21 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVDQU64 0x393c0(%RIP),%YMM22 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVDQU64 0x374f6(%RIP),%YMM23 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVDQU64 0x3736c(%RIP),%YMM24 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV %RSI,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RAX,-0x40(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV -0x70(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x68(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x60(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x58(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x50(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 42d47b <_Z16initialise_chunkiR16global_variables.extracted.7+0x43b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x481280,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x2c(%RBP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD $0x68,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JMP 403050 <__kmpc_for_static_fini@plt> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JMP 42d4cb <_Z16initialise_chunkiR16global_variables.extracted.7+0x48b> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼_Z16initialise_chunkiR16global_variables.extracted.7– | 0.01 | 0.01 |
○Loop 245 - initialise_chunk.cpp:77-82 - exec | 0.01 | 0.01 |
○Loop 244 - initialise_chunk.cpp:77-82 - exec | 0 | 0 |