Loop Id: 343 | Module: exec | Source: generate_chunk.cpp:85-123 [...] | Coverage: 0.01% |
---|
Loop Id: 343 | Module: exec | Source: generate_chunk.cpp:85-123 [...] | Coverage: 0.01% |
---|
0x4341f6 VPADDQ %ZMM24,%ZMM0,%ZMM0 |
0x4341fc VBROADCASTSD %XMM1,%ZMM1 |
0x434202 VSCATTERQPD %ZMM1,(,%ZMM0,1){%K1} |
0x43420d NOPL (%RAX) |
0x434210 VPADDQ %ZMM24,%ZMM19,%ZMM19 |
0x434216 ADD $0x8,%RSI |
0x43421a CMP %R12,%RSI |
0x43421d JAE 435543 |
0x434223 VPADDQ %ZMM19,%ZMM18,%ZMM16 |
0x434229 MOVSXD %R13D,%RAX |
0x43422c VPBROADCASTQ %RAX,%ZMM17 |
0x434232 VMOVDQA64 %ZMM16,%ZMM0 |
0x434238 VMOVDQA64 %ZMM17,%ZMM1 |
0x43423e LEA 0x2756b(%RIP),%RAX |
0x434245 CALL %RAX |
0x434247 VPXOR %XMM1,%XMM1,%XMM1 |
0x43424b VPMULLQ %ZMM17,%ZMM0,%ZMM1 |
0x434251 VPSUBQ %ZMM1,%ZMM16,%ZMM1 |
0x434257 MOV -0x98(%RBP),%RAX |
0x43425e VBROADCASTSD (%RAX,%R15,8),%ZMM3 |
0x434265 MOV -0x90(%RBP),%RAX |
0x43426c VBROADCASTSD (%RAX,%R15,8),%ZMM2 |
0x434273 CMP $0x2,%R14D |
0x434277 JGE 434540 |
0x43427d CMP $0x1,%R14D |
0x434281 JNE 434210 |
0x434283 MOV -0x58(%RBP),%RAX |
0x434287 MOV (%RAX),%RDX |
0x43428a MOV 0x258(%RDX),%RAX |
0x434291 VPMOVQD %ZMM1,%YMM4 |
0x434297 VPCMPEQD %YMM5,%YMM5,%YMM5 |
0x43429b VPSUBD %YMM5,%YMM4,%YMM4 |
0x43429f KXNORW %K0,%K0,%K1 |
0x4342a3 VPXOR %XMM5,%XMM5,%XMM5 |
0x4342a7 VGATHERDPD (%RAX,%YMM4,8),%ZMM5{%K1} |
0x4342ae VCMPPD $0x2,%ZMM5,%ZMM3,%K1 |
0x4342b5 KORTESTB %K1,%K1 |
0x4342b9 JE 434210 |
0x4342bf JE 4342c9 |
0x4342c1 MOV -0x80(%RBP),%RCX |
0x4342c5 MOV 0x8(%RCX),%RCX |
0x4342c9 KORTESTB %K1,%K1 |
0x4342cd JE 4342d5 |
0x4342cf VMOVSD (%RCX,%R15,8),%XMM3 |
0x4342d5 KMOVQ %K1,%K2 |
0x4342da VXORPD %XMM4,%XMM4,%XMM4 |
0x4342de VGATHERQPD (%RAX,%ZMM1,8),%ZMM4{%K2} |
0x4342e5 VBROADCASTSD %XMM3,%ZMM3 |
0x4342eb VCMPPD $0x1,%ZMM3,%ZMM4,%K1{%K1} |
0x4342f2 KORTESTB %K1,%K1 |
0x4342f6 JE 434210 |
0x4342fc KORTESTB %K1,%K1 |
0x434300 JE 43430a |
0x434302 VMOVQ 0x278(%RDX),%XMM3 |
0x43430a VPSLLQ $0x20,%ZMM0,%ZMM0 |
0x434311 VPADDQ %ZMM20,%ZMM0,%ZMM4 |
0x434317 VPSRAQ $0x20,%ZMM4,%ZMM6 |
0x43431e VMOVQ %XMM3,%RAX |
0x434323 KMOVQ %K1,%K2 |
0x434328 VPXOR %XMM4,%XMM4,%XMM4 |
0x43432c VGATHERQPD (%RAX,%ZMM6,8),%ZMM4{%K2} |
0x434333 VCMPPD $0x2,%ZMM4,%ZMM2,%K1{%K1} |
0x43433a KORTESTB %K1,%K1 |
0x43433e JE 434210 |
0x434344 JE 43434e |
0x434346 MOV -0x78(%RBP),%RAX |
0x43434a MOV 0x8(%RAX),%RAX |
0x43434e KORTESTB %K1,%K1 |
0x434352 JE 43435a |
0x434354 VMOVSD (%RAX,%R15,8),%XMM2 |
0x43435a VPBROADCASTQ %XMM3,%ZMM3 |
0x434360 VPSRAQ $0x1d,%ZMM0,%ZMM4 |
0x434367 VPADDQ %ZMM4,%ZMM3,%ZMM3 |
0x43436d KMOVQ %K1,%K2 |
0x434372 VPXOR %XMM4,%XMM4,%XMM4 |
0x434376 VGATHERQPD (,%ZMM3,1),%ZMM4{%K2} |
0x434381 VBROADCASTSD %XMM2,%ZMM2 |
0x434387 VCMPPD $0x1,%ZMM2,%ZMM4,%K1{%K1} |
0x43438e KORTESTB %K1,%K1 |
0x434392 JE 434210 |
0x434398 JE 4343a2 |
0x43439a MOV -0x40(%RBP),%RAX |
0x43439e MOV 0x8(%RAX),%RAX |
0x4343a2 KORTESTB %K1,%K1 |
0x4343a6 JE 4343ad |
0x4343a8 VMOVQ 0x40(%RDX),%XMM2 |
0x4343ad KORTESTB %K1,%K1 |
0x4343b1 JE 4343b8 |
0x4343b3 VMOVQ 0x30(%RDX),%XMM3 |
0x4343b8 KORTESTB %K1,%K1 |
0x4343bc JE 4343c4 |
0x4343be VMOVSD (%RAX,%R15,8),%XMM4 |
0x4343c4 VPSRAQ $0x20,%ZMM0,%ZMM0 |
0x4343cb VPBROADCASTQ %XMM3,%ZMM3 |
0x4343d1 VPMULLQ %ZMM0,%ZMM3,%ZMM3 |
0x4343d7 VPBROADCASTQ %XMM2,%ZMM2 |
0x4343dd VPADDQ %ZMM3,%ZMM1,%ZMM3 |
0x4343e3 VPSLLQ $0x3,%ZMM3,%ZMM3 |
0x4343ea VPADDQ %ZMM3,%ZMM2,%ZMM2 |
0x4343f0 VBROADCASTSD %XMM4,%ZMM3 |
0x4343f6 KMOVQ %K1,%K2 |
0x4343fb VSCATTERQPD %ZMM3,(,%ZMM2,1){%K2} |
0x434406 KORTESTB %K1,%K1 |
0x43440a JE 434414 |
0x43440c MOV -0x38(%RBP),%RAX |
0x434410 MOV 0x8(%RAX),%RAX |
0x434414 KORTESTB %K1,%K1 |
0x434418 JE 43441f |
0x43441a VMOVQ 0x10(%RDX),%XMM2 |
0x43441f KORTESTB %K1,%K1 |
0x434423 JE 434429 |
0x434425 VMOVQ (%RDX),%XMM3 |
0x434429 KORTESTB %K1,%K1 |
0x43442d JE 434435 |
0x43442f VMOVSD (%RAX,%R15,8),%XMM4 |
0x434435 VPBROADCASTQ %XMM3,%ZMM3 |
0x43443b VPMULLQ %ZMM0,%ZMM3,%ZMM3 |
0x434441 VPBROADCASTQ %XMM2,%ZMM2 |
0x434447 VPADDQ %ZMM3,%ZMM1,%ZMM3 |
0x43444d VPSLLQ $0x3,%ZMM3,%ZMM3 |
0x434454 VPADDQ %ZMM3,%ZMM2,%ZMM2 |
0x43445a VBROADCASTSD %XMM4,%ZMM3 |
0x434460 KMOVQ %K1,%K2 |
0x434465 VSCATTERQPD %ZMM3,(,%ZMM2,1){%K2} |
0x434470 KORTESTB %K1,%K1 |
0x434474 JE 43447e |
0x434476 MOV -0x48(%RBP),%RAX |
0x43447a MOV 0x8(%RAX),%RAX |
0x43447e KORTESTB %K1,%K1 |
0x434482 JE 43448c |
0x434484 VMOVQ 0xb8(%RDX),%XMM2 |
0x43448c KORTESTB %K1,%K1 |
0x434490 JE 434499 |
0x434492 MOV 0xa8(%RDX),%RDI |
0x434499 KORTESTB %K1,%K1 |
0x43449d JE 4344a7 |
0x43449f MOV -0x50(%RBP),%RCX |
0x4344a3 MOV 0x8(%RCX),%RCX |
0x4344a7 KORTESTB %K1,%K1 |
0x4344ab JE 4344b5 |
0x4344ad VMOVQ 0xe8(%RDX),%XMM3 |
0x4344b5 KORTESTB %K1,%K1 |
0x4344b9 JE 4344c2 |
0x4344bb MOV 0xd8(%RDX),%R8 |
0x4344c2 VPBROADCASTQ %XMM2,%ZMM4 |
0x4344c8 VPBROADCASTQ %RDI,%ZMM5 |
0x4344ce VPBROADCASTQ %XMM3,%ZMM2 |
0x4344d4 VPBROADCASTQ %R8,%ZMM3 |
0x4344da VPSUBQ %ZMM21,%ZMM6,%ZMM6 |
0x4344e0 VPSUBQ %ZMM21,%ZMM0,%ZMM7 |
0x4344e6 VPMAXSQ %ZMM7,%ZMM6,%ZMM6 |
0x4344ec VPSUBQ %ZMM0,%ZMM6,%ZMM6 |
0x4344f2 VPCMPNLEUQ 0x38b2b(%RIP){1to8},%ZMM6,%K0 |
0x4344fd KANDB %K0,%K1,%K2 |
0x434501 KORTESTB %K2,%K2 |
0x434505 JE 43545c |
0x43450b VPSRLQ $0x1,%ZMM6,%ZMM7 |
0x434512 VPADDQ %ZMM21,%ZMM7,%ZMM7 |
0x434518 VPMULLQ %ZMM0,%ZMM5,%ZMM8 |
0x43451e VPMULLQ %ZMM0,%ZMM3,%ZMM9 |
0x434524 VPADDQ %ZMM5,%ZMM1,%ZMM10 |
0x43452a VPADDQ %ZMM3,%ZMM1,%ZMM11 |
0x434530 XOR %EDX,%EDX |
0x434532 JMP 434bf4 |
0x434540 JE 434dbb |
0x434546 CMP $0x3,%R14D |
0x43454a JNE 434210 |
0x434550 MOV -0x58(%RBP),%RAX |
0x434554 MOV (%RAX),%RDI |
0x434557 MOV 0x258(%RDI),%RAX |
0x43455e KXNORW %K0,%K0,%K1 |
0x434562 VXORPD %XMM4,%XMM4,%XMM4 |
0x434566 VGATHERQPD (%RAX,%ZMM1,8),%ZMM4{%K1} |
0x43456d VCMPPD $0,%ZMM3,%ZMM4,%K1 |
0x434574 KORTESTB %K1,%K1 |
0x434578 JE 434210 |
0x43457e JE 434588 |
0x434580 VMOVQ 0x278(%RDI),%XMM3 |
0x434588 VMOVQ %XMM3,%RAX |
0x43458d VPSLLQ $0x20,%ZMM0,%ZMM3 |
0x434594 VPSRAQ $0x1d,%ZMM3,%ZMM0 |
0x43459b KMOVQ %K1,%K2 |
0x4345a0 VXORPD %XMM4,%XMM4,%XMM4 |
0x4345a4 VGATHERQPD (%RAX,%ZMM0,1),%ZMM4{%K2} |
0x4345ab VCMPPD $0,%ZMM2,%ZMM4,%K0 |
0x4345b2 KANDB %K0,%K1,%K1 |
0x4345b6 KORTESTB %K1,%K1 |
0x4345ba JE 434210 |
0x4345c0 JE 4345ca |
0x4345c2 MOV -0x40(%RBP),%RAX |
0x4345c6 MOV 0x8(%RAX),%RAX |
0x4345ca KORTESTB %K1,%K1 |
0x4345ce JE 4345d5 |
0x4345d0 VMOVQ 0x40(%RDI),%XMM0 |
0x4345d5 KORTESTB %K1,%K1 |
0x4345d9 JE 4345e0 |
0x4345db VMOVQ 0x30(%RDI),%XMM2 |
0x4345e0 KORTESTB %K1,%K1 |
0x4345e4 JE 4345ec |
0x4345e6 VMOVSD (%RAX,%R15,8),%XMM4 |
0x4345ec VPSRAQ $0x20,%ZMM3,%ZMM7 |
0x4345f3 VPBROADCASTQ %XMM2,%ZMM2 |
0x4345f9 VPMULLQ %ZMM7,%ZMM2,%ZMM2 |
0x4345ff VPBROADCASTQ %XMM0,%ZMM0 |
0x434605 VPADDQ %ZMM2,%ZMM1,%ZMM2 |
0x43460b VPSLLQ $0x3,%ZMM2,%ZMM2 |
0x434612 VPADDQ %ZMM2,%ZMM0,%ZMM0 |
0x434618 VBROADCASTSD %XMM4,%ZMM2 |
0x43461e KMOVQ %K1,%K2 |
0x434623 VSCATTERQPD %ZMM2,(,%ZMM0,1){%K2} |
0x43462e KORTESTB %K1,%K1 |
0x434632 JE 43463c |
0x434634 MOV -0x38(%RBP),%RAX |
0x434638 MOV 0x8(%RAX),%RAX |
0x43463c KORTESTB %K1,%K1 |
0x434640 JE 434647 |
0x434642 VMOVQ 0x10(%RDI),%XMM0 |
0x434647 KORTESTB %K1,%K1 |
0x43464b JE 434651 |
0x43464d VMOVQ (%RDI),%XMM2 |
0x434651 KORTESTB %K1,%K1 |
0x434655 JE 43465d |
0x434657 VMOVSD (%RAX,%R15,8),%XMM4 |
0x43465d VPBROADCASTQ %XMM2,%ZMM2 |
0x434663 VPMULLQ %ZMM7,%ZMM2,%ZMM2 |
0x434669 VPBROADCASTQ %XMM0,%ZMM0 |
0x43466f VPADDQ %ZMM2,%ZMM1,%ZMM2 |
0x434675 VPSLLQ $0x3,%ZMM2,%ZMM2 |
0x43467c VPADDQ %ZMM2,%ZMM0,%ZMM0 |
0x434682 VBROADCASTSD %XMM4,%ZMM2 |
0x434688 KMOVQ %K1,%K2 |
0x43468d VSCATTERQPD %ZMM2,(,%ZMM0,1){%K2} |
0x434698 KORTESTB %K1,%K1 |
0x43469c JE 4346a6 |
0x43469e MOV -0x48(%RBP),%RAX |
0x4346a2 MOV 0x8(%RAX),%RAX |
0x4346a6 KORTESTB %K1,%K1 |
0x4346aa JE 4346b4 |
0x4346ac VMOVQ 0xb8(%RDI),%XMM0 |
0x4346b4 KORTESTB %K1,%K1 |
0x4346b8 JE 4346c1 |
0x4346ba MOV 0xa8(%RDI),%RCX |
0x4346c1 KORTESTB %K1,%K1 |
0x4346c5 JE 4346cf |
0x4346c7 MOV -0x50(%RBP),%RDX |
0x4346cb MOV 0x8(%RDX),%RDX |
0x4346cf KORTESTB %K1,%K1 |
0x4346d3 JE 4346dd |
0x4346d5 VMOVQ 0xe8(%RDI),%XMM2 |
0x4346dd KORTESTB %K1,%K1 |
0x4346e1 JE 4346ea |
0x4346e3 MOV 0xd8(%RDI),%R8 |
0x4346ea VPBROADCASTQ %XMM0,%ZMM0 |
0x4346f0 VPBROADCASTQ %RCX,%ZMM6 |
0x4346f6 VPBROADCASTQ %XMM2,%ZMM2 |
0x4346fc VPBROADCASTQ %R8,%ZMM8 |
0x434702 VPADDQ %ZMM20,%ZMM3,%ZMM3 |
0x434708 VPSRAQ $0x20,%ZMM3,%ZMM3 |
0x43470f VPSUBQ %ZMM21,%ZMM3,%ZMM3 |
0x434715 VPSUBQ %ZMM21,%ZMM7,%ZMM4 |
0x43471b VPMAXSQ %ZMM4,%ZMM3,%ZMM3 |
0x434721 VMOVDQA64 %ZMM7,%ZMM4 |
0x434727 VPTERNLOGQ $0xf,%ZMM7,%ZMM7,%ZMM4 |
0x43472e VPADDQ %ZMM4,%ZMM3,%ZMM3 |
0x434734 VPMOVQD %ZMM1,%YMM4 |
0x43473a VPCMPEQD %YMM5,%YMM5,%YMM5 |
0x43473e VPSUBD %YMM5,%YMM4,%YMM5 |
0x434742 VPMAXSD %YMM4,%YMM5,%YMM5 |
0x434747 VPSUBD %YMM4,%YMM5,%YMM5 |
0x43474b VPMOVZXDQ %YMM5,%ZMM4 |
0x434751 VPSUBQ %ZMM21,%ZMM4,%ZMM9 |
0x434757 VPCMPNLEUD %YMM25,%YMM5,%K2 |
0x43475e KMOVW %K2,-0x2a(%RBP) |
0x434763 VPANDQ %ZMM26,%ZMM9,%ZMM5 |
0x434769 VPCMPLEUQ %ZMM4,%ZMM5,%K3 |
0x434770 VPMULLQ %ZMM7,%ZMM6,%ZMM6 |
0x434776 VPMULLQ %ZMM7,%ZMM8,%ZMM7 |
0x43477c VPSRLQ $0x3,%ZMM9,%ZMM8 |
0x434783 VPADDQ %ZMM21,%ZMM8,%ZMM8 |
0x434789 XOR %R9D,%R9D |
0x43478c JMP 4347ad |
(347) 0x434790 VPBROADCASTQ %R9,%ZMM9 |
(347) 0x434796 INC %R9 |
(347) 0x434799 VPCMPEQQ %ZMM3,%ZMM9,%K4 |
(347) 0x43479f KANDNB %K0,%K4,%K0 |
(347) 0x4347a3 KTESTB %K1,%K0 |
(347) 0x4347a7 JE 434210 |
(347) 0x4347ad KANDB %K0,%K1,%K4 |
(347) 0x4347b1 KORTESTB %K4,%K4 |
(347) 0x4347b5 JE 434bd0 |
(347) 0x4347bb KMOVW -0x2a(%RBP),%K2 |
(347) 0x4347c0 KANDB %K2,%K4,%K5 |
(347) 0x4347c4 KORTESTB %K5,%K5 |
(347) 0x4347c8 JE 434ae0 |
(347) 0x4347ce MOV %RCX,%R10 |
(347) 0x4347d1 IMUL %R9,%R10 |
(347) 0x4347d5 MOV %R8,%R11 |
(347) 0x4347d8 IMUL %R9,%R11 |
(347) 0x4347dc XOR %EDI,%EDI |
(347) 0x4347de KMOVW -0x2a(%RBP),%K6 |
(347) 0x4347e3 JMP 434804 |
(349) 0x4347f0 KXORW %K0,%K0,%K7 |
(349) 0x4347f4 XOR %EDI,%EDI |
(349) 0x4347f6 KANDNB %K6,%K7,%K6 |
(349) 0x4347fa KTESTB %K5,%K6 |
(349) 0x4347fe JE 434ae0 |
(349) 0x434804 KANDB %K6,%K5,%K2 |
(349) 0x434808 KORTESTB %K2,%K2 |
(349) 0x43480c JE 4347f0 |
(349) 0x43480e KORTESTB %K2,%K2 |
(349) 0x434812 JE 43481a |
(349) 0x434814 VMOVSD (%RAX,%R15,8),%XMM10 |
(349) 0x43481a LEA (%R10,%RDI,8),%RBX |
(349) 0x43481e VPBROADCASTQ %RBX,%ZMM9 |
(349) 0x434824 VPADDQ %ZMM9,%ZMM1,%ZMM9 |
(349) 0x43482a VPADDQ %ZMM6,%ZMM9,%ZMM9 |
(349) 0x434830 VPSLLQ $0x3,%ZMM9,%ZMM9 |
(349) 0x434837 VPADDQ %ZMM9,%ZMM0,%ZMM9 |
(349) 0x43483d VBROADCASTSD %XMM10,%ZMM10 |
(349) 0x434843 KMOVQ %K2,%K7 |
(349) 0x434848 VSCATTERQPD %ZMM10,(,%ZMM9,1){%K7} |
(349) 0x434853 KORTESTB %K2,%K2 |
(349) 0x434857 JE 43485f |
(349) 0x434859 VMOVSD (%RDX,%R15,8),%XMM11 |
(349) 0x43485f LEA (,%RDI,8),%RBX |
(349) 0x434867 ADD %R11,%RBX |
(349) 0x43486a VPBROADCASTQ %RBX,%ZMM10 |
(349) 0x434870 VPADDQ %ZMM10,%ZMM1,%ZMM10 |
(349) 0x434876 VPADDQ %ZMM7,%ZMM10,%ZMM10 |
(349) 0x43487c VPSLLQ $0x3,%ZMM10,%ZMM10 |
(349) 0x434883 VPADDQ %ZMM10,%ZMM2,%ZMM10 |
(349) 0x434889 VBROADCASTSD %XMM11,%ZMM11 |
(349) 0x43488f KMOVQ %K2,%K7 |
(349) 0x434894 VSCATTERQPD %ZMM11,(,%ZMM10,1){%K7} |
(349) 0x43489f KORTESTB %K2,%K2 |
(349) 0x4348a3 JE 4348ab |
(349) 0x4348a5 VMOVSD (%RAX,%R15,8),%XMM11 |
(349) 0x4348ab VPADDQ %ZMM24,%ZMM9,%ZMM12 |
(349) 0x4348b1 VBROADCASTSD %XMM11,%ZMM11 |
(349) 0x4348b7 KMOVQ %K2,%K7 |
(349) 0x4348bc VSCATTERQPD %ZMM11,(,%ZMM12,1){%K7} |
(349) 0x4348c7 KORTESTB %K2,%K2 |
(349) 0x4348cb JE 4348d3 |
(349) 0x4348cd VMOVSD (%RDX,%R15,8),%XMM11 |
(349) 0x4348d3 VPADDQ %ZMM24,%ZMM10,%ZMM12 |
(349) 0x4348d9 VBROADCASTSD %XMM11,%ZMM11 |
(349) 0x4348df KMOVQ %K2,%K7 |
(349) 0x4348e4 VSCATTERQPD %ZMM11,(,%ZMM12,1){%K7} |
(349) 0x4348ef KORTESTB %K2,%K2 |
(349) 0x4348f3 JE 4348fb |
(349) 0x4348f5 VMOVSD (%RAX,%R15,8),%XMM11 |
(349) 0x4348fb VPADDQ %ZMM27,%ZMM9,%ZMM12 |
(349) 0x434901 VBROADCASTSD %XMM11,%ZMM11 |
(349) 0x434907 KMOVQ %K2,%K7 |
(349) 0x43490c VSCATTERQPD %ZMM11,(,%ZMM12,1){%K7} |
(349) 0x434917 KORTESTB %K2,%K2 |
(349) 0x43491b JE 434923 |
(349) 0x43491d VMOVSD (%RDX,%R15,8),%XMM11 |
(349) 0x434923 VPADDQ %ZMM27,%ZMM10,%ZMM12 |
(349) 0x434929 VBROADCASTSD %XMM11,%ZMM11 |
(349) 0x43492f KMOVQ %K2,%K7 |
(349) 0x434934 VSCATTERQPD %ZMM11,(,%ZMM12,1){%K7} |
(349) 0x43493f KORTESTB %K2,%K2 |
(349) 0x434943 JE 43494b |
(349) 0x434945 VMOVSD (%RAX,%R15,8),%XMM11 |
(349) 0x43494b VPADDQ %ZMM28,%ZMM9,%ZMM12 |
(349) 0x434951 VBROADCASTSD %XMM11,%ZMM11 |
(349) 0x434957 KMOVQ %K2,%K7 |
(349) 0x43495c VSCATTERQPD %ZMM11,(,%ZMM12,1){%K7} |
(349) 0x434967 KORTESTB %K2,%K2 |
(349) 0x43496b JE 434973 |
(349) 0x43496d VMOVSD (%RDX,%R15,8),%XMM11 |
(349) 0x434973 VPADDQ %ZMM28,%ZMM10,%ZMM12 |
(349) 0x434979 VBROADCASTSD %XMM11,%ZMM11 |
(349) 0x43497f KMOVQ %K2,%K7 |
(349) 0x434984 VSCATTERQPD %ZMM11,(,%ZMM12,1){%K7} |
(349) 0x43498f KORTESTB %K2,%K2 |
(349) 0x434993 JE 43499b |
(349) 0x434995 VMOVSD (%RAX,%R15,8),%XMM11 |
(349) 0x43499b VPADDQ %ZMM29,%ZMM9,%ZMM12 |
(349) 0x4349a1 VBROADCASTSD %XMM11,%ZMM11 |
(349) 0x4349a7 KMOVQ %K2,%K7 |
(349) 0x4349ac VSCATTERQPD %ZMM11,(,%ZMM12,1){%K7} |
(349) 0x4349b7 KORTESTB %K2,%K2 |
(349) 0x4349bb JE 4349c3 |
(349) 0x4349bd VMOVSD (%RDX,%R15,8),%XMM11 |
(349) 0x4349c3 VPADDQ %ZMM29,%ZMM10,%ZMM12 |
(349) 0x4349c9 VBROADCASTSD %XMM11,%ZMM11 |
(349) 0x4349cf KMOVQ %K2,%K7 |
(349) 0x4349d4 VSCATTERQPD %ZMM11,(,%ZMM12,1){%K7} |
(349) 0x4349df KORTESTB %K2,%K2 |
(349) 0x4349e3 JE 4349eb |
(349) 0x4349e5 VMOVSD (%RAX,%R15,8),%XMM11 |
(349) 0x4349eb VPADDQ %ZMM30,%ZMM9,%ZMM12 |
(349) 0x4349f1 VBROADCASTSD %XMM11,%ZMM11 |
(349) 0x4349f7 KMOVQ %K2,%K7 |
(349) 0x4349fc VSCATTERQPD %ZMM11,(,%ZMM12,1){%K7} |
(349) 0x434a07 KORTESTB %K2,%K2 |
(349) 0x434a0b JE 434a13 |
(349) 0x434a0d VMOVSD (%RDX,%R15,8),%XMM11 |
(349) 0x434a13 VPADDQ %ZMM30,%ZMM10,%ZMM12 |
(349) 0x434a19 VBROADCASTSD %XMM11,%ZMM11 |
(349) 0x434a1f KMOVQ %K2,%K7 |
(349) 0x434a24 VSCATTERQPD %ZMM11,(,%ZMM12,1){%K7} |
(349) 0x434a2f KORTESTB %K2,%K2 |
(349) 0x434a33 JE 434a3b |
(349) 0x434a35 VMOVSD (%RAX,%R15,8),%XMM11 |
(349) 0x434a3b VPADDQ %ZMM31,%ZMM9,%ZMM12 |
(349) 0x434a41 VBROADCASTSD %XMM11,%ZMM11 |
(349) 0x434a47 KMOVQ %K2,%K7 |
(349) 0x434a4c VSCATTERQPD %ZMM11,(,%ZMM12,1){%K7} |
(349) 0x434a57 KORTESTB %K2,%K2 |
(349) 0x434a5b JE 434a63 |
(349) 0x434a5d VMOVSD (%RDX,%R15,8),%XMM11 |
(349) 0x434a63 VPADDQ %ZMM31,%ZMM10,%ZMM12 |
(349) 0x434a69 VBROADCASTSD %XMM11,%ZMM11 |
(349) 0x434a6f KMOVQ %K2,%K7 |
(349) 0x434a74 VSCATTERQPD %ZMM11,(,%ZMM12,1){%K7} |
(349) 0x434a7f KORTESTB %K2,%K2 |
(349) 0x434a83 JE 434a8b |
(349) 0x434a85 VMOVSD (%RAX,%R15,8),%XMM11 |
(349) 0x434a8b VPADDQ %ZMM22,%ZMM9,%ZMM9 |
(349) 0x434a91 VBROADCASTSD %XMM11,%ZMM11 |
(349) 0x434a97 KMOVQ %K2,%K7 |
(349) 0x434a9c VSCATTERQPD %ZMM11,(,%ZMM9,1){%K7} |
(349) 0x434aa7 KORTESTB %K2,%K2 |
(349) 0x434aab JE 434ab3 |
(349) 0x434aad VMOVSD (%RDX,%R15,8),%XMM9 |
(349) 0x434ab3 VPADDQ %ZMM22,%ZMM10,%ZMM10 |
(349) 0x434ab9 VBROADCASTSD %XMM9,%ZMM9 |
(349) 0x434abf VSCATTERQPD %ZMM9,(,%ZMM10,1){%K2} |
(349) 0x434aca VPBROADCASTQ %RDI,%ZMM9 |
(349) 0x434ad0 INC %RDI |
(349) 0x434ad3 VPCMPEQQ %ZMM8,%ZMM9,%K7 |
(349) 0x434ad9 JMP 4347f6 |
(347) 0x434ae0 KANDB %K3,%K4,%K4 |
(347) 0x434ae4 KORTESTB %K4,%K4 |
(347) 0x434ae8 JE 434790 |
(347) 0x434aee MOV %RCX,%RDI |
(347) 0x434af1 IMUL %R9,%RDI |
(347) 0x434af5 VPBROADCASTQ %RDI,%ZMM9 |
(347) 0x434afb MOV %R8,%RDI |
(347) 0x434afe IMUL %R9,%RDI |
(347) 0x434b02 VPBROADCASTQ %RDI,%ZMM10 |
(347) 0x434b08 VMOVDQA64 %ZMM5,%ZMM11 |
(347) 0x434b0e KMOVQ %K3,%K5 |
(347) 0x434b13 JMP 434b37 |
(348) 0x434b20 KXORW %K0,%K0,%K6 |
(348) 0x434b24 VPXOR %XMM11,%XMM11,%XMM11 |
(348) 0x434b29 KANDNB %K5,%K6,%K5 |
(348) 0x434b2d KTESTB %K4,%K5 |
(348) 0x434b31 JE 434790 |
(348) 0x434b37 KANDB %K5,%K4,%K6 |
(348) 0x434b3b KORTESTB %K6,%K6 |
(348) 0x434b3f JE 434b20 |
(348) 0x434b41 KORTESTB %K6,%K6 |
(348) 0x434b45 JE 434b4d |
(348) 0x434b47 VMOVSD (%RAX,%R15,8),%XMM12 |
(348) 0x434b4d VPADDQ %ZMM11,%ZMM9,%ZMM13 |
(348) 0x434b53 VPADDQ %ZMM13,%ZMM1,%ZMM13 |
(348) 0x434b59 VPADDQ %ZMM6,%ZMM13,%ZMM13 |
(348) 0x434b5f VPSLLQ $0x3,%ZMM13,%ZMM13 |
(348) 0x434b66 VPADDQ %ZMM13,%ZMM0,%ZMM13 |
(348) 0x434b6c VBROADCASTSD %XMM12,%ZMM12 |
(348) 0x434b72 KMOVQ %K6,%K2 |
(348) 0x434b77 VSCATTERQPD %ZMM12,(,%ZMM13,1){%K2} |
(348) 0x434b82 KORTESTB %K6,%K6 |
(348) 0x434b86 JE 434b8e |
(348) 0x434b88 VMOVSD (%RDX,%R15,8),%XMM12 |
(348) 0x434b8e VPADDQ %ZMM11,%ZMM10,%ZMM13 |
(348) 0x434b94 VPADDQ %ZMM13,%ZMM1,%ZMM13 |
(348) 0x434b9a VPADDQ %ZMM7,%ZMM13,%ZMM13 |
(348) 0x434ba0 VPSLLQ $0x3,%ZMM13,%ZMM13 |
(348) 0x434ba7 VPADDQ %ZMM13,%ZMM2,%ZMM13 |
(348) 0x434bad VBROADCASTSD %XMM12,%ZMM12 |
(348) 0x434bb3 VSCATTERQPD %ZMM12,(,%ZMM13,1){%K6} |
(348) 0x434bbe VPCMPEQQ %ZMM4,%ZMM11,%K6 |
(348) 0x434bc4 VPSUBQ %ZMM21,%ZMM11,%ZMM11 |
(348) 0x434bca JMP 434b29 |
(347) 0x434bd0 KXORW %K0,%K0,%K4 |
(347) 0x434bd4 XOR %R9D,%R9D |
(347) 0x434bd7 JMP 43479f |
(350) 0x434be0 KXORW %K0,%K0,%K3 |
(350) 0x434be4 XOR %EDX,%EDX |
(350) 0x434be6 KANDNB %K0,%K3,%K0 |
(350) 0x434bea KTESTB %K2,%K0 |
(350) 0x434bee JE 43545c |
(350) 0x434bf4 KANDB %K0,%K2,%K3 |
(350) 0x434bf8 KORTESTB %K3,%K3 |
(350) 0x434bfc JE 434be0 |
(350) 0x434bfe KORTESTB %K3,%K3 |
(350) 0x434c02 JE 434c0a |
(350) 0x434c04 VMOVSD (%RAX,%R15,8),%XMM13 |
(350) 0x434c0a MOV %RDI,%R9 |
(350) 0x434c0d IMUL %RDX,%R9 |
(350) 0x434c11 ADD %R9,%R9 |
(350) 0x434c14 VPBROADCASTQ %R9,%ZMM12 |
(350) 0x434c1a VPADDQ %ZMM12,%ZMM1,%ZMM14 |
(350) 0x434c20 VPADDQ %ZMM8,%ZMM14,%ZMM14 |
(350) 0x434c26 VPSLLQ $0x3,%ZMM14,%ZMM14 |
(350) 0x434c2d VPADDQ %ZMM14,%ZMM4,%ZMM14 |
(350) 0x434c33 VBROADCASTSD %XMM13,%ZMM13 |
(350) 0x434c39 KMOVQ %K3,%K4 |
(350) 0x434c3e VSCATTERQPD %ZMM13,(,%ZMM14,1){%K4} |
(350) 0x434c49 KORTESTB %K3,%K3 |
(350) 0x434c4d JE 434c56 |
(350) 0x434c4f VMOVSD (%RCX,%R15,8),%XMM16 |
(350) 0x434c56 MOV %R8,%R9 |
(350) 0x434c59 IMUL %RDX,%R9 |
(350) 0x434c5d ADD %R9,%R9 |
(350) 0x434c60 VPBROADCASTQ %R9,%ZMM13 |
(350) 0x434c66 VPADDQ %ZMM13,%ZMM1,%ZMM15 |
(350) 0x434c6c VPADDQ %ZMM9,%ZMM15,%ZMM15 |
(350) 0x434c72 VPSLLQ $0x3,%ZMM15,%ZMM15 |
(350) 0x434c79 VPADDQ %ZMM15,%ZMM2,%ZMM15 |
(350) 0x434c7f VBROADCASTSD %XMM16,%ZMM16 |
(350) 0x434c85 KMOVQ %K3,%K4 |
(350) 0x434c8a VSCATTERQPD %ZMM16,(,%ZMM15,1){%K4} |
(350) 0x434c95 KORTESTB %K3,%K3 |
(350) 0x434c99 JE 434ca2 |
(350) 0x434c9b VMOVSD (%RAX,%R15,8),%XMM16 |
(350) 0x434ca2 VPADDQ %ZMM24,%ZMM14,%ZMM14 |
(350) 0x434ca8 VBROADCASTSD %XMM16,%ZMM16 |
(350) 0x434cae KMOVQ %K3,%K4 |
(350) 0x434cb3 VSCATTERQPD %ZMM16,(,%ZMM14,1){%K4} |
(350) 0x434cbe KORTESTB %K3,%K3 |
(350) 0x434cc2 JE 434cca |
(350) 0x434cc4 VMOVSD (%RCX,%R15,8),%XMM14 |
(350) 0x434cca VPADDQ %ZMM24,%ZMM15,%ZMM15 |
(350) 0x434cd0 VBROADCASTSD %XMM14,%ZMM14 |
(350) 0x434cd6 KMOVQ %K3,%K4 |
(350) 0x434cdb VSCATTERQPD %ZMM14,(,%ZMM15,1){%K4} |
(350) 0x434ce6 KORTESTB %K3,%K3 |
(350) 0x434cea JE 434cf2 |
(350) 0x434cec VMOVSD (%RAX,%R15,8),%XMM14 |
(350) 0x434cf2 VPADDQ %ZMM12,%ZMM10,%ZMM12 |
(350) 0x434cf8 VPADDQ %ZMM8,%ZMM12,%ZMM12 |
(350) 0x434cfe VPSLLQ $0x3,%ZMM12,%ZMM12 |
(350) 0x434d05 VPADDQ %ZMM12,%ZMM4,%ZMM12 |
(350) 0x434d0b VBROADCASTSD %XMM14,%ZMM14 |
(350) 0x434d11 KMOVQ %K3,%K4 |
(350) 0x434d16 VSCATTERQPD %ZMM14,(,%ZMM12,1){%K4} |
(350) 0x434d21 KORTESTB %K3,%K3 |
(350) 0x434d25 JE 434d2d |
(350) 0x434d27 VMOVSD (%RCX,%R15,8),%XMM14 |
(350) 0x434d2d VPADDQ %ZMM13,%ZMM11,%ZMM13 |
(350) 0x434d33 VPADDQ %ZMM9,%ZMM13,%ZMM13 |
(350) 0x434d39 VPSLLQ $0x3,%ZMM13,%ZMM13 |
(350) 0x434d40 VPADDQ %ZMM13,%ZMM2,%ZMM13 |
(350) 0x434d46 VBROADCASTSD %XMM14,%ZMM14 |
(350) 0x434d4c KMOVQ %K3,%K4 |
(350) 0x434d51 VSCATTERQPD %ZMM14,(,%ZMM13,1){%K4} |
(350) 0x434d5c KORTESTB %K3,%K3 |
(350) 0x434d60 JE 434d68 |
(350) 0x434d62 VMOVSD (%RAX,%R15,8),%XMM14 |
(350) 0x434d68 VPADDQ %ZMM24,%ZMM12,%ZMM12 |
(350) 0x434d6e VBROADCASTSD %XMM14,%ZMM14 |
(350) 0x434d74 KMOVQ %K3,%K4 |
(350) 0x434d79 VSCATTERQPD %ZMM14,(,%ZMM12,1){%K4} |
(350) 0x434d84 KORTESTB %K3,%K3 |
(350) 0x434d88 JE 434d90 |
(350) 0x434d8a VMOVSD (%RCX,%R15,8),%XMM12 |
(350) 0x434d90 VPADDQ %ZMM24,%ZMM13,%ZMM13 |
(350) 0x434d96 VBROADCASTSD %XMM12,%ZMM12 |
(350) 0x434d9c VSCATTERQPD %ZMM12,(,%ZMM13,1){%K3} |
(350) 0x434da7 VPBROADCASTQ %RDX,%ZMM12 |
(350) 0x434dad INC %RDX |
(350) 0x434db0 VPCMPEQQ %ZMM7,%ZMM12,%K3 |
(350) 0x434db6 JMP 434be6 |
0x434dbb MOV -0x58(%RBP),%RAX |
0x434dbf MOV (%RAX),%RDI |
0x434dc2 MOV 0x218(%RDI),%RAX |
0x434dc9 KXNORW %K0,%K0,%K1 |
0x434dcd VXORPD %XMM4,%XMM4,%XMM4 |
0x434dd1 VGATHERQPD (%RAX,%ZMM1,8),%ZMM4{%K1} |
0x434dd8 MOV 0x238(%RDI),%RAX |
0x434ddf VSUBPD %ZMM3,%ZMM4,%ZMM3 |
0x434de5 VPSLLQ $0x20,%ZMM0,%ZMM5 |
0x434dec VPSRAQ $0x20,%ZMM5,%ZMM9 |
0x434df3 KXNORW %K0,%K0,%K1 |
0x434df7 VPXOR %XMM0,%XMM0,%XMM0 |
0x434dfb VGATHERQPD (%RAX,%ZMM9,8),%ZMM0{%K1} |
0x434e02 VMULPD %ZMM3,%ZMM3,%ZMM3 |
0x434e08 VSUBPD %ZMM2,%ZMM0,%ZMM0 |
0x434e0e VFMADD213PD %ZMM3,%ZMM0,%ZMM0 |
0x434e14 VSQRTPD %ZMM0,%ZMM0 |
0x434e1a MOV -0x88(%RBP),%RAX |
0x434e21 MOV 0x8(%RAX),%RAX |
0x434e25 VBROADCASTSD (%RAX,%R15,8),%ZMM2 |
0x434e2c VCMPPD $0x2,%ZMM2,%ZMM0,%K1 |
0x434e33 KORTESTB %K1,%K1 |
0x434e37 JE 434210 |
0x434e3d VCMPPD $0x2,%ZMM2,%ZMM0,%K2 |
0x434e44 KORTESTB %K2,%K2 |
0x434e48 JE 434e52 |
0x434e4a MOV -0x40(%RBP),%RAX |
0x434e4e MOV 0x8(%RAX),%RAX |
0x434e52 KORTESTB %K2,%K2 |
0x434e56 JE 434e5d |
0x434e58 VMOVQ 0x40(%RDI),%XMM3 |
0x434e5d KORTESTB %K2,%K2 |
0x434e61 JE 434e68 |
0x434e63 VMOVQ 0x30(%RDI),%XMM4 |
0x434e68 KORTESTB %K2,%K2 |
0x434e6c JE 434e74 |
0x434e6e VMOVSD (%RAX,%R15,8),%XMM6 |
0x434e74 VPBROADCASTQ %XMM4,%ZMM4 |
0x434e7a VPMULLQ %ZMM9,%ZMM4,%ZMM4 |
0x434e80 VPBROADCASTQ %XMM3,%ZMM3 |
0x434e86 VPADDQ %ZMM4,%ZMM1,%ZMM4 |
0x434e8c VPSLLQ $0x3,%ZMM4,%ZMM4 |
0x434e93 VPADDQ %ZMM4,%ZMM3,%ZMM3 |
0x434e99 VBROADCASTSD %XMM6,%ZMM4 |
0x434e9f KMOVQ %K2,%K3 |
0x434ea4 VSCATTERQPD %ZMM4,(,%ZMM3,1){%K3} |
0x434eaf KORTESTB %K2,%K2 |
0x434eb3 JE 434ebd |
0x434eb5 MOV -0x38(%RBP),%RAX |
0x434eb9 MOV 0x8(%RAX),%RAX |
0x434ebd KORTESTB %K2,%K2 |
0x434ec1 JE 434ec8 |
0x434ec3 VMOVQ 0x10(%RDI),%XMM3 |
0x434ec8 KORTESTB %K2,%K2 |
0x434ecc JE 434ed2 |
0x434ece VMOVQ (%RDI),%XMM4 |
0x434ed2 KORTESTB %K2,%K2 |
0x434ed6 JE 434ede |
0x434ed8 VMOVSD (%RAX,%R15,8),%XMM6 |
0x434ede VPBROADCASTQ %XMM4,%ZMM4 |
0x434ee4 VPMULLQ %ZMM9,%ZMM4,%ZMM4 |
0x434eea VPBROADCASTQ %XMM3,%ZMM3 |
0x434ef0 VPADDQ %ZMM4,%ZMM1,%ZMM4 |
0x434ef6 VPSLLQ $0x3,%ZMM4,%ZMM4 |
0x434efd VPADDQ %ZMM4,%ZMM3,%ZMM3 |
0x434f03 VBROADCASTSD %XMM6,%ZMM4 |
0x434f09 KMOVQ %K2,%K3 |
0x434f0e VSCATTERQPD %ZMM4,(,%ZMM3,1){%K3} |
0x434f19 KORTESTB %K2,%K2 |
0x434f1d JE 434f27 |
0x434f1f MOV -0x48(%RBP),%RAX |
0x434f23 MOV 0x8(%RAX),%RAX |
0x434f27 KORTESTB %K2,%K2 |
0x434f2b JE 434f35 |
0x434f2d VMOVQ 0xb8(%RDI),%XMM3 |
0x434f35 KORTESTB %K2,%K2 |
0x434f39 JE 434f42 |
0x434f3b MOV 0xa8(%RDI),%RCX |
0x434f42 KORTESTB %K2,%K2 |
0x434f46 JE 434f50 |
0x434f48 MOV -0x50(%RBP),%RDX |
0x434f4c MOV 0x8(%RDX),%RDX |
0x434f50 KORTESTB %K2,%K2 |
0x434f54 JE 434f5e |
0x434f56 VMOVQ 0xe8(%RDI),%XMM4 |
0x434f5e KORTESTB %K2,%K2 |
0x434f62 JE 434f6b |
0x434f64 MOV 0xd8(%RDI),%R8 |
0x434f6b VPBROADCASTQ %XMM3,%ZMM3 |
0x434f71 VPBROADCASTQ %RCX,%ZMM8 |
0x434f77 VPBROADCASTQ %XMM4,%ZMM4 |
0x434f7d VPBROADCASTQ %R8,%ZMM10 |
0x434f83 VPADDQ %ZMM20,%ZMM5,%ZMM5 |
0x434f89 VPSRAQ $0x20,%ZMM5,%ZMM5 |
0x434f90 VPSUBQ %ZMM21,%ZMM5,%ZMM5 |
0x434f96 VPSUBQ %ZMM21,%ZMM9,%ZMM6 |
0x434f9c VPMAXSQ %ZMM6,%ZMM5,%ZMM5 |
0x434fa2 VMOVDQA64 %ZMM9,%ZMM6 |
0x434fa8 VPTERNLOGQ $0xf,%ZMM9,%ZMM9,%ZMM6 |
0x434faf VPADDQ %ZMM6,%ZMM5,%ZMM5 |
0x434fb5 VPMOVQD %ZMM1,%YMM6 |
0x434fbb VPCMPEQD %YMM7,%YMM7,%YMM7 |
0x434fbf VPSUBD %YMM7,%YMM6,%YMM7 |
0x434fc3 VPMAXSD %YMM6,%YMM7,%YMM7 |
0x434fc8 VPSUBD %YMM6,%YMM7,%YMM7 |
0x434fcc VPMOVZXDQ %YMM7,%ZMM6 |
0x434fd2 VPSUBQ %ZMM21,%ZMM6,%ZMM11 |
0x434fd8 VPCMPNLEUD %YMM25,%YMM7,%K0 |
0x434fdf KMOVW %K0,-0x2a(%RBP) |
0x434fe4 VPANDQ %ZMM26,%ZMM11,%ZMM7 |
0x434fea VPCMPLEUQ %ZMM6,%ZMM7,%K0 |
0x434ff1 VPMULLQ %ZMM9,%ZMM8,%ZMM8 |
0x434ff7 VPMULLQ %ZMM9,%ZMM10,%ZMM9 |
0x434ffd VPSRLQ $0x3,%ZMM11,%ZMM10 |
0x435004 VPADDQ %ZMM21,%ZMM10,%ZMM10 |
0x43500a XOR %R9D,%R9D |
0x43500d JMP 43502d |
(344) 0x435010 VPBROADCASTQ %R9,%ZMM11 |
(344) 0x435016 INC %R9 |
(344) 0x435019 VPCMPEQQ %ZMM5,%ZMM11,%K4 |
(344) 0x43501f KANDNB %K1,%K4,%K1 |
(344) 0x435023 KTESTB %K2,%K1 |
(344) 0x435027 JE 434210 |
(344) 0x43502d VCMPPD $0x2,%ZMM2,%ZMM0,%K4{%K1} |
(344) 0x435034 KORTESTB %K4,%K4 |
(344) 0x435038 JE 435450 |
(344) 0x43503e KMOVW -0x2a(%RBP),%K3 |
(344) 0x435043 KANDB %K3,%K4,%K5 |
(344) 0x435047 KORTESTB %K5,%K5 |
(344) 0x43504b JE 435360 |
(344) 0x435051 MOV %RCX,%R10 |
(344) 0x435054 IMUL %R9,%R10 |
(344) 0x435058 MOV %R8,%R11 |
(344) 0x43505b IMUL %R9,%R11 |
(344) 0x43505f XOR %EDI,%EDI |
(344) 0x435061 KMOVW -0x2a(%RBP),%K6 |
(344) 0x435066 JMP 435084 |
(346) 0x435070 KXORW %K0,%K0,%K7 |
(346) 0x435074 XOR %EDI,%EDI |
(346) 0x435076 KANDNB %K6,%K7,%K6 |
(346) 0x43507a KTESTB %K5,%K6 |
(346) 0x43507e JE 435360 |
(346) 0x435084 KANDB %K6,%K5,%K3 |
(346) 0x435088 KORTESTB %K3,%K3 |
(346) 0x43508c JE 435070 |
(346) 0x43508e KORTESTB %K3,%K3 |
(346) 0x435092 JE 43509a |
(346) 0x435094 VMOVSD (%RAX,%R15,8),%XMM12 |
(346) 0x43509a LEA (%R10,%RDI,8),%RBX |
(346) 0x43509e VPBROADCASTQ %RBX,%ZMM11 |
(346) 0x4350a4 VPADDQ %ZMM11,%ZMM1,%ZMM11 |
(346) 0x4350aa VPADDQ %ZMM8,%ZMM11,%ZMM11 |
(346) 0x4350b0 VPSLLQ $0x3,%ZMM11,%ZMM11 |
(346) 0x4350b7 VPADDQ %ZMM11,%ZMM3,%ZMM11 |
(346) 0x4350bd VBROADCASTSD %XMM12,%ZMM12 |
(346) 0x4350c3 KMOVQ %K3,%K7 |
(346) 0x4350c8 VSCATTERQPD %ZMM12,(,%ZMM11,1){%K7} |
(346) 0x4350d3 KORTESTB %K3,%K3 |
(346) 0x4350d7 JE 4350df |
(346) 0x4350d9 VMOVSD (%RDX,%R15,8),%XMM13 |
(346) 0x4350df LEA (,%RDI,8),%RBX |
(346) 0x4350e7 ADD %R11,%RBX |
(346) 0x4350ea VPBROADCASTQ %RBX,%ZMM12 |
(346) 0x4350f0 VPADDQ %ZMM12,%ZMM1,%ZMM12 |
(346) 0x4350f6 VPADDQ %ZMM9,%ZMM12,%ZMM12 |
(346) 0x4350fc VPSLLQ $0x3,%ZMM12,%ZMM12 |
(346) 0x435103 VPADDQ %ZMM12,%ZMM4,%ZMM12 |
(346) 0x435109 VBROADCASTSD %XMM13,%ZMM13 |
(346) 0x43510f KMOVQ %K3,%K7 |
(346) 0x435114 VSCATTERQPD %ZMM13,(,%ZMM12,1){%K7} |
(346) 0x43511f KORTESTB %K3,%K3 |
(346) 0x435123 JE 43512b |
(346) 0x435125 VMOVSD (%RAX,%R15,8),%XMM13 |
(346) 0x43512b VPADDQ %ZMM24,%ZMM11,%ZMM14 |
(346) 0x435131 VBROADCASTSD %XMM13,%ZMM13 |
(346) 0x435137 KMOVQ %K3,%K7 |
(346) 0x43513c VSCATTERQPD %ZMM13,(,%ZMM14,1){%K7} |
(346) 0x435147 KORTESTB %K3,%K3 |
(346) 0x43514b JE 435153 |
(346) 0x43514d VMOVSD (%RDX,%R15,8),%XMM13 |
(346) 0x435153 VPADDQ %ZMM24,%ZMM12,%ZMM14 |
(346) 0x435159 VBROADCASTSD %XMM13,%ZMM13 |
(346) 0x43515f KMOVQ %K3,%K7 |
(346) 0x435164 VSCATTERQPD %ZMM13,(,%ZMM14,1){%K7} |
(346) 0x43516f KORTESTB %K3,%K3 |
(346) 0x435173 JE 43517b |
(346) 0x435175 VMOVSD (%RAX,%R15,8),%XMM13 |
(346) 0x43517b VPADDQ %ZMM27,%ZMM11,%ZMM14 |
(346) 0x435181 VBROADCASTSD %XMM13,%ZMM13 |
(346) 0x435187 KMOVQ %K3,%K7 |
(346) 0x43518c VSCATTERQPD %ZMM13,(,%ZMM14,1){%K7} |
(346) 0x435197 KORTESTB %K3,%K3 |
(346) 0x43519b JE 4351a3 |
(346) 0x43519d VMOVSD (%RDX,%R15,8),%XMM13 |
(346) 0x4351a3 VPADDQ %ZMM27,%ZMM12,%ZMM14 |
(346) 0x4351a9 VBROADCASTSD %XMM13,%ZMM13 |
(346) 0x4351af KMOVQ %K3,%K7 |
(346) 0x4351b4 VSCATTERQPD %ZMM13,(,%ZMM14,1){%K7} |
(346) 0x4351bf KORTESTB %K3,%K3 |
(346) 0x4351c3 JE 4351cb |
(346) 0x4351c5 VMOVSD (%RAX,%R15,8),%XMM13 |
(346) 0x4351cb VPADDQ %ZMM28,%ZMM11,%ZMM14 |
(346) 0x4351d1 VBROADCASTSD %XMM13,%ZMM13 |
(346) 0x4351d7 KMOVQ %K3,%K7 |
(346) 0x4351dc VSCATTERQPD %ZMM13,(,%ZMM14,1){%K7} |
(346) 0x4351e7 KORTESTB %K3,%K3 |
(346) 0x4351eb JE 4351f3 |
(346) 0x4351ed VMOVSD (%RDX,%R15,8),%XMM13 |
(346) 0x4351f3 VPADDQ %ZMM28,%ZMM12,%ZMM14 |
(346) 0x4351f9 VBROADCASTSD %XMM13,%ZMM13 |
(346) 0x4351ff KMOVQ %K3,%K7 |
(346) 0x435204 VSCATTERQPD %ZMM13,(,%ZMM14,1){%K7} |
(346) 0x43520f KORTESTB %K3,%K3 |
(346) 0x435213 JE 43521b |
(346) 0x435215 VMOVSD (%RAX,%R15,8),%XMM13 |
(346) 0x43521b VPADDQ %ZMM29,%ZMM11,%ZMM14 |
(346) 0x435221 VBROADCASTSD %XMM13,%ZMM13 |
(346) 0x435227 KMOVQ %K3,%K7 |
(346) 0x43522c VSCATTERQPD %ZMM13,(,%ZMM14,1){%K7} |
(346) 0x435237 KORTESTB %K3,%K3 |
(346) 0x43523b JE 435243 |
(346) 0x43523d VMOVSD (%RDX,%R15,8),%XMM13 |
(346) 0x435243 VPADDQ %ZMM29,%ZMM12,%ZMM14 |
(346) 0x435249 VBROADCASTSD %XMM13,%ZMM13 |
(346) 0x43524f KMOVQ %K3,%K7 |
(346) 0x435254 VSCATTERQPD %ZMM13,(,%ZMM14,1){%K7} |
(346) 0x43525f KORTESTB %K3,%K3 |
(346) 0x435263 JE 43526b |
(346) 0x435265 VMOVSD (%RAX,%R15,8),%XMM13 |
(346) 0x43526b VPADDQ %ZMM30,%ZMM11,%ZMM14 |
(346) 0x435271 VBROADCASTSD %XMM13,%ZMM13 |
(346) 0x435277 KMOVQ %K3,%K7 |
(346) 0x43527c VSCATTERQPD %ZMM13,(,%ZMM14,1){%K7} |
(346) 0x435287 KORTESTB %K3,%K3 |
(346) 0x43528b JE 435293 |
(346) 0x43528d VMOVSD (%RDX,%R15,8),%XMM13 |
(346) 0x435293 VPADDQ %ZMM30,%ZMM12,%ZMM14 |
(346) 0x435299 VBROADCASTSD %XMM13,%ZMM13 |
(346) 0x43529f KMOVQ %K3,%K7 |
(346) 0x4352a4 VSCATTERQPD %ZMM13,(,%ZMM14,1){%K7} |
(346) 0x4352af KORTESTB %K3,%K3 |
(346) 0x4352b3 JE 4352bb |
(346) 0x4352b5 VMOVSD (%RAX,%R15,8),%XMM13 |
(346) 0x4352bb VPADDQ %ZMM31,%ZMM11,%ZMM14 |
(346) 0x4352c1 VBROADCASTSD %XMM13,%ZMM13 |
(346) 0x4352c7 KMOVQ %K3,%K7 |
(346) 0x4352cc VSCATTERQPD %ZMM13,(,%ZMM14,1){%K7} |
(346) 0x4352d7 KORTESTB %K3,%K3 |
(346) 0x4352db JE 4352e3 |
(346) 0x4352dd VMOVSD (%RDX,%R15,8),%XMM13 |
(346) 0x4352e3 VPADDQ %ZMM31,%ZMM12,%ZMM14 |
(346) 0x4352e9 VBROADCASTSD %XMM13,%ZMM13 |
(346) 0x4352ef KMOVQ %K3,%K7 |
(346) 0x4352f4 VSCATTERQPD %ZMM13,(,%ZMM14,1){%K7} |
(346) 0x4352ff KORTESTB %K3,%K3 |
(346) 0x435303 JE 43530b |
(346) 0x435305 VMOVSD (%RAX,%R15,8),%XMM13 |
(346) 0x43530b VPADDQ %ZMM22,%ZMM11,%ZMM11 |
(346) 0x435311 VBROADCASTSD %XMM13,%ZMM13 |
(346) 0x435317 KMOVQ %K3,%K7 |
(346) 0x43531c VSCATTERQPD %ZMM13,(,%ZMM11,1){%K7} |
(346) 0x435327 KORTESTB %K3,%K3 |
(346) 0x43532b JE 435333 |
(346) 0x43532d VMOVSD (%RDX,%R15,8),%XMM11 |
(346) 0x435333 VPADDQ %ZMM22,%ZMM12,%ZMM12 |
(346) 0x435339 VBROADCASTSD %XMM11,%ZMM11 |
(346) 0x43533f VSCATTERQPD %ZMM11,(,%ZMM12,1){%K3} |
(346) 0x43534a VPBROADCASTQ %RDI,%ZMM11 |
(346) 0x435350 INC %RDI |
(346) 0x435353 VPCMPEQQ %ZMM10,%ZMM11,%K7 |
(346) 0x435359 JMP 435076 |
(344) 0x435360 KANDB %K0,%K4,%K4 |
(344) 0x435364 KORTESTB %K4,%K4 |
(344) 0x435368 JE 435010 |
(344) 0x43536e MOV %RCX,%RDI |
(344) 0x435371 IMUL %R9,%RDI |
(344) 0x435375 VPBROADCASTQ %RDI,%ZMM11 |
(344) 0x43537b MOV %R8,%RDI |
(344) 0x43537e IMUL %R9,%RDI |
(344) 0x435382 VPBROADCASTQ %RDI,%ZMM12 |
(344) 0x435388 VMOVDQA64 %ZMM7,%ZMM13 |
(344) 0x43538e KMOVQ %K0,%K5 |
(344) 0x435393 JMP 4353b7 |
(345) 0x4353a0 KXORW %K0,%K0,%K6 |
(345) 0x4353a4 VPXOR %XMM13,%XMM13,%XMM13 |
(345) 0x4353a9 KANDNB %K5,%K6,%K5 |
(345) 0x4353ad KTESTB %K4,%K5 |
(345) 0x4353b1 JE 435010 |
(345) 0x4353b7 KANDB %K5,%K4,%K6 |
(345) 0x4353bb KORTESTB %K6,%K6 |
(345) 0x4353bf JE 4353a0 |
(345) 0x4353c1 KORTESTB %K6,%K6 |
(345) 0x4353c5 JE 4353cd |
(345) 0x4353c7 VMOVSD (%RAX,%R15,8),%XMM14 |
(345) 0x4353cd VPADDQ %ZMM13,%ZMM11,%ZMM15 |
(345) 0x4353d3 VPADDQ %ZMM15,%ZMM1,%ZMM15 |
(345) 0x4353d9 VPADDQ %ZMM8,%ZMM15,%ZMM15 |
(345) 0x4353df VPSLLQ $0x3,%ZMM15,%ZMM15 |
(345) 0x4353e6 VPADDQ %ZMM15,%ZMM3,%ZMM15 |
(345) 0x4353ec VBROADCASTSD %XMM14,%ZMM14 |
(345) 0x4353f2 KMOVQ %K6,%K3 |
(345) 0x4353f7 VSCATTERQPD %ZMM14,(,%ZMM15,1){%K3} |
(345) 0x435402 KORTESTB %K6,%K6 |
(345) 0x435406 JE 43540e |
(345) 0x435408 VMOVSD (%RDX,%R15,8),%XMM14 |
(345) 0x43540e VPADDQ %ZMM13,%ZMM12,%ZMM15 |
(345) 0x435414 VPADDQ %ZMM15,%ZMM1,%ZMM15 |
(345) 0x43541a VPADDQ %ZMM9,%ZMM15,%ZMM15 |
(345) 0x435420 VPSLLQ $0x3,%ZMM15,%ZMM15 |
(345) 0x435427 VPADDQ %ZMM15,%ZMM4,%ZMM15 |
(345) 0x43542d VBROADCASTSD %XMM14,%ZMM14 |
(345) 0x435433 VSCATTERQPD %ZMM14,(,%ZMM15,1){%K6} |
(345) 0x43543e VPCMPEQQ %ZMM6,%ZMM13,%K6 |
(345) 0x435444 VPSUBQ %ZMM21,%ZMM13,%ZMM13 |
(345) 0x43544a JMP 4353a9 |
(344) 0x435450 KXORW %K0,%K0,%K4 |
(344) 0x435454 XOR %R9D,%R9D |
(344) 0x435457 JMP 43501f |
0x43545c VPANDQ %ZMM23,%ZMM6,%ZMM7 |
0x435462 VPCMPLTUQ %ZMM6,%ZMM7,%K1{%K1} |
0x435469 KORTESTB %K1,%K1 |
0x43546d JE 434210 |
0x435473 KORTESTB %K1,%K1 |
0x435477 JE 43547f |
0x435479 VMOVSD (%RAX,%R15,8),%XMM6 |
0x43547f VPXOR %XMM8,%XMM8,%XMM8 |
0x435484 VPMULLQ %ZMM0,%ZMM5,%ZMM8 |
0x43548a VPMULLQ %ZMM5,%ZMM7,%ZMM5 |
0x435490 VPADDQ %ZMM8,%ZMM1,%ZMM8 |
0x435496 VPADDQ %ZMM5,%ZMM8,%ZMM5 |
0x43549c VPSLLQ $0x3,%ZMM5,%ZMM5 |
0x4354a3 VPADDQ %ZMM5,%ZMM4,%ZMM4 |
0x4354a9 VBROADCASTSD %XMM6,%ZMM5 |
0x4354af KMOVQ %K1,%K2 |
0x4354b4 VSCATTERQPD %ZMM5,(,%ZMM4,1){%K2} |
0x4354bf KORTESTB %K1,%K1 |
0x4354c3 JE 4354cb |
0x4354c5 VMOVSD (%RCX,%R15,8),%XMM5 |
0x4354cb VPMULLQ %ZMM0,%ZMM3,%ZMM0 |
0x4354d1 VPMULLQ %ZMM3,%ZMM7,%ZMM3 |
0x4354d7 VPADDQ %ZMM0,%ZMM1,%ZMM0 |
0x4354dd VPADDQ %ZMM3,%ZMM0,%ZMM0 |
0x4354e3 VPSLLQ $0x3,%ZMM0,%ZMM0 |
0x4354ea VPADDQ %ZMM0,%ZMM2,%ZMM0 |
0x4354f0 VBROADCASTSD %XMM5,%ZMM1 |
0x4354f6 KMOVQ %K1,%K2 |
0x4354fb VSCATTERQPD %ZMM1,(,%ZMM0,1){%K2} |
0x435506 KORTESTB %K1,%K1 |
0x43550a JE 435512 |
0x43550c VMOVSD (%RAX,%R15,8),%XMM1 |
0x435512 VPADDQ %ZMM24,%ZMM4,%ZMM2 |
0x435518 VBROADCASTSD %XMM1,%ZMM1 |
0x43551e KMOVQ %K1,%K2 |
0x435523 VSCATTERQPD %ZMM1,(,%ZMM2,1){%K2} |
0x43552e KORTESTB %K1,%K1 |
0x435532 JE 4341f6 |
0x435538 VMOVSD (%RCX,%R15,8),%XMM1 |
0x43553e JMP 4341f6 |
/home/eoseret/qaas_runs_CPU_9468/171-145-9336/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/context.h: 46 - 69 |
-------------------------------------------------------------------------------- |
46: T &operator[](size_t i) const { return data[i]; } |
[...] |
69: T &operator()(size_t i, size_t j) const { return data[i + j * sizeX]; } |
/home/eoseret/qaas_runs_CPU_9468/171-145-9336/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/generate_chunk.cpp: 85 - 123 |
-------------------------------------------------------------------------------- |
85: #pragma omp parallel for simd collapse(2) |
86: for (int j = (0); j < (yrange); j++) { |
87: for (int i = (0); i < (xrange); i++) { |
88: double x_cent = state_xmin[state]; |
89: double y_cent = state_ymin[state]; |
90: if (state_geometry[state] == g_rect) { |
91: if (field.vertexx[i + 1] >= state_xmin[state] && field.vertexx[i] < state_xmax[state]) { |
92: if (field.vertexy[j + 1] >= state_ymin[state] && field.vertexy[j] < state_ymax[state]) { |
93: field.energy0(i, j) = state_energy[state]; |
94: field.density0(i, j) = state_density[state]; |
95: for (int kt = j; kt <= j + 1; ++kt) { |
96: for (int jt = i; jt <= i + 1; ++jt) { |
97: field.xvel0(jt, kt) = state_xvel[state]; |
98: field.yvel0(jt, kt) = state_yvel[state]; |
[...] |
105: std::sqrt((field.cellx[i] - x_cent) * (field.cellx[i] - x_cent) + (field.celly[j] - y_cent) * (field.celly[j] - y_cent)); |
106: if (radius <= state_radius[state]) { |
107: field.energy0(i, j) = state_energy[state]; |
108: field.density0(i, j) = state_density[state]; |
109: for (int kt = j; kt <= j + 1; ++kt) { |
110: for (int jt = i; jt <= i + 1; ++jt) { |
111: field.xvel0(jt, kt) = state_xvel[state]; |
112: field.yvel0(jt, kt) = state_yvel[state]; |
113: } |
114: } |
115: } |
116: } else if (state_geometry[state] == g_point) { |
117: if (field.vertexx[i] == x_cent && field.vertexy[j] == y_cent) { |
118: field.energy0(i, j) = state_energy[state]; |
119: field.density0(i, j) = state_density[state]; |
120: for (int kt = j; kt <= j + 1; ++kt) { |
121: for (int jt = i; jt <= i + 1; ++jt) { |
122: field.xvel0(jt, kt) = state_xvel[state]; |
123: field.yvel0(jt, kt) = state_yvel[state]; |
Path / |
Metric | Value |
---|---|
CQA speedup if no scalar integer | 1.33 |
CQA speedup if FP arith vectorized | 1.00 |
CQA speedup if fully vectorized | 1.12 |
CQA speedup if no inter-iteration dependency | NA |
CQA speedup if next bottleneck killed | 1.25 |
Bottlenecks | P0, P5, |
Function | _Z14generate_chunkiR16global_variables.extracted |
Source | context.h:46-46,context.h:69-69,generate_chunk.cpp:85-87,generate_chunk.cpp:91-98,generate_chunk.cpp:105-112,generate_chunk.cpp:117-123 |
Source loop unroll info | NA |
Source loop unroll confidence level | NA |
Unroll/vectorization loop type | NA |
Unroll factor | NA |
CQA cycles | 151.50 |
CQA cycles if no scalar integer | 114.00 |
CQA cycles if FP arith vectorized | 151.50 |
CQA cycles if fully vectorized | 135.00 |
Front-end cycles | 120.83 |
DIV/SQRT cycles | 18.00 |
P0 cycles | 151.50 |
P1 cycles | 12.40 |
P2 cycles | 49.00 |
P3 cycles | 49.00 |
P4 cycles | 41.50 |
P5 cycles | 151.50 |
P6 cycles | 67.00 |
P7 cycles | 41.50 |
P8 cycles | 41.50 |
P9 cycles | 41.50 |
P10 cycles | 12.60 |
P11 cycles | 49.00 |
Inter-iter dependencies cycles | NA |
FE+BE cycles (UFS) | 160.63 - 248.42 |
Stall cycles (UFS) | 60.66 - 148.42 |
Nb insns | 438.00 |
Nb uops | 725.00 |
Nb loads | 92.00 |
Nb stores | 12.00 |
Nb stack references | 11.00 |
FLOP/cycle | 0.32 |
Nb FLOP add-sub | 16.00 |
Nb FLOP mul | 8.00 |
Nb FLOP fma | 8.00 |
Nb FLOP div | 0.00 |
Nb FLOP rcp | 0.00 |
Nb FLOP sqrt | 8.00 |
Nb FLOP rsqrt | 0.00 |
Bytes/cycle | 12.07 |
Bytes prefetched | 0.00 |
Bytes loaded | 1184.00 |
Bytes stored | 644.00 |
Stride 0 | NA |
Stride 1 | NA |
Stride n | NA |
Stride unknown | NA |
Stride indirect | NA |
Vectorization ratio all | 65.00 |
Vectorization ratio load | 19.15 |
Vectorization ratio store | 100.00 |
Vectorization ratio mul | 100.00 |
Vectorization ratio add_sub | 98.04 |
Vectorization ratio fma | 100.00 |
Vectorization ratio div_sqrt | 100.00 |
Vectorization ratio other | 61.29 |
Vector-efficiency ratio all | 63.23 |
Vector-efficiency ratio load | 29.26 |
Vector-efficiency ratio store | 100.00 |
Vector-efficiency ratio mul | 100.00 |
Vector-efficiency ratio add_sub | 93.38 |
Vector-efficiency ratio fma | 100.00 |
Vector-efficiency ratio div_sqrt | 100.00 |
Vector-efficiency ratio other | 56.25 |
Metric | Value |
---|---|
CQA speedup if no scalar integer | 1.33 |
CQA speedup if FP arith vectorized | 1.00 |
CQA speedup if fully vectorized | 1.12 |
CQA speedup if no inter-iteration dependency | NA |
CQA speedup if next bottleneck killed | 1.25 |
Bottlenecks | P0, P5, |
Function | _Z14generate_chunkiR16global_variables.extracted |
Source | context.h:46-46,context.h:69-69,generate_chunk.cpp:85-87,generate_chunk.cpp:91-98,generate_chunk.cpp:105-112,generate_chunk.cpp:117-123 |
Source loop unroll info | NA |
Source loop unroll confidence level | NA |
Unroll/vectorization loop type | NA |
Unroll factor | NA |
CQA cycles | 151.50 |
CQA cycles if no scalar integer | 114.00 |
CQA cycles if FP arith vectorized | 151.50 |
CQA cycles if fully vectorized | 135.00 |
Front-end cycles | 120.83 |
DIV/SQRT cycles | 18.00 |
P0 cycles | 151.50 |
P1 cycles | 12.40 |
P2 cycles | 49.00 |
P3 cycles | 49.00 |
P4 cycles | 41.50 |
P5 cycles | 151.50 |
P6 cycles | 67.00 |
P7 cycles | 41.50 |
P8 cycles | 41.50 |
P9 cycles | 41.50 |
P10 cycles | 12.60 |
P11 cycles | 49.00 |
Inter-iter dependencies cycles | NA |
FE+BE cycles (UFS) | 160.63 - 248.42 |
Stall cycles (UFS) | 60.66 - 148.42 |
Nb insns | 438.00 |
Nb uops | 725.00 |
Nb loads | 92.00 |
Nb stores | 12.00 |
Nb stack references | 11.00 |
FLOP/cycle | 0.32 |
Nb FLOP add-sub | 16.00 |
Nb FLOP mul | 8.00 |
Nb FLOP fma | 8.00 |
Nb FLOP div | 0.00 |
Nb FLOP rcp | 0.00 |
Nb FLOP sqrt | 8.00 |
Nb FLOP rsqrt | 0.00 |
Bytes/cycle | 12.07 |
Bytes prefetched | 0.00 |
Bytes loaded | 1184.00 |
Bytes stored | 644.00 |
Stride 0 | NA |
Stride 1 | NA |
Stride n | NA |
Stride unknown | NA |
Stride indirect | NA |
Vectorization ratio all | 65.00 |
Vectorization ratio load | 19.15 |
Vectorization ratio store | 100.00 |
Vectorization ratio mul | 100.00 |
Vectorization ratio add_sub | 98.04 |
Vectorization ratio fma | 100.00 |
Vectorization ratio div_sqrt | 100.00 |
Vectorization ratio other | 61.29 |
Vector-efficiency ratio all | 63.23 |
Vector-efficiency ratio load | 29.26 |
Vector-efficiency ratio store | 100.00 |
Vector-efficiency ratio mul | 100.00 |
Vector-efficiency ratio add_sub | 93.38 |
Vector-efficiency ratio fma | 100.00 |
Vector-efficiency ratio div_sqrt | 100.00 |
Vector-efficiency ratio other | 56.25 |
Path / |
Function | _Z14generate_chunkiR16global_variables.extracted |
Source file and lines | generate_chunk.cpp:85-123 |
Module | exec |
nb instructions | 438 |
nb uops | 725 |
loop length | 2250 |
used x86 registers | 12 |
used mmx registers | 0 |
used xmm registers | 8 |
used ymm registers | 5 |
used zmm registers | 21 |
nb stack references | 11 |
ADD-SUB / MUL ratio | 2.00 |
micro-operation queue | 120.83 cycles |
front end | 120.83 cycles |
| | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 151.50 | 12.40 | 49.00 | 49.00 | 41.50 | 151.50 | 67.00 | 41.50 | 41.50 | 41.50 | 12.60 | 49.00 |
cycles | 151.50 | 12.40 | 49.00 | 49.00 | 41.50 | 151.50 | 67.00 | 41.50 | 41.50 | 41.50 | 12.60 | 49.00 |
Cycles executing div or sqrt instructions | 18.00 |
FE+BE cycles | 160.63-248.42 |
Stall cycles | 60.67-148.42 |
ROB full (events) | 4.97-134.53 |
RS full (events) | 119.88-36.91 |
Front-end | 120.83 |
Dispatch | 151.50 |
DIV/SQRT | 18.00 |
Overall L1 | 151.50 |
all | 67% |
load | 4% |
store | NA (no store vectorizable/vectorized instructions) |
mul | 100% |
add-sub | 97% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 62% |
all | 56% |
load | 34% |
store | 100% |
mul | 100% |
add-sub | 100% |
fma | 100% |
div/sqrt | 100% |
other | 57% |
all | 65% |
load | 19% |
store | 100% |
mul | 100% |
add-sub | 98% |
fma | 100% |
div/sqrt | 100% |
other | 61% |
all | 65% |
load | 16% |
store | NA (no store vectorizable/vectorized instructions) |
mul | 100% |
add-sub | 93% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 57% |
all | 57% |
load | 42% |
store | 100% |
mul | 100% |
add-sub | 100% |
fma | 100% |
div/sqrt | 100% |
other | 53% |
all | 63% |
load | 29% |
store | 100% |
mul | 100% |
add-sub | 93% |
fma | 100% |
div/sqrt | 100% |
other | 56% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
VPADDQ %ZMM24,%ZMM0,%ZMM0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VBROADCASTSD %XMM1,%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VSCATTERQPD %ZMM1,(,%ZMM0,1){%K1} | 20 | 2.20 | 0.20 | 0 | 0 | 4 | 0.20 | 0.20 | 4 | 4 | 4 | 0.20 | 0 | 2-12 | 7 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPADDQ %ZMM24,%ZMM19,%ZMM19 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD $0x8,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %R12,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 435543 <_Z14generate_chunkiR16global_variables.extracted+0x1513> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VPADDQ %ZMM19,%ZMM18,%ZMM16 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSXD %R13D,%RAX | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
VPBROADCASTQ %RAX,%ZMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQA64 %ZMM16,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.17 |
VMOVDQA64 %ZMM17,%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.17 |
LEA 0x2756b(%RIP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL %RAX | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 2.14 |
VPXOR %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPMULLQ %ZMM17,%ZMM0,%ZMM1 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPSUBQ %ZMM1,%ZMM16,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.50 |
MOV -0x98(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD (%RAX,%R15,8),%ZMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
MOV -0x90(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD (%RAX,%R15,8),%ZMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
CMP $0x2,%R14D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 434540 <_Z14generate_chunkiR16global_variables.extracted+0x510> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP $0x1,%R14D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 434210 <_Z14generate_chunkiR16global_variables.extracted+0x1e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x258(%RDX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPMOVQD %ZMM1,%YMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPCMPEQD %YMM5,%YMM5,%YMM5 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPSUBD %YMM5,%YMM4,%YMM4 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.33 |
KXNORW %K0,%K0,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VPXOR %XMM5,%XMM5,%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VGATHERDPD (%RAX,%YMM4,8),%ZMM5{%K1} | 5 | 1 | 0 | 2.67 | 2.67 | 0 | 2 | 0 | 0 | 0 | 0 | 0 | 2.67 | 0-29 | 2.67 |
VCMPPD $0x2,%ZMM5,%ZMM3,%K1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434210 <_Z14generate_chunkiR16global_variables.extracted+0x1e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JE 4342c9 <_Z14generate_chunkiR16global_variables.extracted+0x299> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x80(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RCX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4342d5 <_Z14generate_chunkiR16global_variables.extracted+0x2a5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD (%RCX,%R15,8),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
VXORPD %XMM4,%XMM4,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VGATHERQPD (%RAX,%ZMM1,8),%ZMM4{%K2} | 5 | 1 | 0 | 2.67 | 2.67 | 0 | 2 | 0 | 0 | 0 | 0 | 0 | 2.67 | 0-29 | 2.67 |
VBROADCASTSD %XMM3,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VCMPPD $0x1,%ZMM3,%ZMM4,%K1{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434210 <_Z14generate_chunkiR16global_variables.extracted+0x1e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 43430a <_Z14generate_chunkiR16global_variables.extracted+0x2da> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0x278(%RDX),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPSLLQ $0x20,%ZMM0,%ZMM0 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPADDQ %ZMM20,%ZMM0,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPSRAQ $0x20,%ZMM4,%ZMM6 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VMOVQ %XMM3,%RAX | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
VPXOR %XMM4,%XMM4,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VGATHERQPD (%RAX,%ZMM6,8),%ZMM4{%K2} | 5 | 1 | 0 | 2.67 | 2.67 | 0 | 2 | 0 | 0 | 0 | 0 | 0 | 2.67 | 0-29 | 2.67 |
VCMPPD $0x2,%ZMM4,%ZMM2,%K1{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434210 <_Z14generate_chunkiR16global_variables.extracted+0x1e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JE 43434e <_Z14generate_chunkiR16global_variables.extracted+0x31e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x78(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 43435a <_Z14generate_chunkiR16global_variables.extracted+0x32a> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD (%RAX,%R15,8),%XMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %XMM3,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPSRAQ $0x1d,%ZMM0,%ZMM4 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPADDQ %ZMM4,%ZMM3,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
VPXOR %XMM4,%XMM4,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VGATHERQPD (,%ZMM3,1),%ZMM4{%K2} | 5 | 1 | 0 | 2.67 | 2.67 | 0 | 2 | 0 | 0 | 0 | 0 | 0 | 2.67 | 0-29 | 2.67 |
VBROADCASTSD %XMM2,%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VCMPPD $0x1,%ZMM2,%ZMM4,%K1{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434210 <_Z14generate_chunkiR16global_variables.extracted+0x1e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JE 4343a2 <_Z14generate_chunkiR16global_variables.extracted+0x372> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4343ad <_Z14generate_chunkiR16global_variables.extracted+0x37d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0x40(%RDX),%XMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4343b8 <_Z14generate_chunkiR16global_variables.extracted+0x388> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0x30(%RDX),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4343c4 <_Z14generate_chunkiR16global_variables.extracted+0x394> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD (%RAX,%R15,8),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPSRAQ $0x20,%ZMM0,%ZMM0 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPBROADCASTQ %XMM3,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPMULLQ %ZMM0,%ZMM3,%ZMM3 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPBROADCASTQ %XMM2,%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %ZMM3,%ZMM1,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPSLLQ $0x3,%ZMM3,%ZMM3 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPADDQ %ZMM3,%ZMM2,%ZMM2 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VBROADCASTSD %XMM4,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
VSCATTERQPD %ZMM3,(,%ZMM2,1){%K2} | 20 | 2.20 | 0.20 | 0 | 0 | 4 | 0.20 | 0.20 | 4 | 4 | 4 | 0.20 | 0 | 2-12 | 7 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434414 <_Z14generate_chunkiR16global_variables.extracted+0x3e4> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 43441f <_Z14generate_chunkiR16global_variables.extracted+0x3ef> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0x10(%RDX),%XMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434429 <_Z14generate_chunkiR16global_variables.extracted+0x3f9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ (%RDX),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434435 <_Z14generate_chunkiR16global_variables.extracted+0x405> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD (%RAX,%R15,8),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %XMM3,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPMULLQ %ZMM0,%ZMM3,%ZMM3 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPBROADCASTQ %XMM2,%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %ZMM3,%ZMM1,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPSLLQ $0x3,%ZMM3,%ZMM3 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPADDQ %ZMM3,%ZMM2,%ZMM2 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VBROADCASTSD %XMM4,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
VSCATTERQPD %ZMM3,(,%ZMM2,1){%K2} | 20 | 2.20 | 0.20 | 0 | 0 | 4 | 0.20 | 0.20 | 4 | 4 | 4 | 0.20 | 0 | 2-12 | 7 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 43447e <_Z14generate_chunkiR16global_variables.extracted+0x44e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 43448c <_Z14generate_chunkiR16global_variables.extracted+0x45c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0xb8(%RDX),%XMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434499 <_Z14generate_chunkiR16global_variables.extracted+0x469> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xa8(%RDX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4344a7 <_Z14generate_chunkiR16global_variables.extracted+0x477> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x50(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RCX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4344b5 <_Z14generate_chunkiR16global_variables.extracted+0x485> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0xe8(%RDX),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4344c2 <_Z14generate_chunkiR16global_variables.extracted+0x492> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xd8(%RDX),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %XMM2,%ZMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %RDI,%ZMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %XMM3,%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %R8,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPSUBQ %ZMM21,%ZMM6,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.50 |
VPSUBQ %ZMM21,%ZMM0,%ZMM7 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.50 |
VPMAXSQ %ZMM7,%ZMM6,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPSUBQ %ZMM0,%ZMM6,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.50 |
VPCMPNLEUQ 0x38b2b(%RIP){1to8},%ZMM6,%K0 | |||||||||||||||
KANDB %K0,%K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
KORTESTB %K2,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 43545c <_Z14generate_chunkiR16global_variables.extracted+0x142c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VPSRLQ $0x1,%ZMM6,%ZMM7 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPADDQ %ZMM21,%ZMM7,%ZMM7 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPMULLQ %ZMM0,%ZMM5,%ZMM8 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPMULLQ %ZMM0,%ZMM3,%ZMM9 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPADDQ %ZMM5,%ZMM1,%ZMM10 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %ZMM3,%ZMM1,%ZMM11 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 434bf4 <_Z14generate_chunkiR16global_variables.extracted+0xbc4> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
JE 434dbb <_Z14generate_chunkiR16global_variables.extracted+0xd8b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP $0x3,%R14D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 434210 <_Z14generate_chunkiR16global_variables.extracted+0x1e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x258(%RDI),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KXNORW %K0,%K0,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VXORPD %XMM4,%XMM4,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VGATHERQPD (%RAX,%ZMM1,8),%ZMM4{%K1} | 5 | 1 | 0 | 2.67 | 2.67 | 0 | 2 | 0 | 0 | 0 | 0 | 0 | 2.67 | 0-29 | 2.67 |
VCMPPD $0,%ZMM3,%ZMM4,%K1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434210 <_Z14generate_chunkiR16global_variables.extracted+0x1e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JE 434588 <_Z14generate_chunkiR16global_variables.extracted+0x558> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0x278(%RDI),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVQ %XMM3,%RAX | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VPSLLQ $0x20,%ZMM0,%ZMM3 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPSRAQ $0x1d,%ZMM3,%ZMM0 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
VXORPD %XMM4,%XMM4,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VGATHERQPD (%RAX,%ZMM0,1),%ZMM4{%K2} | 5 | 1 | 0 | 2.67 | 2.67 | 0 | 2 | 0 | 0 | 0 | 0 | 0 | 2.67 | 0-29 | 2.67 |
VCMPPD $0,%ZMM2,%ZMM4,%K0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KANDB %K0,%K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434210 <_Z14generate_chunkiR16global_variables.extracted+0x1e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JE 4345ca <_Z14generate_chunkiR16global_variables.extracted+0x59a> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4345d5 <_Z14generate_chunkiR16global_variables.extracted+0x5a5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0x40(%RDI),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4345e0 <_Z14generate_chunkiR16global_variables.extracted+0x5b0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0x30(%RDI),%XMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4345ec <_Z14generate_chunkiR16global_variables.extracted+0x5bc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD (%RAX,%R15,8),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPSRAQ $0x20,%ZMM3,%ZMM7 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPBROADCASTQ %XMM2,%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPMULLQ %ZMM7,%ZMM2,%ZMM2 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPBROADCASTQ %XMM0,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %ZMM2,%ZMM1,%ZMM2 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPSLLQ $0x3,%ZMM2,%ZMM2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPADDQ %ZMM2,%ZMM0,%ZMM0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VBROADCASTSD %XMM4,%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
VSCATTERQPD %ZMM2,(,%ZMM0,1){%K2} | 20 | 2.20 | 0.20 | 0 | 0 | 4 | 0.20 | 0.20 | 4 | 4 | 4 | 0.20 | 0 | 2-12 | 7 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 43463c <_Z14generate_chunkiR16global_variables.extracted+0x60c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434647 <_Z14generate_chunkiR16global_variables.extracted+0x617> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0x10(%RDI),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434651 <_Z14generate_chunkiR16global_variables.extracted+0x621> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ (%RDI),%XMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 43465d <_Z14generate_chunkiR16global_variables.extracted+0x62d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD (%RAX,%R15,8),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %XMM2,%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPMULLQ %ZMM7,%ZMM2,%ZMM2 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPBROADCASTQ %XMM0,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %ZMM2,%ZMM1,%ZMM2 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPSLLQ $0x3,%ZMM2,%ZMM2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPADDQ %ZMM2,%ZMM0,%ZMM0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VBROADCASTSD %XMM4,%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
VSCATTERQPD %ZMM2,(,%ZMM0,1){%K2} | 20 | 2.20 | 0.20 | 0 | 0 | 4 | 0.20 | 0.20 | 4 | 4 | 4 | 0.20 | 0 | 2-12 | 7 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4346a6 <_Z14generate_chunkiR16global_variables.extracted+0x676> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4346b4 <_Z14generate_chunkiR16global_variables.extracted+0x684> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0xb8(%RDI),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4346c1 <_Z14generate_chunkiR16global_variables.extracted+0x691> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xa8(%RDI),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4346cf <_Z14generate_chunkiR16global_variables.extracted+0x69f> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x50(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RDX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4346dd <_Z14generate_chunkiR16global_variables.extracted+0x6ad> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0xe8(%RDI),%XMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4346ea <_Z14generate_chunkiR16global_variables.extracted+0x6ba> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xd8(%RDI),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %XMM0,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %RCX,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %XMM2,%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %R8,%ZMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %ZMM20,%ZMM3,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPSRAQ $0x20,%ZMM3,%ZMM3 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPSUBQ %ZMM21,%ZMM3,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.50 |
VPSUBQ %ZMM21,%ZMM7,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.50 |
VPMAXSQ %ZMM4,%ZMM3,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQA64 %ZMM7,%ZMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.17 |
VPTERNLOGQ $0xf,%ZMM7,%ZMM7,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %ZMM4,%ZMM3,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPMOVQD %ZMM1,%YMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPCMPEQD %YMM5,%YMM5,%YMM5 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPSUBD %YMM5,%YMM4,%YMM5 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.33 |
VPMAXSD %YMM4,%YMM5,%YMM5 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPSUBD %YMM4,%YMM5,%YMM5 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.33 |
VPMOVZXDQ %YMM5,%ZMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPSUBQ %ZMM21,%ZMM4,%ZMM9 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.50 |
VPCMPNLEUD %YMM25,%YMM5,%K2 | |||||||||||||||
KMOVW %K2,-0x2a(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VPANDQ %ZMM26,%ZMM9,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPCMPLEUQ %ZMM4,%ZMM5,%K3 | |||||||||||||||
VPMULLQ %ZMM7,%ZMM6,%ZMM6 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPMULLQ %ZMM7,%ZMM8,%ZMM7 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPSRLQ $0x3,%ZMM9,%ZMM8 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPADDQ %ZMM21,%ZMM8,%ZMM8 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4347ad <_Z14generate_chunkiR16global_variables.extracted+0x77d> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV -0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x218(%RDI),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KXNORW %K0,%K0,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VXORPD %XMM4,%XMM4,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VGATHERQPD (%RAX,%ZMM1,8),%ZMM4{%K1} | 5 | 1 | 0 | 2.67 | 2.67 | 0 | 2 | 0 | 0 | 0 | 0 | 0 | 2.67 | 0-29 | 2.67 |
MOV 0x238(%RDI),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VSUBPD %ZMM3,%ZMM4,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPSLLQ $0x20,%ZMM0,%ZMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPSRAQ $0x20,%ZMM5,%ZMM9 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
KXNORW %K0,%K0,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VPXOR %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VGATHERQPD (%RAX,%ZMM9,8),%ZMM0{%K1} | 5 | 1 | 0 | 2.67 | 2.67 | 0 | 2 | 0 | 0 | 0 | 0 | 0 | 2.67 | 0-29 | 2.67 |
VMULPD %ZMM3,%ZMM3,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VSUBPD %ZMM2,%ZMM0,%ZMM0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VFMADD213PD %ZMM3,%ZMM0,%ZMM0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VSQRTPD %ZMM0,%ZMM0 | 3 | 2.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 23-32 | 18 |
MOV -0x88(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD (%RAX,%R15,8),%ZMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VCMPPD $0x2,%ZMM2,%ZMM0,%K1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434210 <_Z14generate_chunkiR16global_variables.extracted+0x1e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VCMPPD $0x2,%ZMM2,%ZMM0,%K2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KORTESTB %K2,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434e52 <_Z14generate_chunkiR16global_variables.extracted+0xe22> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K2,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434e5d <_Z14generate_chunkiR16global_variables.extracted+0xe2d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0x40(%RDI),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K2,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434e68 <_Z14generate_chunkiR16global_variables.extracted+0xe38> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0x30(%RDI),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K2,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434e74 <_Z14generate_chunkiR16global_variables.extracted+0xe44> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD (%RAX,%R15,8),%XMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %XMM4,%ZMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPMULLQ %ZMM9,%ZMM4,%ZMM4 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPBROADCASTQ %XMM3,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %ZMM4,%ZMM1,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPSLLQ $0x3,%ZMM4,%ZMM4 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPADDQ %ZMM4,%ZMM3,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VBROADCASTSD %XMM6,%ZMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KMOVQ %K2,%K3 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
VSCATTERQPD %ZMM4,(,%ZMM3,1){%K3} | 20 | 2.20 | 0.20 | 0 | 0 | 4 | 0.20 | 0.20 | 4 | 4 | 4 | 0.20 | 0 | 2-12 | 7 |
KORTESTB %K2,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434ebd <_Z14generate_chunkiR16global_variables.extracted+0xe8d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K2,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434ec8 <_Z14generate_chunkiR16global_variables.extracted+0xe98> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0x10(%RDI),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K2,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434ed2 <_Z14generate_chunkiR16global_variables.extracted+0xea2> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ (%RDI),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K2,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434ede <_Z14generate_chunkiR16global_variables.extracted+0xeae> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD (%RAX,%R15,8),%XMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %XMM4,%ZMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPMULLQ %ZMM9,%ZMM4,%ZMM4 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPBROADCASTQ %XMM3,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %ZMM4,%ZMM1,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPSLLQ $0x3,%ZMM4,%ZMM4 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPADDQ %ZMM4,%ZMM3,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VBROADCASTSD %XMM6,%ZMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KMOVQ %K2,%K3 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
VSCATTERQPD %ZMM4,(,%ZMM3,1){%K3} | 20 | 2.20 | 0.20 | 0 | 0 | 4 | 0.20 | 0.20 | 4 | 4 | 4 | 0.20 | 0 | 2-12 | 7 |
KORTESTB %K2,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434f27 <_Z14generate_chunkiR16global_variables.extracted+0xef7> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K2,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434f35 <_Z14generate_chunkiR16global_variables.extracted+0xf05> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0xb8(%RDI),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K2,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434f42 <_Z14generate_chunkiR16global_variables.extracted+0xf12> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xa8(%RDI),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K2,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434f50 <_Z14generate_chunkiR16global_variables.extracted+0xf20> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x50(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RDX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K2,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434f5e <_Z14generate_chunkiR16global_variables.extracted+0xf2e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0xe8(%RDI),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K2,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434f6b <_Z14generate_chunkiR16global_variables.extracted+0xf3b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xd8(%RDI),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %XMM3,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %RCX,%ZMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %XMM4,%ZMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %R8,%ZMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %ZMM20,%ZMM5,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPSRAQ $0x20,%ZMM5,%ZMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPSUBQ %ZMM21,%ZMM5,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.50 |
VPSUBQ %ZMM21,%ZMM9,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.50 |
VPMAXSQ %ZMM6,%ZMM5,%ZMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQA64 %ZMM9,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.17 |
VPTERNLOGQ $0xf,%ZMM9,%ZMM9,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %ZMM6,%ZMM5,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPMOVQD %ZMM1,%YMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPCMPEQD %YMM7,%YMM7,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPSUBD %YMM7,%YMM6,%YMM7 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.33 |
VPMAXSD %YMM6,%YMM7,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPSUBD %YMM6,%YMM7,%YMM7 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.33 |
VPMOVZXDQ %YMM7,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPSUBQ %ZMM21,%ZMM6,%ZMM11 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.50 |
VPCMPNLEUD %YMM25,%YMM7,%K0 | |||||||||||||||
KMOVW %K0,-0x2a(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VPANDQ %ZMM26,%ZMM11,%ZMM7 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPCMPLEUQ %ZMM6,%ZMM7,%K0 | |||||||||||||||
VPMULLQ %ZMM9,%ZMM8,%ZMM8 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPMULLQ %ZMM9,%ZMM10,%ZMM9 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPSRLQ $0x3,%ZMM11,%ZMM10 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPADDQ %ZMM21,%ZMM10,%ZMM10 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 43502d <_Z14generate_chunkiR16global_variables.extracted+0xffd> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
VPANDQ %ZMM23,%ZMM6,%ZMM7 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPCMPLTUQ %ZMM6,%ZMM7,%K1{%K1} | |||||||||||||||
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434210 <_Z14generate_chunkiR16global_variables.extracted+0x1e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 43547f <_Z14generate_chunkiR16global_variables.extracted+0x144f> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD (%RAX,%R15,8),%XMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPXOR %XMM8,%XMM8,%XMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPMULLQ %ZMM0,%ZMM5,%ZMM8 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPMULLQ %ZMM5,%ZMM7,%ZMM5 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPADDQ %ZMM8,%ZMM1,%ZMM8 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %ZMM5,%ZMM8,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPSLLQ $0x3,%ZMM5,%ZMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPADDQ %ZMM5,%ZMM4,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VBROADCASTSD %XMM6,%ZMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
VSCATTERQPD %ZMM5,(,%ZMM4,1){%K2} | 20 | 2.20 | 0.20 | 0 | 0 | 4 | 0.20 | 0.20 | 4 | 4 | 4 | 0.20 | 0 | 2-12 | 7 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4354cb <_Z14generate_chunkiR16global_variables.extracted+0x149b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD (%RCX,%R15,8),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPMULLQ %ZMM0,%ZMM3,%ZMM0 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPMULLQ %ZMM3,%ZMM7,%ZMM3 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPADDQ %ZMM0,%ZMM1,%ZMM0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %ZMM3,%ZMM0,%ZMM0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPSLLQ $0x3,%ZMM0,%ZMM0 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPADDQ %ZMM0,%ZMM2,%ZMM0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VBROADCASTSD %XMM5,%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
VSCATTERQPD %ZMM1,(,%ZMM0,1){%K2} | 20 | 2.20 | 0.20 | 0 | 0 | 4 | 0.20 | 0.20 | 4 | 4 | 4 | 0.20 | 0 | 2-12 | 7 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 435512 <_Z14generate_chunkiR16global_variables.extracted+0x14e2> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD (%RAX,%R15,8),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPADDQ %ZMM24,%ZMM4,%ZMM2 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VBROADCASTSD %XMM1,%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
VSCATTERQPD %ZMM1,(,%ZMM2,1){%K2} | 20 | 2.20 | 0.20 | 0 | 0 | 4 | 0.20 | 0.20 | 4 | 4 | 4 | 0.20 | 0 | 2-12 | 7 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4341f6 <_Z14generate_chunkiR16global_variables.extracted+0x1c6> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD (%RCX,%R15,8),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4341f6 <_Z14generate_chunkiR16global_variables.extracted+0x1c6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
Function | _Z14generate_chunkiR16global_variables.extracted |
Source file and lines | generate_chunk.cpp:85-123 |
Module | exec |
nb instructions | 438 |
nb uops | 725 |
loop length | 2250 |
used x86 registers | 12 |
used mmx registers | 0 |
used xmm registers | 8 |
used ymm registers | 5 |
used zmm registers | 21 |
nb stack references | 11 |
ADD-SUB / MUL ratio | 2.00 |
micro-operation queue | 120.83 cycles |
front end | 120.83 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 151.50 | 12.40 | 49.00 | 49.00 | 41.50 | 151.50 | 67.00 | 41.50 | 41.50 | 41.50 | 12.60 | 49.00 |
cycles | 151.50 | 12.40 | 49.00 | 49.00 | 41.50 | 151.50 | 67.00 | 41.50 | 41.50 | 41.50 | 12.60 | 49.00 |
Cycles executing div or sqrt instructions | 18.00 |
FE+BE cycles | 160.63-248.42 |
Stall cycles | 60.67-148.42 |
ROB full (events) | 4.97-134.53 |
RS full (events) | 119.88-36.91 |
Front-end | 120.83 |
Dispatch | 151.50 |
DIV/SQRT | 18.00 |
Overall L1 | 151.50 |
all | 67% |
load | 4% |
store | NA (no store vectorizable/vectorized instructions) |
mul | 100% |
add-sub | 97% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 62% |
all | 56% |
load | 34% |
store | 100% |
mul | 100% |
add-sub | 100% |
fma | 100% |
div/sqrt | 100% |
other | 57% |
all | 65% |
load | 19% |
store | 100% |
mul | 100% |
add-sub | 98% |
fma | 100% |
div/sqrt | 100% |
other | 61% |
all | 65% |
load | 16% |
store | NA (no store vectorizable/vectorized instructions) |
mul | 100% |
add-sub | 93% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 57% |
all | 57% |
load | 42% |
store | 100% |
mul | 100% |
add-sub | 100% |
fma | 100% |
div/sqrt | 100% |
other | 53% |
all | 63% |
load | 29% |
store | 100% |
mul | 100% |
add-sub | 93% |
fma | 100% |
div/sqrt | 100% |
other | 56% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
VPADDQ %ZMM24,%ZMM0,%ZMM0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VBROADCASTSD %XMM1,%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VSCATTERQPD %ZMM1,(,%ZMM0,1){%K1} | 20 | 2.20 | 0.20 | 0 | 0 | 4 | 0.20 | 0.20 | 4 | 4 | 4 | 0.20 | 0 | 2-12 | 7 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPADDQ %ZMM24,%ZMM19,%ZMM19 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD $0x8,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %R12,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 435543 <_Z14generate_chunkiR16global_variables.extracted+0x1513> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VPADDQ %ZMM19,%ZMM18,%ZMM16 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSXD %R13D,%RAX | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
VPBROADCASTQ %RAX,%ZMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQA64 %ZMM16,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.17 |
VMOVDQA64 %ZMM17,%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.17 |
LEA 0x2756b(%RIP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL %RAX | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 2.14 |
VPXOR %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPMULLQ %ZMM17,%ZMM0,%ZMM1 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPSUBQ %ZMM1,%ZMM16,%ZMM1 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.50 |
MOV -0x98(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD (%RAX,%R15,8),%ZMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
MOV -0x90(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD (%RAX,%R15,8),%ZMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
CMP $0x2,%R14D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 434540 <_Z14generate_chunkiR16global_variables.extracted+0x510> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP $0x1,%R14D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 434210 <_Z14generate_chunkiR16global_variables.extracted+0x1e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x258(%RDX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPMOVQD %ZMM1,%YMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPCMPEQD %YMM5,%YMM5,%YMM5 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPSUBD %YMM5,%YMM4,%YMM4 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.33 |
KXNORW %K0,%K0,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VPXOR %XMM5,%XMM5,%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VGATHERDPD (%RAX,%YMM4,8),%ZMM5{%K1} | 5 | 1 | 0 | 2.67 | 2.67 | 0 | 2 | 0 | 0 | 0 | 0 | 0 | 2.67 | 0-29 | 2.67 |
VCMPPD $0x2,%ZMM5,%ZMM3,%K1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434210 <_Z14generate_chunkiR16global_variables.extracted+0x1e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JE 4342c9 <_Z14generate_chunkiR16global_variables.extracted+0x299> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x80(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RCX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4342d5 <_Z14generate_chunkiR16global_variables.extracted+0x2a5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD (%RCX,%R15,8),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
VXORPD %XMM4,%XMM4,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VGATHERQPD (%RAX,%ZMM1,8),%ZMM4{%K2} | 5 | 1 | 0 | 2.67 | 2.67 | 0 | 2 | 0 | 0 | 0 | 0 | 0 | 2.67 | 0-29 | 2.67 |
VBROADCASTSD %XMM3,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VCMPPD $0x1,%ZMM3,%ZMM4,%K1{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434210 <_Z14generate_chunkiR16global_variables.extracted+0x1e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 43430a <_Z14generate_chunkiR16global_variables.extracted+0x2da> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0x278(%RDX),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPSLLQ $0x20,%ZMM0,%ZMM0 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPADDQ %ZMM20,%ZMM0,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPSRAQ $0x20,%ZMM4,%ZMM6 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VMOVQ %XMM3,%RAX | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
VPXOR %XMM4,%XMM4,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VGATHERQPD (%RAX,%ZMM6,8),%ZMM4{%K2} | 5 | 1 | 0 | 2.67 | 2.67 | 0 | 2 | 0 | 0 | 0 | 0 | 0 | 2.67 | 0-29 | 2.67 |
VCMPPD $0x2,%ZMM4,%ZMM2,%K1{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434210 <_Z14generate_chunkiR16global_variables.extracted+0x1e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JE 43434e <_Z14generate_chunkiR16global_variables.extracted+0x31e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x78(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 43435a <_Z14generate_chunkiR16global_variables.extracted+0x32a> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD (%RAX,%R15,8),%XMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %XMM3,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPSRAQ $0x1d,%ZMM0,%ZMM4 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPADDQ %ZMM4,%ZMM3,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
VPXOR %XMM4,%XMM4,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VGATHERQPD (,%ZMM3,1),%ZMM4{%K2} | 5 | 1 | 0 | 2.67 | 2.67 | 0 | 2 | 0 | 0 | 0 | 0 | 0 | 2.67 | 0-29 | 2.67 |
VBROADCASTSD %XMM2,%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VCMPPD $0x1,%ZMM2,%ZMM4,%K1{%K1} | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434210 <_Z14generate_chunkiR16global_variables.extracted+0x1e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JE 4343a2 <_Z14generate_chunkiR16global_variables.extracted+0x372> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4343ad <_Z14generate_chunkiR16global_variables.extracted+0x37d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0x40(%RDX),%XMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4343b8 <_Z14generate_chunkiR16global_variables.extracted+0x388> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0x30(%RDX),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4343c4 <_Z14generate_chunkiR16global_variables.extracted+0x394> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD (%RAX,%R15,8),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPSRAQ $0x20,%ZMM0,%ZMM0 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPBROADCASTQ %XMM3,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPMULLQ %ZMM0,%ZMM3,%ZMM3 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPBROADCASTQ %XMM2,%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %ZMM3,%ZMM1,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPSLLQ $0x3,%ZMM3,%ZMM3 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPADDQ %ZMM3,%ZMM2,%ZMM2 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VBROADCASTSD %XMM4,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
VSCATTERQPD %ZMM3,(,%ZMM2,1){%K2} | 20 | 2.20 | 0.20 | 0 | 0 | 4 | 0.20 | 0.20 | 4 | 4 | 4 | 0.20 | 0 | 2-12 | 7 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434414 <_Z14generate_chunkiR16global_variables.extracted+0x3e4> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 43441f <_Z14generate_chunkiR16global_variables.extracted+0x3ef> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0x10(%RDX),%XMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434429 <_Z14generate_chunkiR16global_variables.extracted+0x3f9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ (%RDX),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434435 <_Z14generate_chunkiR16global_variables.extracted+0x405> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD (%RAX,%R15,8),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %XMM3,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPMULLQ %ZMM0,%ZMM3,%ZMM3 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPBROADCASTQ %XMM2,%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %ZMM3,%ZMM1,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPSLLQ $0x3,%ZMM3,%ZMM3 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPADDQ %ZMM3,%ZMM2,%ZMM2 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VBROADCASTSD %XMM4,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
VSCATTERQPD %ZMM3,(,%ZMM2,1){%K2} | 20 | 2.20 | 0.20 | 0 | 0 | 4 | 0.20 | 0.20 | 4 | 4 | 4 | 0.20 | 0 | 2-12 | 7 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 43447e <_Z14generate_chunkiR16global_variables.extracted+0x44e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 43448c <_Z14generate_chunkiR16global_variables.extracted+0x45c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0xb8(%RDX),%XMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434499 <_Z14generate_chunkiR16global_variables.extracted+0x469> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xa8(%RDX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4344a7 <_Z14generate_chunkiR16global_variables.extracted+0x477> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x50(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RCX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4344b5 <_Z14generate_chunkiR16global_variables.extracted+0x485> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0xe8(%RDX),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4344c2 <_Z14generate_chunkiR16global_variables.extracted+0x492> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xd8(%RDX),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %XMM2,%ZMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %RDI,%ZMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %XMM3,%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %R8,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPSUBQ %ZMM21,%ZMM6,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.50 |
VPSUBQ %ZMM21,%ZMM0,%ZMM7 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.50 |
VPMAXSQ %ZMM7,%ZMM6,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPSUBQ %ZMM0,%ZMM6,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.50 |
VPCMPNLEUQ 0x38b2b(%RIP){1to0},%ZMM6,%K0 | |||||||||||||||
KANDB %K0,%K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
KORTESTB %K2,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 43545c <_Z14generate_chunkiR16global_variables.extracted+0x142c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VPSRLQ $0x1,%ZMM6,%ZMM7 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPADDQ %ZMM21,%ZMM7,%ZMM7 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPMULLQ %ZMM0,%ZMM5,%ZMM8 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPMULLQ %ZMM0,%ZMM3,%ZMM9 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPADDQ %ZMM5,%ZMM1,%ZMM10 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %ZMM3,%ZMM1,%ZMM11 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 434bf4 <_Z14generate_chunkiR16global_variables.extracted+0xbc4> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
JE 434dbb <_Z14generate_chunkiR16global_variables.extracted+0xd8b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP $0x3,%R14D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 434210 <_Z14generate_chunkiR16global_variables.extracted+0x1e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x258(%RDI),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KXNORW %K0,%K0,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VXORPD %XMM4,%XMM4,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VGATHERQPD (%RAX,%ZMM1,8),%ZMM4{%K1} | 5 | 1 | 0 | 2.67 | 2.67 | 0 | 2 | 0 | 0 | 0 | 0 | 0 | 2.67 | 0-29 | 2.67 |
VCMPPD $0,%ZMM3,%ZMM4,%K1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434210 <_Z14generate_chunkiR16global_variables.extracted+0x1e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JE 434588 <_Z14generate_chunkiR16global_variables.extracted+0x558> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0x278(%RDI),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVQ %XMM3,%RAX | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VPSLLQ $0x20,%ZMM0,%ZMM3 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPSRAQ $0x1d,%ZMM3,%ZMM0 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
VXORPD %XMM4,%XMM4,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VGATHERQPD (%RAX,%ZMM0,1),%ZMM4{%K2} | 5 | 1 | 0 | 2.67 | 2.67 | 0 | 2 | 0 | 0 | 0 | 0 | 0 | 2.67 | 0-29 | 2.67 |
VCMPPD $0,%ZMM2,%ZMM4,%K0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KANDB %K0,%K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434210 <_Z14generate_chunkiR16global_variables.extracted+0x1e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JE 4345ca <_Z14generate_chunkiR16global_variables.extracted+0x59a> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4345d5 <_Z14generate_chunkiR16global_variables.extracted+0x5a5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0x40(%RDI),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4345e0 <_Z14generate_chunkiR16global_variables.extracted+0x5b0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0x30(%RDI),%XMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4345ec <_Z14generate_chunkiR16global_variables.extracted+0x5bc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD (%RAX,%R15,8),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPSRAQ $0x20,%ZMM3,%ZMM7 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPBROADCASTQ %XMM2,%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPMULLQ %ZMM7,%ZMM2,%ZMM2 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPBROADCASTQ %XMM0,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %ZMM2,%ZMM1,%ZMM2 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPSLLQ $0x3,%ZMM2,%ZMM2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPADDQ %ZMM2,%ZMM0,%ZMM0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VBROADCASTSD %XMM4,%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
VSCATTERQPD %ZMM2,(,%ZMM0,1){%K2} | 20 | 2.20 | 0.20 | 0 | 0 | 4 | 0.20 | 0.20 | 4 | 4 | 4 | 0.20 | 0 | 2-12 | 7 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 43463c <_Z14generate_chunkiR16global_variables.extracted+0x60c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434647 <_Z14generate_chunkiR16global_variables.extracted+0x617> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0x10(%RDI),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434651 <_Z14generate_chunkiR16global_variables.extracted+0x621> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ (%RDI),%XMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 43465d <_Z14generate_chunkiR16global_variables.extracted+0x62d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD (%RAX,%R15,8),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %XMM2,%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPMULLQ %ZMM7,%ZMM2,%ZMM2 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPBROADCASTQ %XMM0,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %ZMM2,%ZMM1,%ZMM2 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPSLLQ $0x3,%ZMM2,%ZMM2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPADDQ %ZMM2,%ZMM0,%ZMM0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VBROADCASTSD %XMM4,%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
VSCATTERQPD %ZMM2,(,%ZMM0,1){%K2} | 20 | 2.20 | 0.20 | 0 | 0 | 4 | 0.20 | 0.20 | 4 | 4 | 4 | 0.20 | 0 | 2-12 | 7 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4346a6 <_Z14generate_chunkiR16global_variables.extracted+0x676> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4346b4 <_Z14generate_chunkiR16global_variables.extracted+0x684> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0xb8(%RDI),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4346c1 <_Z14generate_chunkiR16global_variables.extracted+0x691> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xa8(%RDI),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4346cf <_Z14generate_chunkiR16global_variables.extracted+0x69f> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x50(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RDX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4346dd <_Z14generate_chunkiR16global_variables.extracted+0x6ad> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0xe8(%RDI),%XMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4346ea <_Z14generate_chunkiR16global_variables.extracted+0x6ba> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xd8(%RDI),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %XMM0,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %RCX,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %XMM2,%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %R8,%ZMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %ZMM20,%ZMM3,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPSRAQ $0x20,%ZMM3,%ZMM3 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPSUBQ %ZMM21,%ZMM3,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.50 |
VPSUBQ %ZMM21,%ZMM7,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.50 |
VPMAXSQ %ZMM4,%ZMM3,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQA64 %ZMM7,%ZMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.17 |
VPTERNLOGQ $0xf,%ZMM7,%ZMM7,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %ZMM4,%ZMM3,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPMOVQD %ZMM1,%YMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPCMPEQD %YMM5,%YMM5,%YMM5 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPSUBD %YMM5,%YMM4,%YMM5 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.33 |
VPMAXSD %YMM4,%YMM5,%YMM5 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPSUBD %YMM4,%YMM5,%YMM5 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.33 |
VPMOVZXDQ %YMM5,%ZMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPSUBQ %ZMM21,%ZMM4,%ZMM9 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.50 |
VPCMPNLEUD %YMM25,%YMM5,%K2 | |||||||||||||||
KMOVW %K2,-0x2a(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VPANDQ %ZMM26,%ZMM9,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPCMPLEUQ %ZMM4,%ZMM5,%K3 | |||||||||||||||
VPMULLQ %ZMM7,%ZMM6,%ZMM6 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPMULLQ %ZMM7,%ZMM8,%ZMM7 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPSRLQ $0x3,%ZMM9,%ZMM8 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPADDQ %ZMM21,%ZMM8,%ZMM8 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4347ad <_Z14generate_chunkiR16global_variables.extracted+0x77d> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV -0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x218(%RDI),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KXNORW %K0,%K0,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VXORPD %XMM4,%XMM4,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VGATHERQPD (%RAX,%ZMM1,8),%ZMM4{%K1} | 5 | 1 | 0 | 2.67 | 2.67 | 0 | 2 | 0 | 0 | 0 | 0 | 0 | 2.67 | 0-29 | 2.67 |
MOV 0x238(%RDI),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VSUBPD %ZMM3,%ZMM4,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPSLLQ $0x20,%ZMM0,%ZMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPSRAQ $0x20,%ZMM5,%ZMM9 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
KXNORW %K0,%K0,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VPXOR %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VGATHERQPD (%RAX,%ZMM9,8),%ZMM0{%K1} | 5 | 1 | 0 | 2.67 | 2.67 | 0 | 2 | 0 | 0 | 0 | 0 | 0 | 2.67 | 0-29 | 2.67 |
VMULPD %ZMM3,%ZMM3,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VSUBPD %ZMM2,%ZMM0,%ZMM0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VFMADD213PD %ZMM3,%ZMM0,%ZMM0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VSQRTPD %ZMM0,%ZMM0 | 3 | 2.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 23-32 | 18 |
MOV -0x88(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD (%RAX,%R15,8),%ZMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VCMPPD $0x2,%ZMM2,%ZMM0,%K1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434210 <_Z14generate_chunkiR16global_variables.extracted+0x1e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VCMPPD $0x2,%ZMM2,%ZMM0,%K2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KORTESTB %K2,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434e52 <_Z14generate_chunkiR16global_variables.extracted+0xe22> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K2,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434e5d <_Z14generate_chunkiR16global_variables.extracted+0xe2d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0x40(%RDI),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K2,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434e68 <_Z14generate_chunkiR16global_variables.extracted+0xe38> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0x30(%RDI),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K2,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434e74 <_Z14generate_chunkiR16global_variables.extracted+0xe44> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD (%RAX,%R15,8),%XMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %XMM4,%ZMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPMULLQ %ZMM9,%ZMM4,%ZMM4 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPBROADCASTQ %XMM3,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %ZMM4,%ZMM1,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPSLLQ $0x3,%ZMM4,%ZMM4 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPADDQ %ZMM4,%ZMM3,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VBROADCASTSD %XMM6,%ZMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KMOVQ %K2,%K3 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
VSCATTERQPD %ZMM4,(,%ZMM3,1){%K3} | 20 | 2.20 | 0.20 | 0 | 0 | 4 | 0.20 | 0.20 | 4 | 4 | 4 | 0.20 | 0 | 2-12 | 7 |
KORTESTB %K2,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434ebd <_Z14generate_chunkiR16global_variables.extracted+0xe8d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K2,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434ec8 <_Z14generate_chunkiR16global_variables.extracted+0xe98> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0x10(%RDI),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K2,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434ed2 <_Z14generate_chunkiR16global_variables.extracted+0xea2> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ (%RDI),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K2,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434ede <_Z14generate_chunkiR16global_variables.extracted+0xeae> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD (%RAX,%R15,8),%XMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %XMM4,%ZMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPMULLQ %ZMM9,%ZMM4,%ZMM4 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPBROADCASTQ %XMM3,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %ZMM4,%ZMM1,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPSLLQ $0x3,%ZMM4,%ZMM4 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPADDQ %ZMM4,%ZMM3,%ZMM3 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VBROADCASTSD %XMM6,%ZMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KMOVQ %K2,%K3 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
VSCATTERQPD %ZMM4,(,%ZMM3,1){%K3} | 20 | 2.20 | 0.20 | 0 | 0 | 4 | 0.20 | 0.20 | 4 | 4 | 4 | 0.20 | 0 | 2-12 | 7 |
KORTESTB %K2,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434f27 <_Z14generate_chunkiR16global_variables.extracted+0xef7> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K2,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434f35 <_Z14generate_chunkiR16global_variables.extracted+0xf05> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0xb8(%RDI),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K2,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434f42 <_Z14generate_chunkiR16global_variables.extracted+0xf12> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xa8(%RDI),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K2,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434f50 <_Z14generate_chunkiR16global_variables.extracted+0xf20> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x50(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RDX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K2,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434f5e <_Z14generate_chunkiR16global_variables.extracted+0xf2e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ 0xe8(%RDI),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K2,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434f6b <_Z14generate_chunkiR16global_variables.extracted+0xf3b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xd8(%RDI),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %XMM3,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %RCX,%ZMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %XMM4,%ZMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %R8,%ZMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %ZMM20,%ZMM5,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPSRAQ $0x20,%ZMM5,%ZMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPSUBQ %ZMM21,%ZMM5,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.50 |
VPSUBQ %ZMM21,%ZMM9,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.50 |
VPMAXSQ %ZMM6,%ZMM5,%ZMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQA64 %ZMM9,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.17 |
VPTERNLOGQ $0xf,%ZMM9,%ZMM9,%ZMM6 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %ZMM6,%ZMM5,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPMOVQD %ZMM1,%YMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPCMPEQD %YMM7,%YMM7,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPSUBD %YMM7,%YMM6,%YMM7 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.33 |
VPMAXSD %YMM6,%YMM7,%YMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPSUBD %YMM6,%YMM7,%YMM7 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.33 |
VPMOVZXDQ %YMM7,%ZMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPSUBQ %ZMM21,%ZMM6,%ZMM11 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.50 |
VPCMPNLEUD %YMM25,%YMM7,%K0 | |||||||||||||||
KMOVW %K0,-0x2a(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 |
VPANDQ %ZMM26,%ZMM11,%ZMM7 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPCMPLEUQ %ZMM6,%ZMM7,%K0 | |||||||||||||||
VPMULLQ %ZMM9,%ZMM8,%ZMM8 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPMULLQ %ZMM9,%ZMM10,%ZMM9 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPSRLQ $0x3,%ZMM11,%ZMM10 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPADDQ %ZMM21,%ZMM10,%ZMM10 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 43502d <_Z14generate_chunkiR16global_variables.extracted+0xffd> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
VPANDQ %ZMM23,%ZMM6,%ZMM7 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPCMPLTUQ %ZMM6,%ZMM7,%K1{%K1} | |||||||||||||||
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 434210 <_Z14generate_chunkiR16global_variables.extracted+0x1e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 43547f <_Z14generate_chunkiR16global_variables.extracted+0x144f> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD (%RAX,%R15,8),%XMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPXOR %XMM8,%XMM8,%XMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPMULLQ %ZMM0,%ZMM5,%ZMM8 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPMULLQ %ZMM5,%ZMM7,%ZMM5 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPADDQ %ZMM8,%ZMM1,%ZMM8 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %ZMM5,%ZMM8,%ZMM5 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPSLLQ $0x3,%ZMM5,%ZMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPADDQ %ZMM5,%ZMM4,%ZMM4 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VBROADCASTSD %XMM6,%ZMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
VSCATTERQPD %ZMM5,(,%ZMM4,1){%K2} | 20 | 2.20 | 0.20 | 0 | 0 | 4 | 0.20 | 0.20 | 4 | 4 | 4 | 0.20 | 0 | 2-12 | 7 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4354cb <_Z14generate_chunkiR16global_variables.extracted+0x149b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD (%RCX,%R15,8),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPMULLQ %ZMM0,%ZMM3,%ZMM0 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPMULLQ %ZMM3,%ZMM7,%ZMM3 | 5 | 1.50 | 0 | 0 | 0 | 0 | 1.50 | 0 | 0 | 0 | 0 | 0 | 0 | 15 | 1.50 |
VPADDQ %ZMM0,%ZMM1,%ZMM0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %ZMM3,%ZMM0,%ZMM0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPSLLQ $0x3,%ZMM0,%ZMM0 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2-4 | 1 |
VPADDQ %ZMM0,%ZMM2,%ZMM0 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VBROADCASTSD %XMM5,%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
VSCATTERQPD %ZMM1,(,%ZMM0,1){%K2} | 20 | 2.20 | 0.20 | 0 | 0 | 4 | 0.20 | 0.20 | 4 | 4 | 4 | 0.20 | 0 | 2-12 | 7 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 435512 <_Z14generate_chunkiR16global_variables.extracted+0x14e2> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD (%RAX,%R15,8),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPADDQ %ZMM24,%ZMM4,%ZMM2 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VBROADCASTSD %XMM1,%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
KMOVQ %K1,%K2 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
VSCATTERQPD %ZMM1,(,%ZMM2,1){%K2} | 20 | 2.20 | 0.20 | 0 | 0 | 4 | 0.20 | 0.20 | 4 | 4 | 4 | 0.20 | 0 | 2-12 | 7 |
KORTESTB %K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 4341f6 <_Z14generate_chunkiR16global_variables.extracted+0x1c6> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD (%RCX,%R15,8),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4341f6 <_Z14generate_chunkiR16global_variables.extracted+0x1c6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |