Function: qmcplusplus::BsplineFunctor<double>::evaluateVGL(int, int, int, double const*, double*, do ... | Module: exec | Source: BsplineFunctor.h:276-339 [...] | Coverage: 0.65% |
---|
Function: qmcplusplus::BsplineFunctor<double>::evaluateVGL(int, int, int, double const*, double*, do ... | Module: exec | Source: BsplineFunctor.h:276-339 [...] | Coverage: 0.65% |
---|
/scratch_na/users/xoserete/qaas_runs/171-417-8059/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/Jastrow/BsplineFunctor.h: 276 - 339 |
-------------------------------------------------------------------------------- |
276: real_type dSquareDeltaRinv = DeltaRInv * DeltaRInv; |
[...] |
284: int iLimit = iEnd - iStart; |
285: const real_type* distArray = _distArray + iStart; |
[...] |
291: for (int jat = 0; jat < iLimit; jat++) |
292: { |
293: real_type r = distArray[jat]; |
294: if (r < cutoff_radius && iStart + jat != iat) |
295: { |
296: distIndices[iCount] = jat; |
297: distArrayCompressed[iCount] = r; |
298: iCount++; |
299: } |
300: } |
301: |
302: #pragma omp simd |
303: for (int j = 0; j < iCount; j++) |
304: { |
305: real_type r = distArrayCompressed[j]; |
306: int iScatter = distIndices[j]; |
307: real_type rinv = cOne / r; |
308: r *= DeltaRInv; |
309: int iGather = (int)r; |
310: real_type t = r - real_type(iGather); |
311: real_type tp0 = t * t * t; |
312: real_type tp1 = t * t; |
313: real_type tp2 = t; |
314: |
315: real_type sCoef0 = SplineCoefs[iGather + 0]; |
316: real_type sCoef1 = SplineCoefs[iGather + 1]; |
317: real_type sCoef2 = SplineCoefs[iGather + 2]; |
318: real_type sCoef3 = SplineCoefs[iGather + 3]; |
319: |
320: // clang-format off |
321: laplArray[iScatter] = dSquareDeltaRinv * |
322: (sCoef0*( d2A[ 2]*tp2 + d2A[ 3])+ |
323: sCoef1*( d2A[ 6]*tp2 + d2A[ 7])+ |
324: sCoef2*( d2A[10]*tp2 + d2A[11])+ |
325: sCoef3*( d2A[14]*tp2 + d2A[15])); |
326: |
327: gradArray[iScatter] = DeltaRInv * rinv * |
328: (sCoef0*( dA[ 1]*tp1 + dA[ 2]*tp2 + dA[ 3])+ |
329: sCoef1*( dA[ 5]*tp1 + dA[ 6]*tp2 + dA[ 7])+ |
330: sCoef2*( dA[ 9]*tp1 + dA[10]*tp2 + dA[11])+ |
331: sCoef3*( dA[13]*tp1 + dA[14]*tp2 + dA[15])); |
332: |
333: valArray[iScatter] = (sCoef0*(A[ 0]*tp0 + A[ 1]*tp1 + A[ 2]*tp2 + A[ 3])+ |
334: sCoef1*(A[ 4]*tp0 + A[ 5]*tp1 + A[ 6]*tp2 + A[ 7])+ |
335: sCoef2*(A[ 8]*tp0 + A[ 9]*tp1 + A[10]*tp2 + A[11])+ |
336: sCoef3*(A[12]*tp0 + A[13]*tp1 + A[14]*tp2 + A[15])); |
337: // clang-format on |
338: } |
339: } |
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/stl_vector.h: 951 - 951 |
-------------------------------------------------------------------------------- |
951: return *(this->_M_impl._M_start + __n); |
0x41c590 SUB %EDX,%ECX |
0x41c592 TEST %ECX,%ECX |
0x41c594 JLE 41d1a5 |
0x41c59a PUSH %RBP |
0x41c59b MOV %RSP,%RBP |
0x41c59e PUSH %R15 |
0x41c5a0 PUSH %R14 |
0x41c5a2 PUSH %R13 |
0x41c5a4 PUSH %R12 |
0x41c5a6 PUSH %RBX |
0x41c5a7 AND $-0x20,%RSP |
0x41c5ab SUB $0x6e0,%RSP |
0x41c5b2 MOV %R8,0x40(%RSP) |
0x41c5b7 MOV 0x28(%RBP),%RAX |
0x41c5bb MOV 0x20(%RBP),%R8 |
0x41c5bf MOVSXD %EDX,%R11 |
0x41c5c2 VMOVSD 0x8(%RDI),%XMM0 |
0x41c5c7 MOV %ECX,%R14D |
0x41c5ca XOR %EBX,%EBX |
0x41c5cc CMP $0x4,%ECX |
0x41c5cf JAE 41ce02 |
0x41c5d5 MOV %R14D,%ECX |
0x41c5d8 AND $-0x4,%ECX |
0x41c5db CMP %R14,%RCX |
0x41c5de JNE 41ceeb |
0x41c5e4 TEST %EBX,%EBX |
0x41c5e6 JLE 41d197 |
0x41c5ec VMOVSD 0x238(%RDI),%XMM3 |
0x41c5f4 MOV 0x18(%RBP),%RCX |
0x41c5f8 MOV 0x10(%RBP),%RDX |
0x41c5fc MOV 0x218(%RDI),%RSI |
0x41c603 VMOVSD 0x128(%RDI),%XMM11 |
0x41c60b VMOVSD 0x130(%RDI),%XMM0 |
0x41c613 VMOVUPS %XMM0,(%RSP) |
0x41c618 VMOVSD 0x148(%RDI),%XMM0 |
0x41c620 VMOVUPS %XMM0,0xf0(%RSP) |
0x41c629 VMOVSD 0x150(%RDI),%XMM0 |
0x41c631 VMOVSD 0x168(%RDI),%XMM2 |
0x41c639 VMOVQ 0x170(%RDI),%XMM13 |
0x41c641 VMOVSD 0x188(%RDI),%XMM14 |
0x41c649 VMOVSD 0x190(%RDI),%XMM4 |
0x41c651 VMOVUPD 0xa0(%RDI),%XMM5 |
0x41c659 VMOVSD 0xb0(%RDI),%XMM9 |
0x41c661 VMOVUPD 0xc0(%RDI),%XMM7 |
0x41c669 VMOVSD 0xd0(%RDI),%XMM8 |
0x41c671 VMOVUPS 0xe0(%RDI),%XMM1 |
0x41c679 VMOVUPS %YMM1,0x200(%RSP) |
0x41c682 VMOVSD 0xf0(%RDI),%XMM1 |
0x41c68a VMOVUPS %XMM1,0xd0(%RSP) |
0x41c693 VMOVUPS 0x100(%RDI),%XMM1 |
0x41c69b VMOVUPS %YMM1,0x1e0(%RSP) |
0x41c6a4 MOV %EBX,%R10D |
0x41c6a7 VMOVSD 0x110(%RDI),%XMM1 |
0x41c6af VMOVUPS %XMM1,0xc0(%RSP) |
0x41c6b8 VMOVSD 0x18(%RDI),%XMM1 |
0x41c6bd VMOVUPS %XMM1,0xb0(%RSP) |
0x41c6c6 VMOVUPS 0x20(%RDI),%XMM1 |
0x41c6cb VMOVUPS %YMM1,0x1c0(%RSP) |
0x41c6d4 VMOVSD 0x30(%RDI),%XMM1 |
0x41c6d9 VMOVUPS %XMM1,0xa0(%RSP) |
0x41c6e2 VMOVSD 0x38(%RDI),%XMM1 |
0x41c6e7 VMOVUPS %XMM1,0x20(%RSP) |
0x41c6ed VMOVUPD 0x40(%RDI),%XMM12 |
0x41c6f2 VMOVSD 0x50(%RDI),%XMM1 |
0x41c6f7 VMOVUPS %XMM1,0x10(%RSP) |
0x41c6fd VMOVSD 0x58(%RDI),%XMM1 |
0x41c702 VMOVUPS %XMM1,0x90(%RSP) |
0x41c70b VMOVUPD 0x60(%RDI),%XMM10 |
0x41c710 VMOVSD 0x70(%RDI),%XMM1 |
0x41c715 VMOVUPS %XMM1,0x80(%RSP) |
0x41c71e VMOVSD 0x78(%RDI),%XMM1 |
0x41c723 VMOVUPS %XMM1,0x70(%RSP) |
0x41c729 VMOVUPD 0x80(%RDI),%XMM15 |
0x41c731 VMOVSD 0x90(%RDI),%XMM1 |
0x41c739 MOV $-0x4,%EDI |
0x41c73e VMULSD %XMM3,%XMM3,%XMM6 |
0x41c742 AND %R10,%RDI |
0x41c745 VMOVUPD %XMM3,0xe0(%RSP) |
0x41c74e VMOVUPD %XMM11,0x100(%RSP) |
0x41c757 VMOVUPS %XMM0,0x190(%RSP) |
0x41c760 VMOVUPD %XMM2,0x180(%RSP) |
0x41c769 VMOVDQU %XMM13,0x170(%RSP) |
0x41c772 VMOVUPS %XMM14,0x160(%RSP) |
0x41c77b VMOVUPD %XMM4,0x150(%RSP) |
0x41c784 VMOVUPD %YMM5,0x6a0(%RSP) |
0x41c78d VMOVUPD %XMM9,0x140(%RSP) |
0x41c796 VMOVUPD %YMM7,0x680(%RSP) |
0x41c79f VMOVUPD %XMM8,0x130(%RSP) |
0x41c7a8 VMOVUPD %XMM1,0x120(%RSP) |
0x41c7b1 VMOVUPD %XMM6,0x110(%RSP) |
0x41c7ba JE 41cf2b |
0x41c7c0 MOV %R10,0x38(%RSP) |
0x41c7c5 VMOVUPD %YMM15,0x1a0(%RSP) |
0x41c7ce VBROADCASTSD %XMM3,%YMM15 |
0x41c7d3 VBROADCASTSD %XMM11,%YMM3 |
0x41c7d8 VMOVUPD %YMM3,0x620(%RSP) |
0x41c7e1 VMOVAPD %YMM10,%YMM3 |
0x41c7e5 VBROADCASTSD (%RSP),%YMM10 |
0x41c7eb VMOVUPS %YMM10,0x40(%RSP) |
0x41c7f1 VMOVAPD %XMM1,%XMM10 |
0x41c7f5 VBROADCASTSD 0xf0(%RSP),%YMM1 |
0x41c7ff VMOVUPS %YMM1,0x660(%RSP) |
0x41c808 VBROADCASTSD %XMM0,%YMM0 |
0x41c80d VMOVUPS %YMM0,0x640(%RSP) |
0x41c816 VBROADCASTSD %XMM2,%YMM0 |
0x41c81b VMOVUPD %YMM0,0x600(%RSP) |
0x41c824 VPBROADCASTQ %XMM13,%YMM0 |
0x41c829 VMOVDQU %YMM0,0x5e0(%RSP) |
0x41c832 VBROADCASTSD %XMM14,%YMM0 |
0x41c837 VMOVUPS %YMM0,0x5c0(%RSP) |
0x41c840 VBROADCASTSD %XMM4,%YMM0 |
0x41c845 VMOVUPD %YMM0,0x5a0(%RSP) |
0x41c84e VBROADCASTSD %XMM6,%YMM0 |
0x41c853 VMOVUPD %YMM0,0x580(%RSP) |
0x41c85c VBROADCASTSD %XMM5,%YMM0 |
0x41c861 VMOVUPD %YMM0,0x560(%RSP) |
0x41c86a VPERMPD $0x55,%YMM5,%YMM0 |
0x41c870 VMOVUPD %YMM0,0x540(%RSP) |
0x41c879 VBROADCASTSD %XMM9,%YMM0 |
0x41c87e VMOVUPD %YMM0,0x520(%RSP) |
0x41c887 VBROADCASTSD %XMM7,%YMM0 |
0x41c88c VMOVUPD %YMM0,0x500(%RSP) |
0x41c895 VPERMPD $0x55,%YMM7,%YMM0 |
0x41c89b VMOVUPD %YMM0,0x4e0(%RSP) |
0x41c8a4 VBROADCASTSD %XMM8,%YMM0 |
0x41c8a9 VMOVUPD %YMM0,0x4c0(%RSP) |
0x41c8b2 XOR %EBX,%EBX |
0x41c8b4 VMOVUPS 0x200(%RSP),%YMM1 |
0x41c8bd VBROADCASTSD %XMM1,%YMM0 |
0x41c8c2 VMOVUPS %YMM0,0x4a0(%RSP) |
0x41c8cb VPERMPD $0x55,%YMM1,%YMM0 |
0x41c8d1 VMOVUPS %YMM0,0x480(%RSP) |
0x41c8da VBROADCASTSD 0xd0(%RSP),%YMM0 |
0x41c8e4 VMOVUPS %YMM0,0x460(%RSP) |
0x41c8ed VMOVUPS 0x1e0(%RSP),%YMM1 |
0x41c8f6 VBROADCASTSD %XMM1,%YMM0 |
0x41c8fb VMOVUPS %YMM0,0x440(%RSP) |
0x41c904 VPERMPD $0x55,%YMM1,%YMM0 |
0x41c90a VMOVUPS %YMM0,0x420(%RSP) |
0x41c913 VBROADCASTSD 0xc0(%RSP),%YMM0 |
0x41c91d VMOVUPS %YMM0,0x400(%RSP) |
0x41c926 VBROADCASTSD 0xb0(%RSP),%YMM0 |
0x41c930 VMOVUPS %YMM0,0x3e0(%RSP) |
0x41c939 VMOVUPD 0x1c0(%RSP),%YMM1 |
0x41c942 VBROADCASTSD %XMM1,%YMM0 |
0x41c947 VMOVUPD %YMM0,0x3c0(%RSP) |
0x41c950 VPERMPD $0x55,%YMM1,%YMM0 |
0x41c956 VMOVUPD %YMM0,0x3a0(%RSP) |
0x41c95f VBROADCASTSD 0xa0(%RSP),%YMM0 |
0x41c969 VMOVUPS %YMM0,0x380(%RSP) |
0x41c972 VBROADCASTSD 0x20(%RSP),%YMM0 |
0x41c979 VMOVUPS %YMM0,0x360(%RSP) |
0x41c982 VBROADCASTSD %XMM12,%YMM0 |
0x41c987 VMOVUPD %YMM0,0x340(%RSP) |
0x41c990 VMOVUPD %YMM12,0x240(%RSP) |
0x41c999 VPERMPD $0x55,%YMM12,%YMM0 |
0x41c99f VMOVUPD %YMM0,0x320(%RSP) |
0x41c9a8 VBROADCASTSD 0x10(%RSP),%YMM0 |
0x41c9af VMOVUPS %YMM0,0x300(%RSP) |
0x41c9b8 VBROADCASTSD 0x90(%RSP),%YMM0 |
0x41c9c2 VMOVUPS %YMM0,0x2e0(%RSP) |
0x41c9cb VBROADCASTSD %XMM3,%YMM0 |
0x41c9d0 VMOVUPD %YMM0,0x2c0(%RSP) |
0x41c9d9 VMOVUPD %YMM3,0x220(%RSP) |
0x41c9e2 VPERMPD $0x55,%YMM3,%YMM0 |
0x41c9e8 VMOVUPD %YMM0,0x2a0(%RSP) |
0x41c9f1 VBROADCASTSD 0x80(%RSP),%YMM0 |
0x41c9fb VMOVUPS %YMM0,0x280(%RSP) |
0x41ca04 VBROADCASTSD 0x70(%RSP),%YMM0 |
0x41ca0b VMOVUPS %YMM0,0x260(%RSP) |
0x41ca14 VMOVUPD 0x1a0(%RSP),%YMM0 |
0x41ca1d VBROADCASTSD %XMM0,%YMM12 |
0x41ca22 VPERMPD $0x55,%YMM0,%YMM14 |
0x41ca28 VBROADCASTSD %XMM10,%YMM11 |
0x41ca2d VPBROADCASTQ 0xdb3ba(%RIP),%YMM13 |
0x41ca36 VPBROADCASTQ 0xdb3b9(%RIP),%YMM3 |
0x41ca3f VPBROADCASTQ 0xdb3b8(%RIP),%YMM6 |
0x41ca48 NOPL (%RAX,%RAX,1) |
(315) 0x41ca50 VMOVUPD (%R8,%RBX,8),%YMM10 |
(315) 0x41ca56 VMULPD %YMM15,%YMM10,%YMM2 |
(315) 0x41ca5b VCVTTPD2DQ %YMM2,%XMM1 |
(315) 0x41ca5f VPMOVSXDQ %XMM1,%YMM1 |
(315) 0x41ca64 VPSLLQ $0x3,%YMM1,%YMM1 |
(315) 0x41ca69 VMOVQ %RSI,%XMM4 |
(315) 0x41ca6e VPBROADCASTQ %XMM4,%YMM4 |
(315) 0x41ca73 VROUNDPD $0xb,%YMM2,%YMM5 |
(315) 0x41ca79 VPADDQ %YMM1,%YMM4,%YMM1 |
(315) 0x41ca7d VMOVQ %XMM1,%R14 |
(315) 0x41ca82 VEXTRACTI128 $0x1,%YMM1,%XMM8 |
(315) 0x41ca88 VSUBPD %YMM5,%YMM2,%YMM4 |
(315) 0x41ca8c VMOVQ %XMM8,%R15 |
(315) 0x41ca91 VMOVSD (%R15),%XMM2 |
(315) 0x41ca96 VPEXTRQ $0x1,%XMM1,%R15 |
(315) 0x41ca9c VMOVSD (%R14),%XMM5 |
(315) 0x41caa1 VPADDQ %YMM6,%YMM1,%YMM7 |
(315) 0x41caa5 VPEXTRQ $0x1,%XMM8,%R14 |
(315) 0x41caab VMOVQ %XMM7,%R12 |
(315) 0x41cab0 VEXTRACTI128 $0x1,%YMM7,%XMM8 |
(315) 0x41cab6 VPEXTRQ $0x1,%XMM7,%R13 |
(315) 0x41cabc VPEXTRQ $0x1,%XMM8,%R10 |
(315) 0x41cac2 VMOVHPD (%R15),%XMM5,%XMM7 |
(315) 0x41cac7 VMOVQ %XMM8,%R15 |
(315) 0x41cacc VMOVSD (%R15),%XMM5 |
(315) 0x41cad1 VMOVHPD (%R14),%XMM2,%XMM2 |
(315) 0x41cad6 VMOVHPD (%R10),%XMM5,%XMM5 |
(315) 0x41cadb VMOVSD (%R12),%XMM8 |
(315) 0x41cae1 VINSERTF128 $0x1,%XMM2,%YMM7,%YMM2 |
(315) 0x41cae7 VMOVHPD (%R13),%XMM8,%XMM7 |
(315) 0x41caed VMOVAPD %YMM4,%YMM8 |
(315) 0x41caf1 VMOVAPD %YMM4,%YMM9 |
(315) 0x41caf5 VMOVUPD 0x540(%RSP),%YMM0 |
(315) 0x41cafe VFMADD132PD 0x560(%RSP),%YMM0,%YMM9 |
(315) 0x41cb08 VINSERTF128 $0x1,%XMM5,%YMM7,%YMM7 |
(315) 0x41cb0e VFMADD213PD 0x520(%RSP),%YMM4,%YMM9 |
(315) 0x41cb18 VMOVAPD %YMM4,%YMM5 |
(315) 0x41cb1c VMOVUPD 0x620(%RSP),%YMM0 |
(315) 0x41cb25 VFMADD213PD 0x40(%RSP),%YMM0,%YMM5 |
(315) 0x41cb2c VMOVUPD 0x640(%RSP),%YMM0 |
(315) 0x41cb35 VFMADD132PD 0x660(%RSP),%YMM0,%YMM8 |
(315) 0x41cb3f VMULPD %YMM2,%YMM5,%YMM5 |
(315) 0x41cb43 VFMADD213PD %YMM5,%YMM7,%YMM8 |
(315) 0x41cb48 VMOVAPD %YMM4,%YMM5 |
(315) 0x41cb4c VMOVUPD 0x4e0(%RSP),%YMM0 |
(315) 0x41cb55 VFMADD132PD 0x500(%RSP),%YMM0,%YMM5 |
(315) 0x41cb5f VFMADD213PD 0x4c0(%RSP),%YMM4,%YMM5 |
(315) 0x41cb69 VMULPD %YMM2,%YMM9,%YMM9 |
(315) 0x41cb6d VFMADD213PD %YMM9,%YMM7,%YMM5 |
(315) 0x41cb72 VMOVAPD %YMM4,%YMM9 |
(315) 0x41cb76 VMOVUPD 0x3c0(%RSP),%YMM0 |
(315) 0x41cb7f VFMADD132PD 0x3e0(%RSP),%YMM0,%YMM9 |
(315) 0x41cb89 VFMADD213PD 0x3a0(%RSP),%YMM4,%YMM9 |
(315) 0x41cb93 VFMADD213PD 0x380(%RSP),%YMM4,%YMM9 |
(315) 0x41cb9d VMULPD %YMM2,%YMM9,%YMM9 |
(315) 0x41cba1 VMOVAPD %YMM4,%YMM2 |
(315) 0x41cba5 VMOVUPD 0x340(%RSP),%YMM0 |
(315) 0x41cbae VFMADD132PD 0x360(%RSP),%YMM0,%YMM2 |
(315) 0x41cbb8 VFMADD213PD 0x320(%RSP),%YMM4,%YMM2 |
(315) 0x41cbc2 VFMADD213PD 0x300(%RSP),%YMM4,%YMM2 |
(315) 0x41cbcc VFMADD213PD %YMM9,%YMM7,%YMM2 |
(315) 0x41cbd1 VPADDQ %YMM3,%YMM1,%YMM7 |
(315) 0x41cbd5 VPEXTRQ $0x1,%XMM7,%R10 |
(315) 0x41cbdb VMOVQ %XMM7,%R14 |
(315) 0x41cbe0 VEXTRACTI128 $0x1,%YMM7,%XMM7 |
(315) 0x41cbe6 VPEXTRQ $0x1,%XMM7,%R15 |
(315) 0x41cbec VMOVQ %XMM7,%R12 |
(315) 0x41cbf1 VMOVSD (%R12),%XMM7 |
(315) 0x41cbf7 VPADDQ %YMM1,%YMM13,%YMM1 |
(315) 0x41cbfb VMOVQ %XMM1,%R12 |
(315) 0x41cc00 VPEXTRQ $0x1,%XMM1,%R13 |
(315) 0x41cc06 VMOVHPD (%R15),%XMM7,%XMM7 |
(315) 0x41cc0b VEXTRACTI128 $0x1,%YMM1,%XMM1 |
(315) 0x41cc11 VMOVQ %XMM1,%R15 |
(315) 0x41cc16 VPEXTRQ $0x1,%XMM1,%R8 |
(315) 0x41cc1c VMOVSD (%R14),%XMM1 |
(315) 0x41cc21 VMOVHPD (%R10),%XMM1,%XMM1 |
(315) 0x41cc26 VINSERTF128 $0x1,%XMM7,%YMM1,%YMM9 |
(315) 0x41cc2c VMOVAPD %YMM4,%YMM7 |
(315) 0x41cc30 VMOVUPD 0x5e0(%RSP),%YMM0 |
(315) 0x41cc39 VFMADD132PD 0x600(%RSP),%YMM0,%YMM7 |
(315) 0x41cc43 VFMADD213PD %YMM8,%YMM9,%YMM7 |
(315) 0x41cc48 VMOVAPD %YMM4,%YMM8 |
(315) 0x41cc4c VMOVUPD 0x480(%RSP),%YMM0 |
(315) 0x41cc55 VFMADD132PD 0x4a0(%RSP),%YMM0,%YMM8 |
(315) 0x41cc5f VFMADD213PD 0x460(%RSP),%YMM4,%YMM8 |
(315) 0x41cc69 VFMADD213PD %YMM5,%YMM9,%YMM8 |
(315) 0x41cc6e VMOVAPD %YMM4,%YMM1 |
(315) 0x41cc72 VMOVUPD 0x2c0(%RSP),%YMM0 |
(315) 0x41cc7b VFMADD132PD 0x2e0(%RSP),%YMM0,%YMM1 |
(315) 0x41cc85 VFMADD213PD 0x2a0(%RSP),%YMM4,%YMM1 |
(315) 0x41cc8f VFMADD213PD 0x280(%RSP),%YMM4,%YMM1 |
(315) 0x41cc99 VFMADD213PD %YMM2,%YMM9,%YMM1 |
(315) 0x41cc9e VMOVSD (%R15),%XMM2 |
(315) 0x41cca3 VMOVHPD (%R8),%XMM2,%XMM2 |
(315) 0x41cca8 VMOVSD (%R12),%XMM5 |
(315) 0x41ccae VMOVHPD (%R13),%XMM5,%XMM5 |
(315) 0x41ccb4 VINSERTF128 $0x1,%XMM2,%YMM5,%YMM5 |
(315) 0x41ccba VMOVAPD %YMM4,%YMM2 |
(315) 0x41ccbe VMOVUPD 0x420(%RSP),%YMM0 |
(315) 0x41ccc7 VFMADD132PD 0x440(%RSP),%YMM0,%YMM2 |
(315) 0x41ccd1 VFMADD213PD 0x400(%RSP),%YMM4,%YMM2 |
(315) 0x41ccdb VFMADD213PD %YMM8,%YMM5,%YMM2 |
(315) 0x41cce0 VMULPD %YMM2,%YMM15,%YMM2 |
(315) 0x41cce4 VDIVPD %YMM10,%YMM2,%YMM8 |
(315) 0x41cce9 VMOVAPD %YMM4,%YMM2 |
(315) 0x41cced VFMADD132PD 0x260(%RSP),%YMM12,%YMM2 |
(315) 0x41ccf7 VFMADD213PD %YMM14,%YMM4,%YMM2 |
(315) 0x41ccfc VFMADD213PD %YMM11,%YMM4,%YMM2 |
(315) 0x41cd01 VMOVUPD 0x5a0(%RSP),%YMM0 |
(315) 0x41cd0a VFMADD132PD 0x5c0(%RSP),%YMM0,%YMM4 |
(315) 0x41cd14 VFMADD213PD %YMM7,%YMM5,%YMM4 |
(315) 0x41cd19 MOVSXD (%RAX,%RBX,4),%R8 |
(315) 0x41cd1d MOVSXD 0x4(%RAX,%RBX,4),%R10 |
(315) 0x41cd22 MOVSXD 0x8(%RAX,%RBX,4),%R14 |
(315) 0x41cd27 MOVSXD 0xc(%RAX,%RBX,4),%R15 |
(315) 0x41cd2c VMULPD 0x580(%RSP),%YMM4,%YMM4 |
(315) 0x41cd35 ADD %R11,%R8 |
(315) 0x41cd38 VMOVLPD %XMM4,(%RCX,%R8,8) |
(315) 0x41cd3e ADD %R11,%R10 |
(315) 0x41cd41 VMOVHPD %XMM4,(%RCX,%R10,8) |
(315) 0x41cd47 VEXTRACTF128 $0x1,%YMM4,%XMM4 |
(315) 0x41cd4d ADD %R11,%R14 |
(315) 0x41cd50 ADD %R11,%R15 |
(315) 0x41cd53 VMOVLPD %XMM4,(%RCX,%R14,8) |
(315) 0x41cd59 VMOVHPD %XMM4,(%RCX,%R15,8) |
(315) 0x41cd5f VMOVLPD %XMM8,(%RDX,%R8,8) |
(315) 0x41cd65 VFMADD213PD %YMM1,%YMM5,%YMM2 |
(315) 0x41cd6a VMOVHPD %XMM8,(%RDX,%R10,8) |
(315) 0x41cd70 VEXTRACTF128 $0x1,%YMM8,%XMM1 |
(315) 0x41cd76 VMOVLPD %XMM1,(%RDX,%R14,8) |
(315) 0x41cd7c VMOVHPD %XMM1,(%RDX,%R15,8) |
(315) 0x41cd82 VMOVLPD %XMM2,(%R9,%R8,8) |
(315) 0x41cd88 MOV 0x20(%RBP),%R8 |
(315) 0x41cd8c VMOVHPD %XMM2,(%R9,%R10,8) |
(315) 0x41cd92 VEXTRACTF128 $0x1,%YMM2,%XMM1 |
(315) 0x41cd98 VMOVLPD %XMM1,(%R9,%R14,8) |
(315) 0x41cd9e VMOVHPD %XMM1,(%R9,%R15,8) |
(315) 0x41cda4 ADD $0x4,%RBX |
(315) 0x41cda8 CMP %RDI,%RBX |
(315) 0x41cdab JB 41ca50 |
0x41cdb1 MOV 0x38(%RSP),%R10 |
0x41cdb6 CMP %R10,%RDI |
0x41cdb9 VMOVUPD 0x100(%RSP),%XMM11 |
0x41cdc2 VMOVUPD (%RSP),%XMM1 |
0x41cdc7 VMOVUPD 0xe0(%RSP),%XMM3 |
0x41cdd0 VMOVUPD 0x20(%RSP),%XMM14 |
0x41cdd6 VMOVUPD 0x240(%RSP),%YMM12 |
0x41cddf VMOVUPD 0x10(%RSP),%XMM0 |
0x41cde5 VMOVUPD 0x220(%RSP),%YMM10 |
0x41cdee VMOVUPD 0x1a0(%RSP),%YMM15 |
0x41cdf7 JNE 41cf40 |
0x41cdfd JMP 41d197 |
0x41ce02 MOV 0x40(%RSP),%RCX |
0x41ce07 LEA (%RCX,%R11,8),%RCX |
0x41ce0b ADD $0x18,%RCX |
0x41ce0f MOV %R14D,%R15D |
0x41ce12 AND $-0x4,%R15D |
0x41ce16 MOV %EDX,%R12D |
0x41ce19 SUB %ESI,%R12D |
0x41ce1c XOR %R13D,%R13D |
0x41ce1f XOR %EBX,%EBX |
0x41ce21 JMP 41ce3d |
0x41ce23 NOPW %CS:(%RAX,%RAX,1) |
(317) 0x41ce30 ADD $0x4,%R13 |
(317) 0x41ce34 CMP %R13,%R15 |
(317) 0x41ce37 JE 41c5d5 |
(317) 0x41ce3d VMOVSD -0x18(%RCX,%R13,8),%XMM1 |
(317) 0x41ce44 VUCOMISD %XMM1,%XMM0 |
(317) 0x41ce48 JBE 41ce61 |
(317) 0x41ce4a MOV %R12D,%R10D |
(317) 0x41ce4d ADD %R13D,%R10D |
(317) 0x41ce50 JE 41ce61 |
(317) 0x41ce52 MOVSXD %EBX,%RBX |
(317) 0x41ce55 MOV %R13D,(%RAX,%RBX,4) |
(317) 0x41ce59 VMOVSD %XMM1,(%R8,%RBX,8) |
(317) 0x41ce5f INC %EBX |
(317) 0x41ce61 VMOVSD -0x10(%RCX,%R13,8),%XMM1 |
(317) 0x41ce68 VUCOMISD %XMM1,%XMM0 |
(317) 0x41ce6c JBE 41ce8b |
(317) 0x41ce6e LEA (%R12,%R13,1),%R10D |
(317) 0x41ce72 CMP $-0x1,%R10D |
(317) 0x41ce76 JE 41ce8b |
(317) 0x41ce78 MOVSXD %EBX,%RBX |
(317) 0x41ce7b LEA 0x1(%R13),%R10D |
(317) 0x41ce7f MOV %R10D,(%RAX,%RBX,4) |
(317) 0x41ce83 VMOVSD %XMM1,(%R8,%RBX,8) |
(317) 0x41ce89 INC %EBX |
(317) 0x41ce8b VMOVSD -0x8(%RCX,%R13,8),%XMM1 |
(317) 0x41ce92 VUCOMISD %XMM1,%XMM0 |
(317) 0x41ce96 JBE 41ceb5 |
(317) 0x41ce98 LEA (%R12,%R13,1),%R10D |
(317) 0x41ce9c CMP $-0x2,%R10D |
(317) 0x41cea0 JE 41ceb5 |
(317) 0x41cea2 MOVSXD %EBX,%RBX |
(317) 0x41cea5 LEA 0x2(%R13),%R10D |
(317) 0x41cea9 MOV %R10D,(%RAX,%RBX,4) |
(317) 0x41cead VMOVSD %XMM1,(%R8,%RBX,8) |
(317) 0x41ceb3 INC %EBX |
(317) 0x41ceb5 VMOVSD (%RCX,%R13,8),%XMM1 |
(317) 0x41cebb VUCOMISD %XMM1,%XMM0 |
(317) 0x41cebf JBE 41ce30 |
(317) 0x41cec5 LEA (%R12,%R13,1),%R10D |
(317) 0x41cec9 CMP $-0x3,%R10D |
(317) 0x41cecd JE 41ce30 |
(317) 0x41ced3 MOVSXD %EBX,%RBX |
(317) 0x41ced6 LEA 0x3(%R13),%R10D |
(317) 0x41ceda MOV %R10D,(%RAX,%RBX,4) |
(317) 0x41cede VMOVSD %XMM1,(%R8,%RBX,8) |
(317) 0x41cee4 INC %EBX |
(317) 0x41cee6 JMP 41ce30 |
0x41ceeb SUB %EDX,%ESI |
0x41ceed MOV 0x40(%RSP),%RDX |
0x41cef2 LEA (%RDX,%R11,8),%RDX |
0x41cef6 JMP 41cf0c |
0x41cef8 NOPL (%RAX,%RAX,1) |
(316) 0x41cf00 INC %RCX |
(316) 0x41cf03 CMP %RCX,%R14 |
(316) 0x41cf06 JE 41c5e4 |
(316) 0x41cf0c VMOVSD (%RDX,%RCX,8),%XMM1 |
(316) 0x41cf11 VUCOMISD %XMM1,%XMM0 |
(316) 0x41cf15 JBE 41cf00 |
(316) 0x41cf17 CMP %ECX,%ESI |
(316) 0x41cf19 JE 41cf00 |
(316) 0x41cf1b MOVSXD %EBX,%RBX |
(316) 0x41cf1e MOV %ECX,(%RAX,%RBX,4) |
(316) 0x41cf21 VMOVSD %XMM1,(%R8,%RBX,8) |
(316) 0x41cf27 INC %EBX |
(316) 0x41cf29 JMP 41cf00 |
0x41cf2b XOR %EDI,%EDI |
0x41cf2d VMOVUPD 0x10(%RSP),%XMM0 |
0x41cf33 VMOVUPD 0x20(%RSP),%XMM14 |
0x41cf39 VMOVUPD (%RSP),%XMM1 |
0x41cf3e XCHG %AX,%AX |
(314) 0x41cf40 VMOVSD (%R8,%RDI,8),%XMM2 |
(314) 0x41cf46 VMOVSD %XMM2,0x40(%RSP) |
(314) 0x41cf4c VMULSD %XMM3,%XMM2,%XMM2 |
(314) 0x41cf50 VCVTTSD2SI %XMM2,%R8D |
(314) 0x41cf54 VROUNDSD $0xb,%XMM2,%XMM2,%XMM3 |
(314) 0x41cf5a MOVSXD %R8D,%R8 |
(314) 0x41cf5d VMOVSD (%RSI,%R8,8),%XMM8 |
(314) 0x41cf63 VMOVSD 0x8(%RSI,%R8,8),%XMM6 |
(314) 0x41cf6a VMOVSD 0x10(%RSI,%R8,8),%XMM5 |
(314) 0x41cf71 VSUBSD %XMM3,%XMM2,%XMM2 |
(314) 0x41cf75 VMOVSD 0x18(%RSI,%R8,8),%XMM3 |
(314) 0x41cf7c VMULSD %XMM2,%XMM2,%XMM7 |
(314) 0x41cf80 VMULSD %XMM2,%XMM7,%XMM4 |
(314) 0x41cf84 VMOVAPD %XMM2,%XMM9 |
(314) 0x41cf88 VFMADD213SD %XMM1,%XMM11,%XMM9 |
(314) 0x41cf8d VMOVAPD %YMM10,%YMM13 |
(314) 0x41cf92 VMOVAPD %XMM2,%XMM10 |
(314) 0x41cf96 VMULSD %XMM8,%XMM9,%XMM9 |
(314) 0x41cf9b VMOVUPD 0x190(%RSP),%XMM1 |
(314) 0x41cfa4 VFMADD132SD 0xf0(%RSP),%XMM1,%XMM10 |
(314) 0x41cfae VMOVAPD %XMM2,%XMM11 |
(314) 0x41cfb2 VMOVUPD 0x170(%RSP),%XMM1 |
(314) 0x41cfbb VFMADD132SD 0x180(%RSP),%XMM1,%XMM11 |
(314) 0x41cfc5 VUNPCKLPD %XMM2,%XMM7,%XMM7 |
(314) 0x41cfc9 VFMADD213SD %XMM9,%XMM6,%XMM10 |
(314) 0x41cfce VMOVUPD 0x150(%RSP),%XMM1 |
(314) 0x41cfd7 VFMADD132SD 0x160(%RSP),%XMM1,%XMM2 |
(314) 0x41cfe1 VMULPD 0x6a0(%RSP),%XMM7,%XMM9 |
(314) 0x41cfea VMOVAPD %XMM14,%XMM1 |
(314) 0x41cfee VMOVAPD %XMM0,%XMM14 |
(314) 0x41cff2 VMOVAPD %YMM15,%YMM0 |
(314) 0x41cff6 VMOVAPD %YMM12,%YMM15 |
(314) 0x41cffb VSHUFPD $0x1,%XMM9,%XMM9,%XMM12 |
(314) 0x41d001 VFMADD213SD %XMM10,%XMM5,%XMM11 |
(314) 0x41d006 VADDSD %XMM9,%XMM12,%XMM9 |
(314) 0x41d00b VADDSD 0x140(%RSP),%XMM9,%XMM9 |
(314) 0x41d014 VMULPD 0x680(%RSP),%XMM7,%XMM10 |
(314) 0x41d01d VMULSD %XMM8,%XMM9,%XMM9 |
(314) 0x41d022 VSHUFPD $0x1,%XMM10,%XMM10,%XMM12 |
(314) 0x41d028 VADDSD %XMM10,%XMM12,%XMM10 |
(314) 0x41d02d VADDSD 0x130(%RSP),%XMM10,%XMM10 |
(314) 0x41d036 VFMADD213SD %XMM11,%XMM3,%XMM2 |
(314) 0x41d03b VMULPD 0x200(%RSP),%XMM7,%XMM11 |
(314) 0x41d044 VSHUFPD $0x1,%XMM11,%XMM11,%XMM12 |
(314) 0x41d04a VADDSD %XMM11,%XMM12,%XMM11 |
(314) 0x41d04f VFMADD213SD %XMM9,%XMM6,%XMM10 |
(314) 0x41d054 VMULPD 0x1c0(%RSP),%XMM7,%XMM9 |
(314) 0x41d05d VMOVAPD %XMM4,%XMM12 |
(314) 0x41d061 VFMADD132SD 0xb0(%RSP),%XMM9,%XMM12 |
(314) 0x41d06b VSHUFPD $0x1,%XMM9,%XMM9,%XMM9 |
(314) 0x41d071 VADDSD 0xa0(%RSP),%XMM9,%XMM9 |
(314) 0x41d07a VADDSD %XMM9,%XMM12,%XMM9 |
(314) 0x41d07f VMOVAPD %YMM15,%YMM12 |
(314) 0x41d084 VMOVAPD %YMM0,%YMM15 |
(314) 0x41d088 VMOVAPD %XMM14,%XMM0 |
(314) 0x41d08c VMOVAPD %XMM1,%XMM14 |
(314) 0x41d090 VADDSD 0xd0(%RSP),%XMM11,%XMM11 |
(314) 0x41d099 VMULSD %XMM8,%XMM9,%XMM8 |
(314) 0x41d09e VFMADD213SD %XMM10,%XMM5,%XMM11 |
(314) 0x41d0a3 VMULPD %XMM7,%XMM12,%XMM9 |
(314) 0x41d0a7 VMOVAPD %XMM4,%XMM10 |
(314) 0x41d0ab VFMADD213SD %XMM9,%XMM1,%XMM10 |
(314) 0x41d0b0 VSHUFPD $0x1,%XMM9,%XMM9,%XMM9 |
(314) 0x41d0b6 VADDSD %XMM0,%XMM9,%XMM9 |
(314) 0x41d0ba VADDSD %XMM9,%XMM10,%XMM9 |
(314) 0x41d0bf VMOVAPD %YMM13,%YMM10 |
(314) 0x41d0c4 VMOVUPD 0x80(%RSP),%XMM13 |
(314) 0x41d0cd VFMADD213SD %XMM8,%XMM6,%XMM9 |
(314) 0x41d0d2 VMULPD %XMM7,%XMM10,%XMM6 |
(314) 0x41d0d6 VMOVAPD %XMM4,%XMM8 |
(314) 0x41d0da VFMADD132SD 0x90(%RSP),%XMM6,%XMM8 |
(314) 0x41d0e4 VSHUFPD $0x1,%XMM6,%XMM6,%XMM6 |
(314) 0x41d0e9 VADDSD %XMM6,%XMM13,%XMM6 |
(314) 0x41d0ed VADDSD %XMM6,%XMM8,%XMM6 |
(314) 0x41d0f1 VFMADD213SD %XMM9,%XMM5,%XMM6 |
(314) 0x41d0f6 VMOVUPD 0x70(%RSP),%XMM9 |
(314) 0x41d0fc VMULPD 0x1e0(%RSP),%XMM7,%XMM5 |
(314) 0x41d105 VSHUFPD $0x1,%XMM5,%XMM5,%XMM8 |
(314) 0x41d10a VADDSD %XMM5,%XMM8,%XMM5 |
(314) 0x41d10e VMOVUPD 0x120(%RSP),%XMM8 |
(314) 0x41d117 VADDSD 0xc0(%RSP),%XMM5,%XMM5 |
(314) 0x41d120 VFMADD213SD %XMM11,%XMM3,%XMM5 |
(314) 0x41d125 VMULPD %XMM7,%XMM15,%XMM7 |
(314) 0x41d129 VFMADD213SD %XMM7,%XMM9,%XMM4 |
(314) 0x41d12e VSHUFPD $0x1,%XMM7,%XMM7,%XMM7 |
(314) 0x41d133 VADDSD %XMM7,%XMM8,%XMM7 |
(314) 0x41d137 VADDSD %XMM7,%XMM4,%XMM4 |
(314) 0x41d13b VFMADD213SD %XMM6,%XMM3,%XMM4 |
(314) 0x41d140 VMOVUPD 0x110(%RSP),%XMM6 |
(314) 0x41d149 VMOVUPD 0xe0(%RSP),%XMM3 |
(314) 0x41d152 MOVSXD (%RAX,%RDI,4),%R8 |
(314) 0x41d156 ADD %R11,%R8 |
(314) 0x41d159 VMULSD %XMM2,%XMM6,%XMM2 |
(314) 0x41d15d VMOVSD %XMM2,(%RCX,%R8,8) |
(314) 0x41d163 VMULSD %XMM3,%XMM5,%XMM2 |
(314) 0x41d167 VDIVSD 0x40(%RSP),%XMM2,%XMM1 |
(314) 0x41d16d VMOVSD %XMM1,(%RDX,%R8,8) |
(314) 0x41d173 VMOVUPD (%RSP),%XMM1 |
(314) 0x41d178 VMOVUPD 0x100(%RSP),%XMM11 |
(314) 0x41d181 VMOVSD %XMM4,(%R9,%R8,8) |
(314) 0x41d187 MOV 0x20(%RBP),%R8 |
(314) 0x41d18b INC %RDI |
(314) 0x41d18e CMP %RDI,%R10 |
(314) 0x41d191 JNE 41cf40 |
0x41d197 LEA -0x28(%RBP),%RSP |
0x41d19b POP %RBX |
0x41d19c POP %R12 |
0x41d19e POP %R13 |
0x41d1a0 POP %R14 |
0x41d1a2 POP %R15 |
0x41d1a4 POP %RBP |
0x41d1a5 VZEROUPPER |
0x41d1a8 RET |
0x41d1a9 NOPL (%RAX) |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►52.34+ | miniqmcreference::TwoBodyJastr[...] | TwoBodyJastrowRef.h:274 | exec |
○ | qmcplusplus::WaveFunction::rat[...] | WaveFunction.cpp:201 | exec |
○ | main.extracted.110 | refwrap.h:313 | exec |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so | |
►40.63+ | miniqmcreference::TwoBodyJastr[...] | TwoBodyJastrowRef.h:274 | exec |
○ | qmcplusplus::WaveFunction::acc[...] | NewTimer.h:249 | exec |
○ | main.extracted.110 | refwrap.h:313 | exec |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so | |
►5.10+ | miniqmcreference::TwoBodyJastr[...] | TwoBodyJastrowRef.h:274 | exec |
○ | miniqmcreference::TwoBodyJastr[...] | TwoBodyJastrowRef.h:411 | exec |
○ | qmcplusplus::WaveFunction::eva[...] | WaveFunction.cpp:175 | exec |
○ | main.extracted.113 | miniqmc.cpp:397 | exec |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so | |
►1.82+ | miniqmcreference::OneBodyJastr[...] | OneBodyJastrowRef.h:218 | exec |
○ | miniqmcreference::OneBodyJastr[...] | stl_vector.h:1056 | exec |
○ | qmcplusplus::WaveFunction::rat[...] | WaveFunction.cpp:201 | exec |
○ | main.extracted.110 | refwrap.h:313 | exec |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Path / |
Source file and lines | BsplineFunctor.h:276-339 |
Module | exec |
nb instructions | 221 |
nb uops | 222 |
loop length | 1410 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 16 |
used ymm registers | 12 |
used zmm registers | 0 |
nb stack references | 70 |
micro-operation queue | 37.00 cycles |
front end | 37.00 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 5.70 | 5.80 | 24.67 | 24.67 | 36.00 | 27.00 | 5.70 | 36.00 | 36.00 | 36.00 | 5.80 | 24.67 |
cycles | 5.70 | 5.80 | 24.67 | 24.67 | 36.00 | 27.00 | 5.70 | 36.00 | 36.00 | 36.00 | 5.80 | 24.67 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 37.05 |
Stall cycles | 0.00 |
Front-end | 37.00 |
Dispatch | 36.00 |
Overall L1 | 37.00 |
all | 11% |
load | 0% |
store | 50% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 5% |
all | 65% |
load | 41% |
store | 100% |
mul | 0% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 25% |
all | 56% |
load | 37% |
store | 96% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 18% |
all | 11% |
load | 12% |
store | 25% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 6% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 9% |
all | 30% |
load | 20% |
store | 41% |
mul | 12% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 21% |
all | 27% |
load | 20% |
store | 40% |
mul | 12% |
add-sub | 6% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 17% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
SUB %EDX,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
TEST %ECX,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 41d1a5 <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0xc15> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x6e0,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R8,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVSXD %EDX,%R11 | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
VMOVSD 0x8(%RDI),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %ECX,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP $0x4,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 41ce02 <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0x872> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R14D,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %R14,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 41ceeb <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0x95b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
TEST %EBX,%EBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 41d197 <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0xc07> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD 0x238(%RDI),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x218(%RDI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x128(%RDI),%XMM11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x130(%RDI),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM0,(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x148(%RDI),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM0,0xf0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x150(%RDI),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x168(%RDI),%XMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVQ 0x170(%RDI),%XMM13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x188(%RDI),%XMM14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x190(%RDI),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPD 0xa0(%RDI),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVSD 0xb0(%RDI),%XMM9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPD 0xc0(%RDI),%XMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVSD 0xd0(%RDI),%XMM8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS 0xe0(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPS %YMM1,0x200(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0xf0(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0xd0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPS 0x100(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPS %YMM1,0x1e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV %EBX,%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VMOVSD 0x110(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x18(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPS 0x20(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPS %YMM1,0x1c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x30(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x38(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD 0x40(%RDI),%XMM12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVSD 0x50(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x58(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD 0x60(%RDI),%XMM10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVSD 0x70(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x78(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD 0x80(%RDI),%XMM15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVSD 0x90(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $-0x4,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VMULSD %XMM3,%XMM3,%XMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
AND %R10,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
VMOVUPD %XMM3,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM11,0x100(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPS %XMM0,0x190(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM2,0x180(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVDQU %XMM13,0x170(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPS %XMM14,0x160(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM4,0x150(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM5,0x6a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM9,0x140(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM7,0x680(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM8,0x130(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM1,0x120(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM6,0x110(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
JE 41cf2b <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0x99b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R10,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVUPD %YMM15,0x1a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM3,%YMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM11,%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM3,0x620(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVAPD %YMM10,%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.17 |
VBROADCASTSD (%RSP),%YMM10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM10,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVAPD %XMM1,%XMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.17 |
VBROADCASTSD 0xf0(%RSP),%YMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM1,0x660(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM0,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM0,0x640(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM2,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x600(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPBROADCASTQ %XMM13,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x5e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM14,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM0,0x5c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM4,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x5a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM6,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x580(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM5,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x560(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPERMPD $0x55,%YMM5,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x540(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM9,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x520(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM7,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x500(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPERMPD $0x55,%YMM7,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x4e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM8,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x4c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVUPS 0x200(%RSP),%YMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VBROADCASTSD %XMM1,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM0,0x4a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPERMPD $0x55,%YMM1,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM0,0x480(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0xd0(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x460(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPS 0x1e0(%RSP),%YMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VBROADCASTSD %XMM1,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM0,0x440(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPERMPD $0x55,%YMM1,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM0,0x420(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0xc0(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x400(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0xb0(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x3e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD 0x1c0(%RSP),%YMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VBROADCASTSD %XMM1,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x3c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPERMPD $0x55,%YMM1,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x3a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0xa0(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x380(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0x20(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x360(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM12,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x340(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM12,0x240(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPERMPD $0x55,%YMM12,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x320(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0x10(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x300(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0x90(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x2e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM3,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x2c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM3,0x220(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPERMPD $0x55,%YMM3,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x2a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0x80(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x280(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0x70(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x260(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD 0x1a0(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VBROADCASTSD %XMM0,%YMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPERMPD $0x55,%YMM0,%YMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM10,%YMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ 0xdb3ba(%RIP),%YMM13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VPBROADCASTQ 0xdb3b9(%RIP),%YMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VPBROADCASTQ 0xdb3b8(%RIP),%YMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x38(%RSP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R10,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VMOVUPD 0x100(%RSP),%XMM11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD (%RSP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0xe0(%RSP),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x20(%RSP),%XMM14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x240(%RSP),%YMM12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x10(%RSP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x220(%RSP),%YMM10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x1a0(%RSP),%YMM15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
JNE 41cf40 <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0x9b0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 41d197 <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0xc07> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV 0x40(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RCX,%R11,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD $0x18,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R14D,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%R15D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %EDX,%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %ESI,%R12D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R13D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 41ce3d <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0x8ad> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SUB %EDX,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x40(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RDX,%R11,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 41cf0c <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0x97c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVUPD 0x10(%RSP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x20(%RSP),%XMM14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD (%RSP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | BsplineFunctor.h:276-339 |
Module | exec |
nb instructions | 221 |
nb uops | 222 |
loop length | 1410 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 16 |
used ymm registers | 12 |
used zmm registers | 0 |
nb stack references | 70 |
micro-operation queue | 37.00 cycles |
front end | 37.00 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 5.70 | 5.80 | 24.67 | 24.67 | 36.00 | 27.00 | 5.70 | 36.00 | 36.00 | 36.00 | 5.80 | 24.67 |
cycles | 5.70 | 5.80 | 24.67 | 24.67 | 36.00 | 27.00 | 5.70 | 36.00 | 36.00 | 36.00 | 5.80 | 24.67 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 37.05 |
Stall cycles | 0.00 |
Front-end | 37.00 |
Dispatch | 36.00 |
Overall L1 | 37.00 |
all | 11% |
load | 0% |
store | 50% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 5% |
all | 65% |
load | 41% |
store | 100% |
mul | 0% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 25% |
all | 56% |
load | 37% |
store | 96% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 18% |
all | 11% |
load | 12% |
store | 25% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 6% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 9% |
all | 30% |
load | 20% |
store | 41% |
mul | 12% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 21% |
all | 27% |
load | 20% |
store | 40% |
mul | 12% |
add-sub | 6% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 17% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
SUB %EDX,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
TEST %ECX,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 41d1a5 <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0xc15> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x6e0,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R8,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVSXD %EDX,%R11 | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
VMOVSD 0x8(%RDI),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %ECX,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP $0x4,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 41ce02 <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0x872> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R14D,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %R14,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 41ceeb <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0x95b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
TEST %EBX,%EBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 41d197 <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0xc07> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD 0x238(%RDI),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x218(%RDI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x128(%RDI),%XMM11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x130(%RDI),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM0,(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x148(%RDI),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM0,0xf0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x150(%RDI),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x168(%RDI),%XMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVQ 0x170(%RDI),%XMM13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x188(%RDI),%XMM14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x190(%RDI),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPD 0xa0(%RDI),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVSD 0xb0(%RDI),%XMM9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPD 0xc0(%RDI),%XMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVSD 0xd0(%RDI),%XMM8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS 0xe0(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPS %YMM1,0x200(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0xf0(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0xd0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPS 0x100(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPS %YMM1,0x1e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV %EBX,%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VMOVSD 0x110(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x18(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPS 0x20(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPS %YMM1,0x1c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x30(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x38(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD 0x40(%RDI),%XMM12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVSD 0x50(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x58(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD 0x60(%RDI),%XMM10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVSD 0x70(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x78(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD 0x80(%RDI),%XMM15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVSD 0x90(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $-0x4,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VMULSD %XMM3,%XMM3,%XMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
AND %R10,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
VMOVUPD %XMM3,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM11,0x100(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPS %XMM0,0x190(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM2,0x180(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVDQU %XMM13,0x170(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPS %XMM14,0x160(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM4,0x150(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM5,0x6a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM9,0x140(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM7,0x680(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM8,0x130(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM1,0x120(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM6,0x110(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
JE 41cf2b <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0x99b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R10,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVUPD %YMM15,0x1a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM3,%YMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM11,%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM3,0x620(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVAPD %YMM10,%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.17 |
VBROADCASTSD (%RSP),%YMM10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM10,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVAPD %XMM1,%XMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.17 |
VBROADCASTSD 0xf0(%RSP),%YMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM1,0x660(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM0,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM0,0x640(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM2,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x600(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPBROADCASTQ %XMM13,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x5e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM14,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM0,0x5c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM4,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x5a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM6,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x580(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM5,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x560(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPERMPD $0x55,%YMM5,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x540(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM9,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x520(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM7,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x500(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPERMPD $0x55,%YMM7,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x4e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM8,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x4c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVUPS 0x200(%RSP),%YMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VBROADCASTSD %XMM1,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM0,0x4a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPERMPD $0x55,%YMM1,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM0,0x480(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0xd0(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x460(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPS 0x1e0(%RSP),%YMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VBROADCASTSD %XMM1,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM0,0x440(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPERMPD $0x55,%YMM1,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM0,0x420(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0xc0(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x400(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0xb0(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x3e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD 0x1c0(%RSP),%YMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VBROADCASTSD %XMM1,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x3c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPERMPD $0x55,%YMM1,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x3a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0xa0(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x380(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0x20(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x360(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM12,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x340(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM12,0x240(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPERMPD $0x55,%YMM12,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x320(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0x10(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x300(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0x90(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x2e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM3,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x2c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM3,0x220(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPERMPD $0x55,%YMM3,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x2a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0x80(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x280(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0x70(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x260(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD 0x1a0(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VBROADCASTSD %XMM0,%YMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPERMPD $0x55,%YMM0,%YMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM10,%YMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ 0xdb3ba(%RIP),%YMM13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VPBROADCASTQ 0xdb3b9(%RIP),%YMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VPBROADCASTQ 0xdb3b8(%RIP),%YMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x38(%RSP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R10,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VMOVUPD 0x100(%RSP),%XMM11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD (%RSP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0xe0(%RSP),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x20(%RSP),%XMM14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x240(%RSP),%YMM12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x10(%RSP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x220(%RSP),%YMM10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x1a0(%RSP),%YMM15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
JNE 41cf40 <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0x9b0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 41d197 <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0xc07> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV 0x40(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RCX,%R11,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD $0x18,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R14D,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%R15D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %EDX,%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %ESI,%R12D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R13D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 41ce3d <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0x8ad> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SUB %EDX,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x40(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RDX,%R11,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 41cf0c <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0x97c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVUPD 0x10(%RSP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x20(%RSP),%XMM14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD (%RSP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼qmcplusplus::BsplineFunctor | 0.65 | 0.74 |
○Loop 317 - BsplineFunctor.h:291-298 - exec | 0.55 | 0.62 |
○Loop 315 - BsplineFunctor.h:303-338 - exec | 0.06 | 0.07 |
○Loop 314 - BsplineFunctor.h:303-338 - exec | 0.01 | 0.01 |
○Loop 316 - BsplineFunctor.h:291-298 - exec | 0 | 0 |