Function: _ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi | Module: exec | Source: BsplineFunctor.h:276-339 [...] | Coverage: 0.64% |
---|
Function: _ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi | Module: exec | Source: BsplineFunctor.h:276-339 [...] | Coverage: 0.64% |
---|
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/stl_vector.h: 1064 - 1064 |
-------------------------------------------------------------------------------- |
1064: return *(this->_M_impl._M_start + __n); |
/home/eoseret/qaas_runs_CPU_9468/171-145-9236/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/Jastrow/BsplineFunctor.h: 276 - 339 |
-------------------------------------------------------------------------------- |
276: real_type dSquareDeltaRinv = DeltaRInv * DeltaRInv; |
[...] |
284: int iLimit = iEnd - iStart; |
285: const real_type* distArray = _distArray + iStart; |
[...] |
291: for (int jat = 0; jat < iLimit; jat++) |
292: { |
293: real_type r = distArray[jat]; |
294: if (r < cutoff_radius && iStart + jat != iat) |
295: { |
296: distIndices[iCount] = jat; |
297: distArrayCompressed[iCount] = r; |
298: iCount++; |
299: } |
300: } |
301: |
302: #pragma omp simd |
303: for (int j = 0; j < iCount; j++) |
304: { |
305: real_type r = distArrayCompressed[j]; |
306: int iScatter = distIndices[j]; |
307: real_type rinv = cOne / r; |
308: r *= DeltaRInv; |
309: int iGather = (int)r; |
310: real_type t = r - real_type(iGather); |
311: real_type tp0 = t * t * t; |
312: real_type tp1 = t * t; |
313: real_type tp2 = t; |
314: |
315: real_type sCoef0 = SplineCoefs[iGather + 0]; |
316: real_type sCoef1 = SplineCoefs[iGather + 1]; |
317: real_type sCoef2 = SplineCoefs[iGather + 2]; |
318: real_type sCoef3 = SplineCoefs[iGather + 3]; |
319: |
320: // clang-format off |
321: laplArray[iScatter] = dSquareDeltaRinv * |
322: (sCoef0*( d2A[ 2]*tp2 + d2A[ 3])+ |
323: sCoef1*( d2A[ 6]*tp2 + d2A[ 7])+ |
324: sCoef2*( d2A[10]*tp2 + d2A[11])+ |
325: sCoef3*( d2A[14]*tp2 + d2A[15])); |
326: |
327: gradArray[iScatter] = DeltaRInv * rinv * |
328: (sCoef0*( dA[ 1]*tp1 + dA[ 2]*tp2 + dA[ 3])+ |
329: sCoef1*( dA[ 5]*tp1 + dA[ 6]*tp2 + dA[ 7])+ |
330: sCoef2*( dA[ 9]*tp1 + dA[10]*tp2 + dA[11])+ |
331: sCoef3*( dA[13]*tp1 + dA[14]*tp2 + dA[15])); |
332: |
333: valArray[iScatter] = (sCoef0*(A[ 0]*tp0 + A[ 1]*tp1 + A[ 2]*tp2 + A[ 3])+ |
334: sCoef1*(A[ 4]*tp0 + A[ 5]*tp1 + A[ 6]*tp2 + A[ 7])+ |
335: sCoef2*(A[ 8]*tp0 + A[ 9]*tp1 + A[10]*tp2 + A[11])+ |
336: sCoef3*(A[12]*tp0 + A[13]*tp1 + A[14]*tp2 + A[15])); |
337: // clang-format on |
338: } |
339: } |
0x41cee0 SUB %EDX,%ECX |
0x41cee2 TEST %ECX,%ECX |
0x41cee4 JLE 41daeb |
0x41ceea PUSH %RBP |
0x41ceeb MOV %RSP,%RBP |
0x41ceee PUSH %R15 |
0x41cef0 PUSH %R14 |
0x41cef2 PUSH %R13 |
0x41cef4 PUSH %R12 |
0x41cef6 PUSH %RBX |
0x41cef7 AND $-0x20,%RSP |
0x41cefb SUB $0x6e0,%RSP |
0x41cf02 MOV %R8,0x40(%RSP) |
0x41cf07 MOV 0x28(%RBP),%RAX |
0x41cf0b MOV 0x20(%RBP),%R8 |
0x41cf0f MOVSXD %EDX,%R11 |
0x41cf12 VMOVSD 0x8(%RDI),%XMM0 |
0x41cf17 MOV %ECX,%R14D |
0x41cf1a XOR %EBX,%EBX |
0x41cf1c CMP $0x4,%ECX |
0x41cf1f JAE 41d777 |
0x41cf25 MOV %R14D,%ECX |
0x41cf28 AND $-0x4,%ECX |
0x41cf2b CMP %R14,%RCX |
0x41cf2e JAE 41cf67 |
0x41cf30 SUB %EDX,%ESI |
0x41cf32 MOV 0x40(%RSP),%RDX |
0x41cf37 LEA (%RDX,%R11,8),%RDX |
0x41cf3b JMP 41cf48 |
0x41cf3d NOPL (%RAX) |
(318) 0x41cf40 INC %RCX |
(318) 0x41cf43 CMP %RCX,%R14 |
(318) 0x41cf46 JE 41cf67 |
(318) 0x41cf48 VMOVSD (%RDX,%RCX,8),%XMM1 |
(318) 0x41cf4d VUCOMISD %XMM1,%XMM0 |
(318) 0x41cf51 JBE 41cf40 |
(318) 0x41cf53 CMP %ECX,%ESI |
(318) 0x41cf55 JE 41cf40 |
(318) 0x41cf57 MOVSXD %EBX,%RBX |
(318) 0x41cf5a MOV %ECX,(%RAX,%RBX,4) |
(318) 0x41cf5d VMOVSD %XMM1,(%R8,%RBX,8) |
(318) 0x41cf63 INC %EBX |
(318) 0x41cf65 JMP 41cf40 |
0x41cf67 TEST %EBX,%EBX |
0x41cf69 JLE 41dadd |
0x41cf6f VMOVSD 0x238(%RDI),%XMM3 |
0x41cf77 MOV 0x18(%RBP),%RCX |
0x41cf7b MOV 0x10(%RBP),%RDX |
0x41cf7f MOV 0x218(%RDI),%RSI |
0x41cf86 VMOVSD 0x128(%RDI),%XMM0 |
0x41cf8e VMOVUPS %XMM0,(%RSP) |
0x41cf93 VMOVSD 0x130(%RDI),%XMM0 |
0x41cf9b VMOVUPS %XMM0,0x100(%RSP) |
0x41cfa4 VMOVSD 0x148(%RDI),%XMM0 |
0x41cfac VMOVUPS %XMM0,0xf0(%RSP) |
0x41cfb5 VMOVSD 0x150(%RDI),%XMM0 |
0x41cfbd VMOVSD 0x168(%RDI),%XMM2 |
0x41cfc5 VMOVSD 0x170(%RDI),%XMM13 |
0x41cfcd VMOVSD 0x188(%RDI),%XMM14 |
0x41cfd5 VMOVSD 0x190(%RDI),%XMM4 |
0x41cfdd VMOVUPD 0xa0(%RDI),%XMM5 |
0x41cfe5 VMOVSD 0xb0(%RDI),%XMM12 |
0x41cfed VMOVUPD 0xc0(%RDI),%XMM7 |
0x41cff5 VMOVSD 0xd0(%RDI),%XMM8 |
0x41cffd VMOVUPS 0xe0(%RDI),%XMM1 |
0x41d005 VMOVUPS %YMM1,0x1e0(%RSP) |
0x41d00e VMOVSD 0xf0(%RDI),%XMM1 |
0x41d016 VMOVUPS %XMM1,0xd0(%RSP) |
0x41d01f VMOVUPD 0x100(%RDI),%XMM11 |
0x41d027 MOV %EBX,%EBX |
0x41d029 VMOVSD 0x110(%RDI),%XMM1 |
0x41d031 VMOVUPS %XMM1,0xc0(%RSP) |
0x41d03a VMOVSD 0x18(%RDI),%XMM1 |
0x41d03f VMOVUPS %XMM1,0xb0(%RSP) |
0x41d048 VMOVUPS 0x20(%RDI),%XMM1 |
0x41d04d VMOVUPS %YMM1,0x1c0(%RSP) |
0x41d056 VMOVSD 0x30(%RDI),%XMM1 |
0x41d05b VMOVUPS %XMM1,0xa0(%RSP) |
0x41d064 VMOVSD 0x38(%RDI),%XMM1 |
0x41d069 VMOVUPS %XMM1,0x20(%RSP) |
0x41d06f VMOVUPD 0x40(%RDI),%XMM9 |
0x41d074 VMOVSD 0x50(%RDI),%XMM15 |
0x41d079 VMOVSD 0x58(%RDI),%XMM1 |
0x41d07e VMOVUPS %XMM1,0x10(%RSP) |
0x41d084 VMOVUPD 0x60(%RDI),%XMM10 |
0x41d089 VMOVSD 0x70(%RDI),%XMM1 |
0x41d08e VMOVUPS %XMM1,0x90(%RSP) |
0x41d097 VMOVSD 0x78(%RDI),%XMM1 |
0x41d09c VMOVUPS %XMM1,0x80(%RSP) |
0x41d0a5 VMOVUPS 0x80(%RDI),%XMM1 |
0x41d0ad VMOVUPS %YMM1,0x1a0(%RSP) |
0x41d0b6 VMOVSD 0x90(%RDI),%XMM1 |
0x41d0be MOV $-0x4,%EDI |
0x41d0c3 VMULSD %XMM3,%XMM3,%XMM6 |
0x41d0c7 AND %RBX,%RDI |
0x41d0ca VMOVUPD %XMM3,0xe0(%RSP) |
0x41d0d3 VMOVUPS %XMM0,0x190(%RSP) |
0x41d0dc VMOVUPD %XMM2,0x180(%RSP) |
0x41d0e5 VMOVUPS %XMM13,0x170(%RSP) |
0x41d0ee VMOVUPD %XMM14,0x160(%RSP) |
0x41d0f7 VMOVUPD %XMM4,0x150(%RSP) |
0x41d100 VMOVUPD %YMM5,0x6a0(%RSP) |
0x41d109 VMOVUPS %XMM12,0x140(%RSP) |
0x41d112 VMOVUPD %YMM7,0x680(%RSP) |
0x41d11b VMOVUPD %XMM8,0x130(%RSP) |
0x41d124 VMOVUPD %YMM11,0x660(%RSP) |
0x41d12d VMOVUPD %XMM1,0x120(%RSP) |
0x41d136 VMOVUPD %XMM6,0x110(%RSP) |
0x41d13f JE 41d85b |
0x41d145 MOV %RBX,0x38(%RSP) |
0x41d14a VMOVUPD %XMM15,0x70(%RSP) |
0x41d150 VBROADCASTSD %XMM3,%YMM15 |
0x41d155 VBROADCASTSD (%RSP),%YMM3 |
0x41d15b VMOVUPS %YMM3,0x600(%RSP) |
0x41d164 VMOVAPD %YMM10,%YMM3 |
0x41d168 VBROADCASTSD 0x100(%RSP),%YMM10 |
0x41d172 VMOVUPS %YMM10,0x40(%RSP) |
0x41d178 VMOVAPD %XMM1,%XMM10 |
0x41d17c VBROADCASTSD 0xf0(%RSP),%YMM1 |
0x41d186 VMOVUPS %YMM1,0x640(%RSP) |
0x41d18f VBROADCASTSD %XMM0,%YMM0 |
0x41d194 VMOVUPS %YMM0,0x620(%RSP) |
0x41d19d VBROADCASTSD %XMM2,%YMM0 |
0x41d1a2 VMOVUPD %YMM0,0x5e0(%RSP) |
0x41d1ab VBROADCASTSD %XMM13,%YMM0 |
0x41d1b0 VMOVUPS %YMM0,0x5c0(%RSP) |
0x41d1b9 VBROADCASTSD %XMM14,%YMM0 |
0x41d1be VMOVUPD %YMM0,0x5a0(%RSP) |
0x41d1c7 VBROADCASTSD %XMM4,%YMM0 |
0x41d1cc VMOVUPD %YMM0,0x580(%RSP) |
0x41d1d5 VBROADCASTSD %XMM6,%YMM0 |
0x41d1da VMOVUPD %YMM0,0x560(%RSP) |
0x41d1e3 VBROADCASTSD %XMM5,%YMM0 |
0x41d1e8 VMOVUPD %YMM0,0x540(%RSP) |
0x41d1f1 VPERMPD $0x55,%YMM5,%YMM0 |
0x41d1f7 VMOVUPD %YMM0,0x520(%RSP) |
0x41d200 VBROADCASTSD %XMM12,%YMM0 |
0x41d205 VMOVUPS %YMM0,0x500(%RSP) |
0x41d20e VBROADCASTSD %XMM7,%YMM0 |
0x41d213 VMOVUPD %YMM0,0x4e0(%RSP) |
0x41d21c VPERMPD $0x55,%YMM7,%YMM0 |
0x41d222 VMOVUPD %YMM0,0x4c0(%RSP) |
0x41d22b VBROADCASTSD %XMM8,%YMM0 |
0x41d230 VMOVUPD %YMM0,0x4a0(%RSP) |
0x41d239 XOR %EBX,%EBX |
0x41d23b VMOVUPS 0x1e0(%RSP),%YMM1 |
0x41d244 VBROADCASTSD %XMM1,%YMM0 |
0x41d249 VMOVUPS %YMM0,0x480(%RSP) |
0x41d252 VPERMPD $0x55,%YMM1,%YMM0 |
0x41d258 VMOVUPS %YMM0,0x460(%RSP) |
0x41d261 VBROADCASTSD 0xd0(%RSP),%YMM0 |
0x41d26b VMOVUPS %YMM0,0x440(%RSP) |
0x41d274 VBROADCASTSD %XMM11,%YMM0 |
0x41d279 VMOVUPD %YMM0,0x420(%RSP) |
0x41d282 VPERMPD $0x55,%YMM11,%YMM0 |
0x41d288 VMOVUPD %YMM0,0x400(%RSP) |
0x41d291 VBROADCASTSD 0xc0(%RSP),%YMM0 |
0x41d29b VMOVUPS %YMM0,0x3e0(%RSP) |
0x41d2a4 VBROADCASTSD 0xb0(%RSP),%YMM0 |
0x41d2ae VMOVUPS %YMM0,0x3c0(%RSP) |
0x41d2b7 VMOVUPD 0x1c0(%RSP),%YMM1 |
0x41d2c0 VBROADCASTSD %XMM1,%YMM0 |
0x41d2c5 VMOVUPD %YMM0,0x3a0(%RSP) |
0x41d2ce VPERMPD $0x55,%YMM1,%YMM0 |
0x41d2d4 VMOVUPD %YMM0,0x380(%RSP) |
0x41d2dd VBROADCASTSD 0xa0(%RSP),%YMM0 |
0x41d2e7 VMOVUPS %YMM0,0x360(%RSP) |
0x41d2f0 VBROADCASTSD 0x20(%RSP),%YMM0 |
0x41d2f7 VMOVUPS %YMM0,0x340(%RSP) |
0x41d300 VBROADCASTSD %XMM9,%YMM0 |
0x41d305 VMOVUPD %YMM0,0x320(%RSP) |
0x41d30e VMOVUPD %YMM9,0x220(%RSP) |
0x41d317 VPERMPD $0x55,%YMM9,%YMM0 |
0x41d31d VMOVUPD %YMM0,0x300(%RSP) |
0x41d326 VBROADCASTSD 0x70(%RSP),%YMM0 |
0x41d32d VMOVUPS %YMM0,0x2e0(%RSP) |
0x41d336 VBROADCASTSD 0x10(%RSP),%YMM0 |
0x41d33d VMOVUPS %YMM0,0x2c0(%RSP) |
0x41d346 VBROADCASTSD %XMM3,%YMM0 |
0x41d34b VMOVUPD %YMM0,0x2a0(%RSP) |
0x41d354 VMOVUPD %YMM3,0x200(%RSP) |
0x41d35d VPERMPD $0x55,%YMM3,%YMM0 |
0x41d363 VMOVUPD %YMM0,0x280(%RSP) |
0x41d36c VBROADCASTSD 0x90(%RSP),%YMM0 |
0x41d376 VMOVUPS %YMM0,0x260(%RSP) |
0x41d37f VBROADCASTSD 0x80(%RSP),%YMM0 |
0x41d389 VMOVUPS %YMM0,0x240(%RSP) |
0x41d392 VMOVUPD 0x1a0(%RSP),%YMM0 |
0x41d39b VBROADCASTSD %XMM0,%YMM12 |
0x41d3a0 VPERMPD $0x55,%YMM0,%YMM14 |
0x41d3a6 VBROADCASTSD %XMM10,%YMM11 |
0x41d3ab VPBROADCASTQ 0xd8f0c(%RIP),%YMM13 |
0x41d3b4 VPBROADCASTQ 0xd8f0b(%RIP),%YMM3 |
0x41d3bd VPBROADCASTQ 0xd8f0a(%RIP),%YMM6 |
0x41d3c6 NOPW %CS:(%RAX,%RAX,1) |
(317) 0x41d3d0 VMOVUPD (%R8,%RBX,8),%YMM10 |
(317) 0x41d3d6 VMULPD %YMM10,%YMM15,%YMM2 |
(317) 0x41d3db VCVTTPD2DQ %YMM2,%XMM1 |
(317) 0x41d3df VPMOVSXDQ %XMM1,%YMM1 |
(317) 0x41d3e4 VPSLLQ $0x3,%YMM1,%YMM1 |
(317) 0x41d3e9 VMOVQ %RSI,%XMM4 |
(317) 0x41d3ee VPBROADCASTQ %XMM4,%YMM4 |
(317) 0x41d3f3 VROUNDPD $0xb,%YMM2,%YMM5 |
(317) 0x41d3f9 VPADDQ %YMM1,%YMM4,%YMM1 |
(317) 0x41d3fd VMOVQ %XMM1,%R14 |
(317) 0x41d402 VEXTRACTI128 $0x1,%YMM1,%XMM8 |
(317) 0x41d408 VSUBPD %YMM5,%YMM2,%YMM4 |
(317) 0x41d40c VMOVQ %XMM8,%R15 |
(317) 0x41d411 VMOVSD (%R15),%XMM2 |
(317) 0x41d416 VPEXTRQ $0x1,%XMM1,%R15 |
(317) 0x41d41c VMOVSD (%R14),%XMM5 |
(317) 0x41d421 VPADDQ %YMM6,%YMM1,%YMM7 |
(317) 0x41d425 VPEXTRQ $0x1,%XMM8,%R14 |
(317) 0x41d42b VMOVQ %XMM7,%R12 |
(317) 0x41d430 VEXTRACTI128 $0x1,%YMM7,%XMM8 |
(317) 0x41d436 VPEXTRQ $0x1,%XMM7,%R13 |
(317) 0x41d43c VPEXTRQ $0x1,%XMM8,%R10 |
(317) 0x41d442 VMOVHPD (%R15),%XMM5,%XMM7 |
(317) 0x41d447 VMOVQ %XMM8,%R15 |
(317) 0x41d44c VMOVSD (%R15),%XMM5 |
(317) 0x41d451 VMOVHPD (%R14),%XMM2,%XMM2 |
(317) 0x41d456 VMOVHPD (%R10),%XMM5,%XMM5 |
(317) 0x41d45b VMOVSD (%R12),%XMM8 |
(317) 0x41d461 VINSERTF128 $0x1,%XMM2,%YMM7,%YMM2 |
(317) 0x41d467 VMOVHPD (%R13),%XMM8,%XMM7 |
(317) 0x41d46d VMOVAPD %YMM4,%YMM8 |
(317) 0x41d471 VMOVAPD %YMM4,%YMM9 |
(317) 0x41d475 VMOVUPD 0x520(%RSP),%YMM0 |
(317) 0x41d47e VFMADD132PD 0x540(%RSP),%YMM0,%YMM9 |
(317) 0x41d488 VINSERTF128 $0x1,%XMM5,%YMM7,%YMM7 |
(317) 0x41d48e VFMADD213PD 0x500(%RSP),%YMM4,%YMM9 |
(317) 0x41d498 VMOVAPD %YMM4,%YMM5 |
(317) 0x41d49c VMOVUPD 0x600(%RSP),%YMM0 |
(317) 0x41d4a5 VFMADD213PD 0x40(%RSP),%YMM0,%YMM5 |
(317) 0x41d4ac VMOVUPD 0x620(%RSP),%YMM0 |
(317) 0x41d4b5 VFMADD132PD 0x640(%RSP),%YMM0,%YMM8 |
(317) 0x41d4bf VMULPD %YMM2,%YMM5,%YMM5 |
(317) 0x41d4c3 VFMADD213PD %YMM5,%YMM7,%YMM8 |
(317) 0x41d4c8 VMOVAPD %YMM4,%YMM5 |
(317) 0x41d4cc VMOVUPD 0x4c0(%RSP),%YMM0 |
(317) 0x41d4d5 VFMADD132PD 0x4e0(%RSP),%YMM0,%YMM5 |
(317) 0x41d4df VFMADD213PD 0x4a0(%RSP),%YMM4,%YMM5 |
(317) 0x41d4e9 VMULPD %YMM2,%YMM9,%YMM9 |
(317) 0x41d4ed VFMADD213PD %YMM9,%YMM7,%YMM5 |
(317) 0x41d4f2 VMOVAPD %YMM4,%YMM9 |
(317) 0x41d4f6 VMOVUPD 0x3a0(%RSP),%YMM0 |
(317) 0x41d4ff VFMADD132PD 0x3c0(%RSP),%YMM0,%YMM9 |
(317) 0x41d509 VFMADD213PD 0x380(%RSP),%YMM4,%YMM9 |
(317) 0x41d513 VFMADD213PD 0x360(%RSP),%YMM4,%YMM9 |
(317) 0x41d51d VMULPD %YMM2,%YMM9,%YMM2 |
(317) 0x41d521 VMOVAPD %YMM4,%YMM9 |
(317) 0x41d525 VMOVUPD 0x320(%RSP),%YMM0 |
(317) 0x41d52e VFMADD132PD 0x340(%RSP),%YMM0,%YMM9 |
(317) 0x41d538 VFMADD213PD 0x300(%RSP),%YMM4,%YMM9 |
(317) 0x41d542 VFMADD213PD 0x2e0(%RSP),%YMM4,%YMM9 |
(317) 0x41d54c VFMADD213PD %YMM2,%YMM7,%YMM9 |
(317) 0x41d551 VPADDQ %YMM3,%YMM1,%YMM2 |
(317) 0x41d555 VPEXTRQ $0x1,%XMM2,%R10 |
(317) 0x41d55b VMOVQ %XMM2,%R14 |
(317) 0x41d560 VEXTRACTI128 $0x1,%YMM2,%XMM2 |
(317) 0x41d566 VPEXTRQ $0x1,%XMM2,%R15 |
(317) 0x41d56c VMOVQ %XMM2,%R12 |
(317) 0x41d571 VMOVSD (%R12),%XMM2 |
(317) 0x41d577 VPADDQ %YMM1,%YMM13,%YMM1 |
(317) 0x41d57b VMOVQ %XMM1,%R12 |
(317) 0x41d580 VPEXTRQ $0x1,%XMM1,%R13 |
(317) 0x41d586 VMOVHPD (%R15),%XMM2,%XMM2 |
(317) 0x41d58b VEXTRACTI128 $0x1,%YMM1,%XMM1 |
(317) 0x41d591 VMOVQ %XMM1,%R15 |
(317) 0x41d596 VPEXTRQ $0x1,%XMM1,%R8 |
(317) 0x41d59c VMOVSD (%R14),%XMM1 |
(317) 0x41d5a1 VMOVHPD (%R10),%XMM1,%XMM1 |
(317) 0x41d5a6 VINSERTF128 $0x1,%XMM2,%YMM1,%YMM1 |
(317) 0x41d5ac VMOVAPD %YMM4,%YMM2 |
(317) 0x41d5b0 VMOVUPD 0x5c0(%RSP),%YMM0 |
(317) 0x41d5b9 VFMADD132PD 0x5e0(%RSP),%YMM0,%YMM2 |
(317) 0x41d5c3 VFMADD213PD %YMM8,%YMM1,%YMM2 |
(317) 0x41d5c8 VMOVAPD %YMM4,%YMM7 |
(317) 0x41d5cc VMOVUPD 0x460(%RSP),%YMM0 |
(317) 0x41d5d5 VFMADD132PD 0x480(%RSP),%YMM0,%YMM7 |
(317) 0x41d5df VFMADD213PD 0x440(%RSP),%YMM4,%YMM7 |
(317) 0x41d5e9 VFMADD213PD %YMM5,%YMM1,%YMM7 |
(317) 0x41d5ee VMOVAPD %YMM4,%YMM5 |
(317) 0x41d5f2 VMOVUPD 0x2a0(%RSP),%YMM0 |
(317) 0x41d5fb VFMADD132PD 0x2c0(%RSP),%YMM0,%YMM5 |
(317) 0x41d605 VFMADD213PD 0x280(%RSP),%YMM4,%YMM5 |
(317) 0x41d60f VFMADD213PD 0x260(%RSP),%YMM4,%YMM5 |
(317) 0x41d619 VFMADD213PD %YMM9,%YMM1,%YMM5 |
(317) 0x41d61e VMOVSD (%R15),%XMM1 |
(317) 0x41d623 VMOVHPD (%R8),%XMM1,%XMM1 |
(317) 0x41d628 VMOVSD (%R12),%XMM8 |
(317) 0x41d62e VMOVHPD (%R13),%XMM8,%XMM8 |
(317) 0x41d634 VINSERTF128 $0x1,%XMM1,%YMM8,%YMM1 |
(317) 0x41d63a VMOVAPD %YMM4,%YMM8 |
(317) 0x41d63e VMOVUPD 0x400(%RSP),%YMM0 |
(317) 0x41d647 VFMADD132PD 0x420(%RSP),%YMM0,%YMM8 |
(317) 0x41d651 VFMADD213PD 0x3e0(%RSP),%YMM4,%YMM8 |
(317) 0x41d65b VFMADD213PD %YMM7,%YMM1,%YMM8 |
(317) 0x41d660 VMULPD %YMM15,%YMM8,%YMM7 |
(317) 0x41d665 VDIVPD %YMM10,%YMM7,%YMM7 |
(317) 0x41d66a VMOVAPD %YMM4,%YMM8 |
(317) 0x41d66e VFMADD132PD 0x240(%RSP),%YMM12,%YMM8 |
(317) 0x41d678 VFMADD213PD %YMM14,%YMM4,%YMM8 |
(317) 0x41d67d VFMADD213PD %YMM11,%YMM4,%YMM8 |
(317) 0x41d682 VMOVUPD 0x580(%RSP),%YMM0 |
(317) 0x41d68b VFMADD132PD 0x5a0(%RSP),%YMM0,%YMM4 |
(317) 0x41d695 VFMADD213PD %YMM2,%YMM1,%YMM4 |
(317) 0x41d69a MOVSXD (%RAX,%RBX,4),%R8 |
(317) 0x41d69e MOVSXD 0x4(%RAX,%RBX,4),%R10 |
(317) 0x41d6a3 MOVSXD 0x8(%RAX,%RBX,4),%R14 |
(317) 0x41d6a8 MOVSXD 0xc(%RAX,%RBX,4),%R15 |
(317) 0x41d6ad VMULPD 0x560(%RSP),%YMM4,%YMM2 |
(317) 0x41d6b6 ADD %R11,%R8 |
(317) 0x41d6b9 VMOVLPD %XMM2,(%RCX,%R8,8) |
(317) 0x41d6bf ADD %R11,%R10 |
(317) 0x41d6c2 VMOVHPD %XMM2,(%RCX,%R10,8) |
(317) 0x41d6c8 VEXTRACTF128 $0x1,%YMM2,%XMM2 |
(317) 0x41d6ce ADD %R11,%R14 |
(317) 0x41d6d1 ADD %R11,%R15 |
(317) 0x41d6d4 VMOVLPD %XMM2,(%RCX,%R14,8) |
(317) 0x41d6da VMOVHPD %XMM2,(%RCX,%R15,8) |
(317) 0x41d6e0 VMOVLPD %XMM7,(%RDX,%R8,8) |
(317) 0x41d6e6 VFMADD213PD %YMM5,%YMM1,%YMM8 |
(317) 0x41d6eb VMOVHPD %XMM7,(%RDX,%R10,8) |
(317) 0x41d6f1 VEXTRACTF128 $0x1,%YMM7,%XMM1 |
(317) 0x41d6f7 VMOVLPD %XMM1,(%RDX,%R14,8) |
(317) 0x41d6fd VMOVHPD %XMM1,(%RDX,%R15,8) |
(317) 0x41d703 VMOVLPD %XMM8,(%R9,%R8,8) |
(317) 0x41d709 MOV 0x20(%RBP),%R8 |
(317) 0x41d70d VMOVHPD %XMM8,(%R9,%R10,8) |
(317) 0x41d713 VEXTRACTF128 $0x1,%YMM8,%XMM1 |
(317) 0x41d719 VMOVLPD %XMM1,(%R9,%R14,8) |
(317) 0x41d71f VMOVHPD %XMM1,(%R9,%R15,8) |
(317) 0x41d725 ADD $0x4,%RBX |
(317) 0x41d729 CMP %RDI,%RBX |
(317) 0x41d72c JB 41d3d0 |
0x41d732 MOV 0x38(%RSP),%RBX |
0x41d737 CMP %RBX,%RDI |
0x41d73a VMOVUPD (%RSP),%XMM1 |
0x41d73f VMOVUPD 0xe0(%RSP),%XMM3 |
0x41d748 VMOVUPD 0x20(%RSP),%XMM12 |
0x41d74e VMOVUPD 0x220(%RSP),%YMM13 |
0x41d757 VMOVUPD 0x70(%RSP),%XMM15 |
0x41d75d VMOVUPD 0x10(%RSP),%XMM0 |
0x41d763 VMOVUPD 0x200(%RSP),%YMM10 |
0x41d76c JNE 41d880 |
0x41d772 JMP 41dadd |
0x41d777 MOV %R14D,%ECX |
0x41d77a AND $-0x4,%ECX |
0x41d77d MOV 0x40(%RSP),%R10 |
0x41d782 LEA (%R10,%R11,8),%R15 |
0x41d786 ADD $0x18,%R15 |
0x41d78a MOV %EDX,%R12D |
0x41d78d SUB %ESI,%R12D |
0x41d790 XOR %R13D,%R13D |
0x41d793 XOR %EBX,%EBX |
0x41d795 JMP 41d7ad |
0x41d797 NOPW (%RAX,%RAX,1) |
(319) 0x41d7a0 ADD $0x4,%R13 |
(319) 0x41d7a4 CMP %R13,%RCX |
(319) 0x41d7a7 JE 41cf25 |
(319) 0x41d7ad VMOVSD -0x18(%R15,%R13,8),%XMM1 |
(319) 0x41d7b4 VUCOMISD %XMM1,%XMM0 |
(319) 0x41d7b8 JBE 41d7d1 |
(319) 0x41d7ba MOV %R12D,%R10D |
(319) 0x41d7bd ADD %R13D,%R10D |
(319) 0x41d7c0 JE 41d7d1 |
(319) 0x41d7c2 MOVSXD %EBX,%RBX |
(319) 0x41d7c5 MOV %R13D,(%RAX,%RBX,4) |
(319) 0x41d7c9 VMOVSD %XMM1,(%R8,%RBX,8) |
(319) 0x41d7cf INC %EBX |
(319) 0x41d7d1 VMOVSD -0x10(%R15,%R13,8),%XMM1 |
(319) 0x41d7d8 VUCOMISD %XMM1,%XMM0 |
(319) 0x41d7dc JBE 41d7fb |
(319) 0x41d7de LEA (%R12,%R13,1),%R10D |
(319) 0x41d7e2 CMP $-0x1,%R10D |
(319) 0x41d7e6 JE 41d7fb |
(319) 0x41d7e8 MOVSXD %EBX,%RBX |
(319) 0x41d7eb LEA 0x1(%R13),%R10D |
(319) 0x41d7ef MOV %R10D,(%RAX,%RBX,4) |
(319) 0x41d7f3 VMOVSD %XMM1,(%R8,%RBX,8) |
(319) 0x41d7f9 INC %EBX |
(319) 0x41d7fb VMOVSD -0x8(%R15,%R13,8),%XMM1 |
(319) 0x41d802 VUCOMISD %XMM1,%XMM0 |
(319) 0x41d806 JBE 41d825 |
(319) 0x41d808 LEA (%R12,%R13,1),%R10D |
(319) 0x41d80c CMP $-0x2,%R10D |
(319) 0x41d810 JE 41d825 |
(319) 0x41d812 MOVSXD %EBX,%RBX |
(319) 0x41d815 LEA 0x2(%R13),%R10D |
(319) 0x41d819 MOV %R10D,(%RAX,%RBX,4) |
(319) 0x41d81d VMOVSD %XMM1,(%R8,%RBX,8) |
(319) 0x41d823 INC %EBX |
(319) 0x41d825 VMOVSD (%R15,%R13,8),%XMM1 |
(319) 0x41d82b VUCOMISD %XMM1,%XMM0 |
(319) 0x41d82f JBE 41d7a0 |
(319) 0x41d835 LEA (%R12,%R13,1),%R10D |
(319) 0x41d839 CMP $-0x3,%R10D |
(319) 0x41d83d JE 41d7a0 |
(319) 0x41d843 MOVSXD %EBX,%RBX |
(319) 0x41d846 LEA 0x3(%R13),%R10D |
(319) 0x41d84a MOV %R10D,(%RAX,%RBX,4) |
(319) 0x41d84e VMOVSD %XMM1,(%R8,%RBX,8) |
(319) 0x41d854 INC %EBX |
(319) 0x41d856 JMP 41d7a0 |
0x41d85b XOR %EDI,%EDI |
0x41d85d VMOVUPD 0x20(%RSP),%XMM12 |
0x41d863 VMOVAPD %YMM9,%YMM13 |
0x41d868 VMOVUPD 0x10(%RSP),%XMM0 |
0x41d86e VMOVUPD (%RSP),%XMM1 |
0x41d873 NOPW %CS:(%RAX,%RAX,1) |
(316) 0x41d880 VMOVSD (%R8,%RDI,8),%XMM2 |
(316) 0x41d886 VMOVSD %XMM2,0x40(%RSP) |
(316) 0x41d88c VMULSD %XMM2,%XMM3,%XMM2 |
(316) 0x41d890 VCVTTSD2SI %XMM2,%R8D |
(316) 0x41d894 VROUNDSD $0xb,%XMM2,%XMM2,%XMM3 |
(316) 0x41d89a MOVSXD %R8D,%R8 |
(316) 0x41d89d VMOVSD (%RSI,%R8,8),%XMM8 |
(316) 0x41d8a3 VMOVSD 0x8(%RSI,%R8,8),%XMM6 |
(316) 0x41d8aa VMOVSD 0x10(%RSI,%R8,8),%XMM5 |
(316) 0x41d8b1 VSUBSD %XMM3,%XMM2,%XMM2 |
(316) 0x41d8b5 VMOVSD 0x18(%RSI,%R8,8),%XMM3 |
(316) 0x41d8bc VMULSD %XMM2,%XMM2,%XMM7 |
(316) 0x41d8c0 VMULSD %XMM2,%XMM7,%XMM4 |
(316) 0x41d8c4 VMOVAPD %XMM2,%XMM9 |
(316) 0x41d8c8 VFMADD213SD 0x100(%RSP),%XMM1,%XMM9 |
(316) 0x41d8d2 VMOVAPD %YMM10,%YMM14 |
(316) 0x41d8d7 VMOVAPD %XMM2,%XMM10 |
(316) 0x41d8db VMULSD %XMM8,%XMM9,%XMM9 |
(316) 0x41d8e0 VMOVUPD 0x190(%RSP),%XMM1 |
(316) 0x41d8e9 VFMADD132SD 0xf0(%RSP),%XMM1,%XMM10 |
(316) 0x41d8f3 VMOVAPD %XMM2,%XMM11 |
(316) 0x41d8f7 VMOVUPD 0x170(%RSP),%XMM1 |
(316) 0x41d900 VFMADD132SD 0x180(%RSP),%XMM1,%XMM11 |
(316) 0x41d90a VUNPCKLPD %XMM2,%XMM7,%XMM7 |
(316) 0x41d90e VFMADD213SD %XMM9,%XMM6,%XMM10 |
(316) 0x41d913 VMOVUPD 0x150(%RSP),%XMM1 |
(316) 0x41d91c VFMADD132SD 0x160(%RSP),%XMM1,%XMM2 |
(316) 0x41d926 VMULPD 0x6a0(%RSP),%XMM7,%XMM9 |
(316) 0x41d92f VMOVAPD %XMM0,%XMM1 |
(316) 0x41d933 VMOVAPD %XMM15,%XMM0 |
(316) 0x41d937 VMOVAPD %YMM13,%YMM15 |
(316) 0x41d93c VMOVAPD %XMM12,%XMM13 |
(316) 0x41d941 VSHUFPD $0x1,%XMM9,%XMM9,%XMM12 |
(316) 0x41d947 VFMADD213SD %XMM10,%XMM5,%XMM11 |
(316) 0x41d94c VADDSD %XMM9,%XMM12,%XMM9 |
(316) 0x41d951 VADDSD 0x140(%RSP),%XMM9,%XMM9 |
(316) 0x41d95a VMULPD 0x680(%RSP),%XMM7,%XMM10 |
(316) 0x41d963 VMULSD %XMM8,%XMM9,%XMM9 |
(316) 0x41d968 VSHUFPD $0x1,%XMM10,%XMM10,%XMM12 |
(316) 0x41d96e VADDSD %XMM10,%XMM12,%XMM10 |
(316) 0x41d973 VADDSD 0x130(%RSP),%XMM10,%XMM10 |
(316) 0x41d97c VFMADD213SD %XMM11,%XMM3,%XMM2 |
(316) 0x41d981 VMULPD 0x1e0(%RSP),%XMM7,%XMM11 |
(316) 0x41d98a VSHUFPD $0x1,%XMM11,%XMM11,%XMM12 |
(316) 0x41d990 VADDSD %XMM11,%XMM12,%XMM11 |
(316) 0x41d995 VFMADD213SD %XMM9,%XMM6,%XMM10 |
(316) 0x41d99a VMULPD 0x1c0(%RSP),%XMM7,%XMM9 |
(316) 0x41d9a3 VMOVAPD %XMM4,%XMM12 |
(316) 0x41d9a7 VFMADD132SD 0xb0(%RSP),%XMM9,%XMM12 |
(316) 0x41d9b1 VSHUFPD $0x1,%XMM9,%XMM9,%XMM9 |
(316) 0x41d9b7 VADDSD 0xa0(%RSP),%XMM9,%XMM9 |
(316) 0x41d9c0 VADDSD %XMM9,%XMM12,%XMM9 |
(316) 0x41d9c5 VMOVAPD %XMM13,%XMM12 |
(316) 0x41d9ca VMOVAPD %YMM15,%YMM13 |
(316) 0x41d9cf VMOVAPD %XMM0,%XMM15 |
(316) 0x41d9d3 VMOVAPD %XMM1,%XMM0 |
(316) 0x41d9d7 VADDSD 0xd0(%RSP),%XMM11,%XMM11 |
(316) 0x41d9e0 VMULSD %XMM8,%XMM9,%XMM8 |
(316) 0x41d9e5 VFMADD213SD %XMM10,%XMM5,%XMM11 |
(316) 0x41d9ea VMULPD %XMM7,%XMM13,%XMM9 |
(316) 0x41d9ee VMOVAPD %XMM4,%XMM10 |
(316) 0x41d9f2 VFMADD213SD %XMM9,%XMM12,%XMM10 |
(316) 0x41d9f7 VSHUFPD $0x1,%XMM9,%XMM9,%XMM9 |
(316) 0x41d9fd VADDSD %XMM15,%XMM9,%XMM9 |
(316) 0x41da02 VADDSD %XMM9,%XMM10,%XMM9 |
(316) 0x41da07 VMOVAPD %YMM14,%YMM10 |
(316) 0x41da0c VMOVUPD 0x90(%RSP),%XMM14 |
(316) 0x41da15 VFMADD213SD %XMM8,%XMM6,%XMM9 |
(316) 0x41da1a VMULPD %XMM7,%XMM10,%XMM6 |
(316) 0x41da1e VMOVAPD %XMM4,%XMM8 |
(316) 0x41da22 VFMADD213SD %XMM6,%XMM1,%XMM8 |
(316) 0x41da27 VSHUFPD $0x1,%XMM6,%XMM6,%XMM6 |
(316) 0x41da2c VADDSD %XMM6,%XMM14,%XMM6 |
(316) 0x41da30 VADDSD %XMM6,%XMM8,%XMM6 |
(316) 0x41da34 VFMADD213SD %XMM9,%XMM5,%XMM6 |
(316) 0x41da39 VMOVUPD 0x1a0(%RSP),%YMM9 |
(316) 0x41da42 VMULPD 0x660(%RSP),%XMM7,%XMM5 |
(316) 0x41da4b VSHUFPD $0x1,%XMM5,%XMM5,%XMM8 |
(316) 0x41da50 VADDSD %XMM5,%XMM8,%XMM5 |
(316) 0x41da54 VMOVUPD 0x80(%RSP),%XMM8 |
(316) 0x41da5d VADDSD 0xc0(%RSP),%XMM5,%XMM5 |
(316) 0x41da66 VFMADD213SD %XMM11,%XMM3,%XMM5 |
(316) 0x41da6b VMOVUPD 0x120(%RSP),%XMM11 |
(316) 0x41da74 VMULPD %XMM7,%XMM9,%XMM7 |
(316) 0x41da78 VFMADD213SD %XMM7,%XMM8,%XMM4 |
(316) 0x41da7d VSHUFPD $0x1,%XMM7,%XMM7,%XMM7 |
(316) 0x41da82 VADDSD %XMM7,%XMM11,%XMM7 |
(316) 0x41da86 VADDSD %XMM7,%XMM4,%XMM4 |
(316) 0x41da8a VFMADD213SD %XMM6,%XMM3,%XMM4 |
(316) 0x41da8f VMOVUPD 0x110(%RSP),%XMM6 |
(316) 0x41da98 VMOVUPD 0xe0(%RSP),%XMM3 |
(316) 0x41daa1 MOVSXD (%RAX,%RDI,4),%R8 |
(316) 0x41daa5 ADD %R11,%R8 |
(316) 0x41daa8 VMULSD %XMM2,%XMM6,%XMM2 |
(316) 0x41daac VMOVSD %XMM2,(%RCX,%R8,8) |
(316) 0x41dab2 VMULSD %XMM3,%XMM5,%XMM2 |
(316) 0x41dab6 VDIVSD 0x40(%RSP),%XMM2,%XMM1 |
(316) 0x41dabc VMOVSD %XMM1,(%RDX,%R8,8) |
(316) 0x41dac2 VMOVUPD (%RSP),%XMM1 |
(316) 0x41dac7 VMOVSD %XMM4,(%R9,%R8,8) |
(316) 0x41dacd MOV 0x20(%RBP),%R8 |
(316) 0x41dad1 INC %RDI |
(316) 0x41dad4 CMP %RDI,%RBX |
(316) 0x41dad7 JNE 41d880 |
0x41dadd LEA -0x28(%RBP),%RSP |
0x41dae1 POP %RBX |
0x41dae2 POP %R12 |
0x41dae4 POP %R13 |
0x41dae6 POP %R14 |
0x41dae8 POP %R15 |
0x41daea POP %RBP |
0x41daeb VZEROUPPER |
0x41daee RET |
0x41daef NOP |
Path / |
Source file and lines | BsplineFunctor.h:276-339 |
Module | exec |
nb instructions | 220 |
nb uops | 221 |
loop length | 1391 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 16 |
used ymm registers | 13 |
used zmm registers | 0 |
nb stack references | 70 |
micro-operation queue | 36.83 cycles |
front end | 36.83 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 5.70 | 5.80 | 24.33 | 24.33 | 36.00 | 26.00 | 5.70 | 36.00 | 36.00 | 36.00 | 5.80 | 24.33 |
cycles | 5.70 | 5.80 | 24.33 | 24.33 | 36.00 | 26.00 | 5.70 | 36.00 | 36.00 | 36.00 | 5.80 | 24.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 36.88 |
Stall cycles | 0.00 |
Front-end | 36.83 |
Dispatch | 36.00 |
Overall L1 | 36.83 |
all | 3% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 5% |
all | 64% |
load | 38% |
store | 100% |
mul | 0% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 26% |
all | 55% |
load | 34% |
store | 96% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 20% |
all | 9% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 9% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 8% |
all | 30% |
load | 19% |
store | 41% |
mul | 12% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 21% |
all | 27% |
load | 18% |
store | 40% |
mul | 12% |
add-sub | 9% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 17% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
SUB %EDX,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
TEST %ECX,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 41daeb <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0xc0b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x6e0,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R8,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVSXD %EDX,%R11 | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
VMOVSD 0x8(%RDI),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %ECX,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP $0x4,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 41d777 <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0x897> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R14D,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %R14,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 41cf67 <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0x87> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SUB %EDX,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x40(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RDX,%R11,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 41cf48 <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0x68> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %EBX,%EBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 41dadd <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0xbfd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD 0x238(%RDI),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x218(%RDI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x128(%RDI),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM0,(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x130(%RDI),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM0,0x100(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x148(%RDI),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM0,0xf0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x150(%RDI),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x168(%RDI),%XMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x170(%RDI),%XMM13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x188(%RDI),%XMM14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x190(%RDI),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPD 0xa0(%RDI),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVSD 0xb0(%RDI),%XMM12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPD 0xc0(%RDI),%XMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVSD 0xd0(%RDI),%XMM8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS 0xe0(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPS %YMM1,0x1e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0xf0(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0xd0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD 0x100(%RDI),%XMM11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VMOVSD 0x110(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x18(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPS 0x20(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPS %YMM1,0x1c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x30(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x38(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD 0x40(%RDI),%XMM9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVSD 0x50(%RDI),%XMM15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x58(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD 0x60(%RDI),%XMM10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVSD 0x70(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x78(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPS 0x80(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPS %YMM1,0x1a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x90(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $-0x4,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VMULSD %XMM3,%XMM3,%XMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
AND %RBX,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
VMOVUPD %XMM3,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPS %XMM0,0x190(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM2,0x180(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPS %XMM13,0x170(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM14,0x160(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM4,0x150(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM5,0x6a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPS %XMM12,0x140(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM7,0x680(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM8,0x130(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM11,0x660(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM1,0x120(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM6,0x110(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
JE 41d85b <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0x97b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RBX,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVUPD %XMM15,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM3,%YMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VBROADCASTSD (%RSP),%YMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM3,0x600(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVAPD %YMM10,%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.17 |
VBROADCASTSD 0x100(%RSP),%YMM10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM10,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVAPD %XMM1,%XMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.17 |
VBROADCASTSD 0xf0(%RSP),%YMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM1,0x640(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM0,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM0,0x620(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM2,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x5e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM13,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM0,0x5c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM14,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x5a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM4,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x580(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM6,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x560(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM5,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x540(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPERMPD $0x55,%YMM5,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x520(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM12,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM0,0x500(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM7,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x4e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPERMPD $0x55,%YMM7,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x4c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM8,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x4a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVUPS 0x1e0(%RSP),%YMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VBROADCASTSD %XMM1,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM0,0x480(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPERMPD $0x55,%YMM1,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM0,0x460(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0xd0(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x440(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM11,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x420(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPERMPD $0x55,%YMM11,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x400(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0xc0(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x3e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0xb0(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x3c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD 0x1c0(%RSP),%YMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VBROADCASTSD %XMM1,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x3a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPERMPD $0x55,%YMM1,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x380(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0xa0(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x360(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0x20(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x340(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM9,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x320(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM9,0x220(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPERMPD $0x55,%YMM9,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x300(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0x70(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x2e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0x10(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x2c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM3,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x2a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM3,0x200(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPERMPD $0x55,%YMM3,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x280(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0x90(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x260(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0x80(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x240(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD 0x1a0(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VBROADCASTSD %XMM0,%YMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPERMPD $0x55,%YMM0,%YMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM10,%YMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ 0xd8f0c(%RIP),%YMM13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VPBROADCASTQ 0xd8f0b(%RIP),%YMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VPBROADCASTQ 0xd8f0a(%RIP),%YMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x38(%RSP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RBX,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VMOVUPD (%RSP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0xe0(%RSP),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x20(%RSP),%XMM12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x220(%RSP),%YMM13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x70(%RSP),%XMM15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x10(%RSP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x200(%RSP),%YMM10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
JNE 41d880 <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0x9a0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 41dadd <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0xbfd> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R14D,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV 0x40(%RSP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R10,%R11,8),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD $0x18,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %EDX,%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %ESI,%R12D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R13D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 41d7ad <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0x8cd> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVUPD 0x20(%RSP),%XMM12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVAPD %YMM9,%YMM13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.17 |
VMOVUPD 0x10(%RSP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD (%RSP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | BsplineFunctor.h:276-339 |
Module | exec |
nb instructions | 220 |
nb uops | 221 |
loop length | 1391 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 16 |
used ymm registers | 13 |
used zmm registers | 0 |
nb stack references | 70 |
micro-operation queue | 36.83 cycles |
front end | 36.83 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 5.70 | 5.80 | 24.33 | 24.33 | 36.00 | 26.00 | 5.70 | 36.00 | 36.00 | 36.00 | 5.80 | 24.33 |
cycles | 5.70 | 5.80 | 24.33 | 24.33 | 36.00 | 26.00 | 5.70 | 36.00 | 36.00 | 36.00 | 5.80 | 24.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 36.88 |
Stall cycles | 0.00 |
Front-end | 36.83 |
Dispatch | 36.00 |
Overall L1 | 36.83 |
all | 3% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 5% |
all | 64% |
load | 38% |
store | 100% |
mul | 0% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 26% |
all | 55% |
load | 34% |
store | 96% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 20% |
all | 9% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 9% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 8% |
all | 30% |
load | 19% |
store | 41% |
mul | 12% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 21% |
all | 27% |
load | 18% |
store | 40% |
mul | 12% |
add-sub | 9% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 17% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
SUB %EDX,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
TEST %ECX,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 41daeb <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0xc0b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x6e0,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R8,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVSXD %EDX,%R11 | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
VMOVSD 0x8(%RDI),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %ECX,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP $0x4,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 41d777 <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0x897> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R14D,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %R14,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 41cf67 <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0x87> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SUB %EDX,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x40(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RDX,%R11,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 41cf48 <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0x68> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %EBX,%EBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 41dadd <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0xbfd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD 0x238(%RDI),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x218(%RDI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x128(%RDI),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM0,(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x130(%RDI),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM0,0x100(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x148(%RDI),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM0,0xf0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x150(%RDI),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x168(%RDI),%XMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x170(%RDI),%XMM13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x188(%RDI),%XMM14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x190(%RDI),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPD 0xa0(%RDI),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVSD 0xb0(%RDI),%XMM12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPD 0xc0(%RDI),%XMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVSD 0xd0(%RDI),%XMM8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS 0xe0(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPS %YMM1,0x1e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0xf0(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0xd0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD 0x100(%RDI),%XMM11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VMOVSD 0x110(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x18(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPS 0x20(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPS %YMM1,0x1c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x30(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x38(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD 0x40(%RDI),%XMM9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVSD 0x50(%RDI),%XMM15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x58(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD 0x60(%RDI),%XMM10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVSD 0x70(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x78(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPS %XMM1,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPS 0x80(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPS %YMM1,0x1a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD 0x90(%RDI),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $-0x4,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VMULSD %XMM3,%XMM3,%XMM6 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
AND %RBX,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
VMOVUPD %XMM3,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPS %XMM0,0x190(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM2,0x180(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPS %XMM13,0x170(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM14,0x160(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM4,0x150(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM5,0x6a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPS %XMM12,0x140(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM7,0x680(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM8,0x130(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM11,0x660(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM1,0x120(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM6,0x110(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
JE 41d85b <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0x97b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RBX,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVUPD %XMM15,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM3,%YMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VBROADCASTSD (%RSP),%YMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM3,0x600(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVAPD %YMM10,%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.17 |
VBROADCASTSD 0x100(%RSP),%YMM10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM10,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVAPD %XMM1,%XMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.17 |
VBROADCASTSD 0xf0(%RSP),%YMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM1,0x640(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM0,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM0,0x620(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM2,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x5e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM13,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM0,0x5c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM14,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x5a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM4,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x580(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM6,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x560(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM5,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x540(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPERMPD $0x55,%YMM5,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x520(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM12,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM0,0x500(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM7,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x4e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPERMPD $0x55,%YMM7,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x4c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM8,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x4a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVUPS 0x1e0(%RSP),%YMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VBROADCASTSD %XMM1,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM0,0x480(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPERMPD $0x55,%YMM1,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPS %YMM0,0x460(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0xd0(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x440(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM11,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x420(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPERMPD $0x55,%YMM11,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x400(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0xc0(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x3e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0xb0(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x3c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD 0x1c0(%RSP),%YMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VBROADCASTSD %XMM1,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x3a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPERMPD $0x55,%YMM1,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x380(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0xa0(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x360(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0x20(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x340(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM9,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x320(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM9,0x220(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPERMPD $0x55,%YMM9,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x300(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0x70(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x2e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0x10(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x2c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM3,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x2a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %YMM3,0x200(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPERMPD $0x55,%YMM3,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x280(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0x90(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x260(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD 0x80(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVUPS %YMM0,0x240(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD 0x1a0(%RSP),%YMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VBROADCASTSD %XMM0,%YMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPERMPD $0x55,%YMM0,%YMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM10,%YMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ 0xd8f0c(%RIP),%YMM13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VPBROADCASTQ 0xd8f0b(%RIP),%YMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VPBROADCASTQ 0xd8f0a(%RIP),%YMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x38(%RSP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RBX,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VMOVUPD (%RSP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0xe0(%RSP),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x20(%RSP),%XMM12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x220(%RSP),%YMM13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x70(%RSP),%XMM15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x10(%RSP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD 0x200(%RSP),%YMM10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
JNE 41d880 <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0x9a0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 41dadd <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0xbfd> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R14D,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV 0x40(%RSP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R10,%R11,8),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD $0x18,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %EDX,%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %ESI,%R12D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R13D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 41d7ad <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi+0x8cd> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVUPD 0x20(%RSP),%XMM12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVAPD %YMM9,%YMM13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.17 |
VMOVUPD 0x10(%RSP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVUPD (%RSP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi– | 0.64 | 0.66 |
○Loop 319 - BsplineFunctor.h:291-298 - exec | 0.53 | 0.54 |
○Loop 317 - BsplineFunctor.h:302-335 - exec | 0.07 | 0.07 |
○Loop 316 - BsplineFunctor.h:302-336 - exec | 0.01 | 0.01 |
○Loop 318 - BsplineFunctor.h:291-298 - exec | 0 | 0 |