Function: .omp_outlined.#0xc138b0 | Module: libgromacs_mpi.so.9.0.0 | Source: pme_spread.cpp:75-923 [...] | Coverage (incl. loops): 0.17% | (excl. loops): 0.00% |
---|
Function: .omp_outlined.#0xc138b0 | Module: libgromacs_mpi.so.9.0.0 | Source: pme_spread.cpp:75-923 [...] | Coverage (incl. loops): 0.17% | (excl. loops): 0.00% |
---|
/home/eoseret/gromacs-2024.2/src/gromacs/ewald/pme_internal.h: 209 - 209 |
-------------------------------------------------------------------------------- |
209: int numAtoms() const { return numAtoms_; } |
/home/eoseret/gromacs-2024.2/src/gromacs/ewald/pme_spread.cpp: 75 - 923 |
-------------------------------------------------------------------------------- |
75: nx = pme->nkx; |
76: ny = pme->nky; |
77: nz = pme->nkz; |
78: |
79: rxx = pme->recipbox[XX][XX]; |
80: ryx = pme->recipbox[YY][XX]; |
81: ryy = pme->recipbox[YY][YY]; |
82: rzx = pme->recipbox[ZZ][XX]; |
83: rzy = pme->recipbox[ZZ][YY]; |
84: rzz = pme->recipbox[ZZ][ZZ]; |
85: |
86: g2tx = pme->pmegrid[grid_index].g2t[XX]; |
87: g2ty = pme->pmegrid[grid_index].g2t[YY]; |
88: g2tz = pme->pmegrid[grid_index].g2t[ZZ]; |
89: |
90: bThreads = (atc->nthread > 1); |
91: if (bThreads) |
92: { |
93: thread_idx = atc->thread_idx.data(); |
94: |
95: tpl_n = atc->threadMap[thread].n; |
96: for (i = 0; i < atc->nthread; i++) |
97: { |
98: tpl_n[i] = 0; |
[...] |
104: for (i = start; i < end; i++) |
[...] |
111: tx = nx * (xptr[XX] * rxx + xptr[YY] * ryx + xptr[ZZ] * rzx + shift); |
112: ty = ny * (xptr[YY] * ryy + xptr[ZZ] * rzy + shift); |
113: tz = nz * (xptr[ZZ] * rzz + shift); |
114: |
115: tix = static_cast<int>(tx); |
116: tiy = static_cast<int>(ty); |
117: tiz = static_cast<int>(tz); |
[...] |
127: fptr[XX] = tx - tix + pme->fshx[tix]; |
128: fptr[YY] = ty - tiy + pme->fshy[tiy]; |
129: fptr[ZZ] = tz - tiz; |
130: |
131: idxptr[XX] = pme->nnx[tix]; |
132: idxptr[YY] = pme->nny[tiy]; |
133: idxptr[ZZ] = pme->nnz[tiz]; |
[...] |
143: thread_i = g2tx[idxptr[XX]] + g2ty[idxptr[YY]] + g2tz[idxptr[ZZ]]; |
144: thread_idx[i] = thread_i; |
145: tpl_n[thread_i]++; |
146: } |
147: } |
148: |
149: if (bThreads) |
150: { |
151: /* Make a list of particle indices sorted on thread */ |
152: |
153: /* Get the cumulative count */ |
154: for (i = 1; i < atc->nthread; i++) |
155: { |
156: tpl_n[i] += tpl_n[i - 1]; |
[...] |
163: threadMap.i.resize(tpl_n[atc->nthread - 1]); |
164: /* Set tpl_n to the cumulative start */ |
165: for (i = atc->nthread - 1; i >= 1; i--) |
166: { |
167: tpl_n[i] = tpl_n[i - 1]; |
168: } |
169: tpl_n[0] = 0; |
170: |
171: /* Fill our thread local array with indices sorted on thread */ |
172: for (i = start; i < end; i++) |
173: { |
174: threadMap.i[tpl_n[atc->thread_idx[i]]++] = i; |
[...] |
910: #pragma omp parallel for num_threads(nthread) schedule(static) |
911: for (int thread = 0; thread < nthread; thread++) |
[...] |
917: start = atc->numAtoms() * thread / nthread; |
918: end = atc->numAtoms() * (thread + 1) / nthread; |
919: |
920: /* Compute fftgrid index for all atoms, |
921: * with help of some extra variables. |
922: */ |
923: calc_interpolation_idx(pme, atc, start, grid_index, end, thread); |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/stl_vector.h: 919 - 1798 |
-------------------------------------------------------------------------------- |
919: { return size_type(this->_M_impl._M_finish - this->_M_impl._M_start); } |
[...] |
939: if (__new_size > size()) |
940: _M_default_append(__new_size - size()); |
941: else if (__new_size < size()) |
942: _M_erase_at_end(this->_M_impl._M_start + __new_size); |
[...] |
1046: return *(this->_M_impl._M_start + __n); |
[...] |
1169: { return _M_data_ptr(this->_M_impl._M_start); } |
[...] |
1794: if (size_type __n = this->_M_impl._M_finish - __pos) |
1795: { |
1796: std::_Destroy(__pos, this->_M_impl._M_finish, |
1797: _M_get_Tp_allocator()); |
1798: this->_M_impl._M_finish = __pos; |
/home/eoseret/gromacs-2024.2/src/external/boost/stl_interfaces/iterator_interface.hpp: 305 - 305 |
-------------------------------------------------------------------------------- |
305: D retval = derived(); |
0xc138b0 PUSH %RBP |
0xc138b1 MOV %RSP,%RBP |
0xc138b4 PUSH %R15 |
0xc138b6 PUSH %R14 |
0xc138b8 PUSH %R13 |
0xc138ba PUSH %R12 |
0xc138bc PUSH %RBX |
0xc138bd SUB $0x88,%RSP |
0xc138c4 MOV %R9,-0x70(%RBP) |
0xc138c8 MOV %R8,-0x68(%RBP) |
0xc138cc MOV %RCX,-0x60(%RBP) |
0xc138d0 MOV %RDX,-0x58(%RBP) |
0xc138d4 MOV (%RDX),%EBX |
0xc138d6 TEST %EBX,%EBX |
0xc138d8 JLE c1394c |
0xc138da DEC %EBX |
0xc138dc MOVL $0,-0x38(%RBP) |
0xc138e3 MOV %EBX,-0x2c(%RBP) |
0xc138e6 MOVL $0x1,-0x44(%RBP) |
0xc138ed MOVL $0,-0x40(%RBP) |
0xc138f4 MOV (%RDI),%ESI |
0xc138f6 SUB $0x8,%RSP |
0xc138fa LEA -0x44(%RBP),%RAX |
0xc138fe LEA 0x3cb1db(%RIP),%RDI |
0xc13905 LEA -0x40(%RBP),%RCX |
0xc13909 LEA -0x38(%RBP),%R8 |
0xc1390d LEA -0x2c(%RBP),%R9 |
0xc13911 MOV %ESI,-0x3c(%RBP) |
0xc13914 MOV $0x22,%EDX |
0xc13919 PUSH $0x1 |
0xc1391b PUSH $0x1 |
0xc1391d PUSH %RAX |
0xc1391e CALL fa67e0 <@plt_start@+0x3330> |
0xc13923 ADD $0x20,%RSP |
0xc13927 MOV -0x2c(%RBP),%EAX |
0xc1392a CMP %EBX,%EAX |
0xc1392c CMOVL %EAX,%EBX |
0xc1392f MOV %EBX,-0x2c(%RBP) |
0xc13932 MOVSXD -0x38(%RBP),%RAX |
0xc13936 CMP %EBX,%EAX |
0xc13938 JLE c1395e |
0xc1393a LEA 0x3cb1b7(%RIP),%RDI |
0xc13941 MOV -0x3c(%RBP),%ESI |
0xc13944 VZEROUPPER |
0xc13947 CALL fa67f0 <@plt_start@+0x3340> |
0xc1394c ADD $0x88,%RSP |
0xc13953 POP %RBX |
0xc13954 POP %R12 |
0xc13956 POP %R13 |
0xc13958 POP %R14 |
0xc1395a POP %R15 |
0xc1395c POP %RBP |
0xc1395d RET |
0xc1395e VMOVSS -0x8b7426(%RIP),%XMM13 |
0xc13966 JMP c1397d |
(1387) 0xc13970 MOVSXD -0x2c(%RBP),%RAX |
(1387) 0xc13974 CMP %RAX,%R12 |
(1387) 0xc13977 MOV -0x78(%RBP),%RAX |
(1387) 0xc1397b JGE c1393a |
(1387) 0xc1397d MOV %RAX,%R9 |
(1387) 0xc13980 MOV -0x60(%RBP),%RAX |
(1387) 0xc13984 MOV (%RAX),%R13 |
(1387) 0xc13987 MOV 0x78(%R13),%ECX |
(1387) 0xc1398b MOV 0x130(%R13),%EBX |
(1387) 0xc13992 MOV %ECX,%EAX |
(1387) 0xc13994 IMUL %R9D,%EAX |
(1387) 0xc13998 MOV -0x58(%RBP),%RDX |
(1387) 0xc1399c MOV (%RDX),%ESI |
(1387) 0xc1399e CLTD |
(1387) 0xc1399f IDIV %ESI |
(1387) 0xc139a1 MOV %EAX,%R11D |
(1387) 0xc139a4 LEA 0x1(%R9),%RAX |
(1387) 0xc139a8 MOV %RAX,-0x78(%RBP) |
(1387) 0xc139ac IMUL %ECX,%EAX |
(1387) 0xc139af CLTD |
(1387) 0xc139b0 IDIV %ESI |
(1387) 0xc139b2 MOV %EAX,%R10D |
(1387) 0xc139b5 MOV -0x68(%RBP),%RAX |
(1387) 0xc139b9 MOV (%RAX),%RCX |
(1387) 0xc139bc MOV -0x70(%RBP),%RAX |
(1387) 0xc139c0 MOVSXD (%RAX),%RAX |
(1387) 0xc139c3 MOV 0x3c(%RCX),%EDX |
(1387) 0xc139c6 MOV 0x40(%RCX),%ESI |
(1387) 0xc139c9 MOV 0x44(%RCX),%EDI |
(1387) 0xc139cc VMOVSS 0x5d0(%RCX),%XMM0 |
(1387) 0xc139d4 VMOVSS 0x5dc(%RCX),%XMM1 |
(1387) 0xc139dc VMOVSS 0x5e0(%RCX),%XMM2 |
(1387) 0xc139e4 VMOVSS 0x5e8(%RCX),%XMM3 |
(1387) 0xc139ec VMOVSS 0x5ec(%RCX),%XMM4 |
(1387) 0xc139f4 VMOVSS 0x5f0(%RCX),%XMM5 |
(1387) 0xc139fc MOV %RAX,%R8 |
(1387) 0xc139ff SAL $0x7,%R8 |
(1387) 0xc13a03 LEA (%R8,%RAX,8),%RAX |
(1387) 0xc13a07 MOV 0xe0(%RCX,%RAX,1),%R8 |
(1387) 0xc13a0f MOV %R8,-0xa8(%RBP) |
(1387) 0xc13a16 MOV 0xe8(%RCX,%RAX,1),%R12 |
(1387) 0xc13a1e MOV 0xf0(%RCX,%RAX,1),%RAX |
(1387) 0xc13a26 MOV %RAX,-0xb0(%RBP) |
(1387) 0xc13a2d MOV %EBX,-0x34(%RBP) |
(1387) 0xc13a30 CMP $0x2,%EBX |
(1387) 0xc13a33 MOV %R9,-0x80(%RBP) |
(1387) 0xc13a37 JL c13a90 |
(1387) 0xc13a39 MOV 0x138(%R13),%RBX |
(1387) 0xc13a40 MOV 0x150(%R13),%RAX |
(1387) 0xc13a47 IMUL $0x38,%R9,%R8 |
(1387) 0xc13a4b MOV (%RAX,%R8,1),%R14 |
(1387) 0xc13a4f XOR %EAX,%EAX |
(1387) 0xc13a51 NOPW %CS:(%RAX,%RAX,1) |
(1396) 0xc13a60 MOVL $0,(%R14,%RAX,4) |
(1396) 0xc13a68 INC %RAX |
(1396) 0xc13a6b MOVSXD 0x130(%R13),%R8 |
(1396) 0xc13a72 CMP %R8,%RAX |
(1396) 0xc13a75 JL c13a60 |
(1387) 0xc13a77 MOV %R10,-0x50(%RBP) |
(1387) 0xc13a7b MOV %R11D,-0x30(%RBP) |
(1387) 0xc13a7f CMP %R10D,%R11D |
(1387) 0xc13a82 JL c13aa6 |
(1387) 0xc13a84 JMP c13d4c |
(1387) 0xc13a90 XOR %R14D,%R14D |
(1387) 0xc13a93 XOR %EBX,%EBX |
(1387) 0xc13a95 MOV %R10,-0x50(%RBP) |
(1387) 0xc13a99 MOV %R11D,-0x30(%RBP) |
(1387) 0xc13a9d CMP %R10D,%R11D |
(1387) 0xc13aa0 JGE c13d4c |
(1387) 0xc13aa6 MOV 0x100(%R13),%RAX |
(1387) 0xc13aad VCVTSI2SS %EDX,%XMM14,%XMM6 |
(1387) 0xc13ab1 VCVTSI2SS %ESI,%XMM14,%XMM7 |
(1387) 0xc13ab5 MOV 0x118(%R13),%RDX |
(1387) 0xc13abc VCVTSI2SS %EDI,%XMM14,%XMM8 |
(1387) 0xc13ac0 MOV 0x5a0(%RCX),%RSI |
(1387) 0xc13ac7 MOV 0x5a8(%RCX),%RDI |
(1387) 0xc13ace MOV 0x588(%RCX),%R8 |
(1387) 0xc13ad5 MOV 0x590(%RCX),%R9 |
(1387) 0xc13adc MOV 0x598(%RCX),%R10 |
(1387) 0xc13ae3 MOVSXD -0x30(%RBP),%R15 |
(1387) 0xc13ae7 MOVSXD -0x50(%RBP),%R11 |
(1387) 0xc13aeb LEA (%R15,%R15,2),%RCX |
(1387) 0xc13aef CMPL $0x1,-0x34(%RBP) |
(1387) 0xc13af3 JLE c13c70 |
(1387) 0xc13af9 LEA 0x8(,%RCX,4),%RCX |
(1387) 0xc13b01 MOV %R12,-0x98(%RBP) |
(1387) 0xc13b08 MOV %RBX,-0x88(%RBP) |
(1387) 0xc13b0f MOV %R14,-0xa0(%RBP) |
(1387) 0xc13b16 MOV %R10,-0x90(%RBP) |
(1387) 0xc13b1d NOPL (%RAX) |
(1395) 0xc13b20 MOV %R9,%R14 |
(1395) 0xc13b23 MOV %R8,%R10 |
(1395) 0xc13b26 MOV %RDI,%R9 |
(1395) 0xc13b29 MOV %RSI,%R8 |
(1395) 0xc13b2c MOV %R13,%RDI |
(1395) 0xc13b2f MOV 0x80(%R13),%R13 |
(1395) 0xc13b36 VMOVSS -0x4(%R13,%RCX,1),%XMM9 |
(1395) 0xc13b3d VMOVSS (%R13,%RCX,1),%XMM10 |
(1395) 0xc13b44 VMULSS %XMM1,%XMM9,%XMM11 |
(1395) 0xc13b48 VFMADD231SS -0x8(%R13,%RCX,1),%XMM0,%XMM11 |
(1395) 0xc13b4f VFMADD231SS %XMM3,%XMM10,%XMM11 |
(1395) 0xc13b54 VADDSS %XMM13,%XMM11,%XMM11 |
(1395) 0xc13b59 VMULSS %XMM6,%XMM11,%XMM11 |
(1395) 0xc13b5d VMULSS %XMM4,%XMM10,%XMM12 |
(1395) 0xc13b61 VFMADD231SS %XMM9,%XMM2,%XMM12 |
(1395) 0xc13b66 VADDSS %XMM13,%XMM12,%XMM9 |
(1395) 0xc13b6b VMULSS %XMM7,%XMM9,%XMM9 |
(1395) 0xc13b6f VFMADD213SS %XMM13,%XMM5,%XMM10 |
(1395) 0xc13b74 VMULSS %XMM8,%XMM10,%XMM10 |
(1395) 0xc13b79 VCVTTSS2SI %XMM11,%R13D |
(1395) 0xc13b7e VCVTTSS2SI %XMM9,%EBX |
(1395) 0xc13b83 VCVTTSS2SI %XMM10,%R12D |
(1395) 0xc13b88 VCVTTPS2DQ %XMM11,%XMM12 |
(1395) 0xc13b8d VCVTDQ2PS %XMM12,%XMM12 |
(1395) 0xc13b92 VSUBSS %XMM12,%XMM11,%XMM11 |
(1395) 0xc13b97 MOVSXD %R13D,%R13 |
(1395) 0xc13b9a VADDSS (%RSI,%R13,4),%XMM11,%XMM11 |
(1395) 0xc13ba0 VMOVSS %XMM11,-0x8(%RDX,%RCX,1) |
(1395) 0xc13ba6 VCVTTPS2DQ %XMM9,%XMM11 |
(1395) 0xc13bab VCVTDQ2PS %XMM11,%XMM11 |
(1395) 0xc13bb0 VSUBSS %XMM11,%XMM9,%XMM9 |
(1395) 0xc13bb5 MOVSXD %EBX,%RBX |
(1395) 0xc13bb8 VADDSS (%R9,%RBX,4),%XMM9,%XMM9 |
(1395) 0xc13bbe VMOVSS %XMM9,-0x4(%RDX,%RCX,1) |
(1395) 0xc13bc4 VCVTTPS2DQ %XMM10,%XMM9 |
(1395) 0xc13bc9 VCVTDQ2PS %XMM9,%XMM9 |
(1395) 0xc13bce VSUBSS %XMM9,%XMM10,%XMM9 |
(1395) 0xc13bd3 VMOVSS %XMM9,(%RDX,%RCX,1) |
(1395) 0xc13bd8 MOVSXD (%R10,%R13,4),%R13 |
(1395) 0xc13bdc MOV %R13D,-0x8(%RAX,%RCX,1) |
(1395) 0xc13be1 MOVSXD (%R14,%RBX,4),%RBX |
(1395) 0xc13be5 MOV %EBX,-0x4(%RAX,%RCX,1) |
(1395) 0xc13be9 MOVSXD %R12D,%R12 |
(1395) 0xc13bec MOV -0x90(%RBP),%RSI |
(1395) 0xc13bf3 MOVSXD (%RSI,%R12,4),%R12 |
(1395) 0xc13bf7 MOV %R12D,(%RAX,%RCX,1) |
(1395) 0xc13bfb MOV %RDX,%RSI |
(1395) 0xc13bfe MOV %RAX,%RDX |
(1395) 0xc13c01 MOV -0x98(%RBP),%RAX |
(1395) 0xc13c08 MOVSXD (%RAX,%RBX,4),%RBX |
(1395) 0xc13c0c MOV %RDX,%RAX |
(1395) 0xc13c0f MOV %RSI,%RDX |
(1395) 0xc13c12 MOV -0xb0(%RBP),%RSI |
(1395) 0xc13c19 MOVSXD (%RSI,%R12,4),%R12 |
(1395) 0xc13c1d ADD %RBX,%R12 |
(1395) 0xc13c20 MOV -0xa8(%RBP),%RBX |
(1395) 0xc13c27 MOVSXD (%RBX,%R13,4),%RBX |
(1395) 0xc13c2b MOV %RDI,%R13 |
(1395) 0xc13c2e MOV %R8,%RSI |
(1395) 0xc13c31 MOV %R9,%RDI |
(1395) 0xc13c34 MOV %R10,%R8 |
(1395) 0xc13c37 MOV %R14,%R9 |
(1395) 0xc13c3a MOV -0xa0(%RBP),%R14 |
(1395) 0xc13c41 ADD %RBX,%R12 |
(1395) 0xc13c44 MOV -0x88(%RBP),%RBX |
(1395) 0xc13c4b MOV %R12D,(%RBX,%R15,4) |
(1395) 0xc13c4f INCL (%R14,%R12,4) |
(1395) 0xc13c53 INC %R15 |
(1395) 0xc13c56 ADD $0xc,%RCX |
(1395) 0xc13c5a CMP %R15,%R11 |
(1395) 0xc13c5d JNE c13b20 |
(1387) 0xc13c63 JMP c13d4c |
(1387) 0xc13c70 SUB %R15,%R11 |
(1387) 0xc13c73 LEA 0x8(,%RCX,4),%RCX |
(1387) 0xc13c7b NOPL (%RAX,%RAX,1) |
(1394) 0xc13c80 MOV 0x80(%R13),%RBX |
(1394) 0xc13c87 VMOVSS -0x4(%RBX,%RCX,1),%XMM9 |
(1394) 0xc13c8d VMOVSS (%RBX,%RCX,1),%XMM10 |
(1394) 0xc13c92 VMULSS %XMM1,%XMM9,%XMM11 |
(1394) 0xc13c96 VFMADD231SS -0x8(%RBX,%RCX,1),%XMM0,%XMM11 |
(1394) 0xc13c9d VFMADD231SS %XMM3,%XMM10,%XMM11 |
(1394) 0xc13ca2 VADDSS %XMM13,%XMM11,%XMM11 |
(1394) 0xc13ca7 VMULSS %XMM6,%XMM11,%XMM11 |
(1394) 0xc13cab VMULSS %XMM4,%XMM10,%XMM12 |
(1394) 0xc13caf VFMADD231SS %XMM9,%XMM2,%XMM12 |
(1394) 0xc13cb4 VADDSS %XMM13,%XMM12,%XMM9 |
(1394) 0xc13cb9 VMULSS %XMM7,%XMM9,%XMM9 |
(1394) 0xc13cbd VFMADD213SS %XMM13,%XMM5,%XMM10 |
(1394) 0xc13cc2 VMULSS %XMM8,%XMM10,%XMM10 |
(1394) 0xc13cc7 VCVTTSS2SI %XMM11,%EBX |
(1394) 0xc13ccc VCVTTSS2SI %XMM9,%R15D |
(1394) 0xc13cd1 VCVTTSS2SI %XMM10,%R12D |
(1394) 0xc13cd6 VCVTTPS2DQ %XMM11,%XMM12 |
(1394) 0xc13cdb VCVTDQ2PS %XMM12,%XMM12 |
(1394) 0xc13ce0 VSUBSS %XMM12,%XMM11,%XMM11 |
(1394) 0xc13ce5 MOVSXD %EBX,%RBX |
(1394) 0xc13ce8 VADDSS (%RSI,%RBX,4),%XMM11,%XMM11 |
(1394) 0xc13ced VMOVSS %XMM11,-0x8(%RDX,%RCX,1) |
(1394) 0xc13cf3 VCVTTPS2DQ %XMM9,%XMM11 |
(1394) 0xc13cf8 VCVTDQ2PS %XMM11,%XMM11 |
(1394) 0xc13cfd VSUBSS %XMM11,%XMM9,%XMM9 |
(1394) 0xc13d02 MOVSXD %R15D,%R15 |
(1394) 0xc13d05 VADDSS (%RDI,%R15,4),%XMM9,%XMM9 |
(1394) 0xc13d0b VMOVSS %XMM9,-0x4(%RDX,%RCX,1) |
(1394) 0xc13d11 VCVTTPS2DQ %XMM10,%XMM9 |
(1394) 0xc13d16 VCVTDQ2PS %XMM9,%XMM9 |
(1394) 0xc13d1b VSUBSS %XMM9,%XMM10,%XMM9 |
(1394) 0xc13d20 VMOVSS %XMM9,(%RDX,%RCX,1) |
(1394) 0xc13d25 MOV (%R8,%RBX,4),%EBX |
(1394) 0xc13d29 MOV %EBX,-0x8(%RAX,%RCX,1) |
(1394) 0xc13d2d MOV (%R9,%R15,4),%EBX |
(1394) 0xc13d31 MOV %EBX,-0x4(%RAX,%RCX,1) |
(1394) 0xc13d35 MOVSXD %R12D,%RBX |
(1394) 0xc13d38 MOV (%R10,%RBX,4),%EBX |
(1394) 0xc13d3c MOV %EBX,(%RAX,%RCX,1) |
(1394) 0xc13d3f ADD $0xc,%RCX |
(1394) 0xc13d43 DEC %R11 |
(1394) 0xc13d46 JNE c13c80 |
(1387) 0xc13d4c CMPL $0x2,-0x34(%RBP) |
(1387) 0xc13d50 MOV -0x80(%RBP),%R12 |
(1387) 0xc13d54 MOV -0x50(%RBP),%R15 |
(1387) 0xc13d58 MOV -0x30(%RBP),%EBX |
(1387) 0xc13d5b JL c13970 |
(1387) 0xc13d61 MOV 0x130(%R13),%EDX |
(1387) 0xc13d68 CMP $0x2,%EDX |
(1387) 0xc13d6b JL c13d97 |
(1387) 0xc13d6d MOV (%R14),%EAX |
(1387) 0xc13d70 MOV $0x1,%ECX |
(1387) 0xc13d75 NOPW %CS:(%RAX,%RAX,1) |
(1393) 0xc13d80 ADD (%R14,%RCX,4),%EAX |
(1393) 0xc13d84 MOV %EAX,(%R14,%RCX,4) |
(1393) 0xc13d88 INC %RCX |
(1393) 0xc13d8b MOVSXD 0x130(%R13),%RDX |
(1393) 0xc13d92 CMP %RDX,%RCX |
(1393) 0xc13d95 JL c13d80 |
(1387) 0xc13d97 MOV 0x150(%R13),%RAX |
(1387) 0xc13d9e IMUL $0x38,%R12,%R8 |
(1387) 0xc13da2 LEA (%RAX,%R8,1),%RDI |
(1387) 0xc13da6 ADD $0x20,%RDI |
(1387) 0xc13daa MOVSXD %EDX,%RCX |
(1387) 0xc13dad MOVSXD -0x4(%R14,%RCX,4),%RSI |
(1387) 0xc13db2 MOV 0x20(%RAX,%R8,1),%RCX |
(1387) 0xc13db7 MOV 0x28(%RAX,%R8,1),%RAX |
(1387) 0xc13dbc MOV %RAX,%R8 |
(1387) 0xc13dbf SUB %RCX,%R8 |
(1387) 0xc13dc2 SAR $0x2,%R8 |
(1387) 0xc13dc6 CMP %RSI,%R8 |
(1387) 0xc13dc9 JAE c13df0 |
(1387) 0xc13dcb SUB %R8,%RSI |
(1387) 0xc13dce MOV %RDI,%RBX |
(1387) 0xc13dd1 VZEROUPPER |
(1387) 0xc13dd4 CALL fb5380 <@plt_start@+0x11ed0> |
(1387) 0xc13dd9 MOV 0x130(%R13),%EDX |
(1387) 0xc13de0 VMOVSS -0x8b78a8(%RIP),%XMM13 |
(1387) 0xc13de8 MOV %RBX,%RDI |
(1387) 0xc13deb MOV -0x30(%RBP),%EBX |
(1387) 0xc13dee JMP c13e00 |
(1387) 0xc13df0 JBE c13e00 |
(1387) 0xc13df2 LEA (%RCX,%RSI,4),%RCX |
(1387) 0xc13df6 CMP %RCX,%RAX |
(1387) 0xc13df9 JE c13e00 |
(1387) 0xc13dfb MOV %RCX,0x8(%RDI) |
(1387) 0xc13dff NOP |
(1387) 0xc13e00 CMP $0x2,%EDX |
(1387) 0xc13e03 JL c13e4c |
(1387) 0xc13e05 MOV %EDX,%EAX |
(1387) 0xc13e07 LEA -0x1(%RAX),%RCX |
(1387) 0xc13e0b CMP $0x4,%RCX |
(1387) 0xc13e0f JAE c13f1a |
(1387) 0xc13e15 MOV %RAX,%RDX |
(1387) 0xc13e18 LEA 0x1(%RDX),%RAX |
(1387) 0xc13e1c MOV $-0x1,%ECX |
(1387) 0xc13e21 ADD %RDX,%RCX |
(1387) 0xc13e24 DEC %RCX |
(1387) 0xc13e27 DEC %RDX |
(1387) 0xc13e2a NOPW (%RAX,%RAX,1) |
(1390) 0xc13e30 MOV %ECX,%ESI |
(1390) 0xc13e32 MOV (%R14,%RSI,4),%ESI |
(1390) 0xc13e36 MOV %EDX,%R8D |
(1390) 0xc13e39 MOV %ESI,(%R14,%R8,4) |
(1390) 0xc13e3d DEC %RAX |
(1390) 0xc13e40 DEC %RCX |
(1390) 0xc13e43 DEC %RDX |
(1390) 0xc13e46 CMP $0x2,%RAX |
(1390) 0xc13e4a JG c13e30 |
(1387) 0xc13e4c MOVL $0,(%R14) |
(1387) 0xc13e53 CMP %R15D,%EBX |
(1387) 0xc13e56 JGE c13970 |
(1387) 0xc13e5c MOV 0x138(%R13),%RAX |
(1387) 0xc13e63 MOV (%RDI),%RCX |
(1387) 0xc13e66 MOVSXD %EBX,%RDX |
(1387) 0xc13e69 MOVSXD %R15D,%RSI |
(1387) 0xc13e6c SUB %EBX,%R15D |
(1387) 0xc13e6f MOV %RDX,%RDI |
(1387) 0xc13e72 NOT %RDI |
(1387) 0xc13e75 ADD %RSI,%RDI |
(1387) 0xc13e78 AND $0x3,%R15 |
(1387) 0xc13e7c JE c13e9c |
(1387) 0xc13e7e XCHG %AX,%AX |
(1389) 0xc13e80 MOVSXD (%RAX,%RDX,4),%R8 |
(1389) 0xc13e84 MOVSXD (%R14,%R8,4),%R9 |
(1389) 0xc13e88 LEA 0x1(%R9),%R10D |
(1389) 0xc13e8c MOV %R10D,(%R14,%R8,4) |
(1389) 0xc13e90 MOV %EDX,(%RCX,%R9,4) |
(1389) 0xc13e94 INC %RDX |
(1389) 0xc13e97 DEC %R15 |
(1389) 0xc13e9a JNE c13e80 |
(1387) 0xc13e9c CMP $0x3,%RDI |
(1387) 0xc13ea0 JB c13970 |
(1387) 0xc13ea6 NOPW %CS:(%RAX,%RAX,1) |
(1388) 0xc13eb0 MOVSXD (%RAX,%RDX,4),%RDI |
(1388) 0xc13eb4 MOVSXD (%R14,%RDI,4),%R8 |
(1388) 0xc13eb8 LEA 0x1(%R8),%R9D |
(1388) 0xc13ebc MOV %R9D,(%R14,%RDI,4) |
(1388) 0xc13ec0 MOV %EDX,(%RCX,%R8,4) |
(1388) 0xc13ec4 MOVSXD 0x4(%RAX,%RDX,4),%RDI |
(1388) 0xc13ec9 MOVSXD (%R14,%RDI,4),%R8 |
(1388) 0xc13ecd LEA 0x1(%R8),%R9D |
(1388) 0xc13ed1 MOV %R9D,(%R14,%RDI,4) |
(1388) 0xc13ed5 LEA 0x1(%RDX),%EDI |
(1388) 0xc13ed8 MOV %EDI,(%RCX,%R8,4) |
(1388) 0xc13edc MOVSXD 0x8(%RAX,%RDX,4),%RDI |
(1388) 0xc13ee1 MOVSXD (%R14,%RDI,4),%R8 |
(1388) 0xc13ee5 LEA 0x1(%R8),%R9D |
(1388) 0xc13ee9 MOV %R9D,(%R14,%RDI,4) |
(1388) 0xc13eed LEA 0x2(%RDX),%EDI |
(1388) 0xc13ef0 MOV %EDI,(%RCX,%R8,4) |
(1388) 0xc13ef4 MOVSXD 0xc(%RAX,%RDX,4),%RDI |
(1388) 0xc13ef9 MOVSXD (%R14,%RDI,4),%R8 |
(1388) 0xc13efd LEA 0x1(%R8),%R9D |
(1388) 0xc13f01 MOV %R9D,(%R14,%RDI,4) |
(1388) 0xc13f05 LEA 0x3(%RDX),%EDI |
(1388) 0xc13f08 MOV %EDI,(%RCX,%R8,4) |
(1388) 0xc13f0c ADD $0x4,%RDX |
(1388) 0xc13f10 CMP %RSI,%RDX |
(1388) 0xc13f13 JNE c13eb0 |
(1387) 0xc13f15 JMP c13970 |
(1387) 0xc13f1a LEA -0x2(%RAX),%R8 |
(1387) 0xc13f1e MOV %R8,%RSI |
(1387) 0xc13f21 SHR $0x20,%RSI |
(1387) 0xc13f25 JNE c13e15 |
(1387) 0xc13f2b LEA -0x2(%RDX),%ESI |
(1387) 0xc13f2e CMP %R8D,%ESI |
(1387) 0xc13f31 JB c13e15 |
(1387) 0xc13f37 DEC %EDX |
(1387) 0xc13f39 CMP %R8D,%EDX |
(1387) 0xc13f3c JB c13e15 |
(1387) 0xc13f42 LEA (%R14,%RDX,4),%R8 |
(1387) 0xc13f46 LEA -0x8(,%RAX,4),%R10 |
(1387) 0xc13f4e MOV %R8,%R9 |
(1387) 0xc13f51 SUB %R10,%R9 |
(1387) 0xc13f54 CMP %R8,%R9 |
(1387) 0xc13f57 JA c13e15 |
(1387) 0xc13f5d LEA (%R14,%RSI,4),%R8 |
(1387) 0xc13f61 MOV %R8,%R9 |
(1387) 0xc13f64 SUB %R10,%R9 |
(1387) 0xc13f67 CMP %R8,%R9 |
(1387) 0xc13f6a JA c13e15 |
(1387) 0xc13f70 LEA (%R14,%RSI,4),%RSI |
(1387) 0xc13f74 LEA (%R14,%RDX,4),%RDX |
(1387) 0xc13f78 SUB %RDX,%RSI |
(1387) 0xc13f7b CMP $0x80,%RSI |
(1387) 0xc13f82 JB c13e15 |
(1387) 0xc13f88 CMP $0x20,%RCX |
(1387) 0xc13f8c JAE c13f92 |
(1387) 0xc13f8e XOR %ESI,%ESI |
(1387) 0xc13f90 JMP c14007 |
(1387) 0xc13f92 MOV %RCX,%RSI |
(1387) 0xc13f95 AND $-0x20,%RSI |
(1387) 0xc13f99 MOV $-0x1,%EDX |
(1387) 0xc13f9e ADD %RAX,%RDX |
(1387) 0xc13fa1 MOV %RSI,%R9 |
(1387) 0xc13fa4 NOPW %CS:(%RAX,%RAX,1) |
(1391) 0xc13fb0 LEA -0x1(%RDX),%R8D |
(1391) 0xc13fb4 VMOVUPS -0x7c(%R14,%R8,4),%YMM0 |
(1391) 0xc13fbb VMOVUPS -0x5c(%R14,%R8,4),%YMM1 |
(1391) 0xc13fc2 VMOVUPS -0x3c(%R14,%R8,4),%YMM2 |
(1391) 0xc13fc9 VMOVUPS -0x1c(%R14,%R8,4),%YMM3 |
(1391) 0xc13fd0 MOV %EDX,%R8D |
(1391) 0xc13fd3 VMOVUPS %YMM3,-0x1c(%R14,%R8,4) |
(1391) 0xc13fda VMOVUPS %YMM2,-0x3c(%R14,%R8,4) |
(1391) 0xc13fe1 VMOVUPS %YMM1,-0x5c(%R14,%R8,4) |
(1391) 0xc13fe8 VMOVUPS %YMM0,-0x7c(%R14,%R8,4) |
(1391) 0xc13fef ADD $-0x20,%RDX |
(1391) 0xc13ff3 ADD $-0x20,%R9 |
(1391) 0xc13ff7 JNE c13fb0 |
(1387) 0xc13ff9 CMP %RSI,%RCX |
(1387) 0xc13ffc JE c13e4c |
(1387) 0xc14002 TEST $0x1c,%CL |
(1387) 0xc14005 JE c1405d |
(1387) 0xc14007 MOV %RCX,%R9 |
(1387) 0xc1400a AND $-0x4,%R9 |
(1387) 0xc1400e MOV %RAX,%RDX |
(1387) 0xc14011 SUB %R9,%RDX |
(1387) 0xc14014 MOV $-0x1,%R8D |
(1387) 0xc1401a ADD %R8,%RAX |
(1387) 0xc1401d SUB %RSI,%RAX |
(1387) 0xc14020 SUB %R9,%RSI |
(1387) 0xc14023 NOPW %CS:(%RAX,%RAX,1) |
(1392) 0xc14030 LEA -0x1(%RAX),%R8D |
(1392) 0xc14034 VMOVUPS -0xc(%R14,%R8,4),%XMM0 |
(1392) 0xc1403b MOV %EAX,%R8D |
(1392) 0xc1403e VMOVUPS %XMM0,-0xc(%R14,%R8,4) |
(1392) 0xc14045 ADD $-0x4,%RAX |
(1392) 0xc14049 ADD $0x4,%RSI |
(1392) 0xc1404d JNE c14030 |
(1387) 0xc1404f CMP %R9,%RCX |
(1387) 0xc14052 JNE c13e18 |
(1387) 0xc14058 JMP c13e4c |
(1387) 0xc1405d SUB %RSI,%RAX |
(1387) 0xc14060 JMP c13e15 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►100.00+ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | spread_on_grid(gmx_pme_t const[...] | pme_spread.cpp:910 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1244 | libgromacs_mpi.so.9.0.0 |
○ | CpuPpLongRangeNonbondeds::calc[...] | force.cpp:261 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2073 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►100.00+ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | spread_on_grid(gmx_pme_t const[...] | pme_spread.cpp:910 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1244 | libgromacs_mpi.so.9.0.0 |
○ | CpuPpLongRangeNonbondeds::calc[...] | force.cpp:261 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2073 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►100.00+ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | spread_on_grid(gmx_pme_t const[...] | pme_spread.cpp:910 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1244 | libgromacs_mpi.so.9.0.0 |
○ | CpuPpLongRangeNonbondeds::calc[...] | force.cpp:261 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2073 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►75.45+ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | spread_on_grid(gmx_pme_t const[...] | pme_spread.cpp:910 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1244 | libgromacs_mpi.so.9.0.0 |
○ | CpuPpLongRangeNonbondeds::calc[...] | force.cpp:261 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2073 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 | |
►12.32+ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | spread_on_grid(gmx_pme_t const[...] | pme_spread.cpp:910 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1244 | libgromacs_mpi.so.9.0.0 |
○ | CpuPpLongRangeNonbondeds::calc[...] | force.cpp:261 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2073 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
►12.23+ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | spread_on_grid(gmx_pme_t const[...] | pme_spread.cpp:910 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1244 | libgromacs_mpi.so.9.0.0 |
○ | CpuPpLongRangeNonbondeds::calc[...] | force.cpp:261 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2073 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►82.08+ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | spread_on_grid(gmx_pme_t const[...] | pme_spread.cpp:910 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1244 | libgromacs_mpi.so.9.0.0 |
○ | CpuPpLongRangeNonbondeds::calc[...] | force.cpp:261 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2073 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 | |
►12.95+ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | spread_on_grid(gmx_pme_t const[...] | pme_spread.cpp:910 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1244 | libgromacs_mpi.so.9.0.0 |
○ | CpuPpLongRangeNonbondeds::calc[...] | force.cpp:261 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2073 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
►4.97+ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | spread_on_grid(gmx_pme_t const[...] | pme_spread.cpp:910 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1244 | libgromacs_mpi.so.9.0.0 |
○ | CpuPpLongRangeNonbondeds::calc[...] | force.cpp:261 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2073 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►66.27+ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | spread_on_grid(gmx_pme_t const[...] | pme_spread.cpp:910 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1244 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pmeonly(gmx_pme_t**, t_com[...] | stl_vector.h:1169 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2330 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
►24.01+ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | spread_on_grid(gmx_pme_t const[...] | pme_spread.cpp:910 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1244 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pmeonly(gmx_pme_t**, t_com[...] | stl_vector.h:1169 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2330 | libgromacs_mpi.so.9.0.0 |
►9.60+ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | spread_on_grid(gmx_pme_t const[...] | pme_spread.cpp:910 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1244 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pmeonly(gmx_pme_t**, t_com[...] | stl_vector.h:1169 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2330 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►59.90+ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | spread_on_grid(gmx_pme_t const[...] | pme_spread.cpp:910 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1244 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pmeonly(gmx_pme_t**, t_com[...] | stl_vector.h:1169 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2330 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 | |
►26.61+ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | spread_on_grid(gmx_pme_t const[...] | pme_spread.cpp:910 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1244 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pmeonly(gmx_pme_t**, t_com[...] | stl_vector.h:1169 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2330 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
►13.49+ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | spread_on_grid(gmx_pme_t const[...] | pme_spread.cpp:910 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1244 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pmeonly(gmx_pme_t**, t_com[...] | stl_vector.h:1169 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2330 | libgromacs_mpi.so.9.0.0 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►48.52+ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | spread_on_grid(gmx_pme_t const[...] | pme_spread.cpp:910 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1244 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pmeonly(gmx_pme_t**, t_com[...] | stl_vector.h:1169 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2330 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
►33.01+ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | spread_on_grid(gmx_pme_t const[...] | pme_spread.cpp:910 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1244 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pmeonly(gmx_pme_t**, t_com[...] | stl_vector.h:1169 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2330 | libgromacs_mpi.so.9.0.0 |
►18.47+ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | spread_on_grid(gmx_pme_t const[...] | pme_spread.cpp:910 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1244 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pmeonly(gmx_pme_t**, t_com[...] | stl_vector.h:1169 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2330 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►99.89+ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | spread_on_grid(gmx_pme_t const[...] | pme_spread.cpp:910 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1244 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pmeonly(gmx_pme_t**, t_com[...] | stl_vector.h:1169 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2330 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 |
Path / |
The code analyzed by CQA in that panel excludes loops and represents 0.00% of application time for run 1x1
Source file and lines | pme_spread.cpp:75-923 |
Module | libgromacs_mpi.so.9.0.0 |
nb instructions | 55 |
nb uops | 57 |
loop length | 184 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 1 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 9 |
micro-operation queue | 9.50 cycles |
front end | 9.50 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 5.00 | 5.00 | 5.00 | 5.00 | 3.00 | 6.00 | 6.00 | 6.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
cycles | 5.00 | 5.00 | 5.00 | 5.00 | 3.00 | 6.00 | 6.00 | 6.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 9.50 |
Dispatch | 6.00 |
Overall L1 | 9.50 |
all | 4% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 20% |
all | 0% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 4% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 20% |
all | 8% |
load | 7% |
store | 8% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 6% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 10% |
all | 6% |
load | 6% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 8% |
load | 7% |
store | 8% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 6% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 10% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput | Vectorization |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
SUB $0x88,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %R9,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %R8,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %RCX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %RDX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV (%RDX),%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (6.3%) |
TEST %EBX,%EBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
JLE c1394c <.omp_outlined.+0x9c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
DEC %EBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
MOVL $0,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOV %EBX,-0x2c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOVL $0x1,-0x44(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOVL $0,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (6.3%) |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x44(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA 0x3cb1db(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x40(%RBP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x38(%RBP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x2c(%RBP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %ESI,-0x3c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
CALL fa67e0 <@plt_start@+0x3330> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV -0x2c(%RBP),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (6.3%) |
CMP %EBX,%EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
CMOVL %EAX,%EBX | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
MOV %EBX,-0x2c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOVSXD -0x38(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (12.5%) |
CMP %EBX,%EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
JLE c1395e <.omp_outlined.+0xae> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
LEA 0x3cb1b7(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV -0x3c(%RBP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (6.3%) |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | vect (25.0%) |
CALL fa67f0 <@plt_start@+0x3340> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
ADD $0x88,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
VMOVSS -0x8b7426(%RIP),%XMM13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
JMP c1397d <.omp_outlined.+0xcd> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
The code analyzed by CQA in that panel excludes loops and represents 0.00% of application time for run 1x1
Source file and lines | pme_spread.cpp:75-923 |
Module | libgromacs_mpi.so.9.0.0 |
nb instructions | 55 |
nb uops | 57 |
loop length | 184 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 1 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 9 |
micro-operation queue | 9.50 cycles |
front end | 9.50 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 5.00 | 5.00 | 5.00 | 5.00 | 3.00 | 6.00 | 6.00 | 6.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
cycles | 5.00 | 5.00 | 5.00 | 5.00 | 3.00 | 6.00 | 6.00 | 6.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 9.50 |
Dispatch | 6.00 |
Overall L1 | 9.50 |
all | 4% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 20% |
all | 0% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 4% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 20% |
all | 8% |
load | 7% |
store | 8% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 6% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 10% |
all | 6% |
load | 6% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 8% |
load | 7% |
store | 8% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 6% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 10% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput | Vectorization |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
SUB $0x88,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %R9,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %R8,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %RCX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %RDX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV (%RDX),%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (6.3%) |
TEST %EBX,%EBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
JLE c1394c <.omp_outlined.+0x9c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
DEC %EBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
MOVL $0,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOV %EBX,-0x2c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOVL $0x1,-0x44(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOVL $0,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (6.3%) |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x44(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA 0x3cb1db(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x40(%RBP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x38(%RBP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x2c(%RBP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %ESI,-0x3c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
CALL fa67e0 <@plt_start@+0x3330> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV -0x2c(%RBP),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (6.3%) |
CMP %EBX,%EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
CMOVL %EAX,%EBX | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
MOV %EBX,-0x2c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOVSXD -0x38(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (12.5%) |
CMP %EBX,%EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
JLE c1395e <.omp_outlined.+0xae> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
LEA 0x3cb1b7(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV -0x3c(%RBP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (6.3%) |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | vect (25.0%) |
CALL fa67f0 <@plt_start@+0x3340> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
ADD $0x88,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
VMOVSS -0x8b7426(%RIP),%XMM13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
JMP c1397d <.omp_outlined.+0xcd> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
Run 1x1 | Number processes: 1; Number processes per node: 1; OMP_NUM_THREADS: 1 |
---|---|
Run 2x1 | Number processes: 2; Number processes per node: 2; OMP_NUM_THREADS: 1 |
Run 4x1 | Number processes: 4; Number processes per node: 4; OMP_NUM_THREADS: 1 |
Run 8x1 | Number processes: 8; Number processes per node: 8; OMP_NUM_THREADS: 1 |
Run 16x1 | Number processes: 16; Number processes per node: 16; OMP_NUM_THREADS: 1 |
Run 32x1 | Number processes: 32; Number processes per node: 32; OMP_NUM_THREADS: 1 |
Run 64x1 | Number processes: 64; Number processes per node: 64; OMP_NUM_THREADS: 1 |
Run 128x1 | Number processes: 128; Number processes per node: 128; OMP_NUM_THREADS: 1 |
Run 192x1 | Number processes: 192; Number nodes: 1; Number processes per node: 192; Run Command: <executable> mdrun -s ion_channel.tpr -nsteps 10000 -pin on -deffnm aocc; MPI Command: mpirun -genv I_MPI_FABRICS=shm -n <number_processes>; Dataset: ; Run Directory: .; OMP_NUM_THREADS: 1 |
(1x1) Efficiency | (1x1) Potential Speed-Up (%) | (2x1) Efficiency | (2x1) Potential Speed-Up (%) | (4x1) Efficiency | (4x1) Potential Speed-Up (%) | (8x1) Efficiency | (8x1) Potential Speed-Up (%) | (16x1) Efficiency | (16x1) Potential Speed-Up (%) | (32x1) Efficiency | (32x1) Potential Speed-Up (%) | (64x1) Efficiency | (64x1) Potential Speed-Up (%) | (128x1) Efficiency | (128x1) Potential Speed-Up (%) | (192x1) Efficiency | (192x1) Potential Speed-Up (%) |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
1 | 0 | 0.97 | 0.01 | 0.96 | 0.02 | 0.68 | 0.15 | 0.9 | 0.03 | 0.94 | 0.01 | 0.99 | 0 | 0.95 | 0.01 | 0.88 | 0.02 |
Run | Number of threads | Efficiency (ideal is 1) | Speedup | Ideal Speedup | Time (s) | Coverage (%) |
---|---|---|---|---|---|---|
1x1 | 1 | 1 | 1 | 1 | 3.9300000667572 | 0.47144654393196 |
2x1 | 2 | 0.97 | 1.94 | 2 | 2.0299999713898 | 0.44675579667091 |
4x1 | 4 | 0.96 | 3.84 | 4 | 1.0749999284744 | 0.4106804728508 |
8x1 | 8 | 0.68 | 5.41 | 8 | 0.8549998998642 | 0.46915805339813 |
16x1 | 16 | 0.9 | 14.47 | 16 | 0.34499999880791 | 0.32830163836479 |
32x1 | 12 | 0.94 | 30.16 | 32 | 0.4149999320507 | 0.25354731082916 |
64x1 | 24 | 0.99 | 63.22 | 64 | 0.23999993503094 | 0.15641723573208 |
128x1 | 44 | 0.95 | 122.15 | 128 | 0.14000000059605 | 0.18931862711906 |
192x1 | 64 | 0.88 | 168.43 | 192 | 0.10999999195337 | 0.17322833836079 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼.omp_outlined.#0xc138b0– | 0.17 | 0.02 |
▼Loop 1387 - pme_spread.cpp:75-923 - libgromacs_mpi.so.9.0.0– | 0.00 | 0.00 |
○Loop 1394 - pme_spread.cpp:104-133 - libgromacs_mpi.so.9.0.0 | 0.17 | 0.07 |
○Loop 1388 - pme_spread.cpp:172-174 - libgromacs_mpi.so.9.0.0 | 0.00 | 0.00 |
○Loop 1389 - pme_spread.cpp:172-174 - libgromacs_mpi.so.9.0.0 | 0.00 | 0.00 |
○Loop 1395 - pme_spread.cpp:104-145 - libgromacs_mpi.so.9.0.0 | 0.00 | 0.00 |
○Loop 1393 - pme_spread.cpp:154-156 - libgromacs_mpi.so.9.0.0 | 0.00 | 0.00 |
○Loop 1391 - pme_spread.cpp:167-167 - libgromacs_mpi.so.9.0.0 | 0.00 | 0.00 |
○Loop 1392 - pme_spread.cpp:167-167 - libgromacs_mpi.so.9.0.0 | 0.00 | 0.00 |
○Loop 1390 - pme_spread.cpp:165-167 - libgromacs_mpi.so.9.0.0 | 0.00 | 0.00 |
○Loop 1396 - pme_spread.cpp:96-98 - libgromacs_mpi.so.9.0.0 | 0.00 | 0.00 |