Function: dd_move_f(gmx_domdec_t*, gmx::ForceWithShiftForces*, gmx_wallcycle*) | Module: libgromacs_mpi.so.9.0.0 | Source: domdec.cpp:358-463 [...] | Coverage (incl. loops): 0.26% | (excl. loops): 0.00% |
---|
Function: dd_move_f(gmx_domdec_t*, gmx::ForceWithShiftForces*, gmx_wallcycle*) | Module: libgromacs_mpi.so.9.0.0 | Source: domdec.cpp:358-463 [...] | Coverage (incl. loops): 0.26% | (excl. loops): 0.00% |
---|
/home/eoseret/gromacs-2024.2/src/gromacs/pbcutil/include/gromacs/pbcutil/ishift.h: 61 - 68 |
-------------------------------------------------------------------------------- |
61: return (detail::c_nBoxX * (detail::c_nBoxY * ((z) + gmx::c_dBoxZ) + (y) + gmx::c_dBoxY) + (x) |
62: + gmx::c_dBoxX); |
[...] |
68: return (xyzToShiftIndex((iv)[XX], (iv)[YY], (iv)[ZZ])); |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/ext/new_allocator.h: 127 - 162 |
-------------------------------------------------------------------------------- |
127: return static_cast<_Tp*>(::operator new(__n * sizeof(_Tp))); |
[...] |
145: ::operator delete(__p |
[...] |
162: { ::new((void *)__p) _Up(std::forward<_Args>(__args)...); } |
/home/eoseret/gromacs-2024.2/api/legacy/include/gromacs/math/vectypes.h: 120 - 120 |
-------------------------------------------------------------------------------- |
120: ValueType& operator[](int i) { return x_[i]; } |
/home/eoseret/gromacs-2024.2/src/gromacs/mdtypes/forceoutput.h: 96 - 96 |
-------------------------------------------------------------------------------- |
96: bool computeVirial() const { return computeVirial_; } |
/home/eoseret/gromacs-2024.2/src/gromacs/timing/include/gromacs/timing/wallcycle.h: 391 - 498 |
-------------------------------------------------------------------------------- |
391: wc->ewc_prev = ewc; |
392: wc->cycle_prev = cycle; |
393: } |
394: |
395: inline void wallcycle_all_stop(gmx_wallcycle* wc, WallCycleCounter ewc, gmx_cycles_t cycle) |
396: { |
397: const int prev = static_cast<int>(wc->ewc_prev); |
398: const int current = static_cast<int>(ewc); |
399: wc->wcc_all[prev * sc_numWallCycleCounters + current].n += 1; |
400: wc->wcc_all[prev * sc_numWallCycleCounters + current].c += cycle - wc->cycle_prev; |
[...] |
411: if (wc == nullptr) |
412: { |
413: return; |
414: } |
415: |
416: wallcycleBarrier(wc); |
[...] |
423: wc->wcc[ewc].start = cycle; |
424: if (!wc->wcc_all.empty()) |
425: { |
426: wc->wc_depth++; |
427: if (ewc == WallCycleCounter::Run) |
428: { |
429: wallcycle_all_start(wc, ewc, cycle); |
430: } |
431: else if (wc->wc_depth == 3) |
[...] |
459: if (wc == nullptr) |
460: { |
461: return 0; |
462: } |
463: |
464: wallcycleBarrier(wc); |
[...] |
480: if (cycle >= wc->wcc[ewc].start) |
[...] |
487: wc->haveInvalidCount = true; |
488: } |
489: wc->wcc[ewc].c += last; |
490: wc->wcc[ewc].n++; |
491: if (!wc->wcc_all.empty()) |
492: { |
493: wc->wc_depth--; |
494: if (ewc == WallCycleCounter::Run) |
495: { |
496: wallcycle_all_stop(wc, ewc, cycle); |
497: } |
498: else if (wc->wc_depth == 2) |
/home/eoseret/gromacs-2024.2/src/gromacs/domdec/domdec_internal.h: 92 - 394 |
-------------------------------------------------------------------------------- |
92: int numPulses() const { return ind.size(); } |
[...] |
230: int end(Type rangeType) const { return end_[static_cast<int>(rangeType)]; } |
[...] |
348: if (numElements > buffer_.size()) |
[...] |
359: GMX_RELEASE_ASSERT(!isInUse_, "Should only request free buffers"); |
360: isInUse_ = true; |
[...] |
368: GMX_RELEASE_ASSERT(isInUse_, "Should only release buffers in use"); |
369: isInUse_ = false; |
[...] |
389: DDBufferAccess(DDBuffer<T>& ddBuffer, size_t numElements) : ddBuffer_(ddBuffer) |
390: { |
391: buffer = ddBuffer_.acquire(numElements); |
392: } |
393: |
394: ~DDBufferAccess() { ddBuffer_.release(); } |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/stl_vector.h: 346 - 1762 |
-------------------------------------------------------------------------------- |
346: return __n != 0 ? _Tr::allocate(_M_impl, __n) : pointer(); |
[...] |
353: if (__p) |
[...] |
919: { return size_type(this->_M_impl._M_finish - this->_M_impl._M_start); } |
[...] |
940: _M_default_append(__new_size - size()); |
[...] |
1064: return *(this->_M_impl._M_start + __n); |
[...] |
1758: if (max_size() - size() < __n) |
1759: __throw_length_error(__N(__s)); |
1760: |
1761: const size_type __len = size() + (std::max)(size(), __n); |
1762: return (__len < size() || __len > max_size()) ? max_size() : __len; |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/stl_iterator.h: 1028 - 1182 |
-------------------------------------------------------------------------------- |
1028: : _M_current(__i) { } |
[...] |
1054: ++_M_current; |
[...] |
1166: { return __lhs.base() == __rhs.base(); } |
[...] |
1182: { return __lhs.base() != __rhs.base(); } |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/stl_uninitialized.h: 578 - 1031 |
-------------------------------------------------------------------------------- |
578: for (; __n > 0; --__n, (void) ++__cur) |
[...] |
1031: for (; __first != __last; ++__first, (void)++__cur) |
/home/eoseret/gromacs-2024.2/api/legacy/include/gromacs/utility/arrayref.h: 72 - 311 |
-------------------------------------------------------------------------------- |
72: constexpr explicit ArrayRefIter(T* it) noexcept : it_(it) {} |
[...] |
82: it_ += i; |
[...] |
311: return (begin != nullptr) ? ArrayRef<T>(begin, begin + size) : ArrayRef<T>{}; |
/home/eoseret/gromacs-2024.2/src/gromacs/domdec/domdec.cpp: 358 - 463 |
-------------------------------------------------------------------------------- |
358: { |
[...] |
365: int nzone = comm.zones.n / 2; |
366: int nat_tot = comm.atomRanges.end(DDAtomRanges::Type::Zones); |
367: for (int d = dd->ndim - 1; d >= 0; d--) |
368: { |
369: /* Only forces in domains near the PBC boundaries need to |
370: consider PBC in the treatment of fshift */ |
371: const bool shiftForcesNeedPbc = |
372: (forceWithShiftForces->computeVirial() && dd->ci[dd->dim[d]] == 0); |
373: const bool applyScrewPbc = (dd->unitCellInfo.haveScrewPBC && dd->dim[d] == XX); |
374: /* Determine which shift vector we need */ |
375: ivec vis = { 0, 0, 0 }; |
376: vis[dd->dim[d]] = 1; |
377: const int is = gmx::ivecToShiftIndex(vis); |
378: |
379: /* Loop over the pulses */ |
380: const gmx_domdec_comm_dim_t& cd = comm.cd[d]; |
381: for (int p = cd.numPulses() - 1; p >= 0; p--) |
382: { |
383: const gmx_domdec_ind_t& ind = cd.ind[p]; |
384: DDBufferAccess<gmx::RVec> receiveBufferAccess(comm.rvecBuffer, ind.nsend[nzone + 1]); |
385: gmx::ArrayRef<gmx::RVec>& receiveBuffer = receiveBufferAccess.buffer; |
386: |
387: nat_tot -= ind.nrecv[nzone + 1]; |
388: |
389: DDBufferAccess<gmx::RVec> sendBufferAccess( |
390: comm.rvecBuffer2, cd.receiveInPlace ? 0 : ind.nrecv[nzone + 1]); |
391: |
392: gmx::ArrayRef<gmx::RVec> sendBuffer; |
393: if (cd.receiveInPlace) |
394: { |
395: sendBuffer = gmx::arrayRefFromArray(f.data() + nat_tot, ind.nrecv[nzone + 1]); |
[...] |
401: for (int zone = 0; zone < nzone; zone++) |
402: { |
403: for (int i = ind.cell2at0[zone]; i < ind.cell2at1[zone]; i++) |
404: { |
405: sendBuffer[j++] = f[i]; |
406: } |
407: } |
408: } |
409: /* Communicate the forces */ |
410: ddSendrecv(dd, d, dddirForward, sendBuffer, receiveBuffer); |
411: /* Add the received forces */ |
412: int n = 0; |
413: if (!applyScrewPbc && !shiftForcesNeedPbc) |
414: { |
415: for (int j : ind.index) |
416: { |
417: for (int d = 0; d < DIM; d++) |
418: { |
419: f[j][d] += receiveBuffer[n][d]; |
420: } |
421: n++; |
422: } |
423: } |
424: else if (!applyScrewPbc) |
425: { |
426: for (int j : ind.index) |
427: { |
428: for (int d = 0; d < DIM; d++) |
429: { |
430: f[j][d] += receiveBuffer[n][d]; |
431: } |
432: /* Add this force to the shift force */ |
433: for (int d = 0; d < DIM; d++) |
434: { |
435: fshift[is][d] += receiveBuffer[n][d]; |
[...] |
442: for (int j : ind.index) |
443: { |
444: /* Rotate the force */ |
445: f[j][XX] += receiveBuffer[n][XX]; |
446: f[j][YY] -= receiveBuffer[n][YY]; |
447: f[j][ZZ] -= receiveBuffer[n][ZZ]; |
[...] |
453: fshift[is][d] += receiveBuffer[n][d]; |
[...] |
459: } |
460: nzone /= 2; |
461: } |
462: wallcycle_stop(wcycle, WallCycleCounter::MoveF); |
463: } |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/unique_ptr.h: 173 - 173 |
-------------------------------------------------------------------------------- |
173: pointer _M_ptr() const { return std::get<0>(_M_t); } |
/home/eoseret/gromacs-2024.2/src/gromacs/timing/include/gromacs/timing/cyclecounter.h: 182 - 188 |
-------------------------------------------------------------------------------- |
182: __asm__ __volatile__("rdtscp" : "=a"(low), "=d"(high)::"ecx"); |
183: # else |
184: __asm__ __volatile__("rdtsc" : "=a"(low), "=d"(high)); |
185: # endif |
186: const gmx_cycles_t c_low = low; |
187: const gmx_cycles_t c_high = high; |
188: return c_low | c_high << 32; |
/home/eoseret/gromacs-2024.2/src/external/boost/stl_interfaces/iterator_interface.hpp: 305 - 305 |
-------------------------------------------------------------------------------- |
305: D retval = derived(); |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/vector.tcc: 617 - 680 |
-------------------------------------------------------------------------------- |
617: size_type __navail = size_type(this->_M_impl._M_end_of_storage |
618: - this->_M_impl._M_finish); |
619: |
620: if (__size > max_size() || __navail > max_size() - __size) |
621: __builtin_unreachable(); |
622: |
623: if (__navail >= __n) |
624: { |
625: _GLIBCXX_ASAN_ANNOTATE_GROW(__n); |
626: this->_M_impl._M_finish = |
[...] |
648: _S_relocate(this->_M_impl._M_start, this->_M_impl._M_finish, |
[...] |
678: this->_M_impl._M_start = __new_start; |
679: this->_M_impl._M_finish = __new_start + __size + __n; |
680: this->_M_impl._M_end_of_storage = __new_start + __len; |
0x690340 PUSH %RBP |
0x690341 MOV %RSP,%RBP |
0x690344 PUSH %R15 |
0x690346 PUSH %R14 |
0x690348 PUSH %R13 |
0x69034a PUSH %R12 |
0x69034c PUSH %RBX |
0x69034d SUB $0x138,%RSP |
0x690354 MOV %RDX,%RBX |
0x690357 MOV %RSI,-0xa0(%RBP) |
0x69035e MOV %RDI,%R15 |
0x690361 TEST %RDX,%RDX |
0x690364 JE 6903c8 |
0x690366 MOV %RBX,%RDI |
0x690369 CALL fa6fc0 <@plt_start@+0x3b10> |
0x69036e RDTSCP |
0x690371 MOV %EAX,%EAX |
0x690373 SAL $0x20,%RDX |
0x690377 OR %RAX,%RDX |
0x69037a MOV %RDX,0x130(%RBX) |
0x690381 MOV 0x8c8(%RBX),%RAX |
0x690388 CMP 0x8d0(%RBX),%RAX |
0x69038f JE 6903c8 |
0x690391 MOV 0x8e0(%RBX),%ECX |
0x690397 INC %ECX |
0x690399 MOV %ECX,0x8e0(%RBX) |
0x69039f CMP $0x3,%ECX |
0x6903a2 JNE 6903c8 |
0x6903a4 MOVSXD 0x8e4(%RBX),%RCX |
0x6903ab IMUL $0x4e0,%RCX,%RCX |
0x6903b2 INCL 0x120(%RCX,%RAX,1) |
0x6903b9 SUB 0x8e8(%RBX),%RDX |
0x6903c0 ADD %RDX,0x128(%RCX,%RAX,1) |
0x6903c8 MOV %RBX,-0xc0(%RBP) |
0x6903cf MOV 0x74(%R15),%ECX |
0x6903d3 TEST %ECX,%ECX |
0x6903d5 JLE 690e12 |
0x6903db MOV -0xa0(%RBP),%RAX |
0x6903e2 MOV (%RAX),%R14 |
0x6903e5 MOV 0x20(%RAX),%RAX |
0x6903e9 MOV %RAX,-0xc8(%RBP) |
0x6903f0 MOV 0x130(%R15),%R8 |
0x6903f7 MOV 0x298(%R8),%R9D |
0x6903fe MOV 0x62c(%R8),%EAX |
0x690405 MOV %RAX,-0xb8(%RBP) |
0x69040c LEA 0x580(%R8),%RDX |
0x690413 LEA 0x678(%R8),%RAX |
0x69041a MOV %RAX,-0x100(%RBP) |
0x690421 LEA 0x6b0(%R8),%RAX |
0x690428 MOV %RAX,-0xf8(%RBP) |
0x69042f MOV $-0x5555555555555555,%RDI |
0x690439 MOV %R15,-0xb0(%RBP) |
0x690440 MOV %R8,-0x68(%RBP) |
0x690444 MOV %RDX,-0xd0(%RBP) |
0x69044b JMP 690472 |
0x69044d NOPL (%RAX) |
(2991) 0x690450 MOV -0xd8(%RBP),%RAX |
(2991) 0x690457 MOV %EAX,%R9D |
(2991) 0x69045a CMPQ $0x1,-0xe0(%RBP) |
(2991) 0x690462 MOV %R13,%RCX |
(2991) 0x690465 MOV -0xd0(%RBP),%RDX |
(2991) 0x69046c JLE 690e12 |
(2991) 0x690472 MOV %R9D,%R10D |
(2991) 0x690475 SHR $0x1f,%R10D |
(2991) 0x690479 LEA -0x1(%RCX),%R13 |
(2991) 0x69047d MOV -0xa0(%RBP),%RAX |
(2991) 0x690484 CMPB $0,0x18(%RAX) |
(2991) 0x690488 JE 6904a0 |
(2991) 0x69048a MOV %R13D,%EAX |
(2991) 0x69048d MOVSXD 0x78(%R15,%RAX,4),%RAX |
(2991) 0x690492 CMPL $0,0x8(%R15,%RAX,4) |
(2991) 0x690498 SETE %AL |
(2991) 0x69049b MOV %EAX,-0x3c(%RBP) |
(2991) 0x69049e JMP 6904a7 |
(2991) 0x6904a0 MOVL $0,-0x3c(%RBP) |
(2991) 0x6904a7 ADD %R9D,%R10D |
(2991) 0x6904aa CMPB $0,0x65(%R15) |
(2991) 0x6904af MOV %R13D,%EAX |
(2991) 0x6904b2 MOV %RCX,-0xe0(%RBP) |
(2991) 0x6904b9 JE 6904d0 |
(2991) 0x6904bb CMPL $0,0x78(%R15,%RAX,4) |
(2991) 0x6904c1 SETE %CL |
(2991) 0x6904c4 MOV %ECX,-0x40(%RBP) |
(2991) 0x6904c7 JMP 6904d7 |
0x6904c9 NOPL (%RAX) |
(2991) 0x6904d0 MOVL $0,-0x40(%RBP) |
(2991) 0x6904d7 SAR $0x1,%R10D |
(2991) 0x6904da MOVL $0,-0x88(%RBP) |
(2991) 0x6904e4 MOVQ $0,-0x90(%RBP) |
(2991) 0x6904ef MOVSXD 0x78(%R15,%RAX,4),%RCX |
(2991) 0x6904f4 MOVL $0x1,-0x90(%RBP,%RCX,4) |
(2991) 0x6904ff LEA (%RAX,%RAX,4),%RCX |
(2991) 0x690503 MOV 0x10(%RDX,%RCX,8),%RAX |
(2991) 0x690508 SUB 0x8(%RDX,%RCX,8),%RAX |
(2991) 0x69050d SAR $0x3,%RAX |
(2991) 0x690511 MOV $0x4ec4ec4ec4ec4ec5,%RSI |
(2991) 0x69051b IMUL %RSI,%RAX |
(2991) 0x69051f TEST %EAX,%EAX |
(2991) 0x690521 MOV %R10,-0xd8(%RBP) |
(2991) 0x690528 JLE 690450 |
(2991) 0x69052e LEA (%RDX,%RCX,8),%RCX |
(2991) 0x690532 ADD $0x8,%RCX |
(2991) 0x690536 MOV %RCX,-0x80(%RBP) |
(2991) 0x69053a MOV -0x90(%RBP),%ECX |
(2991) 0x690540 MOV -0x88(%RBP),%EDX |
(2991) 0x690546 LEA (%RDX,%RDX,2),%EDX |
(2991) 0x690549 ADD -0x8c(%RBP),%EDX |
(2991) 0x69054f LEA (%RDX,%RDX,4),%EDX |
(2991) 0x690552 ADD %EDX,%ECX |
(2991) 0x690554 ADD $0x16,%ECX |
(2991) 0x690557 LEA 0x1(%R10),%EDX |
(2991) 0x69055b MOVSXD %EDX,%RDX |
(2991) 0x69055e MOV %RDX,-0x78(%RBP) |
(2991) 0x690562 MOV -0x3c(%RBP),%EDX |
(2991) 0x690565 OR -0x40(%RBP),%DL |
(2991) 0x690568 MOV %DL,-0x29(%RBP) |
(2991) 0x69056b MOVSXD %ECX,%RCX |
(2991) 0x69056e LEA (%RCX,%RCX,2),%RCX |
(2991) 0x690572 MOV -0xc8(%RBP),%RDX |
(2991) 0x690579 LEA (%RDX,%RCX,4),%R12 |
(2991) 0x69057d MOV %EAX,%EDX |
(2991) 0x69057f MOV %R10D,%ECX |
(2991) 0x690582 MOVZX 0x690(%R8),%EAX |
(2991) 0x69058a MOV %R9D,-0x98(%RBP) |
(2991) 0x690591 AND $-0x2,%R9D |
(2991) 0x690595 MOV %R9D,-0x94(%RBP) |
(2991) 0x69059c MOV %RCX,-0xe8(%RBP) |
(2991) 0x6905a3 AND $-0x2,%ECX |
(2991) 0x6905a6 MOV %RCX,-0x128(%RBP) |
(2991) 0x6905ad MOV %R13,-0x70(%RBP) |
(2991) 0x6905b1 NOPW %CS:(%RAX,%RAX,1) |
(2992) 0x6905c0 MOV %RDX,-0x110(%RBP) |
(2992) 0x6905c7 LEA -0x1(%RDX),%R9 |
(2992) 0x6905cb MOV %R9D,%ECX |
(2992) 0x6905ce MOV -0x80(%RBP),%RDX |
(2992) 0x6905d2 MOV (%RDX),%R10 |
(2992) 0x6905d5 IMUL $0x68,%RCX,%R11 |
(2992) 0x6905d9 LEA (%R10,%R11,1),%R13 |
(2992) 0x6905dd MOV -0x78(%RBP),%RCX |
(2992) 0x6905e1 MOVSXD (%R13,%RCX,4),%RBX |
(2992) 0x6905e6 MOV -0x100(%RBP),%RCX |
(2992) 0x6905ed MOV %RCX,-0x58(%RBP) |
(2992) 0x6905f1 TEST %AL,%AL |
(2992) 0x6905f3 JNE 690ec1 |
(2992) 0x6905f9 MOVB $0x1,0x690(%R8) |
(2992) 0x690601 MOV 0x678(%R8),%RSI |
(2992) 0x690608 MOV 0x680(%R8),%RAX |
(2992) 0x69060f MOV %RAX,%RCX |
(2992) 0x690612 SUB %RSI,%RCX |
(2992) 0x690615 SAR $0x2,%RCX |
(2992) 0x690619 IMUL %RDI,%RCX |
(2992) 0x69061d CMP %RBX,%RCX |
(2992) 0x690620 MOV %R9,-0x108(%RBP) |
(2992) 0x690627 MOV %R10,-0x120(%RBP) |
(2992) 0x69062e MOV %R11,-0x118(%RBP) |
(2992) 0x690635 JAE 69075a |
(2992) 0x69063b MOV %RSI,-0x38(%RBP) |
(2992) 0x69063f MOV %RBX,%RDX |
(2992) 0x690642 SUB %RCX,%RDX |
(2992) 0x690645 MOV 0x688(%R8),%RSI |
(2992) 0x69064c SUB %RAX,%RSI |
(2992) 0x69064f SAR $0x2,%RSI |
(2992) 0x690653 IMUL %RDI,%RSI |
(2992) 0x690657 CMP %RDX,%RSI |
(2992) 0x69065a JAE 6906d0 |
(2992) 0x69065c MOV $0xaaaaaaaaaaaaaaa,%RDI |
(2992) 0x690666 MOV %RDI,%RSI |
(2992) 0x690669 SUB %RCX,%RSI |
(2992) 0x69066c CMP %RDX,%RSI |
(2992) 0x69066f JB 690f36 |
(2992) 0x690675 CMP %RDX,%RCX |
(2992) 0x690678 CMOVA %RCX,%RDX |
(2992) 0x69067c LEA (%RDX,%RCX,1),%R15 |
(2992) 0x690680 CMP %RDI,%R15 |
(2992) 0x690683 CMOVA %RDI,%R15 |
(2992) 0x690687 ADD %RCX,%RDX |
(2992) 0x69068a CMOVB %RDI,%R15 |
(2992) 0x69068e TEST %R15,%R15 |
(2992) 0x690691 MOV -0x38(%RBP),%RDI |
(2992) 0x690695 JE 6906e5 |
(2992) 0x690697 LEA (,%R15,4),%RAX |
(2992) 0x69069f LEA (%RAX,%RAX,2),%RDI |
(2992) 0x6906a3 CALL fa3710 <@plt_start@+0x260> |
(2992) 0x6906a8 MOV -0x68(%RBP),%R8 |
(2992) 0x6906ac MOV %RAX,-0x38(%RBP) |
(2992) 0x6906b0 MOV 0x678(%R8),%RDI |
(2992) 0x6906b7 MOV 0x680(%R8),%RAX |
(2992) 0x6906be CMP %RAX,%RDI |
(2992) 0x6906c1 JNE 6906f0 |
(2992) 0x6906c3 JMP 690719 |
0x6906c5 NOPW %CS:(%RAX,%RAX,1) |
(2992) 0x6906d0 LEA (%RDX,%RDX,2),%RCX |
(2992) 0x6906d4 LEA (%RAX,%RCX,4),%RAX |
(2992) 0x6906d8 MOV %RAX,0x680(%R8) |
(2992) 0x6906df MOV -0x38(%RBP),%RSI |
(2992) 0x6906e3 JMP 69075a |
(2992) 0x6906e5 XOR %ECX,%ECX |
(2992) 0x6906e7 MOV %RCX,-0x38(%RBP) |
(2992) 0x6906eb CMP %RAX,%RDI |
(2992) 0x6906ee JE 690719 |
(2992) 0x6906f0 MOV -0x38(%RBP),%RCX |
(2992) 0x6906f4 MOV %RDI,%RDX |
(2992) 0x6906f7 NOPW (%RAX,%RAX,1) |
(3002) 0x690700 MOV 0x8(%RDX),%ESI |
(3002) 0x690703 MOV %ESI,0x8(%RCX) |
(3002) 0x690706 MOV (%RDX),%RSI |
(3002) 0x690709 MOV %RSI,(%RCX) |
(3002) 0x69070c ADD $0xc,%RDX |
(3002) 0x690710 ADD $0xc,%RCX |
(3002) 0x690714 CMP %RAX,%RDX |
(3002) 0x690717 JNE 690700 |
(2992) 0x690719 TEST %RDI,%RDI |
(2992) 0x69071c JE 690727 |
(2992) 0x69071e CALL fa3730 <@plt_start@+0x280> |
(2992) 0x690723 MOV -0x68(%RBP),%R8 |
(2992) 0x690727 MOV -0x38(%RBP),%RSI |
(2992) 0x69072b MOV %RSI,0x678(%R8) |
(2992) 0x690732 LEA (%RBX,%RBX,2),%RAX |
(2992) 0x690736 LEA (%RSI,%RAX,4),%RAX |
(2992) 0x69073a MOV %RAX,0x680(%R8) |
(2992) 0x690741 LEA (%R15,%R15,2),%RAX |
(2992) 0x690745 LEA (%RSI,%RAX,4),%RAX |
(2992) 0x690749 MOV %RAX,0x688(%R8) |
(2992) 0x690750 MOV $-0x5555555555555555,%RDI |
(2992) 0x69075a TEST %RSI,%RSI |
(2992) 0x69075d LEA (%RBX,%RBX,2),%RAX |
(2992) 0x690761 LEA (%RSI,%RAX,4),%R9 |
(2992) 0x690765 CMOVE %RSI,%R9 |
(2992) 0x690769 MOV %RSI,-0x50(%RBP) |
(2992) 0x69076d MOV %R9,-0x48(%RBP) |
(2992) 0x690771 MOV -0x80(%RBP),%RAX |
(2992) 0x690775 CMPB $0,0x18(%RAX) |
(2992) 0x690779 MOV -0x78(%RBP),%RAX |
(2992) 0x69077d MOVSXD 0x18(%R13,%RAX,4),%R10 |
(2992) 0x690782 MOV $0,%R15D |
(2992) 0x690788 CMOVE %R10,%R15 |
(2992) 0x69078c MOV -0xf8(%RBP),%RAX |
(2992) 0x690793 MOV %RAX,-0x150(%RBP) |
(2992) 0x69079a CMPB $0,0x6c8(%R8) |
(2992) 0x6907a2 JNE 690e9a |
(2992) 0x6907a8 MOVB $0x1,0x6c8(%R8) |
(2992) 0x6907b0 MOV 0x6b0(%R8),%RBX |
(2992) 0x6907b7 MOV 0x6b8(%R8),%RAX |
(2992) 0x6907be MOV %RAX,%RCX |
(2992) 0x6907c1 SUB %RBX,%RCX |
(2992) 0x6907c4 SAR $0x2,%RCX |
(2992) 0x6907c8 IMUL %RDI,%RCX |
(2992) 0x6907cc MOV %R15,%RDX |
(2992) 0x6907cf SUB %RCX,%RDX |
(2992) 0x6907d2 JBE 690912 |
(2992) 0x6907d8 MOV %RSI,-0x38(%RBP) |
(2992) 0x6907dc MOV 0x6c0(%R8),%RSI |
(2992) 0x6907e3 SUB %RAX,%RSI |
(2992) 0x6907e6 SAR $0x2,%RSI |
(2992) 0x6907ea IMUL %RDI,%RSI |
(2992) 0x6907ee CMP %RDX,%RSI |
(2992) 0x6907f1 JAE 690880 |
(2992) 0x6907f7 MOV $0xaaaaaaaaaaaaaaa,%RDI |
(2992) 0x690801 MOV %RDI,%RSI |
(2992) 0x690804 SUB %RCX,%RSI |
(2992) 0x690807 CMP %RDX,%RSI |
(2992) 0x69080a JB 690f42 |
(2992) 0x690810 CMP %RDX,%RCX |
(2992) 0x690813 CMOVA %RCX,%RDX |
(2992) 0x690817 LEA (%RDX,%RCX,1),%RSI |
(2992) 0x69081b CMP %RDI,%RSI |
(2992) 0x69081e CMOVA %RDI,%RSI |
(2992) 0x690822 ADD %RCX,%RDX |
(2992) 0x690825 CMOVB %RDI,%RSI |
(2992) 0x690829 TEST %RSI,%RSI |
(2992) 0x69082c MOV %R9,-0x60(%RBP) |
(2992) 0x690830 MOV %R10,-0xa8(%RBP) |
(2992) 0x690837 MOV %RSI,-0xf0(%RBP) |
(2992) 0x69083e JE 690891 |
(2992) 0x690840 LEA (,%RSI,4),%RAX |
(2992) 0x690848 LEA (%RAX,%RAX,2),%RDI |
(2992) 0x69084c CALL fa3710 <@plt_start@+0x260> |
(2992) 0x690851 MOV %RAX,%RBX |
(2992) 0x690854 MOV -0x68(%RBP),%R8 |
(2992) 0x690858 MOV 0x6b0(%R8),%RDI |
(2992) 0x69085f MOV 0x6b8(%R8),%RAX |
(2992) 0x690866 MOV -0x60(%RBP),%R9 |
(2992) 0x69086a MOV -0xa8(%RBP),%R10 |
(2992) 0x690871 CMP %RAX,%RDI |
(2992) 0x690874 JNE 69089b |
(2992) 0x690876 JMP 6908c9 |
0x690878 NOPL (%RAX,%RAX,1) |
(2992) 0x690880 LEA (%RDX,%RDX,2),%RCX |
(2992) 0x690884 LEA (%RAX,%RCX,4),%RAX |
(2992) 0x690888 MOV %RAX,0x6b8(%R8) |
(2992) 0x69088f JMP 69090e |
(2992) 0x690891 MOV %RBX,%RDI |
(2992) 0x690894 XOR %EBX,%EBX |
(2992) 0x690896 CMP %RAX,%RDI |
(2992) 0x690899 JE 6908c9 |
(2992) 0x69089b MOV %RBX,%RCX |
(2992) 0x69089e MOV %RDI,%RDX |
(2992) 0x6908a1 NOPW %CS:(%RAX,%RAX,1) |
(3001) 0x6908b0 MOV 0x8(%RDX),%ESI |
(3001) 0x6908b3 MOV %ESI,0x8(%RCX) |
(3001) 0x6908b6 MOV (%RDX),%RSI |
(3001) 0x6908b9 MOV %RSI,(%RCX) |
(3001) 0x6908bc ADD $0xc,%RDX |
(3001) 0x6908c0 ADD $0xc,%RCX |
(3001) 0x6908c4 CMP %RAX,%RDX |
(3001) 0x6908c7 JNE 6908b0 |
(2992) 0x6908c9 TEST %RDI,%RDI |
(2992) 0x6908cc JE 6908e2 |
(2992) 0x6908ce CALL fa3730 <@plt_start@+0x280> |
(2992) 0x6908d3 MOV -0xa8(%RBP),%R10 |
(2992) 0x6908da MOV -0x60(%RBP),%R9 |
(2992) 0x6908de MOV -0x68(%RBP),%R8 |
(2992) 0x6908e2 MOV %RBX,0x6b0(%R8) |
(2992) 0x6908e9 LEA (%R15,%R15,2),%RAX |
(2992) 0x6908ed LEA (%RBX,%RAX,4),%RAX |
(2992) 0x6908f1 MOV %RAX,0x6b8(%R8) |
(2992) 0x6908f8 MOV -0xf0(%RBP),%RAX |
(2992) 0x6908ff LEA (%RAX,%RAX,2),%RAX |
(2992) 0x690903 LEA (%RBX,%RAX,4),%RAX |
(2992) 0x690907 MOV %RAX,0x6c0(%R8) |
(2992) 0x69090e MOV -0x38(%RBP),%RSI |
(2992) 0x690912 MOV -0xb8(%RBP),%RCX |
(2992) 0x690919 MOVSXD %ECX,%RCX |
(2992) 0x69091c SUB %R10,%RCX |
(2992) 0x69091f TEST %RBX,%RBX |
(2992) 0x690922 LEA (%R15,%R15,2),%RAX |
(2992) 0x690926 LEA (%RBX,%RAX,4),%R8 |
(2992) 0x69092a CMOVE %RBX,%R8 |
(2992) 0x69092e MOV %RBX,-0x148(%RBP) |
(2992) 0x690935 MOV %R8,-0x140(%RBP) |
(2992) 0x69093c MOV -0x80(%RBP),%RAX |
(2992) 0x690940 CMPB $0,0x18(%RAX) |
(2992) 0x690944 MOV %RCX,-0xb8(%RBP) |
(2992) 0x69094b JE 690990 |
(2992) 0x69094d MOV -0x78(%RBP),%RAX |
(2992) 0x690951 LEA 0x18(,%RAX,4),%RAX |
(2992) 0x690959 ADD %R13,%RAX |
(2992) 0x69095c LEA (%RCX,%RCX,2),%RCX |
(2992) 0x690960 LEA (%R14,%RCX,4),%RBX |
(2992) 0x690964 MOVSXD (%RAX),%RAX |
(2992) 0x690967 TEST %RBX,%RBX |
(2992) 0x69096a LEA (%RAX,%RAX,2),%RAX |
(2992) 0x69096e LEA (%RBX,%RAX,4),%R8 |
(2992) 0x690972 CMOVE %RBX,%R8 |
(2992) 0x690976 MOV -0xb0(%RBP),%R15 |
(2992) 0x69097d JMP 690a30 |
0x690982 NOPW %CS:(%RAX,%RAX,1) |
(2992) 0x690990 CMPL $0x2,-0x98(%RBP) |
(2992) 0x690997 MOV -0xb0(%RBP),%R15 |
(2992) 0x69099e JL 690a30 |
(2992) 0x6909a4 MOV %R9,-0x60(%RBP) |
(2992) 0x6909a8 MOV %RSI,-0x38(%RBP) |
(2992) 0x6909ac CMPL $0x2,-0x94(%RBP) |
(2992) 0x6909b3 JNE 690c87 |
(2992) 0x6909b9 XOR %EAX,%EAX |
(2992) 0x6909bb XOR %ECX,%ECX |
(2992) 0x6909bd TESTB $0x1,-0xe8(%RBP) |
(2992) 0x6909c4 JE 690a21 |
(2992) 0x6909c6 MOVSXD 0x48(%R13,%RAX,4),%RDX |
(2992) 0x6909cb CMP 0x58(%R13,%RAX,4),%EDX |
(2992) 0x6909d0 JGE 690a21 |
(2992) 0x6909d2 LEA 0x58(,%RAX,4),%RAX |
(2992) 0x6909da ADD %R13,%RAX |
(2992) 0x6909dd MOVSXD %ECX,%RCX |
(2992) 0x6909e0 LEA (%RCX,%RCX,2),%RCX |
(2992) 0x6909e4 LEA (%RBX,%RCX,4),%RCX |
(2992) 0x6909e8 LEA (%RDX,%RDX,2),%RSI |
(2992) 0x6909ec LEA (%R14,%RSI,4),%RSI |
(2992) 0x6909f0 XOR %EDI,%EDI |
(2992) 0x6909f2 NOPW %CS:(%RAX,%RAX,1) |
(2997) 0x690a00 MOV 0x8(%RSI,%RDI,1),%R9D |
(2997) 0x690a05 MOV %R9D,0x8(%RCX,%RDI,1) |
(2997) 0x690a0a MOV (%RSI,%RDI,1),%R9 |
(2997) 0x690a0e MOV %R9,(%RCX,%RDI,1) |
(2997) 0x690a12 INC %RDX |
(2997) 0x690a15 MOVSXD (%RAX),%R9 |
(2997) 0x690a18 ADD $0xc,%RDI |
(2997) 0x690a1c CMP %R9,%RDX |
(2997) 0x690a1f JL 690a00 |
(2992) 0x690a21 MOV -0x70(%RBP),%R13 |
(2992) 0x690a25 MOV -0x38(%RBP),%RSI |
(2992) 0x690a29 MOV -0x60(%RBP),%R9 |
(2992) 0x690a2d JMP 690a34 |
0x690a2f NOP |
(2992) 0x690a30 MOV -0x70(%RBP),%R13 |
(2992) 0x690a34 MOV %RSI,-0x138(%RBP) |
(2992) 0x690a3b MOV %R9,-0x130(%RBP) |
(2992) 0x690a42 VMOVUPS -0x138(%RBP),%XMM0 |
(2992) 0x690a4a VMOVUPS %XMM0,(%RSP) |
(2992) 0x690a4f MOV %R15,%RDI |
(2992) 0x690a52 MOV %R13D,%ESI |
(2992) 0x690a55 XOR %EDX,%EDX |
(2992) 0x690a57 MOV %RBX,%RCX |
(2992) 0x690a5a CALL fa8770 <@plt_start@+0x52c0> |
(2992) 0x690a5f MOV -0x120(%RBP),%RCX |
(2992) 0x690a66 MOV -0x118(%RBP),%RDX |
(2992) 0x690a6d MOV 0x30(%RCX,%RDX,1),%RAX |
(2992) 0x690a72 MOV 0x38(%RCX,%RDX,1),%RCX |
(2992) 0x690a77 CMPB $0,-0x29(%RBP) |
(2992) 0x690a7b JE 690b60 |
(2992) 0x690a81 CMPB $0,-0x40(%RBP) |
(2992) 0x690a85 MOV -0x68(%RBP),%R8 |
(2992) 0x690a89 JE 690bd0 |
(2992) 0x690a8f CMP %RCX,%RAX |
(2992) 0x690a92 JE 690dc0 |
(2992) 0x690a98 CMPB $0,-0x3c(%RBP) |
(2992) 0x690a9c JE 690d58 |
(2992) 0x690aa2 XOR %EDX,%EDX |
(2992) 0x690aa4 NOPW %CS:(%RAX,%RAX,1) |
(2996) 0x690ab0 MOVSXD (%RAX),%RSI |
(2996) 0x690ab3 MOV -0x50(%RBP),%RDI |
(2996) 0x690ab7 VMOVSS (%RDI,%RDX,1),%XMM0 |
(2996) 0x690abc LEA (%RSI,%RSI,2),%RSI |
(2996) 0x690ac0 VADDSS (%R14,%RSI,4),%XMM0,%XMM0 |
(2996) 0x690ac6 VMOVSS %XMM0,(%R14,%RSI,4) |
(2996) 0x690acc MOV -0x50(%RBP),%RDI |
(2996) 0x690ad0 VMOVSS 0x4(%R14,%RSI,4),%XMM0 |
(2996) 0x690ad7 VMOVSS 0x8(%R14,%RSI,4),%XMM1 |
(2996) 0x690ade VSUBSS 0x4(%RDI,%RDX,1),%XMM0,%XMM0 |
(2996) 0x690ae4 VMOVSS %XMM0,0x4(%R14,%RSI,4) |
(2996) 0x690aeb MOV -0x50(%RBP),%RDI |
(2996) 0x690aef VSUBSS 0x8(%RDI,%RDX,1),%XMM1,%XMM0 |
(2996) 0x690af5 VMOVSS %XMM0,0x8(%R14,%RSI,4) |
(2996) 0x690afc MOV -0x50(%RBP),%RSI |
(2996) 0x690b00 VMOVSS (%RSI,%RDX,1),%XMM0 |
(2996) 0x690b05 VADDSS (%R12),%XMM0,%XMM0 |
(2996) 0x690b0b VMOVSS %XMM0,(%R12) |
(2996) 0x690b11 MOV -0x50(%RBP),%RSI |
(2996) 0x690b15 VMOVSS 0x4(%RSI,%RDX,1),%XMM0 |
(2996) 0x690b1b VADDSS 0x4(%R12),%XMM0,%XMM0 |
(2996) 0x690b22 VMOVSS %XMM0,0x4(%R12) |
(2996) 0x690b29 MOV -0x50(%RBP),%RSI |
(2996) 0x690b2d VMOVSS 0x8(%RSI,%RDX,1),%XMM0 |
(2996) 0x690b33 VADDSS 0x8(%R12),%XMM0,%XMM0 |
(2996) 0x690b3a VMOVSS %XMM0,0x8(%R12) |
(2996) 0x690b41 ADD $0x4,%RAX |
(2996) 0x690b45 ADD $0xc,%RDX |
(2996) 0x690b49 CMP %RCX,%RAX |
(2996) 0x690b4c JNE 690ab0 |
(2992) 0x690b52 JMP 690dc0 |
0x690b57 NOPW (%RAX,%RAX,1) |
(2992) 0x690b60 CMP %RCX,%RAX |
(2992) 0x690b63 MOV -0x68(%RBP),%R8 |
(2992) 0x690b67 JE 690dc0 |
(2992) 0x690b6d XOR %EDX,%EDX |
(2992) 0x690b6f NOP |
(2993) 0x690b70 MOVSXD (%RAX),%RSI |
(2993) 0x690b73 MOV -0x50(%RBP),%RDI |
(2993) 0x690b77 VMOVSS (%RDI,%RDX,1),%XMM0 |
(2993) 0x690b7c LEA (%RSI,%RSI,2),%RSI |
(2993) 0x690b80 VADDSS (%R14,%RSI,4),%XMM0,%XMM0 |
(2993) 0x690b86 VMOVSS %XMM0,(%R14,%RSI,4) |
(2993) 0x690b8c MOV -0x50(%RBP),%RDI |
(2993) 0x690b90 VMOVSS 0x4(%RDI,%RDX,1),%XMM0 |
(2993) 0x690b96 VADDSS 0x4(%R14,%RSI,4),%XMM0,%XMM0 |
(2993) 0x690b9d VMOVSS %XMM0,0x4(%R14,%RSI,4) |
(2993) 0x690ba4 MOV -0x50(%RBP),%RDI |
(2993) 0x690ba8 VMOVSS 0x8(%RDI,%RDX,1),%XMM0 |
(2993) 0x690bae VADDSS 0x8(%R14,%RSI,4),%XMM0,%XMM0 |
(2993) 0x690bb5 VMOVSS %XMM0,0x8(%R14,%RSI,4) |
(2993) 0x690bbc ADD $0x4,%RAX |
(2993) 0x690bc0 ADD $0xc,%RDX |
(2993) 0x690bc4 CMP %RCX,%RAX |
(2993) 0x690bc7 JNE 690b70 |
(2992) 0x690bc9 JMP 690dc0 |
0x690bce XCHG %AX,%AX |
(2992) 0x690bd0 CMP %RCX,%RAX |
(2992) 0x690bd3 JE 690dc0 |
(2992) 0x690bd9 XOR %EDX,%EDX |
(2992) 0x690bdb NOPL (%RAX,%RAX,1) |
(2994) 0x690be0 MOVSXD (%RAX),%RSI |
(2994) 0x690be3 MOV -0x50(%RBP),%RDI |
(2994) 0x690be7 VMOVSS (%RDI,%RDX,1),%XMM0 |
(2994) 0x690bec LEA (%RSI,%RSI,2),%RSI |
(2994) 0x690bf0 VADDSS (%R14,%RSI,4),%XMM0,%XMM0 |
(2994) 0x690bf6 VMOVSS %XMM0,(%R14,%RSI,4) |
(2994) 0x690bfc MOV -0x50(%RBP),%RDI |
(2994) 0x690c00 VMOVSS 0x4(%RDI,%RDX,1),%XMM0 |
(2994) 0x690c06 VADDSS 0x4(%R14,%RSI,4),%XMM0,%XMM0 |
(2994) 0x690c0d VMOVSS %XMM0,0x4(%R14,%RSI,4) |
(2994) 0x690c14 MOV -0x50(%RBP),%RDI |
(2994) 0x690c18 VMOVSS 0x8(%RDI,%RDX,1),%XMM0 |
(2994) 0x690c1e VADDSS 0x8(%R14,%RSI,4),%XMM0,%XMM0 |
(2994) 0x690c25 VMOVSS %XMM0,0x8(%R14,%RSI,4) |
(2994) 0x690c2c MOV -0x50(%RBP),%RSI |
(2994) 0x690c30 VMOVSS (%RSI,%RDX,1),%XMM0 |
(2994) 0x690c35 VADDSS (%R12),%XMM0,%XMM0 |
(2994) 0x690c3b VMOVSS %XMM0,(%R12) |
(2994) 0x690c41 MOV -0x50(%RBP),%RSI |
(2994) 0x690c45 VMOVSS 0x4(%RSI,%RDX,1),%XMM0 |
(2994) 0x690c4b VADDSS 0x4(%R12),%XMM0,%XMM0 |
(2994) 0x690c52 VMOVSS %XMM0,0x4(%R12) |
(2994) 0x690c59 MOV -0x50(%RBP),%RSI |
(2994) 0x690c5d VMOVSS 0x8(%RSI,%RDX,1),%XMM0 |
(2994) 0x690c63 VADDSS 0x8(%R12),%XMM0,%XMM0 |
(2994) 0x690c6a VMOVSS %XMM0,0x8(%R12) |
(2994) 0x690c71 ADD $0x4,%RAX |
(2994) 0x690c75 ADD $0xc,%RDX |
(2994) 0x690c79 CMP %RCX,%RAX |
(2994) 0x690c7c JNE 690be0 |
(2992) 0x690c82 JMP 690dc0 |
(2992) 0x690c87 XOR %EAX,%EAX |
(2992) 0x690c89 XOR %ECX,%ECX |
(2992) 0x690c8b JMP 690ca1 |
0x690c8d NOPL (%RAX) |
(2998) 0x690c90 ADD $0x2,%RAX |
(2998) 0x690c94 CMP -0x128(%RBP),%RAX |
(2998) 0x690c9b JE 6909bd |
(2998) 0x690ca1 MOVSXD 0x48(%R13,%RAX,4),%RDX |
(2998) 0x690ca6 CMP 0x58(%R13,%RAX,4),%EDX |
(2998) 0x690cab JGE 690cf3 |
(2998) 0x690cad LEA 0x58(,%RAX,4),%RSI |
(2998) 0x690cb5 ADD %R13,%RSI |
(2998) 0x690cb8 MOVSXD %ECX,%RDI |
(2998) 0x690cbb LEA (%RDI,%RDI,2),%RDI |
(2998) 0x690cbf LEA (%RBX,%RDI,4),%RDI |
(2998) 0x690cc3 LEA (%RDX,%RDX,2),%R9 |
(2998) 0x690cc7 LEA (%R14,%R9,4),%R9 |
(2998) 0x690ccb XOR %R10D,%R10D |
(2998) 0x690cce XCHG %AX,%AX |
(3000) 0x690cd0 MOV 0x8(%R9,%R10,1),%R11D |
(3000) 0x690cd5 MOV %R11D,0x8(%RDI,%R10,1) |
(3000) 0x690cda MOV (%R9,%R10,1),%R11 |
(3000) 0x690cde MOV %R11,(%RDI,%R10,1) |
(3000) 0x690ce2 INC %RDX |
(3000) 0x690ce5 MOVSXD (%RSI),%R11 |
(3000) 0x690ce8 ADD $0xc,%R10 |
(3000) 0x690cec INC %ECX |
(3000) 0x690cee CMP %R11,%RDX |
(3000) 0x690cf1 JL 690cd0 |
(2998) 0x690cf3 LEA (,%RAX,4),%RSI |
(2998) 0x690cfb OR $0x4,%RSI |
(2998) 0x690cff MOVSXD 0x48(%RSI,%R13,1),%RDX |
(2998) 0x690d04 CMP 0x58(%RSI,%R13,1),%EDX |
(2998) 0x690d09 JGE 690c90 |
(2998) 0x690d0b ADD %R13,%RSI |
(2998) 0x690d0e ADD $0x58,%RSI |
(2998) 0x690d12 MOVSXD %ECX,%RDI |
(2998) 0x690d15 LEA (%RDI,%RDI,2),%RDI |
(2998) 0x690d19 LEA (%RBX,%RDI,4),%RDI |
(2998) 0x690d1d LEA (%RDX,%RDX,2),%R9 |
(2998) 0x690d21 LEA (%R14,%R9,4),%R9 |
(2998) 0x690d25 XOR %R10D,%R10D |
(2998) 0x690d28 NOPL (%RAX,%RAX,1) |
(2999) 0x690d30 MOV 0x8(%R9,%R10,1),%R11D |
(2999) 0x690d35 MOV %R11D,0x8(%RDI,%R10,1) |
(2999) 0x690d3a MOV (%R9,%R10,1),%R11 |
(2999) 0x690d3e MOV %R11,(%RDI,%R10,1) |
(2999) 0x690d42 INC %RDX |
(2999) 0x690d45 MOVSXD (%RSI),%R11 |
(2999) 0x690d48 ADD $0xc,%R10 |
(2999) 0x690d4c INC %ECX |
(2999) 0x690d4e CMP %R11,%RDX |
(2999) 0x690d51 JL 690d30 |
(2998) 0x690d53 JMP 690c90 |
(2992) 0x690d58 XOR %EDX,%EDX |
(2992) 0x690d5a NOPW (%RAX,%RAX,1) |
(2995) 0x690d60 MOVSXD (%RAX),%RSI |
(2995) 0x690d63 MOV -0x50(%RBP),%RDI |
(2995) 0x690d67 VMOVSS (%RDI,%RDX,1),%XMM0 |
(2995) 0x690d6c LEA (%RSI,%RSI,2),%RSI |
(2995) 0x690d70 VADDSS (%R14,%RSI,4),%XMM0,%XMM0 |
(2995) 0x690d76 VMOVSS %XMM0,(%R14,%RSI,4) |
(2995) 0x690d7c MOV -0x50(%RBP),%RDI |
(2995) 0x690d80 VMOVSS 0x4(%R14,%RSI,4),%XMM0 |
(2995) 0x690d87 VMOVSS 0x8(%R14,%RSI,4),%XMM1 |
(2995) 0x690d8e VSUBSS 0x4(%RDI,%RDX,1),%XMM0,%XMM0 |
(2995) 0x690d94 VMOVSS %XMM0,0x4(%R14,%RSI,4) |
(2995) 0x690d9b MOV -0x50(%RBP),%RDI |
(2995) 0x690d9f VSUBSS 0x8(%RDI,%RDX,1),%XMM1,%XMM0 |
(2995) 0x690da5 VMOVSS %XMM0,0x8(%R14,%RSI,4) |
(2995) 0x690dac ADD $0x4,%RAX |
(2995) 0x690db0 ADD $0xc,%RDX |
(2995) 0x690db4 CMP %RCX,%RAX |
(2995) 0x690db7 JNE 690d60 |
(2992) 0x690db9 NOPL (%RAX) |
(2992) 0x690dc0 CMPB $0,0x6c8(%R8) |
(2992) 0x690dc8 JE 690ee8 |
(2992) 0x690dce MOVB $0,0x6c8(%R8) |
(2992) 0x690dd6 CMPB $0,0x690(%R8) |
(2992) 0x690dde JE 690f0f |
(2992) 0x690de4 MOVB $0,0x690(%R8) |
(2992) 0x690dec XOR %EAX,%EAX |
(2992) 0x690dee CMPQ $0x1,-0x110(%RBP) |
(2992) 0x690df6 MOV -0x108(%RBP),%RDX |
(2992) 0x690dfd MOV $-0x5555555555555555,%RDI |
(2992) 0x690e07 JG 6905c0 |
(2991) 0x690e0d JMP 690450 |
0x690e12 MOV -0xc0(%RBP),%RBX |
0x690e19 TEST %RBX,%RBX |
0x690e1c JE 690e88 |
0x690e1e MOV %RBX,%RDI |
0x690e21 CALL fa6fc0 <@plt_start@+0x3b10> |
0x690e26 RDTSCP |
0x690e29 MOV %EAX,%EAX |
0x690e2b SAL $0x20,%RDX |
0x690e2f OR %RAX,%RDX |
0x690e32 MOV %RDX,%RAX |
0x690e35 SUB 0x130(%RBX),%RAX |
0x690e3c JAE 690e47 |
0x690e3e MOVB $0x1,0x8f0(%RBX) |
0x690e45 XOR %EAX,%EAX |
0x690e47 ADD %RAX,0x128(%RBX) |
0x690e4e INCL 0x120(%RBX) |
0x690e54 MOV 0x8c8(%RBX),%RAX |
0x690e5b CMP 0x8d0(%RBX),%RAX |
0x690e62 JE 690e88 |
0x690e64 MOV 0x8e0(%RBX),%EAX |
0x690e6a DEC %EAX |
0x690e6c MOV %EAX,0x8e0(%RBX) |
0x690e72 CMP $0x2,%EAX |
0x690e75 JNE 690e88 |
0x690e77 MOVL $0xc,0x8e4(%RBX) |
0x690e81 MOV %RDX,0x8e8(%RBX) |
0x690e88 ADD $0x138,%RSP |
0x690e8f POP %RBX |
0x690e90 POP %R12 |
0x690e92 POP %R13 |
0x690e94 POP %R14 |
0x690e96 POP %R15 |
0x690e98 POP %RBP |
0x690e99 RET |
0x690e9a LEA -0x3bba4f(%RIP),%RDI |
0x690ea1 LEA -0x40e89e(%RIP),%RSI |
0x690ea8 LEA -0x361d07(%RIP),%RDX |
0x690eaf LEA -0x4297c4(%RIP),%RCX |
0x690eb6 MOV $0x167,%R8D |
0x690ebc CALL fa35d0 <@plt_start@+0x120> |
0x690ec1 LEA -0x3bba76(%RIP),%RDI |
0x690ec8 LEA -0x40e8c5(%RIP),%RSI |
0x690ecf LEA -0x361d2e(%RIP),%RDX |
0x690ed6 LEA -0x4297eb(%RIP),%RCX |
0x690edd MOV $0x167,%R8D |
0x690ee3 CALL fa35d0 <@plt_start@+0x120> |
0x690ee8 LEA -0x44c93a(%RIP),%RDI |
0x690eef LEA -0x3d70b8(%RIP),%RSI |
0x690ef6 LEA -0x397cc2(%RIP),%RDX |
0x690efd LEA -0x429812(%RIP),%RCX |
0x690f04 MOV $0x170,%R8D |
0x690f0a CALL fa35d0 <@plt_start@+0x120> |
0x690f0f LEA -0x44c961(%RIP),%RDI |
0x690f16 LEA -0x3d70df(%RIP),%RSI |
0x690f1d LEA -0x397ce9(%RIP),%RDX |
0x690f24 LEA -0x429839(%RIP),%RCX |
0x690f2b MOV $0x170,%R8D |
0x690f31 CALL fa35d0 <@plt_start@+0x120> |
0x690f36 LEA -0x3f27ef(%RIP),%RDI |
0x690f3d CALL fa3910 <@plt_start@+0x460> |
0x690f42 LEA -0x3f27fb(%RIP),%RDI |
0x690f49 CALL fa3910 <@plt_start@+0x460> |
0x690f4e JMP 690f71 |
0x690f50 MOV %RAX,%RBX |
0x690f53 LEA -0x150(%RBP),%RDI |
0x690f5a CALL fa8780 <@plt_start@+0x52d0> |
0x690f5f JMP 690f74 |
0x690f61 MOV %RAX,%RDI |
0x690f64 CALL 4abc30 <__clang_call_terminate> |
0x690f69 MOV %RAX,%RDI |
0x690f6c CALL 4abc30 <__clang_call_terminate> |
0x690f71 MOV %RAX,%RBX |
0x690f74 LEA -0x58(%RBP),%RDI |
0x690f78 CALL fa8780 <@plt_start@+0x52d0> |
0x690f7d MOV %RBX,%RDI |
0x690f80 CALL fa3770 <@plt_start@+0x2c0> |
0x690f85 NOPW %CS:(%RAX,%RAX,1) |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►98.98+ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2308 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 | |
►1.02+ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►99.53+ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2308 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►74.85+ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2308 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 | |
►14.71+ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2308 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
►10.20+ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2308 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►85.31+ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2308 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 | |
►10.49+ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2308 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
►3.85+ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2308 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►81.47+ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2308 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 | |
►14.22+ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2308 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
►4.09+ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2308 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►97.49+ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2308 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 | |
►2.51+ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2308 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►82.43+ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2308 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 | |
►8.21+ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2308 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
►6.96+ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2308 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
►2.18+ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2308 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►99.85+ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2308 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 |
Path / |
The code analyzed by CQA in that panel excludes loops and represents 0.00% of application time for run 1x1
Source file and lines | domdec.cpp:358-463 |
Module | libgromacs_mpi.so.9.0.0 |
nb instructions | 141 |
nb uops | 238 |
loop length | 709 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 11 |
micro-operation queue | 39.67 cycles |
front end | 39.67 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 16.00 | 16.00 | 15.75 | 15.75 | 12.50 | 16.33 | 16.33 | 16.33 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
cycles | 16.00 | 16.00 | 15.75 | 15.75 | 12.50 | 16.33 | 16.33 | 16.33 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 39.67 |
Dispatch | 16.33 |
Overall L1 | 39.67 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 10% |
load | 10% |
store | 10% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 11% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput | Vectorization |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
SUB $0x138,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RDX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
MOV %RSI,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %RDI,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
TEST %RDX,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JE 6903c8 <_Z9dd_move_fP12gmx_domdec_tPN3gmx20ForceWithShiftForcesEP13gmx_wallcycle+0x88> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
CALL fa6fc0 <@plt_start@+0x3b10> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
RDTSCP | 46 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 65 | N/A |
MOV %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
SAL $0x20,%RDX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (12.5%) |
OR %RAX,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
MOV %RDX,0x130(%RBX) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV 0x8c8(%RBX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
CMP 0x8d0(%RBX),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (12.5%) |
JE 6903c8 <_Z9dd_move_fP12gmx_domdec_tPN3gmx20ForceWithShiftForcesEP13gmx_wallcycle+0x88> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV 0x8e0(%RBX),%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
INC %ECX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %ECX,0x8e0(%RBX) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
CMP $0x3,%ECX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
JNE 6903c8 <_Z9dd_move_fP12gmx_domdec_tPN3gmx20ForceWithShiftForcesEP13gmx_wallcycle+0x88> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOVSXD 0x8e4(%RBX),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
IMUL $0x4e0,%RCX,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | N/A |
INCL 0x120(%RCX,%RAX,1) | 2 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
SUB 0x8e8(%RBX),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (12.5%) |
ADD %RDX,0x128(%RCX,%RAX,1) | 2 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (12.5%) |
MOV %RBX,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV 0x74(%R15),%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
TEST %ECX,%ECX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
JLE 690e12 <_Z9dd_move_fP12gmx_domdec_tPN3gmx20ForceWithShiftForcesEP13gmx_wallcycle+0xad2> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV -0xa0(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV (%RAX),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
MOV 0x20(%RAX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RAX,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV 0x130(%R15),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV 0x298(%R8),%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (6.3%) |
MOV 0x62c(%R8),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RAX,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA 0x580(%R8),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA 0x678(%R8),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RAX,-0x100(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA 0x6b0(%R8),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RAX,-0xf8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV $-0x5555555555555555,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (12.5%) |
MOV %R15,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %R8,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %RDX,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
JMP 690472 <_Z9dd_move_fP12gmx_domdec_tPN3gmx20ForceWithShiftForcesEP13gmx_wallcycle+0x132> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
MOV -0xc0(%RBP),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
TEST %RBX,%RBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JE 690e88 <_Z9dd_move_fP12gmx_domdec_tPN3gmx20ForceWithShiftForcesEP13gmx_wallcycle+0xb48> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
CALL fa6fc0 <@plt_start@+0x3b10> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
RDTSCP | 46 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 65 | N/A |
MOV %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
SAL $0x20,%RDX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (12.5%) |
OR %RAX,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
MOV %RDX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
SUB 0x130(%RBX),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
JAE 690e47 <_Z9dd_move_fP12gmx_domdec_tPN3gmx20ForceWithShiftForcesEP13gmx_wallcycle+0xb07> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOVB $0x1,0x8f0(%RBX) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (1.6%) |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | N/A |
ADD %RAX,0x128(%RBX) | 2 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (12.5%) |
INCL 0x120(%RBX) | 2 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
MOV 0x8c8(%RBX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
CMP 0x8d0(%RBX),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (12.5%) |
JE 690e88 <_Z9dd_move_fP12gmx_domdec_tPN3gmx20ForceWithShiftForcesEP13gmx_wallcycle+0xb48> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV 0x8e0(%RBX),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
DEC %EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %EAX,0x8e0(%RBX) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
CMP $0x2,%EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
JNE 690e88 <_Z9dd_move_fP12gmx_domdec_tPN3gmx20ForceWithShiftForcesEP13gmx_wallcycle+0xb48> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOVL $0xc,0x8e4(%RBX) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOV %RDX,0x8e8(%RBX) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
ADD $0x138,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
LEA -0x3bba4f(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x40e89e(%RIP),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x361d07(%RIP),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x4297c4(%RIP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV $0x167,%R8D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CALL fa35d0 <@plt_start@+0x120> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
LEA -0x3bba76(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x40e8c5(%RIP),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x361d2e(%RIP),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x4297eb(%RIP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV $0x167,%R8D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CALL fa35d0 <@plt_start@+0x120> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
LEA -0x44c93a(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x3d70b8(%RIP),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x397cc2(%RIP),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x429812(%RIP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV $0x170,%R8D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CALL fa35d0 <@plt_start@+0x120> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
LEA -0x44c961(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x3d70df(%RIP),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x397ce9(%RIP),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x429839(%RIP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV $0x170,%R8D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CALL fa35d0 <@plt_start@+0x120> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
LEA -0x3f27ef(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CALL fa3910 <@plt_start@+0x460> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
LEA -0x3f27fb(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CALL fa3910 <@plt_start@+0x460> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
JMP 690f71 <_Z9dd_move_fP12gmx_domdec_tPN3gmx20ForceWithShiftForcesEP13gmx_wallcycle+0xc31> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
LEA -0x150(%RBP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CALL fa8780 <@plt_start@+0x52d0> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
JMP 690f74 <_Z9dd_move_fP12gmx_domdec_tPN3gmx20ForceWithShiftForcesEP13gmx_wallcycle+0xc34> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
CALL 4abc30 <__clang_call_terminate> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
CALL 4abc30 <__clang_call_terminate> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
LEA -0x58(%RBP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CALL fa8780 <@plt_start@+0x52d0> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
CALL fa3770 <@plt_start@+0x2c0> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
The code analyzed by CQA in that panel excludes loops and represents 0.00% of application time for run 1x1
Source file and lines | domdec.cpp:358-463 |
Module | libgromacs_mpi.so.9.0.0 |
nb instructions | 141 |
nb uops | 238 |
loop length | 709 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 11 |
micro-operation queue | 39.67 cycles |
front end | 39.67 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 16.00 | 16.00 | 15.75 | 15.75 | 12.50 | 16.33 | 16.33 | 16.33 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
cycles | 16.00 | 16.00 | 15.75 | 15.75 | 12.50 | 16.33 | 16.33 | 16.33 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 39.67 |
Dispatch | 16.33 |
Overall L1 | 39.67 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 10% |
load | 10% |
store | 10% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 11% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput | Vectorization |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
SUB $0x138,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RDX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
MOV %RSI,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %RDI,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
TEST %RDX,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JE 6903c8 <_Z9dd_move_fP12gmx_domdec_tPN3gmx20ForceWithShiftForcesEP13gmx_wallcycle+0x88> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
CALL fa6fc0 <@plt_start@+0x3b10> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
RDTSCP | 46 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 65 | N/A |
MOV %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
SAL $0x20,%RDX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (12.5%) |
OR %RAX,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
MOV %RDX,0x130(%RBX) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV 0x8c8(%RBX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
CMP 0x8d0(%RBX),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (12.5%) |
JE 6903c8 <_Z9dd_move_fP12gmx_domdec_tPN3gmx20ForceWithShiftForcesEP13gmx_wallcycle+0x88> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV 0x8e0(%RBX),%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
INC %ECX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %ECX,0x8e0(%RBX) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
CMP $0x3,%ECX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
JNE 6903c8 <_Z9dd_move_fP12gmx_domdec_tPN3gmx20ForceWithShiftForcesEP13gmx_wallcycle+0x88> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOVSXD 0x8e4(%RBX),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
IMUL $0x4e0,%RCX,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | N/A |
INCL 0x120(%RCX,%RAX,1) | 2 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
SUB 0x8e8(%RBX),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (12.5%) |
ADD %RDX,0x128(%RCX,%RAX,1) | 2 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (12.5%) |
MOV %RBX,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV 0x74(%R15),%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
TEST %ECX,%ECX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
JLE 690e12 <_Z9dd_move_fP12gmx_domdec_tPN3gmx20ForceWithShiftForcesEP13gmx_wallcycle+0xad2> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV -0xa0(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV (%RAX),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
MOV 0x20(%RAX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RAX,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV 0x130(%R15),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV 0x298(%R8),%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (6.3%) |
MOV 0x62c(%R8),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RAX,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA 0x580(%R8),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA 0x678(%R8),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RAX,-0x100(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA 0x6b0(%R8),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RAX,-0xf8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV $-0x5555555555555555,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (12.5%) |
MOV %R15,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %R8,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %RDX,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
JMP 690472 <_Z9dd_move_fP12gmx_domdec_tPN3gmx20ForceWithShiftForcesEP13gmx_wallcycle+0x132> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
MOV -0xc0(%RBP),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
TEST %RBX,%RBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JE 690e88 <_Z9dd_move_fP12gmx_domdec_tPN3gmx20ForceWithShiftForcesEP13gmx_wallcycle+0xb48> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
CALL fa6fc0 <@plt_start@+0x3b10> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
RDTSCP | 46 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 65 | N/A |
MOV %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
SAL $0x20,%RDX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (12.5%) |
OR %RAX,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
MOV %RDX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
SUB 0x130(%RBX),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
JAE 690e47 <_Z9dd_move_fP12gmx_domdec_tPN3gmx20ForceWithShiftForcesEP13gmx_wallcycle+0xb07> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOVB $0x1,0x8f0(%RBX) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (1.6%) |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | N/A |
ADD %RAX,0x128(%RBX) | 2 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (12.5%) |
INCL 0x120(%RBX) | 2 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
MOV 0x8c8(%RBX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
CMP 0x8d0(%RBX),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (12.5%) |
JE 690e88 <_Z9dd_move_fP12gmx_domdec_tPN3gmx20ForceWithShiftForcesEP13gmx_wallcycle+0xb48> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV 0x8e0(%RBX),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
DEC %EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %EAX,0x8e0(%RBX) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
CMP $0x2,%EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
JNE 690e88 <_Z9dd_move_fP12gmx_domdec_tPN3gmx20ForceWithShiftForcesEP13gmx_wallcycle+0xb48> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOVL $0xc,0x8e4(%RBX) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOV %RDX,0x8e8(%RBX) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
ADD $0x138,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
LEA -0x3bba4f(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x40e89e(%RIP),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x361d07(%RIP),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x4297c4(%RIP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV $0x167,%R8D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CALL fa35d0 <@plt_start@+0x120> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
LEA -0x3bba76(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x40e8c5(%RIP),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x361d2e(%RIP),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x4297eb(%RIP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV $0x167,%R8D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CALL fa35d0 <@plt_start@+0x120> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
LEA -0x44c93a(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x3d70b8(%RIP),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x397cc2(%RIP),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x429812(%RIP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV $0x170,%R8D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CALL fa35d0 <@plt_start@+0x120> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
LEA -0x44c961(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x3d70df(%RIP),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x397ce9(%RIP),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0x429839(%RIP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV $0x170,%R8D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CALL fa35d0 <@plt_start@+0x120> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
LEA -0x3f27ef(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CALL fa3910 <@plt_start@+0x460> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
LEA -0x3f27fb(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CALL fa3910 <@plt_start@+0x460> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
JMP 690f71 <_Z9dd_move_fP12gmx_domdec_tPN3gmx20ForceWithShiftForcesEP13gmx_wallcycle+0xc31> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
LEA -0x150(%RBP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CALL fa8780 <@plt_start@+0x52d0> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
JMP 690f74 <_Z9dd_move_fP12gmx_domdec_tPN3gmx20ForceWithShiftForcesEP13gmx_wallcycle+0xc34> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
CALL 4abc30 <__clang_call_terminate> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
CALL 4abc30 <__clang_call_terminate> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
LEA -0x58(%RBP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CALL fa8780 <@plt_start@+0x52d0> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
CALL fa3770 <@plt_start@+0x2c0> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
Run 1x1 | Number processes: 1; Number processes per node: 1; OMP_NUM_THREADS: 1 |
---|---|
Run 2x1 | Number processes: 2; Number processes per node: 2; OMP_NUM_THREADS: 1 |
Run 4x1 | Number processes: 4; Number processes per node: 4; OMP_NUM_THREADS: 1 |
Run 8x1 | Number processes: 8; Number processes per node: 8; OMP_NUM_THREADS: 1 |
Run 16x1 | Number processes: 16; Number processes per node: 16; OMP_NUM_THREADS: 1 |
Run 32x1 | Number processes: 32; Number processes per node: 32; OMP_NUM_THREADS: 1 |
Run 64x1 | Number processes: 64; Number processes per node: 64; OMP_NUM_THREADS: 1 |
Run 128x1 | Number processes: 128; Number processes per node: 128; OMP_NUM_THREADS: 1 |
Run 192x1 | Number processes: 192; Number nodes: 1; Number processes per node: 192; Run Command: <executable> mdrun -s ion_channel.tpr -nsteps 10000 -pin on -deffnm aocc; MPI Command: mpirun -genv I_MPI_FABRICS=shm -n <number_processes>; Dataset: ; Run Directory: .; OMP_NUM_THREADS: 1 |
(1x1) Efficiency | (1x1) Potential Speed-Up (%) | (2x1) Efficiency | (2x1) Potential Speed-Up (%) | (4x1) Efficiency | (4x1) Potential Speed-Up (%) | (8x1) Efficiency | (8x1) Potential Speed-Up (%) | (16x1) Efficiency | (16x1) Potential Speed-Up (%) | (32x1) Efficiency | (32x1) Potential Speed-Up (%) | (64x1) Efficiency | (64x1) Potential Speed-Up (%) | (128x1) Efficiency | (128x1) Potential Speed-Up (%) | (192x1) Efficiency | (192x1) Potential Speed-Up (%) |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
1 | 0 | 1 | 0 | 1 | 0 | 1 | 0 | 1 | 0 | 1 | 0 | 1 | 0 | 1 | 0 |
Run | Number of threads | Efficiency (ideal is 1) | Speedup | Ideal Speedup | Time (s) | Coverage (%) |
---|---|---|---|---|---|---|
1x1 | ||||||
2x1 | 2 | 1 | 1 | 2 | 0.27499994635582 | 0.054052166640759 |
4x1 | 4 | 1 | 1 | 4 | 0.32499986886978 | 0.1074408814311 |
8x1 | 8 | 1 | 1 | 8 | 0.70999974012375 | 0.34065574407578 |
16x1 | 16 | 1 | 1 | 16 | 0.27999994158745 | 0.21709632873535 |
32x1 | 20 | 1 | 1 | 32 | 0.16499997675419 | 0.14123259484768 |
64x1 | 40 | 1 | 1 | 64 | 0.15499998629093 | 0.14950920641422 |
128x1 | 84 | 1 | 1 | 128 | 0.10499998927116 | 0.22429171204567 |
192x1 | 128 | 1 | 1 | 192 | 0.10499999672174 | 0.25701260566711 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼dd_move_f(gmx_domdec_t*, gmx::ForceWithShiftForces*, gmx_wallcycle*)– | 0.26 | 0.03 |
▼Loop 2991 - domdec.cpp:367-453 - libgromacs_mpi.so.9.0.0– | 0.00 | 0.01 |
▼Loop 2992 - domdec.cpp:381-453 - libgromacs_mpi.so.9.0.0– | 0.01 | 0.01 |
○Loop 2993 - domdec.cpp:415-419 - libgromacs_mpi.so.9.0.0 | 0.23 | 0.05 |
○Loop 2994 - domdec.cpp:426-435 - libgromacs_mpi.so.9.0.0 | 0.01 | 0.01 |
▼Loop 2998 - domdec.cpp:401-405 - libgromacs_mpi.so.9.0.0– | 0.00 | 0.00 |
○Loop 2999 - domdec.cpp:403-405 - libgromacs_mpi.so.9.0.0 | 0.00 | 0.00 |
○Loop 3000 - domdec.cpp:403-405 - libgromacs_mpi.so.9.0.0 | 0.00 | 0.00 |
○Loop 2997 - domdec.cpp:403-405 - libgromacs_mpi.so.9.0.0 | 0.00 | 0.00 |
○Loop 3001 - stl_uninitialized.h:1031-1031 - libgromacs_mpi.so.9.0.0 | 0.00 | 0.00 |
○Loop 2996 - domdec.cpp:442-453 - libgromacs_mpi.so.9.0.0 | 0.00 | 0.00 |
○Loop 2995 - stl_iterator.h:1054-1182 - libgromacs_mpi.so.9.0.0 | 0.00 | 0.00 |
○Loop 3002 - stl_uninitialized.h:1031-1031 - libgromacs_mpi.so.9.0.0 | 0.00 | 0.00 |