Function: do_redist_pos_coeffs(gmx_pme_t*, t_commrec const*, bool, gmx::ArrayRef<gmx::BasicVector<fl ... | Module: libgromacs_mpi.so.9.0.0 | Source: pme_redistribute.cpp:126-506 [...] | Coverage (incl. loops): 0.21% | (excl. loops): 0.00% |
---|
Function: do_redist_pos_coeffs(gmx_pme_t*, t_commrec const*, bool, gmx::ArrayRef<gmx::BasicVector<fl ... | Module: libgromacs_mpi.so.9.0.0 | Source: pme_redistribute.cpp:126-506 [...] | Coverage (incl. loops): 0.21% | (excl. loops): 0.00% |
---|
/home/eoseret/gromacs-2024.2/src/gromacs/ewald/pme_redistribute.cpp: 126 - 506 |
-------------------------------------------------------------------------------- |
126: int nthread = atc->nthread; |
127: |
128: #pragma omp parallel for num_threads(nthread) schedule(static) |
[...] |
145: for (int thread = 1; thread < nthread; thread++) |
146: { |
147: for (int slab = 0; slab < atc->nslab; slab++) |
148: { |
149: atc->count_thread[0][slab] += atc->count_thread[thread][slab]; |
[...] |
252: MPI_Status stat; |
[...] |
265: if (nbyte_s > 0 && nbyte_r > 0) |
266: { |
267: MPI_Sendrecv( |
268: buf_s, nbyte_s, MPI_BYTE, dest, shift, buf_r, nbyte_r, MPI_BYTE, src, shift, atc->mpi_comm, &stat); |
269: } |
270: else if (nbyte_s > 0) |
271: { |
272: MPI_Send(buf_s, nbyte_s, MPI_BYTE, dest, shift, atc->mpi_comm); |
273: } |
274: else if (nbyte_r > 0) |
275: { |
276: MPI_Recv(buf_r, nbyte_r, MPI_BYTE, src, shift, atc->mpi_comm, &stat); |
[...] |
290: nnodes_comm = std::min(2 * atc->maxshift, atc->nslab - 1); |
291: |
292: auto sendCount = atc->sendCount(); |
293: int nsend = 0; |
294: for (i = 0; i < nnodes_comm; i++) |
295: { |
296: const int commnode = atc->slabCommSetup[i].node_dest; |
297: atc->bufferIndices[commnode] = nsend; |
298: nsend += sendCount[commnode]; |
299: } |
300: if (bX) |
301: { |
302: if (sendCount[atc->slabIndex] + nsend != x.ssize()) |
303: { |
304: gmx_fatal( |
305: FARGS, |
306: "%zd particles communicated to PME rank %d are more than 2/3 times the cut-off " |
307: "out of the domain decomposition cell of their charge group in dimension %c.\n" |
308: "This usually means that your system is not well equilibrated.", |
309: x.ssize() - (sendCount[atc->slabIndex] + nsend), |
310: pme->nodeid, |
311: 'x' + atc->dimind); |
312: } |
313: |
314: if (nsend > pme->buf_nalloc) |
315: { |
316: pme->buf_nalloc = over_alloc_dd(nsend); |
317: srenew(pme->bufv, pme->buf_nalloc); |
318: srenew(pme->bufr, pme->buf_nalloc); |
319: } |
320: |
321: int numAtoms = sendCount[atc->slabIndex]; |
322: for (i = 0; i < nnodes_comm; i++) |
323: { |
324: const int commnode = atc->slabCommSetup[i].node_dest; |
325: int scount = sendCount[commnode]; |
326: /* Communicate the count */ |
327: if (debug) |
328: { |
329: fprintf(debug, |
330: "dimind %d PME rank %d send to rank %d: %d\n", |
331: atc->dimind, |
332: atc->slabIndex, |
[...] |
338: numAtoms += atc->slabCommSetup[i].rcount; |
339: } |
340: |
341: atc->setNumAtoms(numAtoms); |
342: } |
343: |
344: local_pos = 0; |
345: for (gmx::Index i = 0; i < x.ssize(); i++) |
346: { |
347: const int slabIndex = atc->pd[i]; |
348: if (slabIndex == atc->slabIndex) |
349: { |
350: /* Copy direct to the receive buffer */ |
351: if (bX) |
352: { |
353: copy_rvec(x[i], atc->xBuffer[local_pos]); |
354: } |
355: atc->coefficientBuffer[local_pos] = data[i]; |
356: local_pos++; |
[...] |
364: copy_rvec(x[i], pme->bufv[buf_index]); |
365: } |
366: pme->bufr[buf_index] = data[i]; |
367: buf_index++; |
368: } |
369: } |
370: |
371: buf_pos = 0; |
372: for (i = 0; i < nnodes_comm; i++) |
373: { |
374: const int scount = atc->sendCount()[atc->slabCommSetup[i].node_dest]; |
375: const int rcount = atc->slabCommSetup[i].rcount; |
376: if (scount > 0 || rcount > 0) |
377: { |
378: if (bX) |
[...] |
384: pme->bufv + buf_pos, |
385: scount * sizeof(rvec), |
386: atc->xBuffer.data() + local_pos, |
387: rcount * sizeof(rvec)); |
[...] |
393: pme->bufr + buf_pos, |
394: scount * sizeof(real), |
395: atc->coefficientBuffer.data() + local_pos, |
396: rcount * sizeof(real)); |
397: buf_pos += scount; |
398: local_pos += atc->slabCommSetup[i].rcount; |
[...] |
479: { |
480: for (int d = pme->ndecompdim - 1; d >= 0; d--) |
481: { |
482: gmx::ArrayRef<const gmx::RVec> xRef; |
483: gmx::ArrayRef<const real> param_d; |
484: if (d == pme->ndecompdim - 1) |
[...] |
494: xRef = atc.x; |
495: param_d = atc.coefficient; |
496: } |
497: PmeAtomComm& atc = pme->atc[d]; |
498: atc.pd.resize(xRef.size()); |
499: pme_calc_pidx_wrapper(xRef, pme->recipbox, &atc); |
500: /* Redistribute x (only once) and qA/c6A or qB/c6B */ |
501: if (haveDDAtomOrdering(*cr)) |
502: { |
503: dd_pmeredist_pos_coeffs(pme, bFirst, xRef, param_d, &atc); |
504: } |
505: } |
506: } |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/ext/new_allocator.h: 145 - 145 |
-------------------------------------------------------------------------------- |
145: ::operator delete(__p |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/basic_string.h: 195 - 239 |
-------------------------------------------------------------------------------- |
195: { return _M_dataplus._M_p; } |
[...] |
211: return std::pointer_traits<const_pointer>::pointer_to(*_M_local_buf); |
[...] |
230: { return _M_data() == _M_local_data(); } |
[...] |
239: if (!_M_is_local()) |
/home/eoseret/gromacs-2024.2/src/gromacs/mdtypes/commrec.h: 189 - 189 |
-------------------------------------------------------------------------------- |
189: return cr.dd != nullptr; |
/home/eoseret/gromacs-2024.2/api/legacy/include/gromacs/utility/smalloc.h: 212 - 212 |
-------------------------------------------------------------------------------- |
212: ptr = static_cast<T*>(save_realloc(name, file, line, ptr, nelem, sizeof(T))); |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/stl_vector.h: 919 - 1798 |
-------------------------------------------------------------------------------- |
919: { return size_type(this->_M_impl._M_finish - this->_M_impl._M_start); } |
[...] |
939: if (__new_size > size()) |
940: _M_default_append(__new_size - size()); |
941: else if (__new_size < size()) |
942: _M_erase_at_end(this->_M_impl._M_start + __new_size); |
[...] |
1046: return *(this->_M_impl._M_start + __n); |
[...] |
1169: { return _M_data_ptr(this->_M_impl._M_start); } |
[...] |
1794: if (size_type __n = this->_M_impl._M_finish - __pos) |
1795: { |
1796: std::_Destroy(__pos, this->_M_impl._M_finish, |
1797: _M_get_Tp_allocator()); |
1798: this->_M_impl._M_finish = __pos; |
/home/eoseret/gromacs-2024.2/api/legacy/include/gromacs/utility/arrayref.h: 85 - 180 |
-------------------------------------------------------------------------------- |
85: constexpr auto operator-(ArrayRefIter other) const noexcept { return it_ - other.it_; } |
[...] |
180: ArrayRef(U&& o) : begin_(o.data()), end_(o.data() + o.size()) |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/unique_ptr.h: 360 - 362 |
-------------------------------------------------------------------------------- |
360: if (__ptr != nullptr) |
361: get_deleter()(std::move(__ptr)); |
362: __ptr = pointer(); |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/fs_path.h: 313 - 313 |
-------------------------------------------------------------------------------- |
313: ~path() = default; |
/home/eoseret/gromacs-2024.2/api/legacy/include/gromacs/math/vec.h: 204 - 206 |
-------------------------------------------------------------------------------- |
204: b[XX] = a[XX]; |
205: b[YY] = a[YY]; |
206: b[ZZ] = a[ZZ]; |
0xc0a480 PUSH %RBP |
0xc0a481 MOV %RSP,%RBP |
0xc0a484 PUSH %R15 |
0xc0a486 PUSH %R14 |
0xc0a488 PUSH %R13 |
0xc0a48a PUSH %R12 |
0xc0a48c PUSH %RBX |
0xc0a48d SUB $0xd8,%RSP |
0xc0a494 MOV %R8,-0xd0(%RBP) |
0xc0a49b MOV %RCX,-0xc8(%RBP) |
0xc0a4a2 MOV %EDX,-0x4c(%RBP) |
0xc0a4a5 MOV %RSI,-0xc0(%RBP) |
0xc0a4ac MOV %RDI,-0x38(%RBP) |
0xc0a4b0 MOV (%RDI),%ECX |
0xc0a4b2 TEST %ECX,%ECX |
0xc0a4b4 JLE c0ae99 |
0xc0a4ba MOV -0x38(%RBP),%RAX |
0xc0a4be ADD $0x5d0,%RAX |
0xc0a4c4 MOV %RAX,-0xb8(%RBP) |
0xc0a4cb JMP c0a4e5 |
0xc0a4cd NOPL (%RAX) |
(17422) 0xc0a4d0 CMPQ $0x1,-0xf0(%RBP) |
(17422) 0xc0a4d8 MOV -0xf8(%RBP),%RCX |
(17422) 0xc0a4df JLE c0ae99 |
(17422) 0xc0a4e5 MOV %RCX,%RDI |
(17422) 0xc0a4e8 LEA -0x1(%RCX),%RDX |
(17422) 0xc0a4ec MOV -0x38(%RBP),%RAX |
(17422) 0xc0a4f0 MOV (%RAX),%ECX |
(17422) 0xc0a4f2 MOV 0x5b8(%RAX),%R8 |
(17422) 0xc0a4f9 LEA 0x10(%RBP),%RAX |
(17422) 0xc0a4fd MOV -0xc8(%RBP),%RBX |
(17422) 0xc0a504 MOV -0xd0(%RBP),%R12 |
(17422) 0xc0a50b CMP %RCX,%RDI |
(17422) 0xc0a50e JE c0a531 |
(17422) 0xc0a510 LEA (%RDI,%RDI,2),%RAX |
(17422) 0xc0a514 SAL $0x7,%RAX |
(17422) 0xc0a518 MOV 0x80(%R8,%RAX,1),%RBX |
(17422) 0xc0a520 MOV 0x88(%R8,%RAX,1),%R12 |
(17422) 0xc0a528 ADD %R8,%RAX |
(17422) 0xc0a52b ADD $0x90,%RAX |
(17422) 0xc0a531 MOV (%RAX),%RAX |
(17422) 0xc0a534 MOV %RAX,-0x78(%RBP) |
(17422) 0xc0a538 MOV %RDX,-0xf8(%RBP) |
(17422) 0xc0a53f MOV %EDX,%EAX |
(17422) 0xc0a541 LEA (%RAX,%RAX,2),%R15 |
(17422) 0xc0a545 SAL $0x7,%R15 |
(17422) 0xc0a549 LEA (%R8,%R15,1),%RAX |
(17422) 0xc0a54d MOV %RAX,-0x58(%RBP) |
(17422) 0xc0a551 LEA (%R8,%R15,1),%R14 |
(17422) 0xc0a555 ADD $0x48,%R14 |
(17422) 0xc0a559 SUB %RBX,%R12 |
(17422) 0xc0a55c MOV %R12,-0xe8(%RBP) |
(17422) 0xc0a563 SAR $0x2,%R12 |
(17422) 0xc0a567 MOV $-0x5555555555555555,%RAX |
(17422) 0xc0a571 IMUL %RAX,%R12 |
(17422) 0xc0a575 MOV 0x48(%R8,%R15,1),%RCX |
(17422) 0xc0a57a MOV 0x50(%R8,%R15,1),%RAX |
(17422) 0xc0a57f MOV %RAX,%RDX |
(17422) 0xc0a582 SUB %RCX,%RDX |
(17422) 0xc0a585 SAR $0x2,%RDX |
(17422) 0xc0a589 MOV %R12,%RSI |
(17422) 0xc0a58c SUB %RDX,%RSI |
(17422) 0xc0a58f MOV %R8,-0x48(%RBP) |
(17422) 0xc0a593 MOV %RDI,-0xf0(%RBP) |
(17422) 0xc0a59a JBE c0a5b0 |
(17422) 0xc0a59c MOV %R14,%RDI |
(17422) 0xc0a59f CALL fb5380 <@plt_start@+0x11ed0> |
(17422) 0xc0a5a4 JMP c0a5c0 |
0xc0a5a6 NOPW %CS:(%RAX,%RAX,1) |
(17422) 0xc0a5b0 JAE c0a5c0 |
(17422) 0xc0a5b2 LEA (%RCX,%R12,4),%RCX |
(17422) 0xc0a5b6 CMP %RCX,%RAX |
(17422) 0xc0a5b9 JE c0a5c0 |
(17422) 0xc0a5bb MOV %RCX,0x8(%R14) |
(17422) 0xc0a5bf NOP |
(17422) 0xc0a5c0 MOV %R14,-0xe0(%RBP) |
(17422) 0xc0a5c7 MOV %R12,%R13 |
(17422) 0xc0a5ca LEA (%R12,%R12,2),%RAX |
(17422) 0xc0a5ce LEA (%RBX,%RAX,4),%R12 |
(17422) 0xc0a5d2 LEA 0x3d4477(%RIP),%R14 |
(17422) 0xc0a5d9 MOV %R14,%RDI |
(17422) 0xc0a5dc CALL fa67a0 <@plt_start@+0x32f0> |
(17422) 0xc0a5e1 MOV %RBX,-0xd8(%RBP) |
(17422) 0xc0a5e8 MOV %RBX,-0xb0(%RBP) |
(17422) 0xc0a5ef MOV %R12,-0xa8(%RBP) |
(17422) 0xc0a5f6 MOV -0xb8(%RBP),%RCX |
(17422) 0xc0a5fd MOV %RCX,-0x70(%RBP) |
(17422) 0xc0a601 MOV -0x58(%RBP),%RCX |
(17422) 0xc0a605 MOV %RCX,-0x88(%RBP) |
(17422) 0xc0a60c MOV -0x48(%RBP),%R12 |
(17422) 0xc0a610 MOV 0x130(%R12,%R15,1),%EDX |
(17422) 0xc0a618 MOV %EDX,-0x50(%RBP) |
(17422) 0xc0a61b MOV %R14,%RDI |
(17422) 0xc0a61e MOV %EAX,%ESI |
(17422) 0xc0a620 CALL fa67c0 <@plt_start@+0x3310> |
(17422) 0xc0a625 SUB $0x8,%RSP |
(17422) 0xc0a629 LEA 0x3d4438(%RIP),%RDI |
(17422) 0xc0a630 MOV $0x4,%ESI |
(17422) 0xc0a635 LEA 0x924(%RIP),%RDX |
(17422) 0xc0a63c LEA -0x50(%RBP),%RCX |
(17422) 0xc0a640 LEA -0xb0(%RBP),%R8 |
(17422) 0xc0a647 LEA -0x70(%RBP),%R9 |
(17422) 0xc0a64b XOR %EAX,%EAX |
(17422) 0xc0a64d LEA -0x88(%RBP),%R10 |
(17422) 0xc0a654 PUSH %R10 |
(17422) 0xc0a656 CALL fa67d0 <@plt_start@+0x3320> |
(17422) 0xc0a65b ADD $0x10,%RSP |
(17422) 0xc0a65f MOV -0x50(%RBP),%ESI |
(17422) 0xc0a662 CMP $0x2,%ESI |
(17422) 0xc0a665 JL c0a6d0 |
(17422) 0xc0a667 MOV -0x88(%RBP),%RAX |
(17422) 0xc0a66e MOV 0x4(%RAX),%EDX |
(17422) 0xc0a671 MOV $0x1,%ECX |
(17422) 0xc0a676 JMP c0a68e |
0xc0a678 NOPL (%RAX,%RAX,1) |
(17429) 0xc0a680 MOV -0x50(%RBP),%ESI |
(17429) 0xc0a683 INC %RCX |
(17429) 0xc0a686 MOVSXD %ESI,%RDI |
(17429) 0xc0a689 CMP %RDI,%RCX |
(17429) 0xc0a68c JGE c0a6d0 |
(17429) 0xc0a68e TEST %EDX,%EDX |
(17429) 0xc0a690 JLE c0a683 |
(17429) 0xc0a692 MOV 0x60(%RAX),%RDX |
(17429) 0xc0a696 LEA (%RCX,%RCX,2),%RSI |
(17429) 0xc0a69a MOV (%RDX,%RSI,8),%RSI |
(17429) 0xc0a69e MOV (%RDX),%RDI |
(17429) 0xc0a6a1 XOR %R8D,%R8D |
(17429) 0xc0a6a4 NOPW %CS:(%RAX,%RAX,1) |
(17430) 0xc0a6b0 MOV (%RSI,%R8,4),%EDX |
(17430) 0xc0a6b4 ADD %EDX,(%RDI,%R8,4) |
(17430) 0xc0a6b8 INC %R8 |
(17430) 0xc0a6bb MOVSXD 0x4(%RAX),%RDX |
(17430) 0xc0a6bf CMP %RDX,%R8 |
(17430) 0xc0a6c2 JL c0a6b0 |
(17429) 0xc0a6c4 JMP c0a680 |
0xc0a6c6 NOPW %CS:(%RAX,%RAX,1) |
(17422) 0xc0a6d0 MOV -0xc0(%RBP),%RAX |
(17422) 0xc0a6d7 CMPQ $0,0x40(%RAX) |
(17422) 0xc0a6dc JE c0a4d0 |
(17422) 0xc0a6e2 MOV 0x4(%R12,%R15,1),%ESI |
(17422) 0xc0a6e7 MOV 0x28(%R12,%R15,1),%EAX |
(17422) 0xc0a6ec ADD %EAX,%EAX |
(17422) 0xc0a6ee DEC %ESI |
(17422) 0xc0a6f0 CMP %EAX,%ESI |
(17422) 0xc0a6f2 CMOVGE %EAX,%ESI |
(17422) 0xc0a6f5 MOV 0x60(%R12,%R15,1),%RAX |
(17422) 0xc0a6fa MOV (%RAX),%RBX |
(17422) 0xc0a6fd MOV %ESI,%EDI |
(17422) 0xc0a6ff TEST %ESI,%ESI |
(17422) 0xc0a701 MOV %ESI,-0x60(%RBP) |
(17422) 0xc0a704 MOV %RDI,-0x40(%RBP) |
(17422) 0xc0a708 JLE c0a730 |
(17422) 0xc0a70a MOV 0x10(%R12,%R15,1),%RCX |
(17422) 0xc0a70f MOV 0x30(%R12,%R15,1),%RAX |
(17422) 0xc0a714 MOV %EDI,%EDX |
(17422) 0xc0a716 AND $0x3,%EDX |
(17422) 0xc0a719 CMP $0x4,%ESI |
(17422) 0xc0a71c JAE c0a738 |
(17422) 0xc0a71e XOR %ESI,%ESI |
(17422) 0xc0a720 XOR %R12D,%R12D |
(17422) 0xc0a723 JMP c0a78c |
0xc0a725 NOPW %CS:(%RAX,%RAX,1) |
(17422) 0xc0a730 XOR %R12D,%R12D |
(17422) 0xc0a733 JMP c0a7c5 |
(17422) 0xc0a738 AND $-0x4,%EDI |
(17422) 0xc0a73b XOR %ESI,%ESI |
(17422) 0xc0a73d MOV %RCX,%R8 |
(17422) 0xc0a740 XOR %R12D,%R12D |
(17422) 0xc0a743 NOPW %CS:(%RAX,%RAX,1) |
(17427) 0xc0a750 MOVSXD (%R8),%R9 |
(17427) 0xc0a753 MOV %R12D,(%RAX,%R9,4) |
(17427) 0xc0a757 ADD (%RBX,%R9,4),%R12D |
(17427) 0xc0a75b MOVSXD 0xc(%R8),%R9 |
(17427) 0xc0a75f MOV %R12D,(%RAX,%R9,4) |
(17427) 0xc0a763 ADD (%RBX,%R9,4),%R12D |
(17427) 0xc0a767 MOVSXD 0x18(%R8),%R9 |
(17427) 0xc0a76b MOV %R12D,(%RAX,%R9,4) |
(17427) 0xc0a76f ADD (%RBX,%R9,4),%R12D |
(17427) 0xc0a773 MOVSXD 0x24(%R8),%R9 |
(17427) 0xc0a777 MOV %R12D,(%RAX,%R9,4) |
(17427) 0xc0a77b ADD (%RBX,%R9,4),%R12D |
(17427) 0xc0a77f ADD $0x4,%RSI |
(17427) 0xc0a783 ADD $0x30,%R8 |
(17427) 0xc0a787 CMP %RSI,%RDI |
(17427) 0xc0a78a JNE c0a750 |
(17422) 0xc0a78c TEST %RDX,%RDX |
(17422) 0xc0a78f JE c0a7c5 |
(17422) 0xc0a791 LEA (%RSI,%RSI,2),%RSI |
(17422) 0xc0a795 LEA (%RCX,%RSI,4),%RCX |
(17422) 0xc0a799 SAL $0x2,%RDX |
(17422) 0xc0a79d LEA (%RDX,%RDX,2),%RDX |
(17422) 0xc0a7a1 XOR %ESI,%ESI |
(17422) 0xc0a7a3 NOPW %CS:(%RAX,%RAX,1) |
(17428) 0xc0a7b0 MOVSXD (%RCX,%RSI,1),%RDI |
(17428) 0xc0a7b4 MOV %R12D,(%RAX,%RDI,4) |
(17428) 0xc0a7b8 ADD (%RBX,%RDI,4),%R12D |
(17428) 0xc0a7bc ADD $0xc,%RSI |
(17428) 0xc0a7c0 CMP %RSI,%RDX |
(17428) 0xc0a7c3 JNE c0a7b0 |
(17422) 0xc0a7c5 CMPB $0,-0x4c(%RBP) |
(17422) 0xc0a7c9 MOV %R15,-0x80(%RBP) |
(17422) 0xc0a7cd JE c0a970 |
(17422) 0xc0a7d3 MOV -0x48(%RBP),%RAX |
(17422) 0xc0a7d7 LEA (%RAX,%R15,1),%RCX |
(17422) 0xc0a7db ADD $0x8,%RCX |
(17422) 0xc0a7df MOV %RCX,-0x30(%RBP) |
(17422) 0xc0a7e3 MOVSXD 0x8(%RAX,%R15,1),%RAX |
(17422) 0xc0a7e8 MOV (%RBX,%RAX,4),%R14D |
(17422) 0xc0a7ec LEA (%R14,%R12,1),%EAX |
(17422) 0xc0a7f0 CLTQ |
(17422) 0xc0a7f2 CMP %RAX,%R13 |
(17422) 0xc0a7f5 MOV -0x60(%RBP),%ECX |
(17422) 0xc0a7f8 JNE c0aeab |
(17422) 0xc0a7fe MOV -0x38(%RBP),%RAX |
(17422) 0xc0a802 CMP 0x778(%RAX),%R12D |
(17422) 0xc0a809 JLE c0a897 |
(17422) 0xc0a80f MOV %R12D,%EDI |
(17422) 0xc0a812 CALL fa6070 <@plt_start@+0x2bc0> |
(17422) 0xc0a817 MOV -0x38(%RBP),%R14 |
(17422) 0xc0a81b MOV %EAX,0x778(%R14) |
(17422) 0xc0a822 MOVSXD %EAX,%R8 |
(17422) 0xc0a825 MOV 0x768(%R14),%RCX |
(17422) 0xc0a82c MOV $0xc,%R9D |
(17422) 0xc0a832 LEA -0x8b0e1c(%RIP),%RDI |
(17422) 0xc0a839 MOV %R15,%R12 |
(17422) 0xc0a83c LEA -0x9148a2(%RIP),%R15 |
(17422) 0xc0a843 MOV %R15,%RSI |
(17422) 0xc0a846 MOV $0x13d,%EDX |
(17422) 0xc0a84b CALL fa3cc0 <@plt_start@+0x810> |
(17422) 0xc0a850 MOV %RAX,0x768(%R14) |
(17422) 0xc0a857 MOVSXD 0x778(%R14),%R8 |
(17422) 0xc0a85e MOV 0x770(%R14),%RCX |
(17422) 0xc0a865 MOV $0x4,%R9D |
(17422) 0xc0a86b LEA -0x94b82d(%RIP),%RDI |
(17422) 0xc0a872 MOV %R15,%RSI |
(17422) 0xc0a875 MOV %R12,%R15 |
(17422) 0xc0a878 MOV $0x13e,%EDX |
(17422) 0xc0a87d CALL fa3cc0 <@plt_start@+0x810> |
(17422) 0xc0a882 MOV -0x60(%RBP),%ECX |
(17422) 0xc0a885 MOV %RAX,0x770(%R14) |
(17422) 0xc0a88c MOV -0x30(%RBP),%RAX |
(17422) 0xc0a890 MOVSXD (%RAX),%RAX |
(17422) 0xc0a893 MOV (%RBX,%RAX,4),%R14D |
(17422) 0xc0a897 TEST %ECX,%ECX |
(17422) 0xc0a899 JLE c0a960 |
(17422) 0xc0a89f MOV -0x48(%RBP),%R13 |
(17422) 0xc0a8a3 LEA (%R15,%R13,1),%RAX |
(17422) 0xc0a8a7 ADD $0x10,%RAX |
(17422) 0xc0a8ab MOV %RAX,-0x68(%RBP) |
(17422) 0xc0a8af MOV 0x10(%R13,%R15,1),%R13 |
(17422) 0xc0a8b4 MOV $0x8,%R15D |
(17422) 0xc0a8ba XOR %R12D,%R12D |
(17422) 0xc0a8bd JMP c0a91b |
0xc0a8bf NOP |
(17426) 0xc0a8c0 LEA (%R15,%R13,1),%R9 |
(17426) 0xc0a8c4 MOV -0x8(%R13,%R15,1),%ECX |
(17426) 0xc0a8c9 MOV -0x4(%R13,%R15,1),%EAX |
(17426) 0xc0a8ce MOV -0x68(%RBP),%R13 |
(17426) 0xc0a8d2 MOV -0x4(%R13),%R10D |
(17426) 0xc0a8d6 LEA -0x70(%RBP),%RDI |
(17426) 0xc0a8da MOV $0x4,%ESI |
(17426) 0xc0a8df MOV $0x4c00010d,%EDX |
(17426) 0xc0a8e4 MOV %R12D,%R8D |
(17426) 0xc0a8e7 LEA -0xb0(%RBP),%R11 |
(17426) 0xc0a8ee PUSH %R11 |
(17426) 0xc0a8f0 PUSH %R10 |
(17426) 0xc0a8f2 PUSH %R12 |
(17426) 0xc0a8f4 PUSH %RAX |
(17426) 0xc0a8f5 PUSH $0x4c00010d |
(17426) 0xc0a8fa PUSH $0x4 |
(17426) 0xc0a8fc CALL fa8ec0 <@plt_start@+0x5a10> |
(17426) 0xc0a901 ADD $0x30,%RSP |
(17426) 0xc0a905 MOV (%R13),%R13 |
(17426) 0xc0a909 ADD (%R13,%R15,1),%R14D |
(17426) 0xc0a90e INC %R12 |
(17426) 0xc0a911 ADD $0xc,%R15 |
(17426) 0xc0a915 CMP %R12,-0x40(%RBP) |
(17426) 0xc0a919 JE c0a960 |
(17426) 0xc0a91b MOVSXD -0x8(%R13,%R15,1),%R8 |
(17426) 0xc0a920 MOV (%RBX,%R8,4),%R9D |
(17426) 0xc0a924 MOV %R9D,-0x70(%RBP) |
(17426) 0xc0a928 MOV 0x3f4431(%RIP),%RAX |
(17426) 0xc0a92f MOV (%RAX),%RDI |
(17426) 0xc0a932 TEST %RDI,%RDI |
(17426) 0xc0a935 JE c0a8c0 |
(17426) 0xc0a937 MOV -0x58(%RBP),%RAX |
(17426) 0xc0a93b MOV (%RAX),%EDX |
(17426) 0xc0a93d MOV -0x30(%RBP),%RAX |
(17426) 0xc0a941 MOV (%RAX),%ECX |
(17426) 0xc0a943 LEA -0x9aed8a(%RIP),%RSI |
(17426) 0xc0a94a XOR %EAX,%EAX |
(17426) 0xc0a94c CALL fa3670 <@plt_start@+0x1c0> |
(17426) 0xc0a951 JMP c0a8c0 |
0xc0a956 NOPW %CS:(%RAX,%RAX,1) |
(17422) 0xc0a960 MOV -0x58(%RBP),%RDI |
(17422) 0xc0a964 MOV %R14D,%ESI |
(17422) 0xc0a967 CALL fb5340 <@plt_start@+0x11e90> |
(17422) 0xc0a96c MOV -0x80(%RBP),%R15 |
(17422) 0xc0a970 MOV -0xe8(%RBP),%RDX |
(17422) 0xc0a977 TEST %RDX,%RDX |
(17422) 0xc0a97a JLE c0aab0 |
(17422) 0xc0a980 MOV $-0x5555555555555555,%RAX |
(17422) 0xc0a98a MULX %RAX,%R8,%R8 |
(17422) 0xc0a98f SHR $0x3,%R8 |
(17422) 0xc0a993 MOV -0xe0(%RBP),%RAX |
(17422) 0xc0a99a MOV (%RAX),%RCX |
(17422) 0xc0a99d MOV -0x48(%RBP),%RDI |
(17422) 0xc0a9a1 LEA (%RDI,%R15,1),%RAX |
(17422) 0xc0a9a5 ADD $0x8,%RAX |
(17422) 0xc0a9a9 CMP $0x2,%R8 |
(17422) 0xc0a9ad MOV $0x1,%ESI |
(17422) 0xc0a9b2 CMOVL %RSI,%R8 |
(17422) 0xc0a9b6 CMPB $0,-0x4c(%RBP) |
(17422) 0xc0a9ba JE c0aaca |
(17422) 0xc0a9c0 LEA (%RDI,%R15,1),%RSI |
(17422) 0xc0a9c4 ADD $0xb0,%RSI |
(17422) 0xc0a9cb MOV -0xd8(%RBP),%RBX |
(17422) 0xc0a9d2 ADD $0x8,%RBX |
(17422) 0xc0a9d6 XOR %R15D,%R15D |
(17422) 0xc0a9d9 XOR %EDI,%EDI |
(17422) 0xc0a9db MOV -0x78(%RBP),%R12 |
(17422) 0xc0a9df MOV %R8,%RDX |
(17422) 0xc0a9e2 JMP c0aa42 |
0xc0a9e4 NOPW %CS:(%RAX,%RAX,1) |
(17425) 0xc0a9f0 MOVSXD %R15D,%R15 |
(17425) 0xc0a9f3 MOV (%RSI),%R8 |
(17425) 0xc0a9f6 LEA (%R15,%R15,2),%R9 |
(17425) 0xc0a9fa VMOVSS -0x8(%RBX),%XMM0 |
(17425) 0xc0a9ff VMOVSS %XMM0,(%R8,%R9,4) |
(17425) 0xc0aa05 VMOVSS -0x4(%RBX),%XMM0 |
(17425) 0xc0aa0a VMOVSS %XMM0,0x4(%R8,%R9,4) |
(17425) 0xc0aa11 VMOVSS (%RBX),%XMM0 |
(17425) 0xc0aa15 VMOVSS %XMM0,0x8(%R8,%R9,4) |
(17425) 0xc0aa1c VMOVSS (%R12,%RDI,4),%XMM0 |
(17425) 0xc0aa22 MOV 0xc0(%RAX),%R8 |
(17425) 0xc0aa29 VMOVSS %XMM0,(%R8,%R15,4) |
(17425) 0xc0aa2f INC %R15D |
(17425) 0xc0aa32 INC %RDI |
(17425) 0xc0aa35 ADD $0xc,%RBX |
(17425) 0xc0aa39 CMP %RDI,%RDX |
(17425) 0xc0aa3c JE c0ac00 |
(17425) 0xc0aa42 MOVSXD (%RCX,%RDI,4),%R8 |
(17425) 0xc0aa46 CMP (%RAX),%R8D |
(17425) 0xc0aa49 JE c0a9f0 |
(17425) 0xc0aa4b MOV 0x28(%RAX),%R9 |
(17425) 0xc0aa4f MOV -0x38(%RBP),%R14 |
(17425) 0xc0aa53 MOV 0x768(%R14),%R10 |
(17425) 0xc0aa5a MOVSXD (%R9,%R8,4),%R11 |
(17425) 0xc0aa5e LEA (%R11,%R11,2),%R13 |
(17425) 0xc0aa62 VMOVSS -0x8(%RBX),%XMM0 |
(17425) 0xc0aa67 VMOVSS %XMM0,(%R10,%R13,4) |
(17425) 0xc0aa6d VMOVSS -0x4(%RBX),%XMM0 |
(17425) 0xc0aa72 VMOVSS %XMM0,0x4(%R10,%R13,4) |
(17425) 0xc0aa79 VMOVSS (%RBX),%XMM0 |
(17425) 0xc0aa7d VMOVSS %XMM0,0x8(%R10,%R13,4) |
(17425) 0xc0aa84 VMOVSS (%R12,%RDI,4),%XMM0 |
(17425) 0xc0aa8a MOV 0x770(%R14),%R10 |
(17425) 0xc0aa91 VMOVSS %XMM0,(%R10,%R11,4) |
(17425) 0xc0aa97 LEA 0x1(%R11),%R10D |
(17425) 0xc0aa9b MOV %R10D,(%R9,%R8,4) |
(17425) 0xc0aa9f JMP c0aa32 |
0xc0aaa1 NOPW %CS:(%RAX,%RAX,1) |
(17422) 0xc0aab0 XOR %R15D,%R15D |
(17422) 0xc0aab3 CMPL $0,-0x60(%RBP) |
(17422) 0xc0aab7 MOV -0x48(%RBP),%RAX |
(17422) 0xc0aabb MOV -0x80(%RBP),%RCX |
(17422) 0xc0aabf JG c0ac12 |
(17422) 0xc0aac5 JMP c0a4d0 |
(17422) 0xc0aaca CMP $0x18,%RDX |
(17422) 0xc0aace MOV -0x78(%RBP),%RBX |
(17422) 0xc0aad2 JAE c0aae1 |
(17422) 0xc0aad4 XOR %R15D,%R15D |
(17422) 0xc0aad7 XOR %ESI,%ESI |
(17422) 0xc0aad9 MOV %R8,%RDX |
(17422) 0xc0aadc JMP c0abc8 |
(17422) 0xc0aae1 MOV %R8,%RDX |
(17422) 0xc0aae4 MOV %R8,%RDI |
(17422) 0xc0aae7 AND $-0x2,%RDI |
(17422) 0xc0aaeb XOR %R15D,%R15D |
(17422) 0xc0aaee XOR %ESI,%ESI |
(17422) 0xc0aaf0 JMP c0ab26 |
0xc0aaf2 NOPW %CS:(%RAX,%RAX,1) |
(17424) 0xc0ab00 VMOVSS 0x4(%RBX,%RSI,4),%XMM0 |
(17424) 0xc0ab06 MOVSXD %R15D,%R15 |
(17424) 0xc0ab09 MOV 0xc0(%RAX),%R8 |
(17424) 0xc0ab10 VMOVSS %XMM0,(%R8,%R15,4) |
(17424) 0xc0ab16 INC %R15D |
(17424) 0xc0ab19 ADD $0x2,%RSI |
(17424) 0xc0ab1d CMP %RSI,%RDI |
(17424) 0xc0ab20 JE c0abc8 |
(17424) 0xc0ab26 MOVSXD (%RCX,%RSI,4),%R8 |
(17424) 0xc0ab2a CMP (%RAX),%R8D |
(17424) 0xc0ab2d JNE c0ab60 |
(17424) 0xc0ab2f VMOVSS (%RBX,%RSI,4),%XMM0 |
(17424) 0xc0ab34 MOVSXD %R15D,%R15 |
(17424) 0xc0ab37 MOV 0xc0(%RAX),%R8 |
(17424) 0xc0ab3e VMOVSS %XMM0,(%R8,%R15,4) |
(17424) 0xc0ab44 INC %R15D |
(17424) 0xc0ab47 MOVSXD 0x4(%RCX,%RSI,4),%R8 |
(17424) 0xc0ab4c CMP (%RAX),%R8D |
(17424) 0xc0ab4f JE c0ab00 |
(17424) 0xc0ab51 JMP c0ab94 |
0xc0ab53 NOPW %CS:(%RAX,%RAX,1) |
(17424) 0xc0ab60 MOV 0x28(%RAX),%R9 |
(17424) 0xc0ab64 VMOVSS (%RBX,%RSI,4),%XMM0 |
(17424) 0xc0ab69 MOV -0x38(%RBP),%R10 |
(17424) 0xc0ab6d MOV 0x770(%R10),%R10 |
(17424) 0xc0ab74 MOVSXD (%R9,%R8,4),%R11 |
(17424) 0xc0ab78 VMOVSS %XMM0,(%R10,%R11,4) |
(17424) 0xc0ab7e LEA 0x1(%R11),%R10D |
(17424) 0xc0ab82 MOV %R10D,(%R9,%R8,4) |
(17424) 0xc0ab86 MOVSXD 0x4(%RCX,%RSI,4),%R8 |
(17424) 0xc0ab8b CMP (%RAX),%R8D |
(17424) 0xc0ab8e JE c0ab00 |
(17424) 0xc0ab94 MOV 0x28(%RAX),%R9 |
(17424) 0xc0ab98 VMOVSS 0x4(%RBX,%RSI,4),%XMM0 |
(17424) 0xc0ab9e MOV -0x38(%RBP),%R10 |
(17424) 0xc0aba2 MOV 0x770(%R10),%R10 |
(17424) 0xc0aba9 MOVSXD (%R9,%R8,4),%R11 |
(17424) 0xc0abad VMOVSS %XMM0,(%R10,%R11,4) |
(17424) 0xc0abb3 LEA 0x1(%R11),%R10D |
(17424) 0xc0abb7 MOV %R10D,(%R9,%R8,4) |
(17424) 0xc0abbb ADD $0x2,%RSI |
(17424) 0xc0abbf CMP %RSI,%RDI |
(17424) 0xc0abc2 JNE c0ab26 |
(17422) 0xc0abc8 TEST $0x1,%DL |
(17422) 0xc0abcb JE c0ac00 |
(17422) 0xc0abcd MOVSXD (%RCX,%RSI,4),%RCX |
(17422) 0xc0abd1 CMP (%RAX),%ECX |
(17422) 0xc0abd3 JNE c0ae5f |
(17422) 0xc0abd9 VMOVSS (%RBX,%RSI,4),%XMM0 |
(17422) 0xc0abde MOVSXD %R15D,%R15 |
(17422) 0xc0abe1 MOV 0xc0(%RAX),%RAX |
(17422) 0xc0abe8 VMOVSS %XMM0,(%RAX,%R15,4) |
(17422) 0xc0abee INC %R15D |
(17422) 0xc0abf1 NOPW %CS:(%RAX,%RAX,1) |
(17422) 0xc0ac00 CMPL $0,-0x60(%RBP) |
(17422) 0xc0ac04 MOV -0x48(%RBP),%RAX |
(17422) 0xc0ac08 MOV -0x80(%RBP),%RCX |
(17422) 0xc0ac0c JLE c0a4d0 |
(17422) 0xc0ac12 MOV %R15,%R8 |
(17422) 0xc0ac15 LEA (%RAX,%RCX,1),%R10 |
(17422) 0xc0ac19 ADD $0x60,%R10 |
(17422) 0xc0ac1d MOV 0x10(%RAX,%RCX,1),%RDX |
(17422) 0xc0ac22 MOV -0x40(%RBP),%RAX |
(17422) 0xc0ac26 SAL $0x2,%RAX |
(17422) 0xc0ac2a LEA (%RAX,%RAX,2),%RSI |
(17422) 0xc0ac2e XOR %R14D,%R14D |
(17422) 0xc0ac31 XOR %EBX,%EBX |
(17422) 0xc0ac33 XOR %EDI,%EDI |
(17422) 0xc0ac35 MOV %R10,-0x30(%RBP) |
(17422) 0xc0ac39 MOV %RSI,-0x48(%RBP) |
(17422) 0xc0ac3d JMP c0aca3 |
0xc0ac3f NOP |
(17423) 0xc0ac40 MOV -0x30(%RBP),%RDX |
(17423) 0xc0ac44 MOV -0x54(%RDX),%R10D |
(17423) 0xc0ac48 MOV %R13,%RDI |
(17423) 0xc0ac4b MOV $0x4c00010d,%EDX |
(17423) 0xc0ac50 MOV %R14D,%R8D |
(17423) 0xc0ac53 MOV %R12,%R9 |
(17423) 0xc0ac56 LEA -0xb0(%RBP),%R11 |
(17423) 0xc0ac5d PUSH %R11 |
(17423) 0xc0ac5f PUSH %R10 |
(17423) 0xc0ac61 PUSH %R14 |
(17423) 0xc0ac63 PUSH %RAX |
(17423) 0xc0ac64 PUSH $0x4c00010d |
(17423) 0xc0ac69 PUSH %R15 |
(17423) 0xc0ac6b CALL fa8ec0 <@plt_start@+0x5a10> |
(17423) 0xc0ac70 MOV -0x40(%RBP),%R11 |
(17423) 0xc0ac74 MOV -0x30(%RBP),%R10 |
(17423) 0xc0ac78 ADD $0x30,%RSP |
(17423) 0xc0ac7c MOV -0x58(%RBP),%EDI |
(17423) 0xc0ac7f ADD %R11D,%EDI |
(17423) 0xc0ac82 MOV -0x50(%R10),%RDX |
(17423) 0xc0ac86 MOV -0x68(%RBP),%R8 |
(17423) 0xc0ac8a ADD 0x8(%RDX,%RBX,1),%R8D |
(17423) 0xc0ac8f MOV -0x48(%RBP),%RSI |
(17423) 0xc0ac93 ADD $0xc,%RBX |
(17423) 0xc0ac97 INC %R14D |
(17423) 0xc0ac9a CMP %RBX,%RSI |
(17423) 0xc0ac9d JE c0a4d0 |
(17423) 0xc0aca3 MOV (%R10),%RAX |
(17423) 0xc0aca6 MOV (%RAX),%RAX |
(17423) 0xc0aca9 MOVSXD (%RDX,%RBX,1),%RCX |
(17423) 0xc0acad MOV (%RAX,%RCX,4),%R11D |
(17423) 0xc0acb1 MOV 0x8(%RDX,%RBX,1),%R15D |
(17423) 0xc0acb6 TEST %R11D,%R11D |
(17423) 0xc0acb9 JG c0acc0 |
(17423) 0xc0acbb TEST %R15D,%R15D |
(17423) 0xc0acbe JLE c0ac93 |
(17423) 0xc0acc0 CMPB $0,-0x4c(%RBP) |
(17423) 0xc0acc4 MOV %R11,-0x40(%RBP) |
(17423) 0xc0acc8 MOV %R8,-0x68(%RBP) |
(17423) 0xc0accc MOV %EDI,-0x58(%RBP) |
(17423) 0xc0accf MOVSXD %EDI,%R13 |
(17423) 0xc0acd2 JE c0ad60 |
(17423) 0xc0acd8 LEA (,%R13,2),%RDI |
(17423) 0xc0ace0 ADD %R13,%RDI |
(17423) 0xc0ace3 SAL $0x2,%RDI |
(17423) 0xc0ace7 MOV -0x38(%RBP),%RAX |
(17423) 0xc0aceb ADD 0x768(%RAX),%RDI |
(17423) 0xc0acf2 LEA (,%R11,4),%EAX |
(17423) 0xc0acfa LEA (%RAX,%RAX,2),%ESI |
(17423) 0xc0acfd MOVSXD %R8D,%R12 |
(17423) 0xc0ad00 LEA (%R12,%R12,2),%R9 |
(17423) 0xc0ad04 SAL $0x2,%R9 |
(17423) 0xc0ad08 ADD 0x50(%R10),%R9 |
(17423) 0xc0ad0c LEA (,%R15,4),%EAX |
(17423) 0xc0ad14 LEA (%RAX,%RAX,2),%EAX |
(17423) 0xc0ad17 MOV 0x4(%RDX,%RBX,1),%R8D |
(17423) 0xc0ad1c TEST %ESI,%ESI |
(17423) 0xc0ad1e JLE c0ad65 |
(17423) 0xc0ad20 TEST %EAX,%EAX |
(17423) 0xc0ad22 JLE c0ad65 |
(17423) 0xc0ad24 MOV -0x54(%R10),%EDX |
(17423) 0xc0ad28 MOV %RDX,-0x60(%RBP) |
(17423) 0xc0ad2c MOV $0x4c00010d,%EDX |
(17423) 0xc0ad31 MOV %R8,%R11 |
(17423) 0xc0ad34 MOV %R14D,%R8D |
(17423) 0xc0ad37 LEA -0xb0(%RBP),%R10 |
(17423) 0xc0ad3e PUSH %R10 |
(17423) 0xc0ad40 PUSHQ -0x60(%RBP) |
(17423) 0xc0ad43 PUSH %R14 |
(17423) 0xc0ad45 PUSH %R11 |
(17423) 0xc0ad47 PUSH $0x4c00010d |
(17423) 0xc0ad4c PUSH %RAX |
(17423) 0xc0ad4d CALL fa8ec0 <@plt_start@+0x5a10> |
(17423) 0xc0ad52 MOV -0x40(%RBP),%R11 |
(17423) 0xc0ad56 MOV -0x30(%RBP),%R10 |
(17423) 0xc0ad5a ADD $0x30,%RSP |
(17423) 0xc0ad5e JMP c0adc0 |
(17423) 0xc0ad60 MOVSXD %R8D,%R12 |
(17423) 0xc0ad63 JMP c0adc7 |
(17423) 0xc0ad65 TEST %ESI,%ESI |
(17423) 0xc0ad67 JLE c0ad84 |
(17423) 0xc0ad69 MOV -0x54(%R10),%R9D |
(17423) 0xc0ad6d MOV $0x4c00010d,%EDX |
(17423) 0xc0ad72 MOV %R14D,%R8D |
(17423) 0xc0ad75 CALL fa8410 <@plt_start@+0x4f60> |
(17423) 0xc0ad7a MOV -0x40(%RBP),%R11 |
(17423) 0xc0ad7e MOV -0x30(%RBP),%R10 |
(17423) 0xc0ad82 JMP c0adc0 |
(17423) 0xc0ad84 TEST %EAX,%EAX |
(17423) 0xc0ad86 JLE c0adc0 |
(17423) 0xc0ad88 MOV -0x54(%R10),%R11D |
(17423) 0xc0ad8c SUB $0x8,%RSP |
(17423) 0xc0ad90 MOV %R9,%RDI |
(17423) 0xc0ad93 MOV %EAX,%ESI |
(17423) 0xc0ad95 MOV $0x4c00010d,%EDX |
(17423) 0xc0ad9a MOV %R8D,%ECX |
(17423) 0xc0ad9d MOV %R14D,%R8D |
(17423) 0xc0ada0 MOV %R11D,%R9D |
(17423) 0xc0ada3 LEA -0xb0(%RBP),%RAX |
(17423) 0xc0adaa PUSH %RAX |
(17423) 0xc0adab CALL fa8400 <@plt_start@+0x4f50> |
(17423) 0xc0adb0 MOV -0x40(%RBP),%R11 |
(17423) 0xc0adb4 MOV -0x30(%RBP),%R10 |
(17423) 0xc0adb8 ADD $0x10,%RSP |
(17423) 0xc0adbc NOPL (%RAX) |
(17423) 0xc0adc0 MOV -0x50(%R10),%RDX |
(17423) 0xc0adc4 MOV (%RDX,%RBX,1),%ECX |
(17423) 0xc0adc7 SAL $0x2,%R13 |
(17423) 0xc0adcb MOV -0x38(%RBP),%RAX |
(17423) 0xc0adcf ADD 0x770(%RAX),%R13 |
(17423) 0xc0add6 LEA (,%R11,4),%ESI |
(17423) 0xc0adde SAL $0x2,%R12 |
(17423) 0xc0ade2 ADD 0x68(%R10),%R12 |
(17423) 0xc0ade6 SAL $0x2,%R15D |
(17423) 0xc0adea MOV 0x4(%RDX,%RBX,1),%EAX |
(17423) 0xc0adee TEST %ESI,%ESI |
(17423) 0xc0adf0 JLE c0adfb |
(17423) 0xc0adf2 TEST %R15D,%R15D |
(17423) 0xc0adf5 JG c0ac40 |
(17423) 0xc0adfb TEST %ESI,%ESI |
(17423) 0xc0adfd JLE c0ae20 |
(17423) 0xc0adff MOV -0x54(%R10),%R9D |
(17423) 0xc0ae03 MOV %R13,%RDI |
(17423) 0xc0ae06 MOV $0x4c00010d,%EDX |
(17423) 0xc0ae0b MOV %R14D,%R8D |
(17423) 0xc0ae0e CALL fa8410 <@plt_start@+0x4f60> |
(17423) 0xc0ae13 MOV -0x40(%RBP),%R11 |
(17423) 0xc0ae17 MOV -0x30(%RBP),%R10 |
(17423) 0xc0ae1b JMP c0ac7c |
(17423) 0xc0ae20 TEST %R15D,%R15D |
(17423) 0xc0ae23 JLE c0ac7c |
(17423) 0xc0ae29 MOV -0x54(%R10),%R9D |
(17423) 0xc0ae2d SUB $0x8,%RSP |
(17423) 0xc0ae31 MOV %R12,%RDI |
(17423) 0xc0ae34 MOV %R15D,%ESI |
(17423) 0xc0ae37 MOV $0x4c00010d,%EDX |
(17423) 0xc0ae3c MOV %EAX,%ECX |
(17423) 0xc0ae3e MOV %R14D,%R8D |
(17423) 0xc0ae41 LEA -0xb0(%RBP),%RAX |
(17423) 0xc0ae48 PUSH %RAX |
(17423) 0xc0ae49 CALL fa8400 <@plt_start@+0x4f50> |
(17423) 0xc0ae4e MOV -0x40(%RBP),%R11 |
(17423) 0xc0ae52 MOV -0x30(%RBP),%R10 |
(17423) 0xc0ae56 ADD $0x10,%RSP |
(17423) 0xc0ae5a JMP c0ac7c |
(17422) 0xc0ae5f MOV 0x28(%RAX),%RAX |
(17422) 0xc0ae63 VMOVSS (%RBX,%RSI,4),%XMM0 |
(17422) 0xc0ae68 MOV -0x38(%RBP),%RDX |
(17422) 0xc0ae6c MOV 0x770(%RDX),%RDX |
(17422) 0xc0ae73 MOVSXD (%RAX,%RCX,4),%RSI |
(17422) 0xc0ae77 VMOVSS %XMM0,(%RDX,%RSI,4) |
(17422) 0xc0ae7c LEA 0x1(%RSI),%EDX |
(17422) 0xc0ae7f MOV %EDX,(%RAX,%RCX,4) |
(17422) 0xc0ae82 CMPL $0,-0x60(%RBP) |
(17422) 0xc0ae86 MOV -0x48(%RBP),%RAX |
(17422) 0xc0ae8a MOV -0x80(%RBP),%RCX |
(17422) 0xc0ae8e JG c0ac12 |
(17422) 0xc0ae94 JMP c0a4d0 |
0xc0ae99 ADD $0xd8,%RSP |
0xc0aea0 POP %RBX |
0xc0aea1 POP %R12 |
0xc0aea3 POP %R13 |
0xc0aea5 POP %R14 |
0xc0aea7 POP %R15 |
0xc0aea9 POP %RBP |
0xc0aeaa RET |
0xc0aeab LEA -0x914f11(%RIP),%RSI |
0xc0aeb2 LEA -0xb0(%RBP),%R14 |
0xc0aeb9 MOV %R14,%RDI |
0xc0aebc MOV $0x2,%EDX |
0xc0aec1 CALL fac910 <@plt_start@+0x9460> |
0xc0aec6 MOV -0x30(%RBP),%RAX |
0xc0aeca MOVSXD (%RAX),%RAX |
0xc0aecd MOVSXD (%RBX,%RAX,4),%RAX |
0xc0aed1 MOVSXD %R12D,%RCX |
0xc0aed4 ADD %RAX,%RCX |
0xc0aed7 SUB %RCX,%R13 |
0xc0aeda MOV -0x38(%RBP),%RAX |
0xc0aede MOV 0x4(%RAX),%R9D |
0xc0aee2 MOV -0x58(%RBP),%RAX |
0xc0aee6 MOV (%RAX),%R10D |
0xc0aee9 ADD $0x78,%R10D |
0xc0aeed SUB $0x8,%RSP |
0xc0aef1 LEA -0x8f1535(%RIP),%RCX |
0xc0aef8 XOR %EDI,%EDI |
0xc0aefa MOV %R14,%RSI |
0xc0aefd MOV $0x131,%EDX |
0xc0af02 MOV %R13,%R8 |
0xc0af05 XOR %EAX,%EAX |
0xc0af07 PUSH %R10 |
0xc0af09 CALL fa3b70 <@plt_start@+0x6c0> |
0xc0af0e ADD $0x10,%RSP |
0xc0af12 MOV %RAX,%RBX |
0xc0af15 MOV -0x90(%RBP),%RSI |
0xc0af1c TEST %RSI,%RSI |
0xc0af1f JE c0af2d |
0xc0af21 LEA -0x90(%RBP),%RDI |
0xc0af28 CALL fa3900 <@plt_start@+0x450> |
0xc0af2d MOVQ $0,-0x90(%RBP) |
0xc0af38 MOV -0xb0(%RBP),%RDI |
0xc0af3f LEA -0xa0(%RBP),%RAX |
0xc0af46 CMP %RAX,%RDI |
0xc0af49 JE c0af50 |
0xc0af4b CALL fa3730 <@plt_start@+0x280> |
0xc0af50 MOV %RBX,%RDI |
0xc0af53 CALL fa3770 <@plt_start@+0x2c0> |
0xc0af58 NOPL (%RAX,%RAX,1) |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►100.00+ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1230 | libgromacs_mpi.so.9.0.0 |
○ | CpuPpLongRangeNonbondeds::calc[...] | force.cpp:261 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2073 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►100.00+ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1230 | libgromacs_mpi.so.9.0.0 |
○ | CpuPpLongRangeNonbondeds::calc[...] | force.cpp:261 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2073 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►76.80+ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1230 | libgromacs_mpi.so.9.0.0 |
○ | CpuPpLongRangeNonbondeds::calc[...] | force.cpp:261 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2073 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 | |
►12.96+ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1230 | libgromacs_mpi.so.9.0.0 |
○ | CpuPpLongRangeNonbondeds::calc[...] | force.cpp:261 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2073 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
►10.24+ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1230 | libgromacs_mpi.so.9.0.0 |
○ | CpuPpLongRangeNonbondeds::calc[...] | force.cpp:261 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2073 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►84.00+ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1230 | libgromacs_mpi.so.9.0.0 |
○ | CpuPpLongRangeNonbondeds::calc[...] | force.cpp:261 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2073 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 | |
►11.61+ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1230 | libgromacs_mpi.so.9.0.0 |
○ | CpuPpLongRangeNonbondeds::calc[...] | force.cpp:261 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2073 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
►4.39+ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1230 | libgromacs_mpi.so.9.0.0 |
○ | CpuPpLongRangeNonbondeds::calc[...] | force.cpp:261 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2073 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►55.03+ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1230 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pmeonly(gmx_pme_t**, t_com[...] | stl_vector.h:1169 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2330 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
►31.49+ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1230 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pmeonly(gmx_pme_t**, t_com[...] | stl_vector.h:1169 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2330 | libgromacs_mpi.so.9.0.0 |
►13.47+ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1230 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pmeonly(gmx_pme_t**, t_com[...] | stl_vector.h:1169 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2330 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►62.27+ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1230 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pmeonly(gmx_pme_t**, t_com[...] | stl_vector.h:1169 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2330 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 | |
►22.86+ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1230 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pmeonly(gmx_pme_t**, t_com[...] | stl_vector.h:1169 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2330 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
►14.45+ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1230 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pmeonly(gmx_pme_t**, t_com[...] | stl_vector.h:1169 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2330 | libgromacs_mpi.so.9.0.0 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►47.49+ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1230 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pmeonly(gmx_pme_t**, t_com[...] | stl_vector.h:1169 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2330 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
►33.92+ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1230 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pmeonly(gmx_pme_t**, t_com[...] | stl_vector.h:1169 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2330 | libgromacs_mpi.so.9.0.0 |
►18.50+ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1230 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pmeonly(gmx_pme_t**, t_com[...] | stl_vector.h:1169 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2330 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►100.00+ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1230 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pmeonly(gmx_pme_t**, t_com[...] | stl_vector.h:1169 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2330 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 |
Path / |
The code analyzed by CQA in that panel excludes loops and represents 0.00% of application time for run 1x1
Source file and lines | pme_redistribute.cpp:126-506 |
Module | libgromacs_mpi.so.9.0.0 |
nb instructions | 81 |
nb uops | 73 |
loop length | 384 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 11 |
micro-operation queue | 12.17 cycles |
front end | 12.17 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 6.50 | 6.50 | 6.50 | 6.50 | 5.00 | 7.67 | 7.67 | 7.67 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
cycles | 6.50 | 6.50 | 6.50 | 6.50 | 5.00 | 7.67 | 7.67 | 7.67 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 12.17 |
Dispatch | 7.67 |
Overall L1 | 12.17 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 10% |
load | 7% |
store | 10% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 11% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 9% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput | Vectorization |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
SUB $0xd8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
MOV %R8,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %RCX,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %EDX,-0x4c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOV %RSI,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %RDI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV (%RDI),%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (6.3%) |
TEST %ECX,%ECX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
JLE c0ae99 <_Z20do_redist_pos_coeffsP9gmx_pme_tPK9t_commrecbN3gmx8ArrayRefIKNS4_11BasicVectorIfEEEENS5_IKfEE+0xa19> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
ADD $0x5d0,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RAX,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
JMP c0a4e5 <_Z20do_redist_pos_coeffsP9gmx_pme_tPK9t_commrecbN3gmx8ArrayRefIKNS4_11BasicVectorIfEEEENS5_IKfEE+0x65> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
ADD $0xd8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
LEA -0x914f11(%RIP),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0xb0(%RBP),%R14 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
MOV $0x2,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
CALL fac910 <@plt_start@+0x9460> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOVSXD (%RAX),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
MOVSXD (%RBX,%RAX,4),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
MOVSXD %R12D,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
ADD %RAX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
SUB %RCX,%R13 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV 0x4(%RAX),%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (6.3%) |
MOV -0x58(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV (%RAX),%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (6.3%) |
ADD $0x78,%R10D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
LEA -0x8f1535(%RIP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | N/A |
MOV %R14,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV $0x131,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
MOV %R13,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | N/A |
PUSH %R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
CALL fa3b70 <@plt_start@+0x6c0> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
ADD $0x10,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
MOV -0x90(%RBP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
TEST %RSI,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JE c0af2d <_Z20do_redist_pos_coeffsP9gmx_pme_tPK9t_commrecbN3gmx8ArrayRefIKNS4_11BasicVectorIfEEEENS5_IKfEE+0xaad> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
LEA -0x90(%RBP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CALL fa3900 <@plt_start@+0x450> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
MOVQ $0,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOV -0xb0(%RBP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
LEA -0xa0(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CMP %RAX,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
JE c0af50 <_Z20do_redist_pos_coeffsP9gmx_pme_tPK9t_commrecbN3gmx8ArrayRefIKNS4_11BasicVectorIfEEEENS5_IKfEE+0xad0> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
CALL fa3730 <@plt_start@+0x280> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
CALL fa3770 <@plt_start@+0x2c0> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
The code analyzed by CQA in that panel excludes loops and represents 0.00% of application time for run 1x1
Source file and lines | pme_redistribute.cpp:126-506 |
Module | libgromacs_mpi.so.9.0.0 |
nb instructions | 81 |
nb uops | 73 |
loop length | 384 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 11 |
micro-operation queue | 12.17 cycles |
front end | 12.17 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 6.50 | 6.50 | 6.50 | 6.50 | 5.00 | 7.67 | 7.67 | 7.67 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
cycles | 6.50 | 6.50 | 6.50 | 6.50 | 5.00 | 7.67 | 7.67 | 7.67 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 12.17 |
Dispatch | 7.67 |
Overall L1 | 12.17 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 10% |
load | 7% |
store | 10% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 11% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 9% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput | Vectorization |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
SUB $0xd8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
MOV %R8,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %RCX,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %EDX,-0x4c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOV %RSI,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %RDI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV (%RDI),%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (6.3%) |
TEST %ECX,%ECX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
JLE c0ae99 <_Z20do_redist_pos_coeffsP9gmx_pme_tPK9t_commrecbN3gmx8ArrayRefIKNS4_11BasicVectorIfEEEENS5_IKfEE+0xa19> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
ADD $0x5d0,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RAX,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
JMP c0a4e5 <_Z20do_redist_pos_coeffsP9gmx_pme_tPK9t_commrecbN3gmx8ArrayRefIKNS4_11BasicVectorIfEEEENS5_IKfEE+0x65> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
ADD $0xd8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
LEA -0x914f11(%RIP),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA -0xb0(%RBP),%R14 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
MOV $0x2,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
CALL fac910 <@plt_start@+0x9460> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOVSXD (%RAX),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
MOVSXD (%RBX,%RAX,4),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
MOVSXD %R12D,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
ADD %RAX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
SUB %RCX,%R13 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV 0x4(%RAX),%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (6.3%) |
MOV -0x58(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV (%RAX),%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (6.3%) |
ADD $0x78,%R10D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
LEA -0x8f1535(%RIP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | N/A |
MOV %R14,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
MOV $0x131,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
MOV %R13,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (12.5%) |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | N/A |
PUSH %R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
CALL fa3b70 <@plt_start@+0x6c0> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
ADD $0x10,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
MOV -0x90(%RBP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
TEST %RSI,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
JE c0af2d <_Z20do_redist_pos_coeffsP9gmx_pme_tPK9t_commrecbN3gmx8ArrayRefIKNS4_11BasicVectorIfEEEENS5_IKfEE+0xaad> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
LEA -0x90(%RBP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CALL fa3900 <@plt_start@+0x450> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
MOVQ $0,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOV -0xb0(%RBP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
LEA -0xa0(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CMP %RAX,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
JE c0af50 <_Z20do_redist_pos_coeffsP9gmx_pme_tPK9t_commrecbN3gmx8ArrayRefIKNS4_11BasicVectorIfEEEENS5_IKfEE+0xad0> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
CALL fa3730 <@plt_start@+0x280> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
CALL fa3770 <@plt_start@+0x2c0> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
Run 1x1 | Number processes: 1Number processes per node: 1OMP_NUM_THREADS: 1 |
---|---|
Run 2x1 | Number processes: 2Number processes per node: 2OMP_NUM_THREADS: 1 |
Run 4x1 | Number processes: 4Number processes per node: 4OMP_NUM_THREADS: 1 |
Run 8x1 | Number processes: 8Number processes per node: 8OMP_NUM_THREADS: 1 |
Run 16x1 | Number processes: 16Number processes per node: 16OMP_NUM_THREADS: 1 |
Run 32x1 | Number processes: 32Number processes per node: 32OMP_NUM_THREADS: 1 |
Run 64x1 | Number processes: 64Number processes per node: 64OMP_NUM_THREADS: 1 |
Run 128x1 | Number processes: 128Number processes per node: 128OMP_NUM_THREADS: 1 |
Run 192x1 | Number processes: 192Number nodes: 1Number processes per node: 192Run Command: <executable> mdrun -s ion_channel.tpr -nsteps 10000 -pin on -deffnm aoccMPI Command: mpirun -genv I_MPI_FABRICS=shm -n <number_processes>Dataset: Run Directory: .OMP_NUM_THREADS: 1 |
(1x1) Efficiency | (1x1) Potential Speed-Up (%) | (2x1) Efficiency | (2x1) Potential Speed-Up (%) | (4x1) Efficiency | (4x1) Potential Speed-Up (%) | (8x1) Efficiency | (8x1) Potential Speed-Up (%) | (16x1) Efficiency | (16x1) Potential Speed-Up (%) | (32x1) Efficiency | (32x1) Potential Speed-Up (%) | (64x1) Efficiency | (64x1) Potential Speed-Up (%) | (128x1) Efficiency | (128x1) Potential Speed-Up (%) | (192x1) Efficiency | (192x1) Potential Speed-Up (%) |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
1 | 0 | 1 | 0 | 1 | 0 | 1 | 0 | 1 | 0 | 1 | 0 | 1 | 0 | 1 | 0 |
Run | Number of threads | Efficiency (ideal is 1) | Speedup | Ideal Speedup | Time (s) | Coverage (%) |
---|---|---|---|---|---|---|
1x1 | ||||||
2x1 | 2 | 1 | 1 | 2 | 1.2849998474121 | 0.22558608651161 |
4x1 | 4 | 1 | 1 | 4 | 0.72500002384186 | 0.2600664794445 |
8x1 | 8 | 1 | 1 | 8 | 0.53499984741211 | 0.25256049633026 |
16x1 | 16 | 1 | 1 | 16 | 0.32499995827675 | 0.29414308071136 |
32x1 | 12 | 1 | 1 | 32 | 0.38999995589256 | 0.18749701976776 |
64x1 | 24 | 1 | 1 | 64 | 0.26499995589256 | 0.14063760638237 |
128x1 | 44 | 1 | 1 | 128 | 0.20499996840954 | 0.26462775468826 |
192x1 | 64 | 1 | 1 | 192 | 0.11999998241663 | 0.2068192511797 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼do_redist_pos_coeffs(gmx_pme_t*, t_commrec const*, bool, gmx::ArrayRef | 0.21 | 0.03 |
▼Loop 17422 - pme_redistribute.cpp:126-501 - libgromacs_mpi.so.9.0.0– | 0.00 | 0.01 |
○Loop 17425 - pme_redistribute.cpp:345-367 - libgromacs_mpi.so.9.0.0 | 0.20 | 0.08 |
○Loop 17423 - pme_redistribute.cpp:265-398 - libgromacs_mpi.so.9.0.0 | 0.00 | 0.01 |
○Loop 17426 - pme_redistribute.cpp:252-338 - libgromacs_mpi.so.9.0.0 | 0.00 | 0.01 |
○Loop 17424 - pme_redistribute.cpp:345-367 - libgromacs_mpi.so.9.0.0 | 0.00 | 0.00 |
○Loop 17427 - pme_redistribute.cpp:294-298 - libgromacs_mpi.so.9.0.0 | 0.00 | 0.00 |
○Loop 17428 - pme_redistribute.cpp:294-298 - libgromacs_mpi.so.9.0.0 | 0.00 | 0.00 |
▼Loop 17429 - pme_redistribute.cpp:145-149 - libgromacs_mpi.so.9.0.0– | 0.00 | 0.00 |
○Loop 17430 - pme_redistribute.cpp:147-149 - libgromacs_mpi.so.9.0.0 | 0.00 | 0.00 |