Function: void gmx::nbnxmKernelSimd<(KernelLayout)1, (gmx::KernelCoulombType)1, (VdwCutoffCheck)0, ( ... | Module: libgromacs_mpi.so.9.0.0 | Source: simd_kernel.h:121-564 [...] | Coverage (incl. loops): 22.08% | (excl. loops): 0.00% |
---|
Function: void gmx::nbnxmKernelSimd<(KernelLayout)1, (gmx::KernelCoulombType)1, (VdwCutoffCheck)0, ( ... | Module: libgromacs_mpi.so.9.0.0 | Source: simd_kernel.h:121-564 [...] | Coverage (incl. loops): 22.08% | (excl. loops): 0.00% |
---|
/home/eoseret/gromacs-2024.2/src/gromacs/nbnxm/simd_load_store_functions.h: 93 - 109 |
-------------------------------------------------------------------------------- |
93: return loadU1DualHsimd(ptr + offset + iRegister * 2); |
[...] |
109: return loadDuplicateHsimd(ptr + offset); |
/home/eoseret/gromacs-2024.2/src/gromacs/nbnxm/simd_kernel_inner.h: 63 - 275 |
-------------------------------------------------------------------------------- |
63: const int cj = l_cj[cjind].cj; |
64: |
65: /* Atom indices (of the first atom in the cluster) */ |
66: const int gmx_unused aj = cj * c_jClusterSize; |
67: |
68: const int ajx = |
69: (c_jClusterSize == c_stride ? aj * DIM : (cj >> 1) * DIM * c_stride + (cj & 1) * c_jClusterSize); |
[...] |
225: aj2 = aj * 2; |
[...] |
275: const SimdReal sqrtEpsilonJ = loadJAtomData<kernelLayout>(ljc, aj2 + c_stride); |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/stl_vector.h: 1064 - 1064 |
-------------------------------------------------------------------------------- |
1064: return *(this->_M_impl._M_start + __n); |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/stl_iterator.h: 1028 - 1182 |
-------------------------------------------------------------------------------- |
1028: : _M_current(__i) { } |
[...] |
1054: ++_M_current; |
[...] |
1182: { return __lhs.base() != __rhs.base(); } |
/home/eoseret/gromacs-2024.2/src/gromacs/nbnxm/simd_diagonal_masker.h: 140 - 144 |
-------------------------------------------------------------------------------- |
140: if (jClusterIndex * 2 == iClusterIndex) |
141: { |
142: boolV = genBoolArr<nR>([&](int i) { return boolV[i] && diagonalMaskVV_[0][i]; }); |
143: } |
144: else if (jClusterIndex * 2 + 1 == iClusterIndex) |
/home/eoseret/gromacs-2024.2/src/gromacs/simd/include/gromacs/simd/impl_x86_avx_512/impl_x86_avx_512_util_float.h: 95 - 474 |
-------------------------------------------------------------------------------- |
95: _mm512_shuffle_f32x4(a.simdInternal_, a.simdInternal_, 0xEE)); |
96: t = _mm256_load_ps(m); |
97: t = _mm256_sub_ps(t, _mm512_castps512_ps256(a.simdInternal_)); |
98: _mm256_store_ps(m, t); |
[...] |
370: return { _mm512_castpd_ps(_mm512_broadcast_f64x4(_mm256_load_pd(reinterpret_cast<const double*>(m)))) }; |
371: } |
372: |
373: static inline SimdFloat gmx_simdcall loadU1DualHsimd(const float* m) |
374: { |
375: return { _mm512_shuffle_f32x4( |
[...] |
459: t0 = _mm512_shuffle_f32x4(v0.simdInternal_, v1.simdInternal_, 0x88); |
460: t1 = _mm512_shuffle_f32x4(v0.simdInternal_, v1.simdInternal_, 0xDD); |
461: t0 = _mm512_add_ps(t0, t1); |
462: t0 = _mm512_add_ps(t0, _mm512_permute_ps(t0, 0x4E)); |
463: t0 = _mm512_add_ps(t0, _mm512_permute_ps(t0, 0xB1)); |
464: t0 = _mm512_maskz_compress_ps(avx512Int2Mask(0x1111), t0); |
465: |
466: t3 = _mm512_castps512_ps128(t0); |
467: t2 = _mm_load_ps(m); |
468: t2 = _mm_add_ps(t2, t3); |
469: _mm_store_ps(m, t2); |
470: |
471: t3 = _mm_add_ps(t3, _mm_permute_ps(t3, 0x4E)); |
472: t3 = _mm_add_ps(t3, _mm_permute_ps(t3, 0xB1)); |
473: |
474: return _mm_cvtss_f32(t3); |
/home/eoseret/gromacs-2024.2/src/gromacs/simd/include/gromacs/simd/impl_x86_avx_512/impl_x86_avx_512_simd_float.h: 70 - 461 |
-------------------------------------------------------------------------------- |
70: SimdFInt32(std::int32_t i) : simdInternal_(_mm512_set1_epi32(i)) {} |
[...] |
181: return { _mm512_add_ps(a.simdInternal_, b.simdInternal_) }; |
182: } |
183: |
184: static inline SimdFloat gmx_simdcall operator-(SimdFloat a, SimdFloat b) |
185: { |
186: return { _mm512_sub_ps(a.simdInternal_, b.simdInternal_) }; |
[...] |
197: return { _mm512_mul_ps(a.simdInternal_, b.simdInternal_) }; |
198: } |
199: |
200: static inline SimdFloat gmx_simdcall fma(SimdFloat a, SimdFloat b, SimdFloat c) |
201: { |
202: return { _mm512_fmadd_ps(a.simdInternal_, b.simdInternal_, c.simdInternal_) }; |
[...] |
212: return { _mm512_fnmadd_ps(a.simdInternal_, b.simdInternal_, c.simdInternal_) }; |
[...] |
224: return { _mm512_rsqrt14_ps(x.simdInternal_) }; |
225: } |
226: |
227: static inline SimdFloat gmx_simdcall rcp(SimdFloat x) |
228: { |
229: return { _mm512_rcp14_ps(x.simdInternal_) }; |
[...] |
269: return { _mm512_max_ps(a.simdInternal_, b.simdInternal_) }; |
[...] |
367: return { _mm512_cmp_ps_mask(a.simdInternal_, b.simdInternal_, _CMP_LT_OQ) }; |
[...] |
383: return { _mm512_kand(a.simdInternal_, b.simdInternal_) }; |
[...] |
398: return { _mm512_mask_mov_ps(_mm512_setzero_ps(), m.simdInternal_, a.simdInternal_) }; |
[...] |
461: return { _mm512_test_epi32_mask(a.simdInternal_, a.simdInternal_) }; |
/home/eoseret/gromacs-2024.2/src/gromacs/nbnxm/simd_kernel.h: 121 - 564 |
-------------------------------------------------------------------------------- |
121: { |
[...] |
273: for (const nbnxn_ci_t& ciEntry : nbl->ci) |
274: { |
275: const int ish = (ciEntry.shift & NBNXN_CI_SHIFT); |
276: const int ish3 = ish * 3; |
277: const int cjind0 = ciEntry.cj_ind_start; |
278: const int cjind1 = ciEntry.cj_ind_end; |
279: const int ci = ciEntry.ci; |
280: const int ci_sh = (ish == c_centralShiftIndex ? ci : -1); |
[...] |
298: sci = (ci >> 1) * c_stride; |
299: scix = sci * DIM + (ci & 1) * (c_stride >> 1); |
[...] |
311: const bool do_coul = ((ciEntry.shift & NBNXN_CI_DO_COUL(0)) != 0); |
312: const bool half_LJ = (((ciEntry.shift & NBNXN_CI_HALF_LJ(0)) != 0) || !do_LJ) && do_coul; |
[...] |
388: if (do_coul) |
[...] |
461: if (half_LJ) |
[...] |
468: while (cjind < cjind1 && nbl->cj.excl(cjind) != NBNXN_INTERACTION_MASK_ALL) |
[...] |
476: for (; (cjind < cjind1); cjind++) |
[...] |
482: else if (do_coul) |
[...] |
489: while (cjind < cjind1 && nbl->cj.excl(cjind) != NBNXN_INTERACTION_MASK_ALL) |
[...] |
497: for (; (cjind < cjind1); cjind++) |
[...] |
510: while (cjind < cjind1 && nbl->cj.excl(cjind) != NBNXN_INTERACTION_MASK_ALL) |
511: { |
512: #include "simd_kernel_inner.h" |
513: cjind++; |
514: } |
515: } |
516: { |
517: constexpr bool c_needToCheckExclusions = false; |
518: for (; (cjind < cjind1); cjind++) |
[...] |
543: fshift[ish3 + 0] += fShiftX; |
544: fshift[ish3 + 1] += fShiftY; |
545: fshift[ish3 + 2] += fShiftZ; |
[...] |
564: } |
0x52b3b0 PUSH %RBP |
0x52b3b1 MOV %RSP,%RBP |
0x52b3b4 PUSH %R15 |
0x52b3b6 PUSH %R14 |
0x52b3b8 PUSH %R13 |
0x52b3ba PUSH %R12 |
0x52b3bc PUSH %RBX |
0x52b3bd AND $-0x40,%RSP |
0x52b3c1 SUB $0x580,%RSP |
0x52b3c8 MOV %RCX,0x48(%RSP) |
0x52b3cd MOV %RDI,%RBX |
0x52b3d0 MOV 0x50(%RDI),%RDI |
0x52b3d4 MOV 0x58(%RBX),%RAX |
0x52b3d8 MOV %RAX,0x40(%RSP) |
0x52b3dd CMP %RAX,%RDI |
0x52b3e0 JE 52d151 |
0x52b3e6 MOV 0x8(%R8),%R10 |
0x52b3ea MOV 0x28(%R8),%RAX |
0x52b3ee MOV %RAX,0x38(%RSP) |
0x52b3f3 MOV 0x90(%RSI),%R11 |
0x52b3fa MOV 0xb0(%RSI),%RAX |
0x52b401 MOV %RAX,0x20(%RSP) |
0x52b406 MOV 0x168(%RSI),%RAX |
0x52b40d VMOVAPS (%RAX),%ZMM0 |
0x52b413 VXORPS %XMM2,%XMM2,%XMM2 |
0x52b417 VCMPPS $0x1,%ZMM0,%ZMM2,%K0 |
0x52b41e VBROADCASTSS -0x1cf300(%RIP),%ZMM1 |
0x52b428 VADDPS %ZMM1,%ZMM0,%ZMM0 |
0x52b42e VCMPPS $0x1,%ZMM0,%ZMM2,%K1 |
0x52b435 VADDPS %ZMM1,%ZMM0,%ZMM0 |
0x52b43b VCMPPS $0x1,%ZMM0,%ZMM2,%K2 |
0x52b442 VADDPS %ZMM1,%ZMM0,%ZMM0 |
0x52b448 MOV 0x180(%RSI),%RAX |
0x52b44f VMOVAPS (%RAX),%ZMM1 |
0x52b455 VMOVAPS %ZMM1,0x340(%RSP) |
0x52b45d VCMPPS $0x1,%ZMM0,%ZMM2,%K3 |
0x52b464 VMOVAPS 0x40(%RAX),%ZMM0 |
0x52b46b VMOVAPS %ZMM0,0x300(%RSP) |
0x52b473 VBROADCASTSS 0x54(%RDX),%ZMM18 |
0x52b47a VMULSS %XMM18,%XMM18,%XMM0 |
0x52b480 VBROADCASTSS %XMM0,%ZMM0 |
0x52b486 VMOVAPS %ZMM0,0x180(%RSP) |
0x52b48e VMOVSS 0x4c(%RDX),%XMM0 |
0x52b493 VMULSS %XMM0,%XMM0,%XMM0 |
0x52b497 VBROADCASTSS %XMM0,%ZMM17 |
0x52b49d MOV 0x138(%RSI),%RSI |
0x52b4a4 MOV 0x80(%RBX),%R14 |
0x52b4ab VBROADCASTSS 0x6c(%RDX),%ZMM0 |
0x52b4b2 VMOVAPS %ZMM0,0x480(%RSP) |
0x52b4ba VMOVDDUP -0x1ce962(%RIP),%XMM0 |
0x52b4c2 VMOVAPS %XMM0,0x70(%RSP) |
0x52b4c8 VMOVAPS %ZMM18,0x440(%RSP) |
0x52b4d0 VMOVAPS %ZMM17,0x380(%RSP) |
0x52b4d8 MOV %RBX,0x30(%RSP) |
0x52b4dd JMP 52b63a |
0x52b4e2 NOPW %CS:(%RAX,%RAX,1) |
(834) 0x52b4f0 LEA (%R15,%R15,2),%RAX |
(834) 0x52b4f4 ADD $0x2,%RAX |
(834) 0x52b4f8 VSHUFF64X2 $-0x78,%ZMM22,%ZMM23,%ZMM0 |
(834) 0x52b4ff VSHUFF64X2 $-0x23,%ZMM22,%ZMM23,%ZMM1 |
(834) 0x52b506 VADDPS %ZMM1,%ZMM0,%ZMM0 |
(834) 0x52b50c VPERMILPD $0x55,%ZMM0,%ZMM1 |
(834) 0x52b513 VADDPS %ZMM1,%ZMM0,%ZMM0 |
(834) 0x52b519 VPERMILPS $-0x4f,%ZMM0,%ZMM1 |
(834) 0x52b520 VADDPS %ZMM1,%ZMM0,%ZMM0 |
(834) 0x52b526 MOV $0x1111,%CX |
(834) 0x52b52a KMOVD %ECX,%K4 |
(834) 0x52b52e VCOMPRESSPS %ZMM0,%ZMM0{%K4}{z} |
(834) 0x52b534 VADDPS (%R10,%R9,4),%XMM0,%XMM1 |
(834) 0x52b53a VMOVAPS %XMM1,(%R10,%R9,4) |
(834) 0x52b540 VPERMILPD $0x1,%XMM0,%XMM1 |
(834) 0x52b546 VSHUFF64X2 $-0x78,%ZMM21,%ZMM20,%ZMM2 |
(834) 0x52b54d VSHUFF64X2 $-0x23,%ZMM21,%ZMM20,%ZMM3 |
(834) 0x52b554 VADDPS %ZMM3,%ZMM2,%ZMM2 |
(834) 0x52b55a VPERMILPD $0x55,%ZMM2,%ZMM3 |
(834) 0x52b561 VADDPS %ZMM3,%ZMM2,%ZMM2 |
(834) 0x52b567 VPERMILPS $-0x4f,%ZMM2,%ZMM3 |
(834) 0x52b56e VADDPS %ZMM3,%ZMM2,%ZMM2 |
(834) 0x52b574 VCOMPRESSPS %ZMM2,%ZMM2{%K4}{z} |
(834) 0x52b57a MOV 0x50(%RSP),%RCX |
(834) 0x52b57f VADDPS (%R10,%RCX,4),%XMM2,%XMM3 |
(834) 0x52b585 VADDPS %XMM1,%XMM0,%XMM0 |
(834) 0x52b589 VMOVAPS %XMM3,(%R10,%RCX,4) |
(834) 0x52b58f VPERMILPD $0x1,%XMM2,%XMM1 |
(834) 0x52b595 VADDPS %XMM1,%XMM2,%XMM1 |
(834) 0x52b599 VSHUFF64X2 $-0x78,%ZMM19,%ZMM16,%ZMM2 |
(834) 0x52b5a0 VSHUFF64X2 $-0x23,%ZMM19,%ZMM16,%ZMM3 |
(834) 0x52b5a7 VADDPS %ZMM3,%ZMM2,%ZMM2 |
(834) 0x52b5ad VPERMILPD $0x55,%ZMM2,%ZMM3 |
(834) 0x52b5b4 VADDPS %ZMM3,%ZMM2,%ZMM2 |
(834) 0x52b5ba VPERMILPS $-0x4f,%ZMM2,%ZMM3 |
(834) 0x52b5c1 VADDPS %ZMM3,%ZMM2,%ZMM2 |
(834) 0x52b5c7 VCOMPRESSPS %ZMM2,%ZMM2{%K4}{z} |
(834) 0x52b5cd MOV 0x58(%RSP),%RCX |
(834) 0x52b5d2 VADDPS (%R10,%RCX,4),%XMM2,%XMM3 |
(834) 0x52b5d8 VMOVAPS %XMM3,(%R10,%RCX,4) |
(834) 0x52b5de VPERMILPD $0x1,%XMM2,%XMM3 |
(834) 0x52b5e4 VADDPS %XMM3,%XMM2,%XMM2 |
(834) 0x52b5e8 VMOVSHDUP %XMM2,%XMM3 |
(834) 0x52b5ec VADDSS %XMM3,%XMM2,%XMM2 |
(834) 0x52b5f0 MOV 0x38(%RSP),%RCX |
(834) 0x52b5f5 MOV 0x60(%RSP),%RDX |
(834) 0x52b5fa VMOVSD (%RCX,%RDX,4),%XMM3 |
(834) 0x52b5ff VUNPCKLPS %XMM1,%XMM0,%XMM4 |
(834) 0x52b603 VMOVAPS 0x70(%RSP),%XMM5 |
(834) 0x52b609 VPERMT2PS %XMM1,%XMM5,%XMM0 |
(834) 0x52b60f VADDPS %XMM0,%XMM4,%XMM0 |
(834) 0x52b613 VADDPS %XMM3,%XMM0,%XMM0 |
(834) 0x52b617 VMOVLPS %XMM0,(%RCX,%RDX,4) |
(834) 0x52b61c VADDSS (%RCX,%RAX,4),%XMM2,%XMM0 |
(834) 0x52b621 VMOVSS %XMM0,(%RCX,%RAX,4) |
(834) 0x52b626 MOV 0x68(%RSP),%RDI |
(834) 0x52b62b ADD $0x10,%RDI |
(834) 0x52b62f CMP 0x40(%RSP),%RDI |
(834) 0x52b634 JE 52d151 |
(834) 0x52b63a MOV (%RDI),%ECX |
(834) 0x52b63c MOV 0x4(%RDI),%EDX |
(834) 0x52b63f MOV %EDX,%EAX |
(834) 0x52b641 AND $0x7f,%EAX |
(834) 0x52b644 CMP $0x16,%EAX |
(834) 0x52b647 MOV $-0x1,%R8D |
(834) 0x52b64d CMOVE %ECX,%R8D |
(834) 0x52b651 MOV %R8D,0x2c(%RSP) |
(834) 0x52b656 SAL $0x2,%ECX |
(834) 0x52b659 MOV %ECX,%R9D |
(834) 0x52b65c AND $-0x8,%R9D |
(834) 0x52b660 LEA (%R9,%R9,2),%R12D |
(834) 0x52b664 MOV %RDI,%RBX |
(834) 0x52b667 MOV %ECX,%EDI |
(834) 0x52b669 AND $0x4,%EDI |
(834) 0x52b66c OR %EDI,%R12D |
(834) 0x52b66f MOV %EDX,%R8D |
(834) 0x52b672 AND $0x200,%R8D |
(834) 0x52b679 MOV %R8D,%R13D |
(834) 0x52b67c SHR $0x9,%R13D |
(834) 0x52b680 MOV %EDX,%R15D |
(834) 0x52b683 AND $0x180,%R15D |
(834) 0x52b68a CMP $0x80,%R15D |
(834) 0x52b691 SETNE %R15B |
(834) 0x52b695 AND %R13B,%R15B |
(834) 0x52b698 TEST %R8D,%R8D |
(834) 0x52b69b JE 52b6f2 |
(834) 0x52b69d MOVSXD %ECX,%RCX |
(834) 0x52b6a0 MOV 0x20(%RSP),%R8 |
(834) 0x52b6a5 VBROADCASTSS (%R8,%RCX,4),%YMM0 |
(834) 0x52b6ab VBROADCASTSS 0x4(%R8,%RCX,4),%YMM1 |
(834) 0x52b6b2 VINSERTF64X4 $0x1,%YMM1,%ZMM0,%ZMM0 |
(834) 0x52b6b9 VMOVAPS 0x480(%RSP),%ZMM2 |
(834) 0x52b6c1 VMULPS %ZMM0,%ZMM2,%ZMM0 |
(834) 0x52b6c7 VMOVAPS %ZMM0,0x200(%RSP) |
(834) 0x52b6cf VBROADCASTSS 0x8(%R8,%RCX,4),%YMM0 |
(834) 0x52b6d6 VBROADCASTSS 0xc(%R8,%RCX,4),%YMM1 |
(834) 0x52b6dd VINSERTF64X4 $0x1,%YMM1,%ZMM0,%ZMM0 |
(834) 0x52b6e4 VMULPS %ZMM0,%ZMM2,%ZMM0 |
(834) 0x52b6ea VMOVAPS %ZMM0,0x1c0(%RSP) |
(834) 0x52b6f2 MOV %RAX,0x18(%RSP) |
(834) 0x52b6f7 LEA (%RAX,%RAX,2),%RAX |
(834) 0x52b6fb MOV 0x8(%RBX),%ECX |
(834) 0x52b6fe MOVSXD %ECX,%R8 |
(834) 0x52b701 MOV %RBX,0x68(%RSP) |
(834) 0x52b706 MOVSXD 0xc(%RBX),%R13 |
(834) 0x52b70a MOV 0x48(%RSP),%RBX |
(834) 0x52b70f VBROADCASTSS (%RBX,%RAX,4),%ZMM0 |
(834) 0x52b716 VBROADCASTSS 0x4(%RBX,%RAX,4),%ZMM1 |
(834) 0x52b71e MOV %RAX,0x60(%RSP) |
(834) 0x52b723 VBROADCASTSS 0x8(%RBX,%RAX,4),%ZMM2 |
(834) 0x52b72b LEA (%RDI,%R9,2),%EDI |
(834) 0x52b72f MOVSXD %R12D,%R9 |
(834) 0x52b732 LEA 0x8(%R9),%RBX |
(834) 0x52b736 LEA 0x10(%R9),%RAX |
(834) 0x52b73a VBROADCASTSS (%RSI,%R9,4),%YMM6 |
(834) 0x52b740 VBROADCASTSS 0x4(%RSI,%R9,4),%YMM7 |
(834) 0x52b747 VINSERTF64X4 $0x1,%YMM7,%ZMM6,%ZMM6 |
(834) 0x52b74e VADDPS %ZMM6,%ZMM0,%ZMM30 |
(834) 0x52b754 VBROADCASTSS 0x8(%RSI,%R9,4),%YMM6 |
(834) 0x52b75b VBROADCASTSS 0xc(%RSI,%R9,4),%YMM7 |
(834) 0x52b762 VINSERTF64X4 $0x1,%YMM7,%ZMM6,%ZMM6 |
(834) 0x52b769 VADDPS %ZMM6,%ZMM0,%ZMM31 |
(834) 0x52b76f VBROADCASTSS 0x20(%RSI,%R9,4),%YMM0 |
(834) 0x52b776 VBROADCASTSS 0x24(%RSI,%R9,4),%YMM6 |
(834) 0x52b77d VINSERTF64X4 $0x1,%YMM6,%ZMM0,%ZMM0 |
(834) 0x52b784 VADDPS %ZMM0,%ZMM1,%ZMM0 |
(834) 0x52b78a VMOVAPS %ZMM0,0x140(%RSP) |
(834) 0x52b792 VBROADCASTSS 0x28(%RSI,%R9,4),%YMM0 |
(834) 0x52b799 VBROADCASTSS 0x2c(%RSI,%R9,4),%YMM6 |
(834) 0x52b7a0 VINSERTF64X4 $0x1,%YMM6,%ZMM0,%ZMM0 |
(834) 0x52b7a7 VADDPS %ZMM0,%ZMM1,%ZMM0 |
(834) 0x52b7ad VMOVAPS %ZMM0,0x100(%RSP) |
(834) 0x52b7b5 VBROADCASTSS 0x40(%RSI,%R9,4),%YMM0 |
(834) 0x52b7bc VBROADCASTSS 0x44(%RSI,%R9,4),%YMM1 |
(834) 0x52b7c3 VINSERTF64X4 $0x1,%YMM1,%ZMM0,%ZMM0 |
(834) 0x52b7ca VADDPS %ZMM0,%ZMM2,%ZMM0 |
(834) 0x52b7d0 VMOVAPS %ZMM0,0xc0(%RSP) |
(834) 0x52b7d8 VBROADCASTSS 0x48(%RSI,%R9,4),%YMM0 |
(834) 0x52b7df VBROADCASTSS 0x4c(%RSI,%R9,4),%YMM1 |
(834) 0x52b7e6 VINSERTF64X4 $0x1,%YMM1,%ZMM0,%ZMM0 |
(834) 0x52b7ed VADDPS %ZMM0,%ZMM2,%ZMM0 |
(834) 0x52b7f3 VMOVAPS %ZMM0,0x80(%RSP) |
(834) 0x52b7fb MOVSXD %EDI,%RDI |
(834) 0x52b7fe MOV %EDI,%R12D |
(834) 0x52b801 OR $0x8,%R12D |
(834) 0x52b805 MOVSXD %R12D,%R12 |
(834) 0x52b808 VBROADCASTSS (%R11,%RDI,4),%YMM0 |
(834) 0x52b80e VBROADCASTSS 0x4(%R11,%RDI,4),%YMM1 |
(834) 0x52b815 VINSERTF64X4 $0x1,%YMM1,%ZMM0,%ZMM14 |
(834) 0x52b81c VBROADCASTSS (%R11,%R12,4),%YMM0 |
(834) 0x52b822 VBROADCASTSS 0x4(%R11,%R12,4),%YMM1 |
(834) 0x52b829 VINSERTF64X4 $0x1,%YMM1,%ZMM0,%ZMM15 |
(834) 0x52b830 TEST %R15B,%R15B |
(834) 0x52b833 VMOVAPS %ZMM30,0x400(%RSP) |
(834) 0x52b83b VMOVAPS %ZMM31,0x3c0(%RSP) |
(834) 0x52b843 VMOVAPS %ZMM14,0x280(%RSP) |
(834) 0x52b84b VMOVAPS %ZMM15,0x240(%RSP) |
(834) 0x52b853 MOV %RAX,0x58(%RSP) |
(834) 0x52b858 MOV %RBX,0x50(%RSP) |
(834) 0x52b85d JE 52bd70 |
(834) 0x52b863 VXORPS %XMM16,%XMM16,%XMM16 |
(834) 0x52b869 CMP %R13D,%ECX |
(834) 0x52b86c JGE 52c300 |
(834) 0x52b872 LEA 0x4(,%R8,8),%R8 |
(834) 0x52b87a VXORPS %XMM22,%XMM22,%XMM22 |
(834) 0x52b880 VXORPS %XMM23,%XMM23,%XMM23 |
(834) 0x52b886 VXORPS %XMM21,%XMM21,%XMM21 |
(834) 0x52b88c VXORPS %XMM20,%XMM20,%XMM20 |
(834) 0x52b892 VXORPS %XMM19,%XMM19,%XMM19 |
(834) 0x52b898 MOV 0x30(%RSP),%RBX |
(834) 0x52b89d MOV 0x18(%RSP),%R15 |
(834) 0x52b8a2 MOV 0x2c(%RSP),%EDX |
(834) 0x52b8a6 JMP 52bc52 |
0x52b8ab NOPL (%RAX,%RAX,1) |
(840) 0x52b8b0 KANDD %K0,%K5,%K5 |
(840) 0x52b8b5 KANDD %K1,%K4,%K4 |
(840) 0x52b8ba VPTESTNMD %ZMM0,%ZMM0,%K6 |
(840) 0x52b8c0 VBROADCASTSS -0x1cf592(%RIP),%ZMM6 |
(840) 0x52b8ca VMAXPS %ZMM6,%ZMM1,%ZMM0 |
(840) 0x52b8d0 VMAXPS %ZMM6,%ZMM2,%ZMM6 |
(840) 0x52b8d6 VMOVAPS %ZMM0,%ZMM1{%K5}{z} |
(840) 0x52b8dc VMOVAPS 0x180(%RSP),%ZMM3 |
(840) 0x52b8e4 VMULPS %ZMM1,%ZMM3,%ZMM2 |
(840) 0x52b8ea VMOVAPS %ZMM6,%ZMM1{%K4}{z} |
(840) 0x52b8f0 VMULPS %ZMM1,%ZMM3,%ZMM1 |
(840) 0x52b8f6 VBROADCASTSS -0x1cf114(%RIP),%ZMM9 |
(840) 0x52b900 VBROADCASTSS -0x1cf27e(%RIP),%ZMM10 |
(840) 0x52b90a VMULPS %ZMM2,%ZMM2,%ZMM31 |
(840) 0x52b910 VMOVAPS %ZMM10,%ZMM7 |
(840) 0x52b916 VFMADD213PS %ZMM9,%ZMM31,%ZMM7 |
(840) 0x52b91c VBROADCASTSS -0x1cf4ee(%RIP),%ZMM11 |
(840) 0x52b926 VBROADCASTSS -0x1cf628(%RIP),%ZMM12 |
(840) 0x52b930 VMOVAPS %ZMM12,%ZMM8 |
(840) 0x52b936 VFMADD213PS %ZMM11,%ZMM31,%ZMM8 |
(840) 0x52b93c VBROADCASTSS -0x1cf7ba(%RIP),%ZMM13 |
(840) 0x52b946 VFMADD213PS %ZMM13,%ZMM31,%ZMM7 |
(840) 0x52b94c VBROADCASTSS -0x1cf696(%RIP),%ZMM14 |
(840) 0x52b956 VFMADD231PS %ZMM8,%ZMM2,%ZMM7 |
(840) 0x52b95c VBROADCASTSS -0x1cf3be(%RIP),%ZMM15 |
(840) 0x52b966 VMOVAPS %ZMM15,%ZMM8 |
(840) 0x52b96c VFMADD213PS %ZMM14,%ZMM31,%ZMM8 |
(840) 0x52b972 VBROADCASTSS -0x1cf390(%RIP),%ZMM17 |
(840) 0x52b97c VBROADCASTSS -0x1cf21e(%RIP),%ZMM3 |
(840) 0x52b986 VMOVAPS %ZMM3,%ZMM18 |
(840) 0x52b98c VFMADD213PS %ZMM17,%ZMM31,%ZMM18 |
(840) 0x52b992 VBROADCASTSS -0x1cf750(%RIP),%ZMM4 |
(840) 0x52b99c VFMADD213PS %ZMM4,%ZMM31,%ZMM8 |
(840) 0x52b9a2 VBROADCASTSS -0x1cf794(%RIP),%ZMM5 |
(840) 0x52b9ac VFMADD213PS %ZMM5,%ZMM31,%ZMM18 |
(840) 0x52b9b2 VBROADCASTSS -0x1cf4d4(%RIP),%ZMM30 |
(840) 0x52b9bc VFMADD213PS %ZMM30,%ZMM31,%ZMM8 |
(840) 0x52b9c2 VMULPS %ZMM1,%ZMM1,%ZMM31 |
(840) 0x52b9c8 VFMADD213PS %ZMM9,%ZMM31,%ZMM10 |
(840) 0x52b9ce VFMADD213PS %ZMM11,%ZMM31,%ZMM12 |
(840) 0x52b9d4 VFMADD213PS %ZMM13,%ZMM31,%ZMM10 |
(840) 0x52b9da VFMADD213PS %ZMM14,%ZMM31,%ZMM15 |
(840) 0x52b9e0 VFMADD213PS %ZMM17,%ZMM31,%ZMM3 |
(840) 0x52b9e6 VRSQRT14PS %ZMM0,%ZMM9 |
(840) 0x52b9ec VFMADD213PS %ZMM4,%ZMM31,%ZMM15 |
(840) 0x52b9f2 VBROADCASTSS -0x1cf580(%RIP),%ZMM4 |
(840) 0x52b9fc VMULPS %ZMM9,%ZMM0,%ZMM0 |
(840) 0x52ba02 VFMADD213PS %ZMM5,%ZMM31,%ZMM3 |
(840) 0x52ba08 VBROADCASTSS -0x1cf8be(%RIP),%ZMM5 |
(840) 0x52ba12 VFMADD213PS %ZMM5,%ZMM9,%ZMM0 |
(840) 0x52ba18 VMULPS %ZMM4,%ZMM9,%ZMM9 |
(840) 0x52ba1e VFMADD213PS %ZMM30,%ZMM31,%ZMM15 |
(840) 0x52ba24 VRCP14PS %ZMM7,%ZMM11 |
(840) 0x52ba2a VBROADCASTSS -0x1cf4f4(%RIP),%ZMM13 |
(840) 0x52ba34 VMULPS %ZMM0,%ZMM9,%ZMM0{%K5}{z} |
(840) 0x52ba3a VFNMADD213PS %ZMM13,%ZMM11,%ZMM7 |
(840) 0x52ba40 VMULPS %ZMM7,%ZMM11,%ZMM7 |
(840) 0x52ba46 VFMADD231PS %ZMM18,%ZMM2,%ZMM8 |
(840) 0x52ba4c VXORPS %XMM11,%XMM11,%XMM11 |
(840) 0x52ba51 VBLENDMPS %ZMM11,%ZMM0,%ZMM9{%K6} |
(840) 0x52ba57 VMULPS %ZMM7,%ZMM8,%ZMM7 |
(840) 0x52ba5d VMOVAPS 0x440(%RSP),%ZMM18 |
(840) 0x52ba65 VMULPS %ZMM7,%ZMM18,%ZMM7 |
(840) 0x52ba6b VFMADD213PS %ZMM9,%ZMM2,%ZMM7 |
(840) 0x52ba71 VRSQRT14PS %ZMM6,%ZMM2 |
(840) 0x52ba77 VMOVDQA64 0x2c0(%RSP),%ZMM8 |
(840) 0x52ba7f VPTESTMD %ZMM8,%ZMM8,%K5 |
(840) 0x52ba85 VMULPS %ZMM2,%ZMM6,%ZMM6 |
(840) 0x52ba8b VFMADD213PS %ZMM5,%ZMM2,%ZMM6 |
(840) 0x52ba91 VMULPS %ZMM4,%ZMM2,%ZMM2 |
(840) 0x52ba97 VMULPS %ZMM6,%ZMM2,%ZMM2{%K4}{z} |
(840) 0x52ba9d VFMADD231PS %ZMM12,%ZMM1,%ZMM10 |
(840) 0x52baa3 VRCP14PS %ZMM10,%ZMM4 |
(840) 0x52baa9 VFNMADD213PS %ZMM13,%ZMM4,%ZMM10 |
(840) 0x52baaf VMULPS %ZMM10,%ZMM4,%ZMM4 |
(840) 0x52bab5 VFMADD231PS %ZMM3,%ZMM1,%ZMM15 |
(840) 0x52babb VMULPS %ZMM4,%ZMM15,%ZMM3 |
(840) 0x52bac1 VMOVAPS %ZMM2,%ZMM4{%K5}{z} |
(840) 0x52bac7 VMULPS %ZMM3,%ZMM18,%ZMM3 |
(840) 0x52bacd VFMADD213PS %ZMM4,%ZMM1,%ZMM3 |
(840) 0x52bad3 MOV 0x20(%RSP),%RDI |
(840) 0x52bad8 VBROADCASTF64X4 (%RDI,%RAX,4),%ZMM1 |
(840) 0x52badf VMULPS 0x200(%RSP),%ZMM1,%ZMM4 |
(840) 0x52bae7 VMULPS 0x1c0(%RSP),%ZMM1,%ZMM1 |
(840) 0x52baef VMULPS %ZMM2,%ZMM2,%ZMM2 |
(840) 0x52baf5 VMULPS %ZMM7,%ZMM4,%ZMM4 |
(840) 0x52bafb VMULPS %ZMM3,%ZMM1,%ZMM1 |
(840) 0x52bb01 VMULPS %ZMM1,%ZMM2,%ZMM1 |
(840) 0x52bb07 MOV %R15,%RAX |
(840) 0x52bb0a SAL $0x4,%RAX |
(840) 0x52bb0e SAL $0x6,%R15 |
(840) 0x52bb12 VBROADCASTF64X4 (%R11,%R15,1),%ZMM2 |
(840) 0x52bb19 OR $0x8,%EAX |
(840) 0x52bb1c CLTQ |
(840) 0x52bb1e VBROADCASTF64X4 (%R11,%RAX,4),%ZMM3 |
(840) 0x52bb25 VADDPS 0x280(%RSP),%ZMM2,%ZMM2 |
(840) 0x52bb2d VMULPS %ZMM2,%ZMM0,%ZMM2 |
(840) 0x52bb33 VMULPS %ZMM2,%ZMM2,%ZMM2 |
(840) 0x52bb39 VMULPS %ZMM2,%ZMM2,%ZMM5 |
(840) 0x52bb3f VMULPS %ZMM5,%ZMM2,%ZMM2 |
(840) 0x52bb45 VMULPS 0x240(%RSP),%ZMM3,%ZMM3 |
(840) 0x52bb4d VMOVAPS %ZMM11,%ZMM2{%K6} |
(840) 0x52bb53 VMULPS %ZMM2,%ZMM3,%ZMM3 |
(840) 0x52bb59 VMULPS %ZMM3,%ZMM2,%ZMM2 |
(840) 0x52bb5f VSUBPS %ZMM3,%ZMM2,%ZMM2 |
(840) 0x52bb65 VADDPS %ZMM2,%ZMM4,%ZMM2 |
(840) 0x52bb6b VMULPS %ZMM0,%ZMM0,%ZMM0 |
(840) 0x52bb71 VMULPS %ZMM2,%ZMM0,%ZMM0 |
(840) 0x52bb77 VMULPS %ZMM0,%ZMM26,%ZMM2 |
(840) 0x52bb7d VMULPS %ZMM0,%ZMM27,%ZMM3 |
(840) 0x52bb83 VMULPS %ZMM0,%ZMM28,%ZMM0 |
(840) 0x52bb89 VMULPS %ZMM1,%ZMM24,%ZMM4 |
(840) 0x52bb8f VMULPS %ZMM1,%ZMM25,%ZMM5 |
(840) 0x52bb95 VMULPS %ZMM1,%ZMM29,%ZMM1 |
(840) 0x52bb9b VADDPS %ZMM2,%ZMM23,%ZMM23 |
(840) 0x52bba1 VADDPS %ZMM4,%ZMM22,%ZMM22 |
(840) 0x52bba7 VADDPS %ZMM2,%ZMM4,%ZMM2 |
(840) 0x52bbad VADDPS %ZMM3,%ZMM20,%ZMM20 |
(840) 0x52bbb3 VADDPS %ZMM5,%ZMM21,%ZMM21 |
(840) 0x52bbb9 VADDPS %ZMM0,%ZMM16,%ZMM16 |
(840) 0x52bbbf VADDPS %ZMM1,%ZMM19,%ZMM19 |
(840) 0x52bbc5 VADDPS %ZMM3,%ZMM5,%ZMM3 |
(840) 0x52bbcb VADDPS %ZMM0,%ZMM1,%ZMM0 |
(840) 0x52bbd1 VEXTRACTF64X4 $0x1,%ZMM2,%YMM1 |
(840) 0x52bbd8 VADDPS %YMM1,%YMM2,%YMM1 |
(840) 0x52bbdc VMOVAPS (%R10,%R12,4),%YMM2 |
(840) 0x52bbe2 VMOVAPS 0x20(%R10,%R12,4),%YMM4 |
(840) 0x52bbe9 VSUBPS %YMM1,%YMM2,%YMM1 |
(840) 0x52bbed VMOVAPS 0x40(%R10,%R12,4),%YMM2 |
(840) 0x52bbf4 VMOVAPS %YMM1,(%R10,%R12,4) |
(840) 0x52bbfa VEXTRACTF64X4 $0x1,%ZMM3,%YMM1 |
(840) 0x52bc01 VADDPS %YMM1,%YMM3,%YMM1 |
(840) 0x52bc05 VSUBPS %YMM1,%YMM4,%YMM1 |
(840) 0x52bc09 VMOVAPS %YMM1,0x20(%R10,%R12,4) |
(840) 0x52bc10 VEXTRACTF64X4 $0x1,%ZMM0,%YMM1 |
(840) 0x52bc17 VADDPS %YMM1,%YMM0,%YMM0 |
(840) 0x52bc1b VSUBPS %YMM0,%YMM2,%YMM0 |
(840) 0x52bc1f VMOVAPS %YMM0,0x40(%R10,%R12,4) |
(840) 0x52bc26 INC %ECX |
(840) 0x52bc28 ADD $0x8,%R8 |
(840) 0x52bc2c CMP %ECX,%R13D |
(840) 0x52bc2f VMOVAPS 0x380(%RSP),%ZMM17 |
(840) 0x52bc37 MOV 0x18(%RSP),%R15 |
(840) 0x52bc3c VMOVAPS 0x400(%RSP),%ZMM30 |
(840) 0x52bc44 VMOVAPS 0x3c0(%RSP),%ZMM31 |
(840) 0x52bc4c JE 52b4f0 |
(840) 0x52bc52 MOV 0x80(%RBX),%RAX |
(840) 0x52bc59 CMPL $-0x1,(%RAX,%R8,1) |
(840) 0x52bc5e JE 52c323 |
(840) 0x52bc64 MOVSXD -0x4(%R14,%R8,1),%R15 |
(840) 0x52bc69 LEA (,%R15,8),%RAX |
(840) 0x52bc71 VPBROADCASTD (%R14,%R8,1),%ZMM1 |
(840) 0x52bc78 LEA (%RAX,%RAX,2),%R12 |
(840) 0x52bc7c VPANDD 0x340(%RSP),%ZMM1,%ZMM0 |
(840) 0x52bc84 VPANDD 0x300(%RSP),%ZMM1,%ZMM3 |
(840) 0x52bc8c VBROADCASTF64X4 (%RSI,%R12,4),%ZMM1 |
(840) 0x52bc93 MOVSXD %R12D,%RDI |
(840) 0x52bc96 VBROADCASTF64X4 0x20(%RSI,%RDI,4),%ZMM2 |
(840) 0x52bc9e VBROADCASTF64X4 0x40(%RSI,%RDI,4),%ZMM6 |
(840) 0x52bca6 VSUBPS %ZMM1,%ZMM30,%ZMM26 |
(840) 0x52bcac VSUBPS %ZMM1,%ZMM31,%ZMM24 |
(840) 0x52bcb2 VMOVAPS 0x140(%RSP),%ZMM1 |
(840) 0x52bcba VSUBPS %ZMM2,%ZMM1,%ZMM27 |
(840) 0x52bcc0 VMOVAPS 0x100(%RSP),%ZMM1 |
(840) 0x52bcc8 VSUBPS %ZMM2,%ZMM1,%ZMM25 |
(840) 0x52bcce VMOVAPS 0xc0(%RSP),%ZMM1 |
(840) 0x52bcd6 VSUBPS %ZMM6,%ZMM1,%ZMM28 |
(840) 0x52bcdc VMOVAPS 0x80(%RSP),%ZMM1 |
(840) 0x52bce4 VSUBPS %ZMM6,%ZMM1,%ZMM29 |
(840) 0x52bcea VMULPS %ZMM26,%ZMM26,%ZMM1 |
(840) 0x52bcf0 VMULPS %ZMM27,%ZMM27,%ZMM2 |
(840) 0x52bcf6 VADDPS %ZMM2,%ZMM1,%ZMM1 |
(840) 0x52bcfc VMULPS %ZMM28,%ZMM28,%ZMM2 |
(840) 0x52bd02 VADDPS %ZMM2,%ZMM1,%ZMM1 |
(840) 0x52bd08 VMULPS %ZMM24,%ZMM24,%ZMM2 |
(840) 0x52bd0e VMULPS %ZMM25,%ZMM25,%ZMM6 |
(840) 0x52bd14 VADDPS %ZMM6,%ZMM2,%ZMM2 |
(840) 0x52bd1a VMULPS %ZMM29,%ZMM29,%ZMM6 |
(840) 0x52bd20 VADDPS %ZMM6,%ZMM2,%ZMM2 |
(840) 0x52bd26 VCMPPS $0x1,%ZMM17,%ZMM1,%K5 |
(840) 0x52bd2d VCMPPS $0x1,%ZMM17,%ZMM2,%K4 |
(840) 0x52bd34 LEA (%R15,%R15,1),%EDI |
(840) 0x52bd38 CMP %EDX,%EDI |
(840) 0x52bd3a VMOVDQA64 %ZMM3,0x2c0(%RSP) |
(840) 0x52bd42 JE 52b8b0 |
(840) 0x52bd48 OR $0x1,%EDI |
(840) 0x52bd4b CMP %EDX,%EDI |
(840) 0x52bd4d JNE 52b8ba |
(840) 0x52bd53 KANDD %K2,%K5,%K5 |
(840) 0x52bd58 KANDD %K3,%K4,%K4 |
(840) 0x52bd5d JMP 52b8ba |
0x52bd62 NOPW %CS:(%RAX,%RAX,1) |
(834) 0x52bd70 VBROADCASTSS 0x8(%R11,%RDI,4),%YMM0 |
(834) 0x52bd77 VBROADCASTSS 0xc(%R11,%RDI,4),%YMM1 |
(834) 0x52bd7e VINSERTF64X4 $0x1,%YMM1,%ZMM0,%ZMM24 |
(834) 0x52bd85 VBROADCASTSS 0x8(%R11,%R12,4),%YMM0 |
(834) 0x52bd8c VBROADCASTSS 0xc(%R11,%R12,4),%YMM1 |
(834) 0x52bd93 VINSERTF64X4 $0x1,%YMM1,%ZMM0,%ZMM25 |
(834) 0x52bd9a VXORPS %XMM16,%XMM16,%XMM16 |
(834) 0x52bda0 TEST $0x200,%EDX |
(834) 0x52bda6 JE 52c740 |
(834) 0x52bdac CMP %R13D,%ECX |
(834) 0x52bdaf JGE 52ca2c |
(834) 0x52bdb5 LEA 0x4(,%R8,8),%R8 |
(834) 0x52bdbd VXORPS %XMM22,%XMM22,%XMM22 |
(834) 0x52bdc3 VXORPS %XMM23,%XMM23,%XMM23 |
(834) 0x52bdc9 VXORPS %XMM21,%XMM21,%XMM21 |
(834) 0x52bdcf VXORPS %XMM20,%XMM20,%XMM20 |
(834) 0x52bdd5 VXORPS %XMM19,%XMM19,%XMM19 |
(834) 0x52bddb MOV 0x30(%RSP),%RBX |
(834) 0x52bde0 MOV 0x18(%RSP),%R15 |
(834) 0x52bde5 VMOVAPS %ZMM24,0x500(%RSP) |
(834) 0x52bded VMOVAPS %ZMM25,0x4c0(%RSP) |
(834) 0x52bdf5 MOV 0x2c(%RSP),%EDX |
(834) 0x52bdf9 JMP 52c1ee |
0x52bdfe XCHG %AX,%AX |
(838) 0x52be00 KANDD %K0,%K5,%K5 |
(838) 0x52be05 KANDD %K1,%K4,%K4 |
(838) 0x52be0a VPTESTNMD %ZMM0,%ZMM0,%K6 |
(838) 0x52be10 VBROADCASTSS -0x1cfae2(%RIP),%ZMM3 |
(838) 0x52be1a VMAXPS %ZMM3,%ZMM1,%ZMM0 |
(838) 0x52be20 VMAXPS %ZMM3,%ZMM2,%ZMM7 |
(838) 0x52be26 VMOVAPS %ZMM0,%ZMM1{%K5}{z} |
(838) 0x52be2c VMOVAPS 0x180(%RSP),%ZMM2 |
(838) 0x52be34 VMULPS %ZMM1,%ZMM2,%ZMM8 |
(838) 0x52be3a VMOVAPS %ZMM7,%ZMM1{%K4}{z} |
(838) 0x52be40 VMULPS %ZMM1,%ZMM2,%ZMM1 |
(838) 0x52be46 VBROADCASTSS -0x1cf664(%RIP),%ZMM3 |
(838) 0x52be50 VBROADCASTSS -0x1cf7ce(%RIP),%ZMM2 |
(838) 0x52be5a VMULPS %ZMM8,%ZMM8,%ZMM4 |
(838) 0x52be60 VMOVAPS %ZMM2,%ZMM5 |
(838) 0x52be66 VFMADD213PS %ZMM3,%ZMM4,%ZMM5 |
(838) 0x52be6c VBROADCASTSS -0x1cfa3e(%RIP),%ZMM10 |
(838) 0x52be76 VBROADCASTSS -0x1cfb78(%RIP),%ZMM9 |
(838) 0x52be80 VMOVAPS %ZMM9,%ZMM11 |
(838) 0x52be86 VFMADD213PS %ZMM10,%ZMM4,%ZMM11 |
(838) 0x52be8c VBROADCASTSS -0x1cfd0a(%RIP),%ZMM12 |
(838) 0x52be96 VFMADD213PS %ZMM12,%ZMM4,%ZMM5 |
(838) 0x52be9c VBROADCASTSS -0x1cfbe6(%RIP),%ZMM13 |
(838) 0x52bea6 VFMADD231PS %ZMM11,%ZMM8,%ZMM5 |
(838) 0x52beac VBROADCASTSS -0x1cf90e(%RIP),%ZMM11 |
(838) 0x52beb6 VMOVAPS %ZMM11,%ZMM14 |
(838) 0x52bebc VFMADD213PS %ZMM13,%ZMM4,%ZMM14 |
(838) 0x52bec2 VBROADCASTSS -0x1cf8e0(%RIP),%ZMM15 |
(838) 0x52becc VBROADCASTSS -0x1cf76e(%RIP),%ZMM17 |
(838) 0x52bed6 VMOVAPS %ZMM17,%ZMM18 |
(838) 0x52bedc VFMADD213PS %ZMM15,%ZMM4,%ZMM18 |
(838) 0x52bee2 VBROADCASTSS -0x1cfca0(%RIP),%ZMM24 |
(838) 0x52beec VFMADD213PS %ZMM24,%ZMM4,%ZMM14 |
(838) 0x52bef2 VBROADCASTSS -0x1cfce4(%RIP),%ZMM25 |
(838) 0x52befc VFMADD213PS %ZMM25,%ZMM4,%ZMM18 |
(838) 0x52bf02 VBROADCASTSS -0x1cfa24(%RIP),%ZMM6 |
(838) 0x52bf0c VFMADD213PS %ZMM6,%ZMM4,%ZMM14 |
(838) 0x52bf12 VMULPS %ZMM1,%ZMM1,%ZMM4 |
(838) 0x52bf18 VFMADD213PS %ZMM3,%ZMM4,%ZMM2 |
(838) 0x52bf1e VFMADD213PS %ZMM10,%ZMM4,%ZMM9 |
(838) 0x52bf24 VFMADD213PS %ZMM12,%ZMM4,%ZMM2 |
(838) 0x52bf2a VFMADD213PS %ZMM13,%ZMM4,%ZMM11 |
(838) 0x52bf30 VFMADD213PS %ZMM15,%ZMM4,%ZMM17 |
(838) 0x52bf36 VRSQRT14PS %ZMM0,%ZMM3 |
(838) 0x52bf3c VFMADD213PS %ZMM24,%ZMM4,%ZMM11 |
(838) 0x52bf42 VBROADCASTSS -0x1cfad0(%RIP),%ZMM10 |
(838) 0x52bf4c VMULPS %ZMM3,%ZMM0,%ZMM0 |
(838) 0x52bf52 VFMADD213PS %ZMM25,%ZMM4,%ZMM17 |
(838) 0x52bf58 VBROADCASTSS -0x1cfe0e(%RIP),%ZMM12 |
(838) 0x52bf62 VFMADD213PS %ZMM12,%ZMM3,%ZMM0 |
(838) 0x52bf68 VMULPS %ZMM10,%ZMM3,%ZMM3 |
(838) 0x52bf6e VFMADD213PS %ZMM6,%ZMM4,%ZMM11 |
(838) 0x52bf74 VRCP14PS %ZMM5,%ZMM4 |
(838) 0x52bf7a VBROADCASTSS -0x1cfa44(%RIP),%ZMM6 |
(838) 0x52bf84 VMULPS %ZMM0,%ZMM3,%ZMM0{%K5}{z} |
(838) 0x52bf8a VFNMADD213PS %ZMM6,%ZMM4,%ZMM5 |
(838) 0x52bf90 VMULPS %ZMM5,%ZMM4,%ZMM3 |
(838) 0x52bf96 VFMADD231PS %ZMM18,%ZMM8,%ZMM14 |
(838) 0x52bf9c VXORPS %XMM13,%XMM13,%XMM13 |
(838) 0x52bfa1 VBLENDMPS %ZMM13,%ZMM0,%ZMM4{%K6} |
(838) 0x52bfa7 VMULPS %ZMM3,%ZMM14,%ZMM3 |
(838) 0x52bfad VMOVAPS 0x440(%RSP),%ZMM18 |
(838) 0x52bfb5 VMULPS %ZMM3,%ZMM18,%ZMM3 |
(838) 0x52bfbb VFMADD213PS %ZMM4,%ZMM8,%ZMM3 |
(838) 0x52bfc1 VRSQRT14PS %ZMM7,%ZMM4 |
(838) 0x52bfc7 VPTESTNMD %ZMM26,%ZMM26,%K5 |
(838) 0x52bfcd VMULPS %ZMM4,%ZMM7,%ZMM5 |
(838) 0x52bfd3 VFMADD213PS %ZMM12,%ZMM4,%ZMM5 |
(838) 0x52bfd9 VMULPS %ZMM10,%ZMM4,%ZMM4 |
(838) 0x52bfdf VMULPS %ZMM5,%ZMM4,%ZMM4{%K4}{z} |
(838) 0x52bfe5 VFMADD231PS %ZMM9,%ZMM1,%ZMM2 |
(838) 0x52bfeb VRCP14PS %ZMM2,%ZMM5 |
(838) 0x52bff1 VFNMADD213PS %ZMM6,%ZMM5,%ZMM2 |
(838) 0x52bff7 MOV 0x20(%RSP),%RDI |
(838) 0x52bffc VBROADCASTF64X4 (%RDI,%RAX,4),%ZMM6 |
(838) 0x52c003 VMULPS %ZMM2,%ZMM5,%ZMM2 |
(838) 0x52c009 VFMADD231PS %ZMM17,%ZMM1,%ZMM11 |
(838) 0x52c00f VMULPS 0x200(%RSP),%ZMM6,%ZMM5 |
(838) 0x52c017 VMULPS %ZMM2,%ZMM11,%ZMM2 |
(838) 0x52c01d VBLENDMPS %ZMM13,%ZMM4,%ZMM7{%K5} |
(838) 0x52c023 VMULPS 0x1c0(%RSP),%ZMM6,%ZMM6 |
(838) 0x52c02b VMULPS %ZMM2,%ZMM18,%ZMM2 |
(838) 0x52c031 VMULPS %ZMM3,%ZMM5,%ZMM3 |
(838) 0x52c037 VFMADD213PS %ZMM7,%ZMM1,%ZMM2 |
(838) 0x52c03d MOV %R15,%RAX |
(838) 0x52c040 SAL $0x4,%RAX |
(838) 0x52c044 SAL $0x6,%R15 |
(838) 0x52c048 VBROADCASTF64X4 (%R11,%R15,1),%ZMM1 |
(838) 0x52c04f OR $0x8,%EAX |
(838) 0x52c052 CLTQ |
(838) 0x52c054 VBROADCASTF64X4 (%R11,%RAX,4),%ZMM5 |
(838) 0x52c05b VMULPS %ZMM2,%ZMM6,%ZMM2 |
(838) 0x52c061 VADDPS 0x280(%RSP),%ZMM1,%ZMM6 |
(838) 0x52c069 VMOVAPS 0x500(%RSP),%ZMM24 |
(838) 0x52c071 VADDPS %ZMM1,%ZMM24,%ZMM1 |
(838) 0x52c077 VMULPS %ZMM6,%ZMM0,%ZMM6 |
(838) 0x52c07d VMULPS %ZMM1,%ZMM4,%ZMM1 |
(838) 0x52c083 VMULPS %ZMM6,%ZMM6,%ZMM6 |
(838) 0x52c089 VMULPS %ZMM1,%ZMM1,%ZMM1 |
(838) 0x52c08f VMULPS %ZMM6,%ZMM6,%ZMM7 |
(838) 0x52c095 VMULPS %ZMM7,%ZMM6,%ZMM6 |
(838) 0x52c09b VMULPS %ZMM1,%ZMM1,%ZMM7 |
(838) 0x52c0a1 VMULPS %ZMM7,%ZMM1,%ZMM1 |
(838) 0x52c0a7 VMULPS 0x240(%RSP),%ZMM5,%ZMM7 |
(838) 0x52c0af VMOVAPS %ZMM13,%ZMM6{%K6} |
(838) 0x52c0b5 VMULPS %ZMM6,%ZMM7,%ZMM7 |
(838) 0x52c0bb VMULPS %ZMM7,%ZMM6,%ZMM6 |
(838) 0x52c0c1 VSUBPS %ZMM7,%ZMM6,%ZMM6 |
(838) 0x52c0c7 VADDPS %ZMM6,%ZMM3,%ZMM3 |
(838) 0x52c0cd VMULPS %ZMM0,%ZMM0,%ZMM0 |
(838) 0x52c0d3 VMULPS %ZMM3,%ZMM0,%ZMM0 |
(838) 0x52c0d9 VMOVAPS 0x4c0(%RSP),%ZMM25 |
(838) 0x52c0e1 VMULPS %ZMM5,%ZMM25,%ZMM3 |
(838) 0x52c0e7 VMOVAPS %ZMM13,%ZMM1{%K5} |
(838) 0x52c0ed VMULPS %ZMM1,%ZMM3,%ZMM3 |
(838) 0x52c0f3 VMULPS %ZMM3,%ZMM1,%ZMM1 |
(838) 0x52c0f9 VSUBPS %ZMM3,%ZMM1,%ZMM1 |
(838) 0x52c0ff VADDPS %ZMM1,%ZMM2,%ZMM1 |
(838) 0x52c105 VMULPS %ZMM4,%ZMM4,%ZMM2 |
(838) 0x52c10b VMULPS %ZMM1,%ZMM2,%ZMM1 |
(838) 0x52c111 VMULPS %ZMM0,%ZMM28,%ZMM2 |
(838) 0x52c117 VMULPS %ZMM0,%ZMM29,%ZMM3 |
(838) 0x52c11d VMULPS %ZMM0,%ZMM30,%ZMM0 |
(838) 0x52c123 VMULPS 0x2c0(%RSP),%ZMM1,%ZMM4 |
(838) 0x52c12b VMULPS %ZMM1,%ZMM27,%ZMM5 |
(838) 0x52c131 VMULPS %ZMM1,%ZMM31,%ZMM1 |
(838) 0x52c137 VADDPS %ZMM2,%ZMM23,%ZMM23 |
(838) 0x52c13d VADDPS %ZMM4,%ZMM22,%ZMM22 |
(838) 0x52c143 VADDPS %ZMM4,%ZMM2,%ZMM2 |
(838) 0x52c149 VADDPS %ZMM3,%ZMM20,%ZMM20 |
(838) 0x52c14f VADDPS %ZMM5,%ZMM21,%ZMM21 |
(838) 0x52c155 VADDPS %ZMM0,%ZMM16,%ZMM16 |
(838) 0x52c15b VADDPS %ZMM1,%ZMM19,%ZMM19 |
(838) 0x52c161 VADDPS %ZMM5,%ZMM3,%ZMM3 |
(838) 0x52c167 VADDPS %ZMM1,%ZMM0,%ZMM0 |
(838) 0x52c16d VEXTRACTF64X4 $0x1,%ZMM2,%YMM1 |
(838) 0x52c174 VADDPS %YMM1,%YMM2,%YMM1 |
(838) 0x52c178 VMOVAPS (%R10,%R12,4),%YMM2 |
(838) 0x52c17e VMOVAPS 0x20(%R10,%R12,4),%YMM4 |
(838) 0x52c185 VSUBPS %YMM1,%YMM2,%YMM1 |
(838) 0x52c189 VMOVAPS 0x40(%R10,%R12,4),%YMM2 |
(838) 0x52c190 VMOVAPS %YMM1,(%R10,%R12,4) |
(838) 0x52c196 VEXTRACTF64X4 $0x1,%ZMM3,%YMM1 |
(838) 0x52c19d VADDPS %YMM1,%YMM3,%YMM1 |
(838) 0x52c1a1 VSUBPS %YMM1,%YMM4,%YMM1 |
(838) 0x52c1a5 VMOVAPS %YMM1,0x20(%R10,%R12,4) |
(838) 0x52c1ac VEXTRACTF64X4 $0x1,%ZMM0,%YMM1 |
(838) 0x52c1b3 VADDPS %YMM1,%YMM0,%YMM0 |
(838) 0x52c1b7 VSUBPS %YMM0,%YMM2,%YMM0 |
(838) 0x52c1bb VMOVAPS %YMM0,0x40(%R10,%R12,4) |
(838) 0x52c1c2 INC %ECX |
(838) 0x52c1c4 ADD $0x8,%R8 |
(838) 0x52c1c8 CMP %ECX,%R13D |
(838) 0x52c1cb VMOVAPS 0x380(%RSP),%ZMM17 |
(838) 0x52c1d3 MOV 0x18(%RSP),%R15 |
(838) 0x52c1d8 VMOVAPS 0x400(%RSP),%ZMM30 |
(838) 0x52c1e0 VMOVAPS 0x3c0(%RSP),%ZMM31 |
(838) 0x52c1e8 JE 52b4f0 |
(838) 0x52c1ee MOV 0x80(%RBX),%RAX |
(838) 0x52c1f5 CMPL $-0x1,(%RAX,%R8,1) |
(838) 0x52c1fa JE 52ca4f |
(838) 0x52c200 MOVSXD -0x4(%R14,%R8,1),%R15 |
(838) 0x52c205 LEA (,%R15,8),%RAX |
(838) 0x52c20d VPBROADCASTD (%R14,%R8,1),%ZMM1 |
(838) 0x52c214 LEA (%RAX,%RAX,2),%R12 |
(838) 0x52c218 VPANDD 0x340(%RSP),%ZMM1,%ZMM0 |
(838) 0x52c220 VPANDD 0x300(%RSP),%ZMM1,%ZMM26 |
(838) 0x52c228 VBROADCASTF64X4 (%RSI,%R12,4),%ZMM1 |
(838) 0x52c22f MOVSXD %R12D,%RDI |
(838) 0x52c232 VBROADCASTF64X4 0x20(%RSI,%RDI,4),%ZMM2 |
(838) 0x52c23a VBROADCASTF64X4 0x40(%RSI,%RDI,4),%ZMM3 |
(838) 0x52c242 VSUBPS %ZMM1,%ZMM30,%ZMM28 |
(838) 0x52c248 VSUBPS %ZMM1,%ZMM31,%ZMM4 |
(838) 0x52c24e VMOVAPS 0x140(%RSP),%ZMM1 |
(838) 0x52c256 VSUBPS %ZMM2,%ZMM1,%ZMM29 |
(838) 0x52c25c VMOVAPS 0x100(%RSP),%ZMM1 |
(838) 0x52c264 VSUBPS %ZMM2,%ZMM1,%ZMM27 |
(838) 0x52c26a VMOVAPS 0xc0(%RSP),%ZMM1 |
(838) 0x52c272 VSUBPS %ZMM3,%ZMM1,%ZMM30 |
(838) 0x52c278 VMOVAPS 0x80(%RSP),%ZMM1 |
(838) 0x52c280 VSUBPS %ZMM3,%ZMM1,%ZMM31 |
(838) 0x52c286 VMULPS %ZMM28,%ZMM28,%ZMM1 |
(838) 0x52c28c VMULPS %ZMM29,%ZMM29,%ZMM2 |
(838) 0x52c292 VADDPS %ZMM2,%ZMM1,%ZMM1 |
(838) 0x52c298 VMULPS %ZMM30,%ZMM30,%ZMM2 |
(838) 0x52c29e VADDPS %ZMM2,%ZMM1,%ZMM1 |
(838) 0x52c2a4 VMULPS %ZMM4,%ZMM4,%ZMM2 |
(838) 0x52c2aa VMULPS %ZMM27,%ZMM27,%ZMM3 |
(838) 0x52c2b0 VADDPS %ZMM3,%ZMM2,%ZMM2 |
(838) 0x52c2b6 VMULPS %ZMM31,%ZMM31,%ZMM3 |
(838) 0x52c2bc VADDPS %ZMM3,%ZMM2,%ZMM2 |
(838) 0x52c2c2 VCMPPS $0x1,%ZMM17,%ZMM1,%K5 |
(838) 0x52c2c9 VCMPPS $0x1,%ZMM17,%ZMM2,%K4 |
(838) 0x52c2d0 LEA (%R15,%R15,1),%EDI |
(838) 0x52c2d4 CMP %EDX,%EDI |
(838) 0x52c2d6 VMOVAPS %ZMM4,0x2c0(%RSP) |
(838) 0x52c2de JE 52be00 |
(838) 0x52c2e4 OR $0x1,%EDI |
(838) 0x52c2e7 CMP %EDX,%EDI |
(838) 0x52c2e9 JNE 52be0a |
(838) 0x52c2ef KANDD %K2,%K5,%K5 |
(838) 0x52c2f4 KANDD %K3,%K4,%K4 |
(838) 0x52c2f9 JMP 52be0a |
0x52c2fe XCHG %AX,%AX |
(834) 0x52c300 VXORPS %XMM19,%XMM19,%XMM19 |
(834) 0x52c306 VXORPS %XMM20,%XMM20,%XMM20 |
(834) 0x52c30c VXORPS %XMM21,%XMM21,%XMM21 |
(834) 0x52c312 VXORPS %XMM23,%XMM23,%XMM23 |
(834) 0x52c318 VXORPS %XMM22,%XMM22,%XMM22 |
(834) 0x52c31e MOV 0x18(%RSP),%R15 |
(834) 0x52c323 CMP %R13D,%ECX |
(834) 0x52c326 JGE 52b4f0 |
(834) 0x52c32c MOVSXD %ECX,%RCX |
(834) 0x52c32f NOP |
(839) 0x52c330 MOVSXD (%R14,%RCX,8),%RAX |
(839) 0x52c334 LEA (,%RAX,8),%RDX |
(839) 0x52c33c LEA (%RDX,%RDX,2),%RDX |
(839) 0x52c340 VBROADCASTF64X4 (%RSI,%RDX,4),%ZMM0 |
(839) 0x52c347 MOVSXD %EDX,%RDI |
(839) 0x52c34a VBROADCASTF64X4 0x20(%RSI,%RDI,4),%ZMM1 |
(839) 0x52c352 VBROADCASTF64X4 0x40(%RSI,%RDI,4),%ZMM2 |
(839) 0x52c35a VSUBPS %ZMM0,%ZMM30,%ZMM25 |
(839) 0x52c360 VSUBPS %ZMM0,%ZMM31,%ZMM6 |
(839) 0x52c366 VMOVAPS 0x140(%RSP),%ZMM0 |
(839) 0x52c36e VSUBPS %ZMM1,%ZMM0,%ZMM26 |
(839) 0x52c374 VMOVAPS 0x100(%RSP),%ZMM0 |
(839) 0x52c37c VSUBPS %ZMM1,%ZMM0,%ZMM24 |
(839) 0x52c382 VMOVAPS 0xc0(%RSP),%ZMM0 |
(839) 0x52c38a VSUBPS %ZMM2,%ZMM0,%ZMM27 |
(839) 0x52c390 VMOVAPS 0x80(%RSP),%ZMM0 |
(839) 0x52c398 VSUBPS %ZMM2,%ZMM0,%ZMM28 |
(839) 0x52c39e VMULPS %ZMM25,%ZMM25,%ZMM0 |
(839) 0x52c3a4 VMULPS %ZMM26,%ZMM26,%ZMM1 |
(839) 0x52c3aa VADDPS %ZMM1,%ZMM0,%ZMM0 |
(839) 0x52c3b0 VMULPS %ZMM27,%ZMM27,%ZMM1 |
(839) 0x52c3b6 VMULPS %ZMM6,%ZMM6,%ZMM2 |
(839) 0x52c3bc VMULPS %ZMM24,%ZMM24,%ZMM3 |
(839) 0x52c3c2 VADDPS %ZMM1,%ZMM0,%ZMM0 |
(839) 0x52c3c8 VADDPS %ZMM3,%ZMM2,%ZMM1 |
(839) 0x52c3ce VMULPS %ZMM28,%ZMM28,%ZMM2 |
(839) 0x52c3d4 VADDPS %ZMM2,%ZMM1,%ZMM1 |
(839) 0x52c3da VBROADCASTSS -0x1d00ac(%RIP),%ZMM2 |
(839) 0x52c3e4 VCMPPS $0x1,%ZMM17,%ZMM0,%K5 |
(839) 0x52c3eb VCMPPS $0x1,%ZMM17,%ZMM1,%K4 |
(839) 0x52c3f2 VMAXPS %ZMM2,%ZMM0,%ZMM0 |
(839) 0x52c3f8 VMAXPS %ZMM2,%ZMM1,%ZMM3 |
(839) 0x52c3fe VRSQRT14PS %ZMM0,%ZMM4 |
(839) 0x52c404 VMULPS %ZMM4,%ZMM0,%ZMM5 |
(839) 0x52c40a VBROADCASTSS -0x1cff98(%RIP),%ZMM2 |
(839) 0x52c414 VBROADCASTSS -0x1d02ca(%RIP),%ZMM8 |
(839) 0x52c41e VMULPS %ZMM2,%ZMM4,%ZMM9 |
(839) 0x52c424 VRSQRT14PS %ZMM3,%ZMM10 |
(839) 0x52c42a VMULPS %ZMM10,%ZMM3,%ZMM1 |
(839) 0x52c430 VMOVAPS %ZMM0,%ZMM0{%K5}{z} |
(839) 0x52c436 VMULPS %ZMM2,%ZMM10,%ZMM2 |
(839) 0x52c43c VMOVAPS 0x180(%RSP),%ZMM7 |
(839) 0x52c444 VMULPS %ZMM0,%ZMM7,%ZMM29 |
(839) 0x52c44a VMOVAPS %ZMM3,%ZMM0{%K4}{z} |
(839) 0x52c450 VMULPS %ZMM0,%ZMM7,%ZMM7 |
(839) 0x52c456 VBROADCASTSS -0x1cfc74(%RIP),%ZMM3 |
(839) 0x52c460 VFMADD213PS %ZMM8,%ZMM4,%ZMM5 |
(839) 0x52c466 VMULPS %ZMM29,%ZMM29,%ZMM4 |
(839) 0x52c46c VBROADCASTSS -0x1cfdea(%RIP),%ZMM11 |
(839) 0x52c476 VMOVAPS %ZMM11,%ZMM12 |
(839) 0x52c47c VBROADCASTSS -0x1d004e(%RIP),%ZMM13 |
(839) 0x52c486 VFMADD213PS %ZMM8,%ZMM10,%ZMM1 |
(839) 0x52c48c VFMADD213PS %ZMM3,%ZMM4,%ZMM12 |
(839) 0x52c492 VBROADCASTSS -0x1d0194(%RIP),%ZMM8 |
(839) 0x52c49c VMOVAPS %ZMM8,%ZMM10 |
(839) 0x52c4a2 VBROADCASTSS -0x1d0320(%RIP),%ZMM14 |
(839) 0x52c4ac VMULPS %ZMM5,%ZMM9,%ZMM0{%K5}{z} |
(839) 0x52c4b2 VBROADCASTSS -0x1d01fc(%RIP),%ZMM5 |
(839) 0x52c4bc VBROADCASTSS -0x1cff1e(%RIP),%ZMM9 |
(839) 0x52c4c6 VMULPS %ZMM7,%ZMM7,%ZMM15 |
(839) 0x52c4cc VFMADD213PS %ZMM13,%ZMM4,%ZMM10 |
(839) 0x52c4d2 VFMADD213PS %ZMM3,%ZMM15,%ZMM11 |
(839) 0x52c4d8 VMOVAPS %ZMM9,%ZMM3 |
(839) 0x52c4de VFMADD213PS %ZMM5,%ZMM4,%ZMM3 |
(839) 0x52c4e4 VFMADD213PS %ZMM13,%ZMM15,%ZMM8 |
(839) 0x52c4ea VBROADCASTSS -0x1cff08(%RIP),%ZMM13 |
(839) 0x52c4f4 VFMADD213PS %ZMM14,%ZMM4,%ZMM12 |
(839) 0x52c4fa VFMADD213PS %ZMM14,%ZMM15,%ZMM11 |
(839) 0x52c500 VBROADCASTSS -0x1cfda2(%RIP),%ZMM14 |
(839) 0x52c50a VFMADD213PS %ZMM5,%ZMM15,%ZMM9 |
(839) 0x52c510 VMOVAPS %ZMM14,%ZMM5 |
(839) 0x52c516 VFMADD213PS %ZMM13,%ZMM4,%ZMM5 |
(839) 0x52c51c VFMADD231PS %ZMM10,%ZMM29,%ZMM12 |
(839) 0x52c522 VBROADCASTSS -0x1d02e0(%RIP),%ZMM10 |
(839) 0x52c52c VFMADD213PS %ZMM13,%ZMM15,%ZMM14 |
(839) 0x52c532 VBROADCASTSS -0x1d0324(%RIP),%ZMM13 |
(839) 0x52c53c VFMADD213PS %ZMM10,%ZMM4,%ZMM3 |
(839) 0x52c542 VFMADD213PS %ZMM10,%ZMM15,%ZMM9 |
(839) 0x52c548 VFMADD213PS %ZMM13,%ZMM4,%ZMM5 |
(839) 0x52c54e VFMADD213PS %ZMM13,%ZMM15,%ZMM14 |
(839) 0x52c554 VBROADCASTSS -0x1d0076(%RIP),%ZMM10 |
(839) 0x52c55e VFMADD213PS %ZMM10,%ZMM4,%ZMM3 |
(839) 0x52c564 VFMADD213PS %ZMM10,%ZMM15,%ZMM9 |
(839) 0x52c56a VBROADCASTSS -0x1d0034(%RIP),%ZMM4 |
(839) 0x52c574 VRCP14PS %ZMM12,%ZMM10 |
(839) 0x52c57a VMULPS %ZMM1,%ZMM2,%ZMM1{%K4}{z} |
(839) 0x52c580 VFMADD231PS %ZMM8,%ZMM7,%ZMM11 |
(839) 0x52c586 VRCP14PS %ZMM11,%ZMM2 |
(839) 0x52c58c VFNMADD213PS %ZMM4,%ZMM10,%ZMM12 |
(839) 0x52c592 VMULPS %ZMM12,%ZMM10,%ZMM8 |
(839) 0x52c598 VFMADD231PS %ZMM5,%ZMM29,%ZMM3 |
(839) 0x52c59e VFNMADD213PS %ZMM4,%ZMM2,%ZMM11 |
(839) 0x52c5a4 VMULPS %ZMM11,%ZMM2,%ZMM2 |
(839) 0x52c5aa VFMADD231PS %ZMM14,%ZMM7,%ZMM9 |
(839) 0x52c5b0 VMULPS %ZMM8,%ZMM3,%ZMM3 |
(839) 0x52c5b6 MOV %RAX,%RDI |
(839) 0x52c5b9 SAL $0x5,%RDI |
(839) 0x52c5bd VMULPS %ZMM2,%ZMM9,%ZMM2 |
(839) 0x52c5c3 MOV 0x20(%RSP),%R8 |
(839) 0x52c5c8 VBROADCASTF64X4 (%R8,%RDI,1),%ZMM4 |
(839) 0x52c5cf VMULPS %ZMM3,%ZMM18,%ZMM3 |
(839) 0x52c5d5 VFMADD213PS %ZMM0,%ZMM29,%ZMM3 |
(839) 0x52c5db VMULPS 0x200(%RSP),%ZMM4,%ZMM5 |
(839) 0x52c5e3 VMULPS %ZMM3,%ZMM5,%ZMM3 |
(839) 0x52c5e9 VMULPS %ZMM2,%ZMM18,%ZMM2 |
(839) 0x52c5ef VFMADD213PS %ZMM1,%ZMM7,%ZMM2 |
(839) 0x52c5f5 VMULPS 0x1c0(%RSP),%ZMM4,%ZMM4 |
(839) 0x52c5fd VMULPS %ZMM1,%ZMM1,%ZMM1 |
(839) 0x52c603 VMULPS %ZMM2,%ZMM4,%ZMM2 |
(839) 0x52c609 MOV %RAX,%RDI |
(839) 0x52c60c SAL $0x4,%RDI |
(839) 0x52c610 SAL $0x6,%RAX |
(839) 0x52c614 VBROADCASTF64X4 (%R11,%RAX,1),%ZMM4 |
(839) 0x52c61b VMULPS %ZMM2,%ZMM1,%ZMM1 |
(839) 0x52c621 OR $0x8,%EDI |
(839) 0x52c624 MOVSXD %EDI,%RAX |
(839) 0x52c627 VADDPS 0x280(%RSP),%ZMM4,%ZMM2 |
(839) 0x52c62f VMULPS %ZMM2,%ZMM0,%ZMM2 |
(839) 0x52c635 VMULPS %ZMM2,%ZMM2,%ZMM2 |
(839) 0x52c63b VMULPS %ZMM2,%ZMM2,%ZMM4 |
(839) 0x52c641 VMULPS %ZMM4,%ZMM2,%ZMM2 |
(839) 0x52c647 VBROADCASTF64X4 (%R11,%RAX,4),%ZMM4 |
(839) 0x52c64e VMULPS 0x240(%RSP),%ZMM4,%ZMM4 |
(839) 0x52c656 VMULPS %ZMM2,%ZMM4,%ZMM4 |
(839) 0x52c65c VMULPS %ZMM4,%ZMM2,%ZMM2 |
(839) 0x52c662 VSUBPS %ZMM4,%ZMM2,%ZMM2 |
(839) 0x52c668 VADDPS %ZMM2,%ZMM3,%ZMM2 |
(839) 0x52c66e VMULPS %ZMM0,%ZMM0,%ZMM0 |
(839) 0x52c674 VMULPS %ZMM2,%ZMM0,%ZMM0 |
(839) 0x52c67a VMULPS %ZMM0,%ZMM25,%ZMM2 |
(839) 0x52c680 VMULPS %ZMM0,%ZMM26,%ZMM3 |
(839) 0x52c686 VMULPS %ZMM0,%ZMM27,%ZMM0 |
(839) 0x52c68c VMULPS %ZMM1,%ZMM6,%ZMM4 |
(839) 0x52c692 VMULPS %ZMM1,%ZMM24,%ZMM5 |
(839) 0x52c698 VMULPS %ZMM1,%ZMM28,%ZMM1 |
(839) 0x52c69e VADDPS %ZMM4,%ZMM22,%ZMM22 |
(839) 0x52c6a4 VADDPS %ZMM2,%ZMM23,%ZMM23 |
(839) 0x52c6aa VADDPS %ZMM2,%ZMM4,%ZMM2 |
(839) 0x52c6b0 VADDPS %ZMM3,%ZMM20,%ZMM20 |
(839) 0x52c6b6 VADDPS %ZMM5,%ZMM21,%ZMM21 |
(839) 0x52c6bc VADDPS %ZMM0,%ZMM16,%ZMM16 |
(839) 0x52c6c2 VADDPS %ZMM1,%ZMM19,%ZMM19 |
(839) 0x52c6c8 VADDPS %ZMM3,%ZMM5,%ZMM3 |
(839) 0x52c6ce VADDPS %ZMM0,%ZMM1,%ZMM0 |
(839) 0x52c6d4 VEXTRACTF64X4 $0x1,%ZMM2,%YMM1 |
(839) 0x52c6db VADDPS %YMM1,%YMM2,%YMM1 |
(839) 0x52c6df VMOVAPS (%R10,%RDX,4),%YMM2 |
(839) 0x52c6e5 VSUBPS %YMM1,%YMM2,%YMM1 |
(839) 0x52c6e9 VMOVAPS 0x20(%R10,%RDX,4),%YMM2 |
(839) 0x52c6f0 VMOVAPS 0x40(%R10,%RDX,4),%YMM4 |
(839) 0x52c6f7 VMOVAPS %YMM1,(%R10,%RDX,4) |
(839) 0x52c6fd VEXTRACTF64X4 $0x1,%ZMM3,%YMM1 |
(839) 0x52c704 VADDPS %YMM1,%YMM3,%YMM1 |
(839) 0x52c708 VSUBPS %YMM1,%YMM2,%YMM1 |
(839) 0x52c70c VMOVAPS %YMM1,0x20(%R10,%RDX,4) |
(839) 0x52c713 VEXTRACTF64X4 $0x1,%ZMM0,%YMM1 |
(839) 0x52c71a VADDPS %YMM1,%YMM0,%YMM0 |
(839) 0x52c71e VSUBPS %YMM0,%YMM4,%YMM0 |
(839) 0x52c722 VMOVAPS %YMM0,0x40(%R10,%RDX,4) |
(839) 0x52c729 INC %RCX |
(839) 0x52c72c CMP %RCX,%R13 |
(839) 0x52c72f JNE 52c330 |
(834) 0x52c735 JMP 52b4f0 |
0x52c73a NOPW (%RAX,%RAX,1) |
(834) 0x52c740 VXORPS %XMM19,%XMM19,%XMM19 |
(834) 0x52c746 VXORPS %XMM20,%XMM20,%XMM20 |
(834) 0x52c74c VXORPS %XMM21,%XMM21,%XMM21 |
(834) 0x52c752 VXORPS %XMM23,%XMM23,%XMM23 |
(834) 0x52c758 VXORPS %XMM22,%XMM22,%XMM22 |
(834) 0x52c75e CMP %R13D,%ECX |
(834) 0x52c761 MOV 0x30(%RSP),%RBX |
(834) 0x52c766 MOV 0x18(%RSP),%R15 |
(834) 0x52c76b JGE 52cec2 |
(834) 0x52c771 NOPW %CS:(%RAX,%RAX,1) |
(836) 0x52c780 MOV 0x80(%RBX),%RAX |
(836) 0x52c787 CMPL $-0x1,0x4(%RAX,%R8,8) |
(836) 0x52c78d JE 52cebf |
(836) 0x52c793 MOVSXD (%R14,%R8,8),%RCX |
(836) 0x52c797 LEA (,%RCX,8),%RAX |
(836) 0x52c79f LEA (%RAX,%RAX,2),%RAX |
(836) 0x52c7a3 VPBROADCASTD 0x4(%R14,%R8,8),%ZMM3 |
(836) 0x52c7ab VBROADCASTF64X4 (%RSI,%RAX,4),%ZMM0 |
(836) 0x52c7b2 MOVSXD %EAX,%RDX |
(836) 0x52c7b5 VBROADCASTF64X4 0x20(%RSI,%RDX,4),%ZMM1 |
(836) 0x52c7bd VBROADCASTF64X4 0x40(%RSI,%RDX,4),%ZMM4 |
(836) 0x52c7c5 VSUBPS %ZMM0,%ZMM30,%ZMM2 |
(836) 0x52c7cb VSUBPS %ZMM0,%ZMM31,%ZMM0 |
(836) 0x52c7d1 VMOVAPS 0x140(%RSP),%ZMM5 |
(836) 0x52c7d9 VSUBPS %ZMM1,%ZMM5,%ZMM6 |
(836) 0x52c7df VMOVAPS 0x100(%RSP),%ZMM5 |
(836) 0x52c7e7 VSUBPS %ZMM1,%ZMM5,%ZMM1 |
(836) 0x52c7ed VMOVAPS 0xc0(%RSP),%ZMM5 |
(836) 0x52c7f5 VSUBPS %ZMM4,%ZMM5,%ZMM7 |
(836) 0x52c7fb VMOVAPS 0x80(%RSP),%ZMM5 |
(836) 0x52c803 VSUBPS %ZMM4,%ZMM5,%ZMM8 |
(836) 0x52c809 VMULPS %ZMM2,%ZMM2,%ZMM4 |
(836) 0x52c80f VMULPS %ZMM6,%ZMM6,%ZMM5 |
(836) 0x52c815 VADDPS %ZMM5,%ZMM4,%ZMM4 |
(836) 0x52c81b VMULPS %ZMM7,%ZMM7,%ZMM5 |
(836) 0x52c821 VADDPS %ZMM5,%ZMM4,%ZMM4 |
(836) 0x52c827 VMULPS %ZMM0,%ZMM0,%ZMM5 |
(836) 0x52c82d VMULPS %ZMM1,%ZMM1,%ZMM9 |
(836) 0x52c833 VADDPS %ZMM9,%ZMM5,%ZMM5 |
(836) 0x52c839 VMULPS %ZMM8,%ZMM8,%ZMM9 |
(836) 0x52c83f VADDPS %ZMM9,%ZMM5,%ZMM5 |
(836) 0x52c845 VCMPPS $0x1,%ZMM17,%ZMM4,%K4 |
(836) 0x52c84c VCMPPS $0x1,%ZMM17,%ZMM5,%K5 |
(836) 0x52c853 VPTESTMD 0x340(%RSP),%ZMM3,%K4{%K4} |
(836) 0x52c85b VPTESTMD 0x300(%RSP),%ZMM3,%K5{%K5} |
(836) 0x52c863 VBROADCASTSS -0x1d0535(%RIP),%ZMM3 |
(836) 0x52c86d VMAXPS %ZMM3,%ZMM4,%ZMM4 |
(836) 0x52c873 VRSQRT14PS %ZMM4,%ZMM9 |
(836) 0x52c879 VMAXPS %ZMM3,%ZMM5,%ZMM3 |
(836) 0x52c87f VMULPS %ZMM9,%ZMM4,%ZMM4 |
(836) 0x52c885 VBROADCASTSS -0x1d0413(%RIP),%ZMM5 |
(836) 0x52c88f VBROADCASTSS -0x1d0745(%RIP),%ZMM10 |
(836) 0x52c899 VMULPS %ZMM5,%ZMM9,%ZMM11 |
(836) 0x52c89f VFMADD213PS %ZMM10,%ZMM9,%ZMM4 |
(836) 0x52c8a5 VRSQRT14PS %ZMM3,%ZMM9 |
(836) 0x52c8ab VMULPS %ZMM9,%ZMM3,%ZMM3 |
(836) 0x52c8b1 VMULPS %ZMM5,%ZMM9,%ZMM5 |
(836) 0x52c8b7 VFMADD213PS %ZMM10,%ZMM9,%ZMM3 |
(836) 0x52c8bd VMULPS %ZMM4,%ZMM11,%ZMM4{%K4}{z} |
(836) 0x52c8c3 VMULPS %ZMM3,%ZMM5,%ZMM3{%K5}{z} |
(836) 0x52c8c9 MOV %RCX,%RDX |
(836) 0x52c8cc SAL $0x4,%RDX |
(836) 0x52c8d0 SAL $0x6,%RCX |
(836) 0x52c8d4 VBROADCASTF64X4 (%R11,%RCX,1),%ZMM5 |
(836) 0x52c8db OR $0x8,%EDX |
(836) 0x52c8de MOVSXD %EDX,%RCX |
(836) 0x52c8e1 VBROADCASTF64X4 (%R11,%RCX,4),%ZMM9 |
(836) 0x52c8e8 VADDPS %ZMM5,%ZMM14,%ZMM10 |
(836) 0x52c8ee VADDPS %ZMM5,%ZMM24,%ZMM5 |
(836) 0x52c8f4 VMULPS %ZMM4,%ZMM10,%ZMM10 |
(836) 0x52c8fa VMULPS %ZMM3,%ZMM5,%ZMM5 |
(836) 0x52c900 VMULPS %ZMM10,%ZMM10,%ZMM10 |
(836) 0x52c906 VMULPS %ZMM5,%ZMM5,%ZMM5 |
(836) 0x52c90c VMULPS %ZMM10,%ZMM10,%ZMM11 |
(836) 0x52c912 VMULPS %ZMM11,%ZMM10,%ZMM10 |
(836) 0x52c918 VMULPS %ZMM5,%ZMM5,%ZMM11 |
(836) 0x52c91e VMULPS %ZMM11,%ZMM5,%ZMM5 |
(836) 0x52c924 VMULPS %ZMM9,%ZMM15,%ZMM11 |
(836) 0x52c92a VMULPS %ZMM10,%ZMM11,%ZMM11 |
(836) 0x52c930 VMULPS %ZMM11,%ZMM10,%ZMM10 |
(836) 0x52c936 VSUBPS %ZMM11,%ZMM10,%ZMM10 |
(836) 0x52c93c VMULPS %ZMM4,%ZMM4,%ZMM4 |
(836) 0x52c942 VMULPS %ZMM10,%ZMM4,%ZMM4 |
(836) 0x52c948 VMULPS %ZMM9,%ZMM25,%ZMM9 |
(836) 0x52c94e VMULPS %ZMM5,%ZMM9,%ZMM9 |
(836) 0x52c954 VMULPS %ZMM9,%ZMM5,%ZMM5 |
(836) 0x52c95a VSUBPS %ZMM9,%ZMM5,%ZMM5 |
(836) 0x52c960 VMULPS %ZMM3,%ZMM3,%ZMM3 |
(836) 0x52c966 VMULPS %ZMM5,%ZMM3,%ZMM3 |
(836) 0x52c96c VMULPS %ZMM4,%ZMM2,%ZMM2 |
(836) 0x52c972 VMULPS %ZMM4,%ZMM6,%ZMM5 |
(836) 0x52c978 VMULPS %ZMM4,%ZMM7,%ZMM4 |
(836) 0x52c97e VMULPS %ZMM3,%ZMM0,%ZMM0 |
(836) 0x52c984 VMULPS %ZMM3,%ZMM1,%ZMM1 |
(836) 0x52c98a VMULPS %ZMM3,%ZMM8,%ZMM3 |
(836) 0x52c990 VADDPS %ZMM2,%ZMM23,%ZMM23 |
(836) 0x52c996 VADDPS %ZMM0,%ZMM22,%ZMM22 |
(836) 0x52c99c VADDPS %ZMM0,%ZMM2,%ZMM0 |
(836) 0x52c9a2 VADDPS %ZMM5,%ZMM20,%ZMM20 |
(836) 0x52c9a8 VADDPS %ZMM1,%ZMM21,%ZMM21 |
(836) 0x52c9ae VADDPS %ZMM4,%ZMM16,%ZMM16 |
(836) 0x52c9b4 VADDPS %ZMM3,%ZMM19,%ZMM19 |
(836) 0x52c9ba VADDPS %ZMM1,%ZMM5,%ZMM1 |
(836) 0x52c9c0 VADDPS %ZMM3,%ZMM4,%ZMM2 |
(836) 0x52c9c6 VEXTRACTF64X4 $0x1,%ZMM0,%YMM3 |
(836) 0x52c9cd VADDPS %YMM3,%YMM0,%YMM0 |
(836) 0x52c9d1 VMOVAPS (%R10,%RAX,4),%YMM3 |
(836) 0x52c9d7 VSUBPS %YMM0,%YMM3,%YMM0 |
(836) 0x52c9db VMOVAPS 0x20(%R10,%RAX,4),%YMM3 |
(836) 0x52c9e2 VMOVAPS 0x40(%R10,%RAX,4),%YMM4 |
(836) 0x52c9e9 VMOVAPS %YMM0,(%R10,%RAX,4) |
(836) 0x52c9ef VEXTRACTF64X4 $0x1,%ZMM1,%YMM0 |
(836) 0x52c9f6 VADDPS %YMM0,%YMM1,%YMM0 |
(836) 0x52c9fa VSUBPS %YMM0,%YMM3,%YMM0 |
(836) 0x52c9fe VMOVAPS %YMM0,0x20(%R10,%RAX,4) |
(836) 0x52ca05 VEXTRACTF64X4 $0x1,%ZMM2,%YMM0 |
(836) 0x52ca0c VADDPS %YMM0,%YMM2,%YMM0 |
(836) 0x52ca10 VSUBPS %YMM0,%YMM4,%YMM0 |
(836) 0x52ca14 VMOVAPS %YMM0,0x40(%R10,%RAX,4) |
(836) 0x52ca1b INC %R8 |
(836) 0x52ca1e CMP %R8,%R13 |
(836) 0x52ca21 JNE 52c780 |
(834) 0x52ca27 JMP 52b4f0 |
(834) 0x52ca2c VXORPS %XMM19,%XMM19,%XMM19 |
(834) 0x52ca32 VXORPS %XMM20,%XMM20,%XMM20 |
(834) 0x52ca38 VXORPS %XMM21,%XMM21,%XMM21 |
(834) 0x52ca3e VXORPS %XMM23,%XMM23,%XMM23 |
(834) 0x52ca44 VXORPS %XMM22,%XMM22,%XMM22 |
(834) 0x52ca4a MOV 0x18(%RSP),%R15 |
(834) 0x52ca4f CMP %R13D,%ECX |
(834) 0x52ca52 JGE 52b4f0 |
(834) 0x52ca58 MOVSXD %ECX,%RCX |
(834) 0x52ca5b NOPL (%RAX,%RAX,1) |
(837) 0x52ca60 MOVSXD (%R14,%RCX,8),%RAX |
(837) 0x52ca64 LEA (,%RAX,8),%RDX |
(837) 0x52ca6c LEA (%RDX,%RDX,2),%RDX |
(837) 0x52ca70 VBROADCASTF64X4 (%RSI,%RDX,4),%ZMM0 |
(837) 0x52ca77 MOVSXD %EDX,%RDI |
(837) 0x52ca7a VBROADCASTF64X4 0x20(%RSI,%RDI,4),%ZMM1 |
(837) 0x52ca82 VBROADCASTF64X4 0x40(%RSI,%RDI,4),%ZMM2 |
(837) 0x52ca8a VSUBPS %ZMM0,%ZMM30,%ZMM26 |
(837) 0x52ca90 VSUBPS %ZMM0,%ZMM31,%ZMM6 |
(837) 0x52ca96 VMOVAPS 0x140(%RSP),%ZMM0 |
(837) 0x52ca9e VSUBPS %ZMM1,%ZMM0,%ZMM28 |
(837) 0x52caa4 VMOVAPS 0x100(%RSP),%ZMM0 |
(837) 0x52caac VSUBPS %ZMM1,%ZMM0,%ZMM27 |
(837) 0x52cab2 VMOVAPS 0xc0(%RSP),%ZMM0 |
(837) 0x52caba VSUBPS %ZMM2,%ZMM0,%ZMM30 |
(837) 0x52cac0 VMOVAPS 0x80(%RSP),%ZMM0 |
(837) 0x52cac8 VSUBPS %ZMM2,%ZMM0,%ZMM29 |
(837) 0x52cace VMULPS %ZMM26,%ZMM26,%ZMM0 |
(837) 0x52cad4 VMULPS %ZMM28,%ZMM28,%ZMM1 |
(837) 0x52cada VADDPS %ZMM1,%ZMM0,%ZMM0 |
(837) 0x52cae0 VMULPS %ZMM30,%ZMM30,%ZMM1 |
(837) 0x52cae6 VADDPS %ZMM1,%ZMM0,%ZMM0 |
(837) 0x52caec VMULPS %ZMM6,%ZMM6,%ZMM1 |
(837) 0x52caf2 VMULPS %ZMM27,%ZMM27,%ZMM2 |
(837) 0x52caf8 VADDPS %ZMM2,%ZMM1,%ZMM1 |
(837) 0x52cafe VMULPS %ZMM29,%ZMM29,%ZMM2 |
(837) 0x52cb04 VADDPS %ZMM2,%ZMM1,%ZMM1 |
(837) 0x52cb0a VCMPPS $0x1,%ZMM17,%ZMM0,%K5 |
(837) 0x52cb11 VCMPPS $0x1,%ZMM17,%ZMM1,%K4 |
(837) 0x52cb18 VBROADCASTSS -0x1d07ea(%RIP),%ZMM2 |
(837) 0x52cb22 VMAXPS %ZMM2,%ZMM0,%ZMM7 |
(837) 0x52cb28 VMAXPS %ZMM2,%ZMM1,%ZMM31 |
(837) 0x52cb2e VMOVAPS %ZMM7,%ZMM0{%K5}{z} |
(837) 0x52cb34 VMOVAPS %ZMM31,%ZMM3{%K4}{z} |
(837) 0x52cb3a VBROADCASTSS -0x1d0358(%RIP),%ZMM4 |
(837) 0x52cb44 VBROADCASTSS -0x1d04c2(%RIP),%ZMM2 |
(837) 0x52cb4e VMOVAPS 0x180(%RSP),%ZMM5 |
(837) 0x52cb56 VMULPS %ZMM0,%ZMM5,%ZMM1 |
(837) 0x52cb5c VMULPS %ZMM3,%ZMM5,%ZMM0 |
(837) 0x52cb62 VMOVAPS %ZMM2,%ZMM8 |
(837) 0x52cb68 VBROADCASTSS -0x1d073a(%RIP),%ZMM3 |
(837) 0x52cb72 VBROADCASTSS -0x1d0874(%RIP),%ZMM9 |
(837) 0x52cb7c VMULPS %ZMM1,%ZMM1,%ZMM5 |
(837) 0x52cb82 VFMADD213PS %ZMM4,%ZMM5,%ZMM8 |
(837) 0x52cb88 VMOVAPS %ZMM9,%ZMM10 |
(837) 0x52cb8e VBROADCASTSS -0x1d0a0c(%RIP),%ZMM11 |
(837) 0x52cb98 VBROADCASTSS -0x1d08e2(%RIP),%ZMM12 |
(837) 0x52cba2 VFMADD213PS %ZMM3,%ZMM5,%ZMM10 |
(837) 0x52cba8 VBROADCASTSS -0x1d060a(%RIP),%ZMM13 |
(837) 0x52cbb2 VMOVAPS %ZMM13,%ZMM14 |
(837) 0x52cbb8 VFMADD213PS %ZMM12,%ZMM5,%ZMM14 |
(837) 0x52cbbe VBROADCASTSS -0x1d05dc(%RIP),%ZMM15 |
(837) 0x52cbc8 VFMADD213PS %ZMM11,%ZMM5,%ZMM8 |
(837) 0x52cbce VMULPS %ZMM0,%ZMM0,%ZMM17 |
(837) 0x52cbd4 VFMADD213PS %ZMM4,%ZMM17,%ZMM2 |
(837) 0x52cbda VBROADCASTSS -0x1d047c(%RIP),%ZMM4 |
(837) 0x52cbe4 VFMADD213PS %ZMM3,%ZMM17,%ZMM9 |
(837) 0x52cbea VMOVAPS %ZMM4,%ZMM3 |
(837) 0x52cbf0 VFMADD213PS %ZMM11,%ZMM17,%ZMM2 |
(837) 0x52cbf6 VBROADCASTSS -0x1d09b4(%RIP),%ZMM11 |
(837) 0x52cc00 VFMADD213PS %ZMM12,%ZMM17,%ZMM13 |
(837) 0x52cc06 VBROADCASTSS -0x1d09f8(%RIP),%ZMM12 |
(837) 0x52cc10 VFMADD213PS %ZMM15,%ZMM5,%ZMM3 |
(837) 0x52cc16 VFMADD213PS %ZMM11,%ZMM5,%ZMM14 |
(837) 0x52cc1c VFMADD213PS %ZMM12,%ZMM5,%ZMM3 |
(837) 0x52cc22 VFMADD213PS %ZMM15,%ZMM17,%ZMM4 |
(837) 0x52cc28 VBROADCASTSS -0x1d074a(%RIP),%ZMM15 |
(837) 0x52cc32 VFMADD213PS %ZMM15,%ZMM5,%ZMM14 |
(837) 0x52cc38 VFMADD213PS %ZMM11,%ZMM17,%ZMM13 |
(837) 0x52cc3e VFMADD213PS %ZMM12,%ZMM17,%ZMM4 |
(837) 0x52cc44 VRSQRT14PS %ZMM7,%ZMM5 |
(837) 0x52cc4a VFMADD213PS %ZMM15,%ZMM17,%ZMM13 |
(837) 0x52cc50 VMOVAPS 0x380(%RSP),%ZMM17 |
(837) 0x52cc58 VBROADCASTSS -0x1d0b0e(%RIP),%ZMM11 |
(837) 0x52cc62 VRSQRT14PS %ZMM31,%ZMM12 |
(837) 0x52cc68 VMULPS %ZMM5,%ZMM7,%ZMM7 |
(837) 0x52cc6e VFMADD213PS %ZMM11,%ZMM5,%ZMM7 |
(837) 0x52cc74 VMULPS %ZMM12,%ZMM31,%ZMM15 |
(837) 0x52cc7a VMOVAPS 0x3c0(%RSP),%ZMM31 |
(837) 0x52cc82 VFMADD213PS %ZMM11,%ZMM12,%ZMM15 |
(837) 0x52cc88 VBROADCASTSS -0x1d0816(%RIP),%ZMM11 |
(837) 0x52cc92 VMULPS %ZMM11,%ZMM5,%ZMM5 |
(837) 0x52cc98 VMULPS %ZMM11,%ZMM12,%ZMM11 |
(837) 0x52cc9e VMULPS %ZMM7,%ZMM5,%ZMM5{%K5}{z} |
(837) 0x52cca4 VFMADD231PS %ZMM10,%ZMM1,%ZMM8 |
(837) 0x52ccaa VRCP14PS %ZMM8,%ZMM7 |
(837) 0x52ccb0 VMULPS %ZMM15,%ZMM11,%ZMM10{%K4}{z} |
(837) 0x52ccb6 VFMADD231PS %ZMM3,%ZMM1,%ZMM14 |
(837) 0x52ccbc VBROADCASTSS -0x1d0786(%RIP),%ZMM3 |
(837) 0x52ccc6 VFNMADD213PS %ZMM3,%ZMM7,%ZMM8 |
(837) 0x52cccc VMULPS %ZMM8,%ZMM7,%ZMM7 |
(837) 0x52ccd2 VFMADD231PS %ZMM9,%ZMM0,%ZMM2 |
(837) 0x52ccd8 VRCP14PS %ZMM2,%ZMM8 |
(837) 0x52ccde VFNMADD213PS %ZMM3,%ZMM8,%ZMM2 |
(837) 0x52cce4 VMULPS %ZMM7,%ZMM14,%ZMM3 |
(837) 0x52ccea VMULPS %ZMM2,%ZMM8,%ZMM2 |
(837) 0x52ccf0 MOV %RAX,%RDI |
(837) 0x52ccf3 VFMADD231PS %ZMM4,%ZMM0,%ZMM13 |
(837) 0x52ccf9 MOV %RAX,%R8 |
(837) 0x52ccfc SAL $0x6,%RAX |
(837) 0x52cd00 VBROADCASTF64X4 (%R11,%RAX,1),%ZMM4 |
(837) 0x52cd07 SAL $0x5,%RDI |
(837) 0x52cd0b VMULPS %ZMM3,%ZMM18,%ZMM3 |
(837) 0x52cd11 VMULPS %ZMM2,%ZMM13,%ZMM2 |
(837) 0x52cd17 VADDPS 0x280(%RSP),%ZMM4,%ZMM7 |
(837) 0x52cd1f VMULPS %ZMM7,%ZMM5,%ZMM7 |
(837) 0x52cd25 VMULPS %ZMM7,%ZMM7,%ZMM7 |
(837) 0x52cd2b VFMADD213PS %ZMM5,%ZMM1,%ZMM3 |
(837) 0x52cd31 VMULPS %ZMM7,%ZMM7,%ZMM1 |
(837) 0x52cd37 VMULPS %ZMM1,%ZMM7,%ZMM1 |
(837) 0x52cd3d MOV 0x20(%RSP),%RAX |
(837) 0x52cd42 VBROADCASTF64X4 (%RAX,%RDI,1),%ZMM7 |
(837) 0x52cd49 VMULPS %ZMM2,%ZMM18,%ZMM2 |
(837) 0x52cd4f VFMADD213PS %ZMM10,%ZMM0,%ZMM2 |
(837) 0x52cd55 VMULPS 0x200(%RSP),%ZMM7,%ZMM0 |
(837) 0x52cd5d VMULPS 0x1c0(%RSP),%ZMM7,%ZMM7 |
(837) 0x52cd65 SAL $0x4,%R8 |
(837) 0x52cd69 OR $0x8,%R8D |
(837) 0x52cd6d MOVSXD %R8D,%RAX |
(837) 0x52cd70 VMULPS %ZMM3,%ZMM0,%ZMM0 |
(837) 0x52cd76 VBROADCASTF64X4 (%R11,%RAX,4),%ZMM3 |
(837) 0x52cd7d VADDPS %ZMM4,%ZMM24,%ZMM4 |
(837) 0x52cd83 VMULPS %ZMM4,%ZMM10,%ZMM4 |
(837) 0x52cd89 VMULPS %ZMM4,%ZMM4,%ZMM4 |
(837) 0x52cd8f VMULPS %ZMM2,%ZMM7,%ZMM2 |
(837) 0x52cd95 VMULPS %ZMM4,%ZMM4,%ZMM7 |
(837) 0x52cd9b VMULPS %ZMM7,%ZMM4,%ZMM4 |
(837) 0x52cda1 VMULPS 0x240(%RSP),%ZMM3,%ZMM7 |
(837) 0x52cda9 VMULPS %ZMM1,%ZMM7,%ZMM7 |
(837) 0x52cdaf VMULPS %ZMM7,%ZMM1,%ZMM1 |
(837) 0x52cdb5 VSUBPS %ZMM7,%ZMM1,%ZMM1 |
(837) 0x52cdbb VADDPS %ZMM1,%ZMM0,%ZMM0 |
(837) 0x52cdc1 VMULPS %ZMM5,%ZMM5,%ZMM1 |
(837) 0x52cdc7 VMULPS %ZMM0,%ZMM1,%ZMM0 |
(837) 0x52cdcd VMULPS %ZMM3,%ZMM25,%ZMM1 |
(837) 0x52cdd3 VMULPS %ZMM4,%ZMM1,%ZMM1 |
(837) 0x52cdd9 VMULPS %ZMM1,%ZMM4,%ZMM3 |
(837) 0x52cddf VSUBPS %ZMM1,%ZMM3,%ZMM1 |
(837) 0x52cde5 VADDPS %ZMM1,%ZMM2,%ZMM1 |
(837) 0x52cdeb VMULPS %ZMM10,%ZMM10,%ZMM2 |
(837) 0x52cdf1 VMULPS %ZMM1,%ZMM2,%ZMM1 |
(837) 0x52cdf7 VMULPS %ZMM0,%ZMM26,%ZMM2 |
(837) 0x52cdfd VMULPS %ZMM0,%ZMM28,%ZMM3 |
(837) 0x52ce03 VMULPS %ZMM0,%ZMM30,%ZMM0 |
(837) 0x52ce09 VMOVAPS 0x400(%RSP),%ZMM30 |
(837) 0x52ce11 VMULPS %ZMM1,%ZMM6,%ZMM4 |
(837) 0x52ce17 VMULPS %ZMM1,%ZMM27,%ZMM5 |
(837) 0x52ce1d VMULPS %ZMM1,%ZMM29,%ZMM1 |
(837) 0x52ce23 VADDPS %ZMM2,%ZMM23,%ZMM23 |
(837) 0x52ce29 VADDPS %ZMM4,%ZMM22,%ZMM22 |
(837) 0x52ce2f VADDPS %ZMM4,%ZMM2,%ZMM2 |
(837) 0x52ce35 VADDPS %ZMM3,%ZMM20,%ZMM20 |
(837) 0x52ce3b VADDPS %ZMM5,%ZMM21,%ZMM21 |
(837) 0x52ce41 VADDPS %ZMM0,%ZMM16,%ZMM16 |
(837) 0x52ce47 VADDPS %ZMM1,%ZMM19,%ZMM19 |
(837) 0x52ce4d VADDPS %ZMM5,%ZMM3,%ZMM3 |
(837) 0x52ce53 VADDPS %ZMM1,%ZMM0,%ZMM0 |
(837) 0x52ce59 VEXTRACTF64X4 $0x1,%ZMM2,%YMM1 |
(837) 0x52ce60 VADDPS %YMM1,%YMM2,%YMM1 |
(837) 0x52ce64 VMOVAPS (%R10,%RDX,4),%YMM2 |
(837) 0x52ce6a VSUBPS %YMM1,%YMM2,%YMM1 |
(837) 0x52ce6e VMOVAPS 0x20(%R10,%RDX,4),%YMM2 |
(837) 0x52ce75 VMOVAPS 0x40(%R10,%RDX,4),%YMM4 |
(837) 0x52ce7c VMOVAPS %YMM1,(%R10,%RDX,4) |
(837) 0x52ce82 VEXTRACTF64X4 $0x1,%ZMM3,%YMM1 |
(837) 0x52ce89 VADDPS %YMM1,%YMM3,%YMM1 |
(837) 0x52ce8d VSUBPS %YMM1,%YMM2,%YMM1 |
(837) 0x52ce91 VMOVAPS %YMM1,0x20(%R10,%RDX,4) |
(837) 0x52ce98 VEXTRACTF64X4 $0x1,%ZMM0,%YMM1 |
(837) 0x52ce9f VADDPS %YMM1,%YMM0,%YMM0 |
(837) 0x52cea3 VSUBPS %YMM0,%YMM4,%YMM0 |
(837) 0x52cea7 VMOVAPS %YMM0,0x40(%R10,%RDX,4) |
(837) 0x52ceae INC %RCX |
(837) 0x52ceb1 CMP %RCX,%R13 |
(837) 0x52ceb4 JNE 52ca60 |
(834) 0x52ceba JMP 52b4f0 |
(834) 0x52cebf MOV %R8D,%ECX |
(834) 0x52cec2 CMP %R13D,%ECX |
(834) 0x52cec5 JGE 52b4f0 |
(834) 0x52cecb MOVSXD %ECX,%RAX |
(834) 0x52cece XCHG %AX,%AX |
(835) 0x52ced0 MOVSXD (%R14,%RAX,8),%RDX |
(835) 0x52ced4 LEA (,%RDX,8),%RCX |
(835) 0x52cedc LEA (%RCX,%RCX,2),%RCX |
(835) 0x52cee0 VBROADCASTF64X4 (%RSI,%RCX,4),%ZMM1 |
(835) 0x52cee7 MOVSXD %ECX,%RDI |
(835) 0x52ceea VBROADCASTF64X4 0x20(%RSI,%RDI,4),%ZMM3 |
(835) 0x52cef2 VBROADCASTF64X4 0x40(%RSI,%RDI,4),%ZMM4 |
(835) 0x52cefa VSUBPS %ZMM1,%ZMM30,%ZMM0 |
(835) 0x52cf00 VSUBPS %ZMM1,%ZMM31,%ZMM1 |
(835) 0x52cf06 VMOVAPS 0x140(%RSP),%ZMM2 |
(835) 0x52cf0e VSUBPS %ZMM3,%ZMM2,%ZMM2 |
(835) 0x52cf14 VMOVAPS 0x100(%RSP),%ZMM5 |
(835) 0x52cf1c VSUBPS %ZMM3,%ZMM5,%ZMM6 |
(835) 0x52cf22 VMOVAPS 0xc0(%RSP),%ZMM3 |
(835) 0x52cf2a VSUBPS %ZMM4,%ZMM3,%ZMM7 |
(835) 0x52cf30 VMOVAPS 0x80(%RSP),%ZMM3 |
(835) 0x52cf38 VSUBPS %ZMM4,%ZMM3,%ZMM8 |
(835) 0x52cf3e VMULPS %ZMM0,%ZMM0,%ZMM3 |
(835) 0x52cf44 VMULPS %ZMM2,%ZMM2,%ZMM4 |
(835) 0x52cf4a VADDPS %ZMM4,%ZMM3,%ZMM3 |
(835) 0x52cf50 VMULPS %ZMM7,%ZMM7,%ZMM4 |
(835) 0x52cf56 VMULPS %ZMM1,%ZMM1,%ZMM5 |
(835) 0x52cf5c VADDPS %ZMM4,%ZMM3,%ZMM3 |
(835) 0x52cf62 VMULPS %ZMM6,%ZMM6,%ZMM4 |
(835) 0x52cf68 VADDPS %ZMM4,%ZMM5,%ZMM4 |
(835) 0x52cf6e VMULPS %ZMM8,%ZMM8,%ZMM5 |
(835) 0x52cf74 VADDPS %ZMM5,%ZMM4,%ZMM4 |
(835) 0x52cf7a VCMPPS $0x1,%ZMM17,%ZMM3,%K5 |
(835) 0x52cf81 VCMPPS $0x1,%ZMM17,%ZMM4,%K4 |
(835) 0x52cf88 VBROADCASTSS -0x1d0c5a(%RIP),%ZMM5 |
(835) 0x52cf92 VMAXPS %ZMM5,%ZMM3,%ZMM3 |
(835) 0x52cf98 VRSQRT14PS %ZMM3,%ZMM9 |
(835) 0x52cf9e VMAXPS %ZMM5,%ZMM4,%ZMM4 |
(835) 0x52cfa4 VBROADCASTSS -0x1d0b32(%RIP),%ZMM5 |
(835) 0x52cfae VBROADCASTSS -0x1d0e64(%RIP),%ZMM10 |
(835) 0x52cfb8 VMULPS %ZMM9,%ZMM3,%ZMM3 |
(835) 0x52cfbe VMULPS %ZMM5,%ZMM9,%ZMM11 |
(835) 0x52cfc4 VRSQRT14PS %ZMM4,%ZMM12 |
(835) 0x52cfca VMULPS %ZMM12,%ZMM4,%ZMM4 |
(835) 0x52cfd0 VFMADD213PS %ZMM10,%ZMM9,%ZMM3 |
(835) 0x52cfd6 VMULPS %ZMM5,%ZMM12,%ZMM5 |
(835) 0x52cfdc VFMADD213PS %ZMM10,%ZMM12,%ZMM4 |
(835) 0x52cfe2 MOV %RDX,%RDI |
(835) 0x52cfe5 SAL $0x6,%RDX |
(835) 0x52cfe9 VBROADCASTF64X4 (%R11,%RDX,1),%ZMM9 |
(835) 0x52cff0 VMULPS %ZMM3,%ZMM11,%ZMM3{%K5}{z} |
(835) 0x52cff6 SAL $0x4,%RDI |
(835) 0x52cffa OR $0x8,%EDI |
(835) 0x52cffd MOVSXD %EDI,%RDX |
(835) 0x52d000 VBROADCASTF64X4 (%R11,%RDX,4),%ZMM10 |
(835) 0x52d007 VMULPS %ZMM4,%ZMM5,%ZMM4{%K4}{z} |
(835) 0x52d00d VMULPS %ZMM3,%ZMM3,%ZMM5 |
(835) 0x52d013 VADDPS %ZMM9,%ZMM14,%ZMM11 |
(835) 0x52d019 VADDPS %ZMM9,%ZMM24,%ZMM9 |
(835) 0x52d01f VMULPS %ZMM10,%ZMM15,%ZMM12 |
(835) 0x52d025 VMULPS %ZMM10,%ZMM25,%ZMM10 |
(835) 0x52d02b VMULPS %ZMM11,%ZMM3,%ZMM3 |
(835) 0x52d031 VMULPS %ZMM9,%ZMM4,%ZMM9 |
(835) 0x52d037 VMULPS %ZMM3,%ZMM3,%ZMM3 |
(835) 0x52d03d VMULPS %ZMM9,%ZMM9,%ZMM9 |
(835) 0x52d043 VMULPS %ZMM3,%ZMM3,%ZMM11 |
(835) 0x52d049 VMULPS %ZMM9,%ZMM9,%ZMM13 |
(835) 0x52d04f VMULPS %ZMM11,%ZMM3,%ZMM3 |
(835) 0x52d055 VMULPS %ZMM13,%ZMM9,%ZMM9 |
(835) 0x52d05b VMULPS %ZMM3,%ZMM12,%ZMM11 |
(835) 0x52d061 VMULPS %ZMM9,%ZMM10,%ZMM10 |
(835) 0x52d067 VMULPS %ZMM11,%ZMM3,%ZMM3 |
(835) 0x52d06d VMULPS %ZMM10,%ZMM9,%ZMM9 |
(835) 0x52d073 VMULPS %ZMM4,%ZMM4,%ZMM4 |
(835) 0x52d079 VSUBPS %ZMM11,%ZMM3,%ZMM3 |
(835) 0x52d07f VMULPS %ZMM3,%ZMM5,%ZMM3 |
(835) 0x52d085 VSUBPS %ZMM10,%ZMM9,%ZMM5 |
(835) 0x52d08b VMULPS %ZMM5,%ZMM4,%ZMM4 |
(835) 0x52d091 VMULPS %ZMM3,%ZMM0,%ZMM0 |
(835) 0x52d097 VMULPS %ZMM4,%ZMM1,%ZMM1 |
(835) 0x52d09d VMULPS %ZMM3,%ZMM2,%ZMM2 |
(835) 0x52d0a3 VMULPS %ZMM4,%ZMM6,%ZMM5 |
(835) 0x52d0a9 VMULPS %ZMM3,%ZMM7,%ZMM3 |
(835) 0x52d0af VMULPS %ZMM4,%ZMM8,%ZMM4 |
(835) 0x52d0b5 VADDPS %ZMM0,%ZMM23,%ZMM23 |
(835) 0x52d0bb VADDPS %ZMM1,%ZMM22,%ZMM22 |
(835) 0x52d0c1 VADDPS %ZMM2,%ZMM20,%ZMM20 |
(835) 0x52d0c7 VADDPS %ZMM5,%ZMM21,%ZMM21 |
(835) 0x52d0cd VADDPS %ZMM3,%ZMM16,%ZMM16 |
(835) 0x52d0d3 VADDPS %ZMM4,%ZMM19,%ZMM19 |
(835) 0x52d0d9 VADDPS %ZMM1,%ZMM0,%ZMM0 |
(835) 0x52d0df VADDPS %ZMM5,%ZMM2,%ZMM1 |
(835) 0x52d0e5 VADDPS %ZMM4,%ZMM3,%ZMM2 |
(835) 0x52d0eb VEXTRACTF64X4 $0x1,%ZMM0,%YMM3 |
(835) 0x52d0f2 VADDPS %YMM3,%YMM0,%YMM0 |
(835) 0x52d0f6 VMOVAPS (%R10,%RCX,4),%YMM3 |
(835) 0x52d0fc VSUBPS %YMM0,%YMM3,%YMM0 |
(835) 0x52d100 VMOVAPS 0x20(%R10,%RCX,4),%YMM3 |
(835) 0x52d107 VMOVAPS 0x40(%R10,%RCX,4),%YMM4 |
(835) 0x52d10e VMOVAPS %YMM0,(%R10,%RCX,4) |
(835) 0x52d114 VEXTRACTF64X4 $0x1,%ZMM1,%YMM0 |
(835) 0x52d11b VADDPS %YMM0,%YMM1,%YMM0 |
(835) 0x52d11f VSUBPS %YMM0,%YMM3,%YMM0 |
(835) 0x52d123 VEXTRACTF64X4 $0x1,%ZMM2,%YMM1 |
(835) 0x52d12a VMOVAPS %YMM0,0x20(%R10,%RCX,4) |
(835) 0x52d131 VADDPS %YMM1,%YMM2,%YMM0 |
(835) 0x52d135 VSUBPS %YMM0,%YMM4,%YMM0 |
(835) 0x52d139 VMOVAPS %YMM0,0x40(%R10,%RCX,4) |
(835) 0x52d140 INC %RAX |
(835) 0x52d143 CMP %RAX,%R13 |
(835) 0x52d146 JNE 52ced0 |
(834) 0x52d14c JMP 52b4f0 |
0x52d151 LEA -0x28(%RBP),%RSP |
0x52d155 POP %RBX |
0x52d156 POP %R12 |
0x52d158 POP %R13 |
0x52d15a POP %R14 |
0x52d15c POP %R15 |
0x52d15e POP %RBP |
0x52d15f VZEROUPPER |
0x52d162 RET |
0x52d163 INT $0x3 |
0x52d164 INT $0x3 |
0x52d165 INT $0x3 |
0x52d166 INT $0x3 |
0x52d167 INT $0x3 |
0x52d168 INT $0x3 |
0x52d169 INT $0x3 |
0x52d16a INT $0x3 |
0x52d16b INT $0x3 |
0x52d16c INT $0x3 |
0x52d16d INT $0x3 |
0x52d16e INT $0x3 |
0x52d16f INT $0x3 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►99.99+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1936 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►89.79+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1936 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 | |
►10.20+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1974 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►79.85+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1936 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 | |
►20.15+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1974 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►47.99+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1936 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 | |
►27.57+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1974 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 | |
►7.27+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1936 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
►6.91+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1936 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
►5.32+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1974 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
►4.93+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1974 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►52.71+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1936 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 | |
►28.84+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1974 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 | |
►7.49+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1936 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
►4.56+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1974 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
►4.01+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1936 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
►2.38+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1974 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►48.79+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1936 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 | |
►31.45+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1974 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 | |
►9.30+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1936 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
►5.24+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1974 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
►3.16+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1936 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
►2.07+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1974 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►53.71+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1974 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 | |
►43.96+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1936 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 | |
►1.18+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1974 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
►1.15+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1936 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►42.34+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1974 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 | |
►40.71+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1936 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 | |
►4.44+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1974 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
►4.17+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1936 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
►2.95+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1936 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
►2.89+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1974 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
►1.28+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1936 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
►1.22+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1974 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►59.87+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1974 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 | |
►40.13+ | .omp_outlined.#0x5f8c30 | kerneldispatch.cpp:305 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | nonbonded_verlet_t::dispatchNo[...] | kerneldispatch.cpp:272 | libgromacs_mpi.so.9.0.0 |
○ | do_nb_verlet(t_forcerec*, inte[...] | sim_util.cpp:455 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:1936 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 |
Path / |
The code analyzed by CQA in that panel excludes loops and represents 0.00% of application time for run 1x1
Source file and lines | simd_kernel.h:121-564 |
Module | libgromacs_mpi.so.9.0.0 |
nb instructions | 83 |
nb uops | 70 |
loop length | 380 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 0 |
used zmm registers | 5 |
nb stack references | 13 |
ADD-SUB / MUL ratio | 1.50 |
micro-operation queue | 11.67 cycles |
front end | 11.67 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 1.50 | 1.50 | 1.25 | 1.25 | 1.50 | 10.00 | 10.00 | 10.00 | 4.00 | 4.50 | 4.00 | 1.50 | 6.50 | 6.50 |
cycles | 1.50 | 1.50 | 1.25 | 1.25 | 1.50 | 11.00 | 11.00 | 11.00 | 4.00 | 4.50 | 5.50 | 3.00 | 6.50 | 6.50 |
Cycles executing div or sqrt instructions | NA |
Front-end | 11.67 |
Dispatch | 11.00 |
Overall L1 | 11.67 |
all | 11% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 100% |
all | 66% |
load | 37% |
store | 100% |
mul | 0% |
add-sub | 100% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 50% |
all | 52% |
load | 27% |
store | 58% |
mul | 0% |
add-sub | 100% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 54% |
all | 13% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 25% |
all | 63% |
load | 42% |
store | 89% |
mul | 6% |
add-sub | 100% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 45% |
all | 51% |
load | 34% |
store | 57% |
mul | 6% |
add-sub | 100% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 43% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput | Vectorization |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
AND $-0x40,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
SUB $0x580,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RCX,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
MOV 0x50(%RDI),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV 0x58(%RBX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RAX,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
CMP %RAX,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
JE 52d151 <_ZN3gmx15nbnxmKernelSimdIL12KernelLayout1ELNS_17KernelCoulombTypeE1EL14VdwCutoffCheck0EL17LJCombinationRule1EL20InteractionModifiers1EL7LJEwald0EL12EnergyOutput0EEEvPK16NbnxnPairlistCpuPK16nbnxn_atomdata_tPK19interaction_const_tPA3_KfP23nbnxn_atomdata_output_t+0x1da1> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV 0x8(%R8),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
MOV 0x28(%R8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RAX,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV 0x90(%RSI),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
MOV 0xb0(%RSI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RAX,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV 0x168(%RSI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
VMOVAPS (%RAX),%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | vect (100.0%) |
VXORPS %XMM2,%XMM2,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | vect (25.0%) |
VCMPPS $0x1,%ZMM0,%ZMM2,%K0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 1 | vect (100.0%) |
VBROADCASTSS -0x1cf300(%RIP),%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 5 | 1 | scal (6.3%) |
VADDPS %ZMM1,%ZMM0,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 1 | vect (100.0%) |
VCMPPS $0x1,%ZMM0,%ZMM2,%K1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 1 | vect (100.0%) |
VADDPS %ZMM1,%ZMM0,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 1 | vect (100.0%) |
VCMPPS $0x1,%ZMM0,%ZMM2,%K2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 1 | vect (100.0%) |
VADDPS %ZMM1,%ZMM0,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 1 | vect (100.0%) |
MOV 0x180(%RSI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
VMOVAPS (%RAX),%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | vect (100.0%) |
VMOVAPS %ZMM1,0x340(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 1 | 1 | 5 | 2 | vect (100.0%) |
VCMPPS $0x1,%ZMM0,%ZMM2,%K3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 1 | vect (100.0%) |
VMOVAPS 0x40(%RAX),%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | vect (100.0%) |
VMOVAPS %ZMM0,0x300(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 1 | 1 | 5 | 2 | vect (100.0%) |
VBROADCASTSS 0x54(%RDX),%ZMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 5 | 1 | scal (6.3%) |
VMULSS %XMM18,%XMM18,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 | scal (6.3%) |
VBROADCASTSS %XMM0,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 1 | scal (6.3%) |
VMOVAPS %ZMM0,0x180(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 1 | 1 | 5 | 2 | vect (100.0%) |
VMOVSS 0x4c(%RDX),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VMULSS %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 | scal (6.3%) |
VBROADCASTSS %XMM0,%ZMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 1 | scal (6.3%) |
MOV 0x138(%RSI),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV 0x80(%RBX),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
VBROADCASTSS 0x6c(%RDX),%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 5 | 1 | scal (6.3%) |
VMOVAPS %ZMM0,0x480(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 1 | 1 | 5 | 2 | vect (100.0%) |
VMOVDDUP -0x1ce962(%RIP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (12.5%) |
VMOVAPS %XMM0,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (25.0%) |
VMOVAPS %ZMM18,0x440(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 1 | 1 | 5 | 2 | vect (100.0%) |
VMOVAPS %ZMM17,0x380(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 1 | 1 | 5 | 2 | vect (100.0%) |
MOV %RBX,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
JMP 52b63a <_ZN3gmx15nbnxmKernelSimdIL12KernelLayout1ELNS_17KernelCoulombTypeE1EL14VdwCutoffCheck0EL17LJCombinationRule1EL20InteractionModifiers1EL7LJEwald0EL12EnergyOutput0EEEvPK16NbnxnPairlistCpuPK16nbnxn_atomdata_tPK19interaction_const_tPA3_KfP23nbnxn_atomdata_output_t+0x28a> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
LEA -0x28(%RBP),%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | vect (25.0%) |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
INT $0x3 | N/A | |||||||||||||||||
INT $0x3 | N/A | |||||||||||||||||
INT $0x3 | N/A | |||||||||||||||||
INT $0x3 | N/A | |||||||||||||||||
INT $0x3 | N/A | |||||||||||||||||
INT $0x3 | N/A | |||||||||||||||||
INT $0x3 | N/A | |||||||||||||||||
INT $0x3 | N/A | |||||||||||||||||
INT $0x3 | N/A | |||||||||||||||||
INT $0x3 | N/A | |||||||||||||||||
INT $0x3 | N/A | |||||||||||||||||
INT $0x3 | N/A | |||||||||||||||||
INT $0x3 | N/A |
The code analyzed by CQA in that panel excludes loops and represents 0.00% of application time for run 1x1
Source file and lines | simd_kernel.h:121-564 |
Module | libgromacs_mpi.so.9.0.0 |
nb instructions | 83 |
nb uops | 70 |
loop length | 380 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 0 |
used zmm registers | 5 |
nb stack references | 13 |
ADD-SUB / MUL ratio | 1.50 |
micro-operation queue | 11.67 cycles |
front end | 11.67 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 1.50 | 1.50 | 1.25 | 1.25 | 1.50 | 10.00 | 10.00 | 10.00 | 4.00 | 4.50 | 4.00 | 1.50 | 6.50 | 6.50 |
cycles | 1.50 | 1.50 | 1.25 | 1.25 | 1.50 | 11.00 | 11.00 | 11.00 | 4.00 | 4.50 | 5.50 | 3.00 | 6.50 | 6.50 |
Cycles executing div or sqrt instructions | NA |
Front-end | 11.67 |
Dispatch | 11.00 |
Overall L1 | 11.67 |
all | 11% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 100% |
all | 66% |
load | 37% |
store | 100% |
mul | 0% |
add-sub | 100% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 50% |
all | 52% |
load | 27% |
store | 58% |
mul | 0% |
add-sub | 100% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 54% |
all | 13% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 25% |
all | 63% |
load | 42% |
store | 89% |
mul | 6% |
add-sub | 100% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 45% |
all | 51% |
load | 34% |
store | 57% |
mul | 6% |
add-sub | 100% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 43% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput | Vectorization |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
AND $-0x40,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
SUB $0x580,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RCX,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
MOV 0x50(%RDI),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV 0x58(%RBX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RAX,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
CMP %RAX,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
JE 52d151 <_ZN3gmx15nbnxmKernelSimdIL12KernelLayout1ELNS_17KernelCoulombTypeE1EL14VdwCutoffCheck0EL17LJCombinationRule1EL20InteractionModifiers1EL7LJEwald0EL12EnergyOutput0EEEvPK16NbnxnPairlistCpuPK16nbnxn_atomdata_tPK19interaction_const_tPA3_KfP23nbnxn_atomdata_output_t+0x1da1> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
MOV 0x8(%R8),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
MOV 0x28(%R8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RAX,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV 0x90(%RSI),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
MOV 0xb0(%RSI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RAX,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV 0x168(%RSI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
VMOVAPS (%RAX),%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | vect (100.0%) |
VXORPS %XMM2,%XMM2,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | vect (25.0%) |
VCMPPS $0x1,%ZMM0,%ZMM2,%K0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 1 | vect (100.0%) |
VBROADCASTSS -0x1cf300(%RIP),%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 5 | 1 | scal (6.3%) |
VADDPS %ZMM1,%ZMM0,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 1 | vect (100.0%) |
VCMPPS $0x1,%ZMM0,%ZMM2,%K1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 1 | vect (100.0%) |
VADDPS %ZMM1,%ZMM0,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 1 | vect (100.0%) |
VCMPPS $0x1,%ZMM0,%ZMM2,%K2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 1 | vect (100.0%) |
VADDPS %ZMM1,%ZMM0,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 1 | vect (100.0%) |
MOV 0x180(%RSI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
VMOVAPS (%RAX),%ZMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | vect (100.0%) |
VMOVAPS %ZMM1,0x340(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 1 | 1 | 5 | 2 | vect (100.0%) |
VCMPPS $0x1,%ZMM0,%ZMM2,%K3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 5 | 1 | vect (100.0%) |
VMOVAPS 0x40(%RAX),%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | vect (100.0%) |
VMOVAPS %ZMM0,0x300(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 1 | 1 | 5 | 2 | vect (100.0%) |
VBROADCASTSS 0x54(%RDX),%ZMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 5 | 1 | scal (6.3%) |
VMULSS %XMM18,%XMM18,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 | scal (6.3%) |
VBROADCASTSS %XMM0,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 1 | scal (6.3%) |
VMOVAPS %ZMM0,0x180(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 1 | 1 | 5 | 2 | vect (100.0%) |
VMOVSS 0x4c(%RDX),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VMULSS %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 | scal (6.3%) |
VBROADCASTSS %XMM0,%ZMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 1 | scal (6.3%) |
MOV 0x138(%RSI),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV 0x80(%RBX),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | scal (12.5%) |
VBROADCASTSS 0x6c(%RDX),%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 5 | 1 | scal (6.3%) |
VMOVAPS %ZMM0,0x480(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 1 | 1 | 5 | 2 | vect (100.0%) |
VMOVDDUP -0x1ce962(%RIP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (12.5%) |
VMOVAPS %XMM0,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (25.0%) |
VMOVAPS %ZMM18,0x440(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 1 | 1 | 5 | 2 | vect (100.0%) |
VMOVAPS %ZMM17,0x380(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 1 | 1 | 5 | 2 | vect (100.0%) |
MOV %RBX,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
JMP 52b63a <_ZN3gmx15nbnxmKernelSimdIL12KernelLayout1ELNS_17KernelCoulombTypeE1EL14VdwCutoffCheck0EL17LJCombinationRule1EL20InteractionModifiers1EL7LJEwald0EL12EnergyOutput0EEEvPK16NbnxnPairlistCpuPK16nbnxn_atomdata_tPK19interaction_const_tPA3_KfP23nbnxn_atomdata_output_t+0x28a> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
LEA -0x28(%RBP),%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | vect (25.0%) |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
INT $0x3 | N/A | |||||||||||||||||
INT $0x3 | N/A | |||||||||||||||||
INT $0x3 | N/A | |||||||||||||||||
INT $0x3 | N/A | |||||||||||||||||
INT $0x3 | N/A | |||||||||||||||||
INT $0x3 | N/A | |||||||||||||||||
INT $0x3 | N/A | |||||||||||||||||
INT $0x3 | N/A | |||||||||||||||||
INT $0x3 | N/A | |||||||||||||||||
INT $0x3 | N/A | |||||||||||||||||
INT $0x3 | N/A | |||||||||||||||||
INT $0x3 | N/A | |||||||||||||||||
INT $0x3 | N/A |
Run 1x1 | Number processes: 1; Number processes per node: 1; OMP_NUM_THREADS: 1 |
---|---|
Run 2x1 | Number processes: 2; Number processes per node: 2; OMP_NUM_THREADS: 1 |
Run 4x1 | Number processes: 4; Number processes per node: 4; OMP_NUM_THREADS: 1 |
Run 8x1 | Number processes: 8; Number processes per node: 8; OMP_NUM_THREADS: 1 |
Run 16x1 | Number processes: 16; Number processes per node: 16; OMP_NUM_THREADS: 1 |
Run 32x1 | Number processes: 32; Number processes per node: 32; OMP_NUM_THREADS: 1 |
Run 64x1 | Number processes: 64; Number processes per node: 64; OMP_NUM_THREADS: 1 |
Run 128x1 | Number processes: 128; Number processes per node: 128; OMP_NUM_THREADS: 1 |
Run 192x1 | Number processes: 192; Number nodes: 1; Number processes per node: 192; Run Command: <executable> mdrun -s ion_channel.tpr -nsteps 10000 -pin on -deffnm aocc; MPI Command: mpirun -genv I_MPI_FABRICS=shm -n <number_processes>; Dataset: ; Run Directory: .; OMP_NUM_THREADS: 1 |
(1x1) Efficiency | (1x1) Potential Speed-Up (%) | (2x1) Efficiency | (2x1) Potential Speed-Up (%) | (4x1) Efficiency | (4x1) Potential Speed-Up (%) | (8x1) Efficiency | (8x1) Potential Speed-Up (%) | (16x1) Efficiency | (16x1) Potential Speed-Up (%) | (32x1) Efficiency | (32x1) Potential Speed-Up (%) | (64x1) Efficiency | (64x1) Potential Speed-Up (%) | (128x1) Efficiency | (128x1) Potential Speed-Up (%) | (192x1) Efficiency | (192x1) Potential Speed-Up (%) |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
1 | 0 | 0.95 | 2.46 | 0.87 | 7.08 | 0.72 | 14.48 | 0.8 | 8.8 | 0.79 | 7.62 | 0.62 | 11.07 | 0.86 | 3.5 | 0.82 | 4.08 |
Run | Number of threads | Efficiency (ideal is 1) | Speedup | Ideal Speedup | Time (s) | Coverage (%) |
---|---|---|---|---|---|---|
1x1 | 1 | 1 | 1 | 1 | 465.58087158203 | 55.85152053833 |
2x1 | 2 | 0.95 | 1.91 | 2 | 246.66970825195 | 53.812549591064 |
4x1 | 4 | 0.87 | 3.47 | 4 | 138.40495300293 | 53.813831329346 |
8x1 | 8 | 0.72 | 5.78 | 8 | 82.464904785156 | 52.096599578857 |
16x1 | 16 | 0.8 | 12.8 | 16 | 38.594970703125 | 43.98025894165 |
32x1 | 20 | 0.79 | 25.21 | 32 | 31.384979248047 | 35.932941436768 |
64x1 | 40 | 0.62 | 39.88 | 64 | 19.539976119995 | 29.373104095459 |
128x1 | 84 | 0.86 | 110.01 | 128 | 7.6449961662292 | 24.902202606201 |
192x1 | 128 | 0.82 | 156.52 | 192 | 4.9450011253357 | 22.083818435669 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼void gmx::nbnxmKernelSimd<(KernelLayout)1, (gmx::KernelCoulombType)1, (VdwCutoffCheck)0, (LJCombinationRule)1, (InteractionModifiers)1, (LJEwald)0, (EnergyOutput)0>(NbnxnPairlistCpu const*, nbnxn_atomdata_t const*, interaction_const_t const*, float const (...– | 22.08 | 2.97 |
▼Loop 834 - simd_kernel.h:273-545 - libgromacs_mpi.so.9.0.0– | 0.94 | 0.19 |
○Loop 839 - simd_kernel.h:476-476 - libgromacs_mpi.so.9.0.0 | 14.23 | 2.85 |
○Loop 837 - simd_kernel.h:497-497 - libgromacs_mpi.so.9.0.0 | 5.32 | 1.06 |
○Loop 840 - impl_x86_avx_512_simd_float.h:70-461 - libgromacs_mpi.so.9.0.0 | 0.62 | 0.12 |
○Loop 838 - impl_x86_avx_512_simd_float.h:70-461 - libgromacs_mpi.so.9.0.0 | 0.49 | 0.10 |
○Loop 835 - simd_kernel.h:518-518 - libgromacs_mpi.so.9.0.0 | 0.43 | 0.19 |
○Loop 836 - simd_kernel.h:510-513 - libgromacs_mpi.so.9.0.0 | 0.04 | 0.03 |