Function: solve_pme_yzx(gmx_pme_t const*, t_complex*, float, bool, int, int) | Module: libgromacs_mpi.so.9.0.0 | Source: pme_solve.cpp:233-585 [...] | Coverage (incl. loops): 0.36% | (excl. loops): 0.00% |
---|
Function: solve_pme_yzx(gmx_pme_t const*, t_complex*, float, bool, int, int) | Module: libgromacs_mpi.so.9.0.0 | Source: pme_solve.cpp:233-585 [...] | Coverage (incl. loops): 0.36% | (excl. loops): 0.00% |
---|
/home/eoseret/gromacs-2024.2/src/gromacs/ewald/pme_solve.cpp: 233 - 585 |
-------------------------------------------------------------------------------- |
233: for (size_t kx = 0; kx != d_aligned.size(); ++kx) |
[...] |
328: { |
[...] |
335: real ewaldcoeff = pme->ewaldcoeff_q; |
336: real factor = M_PI * M_PI / (ewaldcoeff * ewaldcoeff); |
337: real ets2, struct2, vfactor, ets2vf; |
338: real d1, d2, energy = 0; |
339: real by, bz; |
340: real virxx = 0, virxy = 0, virxz = 0, viryy = 0, viryz = 0, virzz = 0; |
[...] |
350: elfac = gmx::c_one4PiEps0 / pme->epsilon_r; |
351: |
352: nx = pme->nkx; |
353: ny = pme->nky; |
354: nz = pme->nkz; |
355: |
356: /* Dimensions should be identical for A/B grid, so we just use A here */ |
357: gmx_parallel_3dfft_complex_limits( |
358: pme->pfft_setup[PME_GRID_QA], complex_order, local_ndata, local_offset, local_size); |
[...] |
372: work = &pme->solve_work[thread]; |
373: mhx = work->mhx; |
[...] |
382: iyz0 = local_ndata[YY] * local_ndata[ZZ] * thread / nthread; |
383: iyz1 = local_ndata[YY] * local_ndata[ZZ] * (thread + 1) / nthread; |
384: |
385: for (iyz = iyz0; iyz < iyz1; iyz++) |
386: { |
387: iy = iyz / local_ndata[ZZ]; |
388: iz = iyz - iy * local_ndata[ZZ]; |
389: |
390: ky = iy + local_offset[YY]; |
391: |
392: if (ky < maxky) |
[...] |
401: by = M_PI * vol * pme->bsp_mod[YY][ky]; |
402: |
403: kz = iz + local_offset[ZZ]; |
404: |
405: mz = kz; |
406: |
407: bz = pme->bsp_mod[ZZ][kz]; |
408: |
409: /* 0.5 correction for corner points */ |
410: corner_fac = 1; |
411: if (kz == 0 || kz == (nz + 1) / 2) |
412: { |
413: corner_fac = 0.5; |
414: } |
415: |
416: p0 = grid + iy * local_size[ZZ] * local_size[XX] + iz * local_size[XX]; |
417: |
418: /* We should skip the k-space point (0,0,0) */ |
419: /* Note that since here x is the minor index, local_offset[XX]=0 */ |
420: if (local_offset[XX] > 0 || ky > 0 || kz > 0) |
[...] |
431: if (computeEnergyAndVirial) |
[...] |
440: for (kx = kxstart; kx < maxkx; kx++) |
441: { |
442: mx = kx; |
443: |
444: mhxk = mx * rxx; |
445: mhyk = mx * ryx + my * ryy; |
446: mhzk = mx * rzx + my * rzy + mz * rzz; |
447: m2k = mhxk * mhxk + mhyk * mhyk + mhzk * mhzk; |
448: mhx[kx] = mhxk; |
449: mhy[kx] = mhyk; |
450: mhz[kx] = mhzk; |
451: m2[kx] = m2k; |
452: denom[kx] = m2k * bz * by * pme->bsp_mod[XX][kx]; |
453: tmp1[kx] = -factor * m2k; |
454: } |
455: |
456: for (kx = maxkx; kx < kxend; kx++) |
457: { |
458: mx = (kx - nx); |
459: |
460: mhxk = mx * rxx; |
461: mhyk = mx * ryx + my * ryy; |
462: mhzk = mx * rzx + my * rzy + mz * rzz; |
463: m2k = mhxk * mhxk + mhyk * mhyk + mhzk * mhzk; |
464: mhx[kx] = mhxk; |
465: mhy[kx] = mhyk; |
466: mhz[kx] = mhzk; |
467: m2[kx] = m2k; |
468: denom[kx] = m2k * bz * by * pme->bsp_mod[XX][kx]; |
469: tmp1[kx] = -factor * m2k; |
470: } |
471: |
472: for (kx = kxstart; kx < kxend; kx++) |
473: { |
474: m2inv[kx] = 1.0 / m2[kx]; |
[...] |
485: for (kx = kxstart; kx < kxend; kx++, p0++) |
486: { |
487: d1 = p0->re; |
488: d2 = p0->im; |
489: |
490: p0->re = d1 * eterm[kx]; |
491: p0->im = d2 * eterm[kx]; |
492: |
493: struct2 = 2.0 * (d1 * d1 + d2 * d2); |
494: |
495: tmp1[kx] = eterm[kx] * struct2; |
496: } |
497: |
498: for (kx = kxstart; kx < kxend; kx++) |
499: { |
500: ets2 = corner_fac * tmp1[kx]; |
501: vfactor = (factor * m2[kx] + 1.0) * 2.0 * m2inv[kx]; |
502: energy += ets2; |
503: |
504: ets2vf = ets2 * vfactor; |
505: virxx += ets2vf * mhx[kx] * mhx[kx] - ets2; |
506: virxy += ets2vf * mhx[kx] * mhy[kx]; |
507: virxz += ets2vf * mhx[kx] * mhz[kx]; |
508: viryy += ets2vf * mhy[kx] * mhy[kx] - ets2; |
509: viryz += ets2vf * mhy[kx] * mhz[kx]; |
510: virzz += ets2vf * mhz[kx] * mhz[kx] - ets2; |
[...] |
521: for (kx = kxstart; kx < maxkx; kx++) |
522: { |
523: mx = kx; |
524: |
525: mhxk = mx * rxx; |
526: mhyk = mx * ryx + my * ryy; |
527: mhzk = mx * rzx + my * rzy + mz * rzz; |
528: m2k = mhxk * mhxk + mhyk * mhyk + mhzk * mhzk; |
529: denom[kx] = m2k * bz * by * pme->bsp_mod[XX][kx]; |
530: tmp1[kx] = -factor * m2k; |
531: } |
532: |
533: for (kx = maxkx; kx < kxend; kx++) |
534: { |
535: mx = (kx - nx); |
536: |
537: mhxk = mx * rxx; |
538: mhyk = mx * ryx + my * ryy; |
539: mhzk = mx * rzx + my * rzy + mz * rzz; |
540: m2k = mhxk * mhxk + mhyk * mhyk + mhzk * mhzk; |
541: denom[kx] = m2k * bz * by * pme->bsp_mod[XX][kx]; |
542: tmp1[kx] = -factor * m2k; |
[...] |
554: for (kx = kxstart; kx < kxend; kx++, p0++) |
555: { |
556: d1 = p0->re; |
557: d2 = p0->im; |
558: |
559: p0->re = d1 * eterm[kx]; |
560: p0->im = d2 * eterm[kx]; |
561: } |
562: } |
563: } |
564: |
565: if (computeEnergyAndVirial) |
[...] |
575: work->vir_q[ZZ][ZZ] = 0.25 * virzz; |
576: work->vir_q[XX][YY] = work->vir_q[YY][XX] = 0.25 * virxy; |
577: work->vir_q[XX][ZZ] = work->vir_q[ZZ][XX] = 0.25 * virxz; |
578: work->vir_q[YY][ZZ] = work->vir_q[ZZ][YY] = 0.25 * viryz; |
579: |
580: /* This energy should be corrected for a charged system */ |
581: work->energy_q = 0.5 * energy; |
582: } |
583: |
584: /* Return the loop count over all threads */ |
585: return local_ndata[YY] * local_ndata[ZZ] * local_ndata[XX]; |
/home/eoseret/gromacs-2024.2/src/gromacs/simd/include/gromacs/simd/simd_memory.h: 63 - 63 |
-------------------------------------------------------------------------------- |
63: operator non_const_T() const { return load<non_const_T>(m_); } |
/home/eoseret/gromacs-2024.2/src/gromacs/simd/include/gromacs/simd/impl_x86_avx_512/impl_x86_avx_512_simd_float.h: 109 - 501 |
-------------------------------------------------------------------------------- |
109: _mm512_store_ps(m, a.simdInternal_); |
[...] |
197: return { _mm512_mul_ps(a.simdInternal_, b.simdInternal_) }; |
198: } |
199: |
200: static inline SimdFloat gmx_simdcall fma(SimdFloat a, SimdFloat b, SimdFloat c) |
201: { |
202: return { _mm512_fmadd_ps(a.simdInternal_, b.simdInternal_, c.simdInternal_) }; |
[...] |
212: return { _mm512_fnmadd_ps(a.simdInternal_, b.simdInternal_, c.simdInternal_) }; |
[...] |
229: return { _mm512_rcp14_ps(x.simdInternal_) }; |
[...] |
269: return { _mm512_max_ps(a.simdInternal_, b.simdInternal_) }; |
[...] |
279: return { _mm512_roundscale_ps(x.simdInternal_, 0) }; |
[...] |
332: __m512i iExponent = _mm512_add_epi32(exponent.simdInternal_, exponentBias); |
333: |
334: if (opt == MathOptimization::Safe) |
335: { |
336: // Make sure biased argument is not negative |
337: iExponent = _mm512_max_epi32(iExponent, _mm512_setzero_epi32()); |
338: } |
339: |
340: iExponent = _mm512_slli_epi32(iExponent, 23); |
[...] |
501: return { _mm512_cvtps_epi32(a.simdInternal_) }; |
0xc0bde0 PUSH %RBP |
0xc0bde1 MOV %RSP,%RBP |
0xc0bde4 PUSH %R15 |
0xc0bde6 PUSH %R14 |
0xc0bde8 PUSH %R13 |
0xc0bdea PUSH %R12 |
0xc0bdec PUSH %RBX |
0xc0bded AND $-0x40,%RSP |
0xc0bdf1 SUB $0x4c0,%RSP |
0xc0bdf8 MOV %RDI,%R14 |
0xc0bdfb VMOVSS 0x50(%RDI),%XMM1 |
0xc0be00 VMOVSS %XMM1,0x40(%RSP) |
0xc0be06 VMOVSS 0x58(%RDI),%XMM1 |
0xc0be0b VMOVSS %XMM1,0x18(%RSP) |
0xc0be11 MOV %R8D,%R13D |
0xc0be14 MOV %ECX,%R12D |
0xc0be17 MOV %EDX,0x94(%RSP) |
0xc0be1e VMOVSS %XMM0,0x2a0(%RSP) |
0xc0be27 MOV %RSI,%R15 |
0xc0be2a MOV 0x44(%RDI),%EBX |
0xc0be2d MOV 0x580(%RDI),%RAX |
0xc0be34 MOV (%RAX),%RDI |
0xc0be37 VMOVSD 0x3c(%R14),%XMM0 |
0xc0be3d VMOVAPS %XMM0,0x220(%RSP) |
0xc0be46 LEA 0x2f4(%RSP),%RSI |
0xc0be4e LEA 0xdc(%RSP),%RDX |
0xc0be56 LEA 0x134(%RSP),%RCX |
0xc0be5e LEA 0x214(%RSP),%R8 |
0xc0be66 CALL fb5700 <@plt_start@+0x12250> |
0xc0be6b MOV 0x780(%R14),%RCX |
0xc0be72 MOVSXD %R13D,%RDI |
0xc0be75 MOV 0xe4(%RSP),%R9D |
0xc0be7d MOV 0xe0(%RSP),%ESI |
0xc0be84 IMUL %R9D,%ESI |
0xc0be88 MOV %ESI,%EAX |
0xc0be8a IMUL %EDI,%EAX |
0xc0be8d CLTD |
0xc0be8e IDIV %R12D |
0xc0be91 MOV %EAX,%R11D |
0xc0be94 LEA (%RDI,%RDI,4),%R8 |
0xc0be98 INC %EDI |
0xc0be9a IMUL %ESI,%EDI |
0xc0be9d MOV %EDI,%EAX |
0xc0be9f CLTD |
0xc0bea0 IDIV %R12D |
0xc0bea3 SAL $0x5,%R8 |
0xc0bea7 CMP %EAX,%R11D |
0xc0beaa MOV %RCX,0x1b8(%RSP) |
0xc0beb2 MOV %ESI,0xc0(%RSP) |
0xc0beb9 MOV %R8,0x1b0(%RSP) |
0xc0bec1 JGE c0df8e |
0xc0bec7 VMOVSS 0x40(%RSP),%XMM0 |
0xc0becd VMULSS %XMM0,%XMM0,%XMM0 |
0xc0bed1 VCVTSS2SD %XMM0,%XMM0,%XMM0 |
0xc0bed5 VMOVSD -0x8af225(%RIP),%XMM1 |
0xc0bedd VDIVSD %XMM0,%XMM1,%XMM0 |
0xc0bee1 VCVTSD2SS %XMM0,%XMM0,%XMM19 |
0xc0bee7 VMOVSS 0x5d0(%R14),%XMM22 |
0xc0bef1 VMOVSS 0x5dc(%R14),%XMM2 |
0xc0befa VMOVSS 0x5e0(%R14),%XMM0 |
0xc0bf03 VMOVSS %XMM0,0x54(%RSP) |
0xc0bf09 VMOVSS 0x5e8(%R14),%XMM4 |
0xc0bf12 VMOVSS 0x5ec(%R14),%XMM20 |
0xc0bf1c VMOVSS 0x5f0(%R14),%XMM6 |
0xc0bf25 VPCMPEQD %XMM3,%XMM3,%XMM3 |
0xc0bf29 VMOVDQA 0x220(%RSP),%XMM12 |
0xc0bf32 VPSUBD %XMM3,%XMM12,%XMM3 |
0xc0bf36 VPSRLD $0x1f,%XMM3,%XMM5 |
0xc0bf3b VMOVUPS 0x8(%RCX,%R8,1),%YMM0 |
0xc0bf42 VMOVDQU 0x28(%RCX,%R8,1),%XMM9 |
0xc0bf49 VMOVSS 0x18(%RSP),%XMM1 |
0xc0bf4f VCVTSS2SD %XMM1,%XMM1,%XMM7 |
0xc0bf53 VMOVSD -0x8aeb83(%RIP),%XMM8 |
0xc0bf5b VPADDD %XMM5,%XMM3,%XMM3 |
0xc0bf5f VDIVSD %XMM7,%XMM8,%XMM5 |
0xc0bf63 VCVTSD2SS %XMM5,%XMM5,%XMM5 |
0xc0bf67 VMOVSS 0x2a0(%RSP),%XMM1 |
0xc0bf70 VCVTSS2SD %XMM1,%XMM1,%XMM7 |
0xc0bf74 VPSRAD $0x1,%XMM3,%XMM13 |
0xc0bf79 VMULSD -0x8af61b(%RIP),%XMM7,%XMM26 |
0xc0bf83 MOV %EBX,%EDX |
0xc0bf85 INC %EDX |
0xc0bf87 SHR $0x1f,%EDX |
0xc0bf8a ADD %EBX,%EDX |
0xc0bf8c INC %EDX |
0xc0bf8e SAR $0x1,%EDX |
0xc0bf90 MOV %EDX,0xd4(%RSP) |
0xc0bf97 MOV 0x134(%RSP),%EDX |
0xc0bf9e MOV 0xdc(%RSP),%ESI |
0xc0bfa5 LEA (%RSI,%RDX,1),%EDI |
0xc0bfa8 VXORPS -0x8afdfa(%RIP){1to4},%XMM19,%XMM11 |
0xc0bfb2 MOV %R9D,0x1c(%RSP) |
0xc0bfb7 VMOVD %XMM13,%R9D |
0xc0bfbc MOV %RDX,0x208(%RSP) |
0xc0bfc4 MOV %RSI,0xb8(%RSP) |
0xc0bfcc ADD %ESI,%EDX |
0xc0bfce ADD $0xf,%EDX |
0xc0bfd1 AND $-0x10,%EDX |
0xc0bfd4 VBROADCASTSS %XMM5,%ZMM25 |
0xc0bfda MOV %RDX,%RSI |
0xc0bfdd SHR $0x4,%RSI |
0xc0bfe1 MOV %RSI,0x118(%RSP) |
0xc0bfe9 OR $0xf,%RDX |
0xc0bfed MOV %RDX,0x128(%RSP) |
0xc0bff5 MOV %R9D,0x60(%RSP) |
0xc0bffa MOVSXD %R9D,%RDX |
0xc0bffd MOV %EDI,0x64(%RSP) |
0xc0c001 MOVSXD %EDI,%RDI |
0xc0c004 VPBROADCASTQ %RDX,%YMM3 |
0xc0c00a VPSLLQ $0x2,%YMM3,%YMM5 |
0xc0c00f VMOVDQA64 -0x888419(%RIP),%ZMM7 |
0xc0c019 VPADDQ %YMM0,%YMM5,%YMM5 |
0xc0c01d VPERMQ %ZMM5,%ZMM7,%ZMM7 |
0xc0c023 VMOVDQA64 %ZMM7,0x440(%RSP) |
0xc0c02b VMOVDQA64 -0x8883f5(%RIP),%ZMM7 |
0xc0c035 VPERMQ %ZMM5,%ZMM7,%ZMM7 |
0xc0c03b VMOVDQA64 %ZMM7,0x400(%RSP) |
0xc0c043 VPSLLQ $0x2,%XMM3,%XMM3 |
0xc0c048 VPADDQ %XMM3,%XMM9,%XMM7 |
0xc0c04c MOV %RDI,%RSI |
0xc0c04f SUB %RDX,%RSI |
0xc0c052 VPERMQ $0x54,%YMM7,%YMM3 |
0xc0c058 VMOVDQA %YMM3,0x340(%RSP) |
0xc0c061 VEXTRACTI128 $0x1,%YMM0,%XMM3 |
0xc0c067 VPERMQ $0x5,%YMM7,%YMM10 |
0xc0c06d VBROADCASTSS %XMM22,%YMM31 |
0xc0c073 VBROADCASTSS %XMM2,%YMM1 |
0xc0c078 VBROADCASTSS %XMM4,%YMM17 |
0xc0c07e VBROADCASTSS %XMM6,%YMM18 |
0xc0c084 VBROADCASTSS %XMM11,%YMM15 |
0xc0c089 MOV %RDX,%R9 |
0xc0c08c NEG %R9 |
0xc0c08f MOV %R9,0x110(%RSP) |
0xc0c097 MOV %RSI,%R9 |
0xc0c09a AND $-0x20,%R9 |
0xc0c09e VPBROADCASTD %XMM13,%YMM8 |
0xc0c0a3 VPADDD -0x8a3d6b(%RIP),%YMM8,%YMM8 |
0xc0c0ab VMOVDQA %YMM8,0x2c0(%RSP) |
0xc0c0b4 VPBROADCASTD %XMM12,%YMM16 |
0xc0c0ba MOV %RDI,%RBX |
0xc0c0bd VMOVDQA64 -0x888447(%RIP),%ZMM8 |
0xc0c0c7 NEG %RBX |
0xc0c0ca MOV %RBX,0x1f0(%RSP) |
0xc0c0d2 VPERMI2Q %ZMM7,%ZMM5,%ZMM8 |
0xc0c0d8 VMOVDQA64 %ZMM8,0x3c0(%RSP) |
0xc0c0e0 VMOVDQA -0x8a3c88(%RIP),%YMM8 |
0xc0c0e8 VMOVDQA %YMM10,0x320(%RSP) |
0xc0c0f1 VPERMI2Q %YMM5,%YMM10,%YMM8 |
0xc0c0f7 VMOVDQA %YMM8,0x300(%RSP) |
0xc0c100 MOV %RSI,0x98(%RSP) |
0xc0c108 AND $-0x8,%RSI |
0xc0c10c VMOVD %XMM12,%EBX |
0xc0c110 MOV %EBX,0xc4(%RSP) |
0xc0c117 NEG %EBX |
0xc0c119 MOV %RBX,0x108(%RSP) |
0xc0c121 VXORPS %XMM28,%XMM28,%XMM28 |
0xc0c127 VPEXTRQ $0x1,%XMM7,0x1e8(%RSP) |
0xc0c132 VXORPS %XMM29,%XMM29,%XMM29 |
0xc0c138 VPEXTRD $0x1,%XMM12,0xd0(%RSP) |
0xc0c143 MOV 0x214(%RSP),%EBX |
0xc0c14a MOV %R14,0x30(%RSP) |
0xc0c14f MOV 0x21c(%RSP),%R14D |
0xc0c157 MOV %EBX,0xcc(%RSP) |
0xc0c15e IMUL %EBX,%R14D |
0xc0c162 MOV %R14D,0xc8(%RSP) |
0xc0c16a VPEXTRQ $0x1,%XMM3,%RBX |
0xc0c170 MOV %RBX,0x58(%RSP) |
0xc0c175 VMOVQ %XMM3,%R14 |
0xc0c17a MOV %EAX,0xd8(%RSP) |
0xc0c181 MOV %R15,%RAX |
0xc0c184 MOV 0x40(%RCX,%R8,1),%R15 |
0xc0c189 MOV 0x48(%RCX,%R8,1),%RCX |
0xc0c18e MOV %RDX,%R8 |
0xc0c191 MOVSXD 0x138(%RSP),%RDX |
0xc0c199 MOV %RDX,0x200(%RSP) |
0xc0c1a1 MOVSXD 0x13c(%RSP),%RDX |
0xc0c1a9 MOV %RDX,0x1f8(%RSP) |
0xc0c1b1 VPEXTRQ $0x1,%XMM9,%R12 |
0xc0c1b7 LEA (,%R8,4),%RDX |
0xc0c1bf MOV %RDX,0x100(%RSP) |
0xc0c1c7 VMOVDQA %XMM9,0x290(%RSP) |
0xc0c1d0 VMOVQ %XMM9,%RDX |
0xc0c1d5 LEA (%R9,%R8,1),%R13 |
0xc0c1d9 MOV %R13,0x1d8(%RSP) |
0xc0c1e1 VMOVQ %XMM0,%R13 |
0xc0c1e6 VMOVAPS %YMM0,0x360(%RSP) |
0xc0c1ef VPEXTRQ $0x1,%XMM0,%R10 |
0xc0c1f5 MOV %RSI,0x1a8(%RSP) |
0xc0c1fd LEA (%RSI,%R8,1),%RSI |
0xc0c201 MOV %RSI,0x1a0(%RSP) |
0xc0c209 LEA 0x60(%RDX),%RSI |
0xc0c20d MOV %RSI,0x1d0(%RSP) |
0xc0c215 LEA 0x60(%R12),%RSI |
0xc0c21a MOV %RSI,0x1c8(%RSP) |
0xc0c222 LEA 0x60(,%R8,4),%RSI |
0xc0c22a MOV %RSI,0x1c0(%RSP) |
0xc0c232 MOV %RDX,0x48(%RSP) |
0xc0c237 LEA 0x60(%RDX,%R8,4),%RDX |
0xc0c23c MOV %RDX,0xf0(%RSP) |
0xc0c244 LEA 0x60(%R12,%R8,4),%RDX |
0xc0c249 MOV %RDX,0xe8(%RSP) |
0xc0c251 LEA 0x40(%RAX),%RDX |
0xc0c255 MOV %RDX,0x178(%RSP) |
0xc0c25d LEA 0x20(%R15),%RDX |
0xc0c261 MOV %RDX,0x170(%RSP) |
0xc0c269 MOV %R13,0xa8(%RSP) |
0xc0c271 LEA (%R13,%R8,4),%RDX |
0xc0c276 MOV %RDX,0x198(%RSP) |
0xc0c27e MOV %R10,0xa0(%RSP) |
0xc0c286 LEA (%R10,%R8,4),%RDX |
0xc0c28a MOV %RDX,0x190(%RSP) |
0xc0c292 MOV %R14,0xb0(%RSP) |
0xc0c29a LEA (%R14,%R8,4),%RDX |
0xc0c29e MOV %RDX,0x188(%RSP) |
0xc0c2a6 LEA (%RBX,%R8,4),%RDX |
0xc0c2aa MOV %RDX,0x180(%RSP) |
0xc0c2b2 LEA 0x60(%RBX),%RDX |
0xc0c2b6 MOV %RDX,0x168(%RSP) |
0xc0c2be MOV %RCX,0x68(%RSP) |
0xc0c2c3 LEA 0x60(%RCX),%RCX |
0xc0c2c7 MOV %RCX,0x160(%RSP) |
0xc0c2cf VMOVSS -0x8b014b(%RIP),%XMM12 |
0xc0c2d7 VMOVAPS -0x8a733f(%RIP),%YMM14 |
0xc0c2df VMOVAPS -0x8a6907(%RIP),%YMM10 |
0xc0c2e7 VXORPS %XMM30,%XMM30,%XMM30 |
0xc0c2ed MOV %RAX,0x88(%RSP) |
0xc0c2f5 VMOVAPS %XMM19,0x280(%RSP) |
0xc0c2fd VMOVAPS %XMM20,%XMM24 |
0xc0c303 VMOVSS %XMM20,0x90(%RSP) |
0xc0c30b VMOVDQA64 %XMM13,%XMM21 |
0xc0c311 VMOVDQA %XMM13,0x270(%RSP) |
0xc0c31a VMOVAPD %XMM26,%XMM23 |
0xc0c320 VMOVSD %XMM26,0xf8(%RSP) |
0xc0c328 VMOVAPS %ZMM25,0x380(%RSP) |
0xc0c330 VMOVAPS %XMM22,0x260(%RSP) |
0xc0c338 VMOVAPS %XMM4,0x150(%RSP) |
0xc0c341 VMOVAPS %XMM6,0x140(%RSP) |
0xc0c34a VMOVAPS %YMM15,0x2a0(%RSP) |
0xc0c353 VMOVAPS %XMM2,0x250(%RSP) |
0xc0c35c VMOVDQA64 %YMM16,0x220(%RSP) |
0xc0c364 MOV 0x30(%RSP),%R10 |
0xc0c369 MOV 0x1c(%RSP),%ECX |
0xc0c36d MOV %R8,0x70(%RSP) |
0xc0c372 MOV %RDI,0x20(%RSP) |
0xc0c377 MOV %R9,0x120(%RSP) |
0xc0c37f JMP c0c3a6 |
0xc0c381 NOPW %CS:(%RAX,%RAX,1) |
(17436) 0xc0c390 MOV 0x30(%RSP),%R10 |
(17436) 0xc0c395 INC %R11D |
(17436) 0xc0c398 CMP 0xd8(%RSP),%R11D |
(17436) 0xc0c3a0 JE c0dfa0 |
(17436) 0xc0c3a6 MOV 0x208(%RSP),%R9 |
(17436) 0xc0c3ae TEST %R9D,%R9D |
(17436) 0xc0c3b1 SETLE %SIL |
(17436) 0xc0c3b5 MOV %R11D,%EAX |
(17436) 0xc0c3b8 CLTD |
(17436) 0xc0c3b9 IDIV %ECX |
(17436) 0xc0c3bb MOVSXD %EDX,%RCX |
(17436) 0xc0c3be MOV 0x1f8(%RSP),%RDX |
(17436) 0xc0c3c6 LEA (%RDX,%RCX,1),%RDI |
(17436) 0xc0c3ca CMP 0xd4(%RSP),%EDI |
(17436) 0xc0c3d1 SETE %BL |
(17436) 0xc0c3d4 VCVTSI2SS %EDI,%XMM1,%XMM26 |
(17436) 0xc0c3da MOV 0x608(%R10),%RDX |
(17436) 0xc0c3e1 VMOVSS (%RDX,%RDI,4),%XMM27 |
(17436) 0xc0c3e8 MOV 0xc8(%RSP),%EDX |
(17436) 0xc0c3ef IMUL %EAX,%EDX |
(17436) 0xc0c3f2 IMUL 0xcc(%RSP),%ECX |
(17436) 0xc0c3fa TEST %EDI,%EDI |
(17436) 0xc0c3fc SETE %R13B |
(17436) 0xc0c400 SETLE %DIL |
(17436) 0xc0c404 CLTQ |
(17436) 0xc0c406 ADD 0x200(%RSP),%RAX |
(17436) 0xc0c40e TEST %EAX,%EAX |
(17436) 0xc0c410 SETLE %R8B |
(17436) 0xc0c414 AND %SIL,%DIL |
(17436) 0xc0c417 AND %R8B,%DIL |
(17436) 0xc0c41a MOVZX %DIL,%R8D |
(17436) 0xc0c41e LEA (%R9,%R8,1),%ESI |
(17436) 0xc0c422 MOV %ESI,0x18(%RSP) |
(17436) 0xc0c426 VMOVD %ESI,%XMM3 |
(17436) 0xc0c42a VPINSRD $0x1,%EAX,%XMM3,%XMM3 |
(17436) 0xc0c430 VPCMPGTD %XMM3,%XMM21,%K0 |
(17436) 0xc0c436 KSHIFTRB $0x1,%K0,%K1 |
(17436) 0xc0c43c KMOVD %K1,%ESI |
(17436) 0xc0c440 TEST $0x1,%SIL |
(17436) 0xc0c444 MOV 0x600(%R10),%RSI |
(17436) 0xc0c44b MOVSXD %EDX,%RDI |
(17436) 0xc0c44e VMOVSS (%RSI,%RAX,4),%XMM3 |
(17436) 0xc0c453 MOV 0xd0(%RSP),%EDX |
(17436) 0xc0c45a MOV $0,%ESI |
(17436) 0xc0c45f CMOVNE %ESI,%EDX |
(17436) 0xc0c462 SUB %EDX,%EAX |
(17436) 0xc0c464 MOV %RDI,0x80(%RSP) |
(17436) 0xc0c46c MOV 0x88(%RSP),%RDX |
(17436) 0xc0c474 LEA (%RDX,%RDI,8),%RDX |
(17436) 0xc0c478 MOVSXD %ECX,%RCX |
(17436) 0xc0c47b VCVTSI2SS %EAX,%XMM1,%XMM20 |
(17436) 0xc0c481 VCVTSS2SD %XMM3,%XMM3,%XMM3 |
(17436) 0xc0c485 MOV %RCX,0x78(%RSP) |
(17436) 0xc0c48a LEA (%RDX,%RCX,8),%RAX |
(17436) 0xc0c48e VMULSD %XMM3,%XMM23,%XMM3 |
(17436) 0xc0c494 VCVTSD2SS %XMM3,%XMM3,%XMM7 |
(17436) 0xc0c498 LEA (%RAX,%R8,8),%RAX |
(17436) 0xc0c49c KMOVD %K0,%ECX |
(17436) 0xc0c4a0 CMPB $0,0x94(%RSP) |
(17436) 0xc0c4a8 MOV %R8,0x40(%RSP) |
(17436) 0xc0c4ad JE c0c510 |
(17436) 0xc0c4af MOV %R13D,0x2c(%RSP) |
(17436) 0xc0c4b4 MOV %BL,0x3b(%RSP) |
(17436) 0xc0c4b8 MOV %R11D,0x3c(%RSP) |
(17436) 0xc0c4bd TEST $0x1,%CL |
(17436) 0xc0c4c0 JE c0cc03 |
(17436) 0xc0c4c6 VMOVAPS %XMM20,%XMM0 |
(17436) 0xc0c4cc VMULSS 0x54(%RSP),%XMM20,%XMM8 |
(17436) 0xc0c4d4 VMULSS %XMM20,%XMM24,%XMM13 |
(17436) 0xc0c4da MOV 0x30(%RSP),%RCX |
(17436) 0xc0c4df MOV 0x5f8(%RCX),%R10 |
(17436) 0xc0c4e6 MOVSXD 0x18(%RSP),%RDX |
(17436) 0xc0c4eb MOV 0x70(%RSP),%RBX |
(17436) 0xc0c4f0 SUB %RDX,%RBX |
(17436) 0xc0c4f3 CMP $0x8,%RBX |
(17436) 0xc0c4f7 JAE c0c565 |
(17436) 0xc0c4f9 MOV %RDX,%RSI |
(17436) 0xc0c4fc JMP c0cb37 |
0xc0c501 NOPW %CS:(%RAX,%RAX,1) |
(17436) 0xc0c510 TEST $0x1,%CL |
(17436) 0xc0c513 MOV 0x70(%RSP),%R8 |
(17436) 0xc0c518 MOV 0x20(%RSP),%RDI |
(17436) 0xc0c51d MOV 0x120(%RSP),%R9 |
(17436) 0xc0c525 MOV 0x48(%RSP),%R14 |
(17436) 0xc0c52a JE c0d139 |
(17436) 0xc0c530 MOV %R10,%R13 |
(17436) 0xc0c533 VMULSS 0x54(%RSP),%XMM20,%XMM13 |
(17436) 0xc0c53b VMULSS %XMM20,%XMM24,%XMM8 |
(17436) 0xc0c541 MOV 0x5f8(%R10),%RDX |
(17436) 0xc0c548 MOVSXD 0x18(%RSP),%RCX |
(17436) 0xc0c54d MOV %R8,%R10 |
(17436) 0xc0c550 SUB %RCX,%R10 |
(17436) 0xc0c553 CMP $0x20,%R10 |
(17436) 0xc0c557 JAE c0c7fe |
(17436) 0xc0c55d MOV %RCX,%RSI |
(17436) 0xc0c560 JMP c0d00f |
(17436) 0xc0c565 LEA (%R12,%RDX,4),%RCX |
(17436) 0xc0c569 VPBROADCASTQ %RDX,%YMM0 |
(17436) 0xc0c56f VPSLLQ $0x2,%XMM0,%XMM3 |
(17436) 0xc0c574 VMOVDQA 0x290(%RSP),%XMM5 |
(17436) 0xc0c57d VPINSRQ $0x1,%R10,%XMM5,%XMM5 |
(17436) 0xc0c583 VPADDQ %XMM5,%XMM3,%XMM3 |
(17436) 0xc0c587 VPSLLQ $0x2,%YMM0,%YMM0 |
(17436) 0xc0c58c VPADDQ 0x360(%RSP),%YMM0,%YMM0 |
(17436) 0xc0c595 VMOVDQA64 -0x88895f(%RIP),%ZMM5 |
(17436) 0xc0c59f VPERMQ %ZMM0,%ZMM5,%ZMM5 |
(17436) 0xc0c5a5 VMOVDQA64 -0x8889af(%RIP),%ZMM9 |
(17436) 0xc0c5af VPERMQ %ZMM0,%ZMM9,%ZMM9 |
(17436) 0xc0c5b5 VMOVDQA64 %ZMM0,%ZMM10 |
(17436) 0xc0c5bb VMOVDQA64 -0x8888c5(%RIP),%ZMM12 |
(17436) 0xc0c5c5 VPERMT2Q %ZMM3,%ZMM12,%ZMM10 |
(17436) 0xc0c5cb MOV $0x10,%SIL |
(17436) 0xc0c5ce KMOVD %ESI,%K1 |
(17436) 0xc0c5d2 VPBROADCASTQ %RCX,%ZMM10{%K1} |
(17436) 0xc0c5d8 VPBROADCASTQ %RCX,%ZMM12 |
(17436) 0xc0c5de VMOVDQA64 -0x8888a8(%RIP),%ZMM14 |
(17436) 0xc0c5e8 VPERMQ %ZMM10,%ZMM14,%ZMM14 |
(17436) 0xc0c5ee VPSUBQ %ZMM5,%ZMM14,%ZMM5 |
(17436) 0xc0c5f4 VMOVDQA64 -0x88887e(%RIP),%ZMM14 |
(17436) 0xc0c5fe VPERMQ %ZMM10,%ZMM14,%ZMM10 |
(17436) 0xc0c604 VPBROADCASTQ -0x8af3ae(%RIP),%ZMM14 |
(17436) 0xc0c60e VPSUBQ %ZMM9,%ZMM10,%ZMM9 |
(17436) 0xc0c614 VPCMPLTUQ %ZMM14,%ZMM5,%K0 |
(17436) 0xc0c61b VPCMPLTUQ %ZMM14,%ZMM9,%K1 |
(17436) 0xc0c622 KUNPCKBW %K0,%K1,%K0 |
(17436) 0xc0c626 VPMOVM2B %K0,%XMM5 |
(17436) 0xc0c62c XOR %ESI,%ESI |
(17436) 0xc0c62e VPTEST %XMM5,%XMM5 |
(17436) 0xc0c633 SETE %DIL |
(17436) 0xc0c637 VMOVDQA -0x8a5f3f(%RIP),%YMM5 |
(17436) 0xc0c63f VPERMT2Q %YMM3,%YMM5,%YMM12 |
(17436) 0xc0c645 VINSERTI128 $0x1,%XMM3,%YMM0,%YMM5 |
(17436) 0xc0c64b VMOVDQA -0x8a0bf3(%RIP),%YMM9 |
(17436) 0xc0c653 VPERMT2Q %YMM5,%YMM9,%YMM0 |
(17436) 0xc0c659 VPSUBQ %YMM0,%YMM12,%YMM0 |
(17436) 0xc0c65d VPCMPLTUQ %YMM14,%YMM0,%K0 |
(17436) 0xc0c664 VPMOVM2D %K0,%XMM0 |
(17436) 0xc0c66a XOR %R8D,%R8D |
(17436) 0xc0c66d VPTEST %XMM0,%XMM0 |
(17436) 0xc0c672 SETE %R9B |
(17436) 0xc0c676 VPEXTRQ $0x1,%XMM3,%R11 |
(17436) 0xc0c67c SUB %R11,%RCX |
(17436) 0xc0c67f CMP $0x20,%RCX |
(17436) 0xc0c683 JB c0cb1c |
(17436) 0xc0c689 MOV %R9B,%R8B |
(17436) 0xc0c68c TEST %R8D,%R8D |
(17436) 0xc0c68f JE c0cb1c |
(17436) 0xc0c695 MOV %DIL,%SIL |
(17436) 0xc0c698 TEST %ESI,%ESI |
(17436) 0xc0c69a JE c0cb1c |
(17436) 0xc0c6a0 MOV %RBX,0x1e0(%RSP) |
(17436) 0xc0c6a8 MOV %RBX,%RCX |
(17436) 0xc0c6ab AND $-0x8,%RCX |
(17436) 0xc0c6af LEA (%RCX,%RDX,1),%RSI |
(17436) 0xc0c6b3 SAL $0x2,%RDX |
(17436) 0xc0c6b7 MOV 0x18(%RSP),%EDI |
(17436) 0xc0c6bb VPBROADCASTD %EDI,%YMM0 |
(17436) 0xc0c6c1 VPADDD -0x8a4389(%RIP),%YMM0,%YMM3 |
(17436) 0xc0c6c9 VBROADCASTSS %XMM8,%YMM5 |
(17436) 0xc0c6ce VBROADCASTSS %XMM13,%YMM9 |
(17436) 0xc0c6d3 VBROADCASTSS %XMM26,%YMM10 |
(17436) 0xc0c6d9 VBROADCASTSS %XMM27,%YMM14 |
(17436) 0xc0c6df VMOVAPS %YMM18,%YMM6 |
(17436) 0xc0c6e5 VBROADCASTSS %XMM7,%YMM18 |
(17436) 0xc0c6eb MOV 0xa8(%RSP),%RDI |
(17436) 0xc0c6f3 LEA (%RDI,%RDX,1),%R11 |
(17436) 0xc0c6f7 MOV 0xa0(%RSP),%RDI |
(17436) 0xc0c6ff LEA (%RDI,%RDX,1),%RBX |
(17436) 0xc0c703 MOV 0xb0(%RSP),%RDI |
(17436) 0xc0c70b LEA (%RDI,%RDX,1),%R14 |
(17436) 0xc0c70f MOV 0x58(%RSP),%RDI |
(17436) 0xc0c714 LEA (%RDI,%RDX,1),%R9 |
(17436) 0xc0c718 LEA (%R10,%RDX,1),%R13 |
(17436) 0xc0c71c MOV 0x48(%RSP),%RDI |
(17436) 0xc0c721 LEA (%RDI,%RDX,1),%R8 |
(17436) 0xc0c725 ADD %R12,%RDX |
(17436) 0xc0c728 XOR %EDI,%EDI |
(17436) 0xc0c72a NOPW (%RAX,%RAX,1) |
(17456) 0xc0c730 VCVTDQ2PS %YMM3,%YMM0 |
(17456) 0xc0c734 VMULPS %YMM0,%YMM31,%YMM12 |
(17456) 0xc0c73a VMOVAPS %YMM1,%YMM15 |
(17456) 0xc0c73e VFMADD213PS %YMM5,%YMM0,%YMM15 |
(17456) 0xc0c743 VFMADD213PS %YMM9,%YMM17,%YMM0 |
(17456) 0xc0c749 VFMADD231PS %YMM6,%YMM10,%YMM0 |
(17456) 0xc0c74e VMULPS %YMM15,%YMM15,%YMM16 |
(17456) 0xc0c754 VFMADD231PS %YMM12,%YMM12,%YMM16 |
(17456) 0xc0c75a VMOVUPS %YMM12,(%R11,%RDI,4) |
(17456) 0xc0c760 VMOVUPS %YMM15,(%RBX,%RDI,4) |
(17456) 0xc0c765 VMOVAPS 0x2a0(%RSP),%YMM15 |
(17456) 0xc0c76e VFMADD231PS %YMM0,%YMM0,%YMM16 |
(17456) 0xc0c774 VMOVUPS %YMM0,(%R14,%RDI,4) |
(17456) 0xc0c77a VMOVUPS %YMM16,(%R9,%RDI,4) |
(17456) 0xc0c781 VMULPS %YMM16,%YMM14,%YMM0 |
(17456) 0xc0c787 VMULPS %YMM18,%YMM0,%YMM0 |
(17456) 0xc0c78d VMULPS (%R13,%RDI,4),%YMM0,%YMM0 |
(17456) 0xc0c794 VMOVUPS %YMM0,(%R8,%RDI,4) |
(17456) 0xc0c79a VMULPS %YMM15,%YMM16,%YMM0 |
(17456) 0xc0c7a0 VMOVUPS %YMM0,(%RDX,%RDI,4) |
(17456) 0xc0c7a5 ADD $0x8,%RDI |
(17456) 0xc0c7a9 VPADDD -0x8b0687(%RIP){1to8},%YMM3,%YMM3 |
(17456) 0xc0c7b3 CMP %RDI,%RCX |
(17456) 0xc0c7b6 JNE c0c730 |
(17436) 0xc0c7bc CMP %RCX,0x1e0(%RSP) |
(17436) 0xc0c7c4 VMOVAPS %YMM6,%YMM18 |
(17436) 0xc0c7ca VMOVAPS 0x140(%RSP),%XMM6 |
(17436) 0xc0c7d3 VMOVDQA64 0x220(%RSP),%YMM16 |
(17436) 0xc0c7db VMOVSS -0x8b0657(%RIP),%XMM12 |
(17436) 0xc0c7e3 VMOVAPS -0x8a784b(%RIP),%YMM14 |
(17436) 0xc0c7eb VMOVAPS -0x8a6e13(%RIP),%YMM10 |
(17436) 0xc0c7f3 JNE c0cb37 |
(17436) 0xc0c7f9 JMP c0cc03 |
(17436) 0xc0c7fe VMOVSS %XMM20,0x2c(%RSP) |
(17436) 0xc0c806 LEA (%RDX,%RCX,4),%RSI |
(17436) 0xc0c80a VPBROADCASTQ %RCX,%XMM3 |
(17436) 0xc0c810 VPSLLQ $0x2,%XMM3,%XMM3 |
(17436) 0xc0c815 VPADDQ 0x290(%RSP),%XMM3,%XMM3 |
(17436) 0xc0c81e VPERMQ $0x54,%YMM3,%YMM5 |
(17436) 0xc0c824 VMOVQ %RSI,%XMM9 |
(17436) 0xc0c829 VMOVDQA -0x8ac841(%RIP),%XMM0 |
(17436) 0xc0c831 VPERMT2Q %YMM3,%YMM0,%YMM9 |
(17436) 0xc0c837 VPSUBQ %YMM9,%YMM5,%YMM3 |
(17436) 0xc0c83c VPCMPLTUQ -0x8af0a7(%RIP){1to0},%YMM3,%K0 |
(17436) 0xc0c847 VPMOVM2D %K0,%XMM3 |
(17436) 0xc0c84d VPTEST %XMM3,%XMM3 |
(17436) 0xc0c852 JNE c0d004 |
(17436) 0xc0c858 MOV %R11D,%EDI |
(17436) 0xc0c85b MOV %R10,%R13 |
(17436) 0xc0c85e MOV %R10,%R9 |
(17436) 0xc0c861 AND $-0x20,%R9 |
(17436) 0xc0c865 LEA (%R9,%RCX,1),%RSI |
(17436) 0xc0c869 MOV 0x18(%RSP),%R10D |
(17436) 0xc0c86e VPBROADCASTD %R10D,%YMM3 |
(17436) 0xc0c874 VPADDD -0x8a453c(%RIP),%YMM3,%YMM3 |
(17436) 0xc0c87c VBROADCASTSS %XMM13,%YMM5 |
(17436) 0xc0c881 VBROADCASTSS %XMM8,%YMM10 |
(17436) 0xc0c886 VBROADCASTSS %XMM26,%YMM9 |
(17436) 0xc0c88c VMOVAPS %YMM18,%YMM6 |
(17436) 0xc0c892 VBROADCASTSS %XMM27,%YMM18 |
(17436) 0xc0c898 VBROADCASTSS %XMM7,%YMM14 |
(17436) 0xc0c89d LEA 0x60(%RDX,%RCX,4),%R14 |
(17436) 0xc0c8a2 MOV 0x1d0(%RSP),%R10 |
(17436) 0xc0c8aa LEA (%R10,%RCX,4),%RBX |
(17436) 0xc0c8ae MOV 0x1c8(%RSP),%R10 |
(17436) 0xc0c8b6 LEA (%R10,%RCX,4),%RCX |
(17436) 0xc0c8ba XOR %R11D,%R11D |
(17436) 0xc0c8bd VMOVAPS %YMM31,%YMM22 |
(17436) 0xc0c8c3 VMOVAPS %YMM17,%YMM4 |
(17436) 0xc0c8c9 VMOVAPS %YMM15,%YMM2 |
(17436) 0xc0c8cd NOPL (%RAX) |
(17444) 0xc0c8d0 VPADDD -0x8b07ae(%RIP){1to8},%YMM3,%YMM16 |
(17444) 0xc0c8da VPADDD -0x8b0378(%RIP){1to8},%YMM3,%YMM15 |
(17444) 0xc0c8e4 VPADDD -0x8b0732(%RIP){1to8},%YMM3,%YMM31 |
(17444) 0xc0c8ee VCVTDQ2PS %YMM3,%YMM25 |
(17444) 0xc0c8f4 VCVTDQ2PS %YMM16,%YMM16 |
(17444) 0xc0c8fa VCVTDQ2PS %YMM15,%YMM15 |
(17444) 0xc0c8ff VCVTDQ2PS %YMM31,%YMM31 |
(17444) 0xc0c905 VMULPS %YMM25,%YMM22,%YMM0 |
(17444) 0xc0c90b VMULPS %YMM16,%YMM22,%YMM24 |
(17444) 0xc0c911 VMULPS %YMM15,%YMM22,%YMM17 |
(17444) 0xc0c917 VMOVAPS %YMM1,%YMM20 |
(17444) 0xc0c91d VFMADD213PS %YMM5,%YMM25,%YMM20 |
(17444) 0xc0c923 VMOVAPS %YMM1,%YMM12 |
(17444) 0xc0c927 VFMADD213PS %YMM5,%YMM16,%YMM12 |
(17444) 0xc0c92d VMOVAPS %YMM1,%YMM19 |
(17444) 0xc0c933 VFMADD213PS %YMM5,%YMM15,%YMM19 |
(17444) 0xc0c939 VMOVAPS %YMM1,%YMM21 |
(17444) 0xc0c93f VFMADD213PS %YMM5,%YMM31,%YMM21 |
(17444) 0xc0c945 VMULPS %YMM31,%YMM22,%YMM23 |
(17444) 0xc0c94b VFMADD213PS %YMM10,%YMM4,%YMM25 |
(17444) 0xc0c951 VFMADD213PS %YMM10,%YMM4,%YMM16 |
(17444) 0xc0c957 VFMADD213PS %YMM10,%YMM4,%YMM15 |
(17444) 0xc0c95c VFMADD213PS %YMM10,%YMM4,%YMM31 |
(17444) 0xc0c962 VFMADD231PS %YMM6,%YMM9,%YMM25 |
(17444) 0xc0c968 VFMADD231PS %YMM6,%YMM9,%YMM16 |
(17444) 0xc0c96e VFMADD231PS %YMM6,%YMM9,%YMM15 |
(17444) 0xc0c973 VMULPS %YMM20,%YMM20,%YMM20 |
(17444) 0xc0c979 VMULPS %YMM12,%YMM12,%YMM12 |
(17444) 0xc0c97e VMULPS %YMM19,%YMM19,%YMM19 |
(17444) 0xc0c984 VMULPS %YMM21,%YMM21,%YMM21 |
(17444) 0xc0c98a VFMADD231PS %YMM6,%YMM9,%YMM31 |
(17444) 0xc0c990 VFMADD231PS %YMM0,%YMM0,%YMM20 |
(17444) 0xc0c996 VFMADD231PS %YMM24,%YMM24,%YMM12 |
(17444) 0xc0c99c VFMADD231PS %YMM17,%YMM17,%YMM19 |
(17444) 0xc0c9a2 VFMADD231PS %YMM23,%YMM23,%YMM21 |
(17444) 0xc0c9a8 VFMADD231PS %YMM25,%YMM25,%YMM20 |
(17444) 0xc0c9ae VFMADD231PS %YMM16,%YMM16,%YMM12 |
(17444) 0xc0c9b4 VFMADD231PS %YMM15,%YMM15,%YMM19 |
(17444) 0xc0c9ba VFMADD231PS %YMM31,%YMM31,%YMM21 |
(17444) 0xc0c9c0 VMULPS %YMM20,%YMM18,%YMM0 |
(17444) 0xc0c9c6 VMULPS %YMM12,%YMM18,%YMM15 |
(17444) 0xc0c9cc VMULPS %YMM19,%YMM18,%YMM16 |
(17444) 0xc0c9d2 VMULPS %YMM21,%YMM18,%YMM17 |
(17444) 0xc0c9d8 VMULPS %YMM0,%YMM14,%YMM0 |
(17444) 0xc0c9dc VMULPS %YMM14,%YMM15,%YMM15 |
(17444) 0xc0c9e1 VMULPS %YMM14,%YMM16,%YMM16 |
(17444) 0xc0c9e7 VMULPS -0x60(%R14,%R11,4),%YMM0,%YMM0 |
(17444) 0xc0c9ee VMULPS %YMM14,%YMM17,%YMM17 |
(17444) 0xc0c9f4 VMULPS -0x40(%R14,%R11,4),%YMM15,%YMM15 |
(17444) 0xc0c9fb VMULPS -0x20(%R14,%R11,4),%YMM16,%YMM16 |
(17444) 0xc0ca03 VMULPS (%R14,%R11,4),%YMM17,%YMM17 |
(17444) 0xc0ca0a VMOVUPS %YMM0,-0x60(%RBX,%R11,4) |
(17444) 0xc0ca11 VMOVUPS %YMM15,-0x40(%RBX,%R11,4) |
(17444) 0xc0ca18 VMOVUPS %YMM16,-0x20(%RBX,%R11,4) |
(17444) 0xc0ca20 VMULPS %YMM2,%YMM20,%YMM0 |
(17444) 0xc0ca26 VMULPS %YMM2,%YMM12,%YMM12 |
(17444) 0xc0ca2a VMULPS %YMM2,%YMM19,%YMM15 |
(17444) 0xc0ca30 VMULPS %YMM2,%YMM21,%YMM16 |
(17444) 0xc0ca36 VMOVUPS %YMM17,(%RBX,%R11,4) |
(17444) 0xc0ca3d VMOVUPS %YMM0,-0x60(%RCX,%R11,4) |
(17444) 0xc0ca44 VMOVUPS %YMM12,-0x40(%RCX,%R11,4) |
(17444) 0xc0ca4b VMOVUPS %YMM15,-0x20(%RCX,%R11,4) |
(17444) 0xc0ca52 VMOVUPS %YMM16,(%RCX,%R11,4) |
(17444) 0xc0ca59 ADD $0x20,%R11 |
(17444) 0xc0ca5d VPADDD -0x8b06f7(%RIP){1to8},%YMM3,%YMM3 |
(17444) 0xc0ca67 CMP %R11,%R9 |
(17444) 0xc0ca6a JNE c0c8d0 |
(17436) 0xc0ca70 CMP %R9,%R13 |
(17436) 0xc0ca73 MOV %EDI,%R11D |
(17436) 0xc0ca76 VMOVAPS 0x280(%RSP),%XMM19 |
(17436) 0xc0ca7e VMOVSS 0x90(%RSP),%XMM24 |
(17436) 0xc0ca86 VMOVDQA64 0x270(%RSP),%XMM21 |
(17436) 0xc0ca8e VMOVSD 0xf8(%RSP),%XMM23 |
(17436) 0xc0ca96 VMOVAPS 0x380(%RSP),%ZMM25 |
(17436) 0xc0ca9e MOV 0x20(%RSP),%RDI |
(17436) 0xc0caa3 VMOVAPS %YMM22,%YMM31 |
(17436) 0xc0caa9 VMOVAPS 0x260(%RSP),%XMM22 |
(17436) 0xc0cab1 VMOVAPS %YMM4,%YMM17 |
(17436) 0xc0cab7 VMOVAPS 0x150(%RSP),%XMM4 |
(17436) 0xc0cac0 VMOVAPS %YMM6,%YMM18 |
(17436) 0xc0cac6 VMOVAPS 0x140(%RSP),%XMM6 |
(17436) 0xc0cacf VMOVAPS %YMM2,%YMM15 |
(17436) 0xc0cad3 VMOVAPS 0x250(%RSP),%XMM2 |
(17436) 0xc0cadc MOV 0x120(%RSP),%R9 |
(17436) 0xc0cae4 VMOVDQA64 0x220(%RSP),%YMM16 |
(17436) 0xc0caec MOV 0x48(%RSP),%R14 |
(17436) 0xc0caf1 VMOVSS -0x8b096d(%RIP),%XMM12 |
(17436) 0xc0caf9 VMOVAPS -0x8a7b61(%RIP),%YMM14 |
(17436) 0xc0cb01 VMOVAPS -0x8a7129(%RIP),%YMM10 |
(17436) 0xc0cb09 VMOVSS 0x2c(%RSP),%XMM20 |
(17436) 0xc0cb11 JNE c0d00f |
(17436) 0xc0cb17 JMP c0d139 |
(17436) 0xc0cb1c MOV %RDX,%RSI |
(17436) 0xc0cb1f VMOVSS -0x8b099b(%RIP),%XMM12 |
(17436) 0xc0cb27 VMOVAPS -0x8a7b8f(%RIP),%YMM14 |
(17436) 0xc0cb2f VMOVAPS -0x8a7157(%RIP),%YMM10 |
(17436) 0xc0cb37 MOV 0xa8(%RSP),%RCX |
(17436) 0xc0cb3f LEA (%RCX,%RSI,4),%RCX |
(17436) 0xc0cb43 MOV 0xa0(%RSP),%RDX |
(17436) 0xc0cb4b LEA (%RDX,%RSI,4),%RDX |
(17436) 0xc0cb4f MOV 0xb0(%RSP),%RDI |
(17436) 0xc0cb57 LEA (%RDI,%RSI,4),%R9 |
(17436) 0xc0cb5b MOV 0x58(%RSP),%RDI |
(17436) 0xc0cb60 LEA (%RDI,%RSI,4),%R11 |
(17436) 0xc0cb64 LEA (%R10,%RSI,4),%RBX |
(17436) 0xc0cb68 MOV 0x48(%RSP),%RDI |
(17436) 0xc0cb6d LEA (%RDI,%RSI,4),%R14 |
(17436) 0xc0cb71 LEA (%R12,%RSI,4),%R13 |
(17436) 0xc0cb75 MOV 0x110(%RSP),%RDI |
(17436) 0xc0cb7d LEA (%RDI,%RSI,1),%R8 |
(17436) 0xc0cb81 XOR %EDI,%EDI |
(17436) 0xc0cb83 NOPW %CS:(%RAX,%RAX,1) |
(17455) 0xc0cb90 LEA (%RSI,%RDI,1),%R10D |
(17455) 0xc0cb94 VCVTSI2SS %R10D,%XMM1,%XMM0 |
(17455) 0xc0cb99 VMULSS %XMM0,%XMM22,%XMM3 |
(17455) 0xc0cb9f VMOVAPS %XMM2,%XMM5 |
(17455) 0xc0cba3 VFMADD213SS %XMM8,%XMM0,%XMM5 |
(17455) 0xc0cba8 VFMADD213SS %XMM13,%XMM4,%XMM0 |
(17455) 0xc0cbad VFMADD231SS %XMM6,%XMM26,%XMM0 |
(17455) 0xc0cbb3 VMULSS %XMM5,%XMM5,%XMM9 |
(17455) 0xc0cbb7 VFMADD231SS %XMM3,%XMM3,%XMM9 |
(17455) 0xc0cbbc VFMADD231SS %XMM0,%XMM0,%XMM9 |
(17455) 0xc0cbc1 VMOVSS %XMM3,(%RCX,%RDI,4) |
(17455) 0xc0cbc6 VMOVSS %XMM5,(%RDX,%RDI,4) |
(17455) 0xc0cbcb VMOVSS %XMM0,(%R9,%RDI,4) |
(17455) 0xc0cbd1 VMOVSS %XMM9,(%R11,%RDI,4) |
(17455) 0xc0cbd7 VMULSS %XMM9,%XMM27,%XMM0 |
(17455) 0xc0cbdd VMULSS %XMM7,%XMM0,%XMM0 |
(17455) 0xc0cbe1 VMULSS (%RBX,%RDI,4),%XMM0,%XMM0 |
(17455) 0xc0cbe6 VMOVSS %XMM0,(%R14,%RDI,4) |
(17455) 0xc0cbec VMULSS %XMM11,%XMM9,%XMM0 |
(17455) 0xc0cbf1 VMOVSS %XMM0,(%R13,%RDI,4) |
(17455) 0xc0cbf8 INC %RDI |
(17455) 0xc0cbfb MOV %R8,%R10 |
(17455) 0xc0cbfe ADD %RDI,%R10 |
(17455) 0xc0cc01 JNE c0cb90 |
(17436) 0xc0cc03 MOV 0x60(%RSP),%ECX |
(17436) 0xc0cc07 CMP 0x64(%RSP),%ECX |
(17436) 0xc0cc0b JGE c0cd10 |
(17436) 0xc0cc11 VMULSS 0x54(%RSP),%XMM20,%XMM8 |
(17436) 0xc0cc19 VMULSS %XMM20,%XMM24,%XMM13 |
(17436) 0xc0cc1f MOV 0x30(%RSP),%RCX |
(17436) 0xc0cc24 MOV 0x5f8(%RCX),%RDX |
(17436) 0xc0cc2b MOV 0x70(%RSP),%RDI |
(17436) 0xc0cc30 CMPQ $0x8,0x98(%RSP) |
(17436) 0xc0cc39 JAE c0cd75 |
(17436) 0xc0cc3f MOV 0x108(%RSP),%RCX |
(17436) 0xc0cc47 ADD %EDI,%ECX |
(17436) 0xc0cc49 MOV 0xa8(%RSP),%RSI |
(17436) 0xc0cc51 LEA (%RSI,%RDI,4),%RSI |
(17436) 0xc0cc55 MOV 0xa0(%RSP),%R8 |
(17436) 0xc0cc5d LEA (%R8,%RDI,4),%R9 |
(17436) 0xc0cc61 MOV 0xb0(%RSP),%R8 |
(17436) 0xc0cc69 LEA (%R8,%RDI,4),%R11 |
(17436) 0xc0cc6d MOV 0x58(%RSP),%R8 |
(17436) 0xc0cc72 LEA (%R8,%RDI,4),%RBX |
(17436) 0xc0cc76 LEA (%RDX,%RDI,4),%RDX |
(17436) 0xc0cc7a MOV 0x48(%RSP),%R8 |
(17436) 0xc0cc7f LEA (%R8,%RDI,4),%R14 |
(17436) 0xc0cc83 LEA (%R12,%RDI,4),%R13 |
(17436) 0xc0cc87 MOV 0x20(%RSP),%R8 |
(17436) 0xc0cc8c SUB %RDI,%R8 |
(17436) 0xc0cc8f XOR %EDI,%EDI |
(17436) 0xc0cc91 NOPW %CS:(%RAX,%RAX,1) |
(17453) 0xc0cca0 LEA (%RCX,%RDI,1),%R10D |
(17453) 0xc0cca4 VCVTSI2SS %R10D,%XMM1,%XMM0 |
(17453) 0xc0cca9 VMULSS %XMM0,%XMM22,%XMM3 |
(17453) 0xc0ccaf VMOVAPS %XMM2,%XMM5 |
(17453) 0xc0ccb3 VFMADD213SS %XMM8,%XMM0,%XMM5 |
(17453) 0xc0ccb8 VFMADD213SS %XMM13,%XMM4,%XMM0 |
(17453) 0xc0ccbd VFMADD231SS %XMM6,%XMM26,%XMM0 |
(17453) 0xc0ccc3 VMULSS %XMM5,%XMM5,%XMM9 |
(17453) 0xc0ccc7 VFMADD231SS %XMM3,%XMM3,%XMM9 |
(17453) 0xc0cccc VFMADD231SS %XMM0,%XMM0,%XMM9 |
(17453) 0xc0ccd1 VMOVSS %XMM3,(%RSI,%RDI,4) |
(17453) 0xc0ccd6 VMOVSS %XMM5,(%R9,%RDI,4) |
(17453) 0xc0ccdc VMOVSS %XMM0,(%R11,%RDI,4) |
(17453) 0xc0cce2 VMOVSS %XMM9,(%RBX,%RDI,4) |
(17453) 0xc0cce7 VMULSS %XMM9,%XMM27,%XMM0 |
(17453) 0xc0cced VMULSS %XMM7,%XMM0,%XMM0 |
(17453) 0xc0ccf1 VMULSS (%RDX,%RDI,4),%XMM0,%XMM0 |
(17453) 0xc0ccf6 VMOVSS %XMM0,(%R14,%RDI,4) |
(17453) 0xc0ccfc VMULSS %XMM11,%XMM9,%XMM0 |
(17453) 0xc0cd01 VMOVSS %XMM0,(%R13,%RDI,4) |
(17453) 0xc0cd08 INC %RDI |
(17453) 0xc0cd0b CMP %RDI,%R8 |
(17453) 0xc0cd0e JNE c0cca0 |
(17436) 0xc0cd10 MOV 0x40(%RSP),%R10 |
(17436) 0xc0cd15 CMP %R10D,0xb8(%RSP) |
(17436) 0xc0cd1d MOV 0x20(%RSP),%RDI |
(17436) 0xc0cd22 MOV 0x58(%RSP),%R14 |
(17436) 0xc0cd27 VMOVSD -0x8aff71(%RIP),%XMM26 |
(17436) 0xc0cd31 VMOVAPS -0x88907b(%RIP),%ZMM13 |
(17436) 0xc0cd3b VXORPS %XMM27,%XMM27,%XMM27 |
(17436) 0xc0cd41 MOV 0x2c(%RSP),%EBX |
(17436) 0xc0cd45 JLE c0d8a4 |
(17436) 0xc0cd4b MOVSXD 0x18(%RSP),%RDX |
(17436) 0xc0cd50 LEA 0x1(%RDX),%RCX |
(17436) 0xc0cd54 CMP %RDI,%RCX |
(17436) 0xc0cd57 CMOVLE %RDI,%RCX |
(17436) 0xc0cd5b SUB %RDX,%RCX |
(17436) 0xc0cd5e CMP $0x4,%RCX |
(17436) 0xc0cd62 JAE c0cfca |
(17436) 0xc0cd68 MOV %RDX,%R9 |
(17436) 0xc0cd6b MOV 0x68(%RSP),%RCX |
(17436) 0xc0cd70 JMP c0d890 |
(17436) 0xc0cd75 MOV 0x100(%RSP),%RCX |
(17436) 0xc0cd7d LEA (%RCX,%RDX,1),%RSI |
(17436) 0xc0cd81 MOV $0x20,%CL |
(17436) 0xc0cd83 KMOVD %ECX,%K1 |
(17436) 0xc0cd87 VMOVDQA64 0x3c0(%RSP),%ZMM0 |
(17436) 0xc0cd8f VPBROADCASTQ %RSI,%ZMM0{%K1} |
(17436) 0xc0cd95 VPBROADCASTQ %RSI,%ZMM3 |
(17436) 0xc0cd9b VMOVDQA64 -0x889065(%RIP),%ZMM5 |
(17436) 0xc0cda5 VPERMQ %ZMM0,%ZMM5,%ZMM5 |
(17436) 0xc0cdab VPSUBQ 0x400(%RSP),%ZMM5,%ZMM5 |
(17436) 0xc0cdb3 VMOVDQA64 -0x88903d(%RIP),%ZMM9 |
(17436) 0xc0cdbd VPERMQ %ZMM0,%ZMM9,%ZMM0 |
(17436) 0xc0cdc3 VPSUBQ 0x440(%RSP),%ZMM0,%ZMM0 |
(17436) 0xc0cdcb VPBROADCASTQ -0x8afb75(%RIP),%ZMM9 |
(17436) 0xc0cdd5 VPCMPLTUQ %ZMM9,%ZMM5,%K0 |
(17436) 0xc0cddc VPCMPLTUQ %ZMM9,%ZMM0,%K1 |
(17436) 0xc0cde3 KUNPCKBW %K0,%K1,%K0 |
(17436) 0xc0cde7 VPMOVM2B %K0,%XMM0 |
(17436) 0xc0cded XOR %ECX,%ECX |
(17436) 0xc0cdef VPTEST %XMM0,%XMM0 |
(17436) 0xc0cdf4 SETE %R8B |
(17436) 0xc0cdf8 VMOVDQA 0x320(%RSP),%YMM5 |
(17436) 0xc0ce01 VPINSRQ $0x1,%RSI,%XMM5,%XMM0 |
(17436) 0xc0ce07 VPBLENDD $0xf,%YMM0,%YMM5,%YMM0 |
(17436) 0xc0ce0d VPERMQ $-0x3c,%YMM0,%YMM0 |
(17436) 0xc0ce13 VMOVDQA 0x300(%RSP),%YMM5 |
(17436) 0xc0ce1c VMOVDQA -0x8a13a4(%RIP),%YMM10 |
(17436) 0xc0ce24 VPERMT2Q %YMM3,%YMM10,%YMM5 |
(17436) 0xc0ce2a VMOVAPS -0x8a7452(%RIP),%YMM10 |
(17436) 0xc0ce32 VPSUBQ %YMM5,%YMM0,%YMM0 |
(17436) 0xc0ce36 VPCMPLTUQ %YMM9,%YMM0,%K0 |
(17436) 0xc0ce3d VPMOVM2D %K0,%XMM0 |
(17436) 0xc0ce43 XOR %R9D,%R9D |
(17436) 0xc0ce46 VPTEST %XMM0,%XMM0 |
(17436) 0xc0ce4b SETE %R11B |
(17436) 0xc0ce4f MOV 0x1e8(%RSP),%RBX |
(17436) 0xc0ce57 SUB %RSI,%RBX |
(17436) 0xc0ce5a MOV 0x70(%RSP),%RDI |
(17436) 0xc0ce5f CMP $0x20,%RBX |
(17436) 0xc0ce63 JB c0cc3f |
(17436) 0xc0ce69 MOV %R11B,%R9B |
(17436) 0xc0ce6c MOV 0x70(%RSP),%RDI |
(17436) 0xc0ce71 TEST %R9D,%R9D |
(17436) 0xc0ce74 JE c0cc3f |
(17436) 0xc0ce7a MOV %R8B,%CL |
(17436) 0xc0ce7d MOV 0x70(%RSP),%RDI |
(17436) 0xc0ce82 TEST %ECX,%ECX |
(17436) 0xc0ce84 JE c0cc3f |
(17436) 0xc0ce8a VBROADCASTSS %XMM8,%YMM3 |
(17436) 0xc0ce8f VBROADCASTSS %XMM13,%YMM5 |
(17436) 0xc0ce94 VBROADCASTSS %XMM26,%YMM9 |
(17436) 0xc0ce9a VBROADCASTSS %XMM27,%YMM10 |
(17436) 0xc0cea0 VBROADCASTSS %XMM7,%YMM14 |
(17436) 0xc0cea5 XOR %ECX,%ECX |
(17436) 0xc0cea7 VMOVAPS %YMM17,%YMM4 |
(17436) 0xc0cead VMOVDQA64 0x2c0(%RSP),%YMM17 |
(17436) 0xc0ceb5 MOV 0x1a8(%RSP),%R8 |
(17436) 0xc0cebd MOV 0xf0(%RSP),%RDI |
(17436) 0xc0cec5 MOV 0xe8(%RSP),%R9 |
(17436) 0xc0cecd MOV 0x198(%RSP),%R10 |
(17436) 0xc0ced5 MOV 0x190(%RSP),%R11 |
(17436) 0xc0cedd MOV 0x188(%RSP),%RBX |
(17436) 0xc0cee5 MOV 0x180(%RSP),%R14 |
(17436) 0xc0ceed NOPL (%RAX) |
(17454) 0xc0cef0 VPSUBD %YMM16,%YMM17,%YMM0 |
(17454) 0xc0cef6 VCVTDQ2PS %YMM0,%YMM0 |
(17454) 0xc0cefa VMULPS %YMM0,%YMM31,%YMM12 |
(17454) 0xc0cf00 VMOVAPS %YMM1,%YMM15 |
(17454) 0xc0cf04 VFMADD213PS %YMM3,%YMM0,%YMM15 |
(17454) 0xc0cf09 VFMADD213PS %YMM5,%YMM4,%YMM0 |
(17454) 0xc0cf0e VFMADD231PS %YMM18,%YMM9,%YMM0 |
(17454) 0xc0cf14 VMULPS %YMM15,%YMM15,%YMM16 |
(17454) 0xc0cf1a VFMADD231PS %YMM12,%YMM12,%YMM16 |
(17454) 0xc0cf20 VMOVUPS %YMM12,(%R10,%RCX,4) |
(17454) 0xc0cf26 VMOVUPS %YMM15,(%R11,%RCX,4) |
(17454) 0xc0cf2c VMOVAPS 0x2a0(%RSP),%YMM15 |
(17454) 0xc0cf35 VFMADD231PS %YMM0,%YMM0,%YMM16 |
(17454) 0xc0cf3b VMOVUPS %YMM0,(%RBX,%RCX,4) |
(17454) 0xc0cf40 VMOVUPS %YMM16,(%R14,%RCX,4) |
(17454) 0xc0cf47 VMULPS %YMM16,%YMM10,%YMM0 |
(17454) 0xc0cf4d VMULPS %YMM0,%YMM14,%YMM0 |
(17454) 0xc0cf51 VMULPS (%RSI,%RCX,4),%YMM0,%YMM0 |
(17454) 0xc0cf56 VMOVUPS %YMM0,-0x60(%RDI,%RCX,4) |
(17454) 0xc0cf5c VMULPS %YMM15,%YMM16,%YMM0 |
(17454) 0xc0cf62 VMOVDQA64 0x220(%RSP),%YMM16 |
(17454) 0xc0cf6a VMOVUPS %YMM0,-0x60(%R9,%RCX,4) |
(17454) 0xc0cf71 ADD $0x8,%RCX |
(17454) 0xc0cf75 VPADDD -0x8b0e53(%RIP){1to8},%YMM17,%YMM17 |
(17454) 0xc0cf7f CMP %RCX,%R8 |
(17454) 0xc0cf82 JNE c0cef0 |
(17436) 0xc0cf88 MOV 0x1a0(%RSP),%RDI |
(17436) 0xc0cf90 CMP %R8,0x98(%RSP) |
(17436) 0xc0cf98 VMOVAPS %YMM4,%YMM17 |
(17436) 0xc0cf9e VMOVAPS 0x150(%RSP),%XMM4 |
(17436) 0xc0cfa7 VMOVSS -0x8b0e23(%RIP),%XMM12 |
(17436) 0xc0cfaf VMOVAPS -0x8a8017(%RIP),%YMM14 |
(17436) 0xc0cfb7 VMOVAPS -0x8a75df(%RIP),%YMM10 |
(17436) 0xc0cfbf JNE c0cc3f |
(17436) 0xc0cfc5 JMP c0cd10 |
(17436) 0xc0cfca MOV 0x68(%RSP),%R9 |
(17436) 0xc0cfcf LEA (%R9,%RDX,4),%RSI |
(17436) 0xc0cfd3 LEA (%R14,%RDX,4),%RDI |
(17436) 0xc0cfd7 SUB %RDI,%RSI |
(17436) 0xc0cfda CMP $0x80,%RSI |
(17436) 0xc0cfe1 JAE c0cff3 |
(17436) 0xc0cfe3 MOV %R9,%RCX |
(17436) 0xc0cfe6 MOV %RDX,%R9 |
(17436) 0xc0cfe9 MOV 0x20(%RSP),%RDI |
(17436) 0xc0cfee JMP c0d890 |
(17436) 0xc0cff3 CMP $0x20,%RCX |
(17436) 0xc0cff7 JAE c0d793 |
(17436) 0xc0cffd XOR %ESI,%ESI |
(17436) 0xc0cfff JMP c0d81f |
(17436) 0xc0d004 MOV %RCX,%RSI |
(17436) 0xc0d007 VMOVSS 0x2c(%RSP),%XMM20 |
(17436) 0xc0d00f MOV 0x60(%RSP),%ECX |
(17436) 0xc0d013 MOV %ECX,%EDI |
(17436) 0xc0d015 SUB %ESI,%EDI |
(17436) 0xc0d017 MOV %RSI,%RCX |
(17436) 0xc0d01a TEST $0x1,%DIL |
(17436) 0xc0d01e JE c0d06f |
(17436) 0xc0d020 VCVTSI2SS %ESI,%XMM1,%XMM0 |
(17436) 0xc0d024 VMULSS %XMM0,%XMM22,%XMM3 |
(17436) 0xc0d02a VMOVAPS %XMM2,%XMM5 |
(17436) 0xc0d02e VFMADD213SS %XMM13,%XMM0,%XMM5 |
(17436) 0xc0d033 VFMADD213SS %XMM8,%XMM4,%XMM0 |
(17436) 0xc0d038 VFMADD231SS %XMM6,%XMM26,%XMM0 |
(17436) 0xc0d03e VMULSS %XMM5,%XMM5,%XMM5 |
(17436) 0xc0d042 VFMADD231SS %XMM3,%XMM3,%XMM5 |
(17436) 0xc0d047 VFMADD231SS %XMM0,%XMM0,%XMM5 |
(17436) 0xc0d04c VMULSS %XMM5,%XMM27,%XMM0 |
(17436) 0xc0d052 VMULSS %XMM7,%XMM0,%XMM0 |
(17436) 0xc0d056 VMULSS (%RDX,%RSI,4),%XMM0,%XMM0 |
(17436) 0xc0d05b VMOVSS %XMM0,(%R14,%RSI,4) |
(17436) 0xc0d061 VMULSS %XMM5,%XMM11,%XMM0 |
(17436) 0xc0d065 VMOVSS %XMM0,(%R12,%RSI,4) |
(17436) 0xc0d06b LEA 0x1(%RSI),%RCX |
(17436) 0xc0d06f NOT %RSI |
(17436) 0xc0d072 CMP 0x110(%RSP),%RSI |
(17436) 0xc0d07a MOV 0x20(%RSP),%RDI |
(17436) 0xc0d07f JE c0d139 |
(17436) 0xc0d085 NOPW %CS:(%RAX,%RAX,1) |
(17443) 0xc0d090 VCVTSI2SS %ECX,%XMM1,%XMM0 |
(17443) 0xc0d094 VMULSS %XMM0,%XMM22,%XMM3 |
(17443) 0xc0d09a VMOVAPS %XMM2,%XMM5 |
(17443) 0xc0d09e VFMADD213SS %XMM13,%XMM0,%XMM5 |
(17443) 0xc0d0a3 VFMADD213SS %XMM8,%XMM4,%XMM0 |
(17443) 0xc0d0a8 VFMADD231SS %XMM6,%XMM26,%XMM0 |
(17443) 0xc0d0ae VMULSS %XMM5,%XMM5,%XMM5 |
(17443) 0xc0d0b2 VFMADD231SS %XMM3,%XMM3,%XMM5 |
(17443) 0xc0d0b7 VFMADD231SS %XMM0,%XMM0,%XMM5 |
(17443) 0xc0d0bc VMULSS %XMM5,%XMM27,%XMM0 |
(17443) 0xc0d0c2 VMULSS %XMM7,%XMM0,%XMM0 |
(17443) 0xc0d0c6 VMULSS (%RDX,%RCX,4),%XMM0,%XMM0 |
(17443) 0xc0d0cb VMOVSS %XMM0,(%R14,%RCX,4) |
(17443) 0xc0d0d1 VMULSS %XMM5,%XMM11,%XMM0 |
(17443) 0xc0d0d5 VMOVSS %XMM0,(%R12,%RCX,4) |
(17443) 0xc0d0db LEA 0x1(%RCX),%ESI |
(17443) 0xc0d0de VCVTSI2SS %ESI,%XMM1,%XMM0 |
(17443) 0xc0d0e2 VMULSS %XMM0,%XMM22,%XMM3 |
(17443) 0xc0d0e8 VMOVAPS %XMM2,%XMM5 |
(17443) 0xc0d0ec VFMADD213SS %XMM13,%XMM0,%XMM5 |
(17443) 0xc0d0f1 VFMADD213SS %XMM8,%XMM4,%XMM0 |
(17443) 0xc0d0f6 VFMADD231SS %XMM6,%XMM26,%XMM0 |
(17443) 0xc0d0fc VMULSS %XMM5,%XMM5,%XMM5 |
(17443) 0xc0d100 VFMADD231SS %XMM3,%XMM3,%XMM5 |
(17443) 0xc0d105 VFMADD231SS %XMM0,%XMM0,%XMM5 |
(17443) 0xc0d10a VMULSS %XMM5,%XMM27,%XMM0 |
(17443) 0xc0d110 VMULSS %XMM7,%XMM0,%XMM0 |
(17443) 0xc0d114 VMULSS 0x4(%RDX,%RCX,4),%XMM0,%XMM0 |
(17443) 0xc0d11a VMOVSS %XMM0,0x4(%R14,%RCX,4) |
(17443) 0xc0d121 VMULSS %XMM5,%XMM11,%XMM0 |
(17443) 0xc0d125 VMOVSS %XMM0,0x4(%R12,%RCX,4) |
(17443) 0xc0d12c ADD $0x2,%RCX |
(17443) 0xc0d130 CMP %R8,%RCX |
(17443) 0xc0d133 JNE c0d090 |
(17436) 0xc0d139 MOV 0x60(%RSP),%ECX |
(17436) 0xc0d13d CMP 0x64(%RSP),%ECX |
(17436) 0xc0d141 JGE c0d58d |
(17436) 0xc0d147 VMULSS 0x54(%RSP),%XMM20,%XMM8 |
(17436) 0xc0d14f VMULSS %XMM20,%XMM24,%XMM13 |
(17436) 0xc0d155 MOV 0x30(%RSP),%RCX |
(17436) 0xc0d15a MOV 0x5f8(%RCX),%RDX |
(17436) 0xc0d161 MOV %R8,%RSI |
(17436) 0xc0d164 CMPQ $0x20,0x98(%RSP) |
(17436) 0xc0d16d JB c0d450 |
(17436) 0xc0d173 MOV 0x100(%RSP),%RCX |
(17436) 0xc0d17b ADD %RDX,%RCX |
(17436) 0xc0d17e VMOVQ %RCX,%XMM0 |
(17436) 0xc0d183 VMOVDQA -0x8ad19b(%RIP),%XMM3 |
(17436) 0xc0d18b VMOVDQA 0x340(%RSP),%YMM5 |
(17436) 0xc0d194 VPERMI2Q %YMM5,%YMM0,%YMM3 |
(17436) 0xc0d19a VPSUBQ %YMM3,%YMM5,%YMM0 |
(17436) 0xc0d19e VPCMPLTUQ -0x8afa09(%RIP){1to0},%YMM0,%K0 |
(17436) 0xc0d1a9 VPMOVM2D %K0,%XMM0 |
(17436) 0xc0d1af VPTEST %XMM0,%XMM0 |
(17436) 0xc0d1b4 MOV %R8,%RSI |
(17436) 0xc0d1b7 JNE c0d450 |
(17436) 0xc0d1bd VBROADCASTSS %XMM8,%YMM3 |
(17436) 0xc0d1c2 VBROADCASTSS %XMM13,%YMM5 |
(17436) 0xc0d1c7 VBROADCASTSS %XMM26,%YMM9 |
(17436) 0xc0d1cd VBROADCASTSS %XMM27,%YMM10 |
(17436) 0xc0d1d3 VBROADCASTSS %XMM7,%YMM14 |
(17436) 0xc0d1d8 MOV 0x1c0(%RSP),%RCX |
(17436) 0xc0d1e0 LEA (%RDX,%RCX,1),%RSI |
(17436) 0xc0d1e4 XOR %ECX,%ECX |
(17436) 0xc0d1e6 VMOVAPS %YMM17,%YMM4 |
(17436) 0xc0d1ec VMOVDQA64 0x2c0(%RSP),%YMM17 |
(17436) 0xc0d1f4 VMOVAPS %YMM18,%YMM6 |
(17436) 0xc0d1fa VMOVAPS %YMM15,%YMM2 |
(17436) 0xc0d1fe MOV 0xf0(%RSP),%R10 |
(17436) 0xc0d206 MOV 0xe8(%RSP),%RBX |
(17436) 0xc0d20e XCHG %AX,%AX |
(17442) 0xc0d210 VPSUBD %YMM16,%YMM17,%YMM0 |
(17442) 0xc0d216 VPADDD -0x8b10f4(%RIP){1to8},%YMM0,%YMM12 |
(17442) 0xc0d220 VPADDD -0x8b0cbe(%RIP){1to8},%YMM0,%YMM15 |
(17442) 0xc0d22a VPADDD -0x8b1078(%RIP){1to8},%YMM0,%YMM16 |
(17442) 0xc0d234 VCVTDQ2PS %YMM0,%YMM0 |
(17442) 0xc0d238 VCVTDQ2PS %YMM12,%YMM12 |
(17442) 0xc0d23d VCVTDQ2PS %YMM15,%YMM15 |
(17442) 0xc0d242 VCVTDQ2PS %YMM16,%YMM16 |
(17442) 0xc0d248 VMULPS %YMM0,%YMM31,%YMM18 |
(17442) 0xc0d24e VMULPS %YMM12,%YMM31,%YMM19 |
(17442) 0xc0d254 VMULPS %YMM15,%YMM31,%YMM20 |
(17442) 0xc0d25a VMOVAPS %YMM1,%YMM21 |
(17442) 0xc0d260 VFMADD213PS %YMM3,%YMM0,%YMM21 |
(17442) 0xc0d266 VMOVAPS %YMM1,%YMM23 |
(17442) 0xc0d26c VFMADD213PS %YMM3,%YMM12,%YMM23 |
(17442) 0xc0d272 VMOVAPS %YMM1,%YMM24 |
(17442) 0xc0d278 VFMADD213PS %YMM3,%YMM15,%YMM24 |
(17442) 0xc0d27e VMOVAPS %YMM1,%YMM25 |
(17442) 0xc0d284 VFMADD213PS %YMM3,%YMM16,%YMM25 |
(17442) 0xc0d28a VMOVAPS %YMM31,%YMM22 |
(17442) 0xc0d290 VMULPS %YMM16,%YMM31,%YMM31 |
(17442) 0xc0d296 VFMADD213PS %YMM5,%YMM4,%YMM0 |
(17442) 0xc0d29b VFMADD213PS %YMM5,%YMM4,%YMM12 |
(17442) 0xc0d2a0 VFMADD213PS %YMM5,%YMM4,%YMM15 |
(17442) 0xc0d2a5 VFMADD213PS %YMM5,%YMM4,%YMM16 |
(17442) 0xc0d2ab VFMADD231PS %YMM6,%YMM9,%YMM0 |
(17442) 0xc0d2b0 VFMADD231PS %YMM6,%YMM9,%YMM12 |
(17442) 0xc0d2b5 VFMADD231PS %YMM6,%YMM9,%YMM15 |
(17442) 0xc0d2ba VMULPS %YMM21,%YMM21,%YMM21 |
(17442) 0xc0d2c0 VMULPS %YMM23,%YMM23,%YMM23 |
(17442) 0xc0d2c6 VMULPS %YMM24,%YMM24,%YMM24 |
(17442) 0xc0d2cc VMULPS %YMM25,%YMM25,%YMM25 |
(17442) 0xc0d2d2 VFMADD231PS %YMM6,%YMM9,%YMM16 |
(17442) 0xc0d2d8 VFMADD231PS %YMM18,%YMM18,%YMM21 |
(17442) 0xc0d2de VFMADD231PS %YMM19,%YMM19,%YMM23 |
(17442) 0xc0d2e4 VFMADD231PS %YMM20,%YMM20,%YMM24 |
(17442) 0xc0d2ea VFMADD231PS %YMM31,%YMM31,%YMM25 |
(17442) 0xc0d2f0 VMOVAPS %YMM22,%YMM31 |
(17442) 0xc0d2f6 VFMADD231PS %YMM0,%YMM0,%YMM21 |
(17442) 0xc0d2fc VFMADD231PS %YMM12,%YMM12,%YMM23 |
(17442) 0xc0d302 VFMADD231PS %YMM15,%YMM15,%YMM24 |
(17442) 0xc0d308 VFMADD231PS %YMM16,%YMM16,%YMM25 |
(17442) 0xc0d30e VMULPS %YMM21,%YMM10,%YMM0 |
(17442) 0xc0d314 VMULPS %YMM23,%YMM10,%YMM12 |
(17442) 0xc0d31a VMULPS %YMM24,%YMM10,%YMM15 |
(17442) 0xc0d320 VMULPS %YMM25,%YMM10,%YMM16 |
(17442) 0xc0d326 VMULPS %YMM0,%YMM14,%YMM0 |
(17442) 0xc0d32a VMULPS %YMM14,%YMM12,%YMM12 |
(17442) 0xc0d32f VMULPS %YMM14,%YMM15,%YMM15 |
(17442) 0xc0d334 VMULPS -0x60(%RSI,%RCX,4),%YMM0,%YMM0 |
(17442) 0xc0d33a VMULPS %YMM14,%YMM16,%YMM16 |
(17442) 0xc0d340 VMULPS -0x40(%RSI,%RCX,4),%YMM12,%YMM12 |
(17442) 0xc0d346 VMULPS -0x20(%RSI,%RCX,4),%YMM15,%YMM15 |
(17442) 0xc0d34c VMULPS (%RSI,%RCX,4),%YMM16,%YMM16 |
(17442) 0xc0d353 VMOVUPS %YMM0,-0x60(%R10,%RCX,4) |
(17442) 0xc0d35a VMOVUPS %YMM12,-0x40(%R10,%RCX,4) |
(17442) 0xc0d361 VMOVUPS %YMM15,-0x20(%R10,%RCX,4) |
(17442) 0xc0d368 VMULPS %YMM2,%YMM21,%YMM0 |
(17442) 0xc0d36e VMULPS %YMM2,%YMM23,%YMM12 |
(17442) 0xc0d374 VMULPS %YMM2,%YMM24,%YMM15 |
(17442) 0xc0d37a VMULPS %YMM2,%YMM25,%YMM18 |
(17442) 0xc0d380 VMOVUPS %YMM16,(%R10,%RCX,4) |
(17442) 0xc0d387 VMOVDQA64 0x220(%RSP),%YMM16 |
(17442) 0xc0d38f VMOVUPS %YMM0,-0x60(%RBX,%RCX,4) |
(17442) 0xc0d395 VMOVUPS %YMM12,-0x40(%RBX,%RCX,4) |
(17442) 0xc0d39b VMOVUPS %YMM15,-0x20(%RBX,%RCX,4) |
(17442) 0xc0d3a1 VMOVUPS %YMM18,(%RBX,%RCX,4) |
(17442) 0xc0d3a8 ADD $0x20,%RCX |
(17442) 0xc0d3ac VPADDD -0x8b1046(%RIP){1to8},%YMM17,%YMM17 |
(17442) 0xc0d3b6 CMP %RCX,%R9 |
(17442) 0xc0d3b9 JNE c0d210 |
(17436) 0xc0d3bf MOV 0x1d8(%RSP),%RSI |
(17436) 0xc0d3c7 CMP %R9,0x98(%RSP) |
(17436) 0xc0d3cf VMOVAPS 0x280(%RSP),%XMM19 |
(17436) 0xc0d3d7 VMOVSS 0x90(%RSP),%XMM24 |
(17436) 0xc0d3df VMOVDQA64 0x270(%RSP),%XMM21 |
(17436) 0xc0d3e7 VMOVSD 0xf8(%RSP),%XMM23 |
(17436) 0xc0d3ef VMOVAPS 0x380(%RSP),%ZMM25 |
(17436) 0xc0d3f7 VMOVAPS 0x260(%RSP),%XMM22 |
(17436) 0xc0d3ff VMOVAPS %YMM4,%YMM17 |
(17436) 0xc0d405 VMOVAPS 0x150(%RSP),%XMM4 |
(17436) 0xc0d40e VMOVAPS %YMM6,%YMM18 |
(17436) 0xc0d414 VMOVAPS 0x140(%RSP),%XMM6 |
(17436) 0xc0d41d VMOVAPS %YMM2,%YMM15 |
(17436) 0xc0d421 VMOVAPS 0x250(%RSP),%XMM2 |
(17436) 0xc0d42a MOV 0x48(%RSP),%R14 |
(17436) 0xc0d42f VMOVSS -0x8b12ab(%RIP),%XMM12 |
(17436) 0xc0d437 VMOVAPS -0x8a849f(%RIP),%YMM14 |
(17436) 0xc0d43f VMOVAPS -0x8a7a67(%RIP),%YMM10 |
(17436) 0xc0d447 JE c0d58d |
(17436) 0xc0d44d NOPL (%RAX) |
(17436) 0xc0d450 MOV 0x64(%RSP),%ECX |
(17436) 0xc0d454 MOV %ECX,%EDI |
(17436) 0xc0d456 SUB %ESI,%EDI |
(17436) 0xc0d458 MOV %RSI,%RCX |
(17436) 0xc0d45b TEST $0x1,%DIL |
(17436) 0xc0d45f JE c0d4bd |
(17436) 0xc0d461 MOV %ESI,%ECX |
(17436) 0xc0d463 SUB 0xc4(%RSP),%ECX |
(17436) 0xc0d46a VCVTSI2SS %ECX,%XMM1,%XMM0 |
(17436) 0xc0d46e VMULSS %XMM0,%XMM22,%XMM3 |
(17436) 0xc0d474 VMOVAPS %XMM2,%XMM5 |
(17436) 0xc0d478 VFMADD213SS %XMM8,%XMM0,%XMM5 |
(17436) 0xc0d47d VFMADD213SS %XMM13,%XMM4,%XMM0 |
(17436) 0xc0d482 VFMADD231SS %XMM6,%XMM26,%XMM0 |
(17436) 0xc0d488 VMULSS %XMM5,%XMM5,%XMM5 |
(17436) 0xc0d48c VFMADD231SS %XMM3,%XMM3,%XMM5 |
(17436) 0xc0d491 VFMADD231SS %XMM0,%XMM0,%XMM5 |
(17436) 0xc0d496 VMULSS %XMM5,%XMM27,%XMM0 |
(17436) 0xc0d49c VMULSS %XMM7,%XMM0,%XMM0 |
(17436) 0xc0d4a0 VMULSS (%RDX,%RSI,4),%XMM0,%XMM0 |
(17436) 0xc0d4a5 MOV 0x48(%RSP),%RCX |
(17436) 0xc0d4aa VMOVSS %XMM0,(%RCX,%RSI,4) |
(17436) 0xc0d4af VMULSS %XMM5,%XMM11,%XMM0 |
(17436) 0xc0d4b3 VMOVSS %XMM0,(%R12,%RSI,4) |
(17436) 0xc0d4b9 LEA 0x1(%RSI),%RCX |
(17436) 0xc0d4bd NOT %RSI |
(17436) 0xc0d4c0 CMP 0x1f0(%RSP),%RSI |
(17436) 0xc0d4c8 MOV 0x20(%RSP),%RDI |
(17436) 0xc0d4cd MOV 0x108(%RSP),%RBX |
(17436) 0xc0d4d5 MOV 0x48(%RSP),%R14 |
(17436) 0xc0d4da JE c0d58d |
(17441) 0xc0d4e0 LEA (%RBX,%RCX,1),%ESI |
(17441) 0xc0d4e3 VCVTSI2SS %ESI,%XMM1,%XMM0 |
(17441) 0xc0d4e7 VMULSS %XMM0,%XMM22,%XMM3 |
(17441) 0xc0d4ed VMOVAPS %XMM2,%XMM5 |
(17441) 0xc0d4f1 VFMADD213SS %XMM8,%XMM0,%XMM5 |
(17441) 0xc0d4f6 VFMADD213SS %XMM13,%XMM4,%XMM0 |
(17441) 0xc0d4fb VFMADD231SS %XMM6,%XMM26,%XMM0 |
(17441) 0xc0d501 VMULSS %XMM5,%XMM5,%XMM5 |
(17441) 0xc0d505 VFMADD231SS %XMM3,%XMM3,%XMM5 |
(17441) 0xc0d50a VFMADD231SS %XMM0,%XMM0,%XMM5 |
(17441) 0xc0d50f VMULSS %XMM5,%XMM27,%XMM0 |
(17441) 0xc0d515 VMULSS %XMM7,%XMM0,%XMM0 |
(17441) 0xc0d519 VMULSS (%RDX,%RCX,4),%XMM0,%XMM0 |
(17441) 0xc0d51e VMOVSS %XMM0,(%R14,%RCX,4) |
(17441) 0xc0d524 VMULSS %XMM5,%XMM11,%XMM0 |
(17441) 0xc0d528 VMOVSS %XMM0,(%R12,%RCX,4) |
(17441) 0xc0d52e LEA 0x1(%RBX,%RCX,1),%ESI |
(17441) 0xc0d532 VCVTSI2SS %ESI,%XMM1,%XMM0 |
(17441) 0xc0d536 VMULSS %XMM0,%XMM22,%XMM3 |
(17441) 0xc0d53c VMOVAPS %XMM2,%XMM5 |
(17441) 0xc0d540 VFMADD213SS %XMM8,%XMM0,%XMM5 |
(17441) 0xc0d545 VFMADD213SS %XMM13,%XMM4,%XMM0 |
(17441) 0xc0d54a VFMADD231SS %XMM6,%XMM26,%XMM0 |
(17441) 0xc0d550 VMULSS %XMM5,%XMM5,%XMM5 |
(17441) 0xc0d554 VFMADD231SS %XMM3,%XMM3,%XMM5 |
(17441) 0xc0d559 VFMADD231SS %XMM0,%XMM0,%XMM5 |
(17441) 0xc0d55e VMULSS %XMM5,%XMM27,%XMM0 |
(17441) 0xc0d564 VMULSS %XMM7,%XMM0,%XMM0 |
(17441) 0xc0d568 VMULSS 0x4(%RDX,%RCX,4),%XMM0,%XMM0 |
(17441) 0xc0d56e VMOVSS %XMM0,0x4(%R14,%RCX,4) |
(17441) 0xc0d575 VMULSS %XMM5,%XMM11,%XMM0 |
(17441) 0xc0d579 VMOVSS %XMM0,0x4(%R12,%RCX,4) |
(17441) 0xc0d580 ADD $0x2,%RCX |
(17441) 0xc0d584 CMP %RCX,%RDI |
(17441) 0xc0d587 JNE c0d4e0 |
(17436) 0xc0d58d CMPL $0x1f,0x128(%RSP) |
(17436) 0xc0d595 VPXOR %XMM13,%XMM13,%XMM13 |
(17436) 0xc0d59a JB c0d6b0 |
(17436) 0xc0d5a0 VRCP14PS -0x8b0ee2(%RIP){1to16},%ZMM0 |
(17436) 0xc0d5aa VBROADCASTSS -0x8b0d98(%RIP),%ZMM3 |
(17436) 0xc0d5b4 VFMADD213PS -0x8b107e(%RIP){1to16},%ZMM0,%ZMM3 |
(17436) 0xc0d5be VMULPS %ZMM3,%ZMM0,%ZMM0 |
(17436) 0xc0d5c4 VMULPS -0x8b123e(%RIP){1to16},%ZMM0,%ZMM3 |
(17436) 0xc0d5ce XOR %ECX,%ECX |
(17436) 0xc0d5d0 MOV 0x118(%RSP),%RDX |
(17436) 0xc0d5d8 NOPL (%RAX,%RAX,1) |
(17440) 0xc0d5e0 VMOVAPS (%R14,%RCX,1),%ZMM0 |
(17440) 0xc0d5e7 VMOVAPS (%R12,%RCX,1),%ZMM5 |
(17440) 0xc0d5ee VMAXPS %ZMM3,%ZMM5,%ZMM5 |
(17440) 0xc0d5f4 VMULPS -0x8b0f36(%RIP){1to16},%ZMM5,%ZMM7 |
(17440) 0xc0d5fe VCVTPS2DQ %ZMM7,%ZMM8 |
(17440) 0xc0d604 VPADDD -0x8b0dae(%RIP){1to16},%ZMM8,%ZMM8 |
(17440) 0xc0d60e VPMAXSD %ZMM13,%ZMM8,%ZMM8 |
(17440) 0xc0d614 VRNDSCALEPS $0,%ZMM7,%ZMM7 |
(17440) 0xc0d61b VFMADD231PS -0x8b0f2d(%RIP){1to16},%ZMM7,%ZMM5 |
(17440) 0xc0d625 VFMADD231PS -0x8b1443(%RIP){1to16},%ZMM7,%ZMM5 |
(17440) 0xc0d62f VBROADCASTSS -0x8b1009(%RIP),%ZMM7 |
(17440) 0xc0d639 VFMADD213PS -0x8b1203(%RIP){1to16},%ZMM5,%ZMM7 |
(17440) 0xc0d643 VFMADD213PS -0x8b1281(%RIP){1to16},%ZMM5,%ZMM7 |
(17440) 0xc0d64d VFMADD213PS -0x8b1023(%RIP){1to16},%ZMM5,%ZMM7 |
(17440) 0xc0d657 VPSLLD $0x17,%ZMM8,%ZMM8 |
(17440) 0xc0d65e VFMADD213PS -0x8b0e2c(%RIP){1to16},%ZMM5,%ZMM7 |
(17440) 0xc0d668 VMULPS %ZMM5,%ZMM5,%ZMM9 |
(17440) 0xc0d66e VFMADD213PS %ZMM5,%ZMM7,%ZMM9 |
(17440) 0xc0d674 VFMADD213PS %ZMM8,%ZMM8,%ZMM9 |
(17440) 0xc0d67a VRCP14PS %ZMM0,%ZMM5 |
(17440) 0xc0d680 VFNMADD213PS -0x8b114a(%RIP){1to16},%ZMM5,%ZMM0 |
(17440) 0xc0d68a VMULPS %ZMM0,%ZMM5,%ZMM0 |
(17440) 0xc0d690 VMULPS %ZMM0,%ZMM25,%ZMM0 |
(17440) 0xc0d696 VMULPS %ZMM9,%ZMM0,%ZMM0 |
(17440) 0xc0d69c VMOVAPS %ZMM0,(%R15,%RCX,1) |
(17440) 0xc0d6a3 ADD $0x40,%RCX |
(17440) 0xc0d6a7 DEC %RDX |
(17440) 0xc0d6aa JNE c0d5e0 |
(17436) 0xc0d6b0 MOV 0x40(%RSP),%RCX |
(17436) 0xc0d6b5 CMP %ECX,0xb8(%RSP) |
(17436) 0xc0d6bc VMOVAPS -0x889a06(%RIP),%ZMM13 |
(17436) 0xc0d6c6 JLE c0d6f0 |
(17436) 0xc0d6c8 MOVSXD 0x18(%RSP),%RSI |
(17436) 0xc0d6cd LEA 0x1(%RSI),%RCX |
(17436) 0xc0d6d1 CMP %RDI,%RCX |
(17436) 0xc0d6d4 MOV %RDI,%RDX |
(17436) 0xc0d6d7 CMOVG %RCX,%RDX |
(17436) 0xc0d6db SUB %RSI,%RDX |
(17436) 0xc0d6de CMP $0x4,%RDX |
(17436) 0xc0d6e2 JAE c0d6fe |
(17436) 0xc0d6e4 MOV %RSI,%R9 |
(17436) 0xc0d6e7 JMP c0d746 |
0xc0d6e9 NOPL (%RAX) |
(17436) 0xc0d6f0 MOV 0x30(%RSP),%R10 |
(17436) 0xc0d6f5 MOV 0x1c(%RSP),%ECX |
(17436) 0xc0d6f9 JMP c0c395 |
(17436) 0xc0d6fe CMP %RDI,%RCX |
(17436) 0xc0d701 CMOVLE %RDI,%RCX |
(17436) 0xc0d705 LEA (%R15,%RCX,4),%RDI |
(17436) 0xc0d709 CMP %RDI,%RAX |
(17436) 0xc0d70c JAE c0d77f |
(17436) 0xc0d70e MOV 0x80(%RSP),%RDI |
(17436) 0xc0d716 MOV 0x78(%RSP),%R9 |
(17436) 0xc0d71b ADD %R9,%RDI |
(17436) 0xc0d71e MOV 0x88(%RSP),%R9 |
(17436) 0xc0d726 ADD 0x40(%RSP),%RDI |
(17436) 0xc0d72b ADD %RDI,%RCX |
(17436) 0xc0d72e SUB %RSI,%RCX |
(17436) 0xc0d731 LEA (%R9,%RCX,8),%RCX |
(17436) 0xc0d735 LEA (%R15,%RSI,4),%RDI |
(17436) 0xc0d739 CMP %RCX,%RDI |
(17436) 0xc0d73c JAE c0d77f |
(17436) 0xc0d73e MOV %RSI,%R9 |
(17436) 0xc0d741 MOV 0x20(%RSP),%RDI |
(17436) 0xc0d746 MOV 0x30(%RSP),%R10 |
(17436) 0xc0d74b MOV 0x1c(%RSP),%ECX |
(17436) 0xc0d74f NOP |
(17438) 0xc0d750 VMOVSS (%RAX),%XMM0 |
(17438) 0xc0d754 VMOVSS 0x4(%RAX),%XMM3 |
(17438) 0xc0d759 VMULSS (%R15,%R9,4),%XMM0,%XMM0 |
(17438) 0xc0d75f VMOVSS %XMM0,(%RAX) |
(17438) 0xc0d763 VMULSS (%R15,%R9,4),%XMM3,%XMM0 |
(17438) 0xc0d769 VMOVSS %XMM0,0x4(%RAX) |
(17438) 0xc0d76e INC %R9 |
(17438) 0xc0d771 ADD $0x8,%RAX |
(17438) 0xc0d775 CMP %RDI,%R9 |
(17438) 0xc0d778 JL c0d750 |
(17436) 0xc0d77a JMP c0c395 |
(17436) 0xc0d77f MOV %R11D,%EBX |
(17436) 0xc0d782 CMP $0x10,%RDX |
(17436) 0xc0d786 JAE c0db92 |
(17436) 0xc0d78c XOR %ECX,%ECX |
(17436) 0xc0d78e JMP c0dec3 |
(17436) 0xc0d793 LEA (,%RDX,4),%RDI |
(17436) 0xc0d79b MOV %RCX,%RSI |
(17436) 0xc0d79e AND $-0x20,%RSI |
(17436) 0xc0d7a2 MOV 0x168(%RSP),%R8 |
(17436) 0xc0d7aa ADD %RDI,%R8 |
(17436) 0xc0d7ad ADD 0x160(%RSP),%RDI |
(17436) 0xc0d7b5 XOR %R9D,%R9D |
(17436) 0xc0d7b8 NOPL (%RAX,%RAX,1) |
(17450) 0xc0d7c0 VBROADCASTSS -0x8b163d(%RIP),%YMM0 |
(17450) 0xc0d7c9 VDIVPS -0x60(%R8,%R9,4),%YMM0,%YMM3 |
(17450) 0xc0d7d0 VDIVPS -0x40(%R8,%R9,4),%YMM0,%YMM5 |
(17450) 0xc0d7d7 VDIVPS -0x20(%R8,%R9,4),%YMM0,%YMM7 |
(17450) 0xc0d7de VDIVPS (%R8,%R9,4),%YMM0,%YMM0 |
(17450) 0xc0d7e4 VMOVUPS %YMM3,-0x60(%RDI,%R9,4) |
(17450) 0xc0d7eb VMOVUPS %YMM5,-0x40(%RDI,%R9,4) |
(17450) 0xc0d7f2 VMOVUPS %YMM7,-0x20(%RDI,%R9,4) |
(17450) 0xc0d7f9 VMOVUPS %YMM0,(%RDI,%R9,4) |
(17450) 0xc0d7ff ADD $0x20,%R9 |
(17450) 0xc0d803 CMP %R9,%RSI |
(17450) 0xc0d806 JNE c0d7c0 |
(17436) 0xc0d808 CMP %RSI,%RCX |
(17436) 0xc0d80b MOV 0x20(%RSP),%RDI |
(17436) 0xc0d810 JE c0d8a4 |
(17436) 0xc0d816 TEST $0x1c,%CL |
(17436) 0xc0d819 JE c0df83 |
(17436) 0xc0d81f MOV %RCX,%RDI |
(17436) 0xc0d822 AND $-0x4,%RDI |
(17436) 0xc0d826 LEA (%RDI,%RDX,1),%R9 |
(17436) 0xc0d82a MOV %RDI,%R8 |
(17436) 0xc0d82d SUB %RSI,%R8 |
(17436) 0xc0d830 ADD %RDX,%RSI |
(17436) 0xc0d833 LEA (%R14,%RSI,4),%RDX |
(17436) 0xc0d837 MOV 0x68(%RSP),%R10 |
(17436) 0xc0d83c LEA (%R10,%RSI,4),%RSI |
(17436) 0xc0d840 XOR %R11D,%R11D |
(17436) 0xc0d843 NOPW %CS:(%RAX,%RAX,1) |
(17452) 0xc0d850 VBROADCASTSS -0x8b16cd(%RIP),%XMM0 |
(17452) 0xc0d859 VDIVPS (%RDX,%R11,4),%XMM0,%XMM0 |
(17452) 0xc0d85f VMOVUPS %XMM0,(%RSI,%R11,4) |
(17452) 0xc0d865 ADD $0x4,%R11 |
(17452) 0xc0d869 CMP %R11,%R8 |
(17452) 0xc0d86c JNE c0d850 |
(17436) 0xc0d86e CMP %RDI,%RCX |
(17436) 0xc0d871 MOV 0x20(%RSP),%RDI |
(17436) 0xc0d876 MOV 0x68(%RSP),%RCX |
(17436) 0xc0d87b MOV 0x40(%RSP),%R10 |
(17436) 0xc0d880 JE c0d8a4 |
(17436) 0xc0d882 NOPW %CS:(%RAX,%RAX,1) |
(17451) 0xc0d890 VDIVSS (%R14,%R9,4),%XMM12,%XMM0 |
(17451) 0xc0d896 VMOVSS %XMM0,(%RCX,%R9,4) |
(17451) 0xc0d89c INC %R9 |
(17451) 0xc0d89f CMP %RDI,%R9 |
(17451) 0xc0d8a2 JL c0d890 |
(17436) 0xc0d8a4 CMPL $0x1f,0x128(%RSP) |
(17436) 0xc0d8ac MOV 0x3c(%RSP),%R11D |
(17436) 0xc0d8b1 MOV 0x48(%RSP),%RSI |
(17436) 0xc0d8b6 JB c0d9d0 |
(17436) 0xc0d8bc VRCP14PS -0x8b11fe(%RIP){1to16},%ZMM0 |
(17436) 0xc0d8c6 VBROADCASTSS -0x8b10b4(%RIP),%ZMM3 |
(17436) 0xc0d8d0 VFMADD213PS -0x8b139a(%RIP){1to16},%ZMM0,%ZMM3 |
(17436) 0xc0d8da VMULPS %ZMM3,%ZMM0,%ZMM0 |
(17436) 0xc0d8e0 VMULPS -0x8b155a(%RIP){1to16},%ZMM0,%ZMM3 |
(17436) 0xc0d8ea XOR %ECX,%ECX |
(17436) 0xc0d8ec MOV 0x118(%RSP),%RDX |
(17436) 0xc0d8f4 NOPW %CS:(%RAX,%RAX,1) |
(17449) 0xc0d900 VMOVAPS (%RSI,%RCX,1),%ZMM0 |
(17449) 0xc0d907 VMOVAPS (%R12,%RCX,1),%ZMM5 |
(17449) 0xc0d90e VMAXPS %ZMM3,%ZMM5,%ZMM5 |
(17449) 0xc0d914 VMULPS -0x8b1256(%RIP){1to16},%ZMM5,%ZMM7 |
(17449) 0xc0d91e VCVTPS2DQ %ZMM7,%ZMM8 |
(17449) 0xc0d924 VPADDD -0x8b10ce(%RIP){1to16},%ZMM8,%ZMM8 |
(17449) 0xc0d92e VPMAXSD %ZMM27,%ZMM8,%ZMM8 |
(17449) 0xc0d934 VRNDSCALEPS $0,%ZMM7,%ZMM7 |
(17449) 0xc0d93b VFMADD231PS -0x8b124d(%RIP){1to16},%ZMM7,%ZMM5 |
(17449) 0xc0d945 VFMADD231PS -0x8b1763(%RIP){1to16},%ZMM7,%ZMM5 |
(17449) 0xc0d94f VBROADCASTSS -0x8b1329(%RIP),%ZMM7 |
(17449) 0xc0d959 VFMADD213PS -0x8b1523(%RIP){1to16},%ZMM5,%ZMM7 |
(17449) 0xc0d963 VFMADD213PS -0x8b15a1(%RIP){1to16},%ZMM5,%ZMM7 |
(17449) 0xc0d96d VFMADD213PS -0x8b1343(%RIP){1to16},%ZMM5,%ZMM7 |
(17449) 0xc0d977 VPSLLD $0x17,%ZMM8,%ZMM8 |
(17449) 0xc0d97e VFMADD213PS -0x8b114c(%RIP){1to16},%ZMM5,%ZMM7 |
(17449) 0xc0d988 VMULPS %ZMM5,%ZMM5,%ZMM9 |
(17449) 0xc0d98e VFMADD213PS %ZMM5,%ZMM7,%ZMM9 |
(17449) 0xc0d994 VFMADD213PS %ZMM8,%ZMM8,%ZMM9 |
(17449) 0xc0d99a VRCP14PS %ZMM0,%ZMM5 |
(17449) 0xc0d9a0 VFNMADD213PS -0x8b146a(%RIP){1to16},%ZMM5,%ZMM0 |
(17449) 0xc0d9aa VMULPS %ZMM0,%ZMM5,%ZMM0 |
(17449) 0xc0d9b0 VMULPS %ZMM0,%ZMM25,%ZMM0 |
(17449) 0xc0d9b6 VMULPS %ZMM9,%ZMM0,%ZMM0 |
(17449) 0xc0d9bc VMOVAPS %ZMM0,(%R15,%RCX,1) |
(17449) 0xc0d9c3 ADD $0x40,%RCX |
(17449) 0xc0d9c7 DEC %RDX |
(17449) 0xc0d9ca JNE c0d900 |
(17436) 0xc0d9d0 CMP %R10D,0xb8(%RSP) |
(17436) 0xc0d9d8 MOV 0x1c(%RSP),%ECX |
(17436) 0xc0d9dc JLE c0c390 |
(17436) 0xc0d9e2 MOVSXD 0x18(%RSP),%RSI |
(17436) 0xc0d9e7 MOV %RDI,%R9 |
(17436) 0xc0d9ea LEA 0x1(%RSI),%RDI |
(17436) 0xc0d9ee CMP %R9,%RDI |
(17436) 0xc0d9f1 MOV %R9,%RDX |
(17436) 0xc0d9f4 CMOVG %RDI,%RDX |
(17436) 0xc0d9f8 SUB %RSI,%RDX |
(17436) 0xc0d9fb CMP $0x4,%RDX |
(17436) 0xc0d9ff JAE c0da11 |
(17436) 0xc0da01 MOV %RSI,%RCX |
(17436) 0xc0da04 MOV 0x30(%RSP),%R10 |
(17436) 0xc0da09 MOV %R9,%RDI |
(17436) 0xc0da0c JMP c0dd50 |
(17436) 0xc0da11 CMP %R9,%RDI |
(17436) 0xc0da14 CMOVLE %R9,%RDI |
(17436) 0xc0da18 MOV 0x80(%RSP),%RCX |
(17436) 0xc0da20 MOV 0x78(%RSP),%R8 |
(17436) 0xc0da25 ADD %R8,%RCX |
(17436) 0xc0da28 ADD %R10,%RCX |
(17436) 0xc0da2b ADD %RDI,%RCX |
(17436) 0xc0da2e SUB %RSI,%RCX |
(17436) 0xc0da31 MOV 0x88(%RSP),%R8 |
(17436) 0xc0da39 LEA (%R8,%RCX,8),%R10 |
(17436) 0xc0da3d LEA (%R12,%RSI,4),%RCX |
(17436) 0xc0da41 LEA (%R12,%RDI,4),%R14 |
(17436) 0xc0da45 LEA (%R15,%RSI,4),%R11 |
(17436) 0xc0da49 LEA (%R15,%RDI,4),%R13 |
(17436) 0xc0da4d CMP %R14,%RAX |
(17436) 0xc0da50 SETB %DIL |
(17436) 0xc0da54 CMP %R10,%RCX |
(17436) 0xc0da57 SETB %R8B |
(17436) 0xc0da5b CMP %R13,%RAX |
(17436) 0xc0da5e SETB %R9B |
(17436) 0xc0da62 CMP %R10,%R11 |
(17436) 0xc0da65 SETB %BL |
(17436) 0xc0da68 CMP %R13,%RCX |
(17436) 0xc0da6b SETB %R10B |
(17436) 0xc0da6f CMP %R14,%R11 |
(17436) 0xc0da72 SETB %R14B |
(17436) 0xc0da76 TEST %R14B,%R10B |
(17436) 0xc0da79 JNE c0db72 |
(17436) 0xc0da7f AND %BL,%R9B |
(17436) 0xc0da82 JNE c0db72 |
(17436) 0xc0da88 AND %R8B,%DIL |
(17436) 0xc0da8b MOV 0x30(%RSP),%R10 |
(17436) 0xc0da90 MOV 0x58(%RSP),%R14 |
(17436) 0xc0da95 MOV 0x2c(%RSP),%EBX |
(17436) 0xc0da99 JNE c0dd3e |
(17436) 0xc0da9f CMP $0x8,%RDX |
(17436) 0xc0daa3 JAE c0dc9b |
(17436) 0xc0daa9 XOR %R9D,%R9D |
(17436) 0xc0daac MOV 0x40(%RSP),%R13 |
(17436) 0xc0dab1 MOV %RDX,%R11 |
(17436) 0xc0dab4 AND $-0x4,%R11 |
(17436) 0xc0dab8 LEA (%R11,%RSI,1),%RCX |
(17436) 0xc0dabc LEA (%RAX,%R11,8),%RAX |
(17436) 0xc0dac0 MOV 0x80(%RSP),%RDI |
(17436) 0xc0dac8 SAL $0x3,%RDI |
(17436) 0xc0dacc LEA (%RDI,%R9,8),%RDI |
(17436) 0xc0dad0 MOV 0x78(%RSP),%R8 |
(17436) 0xc0dad5 LEA (%RDI,%R8,8),%RDI |
(17436) 0xc0dad9 LEA (%RDI,%R13,8),%RDI |
(17436) 0xc0dadd ADD 0x88(%RSP),%RDI |
(17436) 0xc0dae5 MOV %R11,%R8 |
(17436) 0xc0dae8 SUB %R9,%R8 |
(17436) 0xc0daeb ADD %RSI,%R9 |
(17436) 0xc0daee LEA (%R15,%R9,4),%RSI |
(17436) 0xc0daf2 LEA (%R12,%R9,4),%R9 |
(17436) 0xc0daf6 XOR %EBX,%EBX |
(17436) 0xc0daf8 NOPL (%RAX,%RAX,1) |
(17448) 0xc0db00 VMOVUPS (%RDI,%RBX,8),%XMM0 |
(17448) 0xc0db05 VMOVUPS 0x10(%RDI,%RBX,8),%XMM3 |
(17448) 0xc0db0b VSHUFPS $-0x78,%XMM3,%XMM0,%XMM5 |
(17448) 0xc0db10 VMOVUPS (%RSI,%RBX,4),%XMM7 |
(17448) 0xc0db15 VSHUFPS $-0x23,%XMM3,%XMM0,%XMM0 |
(17448) 0xc0db1a VMULPS %XMM7,%XMM5,%XMM3 |
(17448) 0xc0db1e VMULPS %XMM7,%XMM0,%XMM7 |
(17448) 0xc0db22 VUNPCKLPS %XMM7,%XMM3,%XMM8 |
(17448) 0xc0db26 VMOVUPS %XMM8,(%RDI,%RBX,8) |
(17448) 0xc0db2b VUNPCKHPS %XMM7,%XMM3,%XMM3 |
(17448) 0xc0db2f VMOVUPS %XMM3,0x10(%RDI,%RBX,8) |
(17448) 0xc0db35 VMULPS %XMM0,%XMM0,%XMM0 |
(17448) 0xc0db39 VFMADD231PS %XMM5,%XMM5,%XMM0 |
(17448) 0xc0db3e VADDPS %XMM0,%XMM0,%XMM0 |
(17448) 0xc0db42 VMULPS (%RSI,%RBX,4),%XMM0,%XMM0 |
(17448) 0xc0db47 VMOVUPS %XMM0,(%R9,%RBX,4) |
(17448) 0xc0db4d ADD $0x4,%RBX |
(17448) 0xc0db51 CMP %RBX,%R8 |
(17448) 0xc0db54 JNE c0db00 |
(17436) 0xc0db56 CMP %R11,%RDX |
(17436) 0xc0db59 MOV 0x3c(%RSP),%R11D |
(17436) 0xc0db5e MOV 0x20(%RSP),%RDI |
(17436) 0xc0db63 MOV 0x2c(%RSP),%EBX |
(17436) 0xc0db67 JNE c0dd50 |
(17436) 0xc0db6d JMP c0dd93 |
(17436) 0xc0db72 MOV %RSI,%RCX |
(17436) 0xc0db75 MOV 0x30(%RSP),%R10 |
(17436) 0xc0db7a MOV 0x3c(%RSP),%R11D |
(17436) 0xc0db7f MOV 0x20(%RSP),%RDI |
(17436) 0xc0db84 MOV 0x58(%RSP),%R14 |
(17436) 0xc0db89 MOV 0x2c(%RSP),%EBX |
(17436) 0xc0db8d JMP c0dd50 |
(17436) 0xc0db92 MOV %RDX,%RCX |
(17436) 0xc0db95 AND $-0x10,%RCX |
(17436) 0xc0db99 MOV 0x78(%RSP),%RDI |
(17436) 0xc0db9e LEA (,%RDI,8),%RDI |
(17436) 0xc0dba6 MOV 0x80(%RSP),%R8 |
(17436) 0xc0dbae LEA (%RDI,%R8,8),%RDI |
(17436) 0xc0dbb2 MOV 0x40(%RSP),%R8 |
(17436) 0xc0dbb7 LEA (%RDI,%R8,8),%R9 |
(17436) 0xc0dbbb ADD 0x178(%RSP),%R9 |
(17436) 0xc0dbc3 MOV 0x170(%RSP),%RDI |
(17436) 0xc0dbcb LEA (%RDI,%RSI,4),%R11 |
(17436) 0xc0dbcf XOR %R8D,%R8D |
(17436) 0xc0dbd2 NOPW %CS:(%RAX,%RAX,1) |
(17437) 0xc0dbe0 VMOVUPS -0x40(%R9,%R8,8),%YMM0 |
(17437) 0xc0dbe7 VMOVUPS -0x20(%R9,%R8,8),%YMM3 |
(17437) 0xc0dbee VMOVUPS (%R9,%R8,8),%YMM5 |
(17437) 0xc0dbf4 VMOVUPS 0x20(%R9,%R8,8),%YMM7 |
(17437) 0xc0dbfb VMOVAPS %YMM0,%YMM8 |
(17437) 0xc0dbff VPERMT2PS %YMM3,%YMM14,%YMM8 |
(17437) 0xc0dc05 VMOVAPS %YMM5,%YMM9 |
(17437) 0xc0dc09 VPERMT2PS %YMM7,%YMM14,%YMM9 |
(17437) 0xc0dc0f VPERMT2PS %YMM3,%YMM10,%YMM0 |
(17437) 0xc0dc15 VPERMT2PS %YMM7,%YMM10,%YMM5 |
(17437) 0xc0dc1b VMOVUPS -0x20(%R11,%R8,4),%YMM3 |
(17437) 0xc0dc22 VMOVUPS (%R11,%R8,4),%YMM7 |
(17437) 0xc0dc28 VMULPS %YMM3,%YMM8,%YMM8 |
(17437) 0xc0dc2c VMULPS %YMM7,%YMM9,%YMM9 |
(17437) 0xc0dc30 VMULPS %YMM3,%YMM0,%YMM0 |
(17437) 0xc0dc34 VMULPS %YMM7,%YMM5,%YMM3 |
(17437) 0xc0dc38 VINSERTF64X4 $0x1,%YMM0,%ZMM0,%ZMM0 |
(17437) 0xc0dc3f VINSERTF64X4 $0x1,%YMM8,%ZMM8,%ZMM5 |
(17437) 0xc0dc46 VPERMT2PS %ZMM0,%ZMM13,%ZMM5 |
(17437) 0xc0dc4c VMOVUPS %ZMM5,-0x40(%R9,%R8,8) |
(17437) 0xc0dc54 VINSERTF64X4 $0x1,%YMM3,%ZMM3,%ZMM0 |
(17437) 0xc0dc5b VINSERTF64X4 $0x1,%YMM9,%ZMM9,%ZMM3 |
(17437) 0xc0dc62 VPERMT2PS %ZMM0,%ZMM13,%ZMM3 |
(17437) 0xc0dc68 VMOVUPS %ZMM3,(%R9,%R8,8) |
(17437) 0xc0dc6f ADD $0x10,%R8 |
(17437) 0xc0dc73 CMP %R8,%RCX |
(17437) 0xc0dc76 JNE c0dbe0 |
(17436) 0xc0dc7c CMP %RCX,%RDX |
(17436) 0xc0dc7f MOV 0x20(%RSP),%RDI |
(17436) 0xc0dc84 JNE c0deba |
(17436) 0xc0dc8a MOV %EBX,%R11D |
(17436) 0xc0dc8d MOV 0x30(%RSP),%R10 |
(17436) 0xc0dc92 MOV 0x1c(%RSP),%ECX |
(17436) 0xc0dc96 JMP c0c395 |
(17436) 0xc0dc9b MOV %RDX,%R9 |
(17436) 0xc0dc9e AND $-0x8,%R9 |
(17436) 0xc0dca2 XOR %EDI,%EDI |
(17436) 0xc0dca4 NOPW %CS:(%RAX,%RAX,1) |
(17447) 0xc0dcb0 VMOVUPS (%RAX,%RDI,8),%YMM0 |
(17447) 0xc0dcb5 VMOVUPS 0x20(%RAX,%RDI,8),%YMM3 |
(17447) 0xc0dcbb VMOVAPS %YMM0,%YMM5 |
(17447) 0xc0dcbf VPERMT2PS %YMM3,%YMM14,%YMM5 |
(17447) 0xc0dcc5 VPERMT2PS %YMM3,%YMM10,%YMM0 |
(17447) 0xc0dccb VMOVUPS (%R11,%RDI,4),%YMM3 |
(17447) 0xc0dcd1 VMULPS %YMM3,%YMM5,%YMM7 |
(17447) 0xc0dcd5 VMULPS %YMM3,%YMM0,%YMM3 |
(17447) 0xc0dcd9 VINSERTF64X4 $0x1,%YMM3,%ZMM3,%ZMM3 |
(17447) 0xc0dce0 VINSERTF64X4 $0x1,%YMM7,%ZMM7,%ZMM7 |
(17447) 0xc0dce7 VPERMT2PS %ZMM3,%ZMM13,%ZMM7 |
(17447) 0xc0dced VMOVUPS %ZMM7,(%RAX,%RDI,8) |
(17447) 0xc0dcf4 VMULPS %YMM0,%YMM0,%YMM0 |
(17447) 0xc0dcf8 VFMADD231PS %YMM5,%YMM5,%YMM0 |
(17447) 0xc0dcfd VADDPS %YMM0,%YMM0,%YMM0 |
(17447) 0xc0dd01 VMULPS (%R11,%RDI,4),%YMM0,%YMM0 |
(17447) 0xc0dd07 VMOVUPS %YMM0,(%RCX,%RDI,4) |
(17447) 0xc0dd0c ADD $0x8,%RDI |
(17447) 0xc0dd10 CMP %RDI,%R9 |
(17447) 0xc0dd13 JNE c0dcb0 |
(17436) 0xc0dd15 CMP %R9,%RDX |
(17436) 0xc0dd18 MOV 0x3c(%RSP),%R11D |
(17436) 0xc0dd1d MOV 0x20(%RSP),%RDI |
(17436) 0xc0dd22 MOV 0x40(%RSP),%R13 |
(17436) 0xc0dd27 JE c0dd93 |
(17436) 0xc0dd29 TEST $0x4,%DL |
(17436) 0xc0dd2c JNE c0dab1 |
(17436) 0xc0dd32 LEA (%RAX,%R9,8),%RAX |
(17436) 0xc0dd36 ADD %R9,%RSI |
(17436) 0xc0dd39 MOV %RSI,%RCX |
(17436) 0xc0dd3c JMP c0dd50 |
(17436) 0xc0dd3e MOV %RSI,%RCX |
(17436) 0xc0dd41 MOV 0x3c(%RSP),%R11D |
(17436) 0xc0dd46 MOV 0x20(%RSP),%RDI |
(17436) 0xc0dd4b NOPL (%RAX,%RAX,1) |
(17445) 0xc0dd50 VMOVSS (%RAX),%XMM0 |
(17445) 0xc0dd54 VMOVSS 0x4(%RAX),%XMM3 |
(17445) 0xc0dd59 VMULSS (%R15,%RCX,4),%XMM0,%XMM5 |
(17445) 0xc0dd5f VMOVSS %XMM5,(%RAX) |
(17445) 0xc0dd63 VMULSS (%R15,%RCX,4),%XMM3,%XMM5 |
(17445) 0xc0dd69 VMOVSS %XMM5,0x4(%RAX) |
(17445) 0xc0dd6e VMULSS %XMM3,%XMM3,%XMM3 |
(17445) 0xc0dd72 VFMADD231SS %XMM0,%XMM0,%XMM3 |
(17445) 0xc0dd77 VADDSS %XMM3,%XMM3,%XMM0 |
(17445) 0xc0dd7b VMULSS (%R15,%RCX,4),%XMM0,%XMM0 |
(17445) 0xc0dd81 VMOVSS %XMM0,(%R12,%RCX,4) |
(17445) 0xc0dd87 INC %RCX |
(17445) 0xc0dd8a ADD $0x8,%RAX |
(17445) 0xc0dd8e CMP %RDI,%RCX |
(17445) 0xc0dd91 JL c0dd50 |
(17436) 0xc0dd93 KMOVD %EBX,%K1 |
(17436) 0xc0dd97 XOR %ECX,%ECX |
(17436) 0xc0dd99 MOVZX 0x3b(%RSP),%EAX |
(17436) 0xc0dd9e MOV %AL,%CL |
(17436) 0xc0dda0 LEA -0x8b13a7(%RIP),%RAX |
(17436) 0xc0dda7 VMOVSS (%RAX,%RCX,4),%XMM3 |
(17436) 0xc0ddac VMOVSS -0x8b1906(%RIP),%XMM3{%K1} |
(17436) 0xc0ddb6 MOVSXD 0x18(%RSP),%RAX |
(17436) 0xc0ddbb VMOVSHDUP %XMM28,%XMM5 |
(17436) 0xc0ddc1 VPERMILPD $0x1,%XMM28,%XMM7 |
(17436) 0xc0ddc8 VPERMILPS $-0x1,%XMM28,%XMM8 |
(17436) 0xc0ddcf MOV 0xb0(%RSP),%RCX |
(17436) 0xc0ddd7 MOV 0x68(%RSP),%RDX |
(17436) 0xc0dddc MOV 0xa8(%RSP),%RSI |
(17436) 0xc0dde4 MOV 0xa0(%RSP),%R9 |
(17436) 0xc0ddec NOPL (%RAX) |
(17446) 0xc0ddf0 VMULSS (%R12,%RAX,4),%XMM3,%XMM0 |
(17446) 0xc0ddf6 VMULSS (%R14,%RAX,4),%XMM19,%XMM9 |
(17446) 0xc0ddfd VCVTSS2SD %XMM9,%XMM9,%XMM9 |
(17446) 0xc0de02 VADDSD %XMM26,%XMM9,%XMM9 |
(17446) 0xc0de08 VADDSD %XMM9,%XMM9,%XMM9 |
(17446) 0xc0de0d VMOVSS (%RDX,%RAX,4),%XMM10 |
(17446) 0xc0de12 VCVTSS2SD %XMM10,%XMM10,%XMM10 |
(17446) 0xc0de17 VMULSD %XMM10,%XMM9,%XMM9 |
(17446) 0xc0de1c VCVTSD2SS %XMM9,%XMM9,%XMM9 |
(17446) 0xc0de21 VMULSS %XMM0,%XMM9,%XMM9 |
(17446) 0xc0de25 VMOVSS (%RSI,%RAX,4),%XMM10 |
(17446) 0xc0de2a VMULSS %XMM9,%XMM10,%XMM12 |
(17446) 0xc0de2f VFMSUB213SS %XMM0,%XMM12,%XMM10 |
(17446) 0xc0de34 VMOVSS (%R9,%RAX,4),%XMM13 |
(17446) 0xc0de3a VMOVSS (%RCX,%RAX,4),%XMM14 |
(17446) 0xc0de3f VFMADD231SS %XMM13,%XMM12,%XMM5 |
(17446) 0xc0de44 VFMADD231SS %XMM12,%XMM14,%XMM28 |
(17446) 0xc0de4a VMULSS %XMM9,%XMM13,%XMM12 |
(17446) 0xc0de4f VFMSUB213SS %XMM0,%XMM12,%XMM13 |
(17446) 0xc0de54 VADDSS %XMM7,%XMM13,%XMM7 |
(17446) 0xc0de58 VINSERTPS $0x10,%XMM10,%XMM0,%XMM10 |
(17446) 0xc0de5e VADDPS %XMM10,%XMM30,%XMM30 |
(17446) 0xc0de64 VFMADD231SS %XMM12,%XMM14,%XMM8 |
(17446) 0xc0de69 VMULSS %XMM9,%XMM14,%XMM9 |
(17446) 0xc0de6e VFMSUB213SS %XMM0,%XMM14,%XMM9 |
(17446) 0xc0de73 VADDSS %XMM9,%XMM29,%XMM29 |
(17446) 0xc0de79 INC %RAX |
(17446) 0xc0de7c CMP %RDI,%RAX |
(17446) 0xc0de7f JL c0ddf0 |
(17436) 0xc0de85 VINSERTPS $0x10,%XMM5,%XMM28,%XMM0 |
(17436) 0xc0de8c VINSERTPS $0x20,%XMM7,%XMM0,%XMM0 |
(17436) 0xc0de92 VINSERTPS $0x30,%XMM8,%XMM0,%XMM28 |
(17436) 0xc0de99 VMOVSS -0x8b1d15(%RIP),%XMM12 |
(17436) 0xc0dea1 VMOVAPS -0x8a8f09(%RIP),%YMM14 |
(17436) 0xc0dea9 VMOVAPS -0x8a84d1(%RIP),%YMM10 |
(17436) 0xc0deb1 MOV 0x1c(%RSP),%ECX |
(17436) 0xc0deb5 JMP c0c395 |
(17436) 0xc0deba TEST $0xc,%DL |
(17436) 0xc0debd JE c0df71 |
(17436) 0xc0dec3 MOV %RDX,%RDI |
(17436) 0xc0dec6 AND $-0x4,%RDI |
(17436) 0xc0deca LEA (%RDI,%RSI,1),%R9 |
(17436) 0xc0dece LEA (%RAX,%RDI,8),%RAX |
(17436) 0xc0ded2 MOV 0x80(%RSP),%R8 |
(17436) 0xc0deda SAL $0x3,%R8 |
(17436) 0xc0dede LEA (%R8,%RCX,8),%R8 |
(17436) 0xc0dee2 MOV 0x78(%RSP),%R11 |
(17436) 0xc0dee7 LEA (%R8,%R11,8),%R8 |
(17436) 0xc0deeb MOV 0x40(%RSP),%R10 |
(17436) 0xc0def0 LEA (%R8,%R10,8),%R8 |
(17436) 0xc0def4 ADD 0x88(%RSP),%R8 |
(17436) 0xc0defc MOV %RDI,%R11 |
(17436) 0xc0deff SUB %RCX,%R11 |
(17436) 0xc0df02 ADD %RSI,%RCX |
(17436) 0xc0df05 LEA (%R15,%RCX,4),%RCX |
(17436) 0xc0df09 XOR %ESI,%ESI |
(17436) 0xc0df0b NOPL (%RAX,%RAX,1) |
(17439) 0xc0df10 VMOVUPS (%R8,%RSI,8),%XMM0 |
(17439) 0xc0df16 VMOVUPS 0x10(%R8,%RSI,8),%XMM3 |
(17439) 0xc0df1d VSHUFPS $-0x78,%XMM3,%XMM0,%XMM5 |
(17439) 0xc0df22 VSHUFPS $-0x23,%XMM3,%XMM0,%XMM0 |
(17439) 0xc0df27 VMOVUPS (%RCX,%RSI,4),%XMM3 |
(17439) 0xc0df2c VMULPS %XMM3,%XMM5,%XMM5 |
(17439) 0xc0df30 VMULPS %XMM3,%XMM0,%XMM0 |
(17439) 0xc0df34 VUNPCKHPS %XMM0,%XMM5,%XMM3 |
(17439) 0xc0df38 VUNPCKLPS %XMM0,%XMM5,%XMM0 |
(17439) 0xc0df3c VMOVUPS %XMM0,(%R8,%RSI,8) |
(17439) 0xc0df42 VMOVUPS %XMM3,0x10(%R8,%RSI,8) |
(17439) 0xc0df49 ADD $0x4,%RSI |
(17439) 0xc0df4d CMP %RSI,%R11 |
(17439) 0xc0df50 JNE c0df10 |
(17436) 0xc0df52 CMP %RDI,%RDX |
(17436) 0xc0df55 MOV %EBX,%R11D |
(17436) 0xc0df58 MOV 0x20(%RSP),%RDI |
(17436) 0xc0df5d MOV 0x30(%RSP),%R10 |
(17436) 0xc0df62 MOV 0x1c(%RSP),%ECX |
(17436) 0xc0df66 JNE c0d750 |
(17436) 0xc0df6c JMP c0c395 |
(17436) 0xc0df71 LEA (%RAX,%RCX,8),%RAX |
(17436) 0xc0df75 ADD %RCX,%RSI |
(17436) 0xc0df78 MOV %RSI,%R9 |
(17436) 0xc0df7b MOV %EBX,%R11D |
(17436) 0xc0df7e JMP c0d746 |
(17436) 0xc0df83 ADD %RDX,%RSI |
(17436) 0xc0df86 MOV %RSI,%R9 |
(17436) 0xc0df89 JMP c0cd6b |
0xc0df8e VXORPS %XMM28,%XMM28,%XMM28 |
0xc0df94 VXORPS %XMM29,%XMM29,%XMM29 |
0xc0df9a VXORPS %XMM30,%XMM30,%XMM30 |
0xc0dfa0 CMPB $0,0x94(%RSP) |
0xc0dfa8 JE c0dffe |
0xc0dfaa VMULPS -0x8ae574(%RIP),%XMM30,%XMM0 |
0xc0dfb4 VMULPS -0x8b1c9a(%RIP){1to4},%XMM28,%XMM1 |
0xc0dfbe VMULSS -0x8b1ca4(%RIP),%XMM29,%XMM2 |
0xc0dfc8 MOV 0x1b8(%RSP),%RAX |
0xc0dfd0 MOV 0x1b0(%RSP),%RCX |
0xc0dfd8 VMOVSS %XMM2,0x74(%RAX,%RCX,1) |
0xc0dfde VEXTRACTPS $0x1,%XMM1,0x58(%RAX,%RCX,1) |
0xc0dfe6 VPERMILPS $-0x14,%XMM1,%XMM2 |
0xc0dfec VMOVLPS %XMM2,0x6c(%RAX,%RCX,1) |
0xc0dff2 VMOVUPS %XMM1,0x5c(%RAX,%RCX,1) |
0xc0dff8 VMOVLPS %XMM0,0x50(%RAX,%RCX,1) |
0xc0dffe MOV 0xc0(%RSP),%EAX |
0xc0e005 IMUL 0xdc(%RSP),%EAX |
0xc0e00d LEA -0x28(%RBP),%RSP |
0xc0e011 POP %RBX |
0xc0e012 POP %R12 |
0xc0e014 POP %R13 |
0xc0e016 POP %R14 |
0xc0e018 POP %R15 |
0xc0e01a POP %RBP |
0xc0e01b VZEROUPPER |
0xc0e01e RET |
0xc0e01f NOP |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►100.00+ | .omp_outlined..49 | pme.cpp:1303 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1276 | libgromacs_mpi.so.9.0.0 |
○ | CpuPpLongRangeNonbondeds::calc[...] | force.cpp:261 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2073 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►100.00+ | .omp_outlined..49 | pme.cpp:1303 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1276 | libgromacs_mpi.so.9.0.0 |
○ | CpuPpLongRangeNonbondeds::calc[...] | force.cpp:261 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2073 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►99.83+ | .omp_outlined..49 | pme.cpp:1303 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1276 | libgromacs_mpi.so.9.0.0 |
○ | CpuPpLongRangeNonbondeds::calc[...] | force.cpp:261 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2073 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►76.10+ | .omp_outlined..49 | pme.cpp:1303 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1276 | libgromacs_mpi.so.9.0.0 |
○ | CpuPpLongRangeNonbondeds::calc[...] | force.cpp:261 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2073 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 | |
►12.46+ | .omp_outlined..49 | pme.cpp:1303 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1276 | libgromacs_mpi.so.9.0.0 |
○ | CpuPpLongRangeNonbondeds::calc[...] | force.cpp:261 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2073 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
►11.37+ | .omp_outlined..49 | pme.cpp:1303 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1276 | libgromacs_mpi.so.9.0.0 |
○ | CpuPpLongRangeNonbondeds::calc[...] | force.cpp:261 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2073 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►81.26+ | .omp_outlined..49 | pme.cpp:1303 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1276 | libgromacs_mpi.so.9.0.0 |
○ | CpuPpLongRangeNonbondeds::calc[...] | force.cpp:261 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2073 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 | |
►12.70+ | .omp_outlined..49 | pme.cpp:1303 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1276 | libgromacs_mpi.so.9.0.0 |
○ | CpuPpLongRangeNonbondeds::calc[...] | force.cpp:261 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2073 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
►6.04+ | .omp_outlined..49 | pme.cpp:1303 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1276 | libgromacs_mpi.so.9.0.0 |
○ | CpuPpLongRangeNonbondeds::calc[...] | force.cpp:261 | libgromacs_mpi.so.9.0.0 |
○ | do_force(_IO_FILE*, t_commrec [...] | sim_util.cpp:2073 | libgromacs_mpi.so.9.0.0 |
○ | gmx::LegacySimulator::do_md() | md.cpp:1248 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2311 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►66.43+ | .omp_outlined..49 | pme.cpp:1303 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1276 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pmeonly(gmx_pme_t**, t_com[...] | stl_vector.h:1169 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2330 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
►24.29+ | .omp_outlined..49 | pme.cpp:1303 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1276 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pmeonly(gmx_pme_t**, t_com[...] | stl_vector.h:1169 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2330 | libgromacs_mpi.so.9.0.0 |
►9.22+ | .omp_outlined..49 | pme.cpp:1303 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1276 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pmeonly(gmx_pme_t**, t_com[...] | stl_vector.h:1169 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2330 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►60.37+ | .omp_outlined..49 | pme.cpp:1303 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1276 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pmeonly(gmx_pme_t**, t_com[...] | stl_vector.h:1169 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2330 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 | |
►27.75+ | .omp_outlined..49 | pme.cpp:1303 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1276 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pmeonly(gmx_pme_t**, t_com[...] | stl_vector.h:1169 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2330 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
►11.88+ | .omp_outlined..49 | pme.cpp:1303 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1276 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pmeonly(gmx_pme_t**, t_com[...] | stl_vector.h:1169 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2330 | libgromacs_mpi.so.9.0.0 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►46.23+ | .omp_outlined..49 | pme.cpp:1303 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1276 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pmeonly(gmx_pme_t**, t_com[...] | stl_vector.h:1169 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2330 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
►34.91+ | .omp_outlined..49 | pme.cpp:1303 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1276 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pmeonly(gmx_pme_t**, t_com[...] | stl_vector.h:1169 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2330 | libgromacs_mpi.so.9.0.0 |
►18.87+ | .omp_outlined..49 | pme.cpp:1303 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1276 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pmeonly(gmx_pme_t**, t_com[...] | stl_vector.h:1169 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2330 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►99.95+ | .omp_outlined..49 | pme.cpp:1303 | libgromacs_mpi.so.9.0.0 |
○ | __kmp_invoke_microtask | libomp.so | |
○ | __kmp_fork_call | libomp.so | |
○ | __kmpc_fork_call | libomp.so | |
○ | gmx_pme_do(gmx_pme_t*, gmx::Ar[...] | pme.cpp:1276 | libgromacs_mpi.so.9.0.0 |
○ | gmx_pmeonly(gmx_pme_t**, t_com[...] | stl_vector.h:1169 | libgromacs_mpi.so.9.0.0 |
○ | gmx::Mdrunner::mdrunner() | runner.cpp:2330 | libgromacs_mpi.so.9.0.0 |
○ | gmx::gmx_mdrun(int, gmx_hw_inf[...] | mdrun.cpp:280 | gmx_mpi |
○ | gmx::gmx_mdrun(int, char**) | mdrun.cpp:82 | gmx_mpi |
○ | gmx::CommandLineModuleManager:[...] | cmdlinemodulemanager.cpp:569 | libgromacs_mpi.so.9.0.0 |
○ | main | gmx.cpp:58 | gmx_mpi |
○ | __libc_start_call_main | libc.so.6 |
Path / |
The code analyzed by CQA in that panel excludes loops and represents 0.00% of application time for run 1x1
Source file and lines | pme_solve.cpp:233-585 |
Module | libgromacs_mpi.so.9.0.0 |
nb instructions | 277 |
nb uops | 287 |
loop length | 1624 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 23 |
used ymm registers | 13 |
used zmm registers | 4 |
nb stack references | 85 |
micro-operation queue | 47.83 cycles |
front end | 47.83 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 15.00 | 15.00 | 14.75 | 14.75 | 4.50 | 45.33 | 45.33 | 45.33 | 12.25 | 12.25 | 12.33 | 12.17 | 22.00 | 22.00 |
cycles | 15.00 | 15.00 | 14.75 | 14.75 | 4.50 | 46.33 | 46.33 | 46.33 | 12.25 | 12.25 | 12.33 | 12.17 | 22.00 | 22.00 |
Cycles executing div or sqrt instructions | 22.00 |
Front-end | 47.83 |
Dispatch | 46.33 |
DIV/SQRT | 22.00 |
Overall L1 | 47.83 |
all | 33% |
load | 100% |
store | 16% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 100% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 45% |
all | 40% |
load | 26% |
store | 60% |
mul | 40% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 47% |
all | 36% |
load | 43% |
store | 26% |
mul | 40% |
add-sub | 100% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 48% |
all | 24% |
load | 64% |
store | 19% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 35% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 26% |
all | 17% |
load | 15% |
store | 22% |
mul | 15% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 12% |
other | 15% |
all | 21% |
load | 26% |
store | 19% |
mul | 15% |
add-sub | 35% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 22% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput | Vectorization |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
AND $-0x40,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
SUB $0x4c0,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RDI,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
VMOVSS 0x50(%RDI),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VMOVSS %XMM1,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 | scal (6.3%) |
VMOVSS 0x58(%RDI),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VMOVSS %XMM1,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 | scal (6.3%) |
MOV %R8D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
MOV %ECX,%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
MOV %EDX,0x94(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
VMOVSS %XMM0,0x2a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 | scal (6.3%) |
MOV %RSI,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
MOV 0x44(%RDI),%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV 0x580(%RDI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
VMOVSD 0x3c(%R14),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (12.5%) |
VMOVAPS %XMM0,0x220(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (25.0%) |
LEA 0x2f4(%RSP),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA 0xdc(%RSP),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA 0x134(%RSP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA 0x214(%RSP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CALL fb5700 <@plt_start@+0x12250> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
MOV 0x780(%R14),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOVSXD %R13D,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV 0xe4(%RSP),%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV 0xe0(%RSP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
IMUL %R9D,%ESI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | N/A |
MOV %ESI,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
IMUL %EDI,%EAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | N/A |
CLTD | scal (6.3%) | |||||||||||||||||
IDIV %R12D | 2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 9-14 | 6 | scal (6.3%) |
MOV %EAX,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (6.3%) |
LEA (%RDI,%RDI,4),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
INC %EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
IMUL %ESI,%EDI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | N/A |
MOV %EDI,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
CLTD | scal (6.3%) | |||||||||||||||||
IDIV %R12D | 2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 9-14 | 6 | scal (6.3%) |
SAL $0x5,%R8 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
CMP %EAX,%R11D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
MOV %RCX,0x1b8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %ESI,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOV %R8,0x1b0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
JGE c0df8e <_Z13solve_pme_yzxPK9gmx_pme_tP9t_complexfbii+0x21ae> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
VMOVSS 0x40(%RSP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VMULSS %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 | scal (6.3%) |
VCVTSS2SD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 | scal (6.3%) |
VMOVSD -0x8af225(%RIP),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (12.5%) |
VDIVSD %XMM0,%XMM1,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 13 | 5 | scal (12.5%) |
VCVTSD2SS %XMM0,%XMM0,%XMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 | scal (12.5%) |
VMOVSS 0x5d0(%R14),%XMM22 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VMOVSS 0x5dc(%R14),%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VMOVSS 0x5e0(%R14),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VMOVSS %XMM0,0x54(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 | scal (6.3%) |
VMOVSS 0x5e8(%R14),%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VMOVSS 0x5ec(%R14),%XMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VMOVSS 0x5f0(%R14),%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VPCMPEQD %XMM3,%XMM3,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 | vect (25.0%) |
VMOVDQA 0x220(%RSP),%XMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 | vect (25.0%) |
VPSUBD %XMM3,%XMM12,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 | vect (25.0%) |
VPSRLD $0x1f,%XMM3,%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 | vect (25.0%) |
VMOVUPS 0x8(%RCX,%R8,1),%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 | vect (50.0%) |
VMOVDQU 0x28(%RCX,%R8,1),%XMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 | vect (25.0%) |
VMOVSS 0x18(%RSP),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VCVTSS2SD %XMM1,%XMM1,%XMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 | scal (6.3%) |
VMOVSD -0x8aeb83(%RIP),%XMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (12.5%) |
VPADDD %XMM5,%XMM3,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 | vect (25.0%) |
VDIVSD %XMM7,%XMM8,%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 13 | 5 | scal (12.5%) |
VCVTSD2SS %XMM5,%XMM5,%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 | scal (12.5%) |
VMOVSS 0x2a0(%RSP),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VCVTSS2SD %XMM1,%XMM1,%XMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 | scal (6.3%) |
VPSRAD $0x1,%XMM3,%XMM13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 | vect (25.0%) |
VMULSD -0x8af61b(%RIP),%XMM7,%XMM26 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 | scal (12.5%) |
MOV %EBX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
INC %EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
SHR $0x1f,%EDX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
ADD %EBX,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
INC %EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
SAR $0x1,%EDX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
MOV %EDX,0xd4(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOV 0x134(%RSP),%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV 0xdc(%RSP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
LEA (%RSI,%RDX,1),%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
VXORPS -0x8afdfa(%RIP){1to4},%XMM19,%XMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.50 | vect (25.0%) |
MOV %R9D,0x1c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
VMOVD %XMM13,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 5 | 1 | scal (6.3%) |
MOV %RDX,0x208(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %RSI,0xb8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
ADD %ESI,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
ADD $0xf,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
AND $-0x10,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
VBROADCASTSS %XMM5,%ZMM25 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 1 | scal (6.3%) |
MOV %RDX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
SHR $0x4,%RSI | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
MOV %RSI,0x118(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
OR $0xf,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RDX,0x128(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %R9D,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOVSXD %R9D,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %EDI,0x64(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOVSXD %EDI,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
VPBROADCASTQ %RDX,%YMM3 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 | scal (12.5%) |
VPSLLQ $0x2,%YMM3,%YMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 | vect (50.0%) |
VMOVDQA64 -0x888419(%RIP),%ZMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | vect (100.0%) |
VPADDQ %YMM0,%YMM5,%YMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 | vect (50.0%) |
VPERMQ %ZMM5,%ZMM7,%ZMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 5 | 1 | vect (100.0%) |
VMOVDQA64 %ZMM7,0x440(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 1 | 1 | 4 | 2 | vect (100.0%) |
VMOVDQA64 -0x8883f5(%RIP),%ZMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | vect (100.0%) |
VPERMQ %ZMM5,%ZMM7,%ZMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 5 | 1 | vect (100.0%) |
VMOVDQA64 %ZMM7,0x400(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 1 | 1 | 4 | 2 | vect (100.0%) |
VPSLLQ $0x2,%XMM3,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 | vect (25.0%) |
VPADDQ %XMM3,%XMM9,%XMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 | vect (25.0%) |
MOV %RDI,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
SUB %RDX,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
VPERMQ $0x54,%YMM7,%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 4 | 0.50 | vect (50.0%) |
VMOVDQA %YMM3,0x340(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (50.0%) |
VEXTRACTI128 $0x1,%YMM0,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 | vect (25.0%) |
VPERMQ $0x5,%YMM7,%YMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 4 | 0.50 | vect (50.0%) |
VBROADCASTSS %XMM22,%YMM31 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VBROADCASTSS %XMM2,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VBROADCASTSS %XMM4,%YMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VBROADCASTSS %XMM6,%YMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VBROADCASTSS %XMM11,%YMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
MOV %RDX,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
NEG %R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %R9,0x110(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %RSI,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
AND $-0x20,%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
VPBROADCASTD %XMM13,%YMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VPADDD -0x8a3d6b(%RIP),%YMM8,%YMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.50 | vect (50.0%) |
VMOVDQA %YMM8,0x2c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (50.0%) |
VPBROADCASTD %XMM12,%YMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
VMOVDQA64 -0x888447(%RIP),%ZMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | vect (100.0%) |
NEG %RBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RBX,0x1f0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
VPERMI2Q %ZMM7,%ZMM5,%ZMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 5 | 1 | vect (100.0%) |
VMOVDQA64 %ZMM8,0x3c0(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 1 | 1 | 4 | 2 | vect (100.0%) |
VMOVDQA -0x8a3c88(%RIP),%YMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 | vect (50.0%) |
VMOVDQA %YMM10,0x320(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (50.0%) |
VPERMI2Q %YMM5,%YMM10,%YMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 4 | 0.50 | vect (50.0%) |
VMOVDQA %YMM8,0x300(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (50.0%) |
MOV %RSI,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
AND $-0x8,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
VMOVD %XMM12,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 5 | 1 | scal (6.3%) |
MOV %EBX,0xc4(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
NEG %EBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RBX,0x108(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
VXORPS %XMM28,%XMM28,%XMM28 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | vect (25.0%) |
VPEXTRQ $0x1,%XMM7,0x1e8(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 | scal (12.5%) |
VXORPS %XMM29,%XMM29,%XMM29 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | vect (25.0%) |
VPEXTRD $0x1,%XMM12,0xd0(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 | scal (6.3%) |
MOV 0x214(%RSP),%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %R14,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV 0x21c(%RSP),%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %EBX,0xcc(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
IMUL %EBX,%R14D | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | N/A |
MOV %R14D,0xc8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
VPEXTRQ $0x1,%XMM3,%RBX | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 | scal (12.5%) |
MOV %RBX,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
VMOVQ %XMM3,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 | scal (12.5%) |
MOV %EAX,0xd8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
MOV 0x40(%RCX,%R8,1),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV 0x48(%RCX,%R8,1),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RDX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
MOVSXD 0x138(%RSP),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
MOV %RDX,0x200(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOVSXD 0x13c(%RSP),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
MOV %RDX,0x1f8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
VPEXTRQ $0x1,%XMM9,%R12 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 | scal (12.5%) |
LEA (,%R8,4),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RDX,0x100(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
VMOVDQA %XMM9,0x290(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (25.0%) |
VMOVQ %XMM9,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 | scal (12.5%) |
LEA (%R9,%R8,1),%R13 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %R13,0x1d8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
VMOVQ %XMM0,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 | scal (12.5%) |
VMOVAPS %YMM0,0x360(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (50.0%) |
VPEXTRQ $0x1,%XMM0,%R10 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 | scal (12.5%) |
MOV %RSI,0x1a8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA (%RSI,%R8,1),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RSI,0x1a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA 0x60(%RDX),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RSI,0x1d0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA 0x60(%R12),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RSI,0x1c8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA 0x60(,%R8,4),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RSI,0x1c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %RDX,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA 0x60(%RDX,%R8,4),%RDX | 2 | 0 | 0 | 0.50 | 0.50 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 | N/A |
MOV %RDX,0xf0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA 0x60(%R12,%R8,4),%RDX | 2 | 0 | 0 | 0.50 | 0.50 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 | N/A |
MOV %RDX,0xe8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA 0x40(%RAX),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RDX,0x178(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA 0x20(%R15),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RDX,0x170(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %R13,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA (%R13,%R8,4),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RDX,0x198(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %R10,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA (%R10,%R8,4),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RDX,0x190(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %R14,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA (%R14,%R8,4),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RDX,0x188(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA (%RBX,%R8,4),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RDX,0x180(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA 0x60(%RBX),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RDX,0x168(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %RCX,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA 0x60(%RCX),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RCX,0x160(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
VMOVSS -0x8b014b(%RIP),%XMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VMOVAPS -0x8a733f(%RIP),%YMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 | vect (50.0%) |
VMOVAPS -0x8a6907(%RIP),%YMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 | vect (50.0%) |
VXORPS %XMM30,%XMM30,%XMM30 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | vect (25.0%) |
MOV %RAX,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
VMOVAPS %XMM19,0x280(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (25.0%) |
VMOVAPS %XMM20,%XMM24 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | vect (25.0%) |
VMOVSS %XMM20,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 | scal (6.3%) |
VMOVDQA64 %XMM13,%XMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | vect (25.0%) |
VMOVDQA %XMM13,0x270(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (25.0%) |
VMOVAPD %XMM26,%XMM23 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | vect (25.0%) |
VMOVSD %XMM26,0xf8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 | scal (12.5%) |
VMOVAPS %ZMM25,0x380(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 1 | 1 | 5 | 2 | vect (100.0%) |
VMOVAPS %XMM22,0x260(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (25.0%) |
VMOVAPS %XMM4,0x150(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (25.0%) |
VMOVAPS %XMM6,0x140(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (25.0%) |
VMOVAPS %YMM15,0x2a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (50.0%) |
VMOVAPS %XMM2,0x250(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (25.0%) |
VMOVDQA64 %YMM16,0x220(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (50.0%) |
MOV 0x30(%RSP),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV 0x1c(%RSP),%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %R8,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %RDI,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %R9,0x120(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
JMP c0c3a6 <_Z13solve_pme_yzxPK9gmx_pme_tP9t_complexfbii+0x5c6> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
VXORPS %XMM28,%XMM28,%XMM28 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | vect (25.0%) |
VXORPS %XMM29,%XMM29,%XMM29 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | vect (25.0%) |
VXORPS %XMM30,%XMM30,%XMM30 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | vect (25.0%) |
CMPB $0,0x94(%RSP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
JE c0dffe <_Z13solve_pme_yzxPK9gmx_pme_tP9t_complexfbii+0x221e> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
VMULPS -0x8ae574(%RIP),%XMM30,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 | vect (25.0%) |
VMULPS -0x8b1c9a(%RIP){1to4},%XMM28,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 | vect (25.0%) |
VMULSS -0x8b1ca4(%RIP),%XMM29,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 | scal (6.3%) |
MOV 0x1b8(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV 0x1b0(%RSP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
VMOVSS %XMM2,0x74(%RAX,%RCX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 | scal (6.3%) |
VEXTRACTPS $0x1,%XMM1,0x58(%RAX,%RCX,1) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 | scal (6.3%) |
VPERMILPS $-0x14,%XMM1,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 | vect (25.0%) |
VMOVLPS %XMM2,0x6c(%RAX,%RCX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 | vect (12.5%) |
VMOVUPS %XMM1,0x5c(%RAX,%RCX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (25.0%) |
VMOVLPS %XMM0,0x50(%RAX,%RCX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 | vect (12.5%) |
MOV 0xc0(%RSP),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
IMUL 0xdc(%RSP),%EAX | 1 | 0 | 1 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | N/A |
LEA -0x28(%RBP),%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | vect (25.0%) |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
The code analyzed by CQA in that panel excludes loops and represents 0.00% of application time for run 1x1
Source file and lines | pme_solve.cpp:233-585 |
Module | libgromacs_mpi.so.9.0.0 |
nb instructions | 277 |
nb uops | 287 |
loop length | 1624 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 23 |
used ymm registers | 13 |
used zmm registers | 4 |
nb stack references | 85 |
micro-operation queue | 47.83 cycles |
front end | 47.83 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 15.00 | 15.00 | 14.75 | 14.75 | 4.50 | 45.33 | 45.33 | 45.33 | 12.25 | 12.25 | 12.33 | 12.17 | 22.00 | 22.00 |
cycles | 15.00 | 15.00 | 14.75 | 14.75 | 4.50 | 46.33 | 46.33 | 46.33 | 12.25 | 12.25 | 12.33 | 12.17 | 22.00 | 22.00 |
Cycles executing div or sqrt instructions | 22.00 |
Front-end | 47.83 |
Dispatch | 46.33 |
DIV/SQRT | 22.00 |
Overall L1 | 47.83 |
all | 33% |
load | 100% |
store | 16% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 100% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 45% |
all | 40% |
load | 26% |
store | 60% |
mul | 40% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 47% |
all | 36% |
load | 43% |
store | 26% |
mul | 40% |
add-sub | 100% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 48% |
all | 24% |
load | 64% |
store | 19% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 35% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 26% |
all | 17% |
load | 15% |
store | 22% |
mul | 15% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 12% |
other | 15% |
all | 21% |
load | 26% |
store | 19% |
mul | 15% |
add-sub | 35% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 22% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput | Vectorization |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
AND $-0x40,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
SUB $0x4c0,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RDI,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
VMOVSS 0x50(%RDI),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VMOVSS %XMM1,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 | scal (6.3%) |
VMOVSS 0x58(%RDI),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VMOVSS %XMM1,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 | scal (6.3%) |
MOV %R8D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
MOV %ECX,%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
MOV %EDX,0x94(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
VMOVSS %XMM0,0x2a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 | scal (6.3%) |
MOV %RSI,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
MOV 0x44(%RDI),%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV 0x580(%RDI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
VMOVSD 0x3c(%R14),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (12.5%) |
VMOVAPS %XMM0,0x220(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (25.0%) |
LEA 0x2f4(%RSP),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA 0xdc(%RSP),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA 0x134(%RSP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
LEA 0x214(%RSP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
CALL fb5700 <@plt_start@+0x12250> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | N/A |
MOV 0x780(%R14),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOVSXD %R13D,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV 0xe4(%RSP),%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV 0xe0(%RSP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
IMUL %R9D,%ESI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | N/A |
MOV %ESI,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
IMUL %EDI,%EAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | N/A |
CLTD | scal (6.3%) | |||||||||||||||||
IDIV %R12D | 2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 9-14 | 6 | scal (6.3%) |
MOV %EAX,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | scal (6.3%) |
LEA (%RDI,%RDI,4),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
INC %EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
IMUL %ESI,%EDI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | N/A |
MOV %EDI,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
CLTD | scal (6.3%) | |||||||||||||||||
IDIV %R12D | 2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 9-14 | 6 | scal (6.3%) |
SAL $0x5,%R8 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
CMP %EAX,%R11D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (6.3%) |
MOV %RCX,0x1b8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %ESI,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOV %R8,0x1b0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
JGE c0df8e <_Z13solve_pme_yzxPK9gmx_pme_tP9t_complexfbii+0x21ae> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
VMOVSS 0x40(%RSP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VMULSS %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 | scal (6.3%) |
VCVTSS2SD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 | scal (6.3%) |
VMOVSD -0x8af225(%RIP),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (12.5%) |
VDIVSD %XMM0,%XMM1,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 13 | 5 | scal (12.5%) |
VCVTSD2SS %XMM0,%XMM0,%XMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 | scal (12.5%) |
VMOVSS 0x5d0(%R14),%XMM22 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VMOVSS 0x5dc(%R14),%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VMOVSS 0x5e0(%R14),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VMOVSS %XMM0,0x54(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 | scal (6.3%) |
VMOVSS 0x5e8(%R14),%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VMOVSS 0x5ec(%R14),%XMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VMOVSS 0x5f0(%R14),%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VPCMPEQD %XMM3,%XMM3,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 | vect (25.0%) |
VMOVDQA 0x220(%RSP),%XMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 | vect (25.0%) |
VPSUBD %XMM3,%XMM12,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 | vect (25.0%) |
VPSRLD $0x1f,%XMM3,%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 | vect (25.0%) |
VMOVUPS 0x8(%RCX,%R8,1),%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 | vect (50.0%) |
VMOVDQU 0x28(%RCX,%R8,1),%XMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 | vect (25.0%) |
VMOVSS 0x18(%RSP),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VCVTSS2SD %XMM1,%XMM1,%XMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 | scal (6.3%) |
VMOVSD -0x8aeb83(%RIP),%XMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (12.5%) |
VPADDD %XMM5,%XMM3,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 | vect (25.0%) |
VDIVSD %XMM7,%XMM8,%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 13 | 5 | scal (12.5%) |
VCVTSD2SS %XMM5,%XMM5,%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 | scal (12.5%) |
VMOVSS 0x2a0(%RSP),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VCVTSS2SD %XMM1,%XMM1,%XMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 3 | 0.50 | scal (6.3%) |
VPSRAD $0x1,%XMM3,%XMM13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 | vect (25.0%) |
VMULSD -0x8af61b(%RIP),%XMM7,%XMM26 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 | scal (12.5%) |
MOV %EBX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
INC %EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
SHR $0x1f,%EDX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
ADD %EBX,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
INC %EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
SAR $0x1,%EDX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
MOV %EDX,0xd4(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOV 0x134(%RSP),%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV 0xdc(%RSP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
LEA (%RSI,%RDX,1),%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
VXORPS -0x8afdfa(%RIP){1to4},%XMM19,%XMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.50 | vect (25.0%) |
MOV %R9D,0x1c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
VMOVD %XMM13,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 5 | 1 | scal (6.3%) |
MOV %RDX,0x208(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %RSI,0xb8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
ADD %ESI,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
ADD $0xf,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
AND $-0x10,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
VBROADCASTSS %XMM5,%ZMM25 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 1 | scal (6.3%) |
MOV %RDX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
SHR $0x4,%RSI | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
MOV %RSI,0x118(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
OR $0xf,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RDX,0x128(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %R9D,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOVSXD %R9D,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %EDI,0x64(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOVSXD %EDI,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
VPBROADCASTQ %RDX,%YMM3 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 | scal (12.5%) |
VPSLLQ $0x2,%YMM3,%YMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 | vect (50.0%) |
VMOVDQA64 -0x888419(%RIP),%ZMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | vect (100.0%) |
VPADDQ %YMM0,%YMM5,%YMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 | vect (50.0%) |
VPERMQ %ZMM5,%ZMM7,%ZMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 5 | 1 | vect (100.0%) |
VMOVDQA64 %ZMM7,0x440(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 1 | 1 | 4 | 2 | vect (100.0%) |
VMOVDQA64 -0x8883f5(%RIP),%ZMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | vect (100.0%) |
VPERMQ %ZMM5,%ZMM7,%ZMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 5 | 1 | vect (100.0%) |
VMOVDQA64 %ZMM7,0x400(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 1 | 1 | 4 | 2 | vect (100.0%) |
VPSLLQ $0x2,%XMM3,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 | vect (25.0%) |
VPADDQ %XMM3,%XMM9,%XMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 | vect (25.0%) |
MOV %RDI,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
SUB %RDX,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
VPERMQ $0x54,%YMM7,%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 4 | 0.50 | vect (50.0%) |
VMOVDQA %YMM3,0x340(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (50.0%) |
VEXTRACTI128 $0x1,%YMM0,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 | vect (25.0%) |
VPERMQ $0x5,%YMM7,%YMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 4 | 0.50 | vect (50.0%) |
VBROADCASTSS %XMM22,%YMM31 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VBROADCASTSS %XMM2,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VBROADCASTSS %XMM4,%YMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VBROADCASTSS %XMM6,%YMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VBROADCASTSS %XMM11,%YMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
MOV %RDX,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
NEG %R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %R9,0x110(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %RSI,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
AND $-0x20,%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
VPBROADCASTD %XMM13,%YMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VPADDD -0x8a3d6b(%RIP),%YMM8,%YMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.50 | vect (50.0%) |
VMOVDQA %YMM8,0x2c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (50.0%) |
VPBROADCASTD %XMM12,%YMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
VMOVDQA64 -0x888447(%RIP),%ZMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | vect (100.0%) |
NEG %RBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RBX,0x1f0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
VPERMI2Q %ZMM7,%ZMM5,%ZMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 5 | 1 | vect (100.0%) |
VMOVDQA64 %ZMM8,0x3c0(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 1 | 1 | 4 | 2 | vect (100.0%) |
VMOVDQA -0x8a3c88(%RIP),%YMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 | vect (50.0%) |
VMOVDQA %YMM10,0x320(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (50.0%) |
VPERMI2Q %YMM5,%YMM10,%YMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 4 | 0.50 | vect (50.0%) |
VMOVDQA %YMM8,0x300(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (50.0%) |
MOV %RSI,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
AND $-0x8,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
VMOVD %XMM12,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 5 | 1 | scal (6.3%) |
MOV %EBX,0xc4(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
NEG %EBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RBX,0x108(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
VXORPS %XMM28,%XMM28,%XMM28 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | vect (25.0%) |
VPEXTRQ $0x1,%XMM7,0x1e8(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 | scal (12.5%) |
VXORPS %XMM29,%XMM29,%XMM29 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | vect (25.0%) |
VPEXTRD $0x1,%XMM12,0xd0(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 | scal (6.3%) |
MOV 0x214(%RSP),%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %R14,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV 0x21c(%RSP),%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %EBX,0xcc(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
IMUL %EBX,%R14D | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | N/A |
MOV %R14D,0xc8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
VPEXTRQ $0x1,%XMM3,%RBX | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 | scal (12.5%) |
MOV %RBX,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
VMOVQ %XMM3,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 | scal (12.5%) |
MOV %EAX,0xd8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (6.3%) |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
MOV 0x40(%RCX,%R8,1),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV 0x48(%RCX,%R8,1),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %RDX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | N/A |
MOVSXD 0x138(%RSP),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
MOV %RDX,0x200(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOVSXD 0x13c(%RSP),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
MOV %RDX,0x1f8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
VPEXTRQ $0x1,%XMM9,%R12 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 | scal (12.5%) |
LEA (,%R8,4),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RDX,0x100(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
VMOVDQA %XMM9,0x290(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (25.0%) |
VMOVQ %XMM9,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 | scal (12.5%) |
LEA (%R9,%R8,1),%R13 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %R13,0x1d8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
VMOVQ %XMM0,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 | scal (12.5%) |
VMOVAPS %YMM0,0x360(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (50.0%) |
VPEXTRQ $0x1,%XMM0,%R10 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 | scal (12.5%) |
MOV %RSI,0x1a8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA (%RSI,%R8,1),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RSI,0x1a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA 0x60(%RDX),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RSI,0x1d0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA 0x60(%R12),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RSI,0x1c8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA 0x60(,%R8,4),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RSI,0x1c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %RDX,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA 0x60(%RDX,%R8,4),%RDX | 2 | 0 | 0 | 0.50 | 0.50 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 | N/A |
MOV %RDX,0xf0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA 0x60(%R12,%R8,4),%RDX | 2 | 0 | 0 | 0.50 | 0.50 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 | N/A |
MOV %RDX,0xe8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA 0x40(%RAX),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RDX,0x178(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA 0x20(%R15),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RDX,0x170(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %R13,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA (%R13,%R8,4),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RDX,0x198(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %R10,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA (%R10,%R8,4),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RDX,0x190(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %R14,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA (%R14,%R8,4),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RDX,0x188(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA (%RBX,%R8,4),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RDX,0x180(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA 0x60(%RBX),%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RDX,0x168(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %RCX,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
LEA 0x60(%RCX),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
MOV %RCX,0x160(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
VMOVSS -0x8b014b(%RIP),%XMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | scal (6.3%) |
VMOVAPS -0x8a733f(%RIP),%YMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 | vect (50.0%) |
VMOVAPS -0x8a6907(%RIP),%YMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 | vect (50.0%) |
VXORPS %XMM30,%XMM30,%XMM30 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | vect (25.0%) |
MOV %RAX,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
VMOVAPS %XMM19,0x280(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (25.0%) |
VMOVAPS %XMM20,%XMM24 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | vect (25.0%) |
VMOVSS %XMM20,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 | scal (6.3%) |
VMOVDQA64 %XMM13,%XMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | vect (25.0%) |
VMOVDQA %XMM13,0x270(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (25.0%) |
VMOVAPD %XMM26,%XMM23 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | vect (25.0%) |
VMOVSD %XMM26,0xf8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 | scal (12.5%) |
VMOVAPS %ZMM25,0x380(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 1 | 1 | 5 | 2 | vect (100.0%) |
VMOVAPS %XMM22,0x260(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (25.0%) |
VMOVAPS %XMM4,0x150(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (25.0%) |
VMOVAPS %XMM6,0x140(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (25.0%) |
VMOVAPS %YMM15,0x2a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (50.0%) |
VMOVAPS %XMM2,0x250(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (25.0%) |
VMOVDQA64 %YMM16,0x220(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (50.0%) |
MOV 0x30(%RSP),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV 0x1c(%RSP),%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV %R8,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %RDI,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
MOV %R9,0x120(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 | scal (12.5%) |
JMP c0c3a6 <_Z13solve_pme_yzxPK9gmx_pme_tP9t_complexfbii+0x5c6> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
VXORPS %XMM28,%XMM28,%XMM28 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | vect (25.0%) |
VXORPS %XMM29,%XMM29,%XMM29 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | vect (25.0%) |
VXORPS %XMM30,%XMM30,%XMM30 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 | vect (25.0%) |
CMPB $0,0x94(%RSP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
JE c0dffe <_Z13solve_pme_yzxPK9gmx_pme_tP9t_complexfbii+0x221e> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 | N/A |
VMULPS -0x8ae574(%RIP),%XMM30,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 | vect (25.0%) |
VMULPS -0x8b1c9a(%RIP){1to4},%XMM28,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 | vect (25.0%) |
VMULSS -0x8b1ca4(%RIP),%XMM29,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 3 | 0.50 | scal (6.3%) |
MOV 0x1b8(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
MOV 0x1b0(%RSP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
VMOVSS %XMM2,0x74(%RAX,%RCX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 | scal (6.3%) |
VEXTRACTPS $0x1,%XMM1,0x58(%RAX,%RCX,1) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0.33 | 0.33 | 0.50 | 0.50 | 6 | 1 | scal (6.3%) |
VPERMILPS $-0x14,%XMM1,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 | vect (25.0%) |
VMOVLPS %XMM2,0x6c(%RAX,%RCX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 | vect (12.5%) |
VMOVUPS %XMM1,0x5c(%RAX,%RCX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 | vect (25.0%) |
VMOVLPS %XMM0,0x50(%RAX,%RCX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 | vect (12.5%) |
MOV 0xc0(%RSP),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 | N/A |
IMUL 0xdc(%RSP),%EAX | 1 | 0 | 1 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 | N/A |
LEA -0x28(%RBP),%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | N/A |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | vect (25.0%) |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 | N/A |
Run 1x1 | Number processes: 1; Number processes per node: 1; OMP_NUM_THREADS: 1 |
---|---|
Run 2x1 | Number processes: 2; Number processes per node: 2; OMP_NUM_THREADS: 1 |
Run 4x1 | Number processes: 4; Number processes per node: 4; OMP_NUM_THREADS: 1 |
Run 8x1 | Number processes: 8; Number processes per node: 8; OMP_NUM_THREADS: 1 |
Run 16x1 | Number processes: 16; Number processes per node: 16; OMP_NUM_THREADS: 1 |
Run 32x1 | Number processes: 32; Number processes per node: 32; OMP_NUM_THREADS: 1 |
Run 64x1 | Number processes: 64; Number processes per node: 64; OMP_NUM_THREADS: 1 |
Run 128x1 | Number processes: 128; Number processes per node: 128; OMP_NUM_THREADS: 1 |
Run 192x1 | Number processes: 192; Number nodes: 1; Number processes per node: 192; Run Command: <executable> mdrun -s ion_channel.tpr -nsteps 10000 -pin on -deffnm aocc; MPI Command: mpirun -genv I_MPI_FABRICS=shm -n <number_processes>; Dataset: ; Run Directory: .; OMP_NUM_THREADS: 1 |
(1x1) Efficiency | (1x1) Potential Speed-Up (%) | (2x1) Efficiency | (2x1) Potential Speed-Up (%) | (4x1) Efficiency | (4x1) Potential Speed-Up (%) | (8x1) Efficiency | (8x1) Potential Speed-Up (%) | (16x1) Efficiency | (16x1) Potential Speed-Up (%) | (32x1) Efficiency | (32x1) Potential Speed-Up (%) | (64x1) Efficiency | (64x1) Potential Speed-Up (%) | (128x1) Efficiency | (128x1) Potential Speed-Up (%) | (192x1) Efficiency | (192x1) Potential Speed-Up (%) |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
1 | 0 | 0.97 | 0.03 | 0.99 | 0.01 | 1.04 | 0 | 1.04 | 0 | 1.01 | 0 | 1 | -0 | 0.94 | 0.03 | 0.91 | 0.03 |
Run | Number of threads | Efficiency (ideal is 1) | Speedup | Ideal Speedup | Time (s) | Coverage (%) |
---|---|---|---|---|---|---|
1x1 | 1 | 1 | 1 | 1 | 8.5599908828735 | 1.0268646478653 |
2x1 | 2 | 0.97 | 1.95 | 2 | 4.4499940872192 | 0.96962505578995 |
4x1 | 4 | 0.99 | 3.97 | 4 | 2.2250008583069 | 0.86604428291321 |
8x1 | 8 | 1.04 | 8.28 | 8 | 1.254998922348 | 0.66797387599945 |
16x1 | 16 | 1.04 | 16.65 | 16 | 0.66499972343445 | 0.62168443202972 |
32x1 | 12 | 1.01 | 32.34 | 32 | 0.77999919652939 | 0.51500874757767 |
64x1 | 24 | 1 | 64.19 | 64 | 0.42999970912933 | 0.33551782369614 |
128x1 | 44 | 0.94 | 119.88 | 128 | 0.27000004053116 | 0.42014142870903 |
192x1 | 64 | 0.91 | 174.38 | 192 | 0.1900000423193 | 0.36442348361015 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼solve_pme_yzx(gmx_pme_t const*, t_complex*, float, bool, int, int)– | 0.36 | 0.05 |
▼Loop 17436 - pme_solve.cpp:233-560 - libgromacs_mpi.so.9.0.0– | 0.03 | 0.01 |
○Loop 17446 - pme_solve.cpp:498-510 - libgromacs_mpi.so.9.0.0 | 0.07 | 0.03 |
○Loop 17440 - pme_solve.cpp:233-233 - libgromacs_mpi.so.9.0.0 | 0.07 | 0.03 |
○Loop 17443 - pme_solve.cpp:521-530 - libgromacs_mpi.so.9.0.0 | 0.06 | 0.03 |
○Loop 17441 - pme_solve.cpp:533-542 - libgromacs_mpi.so.9.0.0 | 0.06 | 0.02 |
○Loop 17437 - pme_solve.cpp:556-560 - libgromacs_mpi.so.9.0.0 | 0.02 | 0.01 |
○Loop 17444 - pme_solve.cpp:523-530 - libgromacs_mpi.so.9.0.0 | 0.01 | 0.01 |
○Loop 17442 - pme_solve.cpp:535-542 - libgromacs_mpi.so.9.0.0 | 0.01 | 0.01 |
○Loop 17449 - pme_solve.cpp:233-233 - libgromacs_mpi.so.9.0.0 | 0.01 | 0.01 |
○Loop 17447 - pme_solve.cpp:487-495 - libgromacs_mpi.so.9.0.0 | 0.01 | 0.01 |
○Loop 17454 - pme_solve.cpp:458-469 - libgromacs_mpi.so.9.0.0 | 0.00 | 0.01 |
○Loop 17450 - pme_solve.cpp:474-474 - libgromacs_mpi.so.9.0.0 | 0.00 | 0.00 |
○Loop 17456 - pme_solve.cpp:442-453 - libgromacs_mpi.so.9.0.0 | 0.00 | 0.00 |
○Loop 17445 - pme_solve.cpp:485-495 - libgromacs_mpi.so.9.0.0 | 0.00 | 0.00 |
○Loop 17448 - pme_solve.cpp:487-495 - libgromacs_mpi.so.9.0.0 | 0.00 | 0.00 |
○Loop 17452 - pme_solve.cpp:474-474 - libgromacs_mpi.so.9.0.0 | 0.00 | 0.00 |
○Loop 17451 - pme_solve.cpp:472-474 - libgromacs_mpi.so.9.0.0 | 0.00 | 0.00 |
○Loop 17455 - pme_solve.cpp:440-453 - libgromacs_mpi.so.9.0.0 | 0.00 | 0.00 |
○Loop 17438 - pme_solve.cpp:554-560 - libgromacs_mpi.so.9.0.0 | 0.00 | 0.00 |
○Loop 17439 - pme_solve.cpp:556-560 - libgromacs_mpi.so.9.0.0 | 0.00 | 0.00 |
○Loop 17453 - pme_solve.cpp:456-469 - libgromacs_mpi.so.9.0.0 | 0.00 | 0.00 |