Function: miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evaluateGL(qmcp ... | Module: exec | Source: TwoBodyJastrowRef.h:268-432 [...] | Coverage: 0.17% |
---|
Function: miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evaluateGL(qmcp ... | Module: exec | Source: TwoBodyJastrowRef.h:268-432 [...] | Coverage: 0.17% |
---|
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/shared_ptr_base.h: 1308 - 1308 |
-------------------------------------------------------------------------------- |
1308: { return _M_ptr; } |
/scratch_na/users/xoserete/qaas_runs/171-417-3180/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/VectorSoAContainer.h: 231 - 273 |
-------------------------------------------------------------------------------- |
231: inline const AoSElement_t operator[](size_t i) const { return AoSElement_t(myData + i, nGhosts); } |
[...] |
244: *(_base + M * i) = rhs[i]; |
[...] |
263: inline Accessor operator()(size_t i) { return Accessor(myData + i, nGhosts); } |
[...] |
273: inline const T* restrict data(size_t i) const { return myData + i * nGhosts; } |
/scratch_na/users/xoserete/qaas_runs/171-417-3180/intel/miniqmc/build/miniqmc/src/Particle/ParticleSet.h: 313 - 316 |
-------------------------------------------------------------------------------- |
313: inline int first(int igroup) const { return (*group_offsets_)[igroup]; } |
314: |
315: ///return the last index of a group i |
316: inline int last(int igroup) const { return (*group_offsets_)[igroup + 1]; } |
/scratch_na/users/xoserete/qaas_runs/171-417-3180/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/TinyVector.h: 145 - 169 |
-------------------------------------------------------------------------------- |
145: X[i] = base[i * offset]; |
[...] |
169: inline Type_t& operator[](unsigned int i) { return X[i]; } |
/scratch_na/users/xoserete/qaas_runs/171-417-3180/intel/miniqmc/build/miniqmc/src/Particle/DistanceTable.h: 268 - 268 |
-------------------------------------------------------------------------------- |
268: const DistRow& getDistRow(int iel) const { return distances_[iel]; } |
/scratch_na/users/xoserete/qaas_runs/171-417-3180/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/Jastrow/TwoBodyJastrowRef.h: 268 - 432 |
-------------------------------------------------------------------------------- |
268: const int igt = P.GroupID[iat] * NumGroups; |
269: for (int jg = 0; jg < NumGroups; ++jg) |
270: { |
271: const FuncType& f2(*F[igt + jg]); |
272: int iStart = P.first(jg); |
273: int iEnd = std::min(jelmax, P.last(jg)); |
274: f2.evaluateVGL(iat, iStart, iEnd, dist, u, du, d2u, DistCompressed.data(), DistIndice.data()); |
[...] |
360: const auto& d_table = P.getDistTableAA(myTableID); |
361: for (int ig = 0; ig < NumGroups; ++ig) |
362: { |
363: const int igt = ig * NumGroups; |
364: for (int iat = P.first(ig), last = P.last(ig); iat < last; ++iat) |
365: { |
366: computeU3(P, iat, d_table.getDistRow(iat).data(), cur_u.data(), cur_du.data(), cur_d2u.data(), true); |
367: Uat[iat] = std::accumulate(cur_u.begin(), cur_u.begin() + iat, valT()); |
[...] |
375: for (int jat = 0; jat < iat; ++jat) |
376: lap += d2u[jat] + lapfac * du[jat]; |
377: for (int idim = 0; idim < OHMMS_DIM; ++idim) |
378: { |
379: const valT* restrict dX = displ.data(idim); |
380: valT s = valT(); |
381: for (int jat = 0; jat < iat; ++jat) |
382: s += du[jat] * dX[jat]; |
383: grad[idim] = s; |
384: } |
385: dUat(iat) = grad; |
386: d2Uat[iat] = -lap; |
387: // add the contribution from the upper triangle |
388: for (int jat = 0; jat < iat; jat++) |
389: { |
390: Uat[jat] += u[jat]; |
391: d2Uat[jat] -= d2u[jat] + lapfac * du[jat]; |
392: } |
393: for (int idim = 0; idim < OHMMS_DIM; ++idim) |
394: { |
395: valT* restrict save_g = dUat.data(idim); |
396: const valT* restrict dX = displ.data(idim); |
397: for (int jat = 0; jat < iat; jat++) |
398: save_g[jat] -= du[jat] * dX[jat]; |
[...] |
419: { |
420: if (fromscratch) |
421: recompute(P); |
422: LogValue = valT(0); |
423: for (int iat = 0; iat < N; ++iat) |
424: { |
425: LogValue += Uat[iat]; |
426: G[iat] += dUat[iat]; |
427: L[iat] += d2Uat[iat]; |
428: } |
429: |
430: constexpr valT mhalf(-0.5); |
431: LogValue = mhalf * LogValue; |
432: } |
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/stl_numeric.h: 126 - 127 |
-------------------------------------------------------------------------------- |
126: for (; __first != __last; ++__first) |
127: __init = __init + *__first; |
/scratch_na/users/xoserete/qaas_runs/171-417-3180/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/OhmmsVector.h: 223 - 249 |
-------------------------------------------------------------------------------- |
223: return X[i]; |
[...] |
229: return X[i]; |
[...] |
249: inline const_pointer data() const { return X; } |
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/stl_algobase.h: 200 - 754 |
-------------------------------------------------------------------------------- |
200: if (__b < __a) |
[...] |
752: for (__decltype(__n + 0) __niter = __n; |
753: __niter > 0; --__niter, (void) ++__first) |
754: *__first = __tmp; |
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/stl_iterator.h: 784 - 887 |
-------------------------------------------------------------------------------- |
784: : _M_current(__i) { } |
[...] |
887: { return __lhs.base() != __rhs.base(); } |
/scratch_na/users/xoserete/qaas_runs/171-417-3180/intel/miniqmc/build/miniqmc/src/Numerics/PETE/OperatorTags.h: 94 - 94 |
-------------------------------------------------------------------------------- |
94: (const_cast<T1&>(a) += b); |
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/stl_vector.h: 951 - 1056 |
-------------------------------------------------------------------------------- |
951: return *(this->_M_impl._M_start + __n); |
[...] |
1056: { return _M_data_ptr(this->_M_impl._M_start); } |
0x428bc0 PUSH %RBP |
0x428bc1 MOV %RSP,%RBP |
0x428bc4 PUSH %R15 |
0x428bc6 PUSH %R14 |
0x428bc8 PUSH %R13 |
0x428bca PUSH %R12 |
0x428bcc PUSH %RBX |
0x428bcd AND $-0x20,%RSP |
0x428bd1 SUB $0x160,%RSP |
0x428bd8 MOV %RCX,0x80(%RSP) |
0x428be0 MOV %RDX,0x78(%RSP) |
0x428be5 TEST %R8B,%R8B |
0x428be8 MOV %RDI,0x18(%RSP) |
0x428bed JE 429740 |
0x428bf3 MOV %RSI,%RBX |
0x428bf6 MOV 0x248(%RDI),%ESI |
0x428bfc MOV %RBX,%RDI |
0x428bff CALL 47a850 <_ZNK11qmcplusplus11ParticleSet14getDistTableAAEi> |
0x428c04 MOV 0x18(%RSP),%RDI |
0x428c09 MOV 0xa0(%RDI),%R9 |
0x428c10 TEST %R9,%R9 |
0x428c13 JE 429740 |
0x428c19 MOV %RAX,%R11 |
0x428c1c XOR %ECX,%ECX |
0x428c1e VMOVSD 0x116a40(%RIP),%XMM16 |
0x428c28 VBROADCASTSD 0x116a36(%RIP),%YMM17 |
0x428c32 VBROADCASTSD 0x1158f4(%RIP),%YMM18 |
0x428c3c VMOVSD 0x1158ea(%RIP),%XMM19 |
0x428c46 MOV %R9,%RAX |
0x428c49 MOV %R9,0x28(%RSP) |
0x428c4e MOV %RBX,0x50(%RSP) |
0x428c53 MOV %R11,0x20(%RSP) |
0x428c58 JMP 428ca6 |
0x428c5a NOPW %CS:(%RAX,%RAX,1) |
0x428c69 NOPW %CS:(%RAX,%RAX,1) |
0x428c78 NOPL (%RAX,%RAX,1) |
(368) 0x428c80 MOV 0x28(%RSP),%RAX |
(368) 0x428c85 MOV 0x88(%RSP),%RCX |
(368) 0x428c8d INC %RCX |
(368) 0x428c90 MOV %RAX,%RSI |
(368) 0x428c93 MOV %RAX,0x28(%RSP) |
(368) 0x428c98 CMP %RCX,%RAX |
(368) 0x428c9b MOV 0x50(%RSP),%RBX |
(368) 0x428ca0 JBE 429740 |
(368) 0x428ca6 MOV 0x268(%RBX),%RAX |
(368) 0x428cad MOV 0x18(%RAX),%RAX |
(368) 0x428cb1 MOVSXD (%RAX,%RCX,4),%RSI |
(368) 0x428cb5 MOV %RCX,0x88(%RSP) |
(368) 0x428cbd MOVSXD 0x4(%RAX,%RCX,4),%RAX |
(368) 0x428cc2 MOV %RAX,0x98(%RSP) |
(368) 0x428cca CMP %EAX,%ESI |
(368) 0x428ccc JGE 428c80 |
(368) 0x428cce MOV 0x140(%RDI),%R12 |
(368) 0x428cd5 MOV 0x158(%RDI),%R13 |
(368) 0x428cdc MOV 0x170(%RDI),%R15 |
(368) 0x428ce3 MOV $0x1fffffffffffffff,%RAX |
(368) 0x428ced ADD %RSI,%RAX |
(368) 0x428cf0 MOV %RAX,0x58(%RSP) |
(368) 0x428cf5 MOVQ $0,0x68(%RSP) |
(368) 0x428cfe LEA -0x1(%RSI),%RAX |
(368) 0x428d02 MOV %RAX,0x90(%RSP) |
(368) 0x428d0a JMP 428d68 |
0x428d0c NOPW %CS:(%RAX,%RAX,1) |
0x428d1b NOPW %CS:(%RAX,%RAX,1) |
0x428d2a NOPW %CS:(%RAX,%RAX,1) |
0x428d39 NOPL (%RAX) |
(369) 0x428d40 INC %RSI |
(369) 0x428d43 INCQ 0x68(%RSP) |
(369) 0x428d48 INCQ 0x58(%RSP) |
(369) 0x428d4d MOV 0x70(%RSP),%R9 |
(369) 0x428d52 MOV %R9,%RAX |
(369) 0x428d55 CMP 0x98(%RSP),%RSI |
(369) 0x428d5d MOV 0x18(%RSP),%RDI |
(369) 0x428d62 JE 428c85 |
(369) 0x428d68 MOV 0x48(%R11),%RAX |
(369) 0x428d6c LEA (%RSI,%RSI,4),%RCX |
(369) 0x428d70 MOV %RCX,0x38(%RSP) |
(369) 0x428d75 MOV 0x18(%RAX,%RCX,8),%R8 |
(369) 0x428d7a TEST %RSI,%RSI |
(369) 0x428d7d MOV %RSI,0x30(%RSP) |
(369) 0x428d82 MOV %R9,0x70(%RSP) |
(369) 0x428d87 JLE 428dd3 |
(369) 0x428d89 MOV %ESI,%EBX |
(369) 0x428d8b SAL $0x3,%RBX |
(369) 0x428d8f MOV %R12,%RDI |
(369) 0x428d92 XOR %ESI,%ESI |
(369) 0x428d94 MOV %RBX,%RDX |
(369) 0x428d97 MOV %R11,%R14 |
(369) 0x428d9a MOV %R8,0x10(%RSP) |
(369) 0x428d9f VZEROUPPER |
(369) 0x428da2 CALL 53c6d0 <__intel_avx_rep_memset> |
(369) 0x428da7 MOV %R13,%RDI |
(369) 0x428daa XOR %ESI,%ESI |
(369) 0x428dac MOV %RBX,%RDX |
(369) 0x428daf CALL 53c6d0 <__intel_avx_rep_memset> |
(369) 0x428db4 MOV %R15,%RDI |
(369) 0x428db7 XOR %ESI,%ESI |
(369) 0x428db9 MOV %RBX,%RDX |
(369) 0x428dbc CALL 53c6d0 <__intel_avx_rep_memset> |
(369) 0x428dc1 MOV 0x10(%RSP),%R8 |
(369) 0x428dc6 MOV %R14,%R11 |
(369) 0x428dc9 MOV 0x30(%RSP),%RSI |
(369) 0x428dce MOV 0x18(%RSP),%RDI |
(369) 0x428dd3 MOV 0x28(%RSP),%RCX |
(369) 0x428dd8 TEST %RCX,%RCX |
(369) 0x428ddb JE 428ec0 |
(369) 0x428de1 MOV 0x50(%RSP),%RAX |
(369) 0x428de6 MOV 0x18(%RAX),%RAX |
(369) 0x428dea IMUL (%RAX,%RSI,4),%ECX |
(369) 0x428dee MOV %R12,0x10(%RSP) |
(369) 0x428df3 MOVSXD %ECX,%R12 |
(369) 0x428df6 SAL $0x3,%R12 |
(369) 0x428dfa MOV $0x1,%EBX |
(369) 0x428dff NOP |
(383) 0x428e00 MOV 0x200(%RDI),%RAX |
(383) 0x428e07 ADD %R12,%RAX |
(383) 0x428e0a MOV -0x8(%RAX,%RBX,8),%RDI |
(383) 0x428e0f MOV 0x50(%RSP),%RAX |
(383) 0x428e14 MOV 0x268(%RAX),%RAX |
(383) 0x428e1b MOV 0x18(%RAX),%RAX |
(383) 0x428e1f MOV -0x4(%RAX,%RBX,4),%EDX |
(383) 0x428e23 MOVSXD (%RAX,%RBX,4),%RAX |
(383) 0x428e27 CMP %RAX,%RSI |
(383) 0x428e2a MOV %ESI,%ECX |
(383) 0x428e2c CMOVG %EAX,%ECX |
(383) 0x428e2f MOV %R8,%R14 |
(383) 0x428e32 MOV 0x10(%RSP),%R9 |
(383) 0x428e37 MOV 0x18(%RSP),%RAX |
(383) 0x428e3c PUSHQ 0x1e8(%RAX) |
(383) 0x428e42 PUSHQ 0x1d0(%RAX) |
(383) 0x428e48 PUSH %R15 |
(383) 0x428e4a PUSH %R13 |
(383) 0x428e4c VZEROUPPER |
(383) 0x428e4f CALL 424fc0 <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi> |
(383) 0x428e54 MOV %R14,%R8 |
(383) 0x428e57 MOV 0x50(%RSP),%RSI |
(383) 0x428e5c MOV 0x38(%RSP),%RDI |
(383) 0x428e61 ADD $0x20,%RSP |
(383) 0x428e65 MOV %EBX,%EAX |
(383) 0x428e67 MOV 0xa0(%RDI),%RCX |
(383) 0x428e6e INC %RBX |
(383) 0x428e71 CMP %RAX,%RCX |
(383) 0x428e74 JA 428e00 |
(369) 0x428e76 MOV 0x140(%RDI),%R12 |
(369) 0x428e7d MOV %RCX,0x70(%RSP) |
(369) 0x428e82 MOV %RCX,0x28(%RSP) |
(369) 0x428e87 MOV 0x20(%RSP),%R11 |
(369) 0x428e8c VMOVSD 0x1167d2(%RIP),%XMM16 |
(369) 0x428e96 VBROADCASTSD 0x1167c8(%RIP),%YMM17 |
(369) 0x428ea0 VBROADCASTSD 0x115686(%RIP),%YMM18 |
(369) 0x428eaa VMOVSD 0x11567c(%RIP),%XMM19 |
(369) 0x428eb4 JMP 428ec9 |
0x428eb6 NOPW %CS:(%RAX,%RAX,1) |
(369) 0x428ec0 MOVQ $0,0x28(%RSP) |
(369) 0x428ec9 VXORPD %XMM0,%XMM0,%XMM0 |
(369) 0x428ecd VXORPD %XMM1,%XMM1,%XMM1 |
(369) 0x428ed1 MOV $0x1fffffffffffffff,%RAX |
(369) 0x428edb TEST %RAX,%RSI |
(369) 0x428ede JE 428f5e |
(369) 0x428ee0 LEA (%RSI,%RAX,1),%RCX |
(369) 0x428ee4 AND %RAX,%RCX |
(369) 0x428ee7 INC %RCX |
(369) 0x428eea MOV %RCX,%RAX |
(369) 0x428eed MOV $0x3ffffffffffffffc,%RDX |
(369) 0x428ef7 AND %RDX,%RAX |
(369) 0x428efa JE 428f40 |
(369) 0x428efc VXORPD %XMM1,%XMM1,%XMM1 |
(369) 0x428f00 XOR %EDX,%EDX |
(369) 0x428f02 NOPW %CS:(%RAX,%RAX,1) |
(382) 0x428f10 VADDPD (%R12,%RDX,8),%YMM1,%YMM1 |
(382) 0x428f16 ADD $0x4,%RDX |
(382) 0x428f1a CMP %RAX,%RDX |
(382) 0x428f1d JB 428f10 |
(369) 0x428f1f VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(369) 0x428f25 VADDPD %XMM2,%XMM1,%XMM1 |
(369) 0x428f29 VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(369) 0x428f2e VADDSD %XMM2,%XMM1,%XMM1 |
(369) 0x428f32 CMP %RAX,%RCX |
(369) 0x428f35 JNE 428f42 |
(369) 0x428f37 JMP 428f5e |
0x428f39 NOPL (%RAX) |
(369) 0x428f40 XOR %EAX,%EAX |
(369) 0x428f42 MOV $0x3d,%CL |
(369) 0x428f44 BZHI %RCX,0x58(%RSP),%RCX |
(369) 0x428f4b INC %RCX |
(369) 0x428f4e XCHG %AX,%AX |
(381) 0x428f50 VADDSD (%R12,%RAX,8),%XMM1,%XMM1 |
(381) 0x428f56 INC %RAX |
(381) 0x428f59 CMP %RAX,%RCX |
(381) 0x428f5c JNE 428f50 |
(369) 0x428f5e MOV 0xd8(%RDI),%RDX |
(369) 0x428f65 VMOVSD %XMM1,(%RDX,%RSI,8) |
(369) 0x428f6a MOV 0x158(%RDI),%R13 |
(369) 0x428f71 MOV 0x170(%RDI),%R15 |
(369) 0x428f78 MOV 0x60(%R11),%RAX |
(369) 0x428f7c TEST %RSI,%RSI |
(369) 0x428f7f JLE 429026 |
(369) 0x428f85 MOV %RSI,%RCX |
(369) 0x428f88 AND $-0x4,%RCX |
(369) 0x428f8c JE 429000 |
(369) 0x428f8e LEA -0x1(%RCX),%R9 |
(369) 0x428f92 VXORPD %XMM0,%XMM0,%XMM0 |
(369) 0x428f96 XOR %R8D,%R8D |
(369) 0x428f99 NOPL (%RAX) |
(380) 0x428fa0 VADDPD (%R15,%R8,8),%YMM0,%YMM0 |
(380) 0x428fa6 VFMADD231PD (%R13,%R8,8),%YMM17,%YMM0 |
(380) 0x428fae ADD $0x4,%R8 |
(380) 0x428fb2 CMP %R9,%R8 |
(380) 0x428fb5 JLE 428fa0 |
(369) 0x428fb7 VEXTRACTF128 $0x1,%YMM0,%XMM1 |
(369) 0x428fbd VADDPD %XMM1,%XMM0,%XMM0 |
(369) 0x428fc1 VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(369) 0x428fc6 VADDSD %XMM1,%XMM0,%XMM0 |
(369) 0x428fca JMP 429021 |
0x428fcc NOPW %CS:(%RAX,%RAX,1) |
0x428fdb NOPW %CS:(%RAX,%RAX,1) |
0x428fea NOPW %CS:(%RAX,%RAX,1) |
0x428ff9 NOPL (%RAX) |
(369) 0x429000 VXORPD %XMM0,%XMM0,%XMM0 |
(369) 0x429004 XOR %ECX,%ECX |
(369) 0x429006 NOPW %CS:(%RAX,%RAX,1) |
(379) 0x429010 VADDSD (%R15,%RCX,8),%XMM0,%XMM0 |
(379) 0x429016 VFMADD231SD (%R13,%RCX,8),%XMM16,%XMM0 |
(379) 0x42901e INC %RCX |
(379) 0x429021 CMP %RCX,%RSI |
(379) 0x429024 JNE 429010 |
(369) 0x429026 MOV 0x38(%RSP),%RCX |
(369) 0x42902b MOV 0x8(%RAX,%RCX,8),%RBX |
(369) 0x429030 MOV 0x18(%RAX,%RCX,8),%RAX |
(369) 0x429035 VXORPD %XMM2,%XMM2,%XMM2 |
(369) 0x429039 VXORPD %XMM1,%XMM1,%XMM1 |
(369) 0x42903d TEST %RSI,%RSI |
(369) 0x429040 JLE 4290e5 |
(369) 0x429046 MOV %RSI,%R9 |
(369) 0x429049 AND $-0x4,%R9 |
(369) 0x42904d JE 4290c0 |
(369) 0x42904f LEA -0x1(%R9),%RCX |
(369) 0x429053 VXORPD %XMM1,%XMM1,%XMM1 |
(369) 0x429057 XOR %R8D,%R8D |
(369) 0x42905a NOPW (%RAX,%RAX,1) |
(378) 0x429060 VMOVUPD (%RAX,%R8,8),%YMM3 |
(378) 0x429066 VFMADD231PD (%R13,%R8,8),%YMM3,%YMM1 |
(378) 0x42906d ADD $0x4,%R8 |
(378) 0x429071 CMP %RCX,%R8 |
(378) 0x429074 JLE 429060 |
(369) 0x429076 VEXTRACTF128 $0x1,%YMM1,%XMM3 |
(369) 0x42907c VADDPD %XMM3,%XMM1,%XMM1 |
(369) 0x429080 VSHUFPD $0x1,%XMM1,%XMM1,%XMM3 |
(369) 0x429085 VADDSD %XMM3,%XMM1,%XMM1 |
(369) 0x429089 JMP 4290e0 |
0x42908b NOPW %CS:(%RAX,%RAX,1) |
0x42909a NOPW %CS:(%RAX,%RAX,1) |
0x4290a9 NOPW %CS:(%RAX,%RAX,1) |
0x4290b8 NOPL (%RAX,%RAX,1) |
(369) 0x4290c0 XOR %R9D,%R9D |
(369) 0x4290c3 NOPW %CS:(%RAX,%RAX,1) |
(377) 0x4290d0 VMOVSD (%RAX,%R9,8),%XMM3 |
(377) 0x4290d6 VFMADD231SD (%R13,%R9,8),%XMM3,%XMM1 |
(377) 0x4290dd INC %R9 |
(377) 0x4290e0 CMP %R9,%RSI |
(377) 0x4290e3 JNE 4290d0 |
(369) 0x4290e5 TEST %RSI,%RSI |
(369) 0x4290e8 JLE 429165 |
(369) 0x4290ea MOV %RSI,%R10 |
(369) 0x4290ed AND $-0x4,%R10 |
(369) 0x4290f1 JE 429140 |
(369) 0x4290f3 LEA -0x1(%R10),%RCX |
(369) 0x4290f7 LEA (%RAX,%RBX,8),%R9 |
(369) 0x4290fb VXORPD %XMM2,%XMM2,%XMM2 |
(369) 0x4290ff XOR %R8D,%R8D |
(369) 0x429102 NOPW %CS:(%RAX,%RAX,1) |
(376) 0x429110 VMOVUPD (%R9,%R8,8),%YMM3 |
(376) 0x429116 VFMADD231PD (%R13,%R8,8),%YMM3,%YMM2 |
(376) 0x42911d ADD $0x4,%R8 |
(376) 0x429121 CMP %RCX,%R8 |
(376) 0x429124 JLE 429110 |
(369) 0x429126 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(369) 0x42912c VADDPD %XMM3,%XMM2,%XMM2 |
(369) 0x429130 VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(369) 0x429135 VADDSD %XMM3,%XMM2,%XMM2 |
(369) 0x429139 CMP %R10,%RSI |
(369) 0x42913c JNE 429147 |
(369) 0x42913e JMP 429165 |
(369) 0x429140 VXORPD %XMM2,%XMM2,%XMM2 |
(369) 0x429144 XOR %R10D,%R10D |
(369) 0x429147 LEA (%RAX,%RBX,8),%RCX |
(369) 0x42914b NOPL (%RAX,%RAX,1) |
(375) 0x429150 VMOVSD (%RCX,%R10,8),%XMM3 |
(375) 0x429156 VFMADD231SD (%R13,%R10,8),%XMM3,%XMM2 |
(375) 0x42915d INC %R10 |
(375) 0x429160 CMP %R10,%RSI |
(375) 0x429163 JNE 429150 |
(369) 0x429165 TEST %RSI,%RSI |
(369) 0x429168 JLE 4291c0 |
(369) 0x42916a MOV %RSI,%R10 |
(369) 0x42916d AND $-0x4,%R10 |
(369) 0x429171 JE 429200 |
(369) 0x429177 LEA -0x1(%R10),%RCX |
(369) 0x42917b MOV %RBX,%R9 |
(369) 0x42917e SAL $0x4,%R9 |
(369) 0x429182 ADD %RAX,%R9 |
(369) 0x429185 VXORPD %XMM3,%XMM3,%XMM3 |
(369) 0x429189 XOR %R8D,%R8D |
(369) 0x42918c NOPL (%RAX) |
(374) 0x429190 VMOVUPD (%R9,%R8,8),%YMM4 |
(374) 0x429196 VFMADD231PD (%R13,%R8,8),%YMM4,%YMM3 |
(374) 0x42919d ADD $0x4,%R8 |
(374) 0x4291a1 CMP %RCX,%R8 |
(374) 0x4291a4 JLE 429190 |
(369) 0x4291a6 VEXTRACTF128 $0x1,%YMM3,%XMM4 |
(369) 0x4291ac VADDPD %XMM4,%XMM3,%XMM3 |
(369) 0x4291b0 VSHUFPD $0x1,%XMM3,%XMM3,%XMM4 |
(369) 0x4291b5 VADDSD %XMM4,%XMM3,%XMM3 |
(369) 0x4291b9 CMP %R10,%RSI |
(369) 0x4291bc JNE 429207 |
(369) 0x4291be JMP 429235 |
(369) 0x4291c0 VXORPD %XMM3,%XMM3,%XMM3 |
(369) 0x4291c4 JMP 429235 |
0x4291c6 NOPW %CS:(%RAX,%RAX,1) |
0x4291d5 NOPW %CS:(%RAX,%RAX,1) |
0x4291e4 NOPW %CS:(%RAX,%RAX,1) |
0x4291f3 NOPW %CS:(%RAX,%RAX,1) |
(369) 0x429200 VXORPD %XMM3,%XMM3,%XMM3 |
(369) 0x429204 XOR %R10D,%R10D |
(369) 0x429207 MOV %RBX,%RCX |
(369) 0x42920a SAL $0x4,%RCX |
(369) 0x42920e ADD %RAX,%RCX |
(369) 0x429211 NOPW %CS:(%RAX,%RAX,1) |
(373) 0x429220 VMOVSD (%RCX,%R10,8),%XMM4 |
(373) 0x429226 VFMADD231SD (%R13,%R10,8),%XMM4,%XMM3 |
(373) 0x42922d INC %R10 |
(373) 0x429230 CMP %R10,%RSI |
(373) 0x429233 JNE 429220 |
(369) 0x429235 VPUNPCKLQDQ %XMM2,%XMM1,%XMM1 |
(369) 0x429239 MOV 0xf0(%RDI),%R9 |
(369) 0x429240 MOV 0x100(%RDI),%R8 |
(369) 0x429247 VMOVLPD %XMM1,(%R8,%RSI,8) |
(369) 0x42924d LEA (%RSI,%R9,1),%RCX |
(369) 0x429251 VMOVHPD %XMM1,(%R8,%RCX,8) |
(369) 0x429257 MOV %R9,0x60(%RSP) |
(369) 0x42925c LEA (%RSI,%R9,2),%RCX |
(369) 0x429260 MOV %R8,0x38(%RSP) |
(369) 0x429265 VMOVSD %XMM3,(%R8,%RCX,8) |
(369) 0x42926b VXORPD 0x11528b(%RIP){1to2},%XMM0,%XMM0 |
(369) 0x429275 MOV 0x128(%RDI),%R8 |
(369) 0x42927c VMOVLPD %XMM0,(%R8,%RSI,8) |
(369) 0x429282 TEST %RSI,%RSI |
(369) 0x429285 JLE 42945c |
(369) 0x42928b MOV %RBX,0x40(%RSP) |
(369) 0x429290 LEA -0x1(%RSI),%R9 |
(369) 0x429294 LEA (%RDX,%R9,8),%R11 |
(369) 0x429298 CMP %R8,%R11 |
(369) 0x42929b SETAEB 0xf(%RSP) |
(369) 0x4292a0 LEA (%R8,%R9,8),%RCX |
(369) 0x4292a4 CMP %RDX,%RCX |
(369) 0x4292a7 SETAE %DIL |
(369) 0x4292ab CMP %R12,%R11 |
(369) 0x4292ae MOV %R13,%R14 |
(369) 0x4292b1 MOV %R15,%R13 |
(369) 0x4292b4 SETB %R15B |
(369) 0x4292b8 LEA (%R12,%R9,8),%R10 |
(369) 0x4292bc CMP %RDX,%R10 |
(369) 0x4292bf SETB %SIL |
(369) 0x4292c3 CMP %R8,%R10 |
(369) 0x4292c6 MOV %R12,%R10 |
(369) 0x4292c9 SETB %R12B |
(369) 0x4292cd MOV %R10,0x10(%RSP) |
(369) 0x4292d2 CMP %R10,%RCX |
(369) 0x4292d5 SETBB 0xe(%RSP) |
(369) 0x4292da CMP %R14,%R11 |
(369) 0x4292dd SETB %R10B |
(369) 0x4292e1 LEA (%R14,%R9,8),%RBX |
(369) 0x4292e5 CMP %RDX,%RBX |
(369) 0x4292e8 SETBB 0xd(%RSP) |
(369) 0x4292ed CMP %R13,%R11 |
(369) 0x4292f0 SETB %R11B |
(369) 0x4292f4 LEA (%R13,%R9,8),%R9 |
(369) 0x4292f9 CMP %RDX,%R9 |
(369) 0x4292fc SETBB 0xc(%RSP) |
(369) 0x429301 CMP %R8,%RBX |
(369) 0x429304 SETB %BL |
(369) 0x429307 MOV %R14,0x48(%RSP) |
(369) 0x42930c CMP %R14,%RCX |
(369) 0x42930f SETBB 0xb(%RSP) |
(369) 0x429314 CMP %R8,%R9 |
(369) 0x429317 SETB %R9B |
(369) 0x42931b MOV %R13,%R14 |
(369) 0x42931e CMP %R13,%RCX |
(369) 0x429321 SETB %CL |
(369) 0x429324 TEST %DIL,0xf(%RSP) |
(369) 0x429329 JNE 429400 |
(369) 0x42932f OR %SIL,%R15B |
(369) 0x429332 JE 429400 |
(369) 0x429338 OR 0xe(%RSP),%R12B |
(369) 0x42933d JE 429400 |
(369) 0x429343 OR 0xd(%RSP),%R10B |
(369) 0x429348 JE 429400 |
(369) 0x42934e OR 0xc(%RSP),%R11B |
(369) 0x429353 JE 429400 |
(369) 0x429359 OR 0xb(%RSP),%BL |
(369) 0x42935d JE 429400 |
(369) 0x429363 OR %CL,%R9B |
(369) 0x429366 JE 429400 |
(369) 0x42936c MOV 0x30(%RSP),%RSI |
(369) 0x429371 MOV %RSI,%R9 |
(369) 0x429374 AND $-0x4,%R9 |
(369) 0x429378 JE 429640 |
(369) 0x42937e LEA -0x1(%R9),%RCX |
(369) 0x429382 XOR %EDI,%EDI |
(369) 0x429384 MOV 0x10(%RSP),%R12 |
(369) 0x429389 MOV %R14,%R15 |
(369) 0x42938c MOV 0x48(%RSP),%R13 |
(369) 0x429391 MOV 0x40(%RSP),%RBX |
(369) 0x429396 NOPW %CS:(%RAX,%RAX,1) |
(372) 0x4293a0 VMOVUPD (%RDX,%RDI,8),%YMM0 |
(372) 0x4293a5 VADDPD (%R12,%RDI,8),%YMM0,%YMM0 |
(372) 0x4293ab VMOVUPD %YMM0,(%RDX,%RDI,8) |
(372) 0x4293b0 VMOVUPD (%R13,%RDI,8),%YMM0 |
(372) 0x4293b7 VFMSUB213PD (%R15,%RDI,8),%YMM18,%YMM0 |
(372) 0x4293be VADDPD (%R8,%RDI,8),%YMM0,%YMM0 |
(372) 0x4293c4 VMOVUPD %YMM0,(%R8,%RDI,8) |
(372) 0x4293ca ADD $0x4,%RDI |
(372) 0x4293ce CMP %RCX,%RDI |
(372) 0x4293d1 JLE 4293a0 |
(369) 0x4293d3 CMP %R9,%RSI |
(369) 0x4293d6 MOV 0x20(%RSP),%R11 |
(369) 0x4293db JE 42945c |
(369) 0x4293e1 JMP 42965a |
0x4293e6 NOPW %CS:(%RAX,%RAX,1) |
0x4293f5 NOPW %CS:(%RAX,%RAX,1) |
(369) 0x429400 XOR %ECX,%ECX |
(369) 0x429402 MOV 0x30(%RSP),%RSI |
(369) 0x429407 MOV 0x10(%RSP),%R12 |
(369) 0x42940c MOV %R14,%R15 |
(369) 0x42940f MOV 0x48(%RSP),%R13 |
(369) 0x429414 NOPW %CS:(%RAX,%RAX,1) |
(371) 0x429420 VMOVSD (%RDX,%RCX,8),%XMM0 |
(371) 0x429425 VADDSD (%R12,%RCX,8),%XMM0,%XMM0 |
(371) 0x42942b VMOVSD %XMM0,(%RDX,%RCX,8) |
(371) 0x429430 VMOVSD (%R13,%RCX,8),%XMM0 |
(371) 0x429437 VFMSUB213SD (%R15,%RCX,8),%XMM19,%XMM0 |
(371) 0x42943e VADDSD (%R8,%RCX,8),%XMM0,%XMM0 |
(371) 0x429444 VMOVSD %XMM0,(%R8,%RCX,8) |
(371) 0x42944a INC %RCX |
(371) 0x42944d CMP %RCX,%RSI |
(371) 0x429450 JNE 429420 |
(369) 0x429452 MOV 0x20(%RSP),%R11 |
(369) 0x429457 MOV 0x40(%RSP),%RBX |
(369) 0x42945c TEST %RSI,%RSI |
(369) 0x42945f JLE 428d40 |
(369) 0x429465 MOV %R15,0x10(%RSP) |
(369) 0x42946a MOV %R12,%RDI |
(369) 0x42946d MOV 0x90(%RSP),%RCX |
(369) 0x429475 ADD 0x68(%RSP),%RCX |
(369) 0x42947a JNE 4294c0 |
(369) 0x42947c MOV %RBX,%R14 |
(369) 0x42947f XOR %EDX,%EDX |
(369) 0x429481 JMP 42958e |
0x429486 NOPW %CS:(%RAX,%RAX,1) |
0x429495 NOPW %CS:(%RAX,%RAX,1) |
0x4294a4 NOPW %CS:(%RAX,%RAX,1) |
0x4294b3 NOPW %CS:(%RAX,%RAX,1) |
(369) 0x4294c0 MOV %RSI,%R8 |
(369) 0x4294c3 AND $-0x2,%R8 |
(369) 0x4294c7 LEA 0x8(%RAX),%R9 |
(369) 0x4294cb MOV 0x38(%RSP),%RDX |
(369) 0x4294d0 LEA 0x8(%RDX),%R10 |
(369) 0x4294d4 LEA 0x8(%RAX,%RBX,8),%R11 |
(369) 0x4294d9 MOV 0x60(%RSP),%RSI |
(369) 0x4294de LEA 0x8(%RDX,%RSI,8),%R15 |
(369) 0x4294e3 MOV %RBX,%R14 |
(369) 0x4294e6 MOV %RBX,%RCX |
(369) 0x4294e9 SAL $0x4,%RCX |
(369) 0x4294ed LEA 0x8(%RAX,%RCX,1),%R12 |
(369) 0x4294f2 MOV %RSI,%RCX |
(369) 0x4294f5 SAL $0x4,%RCX |
(369) 0x4294f9 LEA 0x8(%RDX,%RCX,1),%RBX |
(369) 0x4294fe XOR %EDX,%EDX |
(370) 0x429500 VMOVSD (%R13,%RDX,8),%XMM0 |
(370) 0x429507 VMOVSD -0x8(%R9,%RDX,8),%XMM1 |
(370) 0x42950e VFNMADD213SD -0x8(%R10,%RDX,8),%XMM0,%XMM1 |
(370) 0x429515 VMOVSD %XMM1,-0x8(%R10,%RDX,8) |
(370) 0x42951c VMOVSD -0x8(%R11,%RDX,8),%XMM1 |
(370) 0x429523 VFNMADD213SD -0x8(%R15,%RDX,8),%XMM0,%XMM1 |
(370) 0x42952a VMOVSD %XMM1,-0x8(%R15,%RDX,8) |
(370) 0x429531 VMOVSD -0x8(%R12,%RDX,8),%XMM1 |
(370) 0x429538 VFNMADD213SD -0x8(%RBX,%RDX,8),%XMM0,%XMM1 |
(370) 0x42953f VMOVSD %XMM1,-0x8(%RBX,%RDX,8) |
(370) 0x429545 VMOVSD 0x8(%R13,%RDX,8),%XMM0 |
(370) 0x42954c VMOVSD (%R9,%RDX,8),%XMM1 |
(370) 0x429552 VFNMADD213SD (%R10,%RDX,8),%XMM0,%XMM1 |
(370) 0x429558 VMOVSD %XMM1,(%R10,%RDX,8) |
(370) 0x42955e VMOVSD (%R11,%RDX,8),%XMM1 |
(370) 0x429564 VFNMADD213SD (%R15,%RDX,8),%XMM0,%XMM1 |
(370) 0x42956a VMOVSD %XMM1,(%R15,%RDX,8) |
(370) 0x429570 VMOVSD (%R12,%RDX,8),%XMM1 |
(370) 0x429576 VFNMADD213SD (%RBX,%RDX,8),%XMM0,%XMM1 |
(370) 0x42957c VMOVSD %XMM1,(%RBX,%RDX,8) |
(370) 0x429581 ADD $0x2,%RDX |
(370) 0x429585 CMP %RDX,%R8 |
(370) 0x429588 JNE 429500 |
(369) 0x42958e MOV 0x30(%RSP),%RSI |
(369) 0x429593 TEST $0x1,%SIL |
(369) 0x429597 MOV %RDI,%R12 |
(369) 0x42959a MOV 0x10(%RSP),%R15 |
(369) 0x42959f MOV 0x20(%RSP),%R11 |
(369) 0x4295a4 JE 428d40 |
(369) 0x4295aa VMOVSD (%R13,%RDX,8),%XMM0 |
(369) 0x4295b1 VMOVSD (%RAX,%RDX,8),%XMM1 |
(369) 0x4295b6 MOV 0x38(%RSP),%R8 |
(369) 0x4295bb VFNMADD213SD (%R8,%RDX,8),%XMM0,%XMM1 |
(369) 0x4295c1 VMOVSD %XMM1,(%R8,%RDX,8) |
(369) 0x4295c7 LEA (%R14,%R14,1),%RCX |
(369) 0x4295cb ADD %RDX,%R14 |
(369) 0x4295ce VMOVSD (%RAX,%R14,8),%XMM1 |
(369) 0x4295d4 MOV 0x60(%RSP),%R9 |
(369) 0x4295d9 LEA (%R9,%R9,1),%RDI |
(369) 0x4295dd ADD %RDX,%R9 |
(369) 0x4295e0 VFNMADD213SD (%R8,%R9,8),%XMM0,%XMM1 |
(369) 0x4295e6 VMOVSD %XMM1,(%R8,%R9,8) |
(369) 0x4295ec ADD %RDX,%RCX |
(369) 0x4295ef VMOVSD (%RAX,%RCX,8),%XMM1 |
(369) 0x4295f4 ADD %RDX,%RDI |
(369) 0x4295f7 VFNMADD213SD (%R8,%RDI,8),%XMM0,%XMM1 |
(369) 0x4295fd VMOVSD %XMM1,(%R8,%RDI,8) |
(369) 0x429603 JMP 428d40 |
0x429608 NOPW %CS:(%RAX,%RAX,1) |
0x429617 NOPW %CS:(%RAX,%RAX,1) |
0x429626 NOPW %CS:(%RAX,%RAX,1) |
0x429635 NOPW %CS:(%RAX,%RAX,1) |
(369) 0x429640 XOR %R9D,%R9D |
(369) 0x429643 MOV 0x10(%RSP),%R12 |
(369) 0x429648 MOV 0x20(%RSP),%R11 |
(369) 0x42964d MOV %R14,%R15 |
(369) 0x429650 MOV 0x48(%RSP),%R13 |
(369) 0x429655 MOV 0x40(%RSP),%RBX |
(369) 0x42965a MOV %RSI,%RCX |
(369) 0x42965d SUB %R9,%RCX |
(369) 0x429660 VPBROADCASTQ %RCX,%YMM0 |
(369) 0x429666 VPCMPNLEUQ 0x11612f(%RIP),%YMM0,%K1 |
(369) 0x429671 VMOVUPD (%RDX,%R9,8),%YMM0{%K1}{z} |
(369) 0x429678 VMOVUPD 0xa0(%RSP),%YMM2 |
(369) 0x429681 VMOVAPD %YMM0,%YMM2{%K1} |
(369) 0x429687 VMOVUPD (%R12,%R9,8),%YMM0{%K1}{z} |
(369) 0x42968e VMOVUPD 0xc0(%RSP),%YMM1 |
(369) 0x429697 VMOVAPD %YMM0,%YMM1{%K1} |
(369) 0x42969d VMOVUPD %YMM1,0xc0(%RSP) |
(369) 0x4296a6 VMOVUPD %YMM2,0xa0(%RSP) |
(369) 0x4296af VADDPD %YMM1,%YMM2,%YMM0 |
(369) 0x4296b3 VMOVUPD %YMM0,(%RDX,%R9,8){%K1} |
(369) 0x4296ba VMOVUPD (%R13,%R9,8),%YMM0{%K1}{z} |
(369) 0x4296c2 VMOVUPD 0xe0(%RSP),%YMM2 |
(369) 0x4296cb VMOVAPD %YMM0,%YMM2{%K1} |
(369) 0x4296d1 VMOVUPD (%R15,%R9,8),%YMM0{%K1}{z} |
(369) 0x4296d8 VMOVUPD 0x100(%RSP),%YMM1 |
(369) 0x4296e1 VMOVAPD %YMM0,%YMM1{%K1} |
(369) 0x4296e7 VMOVUPD %YMM1,0x100(%RSP) |
(369) 0x4296f0 VMOVAPD %YMM1,%YMM0 |
(369) 0x4296f4 VMOVUPD %YMM2,0xe0(%RSP) |
(369) 0x4296fd VFMSUB231PD %YMM18,%YMM2,%YMM0 |
(369) 0x429703 VMOVUPD (%R8,%R9,8),%YMM1{%K1}{z} |
(369) 0x42970a VMOVUPD 0x120(%RSP),%YMM2 |
(369) 0x429713 VMOVAPD %YMM1,%YMM2{%K1} |
(369) 0x429719 VMOVUPD %YMM2,0x120(%RSP) |
(369) 0x429722 VADDPD %YMM0,%YMM2,%YMM0 |
(369) 0x429726 VMOVUPD %YMM0,(%R8,%R9,8){%K1} |
(369) 0x42972d TEST %RSI,%RSI |
(369) 0x429730 JG 429465 |
(369) 0x429736 JMP 428d40 |
0x42973b NOPL (%RAX,%RAX,1) |
0x429740 MOVQ $0,0x10(%RDI) |
0x429748 MOV 0x90(%RDI),%R10 |
0x42974f TEST %R10,%R10 |
0x429752 JE 4297c0 |
0x429754 MOV %RDI,%RAX |
0x429757 MOV 0xd8(%RDI),%R9 |
0x42975e MOV 0x100(%RDI),%RDX |
0x429765 MOVSXD 0xf0(%RDI),%RDI |
0x42976c MOV 0x78(%RSP),%RCX |
0x429771 MOV 0x18(%RCX),%RSI |
0x429775 MOV 0x128(%RAX),%RAX |
0x42977c MOV 0x80(%RSP),%RCX |
0x429784 MOV 0x18(%RCX),%RCX |
0x429788 LEA (%RDI,%RDI,1),%R8 |
0x42978c CMP $0x1,%R10 |
0x429790 JNE 429800 |
0x429792 VXORPD %XMM0,%XMM0,%XMM0 |
0x429796 XOR %R11D,%R11D |
0x429799 JMP 4298ea |
0x42979e NOPW %CS:(%RAX,%RAX,1) |
0x4297ad NOPW %CS:(%RAX,%RAX,1) |
0x4297bc NOPL (%RAX) |
0x4297c0 VMOVSD 0x114d38(%RIP),%XMM0 |
0x4297c8 JMP 42995b |
0x4297cd NOPW %CS:(%RAX,%RAX,1) |
0x4297dc NOPW %CS:(%RAX,%RAX,1) |
0x4297eb NOPW %CS:(%RAX,%RAX,1) |
0x4297fa NOPW (%RAX,%RAX,1) |
0x429800 MOV %R10,%RBX |
0x429803 AND $-0x2,%RBX |
0x429807 LEA 0x8(%RDX,%RDI,8),%R14 |
0x42980c LEA 0x8(%RDX,%R8,8),%R15 |
0x429811 LEA 0x28(%RSI),%R12 |
0x429815 VXORPD %XMM0,%XMM0,%XMM0 |
0x429819 XOR %R11D,%R11D |
0x42981c MOV 0x18(%RSP),%R13 |
0x429821 NOPW %CS:(%RAX,%RAX,1) |
(367) 0x429830 VADDSD (%R9,%R11,8),%XMM0,%XMM0 |
(367) 0x429836 VMOVSD %XMM0,0x10(%R13) |
(367) 0x42983c VMOVSD (%RDX,%R11,8),%XMM0 |
(367) 0x429842 VMOVHPD -0x8(%R14,%R11,8),%XMM0,%XMM0 |
(367) 0x429849 VADDPD -0x28(%R12),%XMM0,%XMM0 |
(367) 0x429850 VMOVSD -0x18(%R12),%XMM1 |
(367) 0x429857 VADDSD -0x8(%R15,%R11,8),%XMM1,%XMM1 |
(367) 0x42985e VMOVUPD %XMM0,-0x28(%R12) |
(367) 0x429865 VMOVSD %XMM1,-0x18(%R12) |
(367) 0x42986c VMOVSD (%RCX,%R11,8),%XMM0 |
(367) 0x429872 VADDSD (%RAX,%R11,8),%XMM0,%XMM0 |
(367) 0x429878 VMOVSD %XMM0,(%RCX,%R11,8) |
(367) 0x42987e VMOVSD 0x8(%R9,%R11,8),%XMM0 |
(367) 0x429885 VADDSD 0x10(%R13),%XMM0,%XMM0 |
(367) 0x42988b VMOVSD %XMM0,0x10(%R13) |
(367) 0x429891 VMOVSD 0x8(%RDX,%R11,8),%XMM0 |
(367) 0x429898 VMOVHPD (%R14,%R11,8),%XMM0,%XMM0 |
(367) 0x42989e VADDPD -0x10(%R12),%XMM0,%XMM0 |
(367) 0x4298a5 VMOVSD (%R12),%XMM1 |
(367) 0x4298ab VADDSD (%R15,%R11,8),%XMM1,%XMM1 |
(367) 0x4298b1 VMOVUPD %XMM0,-0x10(%R12) |
(367) 0x4298b8 VMOVSD %XMM1,(%R12) |
(367) 0x4298be VMOVSD 0x8(%RCX,%R11,8),%XMM0 |
(367) 0x4298c5 VADDSD 0x8(%RAX,%R11,8),%XMM0,%XMM0 |
(367) 0x4298cc VMOVSD %XMM0,0x8(%RCX,%R11,8) |
(367) 0x4298d3 VMOVSD 0x10(%R13),%XMM0 |
(367) 0x4298d9 ADD $0x2,%R11 |
(367) 0x4298dd ADD $0x30,%R12 |
(367) 0x4298e1 CMP %R11,%RBX |
(367) 0x4298e4 JNE 429830 |
0x4298ea TEST $0x1,%R10B |
0x4298ee JE 42994e |
0x4298f0 VADDSD (%R9,%R11,8),%XMM0,%XMM0 |
0x4298f6 MOV 0x18(%RSP),%R10 |
0x4298fb VMOVSD %XMM0,0x10(%R10) |
0x429901 ADD %R11,%RDI |
0x429904 ADD %R11,%R8 |
0x429907 LEA (%R11,%R11,2),%R9 |
0x42990b VMOVSD (%RDX,%R11,8),%XMM0 |
0x429911 VMOVHPD (%RDX,%RDI,8),%XMM0,%XMM0 |
0x429916 VADDPD (%RSI,%R9,8),%XMM0,%XMM0 |
0x42991c VMOVSD 0x10(%RSI,%R9,8),%XMM1 |
0x429923 VADDSD (%RDX,%R8,8),%XMM1,%XMM1 |
0x429929 VMOVUPD %XMM0,(%RSI,%R9,8) |
0x42992f VMOVSD %XMM1,0x10(%RSI,%R9,8) |
0x429936 VMOVSD (%RCX,%R11,8),%XMM0 |
0x42993c VADDSD (%RAX,%R11,8),%XMM0,%XMM0 |
0x429942 VMOVSD %XMM0,(%RCX,%R11,8) |
0x429948 VMOVSD 0x10(%R10),%XMM0 |
0x42994e VMULSD 0x114b9a(%RIP),%XMM0,%XMM0 |
0x429956 MOV 0x18(%RSP),%RDI |
0x42995b VMOVSD %XMM0,0x10(%RDI) |
0x429960 LEA -0x28(%RBP),%RSP |
0x429964 POP %RBX |
0x429965 POP %R12 |
0x429967 POP %R13 |
0x429969 POP %R14 |
0x42996b POP %R15 |
0x42996d POP %RBP |
0x42996e VZEROUPPER |
0x429971 RET |
0x429972 NOPW %CS:(%RAX,%RAX,1) |
0x42997c NOPL (%RAX) |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►99.93+ | miniqmcreference::TwoBodyJastr[...] | TwoBodyJastrowRef.h:411 | exec |
○ | qmcplusplus::WaveFunction::eva[...] | WaveFunction.cpp:175 | exec |
○ | main.extracted.113 | miniqmc.cpp:397 | exec |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Path / |
Source file and lines | TwoBodyJastrowRef.h:268-432 |
Module | exec |
nb instructions | 135 |
nb uops | 137 |
loop length | 959 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 4 |
used ymm registers | 2 |
used zmm registers | 0 |
nb stack references | 7 |
ADD-SUB / MUL ratio | 4.00 |
micro-operation queue | 23.67 cycles |
front end | 23.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 4.90 | 4.90 | 12.33 | 12.33 | 9.50 | 4.70 | 4.70 | 9.50 | 9.50 | 9.50 | 4.80 | 12.33 |
cycles | 4.90 | 4.90 | 12.33 | 12.33 | 9.50 | 4.70 | 4.70 | 9.50 | 9.50 | 9.50 | 4.80 | 12.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 23.52-23.59 |
Stall cycles | 0.00 |
Front-end | 23.67 |
Dispatch | 12.33 |
Overall L1 | 23.67 |
all | 6% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 14% |
all | 18% |
load | 6% |
store | 20% |
mul | 0% |
add-sub | 25% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 50% |
all | 13% |
load | 6% |
store | 8% |
mul | 0% |
add-sub | 25% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 27% |
all | 12% |
load | 12% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 14% |
all | 14% |
load | 13% |
store | 15% |
mul | 12% |
add-sub | 15% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 18% |
all | 14% |
load | 13% |
store | 13% |
mul | 12% |
add-sub | 15% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x160,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %R8B,%R8B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV %RDI,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 429740 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xb80> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RSI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x248(%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 47a850 <_ZNK11qmcplusplus11ParticleSet14getDistTableAAEi> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x18(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa0(%RDI),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R9,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 429740 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xb80> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD 0x116a40(%RIP),%XMM16 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD 0x116a36(%RIP),%YMM17 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0x1158f4(%RIP),%YMM18 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVSD 0x1158ea(%RIP),%XMM19 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 428ca6 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xe6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOVQ $0,0x10(%RDI) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x90(%RDI),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R10,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 4297c0 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xc00> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RDI,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0xd8(%RDI),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x100(%RDI),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVSXD 0xf0(%RDI),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x78(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RCX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x128(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x80(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RCX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RDI,%RDI,1),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP $0x1,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 429800 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xc40> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R11D,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4298ea <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xd2a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD 0x114d38(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 42995b <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xd9b> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R10,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x2,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
LEA 0x8(%RDX,%RDI,8),%R14 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA 0x8(%RDX,%R8,8),%R15 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA 0x28(%RSI),%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R11D,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x18(%RSP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST $0x1,%R10B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 42994e <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xd8e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VADDSD (%R9,%R11,8),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
MOV 0x18(%RSP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD %XMM0,0x10(%R10) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %R11,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %R11,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA (%R11,%R11,2),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD (%RDX,%R11,8),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVHPD (%RDX,%RDI,8),%XMM0,%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4-12 | 1 |
VADDPD (%RSI,%R9,8),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD 0x10(%RSI,%R9,8),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RDX,%R8,8),%XMM1,%XMM1 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVUPD %XMM0,(%RSI,%R9,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD %XMM1,0x10(%RSI,%R9,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD (%RCX,%R11,8),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RAX,%R11,8),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM0,(%RCX,%R11,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD 0x10(%R10),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD 0x114b9a(%RIP),%XMM0,%XMM0 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
MOV 0x18(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD %XMM0,0x10(%RDI) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | TwoBodyJastrowRef.h:268-432 |
Module | exec |
nb instructions | 135 |
nb uops | 137 |
loop length | 959 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 4 |
used ymm registers | 2 |
used zmm registers | 0 |
nb stack references | 7 |
ADD-SUB / MUL ratio | 4.00 |
micro-operation queue | 23.67 cycles |
front end | 23.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 4.90 | 4.90 | 12.33 | 12.33 | 9.50 | 4.70 | 4.70 | 9.50 | 9.50 | 9.50 | 4.80 | 12.33 |
cycles | 4.90 | 4.90 | 12.33 | 12.33 | 9.50 | 4.70 | 4.70 | 9.50 | 9.50 | 9.50 | 4.80 | 12.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 23.52-23.59 |
Stall cycles | 0.00 |
Front-end | 23.67 |
Dispatch | 12.33 |
Overall L1 | 23.67 |
all | 6% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 14% |
all | 18% |
load | 6% |
store | 20% |
mul | 0% |
add-sub | 25% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 50% |
all | 13% |
load | 6% |
store | 8% |
mul | 0% |
add-sub | 25% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 27% |
all | 12% |
load | 12% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 14% |
all | 14% |
load | 13% |
store | 15% |
mul | 12% |
add-sub | 15% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 18% |
all | 14% |
load | 13% |
store | 13% |
mul | 12% |
add-sub | 15% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x160,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %R8B,%R8B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV %RDI,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 429740 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xb80> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RSI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x248(%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 47a850 <_ZNK11qmcplusplus11ParticleSet14getDistTableAAEi> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x18(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa0(%RDI),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R9,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 429740 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xb80> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD 0x116a40(%RIP),%XMM16 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD 0x116a36(%RIP),%YMM17 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0x1158f4(%RIP),%YMM18 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVSD 0x1158ea(%RIP),%XMM19 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 428ca6 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xe6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOVQ $0,0x10(%RDI) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x90(%RDI),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R10,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 4297c0 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xc00> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RDI,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0xd8(%RDI),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x100(%RDI),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVSXD 0xf0(%RDI),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x78(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RCX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x128(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x80(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RCX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RDI,%RDI,1),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP $0x1,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 429800 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xc40> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R11D,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4298ea <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xd2a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD 0x114d38(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 42995b <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xd9b> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R10,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x2,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
LEA 0x8(%RDX,%RDI,8),%R14 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA 0x8(%RDX,%R8,8),%R15 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA 0x28(%RSI),%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R11D,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x18(%RSP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST $0x1,%R10B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 42994e <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xd8e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VADDSD (%R9,%R11,8),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
MOV 0x18(%RSP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD %XMM0,0x10(%R10) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %R11,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %R11,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA (%R11,%R11,2),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD (%RDX,%R11,8),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVHPD (%RDX,%RDI,8),%XMM0,%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4-12 | 1 |
VADDPD (%RSI,%R9,8),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD 0x10(%RSI,%R9,8),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RDX,%R8,8),%XMM1,%XMM1 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVUPD %XMM0,(%RSI,%R9,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD %XMM1,0x10(%RSI,%R9,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD (%RCX,%R11,8),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RAX,%R11,8),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM0,(%RCX,%R11,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD 0x10(%R10),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD 0x114b9a(%RIP),%XMM0,%XMM0 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
MOV 0x18(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD %XMM0,0x10(%RDI) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼miniqmcreference::TwoBodyJastrowRef | 0.17 | 0.14 |
○Loop 367 - TwoBodyJastrowRef.h:423-427 - exec | 0 | 0 |
▼Loop 368 - TwoBodyJastrowRef.h:268-420 - exec– | 0 | 0 |
▼Loop 369 - stl_algobase.h:200-754 - exec– | 0 | 0 |
○Loop 370 - TwoBodyJastrowRef.h:393-398 - exec | 0.05 | 0.04 |
○Loop 376 - TwoBodyJastrowRef.h:381-382 - exec | 0.03 | 0.02 |
○Loop 378 - TwoBodyJastrowRef.h:381-382 - exec | 0.03 | 0.02 |
○Loop 374 - TwoBodyJastrowRef.h:381-382 - exec | 0.03 | 0.02 |
○Loop 380 - TwoBodyJastrowRef.h:375-376 - exec | 0.02 | 0.02 |
○Loop 382 - stl_numeric.h:126-127 - exec | 0.01 | 0 |
○Loop 372 - TwoBodyJastrowRef.h:388-391 - exec | 0.01 | 0.01 |
○Loop 375 - TwoBodyJastrowRef.h:381-382 - exec | 0 | 0 |
○Loop 381 - stl_numeric.h:126-127 - exec | 0 | 0 |
○Loop 371 - TwoBodyJastrowRef.h:388-391 - exec | 0 | 0 |
○Loop 377 - TwoBodyJastrowRef.h:381-382 - exec | 0 | 0 |
○Loop 373 - TwoBodyJastrowRef.h:381-382 - exec | 0 | 0 |
○Loop 383 - TwoBodyJastrowRef.h:269-274 - exec | 0 | 0 |
○Loop 379 - TwoBodyJastrowRef.h:375-376 - exec | 0 | 0 |