Function: _ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLER ... | Module: exec | Source: TwoBodyJastrowRef.h:268-432 [...] | Coverage: 0.12% |
---|
Function: _ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLER ... | Module: exec | Source: TwoBodyJastrowRef.h:268-432 [...] | Coverage: 0.12% |
---|
/home/eoseret/qaas_runs_CPU_9468/171-143-7755/intel/miniqmc/build/miniqmc/src/Particle/DistanceTable.h: 268 - 268 |
-------------------------------------------------------------------------------- |
268: const DistRow& getDistRow(int iel) const { return distances_[iel]; } |
/home/eoseret/qaas_runs_CPU_9468/171-143-7755/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/Jastrow/TwoBodyJastrowRef.h: 268 - 432 |
-------------------------------------------------------------------------------- |
268: const int igt = P.GroupID[iat] * NumGroups; |
269: for (int jg = 0; jg < NumGroups; ++jg) |
270: { |
271: const FuncType& f2(*F[igt + jg]); |
272: int iStart = P.first(jg); |
273: int iEnd = std::min(jelmax, P.last(jg)); |
274: f2.evaluateVGL(iat, iStart, iEnd, dist, u, du, d2u, DistCompressed.data(), DistIndice.data()); |
[...] |
360: const auto& d_table = P.getDistTableAA(myTableID); |
361: for (int ig = 0; ig < NumGroups; ++ig) |
362: { |
363: const int igt = ig * NumGroups; |
364: for (int iat = P.first(ig), last = P.last(ig); iat < last; ++iat) |
365: { |
366: computeU3(P, iat, d_table.getDistRow(iat).data(), cur_u.data(), cur_du.data(), cur_d2u.data(), true); |
367: Uat[iat] = std::accumulate(cur_u.begin(), cur_u.begin() + iat, valT()); |
[...] |
375: for (int jat = 0; jat < iat; ++jat) |
376: lap += d2u[jat] + lapfac * du[jat]; |
377: for (int idim = 0; idim < OHMMS_DIM; ++idim) |
378: { |
379: const valT* restrict dX = displ.data(idim); |
380: valT s = valT(); |
381: for (int jat = 0; jat < iat; ++jat) |
382: s += du[jat] * dX[jat]; |
383: grad[idim] = s; |
384: } |
385: dUat(iat) = grad; |
386: d2Uat[iat] = -lap; |
387: // add the contribution from the upper triangle |
388: for (int jat = 0; jat < iat; jat++) |
389: { |
390: Uat[jat] += u[jat]; |
391: d2Uat[jat] -= d2u[jat] + lapfac * du[jat]; |
[...] |
397: for (int jat = 0; jat < iat; jat++) |
398: save_g[jat] -= du[jat] * dX[jat]; |
[...] |
419: { |
420: if (fromscratch) |
421: recompute(P); |
422: LogValue = valT(0); |
423: for (int iat = 0; iat < N; ++iat) |
424: { |
425: LogValue += Uat[iat]; |
426: G[iat] += dUat[iat]; |
427: L[iat] += d2Uat[iat]; |
428: } |
429: |
430: constexpr valT mhalf(-0.5); |
431: LogValue = mhalf * LogValue; |
432: } |
/home/eoseret/qaas_runs_CPU_9468/171-143-7755/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/TinyVector.h: 145 - 169 |
-------------------------------------------------------------------------------- |
145: X[i] = base[i * offset]; |
[...] |
169: inline Type_t& operator[](unsigned int i) { return X[i]; } |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/stl_numeric.h: 140 - 141 |
-------------------------------------------------------------------------------- |
140: for (; __first != __last; ++__first) |
141: __init = _GLIBCXX_MOVE_IF_20(__init) + *__first; |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/shared_ptr_base.h: 1296 - 1296 |
-------------------------------------------------------------------------------- |
1296: { return _M_ptr; } |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/stl_vector.h: 1064 - 1169 |
-------------------------------------------------------------------------------- |
1064: return *(this->_M_impl._M_start + __n); |
[...] |
1169: { return _M_data_ptr(this->_M_impl._M_start); } |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/stl_algobase.h: 924 - 1115 |
-------------------------------------------------------------------------------- |
924: *__first = __tmp; |
[...] |
1115: if (__n <= 0) |
/home/eoseret/qaas_runs_CPU_9468/171-143-7755/intel/miniqmc/build/miniqmc/src/Particle/ParticleSet.h: 313 - 316 |
-------------------------------------------------------------------------------- |
313: inline int first(int igroup) const { return (*group_offsets_)[igroup]; } |
314: |
315: ///return the last index of a group i |
316: inline int last(int igroup) const { return (*group_offsets_)[igroup + 1]; } |
/usr/lib/gcc/x86_64-redhat-linux/11/../../../../include/c++/11/bits/stl_iterator.h: 1028 - 1182 |
-------------------------------------------------------------------------------- |
1028: : _M_current(__i) { } |
[...] |
1182: { return __lhs.base() != __rhs.base(); } |
/home/eoseret/qaas_runs_CPU_9468/171-143-7755/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/VectorSoAContainer.h: 231 - 273 |
-------------------------------------------------------------------------------- |
231: inline const AoSElement_t operator[](size_t i) const { return AoSElement_t(myData + i, nGhosts); } |
[...] |
244: *(_base + M * i) = rhs[i]; |
[...] |
263: inline Accessor operator()(size_t i) { return Accessor(myData + i, nGhosts); } |
[...] |
273: inline const T* restrict data(size_t i) const { return myData + i * nGhosts; } |
/home/eoseret/qaas_runs_CPU_9468/171-143-7755/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/OhmmsVector.h: 223 - 249 |
-------------------------------------------------------------------------------- |
223: return X[i]; |
[...] |
229: return X[i]; |
[...] |
249: inline const_pointer data() const { return X; } |
/home/eoseret/qaas_runs_CPU_9468/171-143-7755/intel/miniqmc/build/miniqmc/src/Numerics/PETE/OperatorTags.h: 94 - 94 |
-------------------------------------------------------------------------------- |
94: (const_cast<T1&>(a) += b); |
0x4202b0 PUSH %RBP |
0x4202b1 MOV %RSP,%RBP |
0x4202b4 PUSH %R15 |
0x4202b6 PUSH %R14 |
0x4202b8 PUSH %R13 |
0x4202ba PUSH %R12 |
0x4202bc PUSH %RBX |
0x4202bd AND $-0x20,%RSP |
0x4202c1 SUB $0x160,%RSP |
0x4202c8 MOV %RCX,0x90(%RSP) |
0x4202d0 MOV %RDX,0x88(%RSP) |
0x4202d8 MOV %RDI,%R12 |
0x4202db TEST %R8B,%R8B |
0x4202de JE 420d55 |
0x4202e4 MOV %RSI,%RBX |
0x4202e7 MOV 0x248(%R12),%ESI |
0x4202ef MOV %RBX,%RDI |
0x4202f2 CALL 45f8c0 <_ZNK11qmcplusplus11ParticleSet14getDistTableAAEi> |
0x4202f7 MOV 0xa0(%R12),%R10 |
0x4202ff TEST %R10,%R10 |
0x420302 JE 420d55 |
0x420308 MOV %RAX,%R15 |
0x42030b XOR %ECX,%ECX |
0x42030d VMOVSD 0xd5f63(%RIP),%XMM6 |
0x420315 VBROADCASTSD 0xd5f5a(%RIP),%YMM7 |
0x42031e VBROADCASTSD 0xd4d51(%RIP),%YMM8 |
0x420327 VMOVSD 0xd4d49(%RIP),%XMM9 |
0x42032f MOV %R10,%RDX |
0x420332 MOV %RBX,0x68(%RSP) |
0x420337 MOV %R12,0x48(%RSP) |
0x42033c MOV %RAX,0x28(%RSP) |
0x420341 JMP 42036f |
0x420343 NOPW %CS:(%RAX,%RAX,1) |
(375) 0x420350 MOV %RDX,%RAX |
(375) 0x420353 MOV 0x98(%RSP),%RCX |
(375) 0x42035b INC %RCX |
(375) 0x42035e MOV %RAX,%RDX |
(375) 0x420361 CMP %RCX,%RAX |
(375) 0x420364 MOV 0x68(%RSP),%RBX |
(375) 0x420369 JBE 420d55 |
(375) 0x42036f MOV 0x268(%RBX),%RAX |
(375) 0x420376 MOV 0x18(%RAX),%RAX |
(375) 0x42037a MOVSXD (%RAX,%RCX,4),%RSI |
(375) 0x42037e MOV 0x4(%RAX,%RCX,4),%EAX |
(375) 0x420382 CMP %EAX,%ESI |
(375) 0x420384 MOV %RCX,0x98(%RSP) |
(375) 0x42038c JGE 420350 |
(375) 0x42038e MOV %EAX,0x74(%RSP) |
(375) 0x420392 MOV 0x140(%R12),%R9 |
(375) 0x42039a MOV 0x158(%R12),%R13 |
(375) 0x4203a2 MOV 0x170(%R12),%RBX |
(375) 0x4203aa MOV $0x1fffffffffffffff,%RAX |
(375) 0x4203b4 ADD %RSI,%RAX |
(375) 0x4203b7 MOV %RAX,0x78(%RSP) |
(375) 0x4203bc JMP 4203dd |
0x4203be XCHG %AX,%AX |
(377) 0x4203c0 INC %RSI |
(377) 0x4203c3 INCQ 0x78(%RSP) |
(377) 0x4203c8 MOV %R10,%RAX |
(377) 0x4203cb CMP %ESI,0x74(%RSP) |
(377) 0x4203cf MOV 0x80(%RSP),%RDX |
(377) 0x4203d7 JE 420353 |
(377) 0x4203dd MOV %RBX,0x30(%RSP) |
(377) 0x4203e2 MOV 0x48(%R15),%RAX |
(377) 0x4203e6 LEA (%RSI,%RSI,4),%RCX |
(377) 0x4203ea MOV %RCX,0x20(%RSP) |
(377) 0x4203ef MOV 0x18(%RAX,%RCX,8),%R8 |
(377) 0x4203f4 TEST %RSI,%RSI |
(377) 0x4203f7 MOV %RSI,0x60(%RSP) |
(377) 0x4203fc MOV %R9,0x38(%RSP) |
(377) 0x420401 JLE 42047d |
(377) 0x420403 MOV %ESI,%EBX |
(377) 0x420405 SAL $0x3,%RBX |
(377) 0x420409 MOV %R9,%RDI |
(377) 0x42040c XOR %ESI,%ESI |
(377) 0x42040e MOV %RDX,%R15 |
(377) 0x420411 MOV %RBX,%RDX |
(377) 0x420414 MOV %R10,%R14 |
(377) 0x420417 MOV %R8,%R12 |
(377) 0x42041a VZEROUPPER |
(377) 0x42041d CALL 4e63c0 <_intel_fast_memset> |
(377) 0x420422 MOV %R13,%RDI |
(377) 0x420425 XOR %ESI,%ESI |
(377) 0x420427 MOV %RBX,%RDX |
(377) 0x42042a CALL 4e63c0 <_intel_fast_memset> |
(377) 0x42042f MOV 0x30(%RSP),%RDI |
(377) 0x420434 XOR %ESI,%ESI |
(377) 0x420436 MOV %RBX,%RDX |
(377) 0x420439 CALL 4e63c0 <_intel_fast_memset> |
(377) 0x42043e MOV %R12,%R8 |
(377) 0x420441 MOV %R15,%RDX |
(377) 0x420444 MOV 0x28(%RSP),%R15 |
(377) 0x420449 MOV 0x48(%RSP),%R12 |
(377) 0x42044e MOV 0x38(%RSP),%R9 |
(377) 0x420453 MOV 0x60(%RSP),%RSI |
(377) 0x420458 MOV %R14,%R10 |
(377) 0x42045b VMOVSD 0xd4c15(%RIP),%XMM9 |
(377) 0x420463 VBROADCASTSD 0xd4c0c(%RIP),%YMM8 |
(377) 0x42046c VBROADCASTSD 0xd5e03(%RIP),%YMM7 |
(377) 0x420475 VMOVSD 0xd5dfb(%RIP),%XMM6 |
(377) 0x42047d TEST %RDX,%RDX |
(377) 0x420480 JE 420560 |
(377) 0x420486 MOV 0x68(%RSP),%RAX |
(377) 0x42048b MOV 0x18(%RAX),%RAX |
(377) 0x42048f IMUL (%RAX,%RSI,4),%EDX |
(377) 0x420493 MOVSXD %EDX,%R14 |
(377) 0x420496 SAL $0x3,%R14 |
(377) 0x42049a MOV %R12,%R15 |
(377) 0x42049d MOV $0x1,%R12D |
(377) 0x4204a3 MOV %R13,0x40(%RSP) |
(377) 0x4204a8 MOV 0x30(%RSP),%R13 |
(377) 0x4204ad NOPL (%RAX) |
(395) 0x4204b0 MOV 0x200(%R15),%RAX |
(395) 0x4204b7 ADD %R14,%RAX |
(395) 0x4204ba MOV -0x8(%RAX,%R12,8),%RDI |
(395) 0x4204bf MOV 0x68(%RSP),%RAX |
(395) 0x4204c4 MOV 0x268(%RAX),%RAX |
(395) 0x4204cb MOV 0x18(%RAX),%RAX |
(395) 0x4204cf MOV -0x4(%RAX,%R12,4),%EDX |
(395) 0x4204d4 MOV (%RAX,%R12,4),%ECX |
(395) 0x4204d8 CMP %ESI,%ECX |
(395) 0x4204da CMOVGE %ESI,%ECX |
(395) 0x4204dd MOV %R8,%RBX |
(395) 0x4204e0 PUSHQ 0x1e8(%R15) |
(395) 0x4204e7 PUSHQ 0x1d0(%R15) |
(395) 0x4204ee PUSH %R13 |
(395) 0x4204f0 PUSHQ 0x58(%RSP) |
(395) 0x4204f4 VZEROUPPER |
(395) 0x4204f7 CALL 41d2d0 <_ZNK11qmcplusplus14BsplineFunctorIdE11evaluateVGLEiiiPKdPdS4_S4_S4_Pi> |
(395) 0x4204fc MOV %RBX,%R8 |
(395) 0x4204ff MOV 0x58(%RSP),%R9 |
(395) 0x420504 MOV 0x80(%RSP),%RSI |
(395) 0x42050c ADD $0x20,%RSP |
(395) 0x420510 MOV %R12D,%EAX |
(395) 0x420513 MOV 0xa0(%R15),%R10 |
(395) 0x42051a INC %R12 |
(395) 0x42051d CMP %RAX,%R10 |
(395) 0x420520 JA 4204b0 |
(377) 0x420522 MOV 0x140(%R15),%R9 |
(377) 0x420529 MOV %R10,%RAX |
(377) 0x42052c MOV %R10,0x80(%RSP) |
(377) 0x420534 MOV %R15,%R12 |
(377) 0x420537 MOV 0x28(%RSP),%R15 |
(377) 0x42053c VMOVSD 0xd5d34(%RIP),%XMM6 |
(377) 0x420544 VBROADCASTSD 0xd5d2b(%RIP),%YMM7 |
(377) 0x42054d VBROADCASTSD 0xd4b22(%RIP),%YMM8 |
(377) 0x420556 VMOVSD 0xd4b1a(%RIP),%XMM9 |
(377) 0x42055e JMP 42056a |
(377) 0x420560 XOR %EAX,%EAX |
(377) 0x420562 MOV %RAX,0x80(%RSP) |
(377) 0x42056a VXORPD %XMM0,%XMM0,%XMM0 |
(377) 0x42056e VXORPD %XMM1,%XMM1,%XMM1 |
(377) 0x420572 MOV $0x1fffffffffffffff,%RAX |
(377) 0x42057c TEST %RAX,%RSI |
(377) 0x42057f JE 4205fe |
(377) 0x420581 LEA (%RSI,%RAX,1),%RCX |
(377) 0x420585 AND %RAX,%RCX |
(377) 0x420588 INC %RCX |
(377) 0x42058b MOV %RCX,%RAX |
(377) 0x42058e MOV $0x3ffffffffffffffc,%RDX |
(377) 0x420598 AND %RDX,%RAX |
(377) 0x42059b JE 4205e0 |
(377) 0x42059d VXORPD %XMM1,%XMM1,%XMM1 |
(377) 0x4205a1 XOR %EDX,%EDX |
(377) 0x4205a3 NOPW %CS:(%RAX,%RAX,1) |
(394) 0x4205b0 VADDPD (%R9,%RDX,8),%YMM1,%YMM1 |
(394) 0x4205b6 ADD $0x4,%RDX |
(394) 0x4205ba CMP %RAX,%RDX |
(394) 0x4205bd JB 4205b0 |
(377) 0x4205bf VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(377) 0x4205c5 VADDPD %XMM2,%XMM1,%XMM1 |
(377) 0x4205c9 VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(377) 0x4205ce VADDSD %XMM2,%XMM1,%XMM1 |
(377) 0x4205d2 CMP %RAX,%RCX |
(377) 0x4205d5 JNE 4205e2 |
(377) 0x4205d7 JMP 4205fe |
0x4205d9 NOPL (%RAX) |
(377) 0x4205e0 XOR %EAX,%EAX |
(377) 0x4205e2 MOV $0x3d,%CL |
(377) 0x4205e4 BZHI %RCX,0x78(%RSP),%RCX |
(377) 0x4205eb INC %RCX |
(377) 0x4205ee XCHG %AX,%AX |
(393) 0x4205f0 VADDSD (%R9,%RAX,8),%XMM1,%XMM1 |
(393) 0x4205f6 INC %RAX |
(393) 0x4205f9 CMP %RAX,%RCX |
(393) 0x4205fc JNE 4205f0 |
(377) 0x4205fe MOV 0xd8(%R12),%RDX |
(377) 0x420606 VMOVSD %XMM1,(%RDX,%RSI,8) |
(377) 0x42060b MOV 0x158(%R12),%R13 |
(377) 0x420613 MOV 0x170(%R12),%RBX |
(377) 0x42061b MOV 0x60(%R15),%RAX |
(377) 0x42061f TEST %RSI,%RSI |
(377) 0x420622 JLE 420680 |
(377) 0x420624 MOV %RSI,%RCX |
(377) 0x420627 AND $-0x4,%RCX |
(377) 0x42062b JE 420670 |
(377) 0x42062d LEA -0x1(%RCX),%R8 |
(377) 0x420631 VXORPD %XMM0,%XMM0,%XMM0 |
(377) 0x420635 XOR %EDI,%EDI |
(377) 0x420637 NOPW (%RAX,%RAX,1) |
(392) 0x420640 VADDPD (%RBX,%RDI,8),%YMM0,%YMM0 |
(392) 0x420645 VFMADD231PD (%R13,%RDI,8),%YMM7,%YMM0 |
(392) 0x42064c ADD $0x4,%RDI |
(392) 0x420650 CMP %R8,%RDI |
(392) 0x420653 JLE 420640 |
(377) 0x420655 VEXTRACTF128 $0x1,%YMM0,%XMM1 |
(377) 0x42065b VADDPD %XMM1,%XMM0,%XMM0 |
(377) 0x42065f VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(377) 0x420664 VADDSD %XMM1,%XMM0,%XMM0 |
(377) 0x420668 JMP 420be0 |
0x42066d NOPL (%RAX) |
(377) 0x420670 VXORPD %XMM0,%XMM0,%XMM0 |
(377) 0x420674 XOR %ECX,%ECX |
(377) 0x420676 JMP 420be9 |
0x42067b NOPL (%RAX,%RAX,1) |
(377) 0x420680 MOV 0x20(%RSP),%RCX |
(377) 0x420685 MOV 0x8(%RAX,%RCX,8),%R14 |
(377) 0x42068a MOV 0x18(%RAX,%RCX,8),%RAX |
(377) 0x42068f VXORPD %XMM2,%XMM2,%XMM2 |
(377) 0x420693 VXORPD %XMM1,%XMM1,%XMM1 |
(377) 0x420697 TEST %RSI,%RSI |
(377) 0x42069a JLE 420705 |
(377) 0x42069c MOV %RSI,%R8 |
(377) 0x42069f AND $-0x4,%R8 |
(377) 0x4206a3 JE 4206e0 |
(377) 0x4206a5 LEA -0x1(%R8),%RCX |
(377) 0x4206a9 VXORPD %XMM1,%XMM1,%XMM1 |
(377) 0x4206ad XOR %EDI,%EDI |
(377) 0x4206af NOP |
(390) 0x4206b0 VMOVUPD (%RAX,%RDI,8),%YMM3 |
(390) 0x4206b5 VFMADD231PD (%R13,%RDI,8),%YMM3,%YMM1 |
(390) 0x4206bc ADD $0x4,%RDI |
(390) 0x4206c0 CMP %RCX,%RDI |
(390) 0x4206c3 JLE 4206b0 |
(377) 0x4206c5 VEXTRACTF128 $0x1,%YMM1,%XMM3 |
(377) 0x4206cb VADDPD %XMM3,%XMM1,%XMM1 |
(377) 0x4206cf VSHUFPD $0x1,%XMM1,%XMM1,%XMM3 |
(377) 0x4206d4 VADDSD %XMM3,%XMM1,%XMM1 |
(377) 0x4206d8 JMP 420700 |
0x4206da NOPW (%RAX,%RAX,1) |
(377) 0x4206e0 XOR %R8D,%R8D |
(377) 0x4206e3 NOPW %CS:(%RAX,%RAX,1) |
(389) 0x4206f0 VMOVSD (%RAX,%R8,8),%XMM3 |
(389) 0x4206f6 VFMADD231SD (%R13,%R8,8),%XMM3,%XMM1 |
(389) 0x4206fd INC %R8 |
(389) 0x420700 CMP %R8,%RSI |
(389) 0x420703 JNE 4206f0 |
(377) 0x420705 TEST %RSI,%RSI |
(377) 0x420708 JLE 420785 |
(377) 0x42070a MOV %RSI,%R11 |
(377) 0x42070d AND $-0x4,%R11 |
(377) 0x420711 JE 420760 |
(377) 0x420713 LEA -0x1(%R11),%RCX |
(377) 0x420717 LEA (%RAX,%R14,8),%RDI |
(377) 0x42071b VXORPD %XMM2,%XMM2,%XMM2 |
(377) 0x42071f XOR %R8D,%R8D |
(377) 0x420722 NOPW %CS:(%RAX,%RAX,1) |
(388) 0x420730 VMOVUPD (%RDI,%R8,8),%YMM3 |
(388) 0x420736 VFMADD231PD (%R13,%R8,8),%YMM3,%YMM2 |
(388) 0x42073d ADD $0x4,%R8 |
(388) 0x420741 CMP %RCX,%R8 |
(388) 0x420744 JLE 420730 |
(377) 0x420746 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(377) 0x42074c VADDPD %XMM3,%XMM2,%XMM2 |
(377) 0x420750 VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(377) 0x420755 VADDSD %XMM3,%XMM2,%XMM2 |
(377) 0x420759 CMP %R11,%RSI |
(377) 0x42075c JNE 420767 |
(377) 0x42075e JMP 420785 |
(377) 0x420760 VXORPD %XMM2,%XMM2,%XMM2 |
(377) 0x420764 XOR %R11D,%R11D |
(377) 0x420767 LEA (%RAX,%R14,8),%RCX |
(377) 0x42076b NOPL (%RAX,%RAX,1) |
(387) 0x420770 VMOVSD (%RCX,%R11,8),%XMM3 |
(387) 0x420776 VFMADD231SD (%R13,%R11,8),%XMM3,%XMM2 |
(387) 0x42077d INC %R11 |
(387) 0x420780 CMP %R11,%RSI |
(387) 0x420783 JNE 420770 |
(377) 0x420785 TEST %RSI,%RSI |
(377) 0x420788 MOV %R10,0x58(%RSP) |
(377) 0x42078d JLE 4207e0 |
(377) 0x42078f MOV %RSI,%R11 |
(377) 0x420792 AND $-0x4,%R11 |
(377) 0x420796 JE 4207f0 |
(377) 0x420798 LEA -0x1(%R11),%RCX |
(377) 0x42079c MOV %R14,%RDI |
(377) 0x42079f SAL $0x4,%RDI |
(377) 0x4207a3 ADD %RAX,%RDI |
(377) 0x4207a6 VXORPD %XMM3,%XMM3,%XMM3 |
(377) 0x4207aa XOR %R8D,%R8D |
(377) 0x4207ad NOPL (%RAX) |
(386) 0x4207b0 VMOVUPD (%RDI,%R8,8),%YMM4 |
(386) 0x4207b6 VFMADD231PD (%R13,%R8,8),%YMM4,%YMM3 |
(386) 0x4207bd ADD $0x4,%R8 |
(386) 0x4207c1 CMP %RCX,%R8 |
(386) 0x4207c4 JLE 4207b0 |
(377) 0x4207c6 VEXTRACTF128 $0x1,%YMM3,%XMM4 |
(377) 0x4207cc VADDPD %XMM4,%XMM3,%XMM3 |
(377) 0x4207d0 VSHUFPD $0x1,%XMM3,%XMM3,%XMM4 |
(377) 0x4207d5 VADDSD %XMM4,%XMM3,%XMM3 |
(377) 0x4207d9 CMP %R11,%RSI |
(377) 0x4207dc JNE 4207f7 |
(377) 0x4207de JMP 420825 |
(377) 0x4207e0 VXORPD %XMM3,%XMM3,%XMM3 |
(377) 0x4207e4 JMP 420825 |
0x4207e6 NOPW %CS:(%RAX,%RAX,1) |
(377) 0x4207f0 VXORPD %XMM3,%XMM3,%XMM3 |
(377) 0x4207f4 XOR %R11D,%R11D |
(377) 0x4207f7 MOV %R14,%RCX |
(377) 0x4207fa SAL $0x4,%RCX |
(377) 0x4207fe ADD %RAX,%RCX |
(377) 0x420801 NOPW %CS:(%RAX,%RAX,1) |
(385) 0x420810 VMOVSD (%RCX,%R11,8),%XMM4 |
(385) 0x420816 VFMADD231SD (%R13,%R11,8),%XMM4,%XMM3 |
(385) 0x42081d INC %R11 |
(385) 0x420820 CMP %R11,%RSI |
(385) 0x420823 JNE 420810 |
(377) 0x420825 MOV %R14,0x20(%RSP) |
(377) 0x42082a VPUNPCKLQDQ %XMM2,%XMM1,%XMM1 |
(377) 0x42082e MOV 0xf0(%R12),%RDI |
(377) 0x420836 MOV 0x100(%R12),%R14 |
(377) 0x42083e VMOVQ %RDI,%XMM2 |
(377) 0x420843 VPSLLDQ $0x8,%XMM2,%XMM2 |
(377) 0x420848 VPBROADCASTQ %R14,%XMM4 |
(377) 0x42084e VPBROADCASTQ %RSI,%XMM5 |
(377) 0x420854 VPADDQ %XMM2,%XMM5,%XMM2 |
(377) 0x420858 VPSLLQ $0x3,%XMM2,%XMM2 |
(377) 0x42085d VPADDQ %XMM2,%XMM4,%XMM2 |
(377) 0x420861 VMOVQ %XMM2,%RCX |
(377) 0x420866 VMOVLPD %XMM1,(%RCX) |
(377) 0x42086a VPEXTRQ $0x1,%XMM2,%RCX |
(377) 0x420870 VMOVHPD %XMM1,(%RCX) |
(377) 0x420874 MOV %RDI,0x50(%RSP) |
(377) 0x420879 LEA (%RSI,%RDI,2),%RCX |
(377) 0x42087d VMOVSD %XMM3,(%R14,%RCX,8) |
(377) 0x420883 VXORPD 0xd47b3(%RIP){1to2},%XMM0,%XMM0 |
(377) 0x42088d MOV 0x128(%R12),%R8 |
(377) 0x420895 VMOVLPD %XMM0,(%R8,%RSI,8) |
(377) 0x42089b TEST %RSI,%RSI |
(377) 0x42089e JLE 420a10 |
(377) 0x4208a4 LEA -0x8(%RDX,%RSI,8),%R11 |
(377) 0x4208a9 CMP %R8,%R11 |
(377) 0x4208ac SETAEB 0x1f(%RSP) |
(377) 0x4208b1 LEA -0x8(%R8,%RSI,8),%RDI |
(377) 0x4208b6 CMP %RDX,%RDI |
(377) 0x4208b9 SETAEB 0x1e(%RSP) |
(377) 0x4208be CMP %R9,%R11 |
(377) 0x4208c1 SETB %R15B |
(377) 0x4208c5 LEA -0x8(%R9,%RSI,8),%R10 |
(377) 0x4208ca CMP %RDX,%R10 |
(377) 0x4208cd SETBB 0x1d(%RSP) |
(377) 0x4208d2 CMP %R8,%R10 |
(377) 0x4208d5 SETB %R12B |
(377) 0x4208d9 MOV %R9,0x38(%RSP) |
(377) 0x4208de CMP %R9,%RDI |
(377) 0x4208e1 SETBB 0x1c(%RSP) |
(377) 0x4208e6 CMP %R13,%R11 |
(377) 0x4208e9 SETB %R10B |
(377) 0x4208ed MOV %R13,%RCX |
(377) 0x4208f0 MOV %RBX,%R13 |
(377) 0x4208f3 LEA -0x8(%RCX,%RSI,8),%RBX |
(377) 0x4208f8 CMP %RDX,%RBX |
(377) 0x4208fb SETBB 0x1b(%RSP) |
(377) 0x420900 CMP %R13,%R11 |
(377) 0x420903 SETB %R11B |
(377) 0x420907 LEA -0x8(%R13,%RSI,8),%R9 |
(377) 0x42090c CMP %RDX,%R9 |
(377) 0x42090f SETBB 0x1a(%RSP) |
(377) 0x420914 CMP %R8,%RBX |
(377) 0x420917 SETB %BL |
(377) 0x42091a MOV %RCX,0x40(%RSP) |
(377) 0x42091f CMP %RCX,%RDI |
(377) 0x420922 SETB %SIL |
(377) 0x420926 CMP %R8,%R9 |
(377) 0x420929 SETB %R9B |
(377) 0x42092d MOV %R13,0x30(%RSP) |
(377) 0x420932 CMP %R13,%RDI |
(377) 0x420935 SETB %CL |
(377) 0x420938 MOVZX 0x1e(%RSP),%EDI |
(377) 0x42093d TEST %DIL,0x1f(%RSP) |
(377) 0x420942 JNE 420a30 |
(377) 0x420948 OR 0x1d(%RSP),%R15B |
(377) 0x42094d JE 420a30 |
(377) 0x420953 OR 0x1c(%RSP),%R12B |
(377) 0x420958 JE 420a30 |
(377) 0x42095e OR 0x1b(%RSP),%R10B |
(377) 0x420963 JE 420a30 |
(377) 0x420969 OR 0x1a(%RSP),%R11B |
(377) 0x42096e JE 420a30 |
(377) 0x420974 OR %SIL,%BL |
(377) 0x420977 JE 420a30 |
(377) 0x42097d OR %CL,%R9B |
(377) 0x420980 JE 420a30 |
(377) 0x420986 MOV 0x60(%RSP),%RSI |
(377) 0x42098b MOV %RSI,%R11 |
(377) 0x42098e AND $-0x4,%R11 |
(377) 0x420992 JE 420ad7 |
(377) 0x420998 LEA -0x1(%R11),%RCX |
(377) 0x42099c XOR %EDI,%EDI |
(377) 0x42099e MOV 0x38(%RSP),%R9 |
(377) 0x4209a3 MOV 0x30(%RSP),%RBX |
(377) 0x4209a8 MOV 0x40(%RSP),%R13 |
(377) 0x4209ad NOPL (%RAX) |
(384) 0x4209b0 VMOVUPD (%RDX,%RDI,8),%YMM0 |
(384) 0x4209b5 VADDPD (%R9,%RDI,8),%YMM0,%YMM0 |
(384) 0x4209bb VMOVUPD %YMM0,(%RDX,%RDI,8) |
(384) 0x4209c0 VMOVUPD (%R13,%RDI,8),%YMM0 |
(384) 0x4209c7 VFMSUB213PD (%RBX,%RDI,8),%YMM8,%YMM0 |
(384) 0x4209cd VADDPD (%R8,%RDI,8),%YMM0,%YMM0 |
(384) 0x4209d3 VMOVUPD %YMM0,(%R8,%RDI,8) |
(384) 0x4209d9 ADD $0x4,%RDI |
(384) 0x4209dd CMP %RCX,%RDI |
(384) 0x4209e0 JLE 4209b0 |
(377) 0x4209e2 CMP %R11,%RSI |
(377) 0x4209e5 MOV 0x48(%RSP),%R12 |
(377) 0x4209ea MOV 0x58(%RSP),%R10 |
(377) 0x4209ef MOV 0x28(%RSP),%R15 |
(377) 0x4209f4 JE 420a86 |
(377) 0x4209fa VPBROADCASTQ %RSI,%YMM0 |
(377) 0x420a00 JMP 420afe |
0x420a05 NOPW %CS:(%RAX,%RAX,1) |
(377) 0x420a10 MOV 0x58(%RSP),%R10 |
(377) 0x420a15 MOV 0x28(%RSP),%R15 |
(377) 0x420a1a TEST %RSI,%RSI |
(377) 0x420a1d JG 420a8f |
(377) 0x420a1f JMP 4203c0 |
0x420a24 NOPW %CS:(%RAX,%RAX,1) |
(377) 0x420a30 XOR %ECX,%ECX |
(377) 0x420a32 MOV 0x58(%RSP),%R10 |
(377) 0x420a37 MOV 0x28(%RSP),%R15 |
(377) 0x420a3c MOV 0x60(%RSP),%RSI |
(377) 0x420a41 MOV 0x38(%RSP),%R9 |
(377) 0x420a46 MOV 0x30(%RSP),%RBX |
(377) 0x420a4b MOV 0x40(%RSP),%R13 |
(383) 0x420a50 VMOVSD (%RDX,%RCX,8),%XMM0 |
(383) 0x420a55 VADDSD (%R9,%RCX,8),%XMM0,%XMM0 |
(383) 0x420a5b VMOVSD %XMM0,(%RDX,%RCX,8) |
(383) 0x420a60 VMOVSD (%R13,%RCX,8),%XMM0 |
(383) 0x420a67 VFMSUB213SD (%RBX,%RCX,8),%XMM9,%XMM0 |
(383) 0x420a6d VADDSD (%R8,%RCX,8),%XMM0,%XMM0 |
(383) 0x420a73 VMOVSD %XMM0,(%R8,%RCX,8) |
(383) 0x420a79 INC %RCX |
(383) 0x420a7c CMP %RCX,%RSI |
(383) 0x420a7f JNE 420a50 |
(377) 0x420a81 MOV 0x48(%RSP),%R12 |
(377) 0x420a86 TEST %RSI,%RSI |
(377) 0x420a89 JLE 4203c0 |
(377) 0x420a8f MOV %RSI,%RDX |
(377) 0x420a92 AND $-0x4,%RDX |
(377) 0x420a96 JE 420ad0 |
(377) 0x420a98 LEA -0x1(%RDX),%RCX |
(377) 0x420a9c XOR %EDI,%EDI |
(377) 0x420a9e XCHG %AX,%AX |
(382) 0x420aa0 VMOVUPD (%RAX,%RDI,8),%YMM0 |
(382) 0x420aa5 VMOVUPD (%R13,%RDI,8),%YMM1 |
(382) 0x420aac VFNMADD213PD (%R14,%RDI,8),%YMM0,%YMM1 |
(382) 0x420ab2 VMOVUPD %YMM1,(%R14,%RDI,8) |
(382) 0x420ab8 ADD $0x4,%RDI |
(382) 0x420abc CMP %RCX,%RDI |
(382) 0x420abf JLE 420aa0 |
(377) 0x420ac1 JMP 420c1b |
0x420ac6 NOPW %CS:(%RAX,%RAX,1) |
(377) 0x420ad0 XOR %EDX,%EDX |
(377) 0x420ad2 JMP 420c00 |
(377) 0x420ad7 VPBROADCASTQ %RSI,%YMM0 |
(377) 0x420add XOR %R11D,%R11D |
(377) 0x420ae0 MOV 0x48(%RSP),%R12 |
(377) 0x420ae5 MOV 0x58(%RSP),%R10 |
(377) 0x420aea MOV 0x28(%RSP),%R15 |
(377) 0x420aef MOV 0x38(%RSP),%R9 |
(377) 0x420af4 MOV 0x30(%RSP),%RBX |
(377) 0x420af9 MOV 0x40(%RSP),%R13 |
(377) 0x420afe VPBROADCASTQ %R11,%YMM1 |
(377) 0x420b04 VPSUBQ %YMM1,%YMM0,%YMM0 |
(377) 0x420b08 VPCMPNLEUQ 0xd58ad(%RIP),%YMM0,%K1 |
(377) 0x420b13 VMOVUPD (%RDX,%R11,8),%YMM0{%K1}{z} |
(377) 0x420b1a VMOVUPD 0xa0(%RSP),%YMM2 |
(377) 0x420b23 VMOVAPD %YMM0,%YMM2{%K1} |
(377) 0x420b29 VMOVUPD (%R9,%R11,8),%YMM0{%K1}{z} |
(377) 0x420b30 VMOVUPD 0xc0(%RSP),%YMM1 |
(377) 0x420b39 VMOVAPD %YMM0,%YMM1{%K1} |
(377) 0x420b3f VMOVUPD %YMM1,0xc0(%RSP) |
(377) 0x420b48 VMOVUPD %YMM2,0xa0(%RSP) |
(377) 0x420b51 VADDPD %YMM1,%YMM2,%YMM0 |
(377) 0x420b55 VMOVUPD %YMM0,(%RDX,%R11,8){%K1} |
(377) 0x420b5c VMOVUPD (%R13,%R11,8),%YMM0{%K1}{z} |
(377) 0x420b64 VMOVUPD 0xe0(%RSP),%YMM2 |
(377) 0x420b6d VMOVAPD %YMM0,%YMM2{%K1} |
(377) 0x420b73 VMOVUPD (%RBX,%R11,8),%YMM0{%K1}{z} |
(377) 0x420b7a VMOVUPD 0x100(%RSP),%YMM1 |
(377) 0x420b83 VMOVAPD %YMM0,%YMM1{%K1} |
(377) 0x420b89 VMOVUPD %YMM1,0x100(%RSP) |
(377) 0x420b92 VMOVAPD %YMM1,%YMM0 |
(377) 0x420b96 VMOVUPD %YMM2,0xe0(%RSP) |
(377) 0x420b9f VFMSUB231PD %YMM8,%YMM2,%YMM0 |
(377) 0x420ba4 VMOVUPD (%R8,%R11,8),%YMM1{%K1}{z} |
(377) 0x420bab VMOVUPD 0x120(%RSP),%YMM2 |
(377) 0x420bb4 VMOVAPD %YMM1,%YMM2{%K1} |
(377) 0x420bba VMOVUPD %YMM2,0x120(%RSP) |
(377) 0x420bc3 VADDPD %YMM0,%YMM2,%YMM0 |
(377) 0x420bc7 VMOVUPD %YMM0,(%R8,%R11,8){%K1} |
(377) 0x420bce TEST %RSI,%RSI |
(377) 0x420bd1 JG 420a8f |
(377) 0x420bd7 JMP 4203c0 |
0x420bdc NOPL (%RAX) |
(391) 0x420be0 CMP %RCX,%RSI |
(391) 0x420be3 JE 420680 |
(391) 0x420be9 VADDSD (%RBX,%RCX,8),%XMM0,%XMM0 |
(391) 0x420bee VFMADD231SD (%R13,%RCX,8),%XMM6,%XMM0 |
(391) 0x420bf5 INC %RCX |
(391) 0x420bf8 JMP 420be0 |
0x420bfa NOPW (%RAX,%RAX,1) |
(376) 0x420c00 VMOVSD (%RAX,%RDX,8),%XMM0 |
(376) 0x420c05 VMOVSD (%R13,%RDX,8),%XMM1 |
(376) 0x420c0c VFNMADD213SD (%R14,%RDX,8),%XMM0,%XMM1 |
(376) 0x420c12 VMOVSD %XMM1,(%R14,%RDX,8) |
(376) 0x420c18 INC %RDX |
(376) 0x420c1b CMP %RDX,%RSI |
(376) 0x420c1e JNE 420c00 |
(377) 0x420c20 TEST %RSI,%RSI |
(377) 0x420c23 JLE 4203c0 |
(377) 0x420c29 MOV %RSI,%RDX |
(377) 0x420c2c AND $-0x4,%RDX |
(377) 0x420c30 JE 420c79 |
(377) 0x420c32 LEA -0x1(%RDX),%RCX |
(377) 0x420c36 MOV 0x50(%RSP),%RDI |
(377) 0x420c3b LEA (%R14,%RDI,8),%RDI |
(377) 0x420c3f MOV 0x20(%RSP),%R8 |
(377) 0x420c44 LEA (%RAX,%R8,8),%R8 |
(377) 0x420c48 XOR %R11D,%R11D |
(377) 0x420c4b NOPL (%RAX,%RAX,1) |
(381) 0x420c50 VMOVUPD (%R8,%R11,8),%YMM0 |
(381) 0x420c56 VMOVUPD (%R13,%R11,8),%YMM1 |
(381) 0x420c5d VFNMADD213PD (%RDI,%R11,8),%YMM0,%YMM1 |
(381) 0x420c63 VMOVUPD %YMM1,(%RDI,%R11,8) |
(381) 0x420c69 ADD $0x4,%R11 |
(381) 0x420c6d CMP %RCX,%R11 |
(381) 0x420c70 JLE 420c50 |
(377) 0x420c72 CMP %RDX,%RSI |
(377) 0x420c75 JNE 420c7b |
(377) 0x420c77 JMP 420caf |
(377) 0x420c79 XOR %EDX,%EDX |
(377) 0x420c7b MOV 0x50(%RSP),%RCX |
(377) 0x420c80 LEA (%R14,%RCX,8),%RCX |
(377) 0x420c84 MOV 0x20(%RSP),%RDI |
(377) 0x420c89 LEA (%RAX,%RDI,8),%RDI |
(377) 0x420c8d NOPL (%RAX) |
(378) 0x420c90 VMOVSD (%RDI,%RDX,8),%XMM0 |
(378) 0x420c95 VMOVSD (%R13,%RDX,8),%XMM1 |
(378) 0x420c9c VFNMADD213SD (%RCX,%RDX,8),%XMM0,%XMM1 |
(378) 0x420ca2 VMOVSD %XMM1,(%RCX,%RDX,8) |
(378) 0x420ca7 INC %RDX |
(378) 0x420caa CMP %RDX,%RSI |
(378) 0x420cad JNE 420c90 |
(377) 0x420caf TEST %RSI,%RSI |
(377) 0x420cb2 JLE 4203c0 |
(377) 0x420cb8 MOV %RSI,%RDX |
(377) 0x420cbb AND $-0x4,%RDX |
(377) 0x420cbf JE 420d0d |
(377) 0x420cc1 LEA -0x1(%RDX),%RCX |
(377) 0x420cc5 MOV 0x50(%RSP),%RDI |
(377) 0x420cca SAL $0x4,%RDI |
(377) 0x420cce ADD %R14,%RDI |
(377) 0x420cd1 MOV 0x20(%RSP),%R8 |
(377) 0x420cd6 SAL $0x4,%R8 |
(377) 0x420cda ADD %RAX,%R8 |
(377) 0x420cdd XOR %R11D,%R11D |
(380) 0x420ce0 VMOVUPD (%R8,%R11,8),%YMM0 |
(380) 0x420ce6 VMOVUPD (%R13,%R11,8),%YMM1 |
(380) 0x420ced VFNMADD213PD (%RDI,%R11,8),%YMM0,%YMM1 |
(380) 0x420cf3 VMOVUPD %YMM1,(%RDI,%R11,8) |
(380) 0x420cf9 ADD $0x4,%R11 |
(380) 0x420cfd CMP %RCX,%R11 |
(380) 0x420d00 JLE 420ce0 |
(377) 0x420d02 CMP %RDX,%RSI |
(377) 0x420d05 JE 4203c0 |
(377) 0x420d0b JMP 420d0f |
(377) 0x420d0d XOR %EDX,%EDX |
(377) 0x420d0f MOV 0x50(%RSP),%RCX |
(377) 0x420d14 SAL $0x4,%RCX |
(377) 0x420d18 ADD %RCX,%R14 |
(377) 0x420d1b MOV 0x20(%RSP),%RCX |
(377) 0x420d20 SAL $0x4,%RCX |
(377) 0x420d24 ADD %RCX,%RAX |
(377) 0x420d27 NOPW (%RAX,%RAX,1) |
(379) 0x420d30 VMOVSD (%RAX,%RDX,8),%XMM0 |
(379) 0x420d35 VMOVSD (%R13,%RDX,8),%XMM1 |
(379) 0x420d3c VFNMADD213SD (%R14,%RDX,8),%XMM0,%XMM1 |
(379) 0x420d42 VMOVSD %XMM1,(%R14,%RDX,8) |
(379) 0x420d48 INC %RDX |
(379) 0x420d4b CMP %RDX,%RSI |
(379) 0x420d4e JNE 420d30 |
(377) 0x420d50 JMP 4203c0 |
0x420d55 MOVQ $0,0x10(%R12) |
0x420d5e MOV 0x90(%R12),%R9 |
0x420d66 TEST %R9,%R9 |
0x420d69 JE 420db5 |
0x420d6b MOV 0xd8(%R12),%R8 |
0x420d73 MOV 0xf0(%R12),%RDI |
0x420d7b MOV 0x100(%R12),%RSI |
0x420d83 MOV 0x88(%RSP),%RAX |
0x420d8b MOV 0x18(%RAX),%RDX |
0x420d8f MOV 0x128(%R12),%RAX |
0x420d97 MOV 0x90(%RSP),%RCX |
0x420d9f MOV 0x18(%RCX),%RCX |
0x420da3 CMP $0x1,%R9 |
0x420da7 JNE 420dc2 |
0x420da9 VXORPD %XMM0,%XMM0,%XMM0 |
0x420dad XOR %R10D,%R10D |
0x420db0 JMP 420ea6 |
0x420db5 VMOVSD 0xd4283(%RIP),%XMM0 |
0x420dbd JMP 420f13 |
0x420dc2 MOV %R9,%R11 |
0x420dc5 AND $-0x2,%R11 |
0x420dc9 MOVSXD %EDI,%R10 |
0x420dcc LEA 0x8(%RSI,%R10,8),%RBX |
0x420dd1 SAL $0x4,%R10 |
0x420dd5 LEA 0x8(%R10,%RSI,1),%R14 |
0x420dda LEA 0x28(%RDX),%R15 |
0x420dde VXORPD %XMM0,%XMM0,%XMM0 |
0x420de2 XOR %R10D,%R10D |
0x420de5 NOPW %CS:(%RAX,%RAX,1) |
(374) 0x420df0 VADDSD (%R8,%R10,8),%XMM0,%XMM0 |
(374) 0x420df6 VMOVSD %XMM0,0x10(%R12) |
(374) 0x420dfd VMOVSD (%RSI,%R10,8),%XMM0 |
(374) 0x420e03 VMOVHPD -0x8(%RBX,%R10,8),%XMM0,%XMM0 |
(374) 0x420e0a VADDPD -0x28(%R15),%XMM0,%XMM0 |
(374) 0x420e10 VMOVSD -0x18(%R15),%XMM1 |
(374) 0x420e16 VADDSD -0x8(%R14,%R10,8),%XMM1,%XMM1 |
(374) 0x420e1d VMOVUPD %XMM0,-0x28(%R15) |
(374) 0x420e23 VMOVSD %XMM1,-0x18(%R15) |
(374) 0x420e29 VMOVSD (%RCX,%R10,8),%XMM0 |
(374) 0x420e2f VADDSD (%RAX,%R10,8),%XMM0,%XMM0 |
(374) 0x420e35 VMOVSD %XMM0,(%RCX,%R10,8) |
(374) 0x420e3b VMOVSD 0x8(%R8,%R10,8),%XMM0 |
(374) 0x420e42 VADDSD 0x10(%R12),%XMM0,%XMM0 |
(374) 0x420e49 VMOVSD %XMM0,0x10(%R12) |
(374) 0x420e50 VMOVSD 0x8(%RSI,%R10,8),%XMM0 |
(374) 0x420e57 VMOVHPD (%RBX,%R10,8),%XMM0,%XMM0 |
(374) 0x420e5d VADDPD -0x10(%R15),%XMM0,%XMM0 |
(374) 0x420e63 VMOVSD (%R15),%XMM1 |
(374) 0x420e68 VADDSD (%R14,%R10,8),%XMM1,%XMM1 |
(374) 0x420e6e VMOVUPD %XMM0,-0x10(%R15) |
(374) 0x420e74 VMOVSD %XMM1,(%R15) |
(374) 0x420e79 VMOVSD 0x8(%RCX,%R10,8),%XMM0 |
(374) 0x420e80 VADDSD 0x8(%RAX,%R10,8),%XMM0,%XMM0 |
(374) 0x420e87 VMOVSD %XMM0,0x8(%RCX,%R10,8) |
(374) 0x420e8e VMOVSD 0x10(%R12),%XMM0 |
(374) 0x420e95 ADD $0x2,%R10 |
(374) 0x420e99 ADD $0x30,%R15 |
(374) 0x420e9d CMP %R10,%R11 |
(374) 0x420ea0 JNE 420df0 |
0x420ea6 TEST $0x1,%R9B |
0x420eaa JE 420f0b |
0x420eac VADDSD (%R8,%R10,8),%XMM0,%XMM0 |
0x420eb2 VMOVSD %XMM0,0x10(%R12) |
0x420eb9 MOVSXD %EDI,%RDI |
0x420ebc LEA (%R10,%RDI,2),%R8 |
0x420ec0 ADD %R10,%RDI |
0x420ec3 LEA (%R10,%R10,2),%R9 |
0x420ec7 VMOVSD (%RSI,%R10,8),%XMM0 |
0x420ecd VMOVHPD (%RSI,%RDI,8),%XMM0,%XMM0 |
0x420ed2 VADDPD (%RDX,%R9,8),%XMM0,%XMM0 |
0x420ed8 VMOVSD 0x10(%RDX,%R9,8),%XMM1 |
0x420edf VADDSD (%RSI,%R8,8),%XMM1,%XMM1 |
0x420ee5 VMOVUPD %XMM0,(%RDX,%R9,8) |
0x420eeb VMOVSD %XMM1,0x10(%RDX,%R9,8) |
0x420ef2 VMOVSD (%RCX,%R10,8),%XMM0 |
0x420ef8 VADDSD (%RAX,%R10,8),%XMM0,%XMM0 |
0x420efe VMOVSD %XMM0,(%RCX,%R10,8) |
0x420f04 VMOVSD 0x10(%R12),%XMM0 |
0x420f0b VMULSD 0xd411d(%RIP),%XMM0,%XMM0 |
0x420f13 VMOVSD %XMM0,0x10(%R12) |
0x420f1a LEA -0x28(%RBP),%RSP |
0x420f1e POP %RBX |
0x420f1f POP %R12 |
0x420f21 POP %R13 |
0x420f23 POP %R14 |
0x420f25 POP %R15 |
0x420f27 POP %RBP |
0x420f28 VZEROUPPER |
0x420f2b RET |
0x420f2c NOPL (%RAX) |
Path / |
Source file and lines | TwoBodyJastrowRef.h:268-432 |
Module | exec |
nb instructions | 104 |
nb uops | 106 |
loop length | 529 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 4 |
used ymm registers | 2 |
used zmm registers | 0 |
nb stack references | 6 |
ADD-SUB / MUL ratio | 4.00 |
micro-operation queue | 18.50 cycles |
front end | 18.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 5.20 | 5.30 | 11.00 | 11.00 | 9.00 | 5.10 | 5.20 | 9.00 | 9.00 | 9.00 | 5.20 | 11.00 |
cycles | 5.20 | 5.30 | 11.00 | 11.00 | 9.00 | 5.10 | 5.20 | 9.00 | 9.00 | 9.00 | 5.20 | 11.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 18.37-18.46 |
Stall cycles | 0.00 |
Front-end | 18.50 |
Dispatch | 11.00 |
Overall L1 | 18.50 |
all | 7% |
load | NA (no load vectorizable/vectorized instructions) |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 18% |
load | 6% |
store | 20% |
mul | 0% |
add-sub | 25% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 50% |
all | 13% |
load | 6% |
store | 9% |
mul | 0% |
add-sub | 25% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 25% |
all | 12% |
load | NA (no load vectorizable/vectorized instructions) |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 14% |
all | 14% |
load | 13% |
store | 15% |
mul | 12% |
add-sub | 15% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 18% |
all | 14% |
load | 13% |
store | 13% |
mul | 12% |
add-sub | 15% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x160,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
TEST %R8B,%R8B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 420d55 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xaa5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RSI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x248(%R12),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 45f8c0 <_ZNK11qmcplusplus11ParticleSet14getDistTableAAEi> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0xa0(%R12),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R10,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 420d55 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xaa5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD 0xd5f63(%RIP),%XMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD 0xd5f5a(%RIP),%YMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0xd4d51(%RIP),%YMM8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVSD 0xd4d49(%RIP),%XMM9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R10,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RBX,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R12,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 42036f <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xbf> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOVQ $0,0x10(%R12) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x90(%R12),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R9,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 420db5 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xb05> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xd8(%R12),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xf0(%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x100(%R12),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x88(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x128(%R12),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x90(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RCX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x1,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 420dc2 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xb12> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R10D,%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 420ea6 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xbf6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
VMOVSD 0xd4283(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 420f13 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xc63> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R9,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x2,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOVSXD %EDI,%R10 | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
LEA 0x8(%RSI,%R10,8),%RBX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
SAL $0x4,%R10 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
LEA 0x8(%R10,%RSI,1),%R14 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA 0x28(%RDX),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R10D,%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST $0x1,%R9B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 420f0b <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xc5b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VADDSD (%R8,%R10,8),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM0,0x10(%R12) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVSXD %EDI,%RDI | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
LEA (%R10,%RDI,2),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD %R10,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA (%R10,%R10,2),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD (%RSI,%R10,8),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVHPD (%RSI,%RDI,8),%XMM0,%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4-12 | 1 |
VADDPD (%RDX,%R9,8),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD 0x10(%RDX,%R9,8),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RSI,%R8,8),%XMM1,%XMM1 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVUPD %XMM0,(%RDX,%R9,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD %XMM1,0x10(%RDX,%R9,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD (%RCX,%R10,8),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RAX,%R10,8),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM0,(%RCX,%R10,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD 0x10(%R12),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD 0xd411d(%RIP),%XMM0,%XMM0 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VMOVSD %XMM0,0x10(%R12) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | TwoBodyJastrowRef.h:268-432 |
Module | exec |
nb instructions | 104 |
nb uops | 106 |
loop length | 529 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 4 |
used ymm registers | 2 |
used zmm registers | 0 |
nb stack references | 6 |
ADD-SUB / MUL ratio | 4.00 |
micro-operation queue | 18.50 cycles |
front end | 18.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 5.20 | 5.30 | 11.00 | 11.00 | 9.00 | 5.10 | 5.20 | 9.00 | 9.00 | 9.00 | 5.20 | 11.00 |
cycles | 5.20 | 5.30 | 11.00 | 11.00 | 9.00 | 5.10 | 5.20 | 9.00 | 9.00 | 9.00 | 5.20 | 11.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 18.37-18.46 |
Stall cycles | 0.00 |
Front-end | 18.50 |
Dispatch | 11.00 |
Overall L1 | 18.50 |
all | 7% |
load | NA (no load vectorizable/vectorized instructions) |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 18% |
load | 6% |
store | 20% |
mul | 0% |
add-sub | 25% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 50% |
all | 13% |
load | 6% |
store | 9% |
mul | 0% |
add-sub | 25% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 25% |
all | 12% |
load | NA (no load vectorizable/vectorized instructions) |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 14% |
all | 14% |
load | 13% |
store | 15% |
mul | 12% |
add-sub | 15% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 18% |
all | 14% |
load | 13% |
store | 13% |
mul | 12% |
add-sub | 15% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x160,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
TEST %R8B,%R8B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 420d55 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xaa5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RSI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x248(%R12),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 45f8c0 <_ZNK11qmcplusplus11ParticleSet14getDistTableAAEi> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0xa0(%R12),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R10,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 420d55 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xaa5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD 0xd5f63(%RIP),%XMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD 0xd5f5a(%RIP),%YMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0xd4d51(%RIP),%YMM8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VMOVSD 0xd4d49(%RIP),%XMM9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R10,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RBX,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R12,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 42036f <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xbf> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOVQ $0,0x10(%R12) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x90(%R12),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R9,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 420db5 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xb05> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xd8(%R12),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xf0(%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x100(%R12),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x88(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x128(%R12),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x90(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RCX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x1,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 420dc2 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xb12> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R10D,%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 420ea6 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xbf6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
VMOVSD 0xd4283(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 420f13 <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xc63> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R9,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x2,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOVSXD %EDI,%R10 | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
LEA 0x8(%RSI,%R10,8),%RBX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
SAL $0x4,%R10 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
LEA 0x8(%R10,%RSI,1),%R14 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA 0x28(%RDX),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R10D,%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST $0x1,%R9B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 420f0b <_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0xc5b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VADDSD (%R8,%R10,8),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM0,0x10(%R12) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVSXD %EDI,%RDI | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
LEA (%R10,%RDI,2),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD %R10,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA (%R10,%R10,2),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD (%RSI,%R10,8),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVHPD (%RSI,%RDI,8),%XMM0,%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4-12 | 1 |
VADDPD (%RDX,%R9,8),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD 0x10(%RDX,%R9,8),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RSI,%R8,8),%XMM1,%XMM1 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVUPD %XMM0,(%RDX,%R9,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVSD %XMM1,0x10(%RDX,%R9,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD (%RCX,%R10,8),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RAX,%R10,8),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM0,(%RCX,%R10,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD 0x10(%R12),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD 0xd411d(%RIP),%XMM0,%XMM0 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VMOVSD %XMM0,0x10(%R12) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼_ZN16miniqmcreference17TwoBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb– | 0.12 | 0.09 |
○Loop 374 - TwoBodyJastrowRef.h:422-427 - exec | 0 | 0 |
▼Loop 375 - TwoBodyJastrowRef.h:268-420 - exec– | 0 | 0 |
▼Loop 377 - TwoBodyJastrowRef.h:268-420 - exec– | 0 | 0 |
○Loop 392 - TwoBodyJastrowRef.h:375-376 - exec | 0.02 | 0.01 |
○Loop 388 - TwoBodyJastrowRef.h:381-382 - exec | 0.02 | 0.01 |
○Loop 384 - TwoBodyJastrowRef.h:388-391 - exec | 0.02 | 0.01 |
○Loop 390 - TwoBodyJastrowRef.h:381-382 - exec | 0.02 | 0.01 |
○Loop 386 - TwoBodyJastrowRef.h:381-382 - exec | 0.02 | 0.01 |
○Loop 381 - TwoBodyJastrowRef.h:397-398 - exec | 0.01 | 0.01 |
○Loop 382 - TwoBodyJastrowRef.h:397-398 - exec | 0.01 | 0.01 |
○Loop 380 - TwoBodyJastrowRef.h:397-398 - exec | 0.01 | 0.01 |
○Loop 394 - stl_numeric.h:140-141 - exec | 0.01 | 0 |
○Loop 389 - TwoBodyJastrowRef.h:381-382 - exec | 0 | 0 |
○Loop 395 - TwoBodyJastrowRef.h:269-274 - exec | 0 | 0 |
○Loop 378 - TwoBodyJastrowRef.h:397-398 - exec | 0 | 0 |
○Loop 393 - stl_numeric.h:140-141 - exec | 0 | 0 |
○Loop 391 - TwoBodyJastrowRef.h:375-376 - exec | 0 | 0 |
○Loop 385 - TwoBodyJastrowRef.h:381-382 - exec | 0 | 0 |
○Loop 376 - TwoBodyJastrowRef.h:397-398 - exec | 0 | 0 |
○Loop 383 - TwoBodyJastrowRef.h:388-391 - exec | 0 | 0 |
○Loop 387 - TwoBodyJastrowRef.h:381-382 - exec | 0 | 0 |
○Loop 379 - TwoBodyJastrowRef.h:397-398 - exec | 0 | 0 |