Function: _ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6 ... | Module: libqmcwfs.so | Source: einspline_spo_ref.hpp:203-230 [...] | Coverage: 0.99% |
---|
Function: _ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6 ... | Module: libqmcwfs.so | Source: einspline_spo_ref.hpp:203-230 [...] | Coverage: 0.99% |
---|
/home/eoseret/qaas_runs_CPU_9468/171-143-7755/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/TinyVector.h: 145 - 145 |
-------------------------------------------------------------------------------- |
145: X[i] = base[i * offset]; |
/cluster/comp/gcc/13.2.0/include/c++/13.2.0/bits/stl_vector.h: 1126 - 1258 |
-------------------------------------------------------------------------------- |
1126: return *(this->_M_impl._M_start + __n); |
[...] |
1258: { return _M_data_ptr(this->_M_impl._M_start); } |
/home/eoseret/qaas_runs_CPU_9468/171-143-7755/intel/miniqmc/build/miniqmc/src/Particle/ParticleSet.h: 143 - 143 |
-------------------------------------------------------------------------------- |
143: return (active_ptcl_ == iat) ? active_pos_ : R[iat]; |
/cluster/comp/gcc/13.2.0/include/c++/13.2.0/bits/stl_algobase.h: 238 - 238 |
-------------------------------------------------------------------------------- |
238: if (__b < __a) |
/home/eoseret/qaas_runs_CPU_9468/171-143-7755/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/einspline_spo_ref.hpp: 203 - 230 |
-------------------------------------------------------------------------------- |
203: ScopedTimer local_timer(timer); |
204: |
205: auto u = Lattice.toUnit_floor(P.activeR(iat)); |
206: for (int i = 0; i < nBlocks; ++i) |
207: MultiBsplineEvalRef::evaluate_vgh(einsplines[i], u[0], u[1], u[2], psi[i].data(), grad[i].data(), hess[i].data(), |
208: nSplinesPerBlock); |
209: } |
210: |
211: inline void evaluate(const ParticleSet& P, |
[...] |
219: for (int i = 0; i < nBlocks; ++i) |
220: { |
221: // in real simulation, phase needs to be applied. Here just fake computation |
222: const int first = i * nBlocks; |
223: for (int j = first; j < std::min((i + 1) * nSplinesPerBlock, OrbitalSetSize); j++) |
224: { |
225: psi_v[j] = psi[i][j - first]; |
226: dpsi_v[j] = grad[i][j - first]; |
227: d2psi_v[j] = hess[i].data(0)[j - first]; |
228: } |
229: } |
230: } |
/home/eoseret/qaas_runs_CPU_9468/171-143-7755/intel/miniqmc/build/miniqmc/src/Utilities/NewTimer.h: 242 - 249 |
-------------------------------------------------------------------------------- |
242: ScopeGuard(TIMER& t) : timer(t) { timer.start(); } |
[...] |
249: ~ScopeGuard() { timer.stop(); } |
/home/eoseret/qaas_runs_CPU_9468/171-143-7755/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/VectorSoAContainer.h: 231 - 271 |
-------------------------------------------------------------------------------- |
231: inline const AoSElement_t operator[](size_t i) const { return AoSElement_t(myData + i, nGhosts); } |
[...] |
265: inline T* data() { return myData; } |
[...] |
271: inline T* restrict data(size_t i) { return myData + i * nGhosts; } |
/home/eoseret/qaas_runs_CPU_9468/171-143-7755/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/OhmmsVector.h: 223 - 229 |
-------------------------------------------------------------------------------- |
223: return X[i]; |
[...] |
229: return X[i]; |
0x6ced0 PUSH %RBP |
0x6ced1 MOV %RSP,%RBP |
0x6ced4 PUSH %R15 |
0x6ced6 PUSH %R14 |
0x6ced8 PUSH %R13 |
0x6ceda MOVSXD %EDX,%R13 |
0x6cedd PUSH %R12 |
0x6cedf MOV %RSI,%R12 |
0x6cee2 PUSH %RBX |
0x6cee3 MOV %RDI,%RBX |
0x6cee6 SUB $0x88,%RSP |
0x6ceed MOV %RCX,-0x98(%RBP) |
0x6cef4 MOV 0x358(%RDI),%R15 |
0x6cefb MOV %R8,-0xa0(%RBP) |
0x6cf02 MOV %R9,-0xa8(%RBP) |
0x6cf09 MOV %R15,%RDI |
0x6cf0c CALL 8560 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE5startEv@plt> |
0x6cf11 LEA 0x48(%RBX),%RSI |
0x6cf15 LEA 0x128(%R12),%RDX |
0x6cf1d CMP 0x124(%R12),%R13D |
0x6cf25 JE 6cf35 |
0x6cf27 MOV 0x40(%R12),%RAX |
0x6cf2c LEA (%R13,%R13,2),%RDX |
0x6cf31 LEA (%RAX,%RDX,8),%RDX |
0x6cf35 LEA -0x50(%RBP),%RDI |
0x6cf39 CALL 13870 <_ZNK11qmcplusplus14CrystalLatticeIdLj3EE12toUnit_floorIdEENS_10TinyVectorIdLj3EEERKNS3_IT_Lj3EEE> |
0x6cf3e MOV 0x30(%RBX),%R9D |
0x6cf42 TEST %R9D,%R9D |
0x6cf45 JLE 6d046 |
0x6cf4b MOV -0x40(%RBP),%R14 |
0x6cf4f MOV -0x48(%RBP),%RCX |
0x6cf53 XOR %R12D,%R12D |
0x6cf56 VMOVSD -0x50(%RBP),%XMM3 |
0x6cf5b VMOVQ %R14,%XMM2 |
0x6cf60 VMOVQ %RCX,%XMM1 |
0x6cf65 VMOVSD %XMM3,-0x58(%RBP) |
(697) 0x6cf6a MOV 0x310(%RBX),%R11 |
(697) 0x6cf71 MOV 0x340(%RBX),%RDI |
(697) 0x6cf78 LEA (%R12,%R12,2),%R10 |
(697) 0x6cf7c LEA (%R12,%R12,4),%RSI |
(697) 0x6cf80 MOV 0x328(%RBX),%R8 |
(697) 0x6cf87 MOV 0x2f8(%RBX),%RAX |
(697) 0x6cf8e SAL $0x3,%RSI |
(697) 0x6cf92 LEA 0x1(%R12),%R14 |
(697) 0x6cf97 LEA (%R11,%R10,8),%R13 |
(697) 0x6cf9b MOV 0x18(%RDI,%RSI,1),%RCX |
(697) 0x6cfa0 VMOVSD -0x58(%RBP),%XMM0 |
(697) 0x6cfa5 VMOVSD %XMM2,-0x68(%RBP) |
(697) 0x6cfaa MOV 0x18(%R8,%RSI,1),%RDX |
(697) 0x6cfaf MOV (%RAX,%R12,8),%RDI |
(697) 0x6cfb3 VMOVSD %XMM1,-0x60(%RBP) |
(697) 0x6cfb8 MOV (%R13),%RSI |
(697) 0x6cfbc MOVSXD 0x40(%RBX),%R8 |
(697) 0x6cfc0 CALL 6c610 <_ZN16miniqmcreference19MultiBsplineEvalRef12evaluate_vghIdEEvPKN11qmcplusplus14bspline_traitsIT_Lj3EE10SplineTypeES4_S4_S4_PS4_S9_S9_m> |
(697) 0x6cfc5 CMP %R14D,0x30(%RBX) |
(697) 0x6cfc9 VMOVSD -0x60(%RBP),%XMM1 |
(697) 0x6cfce VMOVSD -0x68(%RBP),%XMM2 |
(697) 0x6cfd3 JLE 6d046 |
(697) 0x6cfd5 MOV 0x328(%RBX),%RSI |
(697) 0x6cfdc MOV 0x310(%RBX),%RDI |
(697) 0x6cfe3 LEA (%R14,%R14,4),%RDX |
(697) 0x6cfe7 LEA (%R14,%R14,2),%R8 |
(697) 0x6cfeb SAL $0x3,%RDX |
(697) 0x6cfef MOV 0x340(%RBX),%R9 |
(697) 0x6cff6 MOV 0x2f8(%RBX),%R13 |
(697) 0x6cffd ADD $0x2,%R12 |
(697) 0x6d001 LEA (%RDI,%R8,8),%R11 |
(697) 0x6d005 MOV 0x18(%RSI,%RDX,1),%R10 |
(697) 0x6d00a MOVSXD 0x40(%RBX),%R8 |
(697) 0x6d00e VMOVSD %XMM2,-0x68(%RBP) |
(697) 0x6d013 MOV 0x18(%R9,%RDX,1),%RCX |
(697) 0x6d018 MOV (%R11),%RSI |
(697) 0x6d01b VMOVSD %XMM1,-0x60(%RBP) |
(697) 0x6d020 MOV (%R13,%R14,8),%RDI |
(697) 0x6d025 VMOVSD -0x58(%RBP),%XMM0 |
(697) 0x6d02a MOV %R10,%RDX |
(697) 0x6d02d CALL 6c610 <_ZN16miniqmcreference19MultiBsplineEvalRef12evaluate_vghIdEEvPKN11qmcplusplus14bspline_traitsIT_Lj3EE10SplineTypeES4_S4_S4_PS4_S9_S9_m> |
(697) 0x6d032 CMP %R12D,0x30(%RBX) |
(697) 0x6d036 VMOVSD -0x60(%RBP),%XMM1 |
(697) 0x6d03b VMOVSD -0x68(%RBP),%XMM2 |
(697) 0x6d040 JG 6cf6a |
0x6d046 MOV %R15,%RDI |
0x6d049 CALL 8460 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE4stopEv@plt> |
0x6d04e MOV 0x30(%RBX),%R15D |
0x6d052 MOV %R15D,-0x74(%RBP) |
0x6d056 TEST %R15D,%R15D |
0x6d059 JLE 6d326 |
0x6d05f MOVSXD -0x74(%RBP),%RAX |
0x6d063 MOV 0x40(%RBX),%R12D |
0x6d067 MOVQ $0,-0x68(%RBP) |
0x6d06f XOR %R15D,%R15D |
0x6d072 MOV 0x8(%RBX),%ECX |
0x6d075 MOVQ $0,-0x70(%RBP) |
0x6d07d LEA (%RAX,%RAX,2),%RDX |
0x6d081 MOV %R12D,-0x84(%RBP) |
0x6d088 LEA (,%RAX,8),%R14 |
0x6d090 SAL $0x3,%RDX |
0x6d094 MOV %ECX,-0x78(%RBP) |
0x6d097 MOV %RDX,-0x90(%RBP) |
0x6d09e MOV %R12D,-0x60(%RBP) |
0x6d0a2 MOVL $0,-0x58(%RBP) |
0x6d0a9 MOV %R14,-0x80(%RBP) |
0x6d0ad XOR %R14D,%R14D |
(695) 0x6d0b0 MOV -0x60(%RBP),%R9D |
(695) 0x6d0b4 MOV -0x78(%RBP),%R12D |
(695) 0x6d0b8 CMP %R12D,%R9D |
(695) 0x6d0bb CMOVLE %R9D,%R12D |
(695) 0x6d0bf CMP %R12D,-0x58(%RBP) |
(695) 0x6d0c3 JGE 6d2ef |
(695) 0x6d0c9 MOV 0x310(%RBX),%R10 |
(695) 0x6d0d0 MOV 0x328(%RBX),%R8 |
(695) 0x6d0d7 MOV 0x340(%RBX),%RDI |
(695) 0x6d0de MOV -0xa0(%RBP),%R13 |
(695) 0x6d0e5 MOV -0x58(%RBP),%EAX |
(695) 0x6d0e8 MOV (%R10,%R14,1),%R11 |
(695) 0x6d0ec ADD %R15,%R8 |
(695) 0x6d0ef MOV -0x68(%RBP),%RDX |
(695) 0x6d0f3 MOV -0x98(%RBP),%R10 |
(695) 0x6d0fa MOV 0x18(%R8),%RSI |
(695) 0x6d0fe MOVSXD 0x8(%R8),%RCX |
(695) 0x6d102 SUB %EAX,%R12D |
(695) 0x6d105 XOR %EAX,%EAX |
(695) 0x6d107 MOV 0x18(%RDI,%R15,1),%R8 |
(695) 0x6d10c MOV 0x18(%R10),%R10 |
(695) 0x6d110 SAL $0x3,%R12 |
(695) 0x6d114 MOV -0x70(%RBP),%RDI |
(695) 0x6d118 ADD 0x18(%R13),%RDX |
(695) 0x6d11c LEA (%RSI,%RCX,8),%R9 |
(695) 0x6d120 SAL $0x4,%RCX |
(695) 0x6d124 MOV -0xa8(%RBP),%R13 |
(695) 0x6d12b ADD %RSI,%RCX |
(695) 0x6d12e ADD %RDI,%R10 |
(695) 0x6d131 ADD 0x18(%R13),%RDI |
(695) 0x6d135 LEA -0x8(%R12),%R13 |
(695) 0x6d13a SHR $0x3,%R13 |
(695) 0x6d13e INC %R13 |
(695) 0x6d141 AND $0x3,%R13D |
(695) 0x6d145 JE 6d205 |
(695) 0x6d14b CMP $0x1,%R13 |
(695) 0x6d14f JE 6d1c3 |
(695) 0x6d151 CMP $0x2,%R13 |
(695) 0x6d155 JE 6d18a |
(695) 0x6d157 VMOVSD (%R11),%XMM0 |
(695) 0x6d15c ADD $0x18,%RDX |
(695) 0x6d160 MOV $0x8,%EAX |
(695) 0x6d165 VMOVSD %XMM0,(%R10) |
(695) 0x6d16a VMOVSD (%RSI),%XMM2 |
(695) 0x6d16e VMOVSD (%RCX),%XMM1 |
(695) 0x6d172 VMOVHPD (%R9),%XMM2,%XMM4 |
(695) 0x6d177 VMOVSD %XMM1,-0x8(%RDX) |
(695) 0x6d17c VMOVUPD %XMM4,-0x18(%RDX) |
(695) 0x6d181 VMOVSD (%R8),%XMM5 |
(695) 0x6d186 VMOVSD %XMM5,(%RDI) |
(695) 0x6d18a VMOVSD (%R11,%RAX,1),%XMM6 |
(695) 0x6d190 ADD $0x18,%RDX |
(695) 0x6d194 VMOVSD %XMM6,(%R10,%RAX,1) |
(695) 0x6d19a VMOVSD (%RSI,%RAX,1),%XMM8 |
(695) 0x6d19f VMOVSD (%RCX,%RAX,1),%XMM7 |
(695) 0x6d1a4 VMOVHPD (%R9,%RAX,1),%XMM8,%XMM9 |
(695) 0x6d1aa VMOVSD %XMM7,-0x8(%RDX) |
(695) 0x6d1af VMOVUPD %XMM9,-0x18(%RDX) |
(695) 0x6d1b4 VMOVSD (%R8,%RAX,1),%XMM10 |
(695) 0x6d1ba VMOVSD %XMM10,(%RDI,%RAX,1) |
(695) 0x6d1bf ADD $0x8,%RAX |
(695) 0x6d1c3 VMOVSD (%R11,%RAX,1),%XMM11 |
(695) 0x6d1c9 ADD $0x18,%RDX |
(695) 0x6d1cd VMOVSD %XMM11,(%R10,%RAX,1) |
(695) 0x6d1d3 VMOVSD (%RSI,%RAX,1),%XMM13 |
(695) 0x6d1d8 VMOVSD (%RCX,%RAX,1),%XMM12 |
(695) 0x6d1dd VMOVHPD (%R9,%RAX,1),%XMM13,%XMM14 |
(695) 0x6d1e3 VMOVSD %XMM12,-0x8(%RDX) |
(695) 0x6d1e8 VMOVUPD %XMM14,-0x18(%RDX) |
(695) 0x6d1ed VMOVSD (%R8,%RAX,1),%XMM15 |
(695) 0x6d1f3 VMOVSD %XMM15,(%RDI,%RAX,1) |
(695) 0x6d1f8 ADD $0x8,%RAX |
(695) 0x6d1fc CMP %RAX,%R12 |
(695) 0x6d1ff JE 6d2ef |
(696) 0x6d205 VMOVSD (%R11,%RAX,1),%XMM3 |
(696) 0x6d20b ADD $0x60,%RDX |
(696) 0x6d20f VMOVSD %XMM3,(%R10,%RAX,1) |
(696) 0x6d215 VMOVSD (%RSI,%RAX,1),%XMM0 |
(696) 0x6d21a VMOVSD (%RCX,%RAX,1),%XMM1 |
(696) 0x6d21f VMOVHPD (%R9,%RAX,1),%XMM0,%XMM2 |
(696) 0x6d225 VMOVSD %XMM1,-0x50(%RDX) |
(696) 0x6d22a VMOVUPD %XMM2,-0x60(%RDX) |
(696) 0x6d22f VMOVSD (%R8,%RAX,1),%XMM4 |
(696) 0x6d235 VMOVSD %XMM4,(%RDI,%RAX,1) |
(696) 0x6d23a VMOVSD 0x8(%R11,%RAX,1),%XMM5 |
(696) 0x6d241 VMOVSD %XMM5,0x8(%RAX,%R10,1) |
(696) 0x6d248 VMOVSD 0x8(%RSI,%RAX,1),%XMM7 |
(696) 0x6d24e VMOVSD 0x8(%RCX,%RAX,1),%XMM6 |
(696) 0x6d254 VMOVHPD 0x8(%R9,%RAX,1),%XMM7,%XMM8 |
(696) 0x6d25b VMOVSD %XMM6,-0x38(%RDX) |
(696) 0x6d260 VMOVUPD %XMM8,-0x48(%RDX) |
(696) 0x6d265 VMOVSD 0x8(%R8,%RAX,1),%XMM9 |
(696) 0x6d26c VMOVSD %XMM9,0x8(%RAX,%RDI,1) |
(696) 0x6d272 VMOVSD 0x10(%R11,%RAX,1),%XMM10 |
(696) 0x6d279 VMOVSD %XMM10,0x10(%RAX,%R10,1) |
(696) 0x6d280 VMOVSD 0x10(%RSI,%RAX,1),%XMM12 |
(696) 0x6d286 VMOVSD 0x10(%RCX,%RAX,1),%XMM11 |
(696) 0x6d28c VMOVHPD 0x10(%R9,%RAX,1),%XMM12,%XMM13 |
(696) 0x6d293 VMOVSD %XMM11,-0x20(%RDX) |
(696) 0x6d298 VMOVUPD %XMM13,-0x30(%RDX) |
(696) 0x6d29d VMOVSD 0x10(%R8,%RAX,1),%XMM14 |
(696) 0x6d2a4 VMOVSD %XMM14,0x10(%RAX,%RDI,1) |
(696) 0x6d2aa VMOVSD 0x18(%R11,%RAX,1),%XMM15 |
(696) 0x6d2b1 VMOVSD %XMM15,0x18(%RAX,%R10,1) |
(696) 0x6d2b8 VMOVSD 0x18(%RSI,%RAX,1),%XMM1 |
(696) 0x6d2be VMOVSD 0x18(%RCX,%RAX,1),%XMM3 |
(696) 0x6d2c4 VMOVHPD 0x18(%R9,%RAX,1),%XMM1,%XMM0 |
(696) 0x6d2cb VMOVUPD %XMM0,-0x18(%RDX) |
(696) 0x6d2d0 VMOVSD %XMM3,-0x8(%RDX) |
(696) 0x6d2d5 VMOVSD 0x18(%R8,%RAX,1),%XMM2 |
(696) 0x6d2dc ADD $0x20,%RAX |
(696) 0x6d2e0 VMOVSD %XMM2,-0x8(%RAX,%RDI,1) |
(696) 0x6d2e6 CMP %RAX,%R12 |
(696) 0x6d2e9 JNE 6d205 |
(695) 0x6d2ef MOV -0x84(%RBP),%R12D |
(695) 0x6d2f6 MOV -0x74(%RBP),%R11D |
(695) 0x6d2fa ADD $0x18,%R14 |
(695) 0x6d2fe ADD $0x28,%R15 |
(695) 0x6d302 MOV -0x80(%RBP),%RSI |
(695) 0x6d306 MOV -0x90(%RBP),%RCX |
(695) 0x6d30d ADD %R12D,-0x60(%RBP) |
(695) 0x6d311 ADD %R11D,-0x58(%RBP) |
(695) 0x6d315 ADD %RSI,-0x70(%RBP) |
(695) 0x6d319 ADD %RCX,-0x68(%RBP) |
(695) 0x6d31d CMP %R14,%RCX |
(695) 0x6d320 JNE 6d0b0 |
0x6d326 ADD $0x88,%RSP |
0x6d32d POP %RBX |
0x6d32e POP %R12 |
0x6d330 POP %R13 |
0x6d332 POP %R14 |
0x6d334 POP %R15 |
0x6d336 POP %RBP |
0x6d337 RET |
0x6d338 NOPL (%RAX,%RAX,1) |
Path / |
Source file and lines | einspline_spo_ref.hpp:203-230 |
Module | libqmcwfs.so |
nb instructions | 67 |
nb uops | 70 |
loop length | 286 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 15 |
micro-operation queue | 11.67 cycles |
front end | 11.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 2.70 | 2.67 | 6.00 | 6.00 | 11.00 | 2.60 | 2.50 | 11.00 | 11.00 | 11.00 | 2.53 | 6.00 |
cycles | 2.70 | 2.67 | 6.00 | 6.00 | 11.00 | 2.60 | 2.50 | 11.00 | 11.00 | 11.00 | 2.53 | 6.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 11.27-11.28 |
Stall cycles | 0.00 |
Front-end | 11.67 |
Dispatch | 11.00 |
Overall L1 | 11.67 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 0% |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 8% |
load | 8% |
store | 8% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 8% |
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 9% |
load | 9% |
store | 9% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 8% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOVSXD %EDX,%R13 | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSI,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB $0x88,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x358(%RDI),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R8,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 8560 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE5startEv@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x48(%RBX),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x128(%R12),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP 0x124(%R12),%R13D | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 6cf35 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0x65> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x40(%R12),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R13,%R13,2),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RAX,%RDX,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x50(%RBP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 13870 <_ZNK11qmcplusplus14CrystalLatticeIdLj3EE12toUnit_floorIdEENS_10TinyVectorIdLj3EEERKNS3_IT_Lj3EEE> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x30(%RBX),%R9D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R9D,%R9D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 6d046 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0x176> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x40(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x48(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
XOR %R12D,%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD -0x50(%RBP),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVQ %R14,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VMOVQ %RCX,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VMOVSD %XMM3,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 8460 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE4stopEv@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x30(%RBX),%R15D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15D,-0x74(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %R15D,%R15D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 6d326 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0x456> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVSXD -0x74(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x40(%RBX),%R12D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %R15D,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x8(%RBX),%ECX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%RAX,%RAX,2),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R12D,-0x84(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (,%RAX,8),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %ECX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R12D,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVL $0,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %R14D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD $0x88,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | einspline_spo_ref.hpp:203-230 |
Module | libqmcwfs.so |
nb instructions | 67 |
nb uops | 70 |
loop length | 286 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 15 |
micro-operation queue | 11.67 cycles |
front end | 11.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 2.70 | 2.67 | 6.00 | 6.00 | 11.00 | 2.60 | 2.50 | 11.00 | 11.00 | 11.00 | 2.53 | 6.00 |
cycles | 2.70 | 2.67 | 6.00 | 6.00 | 11.00 | 2.60 | 2.50 | 11.00 | 11.00 | 11.00 | 2.53 | 6.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 11.27-11.28 |
Stall cycles | 0.00 |
Front-end | 11.67 |
Dispatch | 11.00 |
Overall L1 | 11.67 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 0% |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 8% |
load | 8% |
store | 8% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 8% |
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 9% |
load | 9% |
store | 9% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 8% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOVSXD %EDX,%R13 | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSI,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB $0x88,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x358(%RDI),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R8,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 8560 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE5startEv@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x48(%RBX),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x128(%R12),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP 0x124(%R12),%R13D | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 6cf35 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0x65> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x40(%R12),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R13,%R13,2),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RAX,%RDX,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x50(%RBP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 13870 <_ZNK11qmcplusplus14CrystalLatticeIdLj3EE12toUnit_floorIdEENS_10TinyVectorIdLj3EEERKNS3_IT_Lj3EEE> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x30(%RBX),%R9D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R9D,%R9D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 6d046 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0x176> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x40(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x48(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
XOR %R12D,%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD -0x50(%RBP),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVQ %R14,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VMOVQ %RCX,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VMOVSD %XMM3,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 8460 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE4stopEv@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x30(%RBX),%R15D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15D,-0x74(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %R15D,%R15D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 6d326 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_+0x456> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVSXD -0x74(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x40(%RBX),%R12D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %R15D,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x8(%RBX),%ECX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%RAX,%RAX,2),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R12D,-0x84(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (,%RAX,8),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %ECX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R12D,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVL $0,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %R14D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD $0x88,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEERNS6_INS2_10TinyVectorIdLj3EEESaISB_EEES9_– | 0.99 | 0.98 |
○Loop 697 - einspline_spo_ref.hpp:206-207 - libqmcwfs.so | 0 | 0.01 |
▼Loop 695 - einspline_spo_ref.hpp:219-227 - libqmcwfs.so– | 0 | 0.01 |
○Loop 696 - einspline_spo_ref.hpp:223-227 - libqmcwfs.so | 0.98 | 0.82 |