Function: _ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6 ... | Module: libqmcwfs.so | Source: einspline_spo_ref.hpp:172-189 [...] | Coverage: 21.07% |
---|
Function: _ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6 ... | Module: libqmcwfs.so | Source: einspline_spo_ref.hpp:172-189 [...] | Coverage: 21.07% |
---|
/home/eoseret/qaas_runs_CPU_9468/171-143-7755/intel/miniqmc/build/miniqmc/src/Numerics/Spline2/MultiBsplineData.hpp: 54 - 57 |
-------------------------------------------------------------------------------- |
54: a[0] = ((A00 * tx + A01) * tx + A02) * tx + A03; |
55: a[1] = ((A10 * tx + A11) * tx + A12) * tx + A13; |
56: a[2] = ((A20 * tx + A21) * tx + A22) * tx + A23; |
57: a[3] = ((A30 * tx + A31) * tx + A32) * tx + A33; |
/cluster/comp/gcc/13.2.0/include/c++/13.2.0/bits/stl_algo.h: 731 - 757 |
-------------------------------------------------------------------------------- |
731: { return std::copy(__first, __first + __n, __result); } |
[...] |
757: if (__n2 <= 0) |
/cluster/comp/gcc/13.2.0/include/c++/13.2.0/bits/stl_vector.h: 1258 - 1258 |
-------------------------------------------------------------------------------- |
1258: { return _M_data_ptr(this->_M_impl._M_start); } |
/home/eoseret/qaas_runs_CPU_9468/171-143-7755/intel/miniqmc/build/miniqmc/src/Numerics/Spline2/MultiBsplineEvalHelper.hpp: 53 - 63 |
-------------------------------------------------------------------------------- |
53: if (x < 0) |
[...] |
60: ind = static_cast<int>(x); |
61: dx = x - ind; |
62: // upper bound |
63: if (ind > nmax) |
/home/eoseret/qaas_runs_CPU_9468/171-143-7755/intel/miniqmc/build/miniqmc/src/Particle/ParticleSet.h: 143 - 143 |
-------------------------------------------------------------------------------- |
143: return (active_ptcl_ == iat) ? active_pos_ : R[iat]; |
/cluster/comp/gcc/13.2.0/include/c++/13.2.0/bits/stl_algobase.h: 238 - 931 |
-------------------------------------------------------------------------------- |
238: if (__b < __a) |
[...] |
398: { *__to = *__from; } |
[...] |
436: if (__builtin_expect(_Num > 1, true)) |
437: __builtin_memmove(__result, __first, sizeof(_Tp) * _Num); |
[...] |
930: for (; __first != __last; ++__first) |
931: *__first = __tmp; |
/home/eoseret/qaas_runs_CPU_9468/171-143-7755/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/einspline_spo_ref.hpp: 172 - 189 |
-------------------------------------------------------------------------------- |
172: ScopedTimer local_timer(timer); |
173: |
174: auto u = Lattice.toUnit_floor(P.activeR(iat)); |
175: for (int i = 0; i < nBlocks; ++i) |
176: MultiBsplineEvalRef::evaluate_v(einsplines[i], u[0], u[1], u[2], psi[i].data(), nSplinesPerBlock); |
177: } |
178: |
179: inline void evaluate(const ParticleSet& P, int iat, ValueVector_t& psi_v) |
180: { |
181: evaluate_v(P, iat); |
182: |
183: for (int i = 0; i < nBlocks; ++i) |
184: { |
185: // in real simulation, phase needs to be applied. Here just fake computation |
186: const int first = i * nBlocks; |
187: std::copy_n(psi[i].data(), std::min((i + 1) * nSplinesPerBlock, OrbitalSetSize) - first, psi_v.data() + first); |
188: } |
189: } |
/home/eoseret/qaas_runs_CPU_9468/171-143-7755/intel/miniqmc/build/miniqmc/src/Utilities/NewTimer.h: 242 - 249 |
-------------------------------------------------------------------------------- |
242: ScopeGuard(TIMER& t) : timer(t) { timer.start(); } |
[...] |
249: ~ScopeGuard() { timer.stop(); } |
/home/eoseret/qaas_runs_CPU_9468/171-143-7755/intel/miniqmc/build/miniqmc/src/Numerics/Spline2/MultiBsplineRef.hpp: 42 - 71 |
-------------------------------------------------------------------------------- |
42: x -= spline_m->x_grid.start; |
43: y -= spline_m->y_grid.start; |
44: z -= spline_m->z_grid.start; |
45: T tx, ty, tz; |
46: int ix, iy, iz; |
47: spline2::getSplineBound(x * spline_m->x_grid.delta_inv, tx, ix, spline_m->x_grid.num - 1); |
48: spline2::getSplineBound(y * spline_m->y_grid.delta_inv, ty, iy, spline_m->y_grid.num - 1); |
49: spline2::getSplineBound(z * spline_m->z_grid.delta_inv, tz, iz, spline_m->z_grid.num - 1); |
[...] |
56: const intptr_t xs = spline_m->x_stride; |
57: const intptr_t ys = spline_m->y_stride; |
58: const intptr_t zs = spline_m->z_stride; |
59: |
60: constexpr T zero(0); |
61: std::fill(vals, vals + num_splines, zero); |
62: |
63: for (size_t i = 0; i < 4; i++) |
64: for (size_t j = 0; j < 4; j++) |
65: { |
66: const T pre00 = a[i] * b[j]; |
67: const T* restrict coefs = spline_m->coefs + (ix + i) * xs + (iy + j) * ys + iz * zs; |
68: for (size_t n = 0; n < num_splines; n++) |
69: vals[n] += pre00 * |
70: (c[0] * coefs[n] + c[1] * coefs[n + zs] + c[2] * coefs[n + 2 * zs] + |
71: c[3] * coefs[n + 3 * zs]); |
/home/eoseret/qaas_runs_CPU_9468/171-143-7755/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/OhmmsVector.h: 229 - 229 |
-------------------------------------------------------------------------------- |
229: return X[i]; |
0x6bc60 PUSH %RBP |
0x6bc61 MOV %RSP,%RBP |
0x6bc64 PUSH %R15 |
0x6bc66 MOVSXD %EDX,%R15 |
0x6bc69 PUSH %R14 |
0x6bc6b MOV %RSI,%R14 |
0x6bc6e PUSH %R13 |
0x6bc70 PUSH %R12 |
0x6bc72 MOV %RCX,%R12 |
0x6bc75 PUSH %RBX |
0x6bc76 MOV %RDI,%RBX |
0x6bc79 AND $-0x20,%RSP |
0x6bc7d SUB $0x160,%RSP |
0x6bc84 MOV 0x358(%RDI),%R13 |
0x6bc8b MOV %R13,%RDI |
0x6bc8e CALL 8560 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE5startEv@plt> |
0x6bc93 LEA 0x48(%RBX),%RSI |
0x6bc97 LEA 0x128(%R14),%RDX |
0x6bc9e CMP 0x124(%R14),%R15D |
0x6bca5 JE 6bcb3 |
0x6bca7 MOV 0x40(%R14),%RAX |
0x6bcab LEA (%R15,%R15,2),%RDX |
0x6bcaf LEA (%RAX,%RDX,8),%RDX |
0x6bcb3 LEA 0x100(%RSP),%RDI |
0x6bcbb CALL 13870 <_ZNK11qmcplusplus14CrystalLatticeIdLj3EE12toUnit_floorIdEENS_10TinyVectorIdLj3EEERKNS3_IT_Lj3EEE> |
0x6bcc0 MOVSXD 0x30(%RBX),%RSI |
0x6bcc4 TEST %ESI,%ESI |
0x6bcc6 JLE 6c4ce |
0x6bccc MOVSXD 0x40(%RBX),%RDI |
0x6bcd0 MOV 0x2f8(%RBX),%R10 |
0x6bcd7 MOV %R13,0x28(%RSP) |
0x6bcdc MOV 0x310(%RBX),%R9 |
0x6bce3 VMOVSD 0x110(%RSP),%XMM7 |
0x6bcec MOV %RBX,0x20(%RSP) |
0x6bcf1 MOV %RDI,%R15 |
0x6bcf4 LEA (,%RDI,8),%R8 |
0x6bcfc LEA -0x1(%RDI),%R14 |
0x6bd00 MOV %EDI,0x98(%RSP) |
0x6bd07 SHR $0x2,%R15 |
0x6bd0b MOV %RDI,0x78(%RSP) |
0x6bd10 LEA (%R10,%RSI,8),%R11 |
0x6bd14 AND $-0x4,%RDI |
0x6bd18 SAL $0x5,%R15 |
0x6bd1c VMOVSD 0x108(%RSP),%XMM4 |
0x6bd25 VMOVSD 0x100(%RSP),%XMM0 |
0x6bd2e MOV %R8,0x58(%RSP) |
0x6bd33 MOV %R9,0x50(%RSP) |
0x6bd38 MOV %R10,0x60(%RSP) |
0x6bd3d MOV %R11,0x30(%RSP) |
0x6bd42 MOV %R14,0xa0(%RSP) |
0x6bd4a MOV %R15,0xf0(%RSP) |
0x6bd52 MOV %RDI,0x70(%RSP) |
0x6bd57 MOV %R12,0x18(%RSP) |
0x6bd5c VMOVSD %XMM7,0x48(%RSP) |
0x6bd62 VMOVSD %XMM4,0x40(%RSP) |
0x6bd68 VMOVSD %XMM0,0x38(%RSP) |
(687) 0x6bd6e MOV 0x60(%RSP),%R12 |
(687) 0x6bd73 VMOVSD 0x38(%RSP),%XMM5 |
(687) 0x6bd79 VXORPD %XMM9,%XMM9,%XMM9 |
(687) 0x6bd7e MOV 0x50(%RSP),%RBX |
(687) 0x6bd83 VMOVSD 0x40(%RSP),%XMM1 |
(687) 0x6bd89 MOV (%R12),%RCX |
(687) 0x6bd8d VMOVSD 0x48(%RSP),%XMM2 |
(687) 0x6bd93 MOV (%RBX),%R15 |
(687) 0x6bd96 VSUBSD 0x28(%RCX),%XMM5,%XMM6 |
(687) 0x6bd9b VSUBSD 0x50(%RCX),%XMM1,%XMM10 |
(687) 0x6bda0 VSUBSD 0x78(%RCX),%XMM2,%XMM3 |
(687) 0x6bda5 MOV 0x38(%RCX),%EAX |
(687) 0x6bda8 VMULSD 0x48(%RCX),%XMM6,%XMM8 |
(687) 0x6bdad VCOMISD %XMM8,%XMM9 |
(687) 0x6bdb2 JA 6c593 |
(687) 0x6bdb8 VCVTTSD2SI %XMM8,%R13D |
(687) 0x6bdbd DEC %EAX |
(687) 0x6bdbf CMP %R13D,%EAX |
(687) 0x6bdc2 JL 6c5bc |
(687) 0x6bdc8 VRNDSCALESD $0xb,%XMM8,%XMM8,%XMM11 |
(687) 0x6bdcf VSUBSD %XMM11,%XMM8,%XMM12 |
(687) 0x6bdd4 VMOVSD 0x1b884(%RIP),%XMM14 |
(687) 0x6bddc VMOVSD 0x1beac(%RIP),%XMM7 |
(687) 0x6bde4 MOVSXD %R13D,%RDX |
(687) 0x6bde7 MOV %RDX,0xf8(%RSP) |
(687) 0x6bdef VMULSD %XMM14,%XMM12,%XMM15 |
(687) 0x6bdf4 VMOVSD %XMM12,%XMM12,%XMM1 |
(687) 0x6bdf8 VMOVSD %XMM12,%XMM12,%XMM0 |
(687) 0x6bdfc VFNMADD132SD %XMM7,%XMM7,%XMM1 |
(687) 0x6be01 VFMADD213SD 0x1ba06(%RIP),%XMM7,%XMM0 |
(687) 0x6be0a VMULSD %XMM12,%XMM12,%XMM13 |
(687) 0x6be0f VSUBSD %XMM15,%XMM7,%XMM4 |
(687) 0x6be14 VFMADD231SD %XMM1,%XMM12,%XMM7 |
(687) 0x6be19 VMULSD %XMM13,%XMM15,%XMM2 |
(687) 0x6be1e VFMADD213SD 0x1b841(%RIP),%XMM13,%XMM0 |
(687) 0x6be27 VFMADD213SD 0x1c350(%RIP),%XMM12,%XMM4 |
(687) 0x6be30 VFMADD132SD %XMM12,%XMM14,%XMM4 |
(687) 0x6be35 VFMADD132SD %XMM7,%XMM14,%XMM12 |
(687) 0x6be3a VUNPCKLPD %XMM0,%XMM4,%XMM6 |
(687) 0x6be3e VUNPCKLPD %XMM2,%XMM12,%XMM5 |
(687) 0x6be42 VINSERTF128 $0x1,%XMM5,%YMM6,%YMM11 |
(687) 0x6be48 VMULSD 0x70(%RCX),%XMM10,%XMM10 |
(687) 0x6be4d VXORPD %XMM8,%XMM8,%XMM8 |
(687) 0x6be52 MOV 0x60(%RCX),%ESI |
(687) 0x6be55 VCOMISD %XMM10,%XMM8 |
(687) 0x6be5a JA 6c583 |
(687) 0x6be60 VCVTTSD2SI %XMM10,%EDI |
(687) 0x6be65 DEC %ESI |
(687) 0x6be67 CMP %EDI,%ESI |
(687) 0x6be69 JL 6c5ac |
(687) 0x6be6f VRNDSCALESD $0xb,%XMM10,%XMM10,%XMM9 |
(687) 0x6be76 VSUBSD %XMM9,%XMM10,%XMM12 |
(687) 0x6be7b VMOVSD 0x1be0d(%RIP),%XMM14 |
(687) 0x6be83 VMOVSD 0x1b7d5(%RIP),%XMM4 |
(687) 0x6be8b MOVSXD %EDI,%R13 |
(687) 0x6be8e VMULSD 0x1b972(%RIP),%XMM12,%XMM13 |
(687) 0x6be96 VMOVSD %XMM12,%XMM12,%XMM7 |
(687) 0x6be9a VMOVSD %XMM12,%XMM12,%XMM1 |
(687) 0x6be9e VFNMADD132SD %XMM14,%XMM14,%XMM7 |
(687) 0x6bea3 VFMADD213SD 0x1b964(%RIP),%XMM14,%XMM1 |
(687) 0x6beac VMULSD %XMM12,%XMM12,%XMM2 |
(687) 0x6beb1 VADDSD %XMM14,%XMM13,%XMM15 |
(687) 0x6beb6 VXORPD 0x1b9c2(%RIP),%XMM13,%XMM0 |
(687) 0x6bebe VFMADD231SD %XMM7,%XMM12,%XMM14 |
(687) 0x6bec3 VMULSD %XMM2,%XMM0,%XMM5 |
(687) 0x6bec7 VFMADD213SD 0x1b798(%RIP),%XMM2,%XMM1 |
(687) 0x6bed0 VFMADD213SD 0x1c2a7(%RIP),%XMM12,%XMM15 |
(687) 0x6bed9 VFMADD132SD %XMM12,%XMM4,%XMM15 |
(687) 0x6bede VFMADD231SD %XMM14,%XMM12,%XMM4 |
(687) 0x6bee3 VUNPCKLPD %XMM1,%XMM15,%XMM10 |
(687) 0x6bee7 VUNPCKLPD %XMM5,%XMM4,%XMM6 |
(687) 0x6beeb VINSERTF128 $0x1,%XMM6,%YMM10,%YMM12 |
(687) 0x6bef1 VMULSD 0x98(%RCX),%XMM3,%XMM8 |
(687) 0x6bef9 VXORPD %XMM3,%XMM3,%XMM3 |
(687) 0x6befd MOV 0x88(%RCX),%EAX |
(687) 0x6bf03 VCOMISD %XMM8,%XMM3 |
(687) 0x6bf08 JA 6c556 |
(687) 0x6bf0e VCVTTSD2SI %XMM8,%R8D |
(687) 0x6bf13 DEC %EAX |
(687) 0x6bf15 CMP %R8D,%EAX |
(687) 0x6bf18 JL 6c5d3 |
(687) 0x6bf1e VRNDSCALESD $0xb,%XMM8,%XMM8,%XMM9 |
(687) 0x6bf25 VSUBSD %XMM9,%XMM8,%XMM3 |
(687) 0x6bf2a VMOVSD 0x1bd5e(%RIP),%XMM14 |
(687) 0x6bf32 VMOVSD 0x1b726(%RIP),%XMM15 |
(687) 0x6bf3a MOVSXD %R8D,%R9 |
(687) 0x6bf3d MOV %R9,0xe8(%RSP) |
(687) 0x6bf45 VMULSD 0x1b8bb(%RIP),%XMM3,%XMM13 |
(687) 0x6bf4d VMOVSD %XMM3,%XMM3,%XMM1 |
(687) 0x6bf51 VMOVSD %XMM3,%XMM3,%XMM6 |
(687) 0x6bf55 VFNMADD132SD %XMM14,%XMM14,%XMM1 |
(687) 0x6bf5a VFMADD213SD 0x1b8ad(%RIP),%XMM14,%XMM6 |
(687) 0x6bf63 VMULSD %XMM3,%XMM3,%XMM4 |
(687) 0x6bf67 VADDSD %XMM14,%XMM13,%XMM5 |
(687) 0x6bf6c VXORPD 0x1b90c(%RIP),%XMM13,%XMM2 |
(687) 0x6bf74 VFMADD231SD %XMM1,%XMM3,%XMM14 |
(687) 0x6bf79 VFMADD213SD 0x1b6e6(%RIP),%XMM4,%XMM6 |
(687) 0x6bf82 VMULSD %XMM4,%XMM2,%XMM4 |
(687) 0x6bf86 VFMADD213SD 0x1c1f1(%RIP),%XMM3,%XMM5 |
(687) 0x6bf8f VFMADD132SD %XMM3,%XMM15,%XMM5 |
(687) 0x6bf94 VFMADD132SD %XMM14,%XMM15,%XMM3 |
(687) 0x6bf99 CMPQ $0,0x58(%RSP) |
(687) 0x6bf9f MOV 0x10(%RCX),%RBX |
(687) 0x6bfa3 VMOVAPD %YMM11,0x120(%RSP) |
(687) 0x6bfac MOV 0x18(%RCX),%R12 |
(687) 0x6bfb0 MOV 0x20(%RCX),%R14 |
(687) 0x6bfb4 VMOVAPD %YMM12,0x140(%RSP) |
(687) 0x6bfbd JE 6c029 |
(687) 0x6bfbf MOV %RCX,0xe0(%RSP) |
(687) 0x6bfc7 MOV 0x58(%RSP),%RDX |
(687) 0x6bfcc XOR %ESI,%ESI |
(687) 0x6bfce MOV %R15,%RDI |
(687) 0x6bfd1 VMOVSD %XMM4,0xc0(%RSP) |
(687) 0x6bfda VMOVSD %XMM3,0xc8(%RSP) |
(687) 0x6bfe3 VMOVSD %XMM6,0xd0(%RSP) |
(687) 0x6bfec VMOVSD %XMM5,0xd8(%RSP) |
(687) 0x6bff5 VZEROUPPER |
(687) 0x6bff8 CALL 80e0 <memset@plt> |
(687) 0x6bffd MOV 0xe0(%RSP),%RCX |
(687) 0x6c005 VMOVSD 0xd8(%RSP),%XMM5 |
(687) 0x6c00e VMOVSD 0xd0(%RSP),%XMM6 |
(687) 0x6c017 VMOVSD 0xc8(%RSP),%XMM3 |
(687) 0x6c020 VMOVSD 0xc0(%RSP),%XMM4 |
(687) 0x6c029 MOV 0xe8(%RSP),%RAX |
(687) 0x6c031 MOV 0x8(%RCX),%RSI |
(687) 0x6c035 IMUL %R14,%RAX |
(687) 0x6c039 CMPQ $0,0x78(%RSP) |
(687) 0x6c03f JE 6c4a0 |
(687) 0x6c045 MOV 0xf8(%RSP),%RDX |
(687) 0x6c04d MOV %R13,%R8 |
(687) 0x6c050 LEA 0x1(%R13),%R13 |
(687) 0x6c054 MOV 0x98(%RSP),%ECX |
(687) 0x6c05b IMUL %R12,%R13 |
(687) 0x6c05f LEA 0x140(%RSP),%R11 |
(687) 0x6c067 MOV %R12,%R10 |
(687) 0x6c06a MOV %RBX,0x68(%RSP) |
(687) 0x6c06f IMUL %RBX,%RDX |
(687) 0x6c073 AND $0x3,%ECX |
(687) 0x6c076 MOV %R11,0xa8(%RSP) |
(687) 0x6c07e SAL $0x4,%R10 |
(687) 0x6c082 IMUL %R12,%R8 |
(687) 0x6c086 MOV %ECX,0x9c(%RSP) |
(687) 0x6c08d LEA (%R12,%R12,1),%R12 |
(687) 0x6c091 VBROADCASTSD %XMM5,%YMM10 |
(687) 0x6c096 MOV %R10,0xb0(%RSP) |
(687) 0x6c09e LEA 0x120(%RSP),%RDI |
(687) 0x6c0a6 VBROADCASTSD %XMM6,%YMM9 |
(687) 0x6c0ab VBROADCASTSD %XMM3,%YMM8 |
(687) 0x6c0b0 ADD %RDX,%R13 |
(687) 0x6c0b3 MOV %R12,0xb8(%RSP) |
(687) 0x6c0bb VBROADCASTSD %XMM4,%YMM7 |
(687) 0x6c0c0 MOV %R15,%R12 |
(687) 0x6c0c3 LEA (%R13,%RAX,1),%R9 |
(687) 0x6c0c8 ADD %RDX,%R8 |
(687) 0x6c0cb LEA (,%R14,8),%R13 |
(687) 0x6c0d3 MOV %RSI,%R15 |
(687) 0x6c0d6 LEA (%R8,%RAX,1),%R8 |
(687) 0x6c0da MOV %R9,%R10 |
(689) 0x6c0dd MOV 0xa8(%RSP),%R9 |
(689) 0x6c0e5 MOV %R10,0xe8(%RSP) |
(689) 0x6c0ed LEA 0x160(%RSP),%RBX |
(689) 0x6c0f5 LEA (%R15,%R8,8),%RCX |
(689) 0x6c0f9 MOV %R8,0xf8(%RSP) |
(689) 0x6c101 VMOVSD (%RDI),%XMM19 |
(689) 0x6c107 LEA (%R15,%R10,8),%RDX |
(689) 0x6c10b VMOVDDUP %XMM5,%XMM15 |
(689) 0x6c10f MOV %R10,0x90(%RSP) |
(689) 0x6c117 VMOVDDUP %XMM6,%XMM14 |
(689) 0x6c11b VMOVDDUP %XMM3,%XMM13 |
(689) 0x6c11f VMOVDDUP %XMM4,%XMM12 |
(689) 0x6c123 MOV %R8,0x88(%RSP) |
(689) 0x6c12b MOV %RDI,0x80(%RSP) |
(689) 0x6c133 MOV %RBX,0xc0(%RSP) |
(689) 0x6c13b MOV %R15,%RBX |
(689) 0x6c13e MOV %R9,%R15 |
(688) 0x6c141 VMULSD (%R15),%XMM19,%XMM2 |
(688) 0x6c147 CMPQ $0x2,0xa0(%RSP) |
(688) 0x6c150 JBE 6c54f |
(688) 0x6c156 VMULSD 0x8(%R15),%XMM19,%XMM16 |
(688) 0x6c15d LEA (%RCX,%R13,1),%R9 |
(688) 0x6c161 LEA (%R13,%RDX,1),%RDI |
(688) 0x6c166 XOR %EAX,%EAX |
(688) 0x6c168 LEA (%R13,%R9,1),%R8 |
(688) 0x6c16d LEA (%R13,%RDI,1),%RSI |
(688) 0x6c172 VBROADCASTSD %XMM2,%YMM17 |
(688) 0x6c178 LEA (%R8,%R13,1),%R11 |
(688) 0x6c17c LEA (%R13,%RSI,1),%R10 |
(688) 0x6c181 VBROADCASTSD %XMM16,%YMM20 |
(688) 0x6c187 TESTB $0x20,0xf0(%RSP) |
(688) 0x6c18f JE 6c1f0 |
(688) 0x6c191 VMULPD (%R9),%YMM9,%YMM11 |
(688) 0x6c196 CMPQ $0x20,0xf0(%RSP) |
(688) 0x6c19f MOV $0x20,%EAX |
(688) 0x6c1a4 VMULPD (%R11),%YMM7,%YMM0 |
(688) 0x6c1a9 VMULPD (%R10),%YMM7,%YMM18 |
(688) 0x6c1af VFMADD231PD (%RCX),%YMM10,%YMM11 |
(688) 0x6c1b4 VFMADD231PD (%R8),%YMM8,%YMM0 |
(688) 0x6c1b9 VFMADD231PD (%RSI),%YMM8,%YMM18 |
(688) 0x6c1bf VADDPD %YMM0,%YMM11,%YMM1 |
(688) 0x6c1c3 VMULPD (%RDI),%YMM9,%YMM11 |
(688) 0x6c1c7 VFMADD213PD (%R12),%YMM17,%YMM1 |
(688) 0x6c1ce VFMADD231PD (%RDX),%YMM10,%YMM11 |
(688) 0x6c1d3 VADDPD %YMM18,%YMM11,%YMM0 |
(688) 0x6c1d9 VFMADD132PD %YMM20,%YMM1,%YMM0 |
(688) 0x6c1df VMOVUPD %YMM0,(%R12) |
(688) 0x6c1e5 JE 6c2a9 |
(688) 0x6c1eb NOPL (%RAX,%RAX,1) |
(690) 0x6c1f0 VMULPD (%R9,%RAX,1),%YMM9,%YMM1 |
(690) 0x6c1f6 VMULPD (%R11,%RAX,1),%YMM7,%YMM11 |
(690) 0x6c1fc VMULPD (%RDI,%RAX,1),%YMM9,%YMM0 |
(690) 0x6c201 VMULPD (%R10,%RAX,1),%YMM7,%YMM21 |
(690) 0x6c208 VMULPD 0x20(%R10,%RAX,1),%YMM7,%YMM22 |
(690) 0x6c210 VFMADD231PD (%RCX,%RAX,1),%YMM10,%YMM1 |
(690) 0x6c216 VFMADD231PD (%R8,%RAX,1),%YMM8,%YMM11 |
(690) 0x6c21c VFMADD231PD (%RDX,%RAX,1),%YMM10,%YMM0 |
(690) 0x6c222 VFMADD231PD (%RSI,%RAX,1),%YMM8,%YMM21 |
(690) 0x6c229 VFMADD231PD 0x20(%RAX,%RSI,1),%YMM8,%YMM22 |
(690) 0x6c231 VADDPD %YMM11,%YMM1,%YMM1 |
(690) 0x6c236 VADDPD %YMM21,%YMM0,%YMM11 |
(690) 0x6c23c VMULPD 0x20(%R11,%RAX,1),%YMM7,%YMM0 |
(690) 0x6c243 VFMADD213PD (%R12,%RAX,1),%YMM17,%YMM1 |
(690) 0x6c24a VFMADD231PD 0x20(%R8,%RAX,1),%YMM8,%YMM0 |
(690) 0x6c251 VFMADD132PD %YMM20,%YMM1,%YMM11 |
(690) 0x6c257 VMULPD 0x20(%R9,%RAX,1),%YMM9,%YMM1 |
(690) 0x6c25e VMOVUPD %YMM11,(%R12,%RAX,1) |
(690) 0x6c264 VFMADD231PD 0x20(%RCX,%RAX,1),%YMM10,%YMM1 |
(690) 0x6c26b VADDPD %YMM0,%YMM1,%YMM11 |
(690) 0x6c26f VMULPD 0x20(%RAX,%RDI,1),%YMM9,%YMM1 |
(690) 0x6c275 VFMADD213PD 0x20(%R12,%RAX,1),%YMM17,%YMM11 |
(690) 0x6c27d VFMADD231PD 0x20(%RDX,%RAX,1),%YMM10,%YMM1 |
(690) 0x6c284 VADDPD %YMM22,%YMM1,%YMM0 |
(690) 0x6c28a VFMADD132PD %YMM20,%YMM11,%YMM0 |
(690) 0x6c290 VMOVUPD %YMM0,0x20(%R12,%RAX,1) |
(690) 0x6c297 ADD $0x40,%RAX |
(690) 0x6c29b CMP %RAX,0xf0(%RSP) |
(690) 0x6c2a3 JNE 6c1f0 |
(688) 0x6c2a9 MOV 0x9c(%RSP),%R9D |
(688) 0x6c2b1 TEST %R9D,%R9D |
(688) 0x6c2b4 JE 6c430 |
(688) 0x6c2ba MOV 0x70(%RSP),%RAX |
(688) 0x6c2bf MOV 0x78(%RSP),%R8 |
(688) 0x6c2c4 SUB %RAX,%R8 |
(688) 0x6c2c7 MOV %R8,0xc8(%RSP) |
(688) 0x6c2cf CMP $0x1,%R8 |
(688) 0x6c2d3 JE 6c3d3 |
(688) 0x6c2d9 MOV 0xf8(%RSP),%R11 |
(688) 0x6c2e1 LEA (%R12,%RAX,8),%R9 |
(688) 0x6c2e5 VMOVDDUP %XMM2,%XMM11 |
(688) 0x6c2e9 LEA (%R11,%R14,1),%R8 |
(688) 0x6c2ed LEA (%R14,%R8,1),%RDI |
(688) 0x6c2f1 ADD %RAX,%R8 |
(688) 0x6c2f4 LEA (%RDI,%RAX,1),%RSI |
(688) 0x6c2f8 VMULPD (%RBX,%R8,8),%XMM14,%XMM1 |
(688) 0x6c2fe ADD %R14,%RDI |
(688) 0x6c301 LEA (%RDI,%RAX,1),%R10 |
(688) 0x6c305 MOV 0xe8(%RSP),%RDI |
(688) 0x6c30d MOV %RSI,0xe0(%RSP) |
(688) 0x6c315 MOV %R10,0xd8(%RSP) |
(688) 0x6c31d LEA (%RDI,%R14,1),%RSI |
(688) 0x6c321 MOV %RDI,%R11 |
(688) 0x6c324 LEA (%RAX,%RSI,1),%RDI |
(688) 0x6c328 ADD %R14,%RSI |
(688) 0x6c32b ADD %RAX,%R11 |
(688) 0x6c32e LEA (%RAX,%RSI,1),%R10 |
(688) 0x6c332 MOV 0xd8(%RSP),%R8 |
(688) 0x6c33a VMULPD (%RBX,%RDI,8),%XMM14,%XMM24 |
(688) 0x6c341 ADD %R14,%RSI |
(688) 0x6c344 ADD %RAX,%RSI |
(688) 0x6c347 MOV %RSI,0xd0(%RSP) |
(688) 0x6c34f VMULPD (%RBX,%R8,8),%XMM12,%XMM23 |
(688) 0x6c356 MOV 0xf8(%RSP),%RSI |
(688) 0x6c35e ADD %RAX,%RSI |
(688) 0x6c361 VFMADD231PD (%RBX,%R11,8),%XMM15,%XMM24 |
(688) 0x6c368 MOV 0xd0(%RSP),%R11 |
(688) 0x6c370 VFMADD231PD (%RBX,%RSI,8),%XMM15,%XMM1 |
(688) 0x6c376 MOV 0xe0(%RSP),%RSI |
(688) 0x6c37e VMULPD (%RBX,%R11,8),%XMM12,%XMM25 |
(688) 0x6c385 VFMADD231PD (%RBX,%RSI,8),%XMM13,%XMM23 |
(688) 0x6c38c VFMADD231PD (%RBX,%R10,8),%XMM13,%XMM25 |
(688) 0x6c393 VADDPD %XMM23,%XMM1,%XMM0 |
(688) 0x6c399 VFMADD213PD (%R9),%XMM11,%XMM0 |
(688) 0x6c39e VMULSD 0x8(%R15),%XMM19,%XMM11 |
(688) 0x6c3a5 VADDPD %XMM24,%XMM25,%XMM26 |
(688) 0x6c3ab VMOVDDUP %XMM11,%XMM1 |
(688) 0x6c3b0 VFMADD231PD %XMM26,%XMM1,%XMM0 |
(688) 0x6c3b6 VMOVUPD %XMM0,(%R9) |
(688) 0x6c3bb MOV 0xc8(%RSP),%R9 |
(688) 0x6c3c3 TEST $0x1,%R9B |
(688) 0x6c3c7 JE 6c430 |
(688) 0x6c3c9 MOV %R9,%RDI |
(688) 0x6c3cc AND $-0x2,%RDI |
(688) 0x6c3d0 ADD %RDI,%RAX |
(688) 0x6c3d3 LEA (%R14,%RAX,1),%R8 |
(688) 0x6c3d7 LEA (%R12,%RAX,8),%R10 |
(688) 0x6c3db LEA (%R14,%R8,1),%RSI |
(688) 0x6c3df LEA (%R14,%RSI,1),%R11 |
(688) 0x6c3e3 VMULSD (%RCX,%RSI,8),%XMM3,%XMM0 |
(688) 0x6c3e8 VMULSD (%RCX,%R11,8),%XMM4,%XMM11 |
(688) 0x6c3ee VFMADD231SD (%RCX,%R8,8),%XMM6,%XMM0 |
(688) 0x6c3f4 VFMADD231SD (%RCX,%RAX,8),%XMM5,%XMM11 |
(688) 0x6c3fa VADDSD %XMM11,%XMM0,%XMM1 |
(688) 0x6c3ff VMULSD (%RDX,%RSI,8),%XMM3,%XMM0 |
(688) 0x6c404 VMULSD 0x8(%R15),%XMM19,%XMM11 |
(688) 0x6c40b VFMADD213SD (%R10),%XMM1,%XMM2 |
(688) 0x6c410 VMULSD (%RDX,%R11,8),%XMM4,%XMM1 |
(688) 0x6c416 VFMADD231SD (%RDX,%R8,8),%XMM6,%XMM0 |
(688) 0x6c41c VFMADD231SD (%RDX,%RAX,8),%XMM5,%XMM1 |
(688) 0x6c422 VADDSD %XMM1,%XMM0,%XMM0 |
(688) 0x6c426 VFMADD231SD %XMM11,%XMM0,%XMM2 |
(688) 0x6c42b VMOVSD %XMM2,(%R10) |
(688) 0x6c430 MOV 0xb0(%RSP),%RAX |
(688) 0x6c438 MOV 0xb8(%RSP),%R9 |
(688) 0x6c440 ADD $0x10,%R15 |
(688) 0x6c444 ADD %R9,0xf8(%RSP) |
(688) 0x6c44c ADD %RAX,%RCX |
(688) 0x6c44f ADD %RAX,%RDX |
(688) 0x6c452 ADD %R9,0xe8(%RSP) |
(688) 0x6c45a CMP %R15,0xc0(%RSP) |
(688) 0x6c462 JNE 6c141 |
(689) 0x6c468 MOV 0x80(%RSP),%RDI |
(689) 0x6c470 MOV 0x68(%RSP),%RCX |
(689) 0x6c475 MOV %RBX,%R15 |
(689) 0x6c478 MOV 0x90(%RSP),%R10 |
(689) 0x6c480 MOV 0x88(%RSP),%R8 |
(689) 0x6c488 ADD $0x8,%RDI |
(689) 0x6c48c ADD %RCX,%R8 |
(689) 0x6c48f ADD %RCX,%R10 |
(689) 0x6c492 CMP %RDI,0xa8(%RSP) |
(689) 0x6c49a JNE 6c0dd |
(687) 0x6c4a0 ADDQ $0x8,0x60(%RSP) |
(687) 0x6c4a6 ADDQ $0x18,0x50(%RSP) |
(687) 0x6c4ac MOV 0x60(%RSP),%RDX |
(687) 0x6c4b1 CMP %RDX,0x30(%RSP) |
(687) 0x6c4b6 JNE 6bd6e |
0x6c4bc MOV 0x28(%RSP),%R13 |
0x6c4c1 MOV 0x20(%RSP),%RBX |
0x6c4c6 MOV 0x18(%RSP),%R12 |
0x6c4cb VZEROUPPER |
0x6c4ce MOV %R13,%RDI |
0x6c4d1 XOR %R14D,%R14D |
0x6c4d4 CALL 8460 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE4stopEv@plt> |
0x6c4d9 MOV 0x30(%RBX),%ECX |
0x6c4dc TEST %ECX,%ECX |
0x6c4de JLE 6c540 |
(686) 0x6c4e0 LEA 0x1(%R14),%EAX |
(686) 0x6c4e4 MOV 0x8(%RBX),%ESI |
(686) 0x6c4e7 MOV %ECX,%R11D |
(686) 0x6c4ea IMUL 0x40(%RBX),%EAX |
(686) 0x6c4ee IMUL %R14D,%R11D |
(686) 0x6c4f2 CMP %ESI,%EAX |
(686) 0x6c4f4 CMOVG %ESI,%EAX |
(686) 0x6c4f7 SUB %R11D,%EAX |
(686) 0x6c4fa TEST %EAX,%EAX |
(686) 0x6c4fc JLE 6c538 |
(686) 0x6c4fe MOV 0x310(%RBX),%R8 |
(686) 0x6c505 LEA (%R14,%R14,2),%R10 |
(686) 0x6c509 MOV 0x18(%R12),%R15 |
(686) 0x6c50e CLTQ |
(686) 0x6c510 MOVSXD %R11D,%R9 |
(686) 0x6c513 LEA (%R8,%R10,8),%RDX |
(686) 0x6c517 LEA (%R15,%R9,8),%RDI |
(686) 0x6c51b MOV (%RDX),%RSI |
(686) 0x6c51e LEA (,%RAX,8),%RDX |
(686) 0x6c526 CMP $0x8,%RDX |
(686) 0x6c52a JE 6c602 |
(686) 0x6c530 CALL 8090 <memmove@plt> |
(686) 0x6c535 MOV 0x30(%RBX),%ECX |
(686) 0x6c538 INC %R14 |
(686) 0x6c53b CMP %R14D,%ECX |
(686) 0x6c53e JG 6c4e0 |
0x6c540 LEA -0x28(%RBP),%RSP |
0x6c544 POP %RBX |
0x6c545 POP %R12 |
0x6c547 POP %R13 |
0x6c549 POP %R14 |
0x6c54b POP %R15 |
0x6c54d POP %RBP |
0x6c54e RET |
(688) 0x6c54f XOR %EAX,%EAX |
(688) 0x6c551 JMP 6c2bf |
(687) 0x6c556 VMOVSD 0x1b102(%RIP),%XMM3 |
(687) 0x6c55e MOV 0x1b103(%RIP),%R11 |
(687) 0x6c565 MOVQ $0,0xe8(%RSP) |
(687) 0x6c571 VXORPD %XMM4,%XMM4,%XMM4 |
(687) 0x6c575 VMOVQ %R11,%XMM6 |
(687) 0x6c57a VMOVSD %XMM3,%XMM3,%XMM5 |
(687) 0x6c57e JMP 6bf99 |
(687) 0x6c583 VMOVAPD 0x1b0d5(%RIP),%YMM12 |
(687) 0x6c58b XOR %R13D,%R13D |
(687) 0x6c58e JMP 6bef1 |
(687) 0x6c593 MOVQ $0,0xf8(%RSP) |
(687) 0x6c59f VMOVAPD 0x1b0b9(%RIP),%YMM11 |
(687) 0x6c5a7 JMP 6be48 |
(687) 0x6c5ac VMOVAPD 0x1b0cc(%RIP),%YMM12 |
(687) 0x6c5b4 MOVSXD %ESI,%R13 |
(687) 0x6c5b7 JMP 6bef1 |
(687) 0x6c5bc CLTQ |
(687) 0x6c5be VMOVAPD 0x1b0ba(%RIP),%YMM11 |
(687) 0x6c5c6 MOV %RAX,0xf8(%RSP) |
(687) 0x6c5ce JMP 6be48 |
(687) 0x6c5d3 MOV 0x1b08e(%RIP),%R10 |
(687) 0x6c5da CLTQ |
(687) 0x6c5dc VMOVSD 0x1b0b4(%RIP),%XMM4 |
(687) 0x6c5e4 VXORPD %XMM5,%XMM5,%XMM5 |
(687) 0x6c5e8 MOV %RAX,0xe8(%RSP) |
(687) 0x6c5f0 VMOVSD 0x1b090(%RIP),%XMM6 |
(687) 0x6c5f8 VMOVQ %R10,%XMM3 |
(687) 0x6c5fd JMP 6bf99 |
(686) 0x6c602 VMOVSD (%RSI),%XMM15 |
(686) 0x6c606 VMOVSD %XMM15,(%RDI) |
(686) 0x6c60a JMP 6c538 |
0x6c60f NOP |
Path / |
Source file and lines | einspline_spo_ref.hpp:172-189 |
Module | libqmcwfs.so |
nb instructions | 75 |
nb uops | 79 |
loop length | 322 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 19 |
micro-operation queue | 13.17 cycles |
front end | 13.17 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 3.00 | 2.33 | 7.00 | 7.00 | 12.00 | 2.33 | 3.00 | 12.00 | 12.00 | 12.00 | 2.33 | 7.00 |
cycles | 3.00 | 2.33 | 7.00 | 7.00 | 12.00 | 2.33 | 3.00 | 12.00 | 12.00 | 12.00 | 2.33 | 7.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 12.65 |
Stall cycles | 0.00 |
Front-end | 13.17 |
Dispatch | 12.00 |
Overall L1 | 13.17 |
all | 5% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 25% |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 3% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 25% |
all | 12% |
load | 11% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 12% |
load | 11% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOVSXD %EDX,%R15 | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSI,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x160,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x358(%RDI),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 8560 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE5startEv@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x48(%RBX),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x128(%R14),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP 0x124(%R14),%R15D | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 6bcb3 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x53> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x40(%R14),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R15,%R15,2),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RAX,%RDX,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x100(%RSP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 13870 <_ZNK11qmcplusplus14CrystalLatticeIdLj3EE12toUnit_floorIdEENS_10TinyVectorIdLj3EEERKNS3_IT_Lj3EEE> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOVSXD 0x30(%RBX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %ESI,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 6c4ce <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x86e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVSXD 0x40(%RBX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x2f8(%RBX),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x310(%RBX),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x110(%RSP),%XMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA (,%RDI,8),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x1(%RDI),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %EDI,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SHR $0x2,%R15 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RDI,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R10,%RSI,8),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
AND $-0x4,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SAL $0x5,%R15 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
VMOVSD 0x108(%RSP),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x100(%RSP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R8,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,0xf0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R12,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD %XMM7,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD %XMM4,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD %XMM0,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RSP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RSP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RSP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %R14D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 8460 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE4stopEv@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x30(%RBX),%ECX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %ECX,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 6c540 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x8e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | einspline_spo_ref.hpp:172-189 |
Module | libqmcwfs.so |
nb instructions | 75 |
nb uops | 79 |
loop length | 322 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 19 |
micro-operation queue | 13.17 cycles |
front end | 13.17 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 3.00 | 2.33 | 7.00 | 7.00 | 12.00 | 2.33 | 3.00 | 12.00 | 12.00 | 12.00 | 2.33 | 7.00 |
cycles | 3.00 | 2.33 | 7.00 | 7.00 | 12.00 | 2.33 | 3.00 | 12.00 | 12.00 | 12.00 | 2.33 | 7.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 12.65 |
Stall cycles | 0.00 |
Front-end | 13.17 |
Dispatch | 12.00 |
Overall L1 | 13.17 |
all | 5% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 25% |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 3% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 25% |
all | 12% |
load | 11% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 12% |
load | 11% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOVSXD %EDX,%R15 | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSI,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x160,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x358(%RDI),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 8560 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE5startEv@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x48(%RBX),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x128(%R14),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP 0x124(%R14),%R15D | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 6bcb3 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x53> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x40(%R14),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R15,%R15,2),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RAX,%RDX,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x100(%RSP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 13870 <_ZNK11qmcplusplus14CrystalLatticeIdLj3EE12toUnit_floorIdEENS_10TinyVectorIdLj3EEERKNS3_IT_Lj3EEE> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOVSXD 0x30(%RBX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %ESI,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 6c4ce <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x86e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVSXD 0x40(%RBX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x2f8(%RBX),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x310(%RBX),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x110(%RSP),%XMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA (,%RDI,8),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x1(%RDI),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %EDI,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SHR $0x2,%R15 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RDI,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R10,%RSI,8),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
AND $-0x4,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SAL $0x5,%R15 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
VMOVSD 0x108(%RSP),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x100(%RSP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R8,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,0xf0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R12,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD %XMM7,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD %XMM4,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD %XMM0,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RSP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RSP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RSP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %R14D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 8460 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE4stopEv@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x30(%RBX),%ECX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %ECX,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 6c540 <_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE+0x8e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼_ZN16miniqmcreference17einspline_spo_refIdE8evaluateERKN11qmcplusplus11ParticleSetEiRNS2_6VectorIdSaIdEEE– | 21.07 | 20.94 |
▼Loop 687 - einspline_spo_ref.hpp:175-176 - libqmcwfs.so– | 0.02 | 0.02 |
▼Loop 689 - MultiBsplineRef.hpp:63-71 - libqmcwfs.so– | 0 | 0 |
▼Loop 688 - MultiBsplineRef.hpp:64-71 - libqmcwfs.so– | 0 | 0 |
○Loop 690 - MultiBsplineRef.hpp:68-71 - libqmcwfs.so | 21.04 | 17.6 |
○Loop 686 - einspline_spo_ref.hpp:183-187 - libqmcwfs.so | 0 | 0 |