Function: miniqmcreference::DiracDeterminantRef<qmcplusplus::DelayedUpdate<double, double> >::evalua ... | Module: libqmcwfs.so | Source: DiracDeterminantRef.cpp:152-181 [...] | Coverage: 0.58% |
---|
Function: miniqmcreference::DiracDeterminantRef<qmcplusplus::DelayedUpdate<double, double> >::evalua ... | Module: libqmcwfs.so | Source: DiracDeterminantRef.cpp:152-181 [...] | Coverage: 0.58% |
---|
/scratch_na/users/xoserete/qaas_runs/171-417-3180/intel/miniqmc/build/miniqmc/src/Platforms/CPU/SIMD/inner_product.hpp: 82 - 156 |
-------------------------------------------------------------------------------- |
82: for (int i = 0; i < n; i++) |
83: res += a[i] * b[i]; |
[...] |
149: inline TinyVector<T, D> dot(const T* a, const TinyVector<T, D>* b, int n) |
[...] |
155: for (int i = 0; i < n; i++) |
156: res += a[i] * b[i]; |
/scratch_na/users/xoserete/qaas_runs/171-417-3180/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/OhmmsMatrix.h: 217 - 217 |
-------------------------------------------------------------------------------- |
217: inline Type_t* operator[](size_type i) { return X.data() + i * D2; } |
/scratch_na/users/xoserete/qaas_runs/171-417-3180/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/TinyVector.h: 62 - 62 |
-------------------------------------------------------------------------------- |
62: X[d] = T(0); |
/scratch_na/users/xoserete/qaas_runs/171-417-3180/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/OhmmsVector.h: 223 - 248 |
-------------------------------------------------------------------------------- |
223: return X[i]; |
[...] |
248: inline pointer data() { return X; } |
/software/compilers/gcc/gcc-13.1.0-full+isl+binutils/include/c++/13.1.0/bits/unique_ptr.h: 199 - 199 |
-------------------------------------------------------------------------------- |
199: pointer _M_ptr() const noexcept { return std::get<0>(_M_t); } |
/scratch_na/users/xoserete/qaas_runs/171-417-3180/intel/miniqmc/build/miniqmc/src/Numerics/PETE/OperatorTags.h: 63 - 94 |
-------------------------------------------------------------------------------- |
63: return (a * b); |
[...] |
94: (const_cast<T1&>(a) += b); |
/scratch_na/users/xoserete/qaas_runs/171-417-3180/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/DiracDeterminantRef.cpp: 152 - 181 |
-------------------------------------------------------------------------------- |
152: void DiracDeterminantRef<DU_TYPE>::evaluateGL(ParticleSet& P, |
153: ParticleSet::ParticleGradient& G, |
154: ParticleSet::ParticleLaplacian& L, |
155: bool fromscratch) |
156: { |
157: if (UpdateMode == ORB_PBYP_RATIO) |
158: { //need to compute dpsiM and d2psiM. Do not touch psiM! |
159: SPOVGLTimer->start(); |
160: Phi->evaluate_notranspose(P, FirstIndex, LastIndex, psiM_temp, dpsiM, d2psiM); |
161: SPOVGLTimer->stop(); |
162: } |
163: |
164: if (NumPtcls == 1) |
[...] |
173: for (size_t i = 0, iat = FirstIndex; i < NumPtcls; ++i, ++iat) |
174: { |
175: mValueType dot_temp = simd::dot(psiM[i], d2psiM[i], NumOrbitals); |
176: mGradType rv = simd::dot(psiM[i], dpsiM[i], NumOrbitals); |
177: G[iat] += rv; |
178: L[iat] += dot_temp - dot(rv, rv); |
179: } |
180: } |
181: } |
/scratch_na/users/xoserete/qaas_runs/171-417-3180/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/TinyVectorOps.h: 129 - 131 |
-------------------------------------------------------------------------------- |
129: Type_t res = lhs[0] * rhs[0]; |
130: for (unsigned d = 1; d < D; ++d) |
131: res += lhs[d] * rhs[d]; |
0x6ca80 PUSH %R13 |
0x6ca82 LEA 0x10(%RSP),%R13 |
0x6ca87 AND $-0x20,%RSP |
0x6ca8b PUSHQ -0x8(%R13) |
0x6ca8f PUSH %RBP |
0x6ca90 MOV %RSP,%RBP |
0x6ca93 PUSH %R15 |
0x6ca95 PUSH %R14 |
0x6ca97 MOV %RDX,%R14 |
0x6ca9a PUSH %R13 |
0x6ca9c PUSH %R12 |
0x6ca9e MOV %RCX,%R12 |
0x6caa1 PUSH %RBX |
0x6caa2 SUB $0x68,%RSP |
0x6caa6 MOV 0xc(%RDI),%ECX |
0x6caa9 MOV %RDI,-0x50(%RBP) |
0x6caad TEST %ECX,%ECX |
0x6caaf JE 6d0f6 |
0x6cab5 MOV -0x50(%RBP),%RDI |
0x6cab9 MOV 0x484(%RDI),%EDX |
0x6cabf CMP $0x1,%EDX |
0x6cac2 JE 6d0d7 |
0x6cac8 MOVSXD %EDX,%RSI |
0x6cacb MOVSXD 0x478(%RDI),%R10 |
0x6cad2 MOV %RSI,-0x60(%RBP) |
0x6cad6 TEST %EDX,%EDX |
0x6cad8 JE 6d058 |
0x6cade MOV 0x480(%RDI),%EBX |
0x6cae4 MOV 0x18(%R12),%R12 |
0x6cae9 LEA (%R10,%R10,2),%R13 |
0x6caed MOV 0x158(%RDI),%R9 |
0x6caf4 MOV 0xd8(%RDI),%R15 |
0x6cafb MOV 0x18(%R14),%R14 |
0x6caff MOV %EBX,%EDX |
0x6cb01 MOV 0x100(%RDI),%R11 |
0x6cb08 LEA -0x1(%RBX),%EAX |
0x6cb0b MOV 0x180(%RDI),%R8 |
0x6cb12 AND $-0x4,%EDX |
0x6cb15 LEA (%R12,%R10,8),%RDI |
0x6cb19 MOV %R9,-0x70(%RBP) |
0x6cb1d MOV %R15,-0x68(%RBP) |
0x6cb21 LEA (%R14,%R13,8),%R9 |
0x6cb25 MOV %EBX,%R13D |
0x6cb28 XOR %R12D,%R12D |
0x6cb2b MOV %EAX,-0x40(%RBP) |
0x6cb2e SHR $0x2,%R13D |
0x6cb32 XOR %R10D,%R10D |
0x6cb35 LEA (,%R15,8),%RCX |
0x6cb3d MOV %EDX,-0x44(%RBP) |
0x6cb40 SAL $0x5,%R13 |
0x6cb44 MOV %RDI,-0x78(%RBP) |
0x6cb48 MOV %R11,-0x38(%RBP) |
0x6cb4c MOV %RCX,-0x58(%RBP) |
0x6cb50 MOV %R11,%RCX |
0x6cb53 XOR %R11D,%R11D |
0x6cb56 NOPW %CS:(%RAX,%RAX,1) |
(726) 0x6cb60 LEA (,%R12,8),%RDX |
(726) 0x6cb68 TEST %EBX,%EBX |
(726) 0x6cb6a JLE 6d088 |
(726) 0x6cb70 CMPL $0x2,-0x40(%RBP) |
(726) 0x6cb74 JBE 6d0a8 |
(726) 0x6cb7a LEA -0x20(%R13),%R14 |
(726) 0x6cb7e LEA (%R8,%RDX,1),%R15 |
(726) 0x6cb82 VXORPD %XMM4,%XMM4,%XMM4 |
(726) 0x6cb86 XOR %EDI,%EDI |
(726) 0x6cb88 SHR $0x5,%R14 |
(726) 0x6cb8c INC %R14 |
(726) 0x6cb8f AND $0x7,%R14D |
(726) 0x6cb93 JE 6cc2e |
(726) 0x6cb99 CMP $0x1,%R14 |
(726) 0x6cb9d JE 6cc16 |
(726) 0x6cb9f CMP $0x2,%R14 |
(726) 0x6cba3 JE 6cc07 |
(726) 0x6cba5 CMP $0x3,%R14 |
(726) 0x6cba9 JE 6cbf8 |
(726) 0x6cbab CMP $0x4,%R14 |
(726) 0x6cbaf JE 6cbe9 |
(726) 0x6cbb1 CMP $0x5,%R14 |
(726) 0x6cbb5 JE 6cbda |
(726) 0x6cbb7 CMP $0x6,%R14 |
(726) 0x6cbbb JE 6cbcb |
(726) 0x6cbbd VMOVUPD (%RCX),%YMM5 |
(726) 0x6cbc1 VFMADD231PD (%R15),%YMM5,%YMM4 |
(726) 0x6cbc6 MOV $0x20,%EDI |
(726) 0x6cbcb VMOVUPD (%RCX,%RDI,1),%YMM3 |
(726) 0x6cbd0 VFMADD231PD (%R15,%RDI,1),%YMM3,%YMM4 |
(726) 0x6cbd6 ADD $0x20,%RDI |
(726) 0x6cbda VMOVUPD (%RCX,%RDI,1),%YMM7 |
(726) 0x6cbdf VFMADD231PD (%R15,%RDI,1),%YMM7,%YMM4 |
(726) 0x6cbe5 ADD $0x20,%RDI |
(726) 0x6cbe9 VMOVUPD (%RCX,%RDI,1),%YMM1 |
(726) 0x6cbee VFMADD231PD (%R15,%RDI,1),%YMM1,%YMM4 |
(726) 0x6cbf4 ADD $0x20,%RDI |
(726) 0x6cbf8 VMOVUPD (%RCX,%RDI,1),%YMM2 |
(726) 0x6cbfd VFMADD231PD (%R15,%RDI,1),%YMM2,%YMM4 |
(726) 0x6cc03 ADD $0x20,%RDI |
(726) 0x6cc07 VMOVUPD (%RCX,%RDI,1),%YMM6 |
(726) 0x6cc0c VFMADD231PD (%R15,%RDI,1),%YMM6,%YMM4 |
(726) 0x6cc12 ADD $0x20,%RDI |
(726) 0x6cc16 VMOVUPD (%RCX,%RDI,1),%YMM8 |
(726) 0x6cc1b VFMADD231PD (%R15,%RDI,1),%YMM8,%YMM4 |
(726) 0x6cc21 ADD $0x20,%RDI |
(726) 0x6cc25 CMP %R13,%RDI |
(726) 0x6cc28 JE 6ccbc |
(728) 0x6cc2e VMOVUPD (%RCX,%RDI,1),%YMM9 |
(728) 0x6cc33 VFMADD231PD (%R15,%RDI,1),%YMM9,%YMM4 |
(728) 0x6cc39 VMOVUPD 0x20(%RCX,%RDI,1),%YMM10 |
(728) 0x6cc3f VFMADD231PD 0x20(%R15,%RDI,1),%YMM10,%YMM4 |
(728) 0x6cc46 VMOVUPD 0x40(%RCX,%RDI,1),%YMM11 |
(728) 0x6cc4c VFMADD231PD 0x40(%R15,%RDI,1),%YMM11,%YMM4 |
(728) 0x6cc53 VMOVUPD 0x80(%RCX,%RDI,1),%YMM13 |
(728) 0x6cc5c VMOVUPD 0x60(%RCX,%RDI,1),%YMM12 |
(728) 0x6cc62 VMOVUPD 0xa0(%RCX,%RDI,1),%YMM14 |
(728) 0x6cc6b VFMADD231PD 0x60(%R15,%RDI,1),%YMM12,%YMM4 |
(728) 0x6cc72 VFMADD231PD 0x80(%R15,%RDI,1),%YMM13,%YMM4 |
(728) 0x6cc7c VMOVUPD 0xc0(%RCX,%RDI,1),%YMM15 |
(728) 0x6cc85 VFMADD231PD 0xa0(%R15,%RDI,1),%YMM14,%YMM4 |
(728) 0x6cc8f VMOVUPD 0xe0(%RCX,%RDI,1),%YMM0 |
(728) 0x6cc98 VFMADD231PD 0xc0(%R15,%RDI,1),%YMM15,%YMM4 |
(728) 0x6cca2 VFMADD231PD 0xe0(%R15,%RDI,1),%YMM0,%YMM4 |
(728) 0x6ccac ADD $0x100,%RDI |
(728) 0x6ccb3 CMP %R13,%RDI |
(728) 0x6ccb6 JNE 6cc2e |
(726) 0x6ccbc VEXTRACTF128 $0x1,%YMM4,%XMM5 |
(726) 0x6ccc2 MOV -0x44(%RBP),%EAX |
(726) 0x6ccc5 VADDPD %XMM4,%XMM5,%XMM7 |
(726) 0x6ccc9 VUNPCKHPD %XMM7,%XMM7,%XMM3 |
(726) 0x6cccd VADDPD %XMM7,%XMM3,%XMM12 |
(726) 0x6ccd1 CMP %EAX,%EBX |
(726) 0x6ccd3 JE 6d06d |
(726) 0x6ccd9 VADDPD %XMM5,%XMM4,%XMM0 |
(726) 0x6ccdd MOV %EAX,%ESI |
(726) 0x6ccdf MOV %EBX,%EDI |
(726) 0x6cce1 SUB %ESI,%EDI |
(726) 0x6cce3 CMP $0x1,%EDI |
(726) 0x6cce6 JE 6cd12 |
(726) 0x6cce8 MOV -0x38(%RBP),%R15 |
(726) 0x6ccec LEA (%R11,%RSI,1),%R14 |
(726) 0x6ccf0 ADD %R12,%RSI |
(726) 0x6ccf3 VMOVUPD (%R15,%R14,8),%XMM4 |
(726) 0x6ccf9 VFMADD231PD (%R8,%RSI,8),%XMM4,%XMM0 |
(726) 0x6ccff VUNPCKHPD %XMM0,%XMM0,%XMM1 |
(726) 0x6cd03 VADDPD %XMM0,%XMM1,%XMM12 |
(726) 0x6cd07 TEST $0x1,%DIL |
(726) 0x6cd0b JE 6cd22 |
(726) 0x6cd0d AND $-0x2,%EDI |
(726) 0x6cd10 ADD %EDI,%EAX |
(726) 0x6cd12 CLTQ |
(726) 0x6cd14 ADD %R8,%RDX |
(726) 0x6cd17 VMOVSD (%RCX,%RAX,8),%XMM2 |
(726) 0x6cd1c VFMADD231SD (%RDX,%RAX,8),%XMM2,%XMM12 |
(726) 0x6cd22 MOV -0x50(%RBP),%RSI |
(726) 0x6cd26 MOV 0x118(%RSI),%RAX |
(726) 0x6cd2d MOV 0x140(%RSI),%RDI |
(726) 0x6cd34 IMUL %R10,%RAX |
(726) 0x6cd38 CMPL $0x2,-0x40(%RBP) |
(726) 0x6cd3c JBE 6d0ba |
(726) 0x6cd42 VXORPD %XMM13,%XMM13,%XMM13 |
(726) 0x6cd47 LEA (%RAX,%RAX,2),%R14 |
(726) 0x6cd4b LEA (%RCX,%R13,1),%R15 |
(726) 0x6cd4f MOV %RCX,%RSI |
(726) 0x6cd52 LEA (%RDI,%R14,8),%RDX |
(726) 0x6cd56 VMOVAPD %YMM13,%YMM3 |
(726) 0x6cd5a VMOVAPD %YMM13,%YMM2 |
(726) 0x6cd5e TEST $0x20,%R13B |
(726) 0x6cd62 JE 6cde0 |
(726) 0x6cd64 VMOVUPD (%RDX),%YMM9 |
(726) 0x6cd68 VMOVUPD 0x20(%RDX),%YMM6 |
(726) 0x6cd6d LEA 0x20(%RCX),%RSI |
(726) 0x6cd71 ADD $0x60,%RDX |
(726) 0x6cd75 VMOVUPD -0x20(%RDX),%YMM14 |
(726) 0x6cd7a VPALIGNR $0x8,%YMM6,%YMM9,%YMM4 |
(726) 0x6cd80 VPERMPD $0x2c,%YMM9,%YMM11 |
(726) 0x6cd86 VBLENDPD $0xc,%YMM6,%YMM9,%YMM15 |
(726) 0x6cd8c VBLENDPD $0x4,%YMM6,%YMM11,%YMM8 |
(726) 0x6cd92 VPERMPD $0x53,%YMM4,%YMM1 |
(726) 0x6cd98 VPERM2F128 $0x2,%YMM6,%YMM9,%YMM0 |
(726) 0x6cd9e VINSERTF128 $0x1,%XMM14,%YMM1,%YMM2 |
(726) 0x6cda4 VPERMILPD $0x2,%YMM14,%YMM7 |
(726) 0x6cdaa VPERM2F128 $0x21,%YMM14,%YMM8,%YMM9 |
(726) 0x6cdb0 VSHUFPD $0x5,%YMM0,%YMM15,%YMM5 |
(726) 0x6cdb5 VBLENDPD $0x7,%YMM2,%YMM14,%YMM10 |
(726) 0x6cdbb VBLENDPD $0x8,%YMM7,%YMM5,%YMM3 |
(726) 0x6cdc1 VBLENDPD $0x8,%YMM9,%YMM8,%YMM2 |
(726) 0x6cdc7 VFMADD132PD (%RCX),%YMM13,%YMM3 |
(726) 0x6cdcc VFMADD132PD (%RCX),%YMM13,%YMM2 |
(726) 0x6cdd1 VFMADD231PD (%RCX),%YMM10,%YMM13 |
(726) 0x6cdd6 CMP %RSI,%R15 |
(726) 0x6cdd9 JE 6cecf |
(726) 0x6cddf NOP |
(727) 0x6cde0 VMOVUPD (%RDX),%YMM14 |
(727) 0x6cde4 VMOVUPD 0x20(%RDX),%YMM15 |
(727) 0x6cde9 ADD $0x40,%RSI |
(727) 0x6cded ADD $0xc0,%RDX |
(727) 0x6cdf4 VMOVUPD -0x80(%RDX),%YMM6 |
(727) 0x6cdf9 VBLENDPD $0xc,%YMM15,%YMM14,%YMM0 |
(727) 0x6cdff VPERM2F128 $0x2,%YMM15,%YMM14,%YMM5 |
(727) 0x6ce05 VPALIGNR $0x8,%YMM15,%YMM14,%YMM1 |
(727) 0x6ce0b VPERMILPD $0x2,%YMM6,%YMM7 |
(727) 0x6ce11 VSHUFPD $0x5,%YMM5,%YMM0,%YMM4 |
(727) 0x6ce16 VPERMPD $0x2c,%YMM14,%YMM14 |
(727) 0x6ce1c VMOVUPD -0x60(%RDX),%YMM5 |
(727) 0x6ce21 VBLENDPD $0x8,%YMM7,%YMM4,%YMM10 |
(727) 0x6ce27 VPERMPD $0x53,%YMM1,%YMM11 |
(727) 0x6ce2d VBLENDPD $0x4,%YMM15,%YMM14,%YMM15 |
(727) 0x6ce33 VFMADD231PD -0x40(%RSI),%YMM10,%YMM3 |
(727) 0x6ce39 VMOVUPD -0x40(%RDX),%YMM10 |
(727) 0x6ce3e VINSERTF128 $0x1,%XMM6,%YMM11,%YMM8 |
(727) 0x6ce44 VBLENDPD $0x7,%YMM8,%YMM6,%YMM9 |
(727) 0x6ce4a VMOVUPD -0x20(%RDX),%YMM11 |
(727) 0x6ce4f VPERM2F128 $0x21,%YMM6,%YMM15,%YMM6 |
(727) 0x6ce55 VPALIGNR $0x8,%YMM10,%YMM5,%YMM14 |
(727) 0x6ce5b VBLENDPD $0x8,%YMM6,%YMM15,%YMM0 |
(727) 0x6ce61 VBLENDPD $0xc,%YMM10,%YMM5,%YMM4 |
(727) 0x6ce67 VPERM2F128 $0x2,%YMM10,%YMM5,%YMM7 |
(727) 0x6ce6d VPERMPD $0x53,%YMM14,%YMM15 |
(727) 0x6ce73 VPERMPD $0x2c,%YMM5,%YMM5 |
(727) 0x6ce79 VINSERTF128 $0x1,%XMM11,%YMM15,%YMM6 |
(727) 0x6ce7f VBLENDPD $0x4,%YMM10,%YMM5,%YMM10 |
(727) 0x6ce85 VPERMILPD $0x2,%YMM11,%YMM8 |
(727) 0x6ce8b VSHUFPD $0x5,%YMM7,%YMM4,%YMM1 |
(727) 0x6ce90 VFMADD231PD -0x40(%RSI),%YMM0,%YMM2 |
(727) 0x6ce96 VBLENDPD $0x7,%YMM6,%YMM11,%YMM0 |
(727) 0x6ce9c VPERM2F128 $0x21,%YMM11,%YMM10,%YMM11 |
(727) 0x6cea2 VFMADD231PD -0x40(%RSI),%YMM9,%YMM13 |
(727) 0x6cea8 VBLENDPD $0x8,%YMM11,%YMM10,%YMM4 |
(727) 0x6ceae VBLENDPD $0x8,%YMM8,%YMM1,%YMM9 |
(727) 0x6ceb4 VFMADD231PD -0x20(%RSI),%YMM4,%YMM2 |
(727) 0x6ceba VFMADD231PD -0x20(%RSI),%YMM9,%YMM3 |
(727) 0x6cec0 VFMADD231PD -0x20(%RSI),%YMM0,%YMM13 |
(727) 0x6cec6 CMP %RSI,%R15 |
(727) 0x6cec9 JNE 6cde0 |
(726) 0x6cecf VEXTRACTF128 $0x1,%YMM3,%XMM14 |
(726) 0x6ced5 VEXTRACTF128 $0x1,%YMM2,%XMM5 |
(726) 0x6cedb VEXTRACTF128 $0x1,%YMM13,%XMM9 |
(726) 0x6cee1 MOV -0x44(%RBP),%EDX |
(726) 0x6cee4 VADDPD %XMM3,%XMM14,%XMM8 |
(726) 0x6cee8 VADDPD %XMM2,%XMM5,%XMM10 |
(726) 0x6ceec VADDPD %XMM13,%XMM9,%XMM7 |
(726) 0x6cef1 MOV %EDX,%ESI |
(726) 0x6cef3 VUNPCKHPD %XMM8,%XMM8,%XMM15 |
(726) 0x6cef8 VUNPCKHPD %XMM10,%XMM10,%XMM6 |
(726) 0x6cefd VADDPD %XMM8,%XMM15,%XMM0 |
(726) 0x6cf02 VADDPD %XMM10,%XMM6,%XMM11 |
(726) 0x6cf07 VUNPCKHPD %XMM7,%XMM7,%XMM1 |
(726) 0x6cf0b VADDPD %XMM7,%XMM1,%XMM1 |
(726) 0x6cf0f VUNPCKLPD %XMM0,%XMM11,%XMM4 |
(726) 0x6cf13 CMP %ESI,%EBX |
(726) 0x6cf15 JE 6cfe7 |
(726) 0x6cf1b VADDPD %XMM5,%XMM2,%XMM8 |
(726) 0x6cf1f VADDPD %XMM14,%XMM3,%XMM11 |
(726) 0x6cf24 VADDPD %XMM9,%XMM13,%XMM10 |
(726) 0x6cf29 MOV %EBX,%R14D |
(726) 0x6cf2c SUB %ESI,%R14D |
(726) 0x6cf2f MOV %R14D,-0x3c(%RBP) |
(726) 0x6cf33 CMP $0x1,%R14D |
(726) 0x6cf37 JE 6cfc4 |
(726) 0x6cf3d LEA (%RAX,%RSI,1),%R15 |
(726) 0x6cf41 ADD %R11,%RSI |
(726) 0x6cf44 LEA (%R15,%R15,2),%R14 |
(726) 0x6cf48 LEA (%RDI,%R14,8),%R15 |
(726) 0x6cf4c MOV -0x38(%RBP),%R14 |
(726) 0x6cf50 VMOVUPD (%R15),%XMM3 |
(726) 0x6cf55 VMOVUPD 0x10(%R15),%XMM2 |
(726) 0x6cf5b VMOVUPD 0x20(%R15),%XMM9 |
(726) 0x6cf61 VMOVUPD (%R14,%RSI,8),%XMM13 |
(726) 0x6cf67 VPERMILPD $0x1,%XMM3,%XMM4 |
(726) 0x6cf6d VBLENDPD $0x2,%XMM2,%XMM3,%XMM15 |
(726) 0x6cf73 VUNPCKLPD %XMM3,%XMM2,%XMM1 |
(726) 0x6cf77 MOV -0x3c(%RBP),%R15D |
(726) 0x6cf7b VUNPCKLPD %XMM9,%XMM4,%XMM7 |
(726) 0x6cf80 VFMADD132PD %XMM13,%XMM8,%XMM15 |
(726) 0x6cf85 VBLENDPD $0x2,%XMM9,%XMM1,%XMM14 |
(726) 0x6cf8b VFMADD132PD %XMM13,%XMM11,%XMM7 |
(726) 0x6cf90 VFMADD132PD %XMM14,%XMM10,%XMM13 |
(726) 0x6cf95 MOV %R15D,%ESI |
(726) 0x6cf98 AND $0x1,%ESI |
(726) 0x6cf9b VUNPCKHPD %XMM15,%XMM15,%XMM10 |
(726) 0x6cfa0 VUNPCKHPD %XMM7,%XMM7,%XMM0 |
(726) 0x6cfa4 VADDPD %XMM15,%XMM10,%XMM6 |
(726) 0x6cfa9 VUNPCKHPD %XMM13,%XMM13,%XMM8 |
(726) 0x6cfae VADDPD %XMM7,%XMM0,%XMM5 |
(726) 0x6cfb2 VADDPD %XMM13,%XMM8,%XMM1 |
(726) 0x6cfb7 VUNPCKLPD %XMM5,%XMM6,%XMM4 |
(726) 0x6cfbb JE 6cfe7 |
(726) 0x6cfbd AND $-0x2,%R15D |
(726) 0x6cfc1 ADD %R15D,%EDX |
(726) 0x6cfc4 MOVSXD %EDX,%RDX |
(726) 0x6cfc7 ADD %RDX,%RAX |
(726) 0x6cfca VMOVSD (%RCX,%RDX,8),%XMM11 |
(726) 0x6cfcf LEA (%RAX,%RAX,2),%RAX |
(726) 0x6cfd3 LEA (%RDI,%RAX,8),%RDI |
(726) 0x6cfd7 VMOVDDUP %XMM11,%XMM13 |
(726) 0x6cfdc VFMADD231SD 0x10(%RDI),%XMM11,%XMM1 |
(726) 0x6cfe2 VFMADD231PD (%RDI),%XMM13,%XMM4 |
(726) 0x6cfe7 VMULSD %XMM4,%XMM4,%XMM9 |
(726) 0x6cfeb VUNPCKHPD %XMM4,%XMM4,%XMM3 |
(726) 0x6cfef VMULSD %XMM3,%XMM3,%XMM7 |
(726) 0x6cff3 VMULSD %XMM1,%XMM1,%XMM14 |
(726) 0x6cff7 VADDSD 0x10(%R9),%XMM1,%XMM8 |
(726) 0x6cffd MOV -0x78(%RBP),%R14 |
(726) 0x6d001 VADDSD %XMM7,%XMM9,%XMM1 |
(726) 0x6d005 ADD $0x18,%R9 |
(726) 0x6d009 VADDPD -0x18(%R9),%XMM4,%XMM15 |
(726) 0x6d00f MOV -0x58(%RBP),%R15 |
(726) 0x6d013 MOV -0x68(%RBP),%RSI |
(726) 0x6d017 MOV -0x70(%RBP),%RDX |
(726) 0x6d01b VMOVSD %XMM8,-0x8(%R9) |
(726) 0x6d021 MOV -0x60(%RBP),%RAX |
(726) 0x6d025 ADD %R15,%RCX |
(726) 0x6d028 VMOVUPD %XMM15,-0x18(%R9) |
(726) 0x6d02e VADDSD (%R14,%R10,8),%XMM12,%XMM12 |
(726) 0x6d034 ADD %RSI,%R11 |
(726) 0x6d037 ADD %RDX,%R12 |
(726) 0x6d03a VSUBSD %XMM1,%XMM12,%XMM0 |
(726) 0x6d03e VSUBSD %XMM14,%XMM0,%XMM5 |
(726) 0x6d043 VMOVSD %XMM5,(%R14,%R10,8) |
(726) 0x6d049 INC %R10 |
(726) 0x6d04c CMP %RAX,%R10 |
(726) 0x6d04f JNE 6cb60 |
0x6d055 VZEROUPPER |
0x6d058 LEA -0x28(%RBP),%RSP |
0x6d05c POP %RBX |
0x6d05d POP %R12 |
0x6d05f POP %R8 |
0x6d061 POP %R14 |
0x6d063 POP %R15 |
0x6d065 POP %RBP |
0x6d066 LEA -0x10(%R8),%RSP |
0x6d06a POP %R13 |
0x6d06c RET |
(726) 0x6d06d MOV -0x50(%RBP),%RDX |
(726) 0x6d071 MOV 0x118(%RDX),%RAX |
(726) 0x6d078 MOV 0x140(%RDX),%RDI |
(726) 0x6d07f IMUL %R10,%RAX |
(726) 0x6d083 JMP 6cd42 |
(726) 0x6d088 VXORPD %XMM14,%XMM14,%XMM14 |
(726) 0x6d08d VXORPD %XMM4,%XMM4,%XMM4 |
(726) 0x6d091 VMOVSD %XMM14,%XMM14,%XMM7 |
(726) 0x6d095 VMOVSD %XMM14,%XMM14,%XMM9 |
(726) 0x6d09a VMOVSD %XMM14,%XMM14,%XMM12 |
(726) 0x6d09f VMOVSD %XMM14,%XMM14,%XMM1 |
(726) 0x6d0a3 JMP 6cff7 |
(726) 0x6d0a8 VXORPD %XMM0,%XMM0,%XMM0 |
(726) 0x6d0ac XOR %ESI,%ESI |
(726) 0x6d0ae VXORPD %XMM12,%XMM12,%XMM12 |
(726) 0x6d0b3 XOR %EAX,%EAX |
(726) 0x6d0b5 JMP 6ccdf |
(726) 0x6d0ba VXORPD %XMM4,%XMM4,%XMM4 |
(726) 0x6d0be XOR %ESI,%ESI |
(726) 0x6d0c0 VXORPD %XMM1,%XMM1,%XMM1 |
(726) 0x6d0c4 XOR %EDX,%EDX |
(726) 0x6d0c6 VMOVAPD %XMM4,%XMM10 |
(726) 0x6d0ca VMOVAPD %XMM4,%XMM11 |
(726) 0x6d0ce VMOVAPD %XMM4,%XMM8 |
(726) 0x6d0d2 JMP 6cf29 |
0x6d0d7 LEA -0x28(%RBP),%RSP |
0x6d0db MOV %R12,%RDX |
0x6d0de MOV %R14,%RSI |
0x6d0e1 POP %RBX |
0x6d0e2 POP %R12 |
0x6d0e4 POP %R9 |
0x6d0e6 POP %R14 |
0x6d0e8 POP %R15 |
0x6d0ea POP %RBP |
0x6d0eb LEA -0x10(%R9),%RSP |
0x6d0ef POP %R13 |
0x6d0f1 JMP 61ea0 |
0x6d0f6 MOV %RDI,%RBX |
0x6d0f9 MOV 0x468(%RDI),%RDI |
0x6d100 MOV %RSI,-0x38(%RBP) |
0x6d104 CALL 8540 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE5startEv@plt> |
0x6d109 MOV 0x470(%RBX),%RDI |
0x6d110 SUB $0x8,%RSP |
0x6d114 LEA 0x150(%RBX),%R8 |
0x6d11b MOV 0x478(%RBX),%EDX |
0x6d121 MOV 0x47c(%RBX),%ECX |
0x6d127 LEA 0x110(%RBX),%R9 |
0x6d12e MOV (%RDI),%RAX |
0x6d131 PUSH %R8 |
0x6d133 LEA 0x90(%RBX),%R8 |
0x6d13a MOV -0x38(%RBP),%RSI |
0x6d13e CALLQ 0x28(%RAX) |
0x6d141 MOV 0x468(%RBX),%RDI |
0x6d148 POP %RAX |
0x6d149 POP %RDX |
0x6d14a CALL 8450 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE4stopEv@plt> |
0x6d14f JMP 6cab5 |
0x6d154 NOPW %CS:(%RAX,%RAX,1) |
0x6d15f NOP |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►50.54+ | qmcplusplus::WaveFunction::eva[...] | WaveFunction.cpp:249 | libqmcwfs.so |
○ | main._omp_fn.1 | stl_vector.h:1121 | exec |
○ | gomp_thread_start | team.c:130 | libgomp.so.1.0.0 |
►47.54+ | qmcplusplus::WaveFunction::eva[...] | WaveFunction.cpp:250 | libqmcwfs.so |
○ | main._omp_fn.1 | stl_vector.h:1121 | exec |
○ | gomp_thread_start | team.c:130 | libgomp.so.1.0.0 |
Path / |
Source file and lines | DiracDeterminantRef.cpp:152-181 |
Module | libqmcwfs.so |
nb instructions | 101 |
nb uops | 107 |
loop length | 385 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 11 |
micro-operation queue | 17.83 cycles |
front end | 17.83 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 3.50 | 2.73 | 12.33 | 12.33 | 11.00 | 2.73 | 3.50 | 11.00 | 11.00 | 11.00 | 2.53 | 12.33 |
cycles | 3.50 | 2.73 | 12.33 | 12.33 | 11.00 | 2.73 | 3.50 | 11.00 | 11.00 | 11.00 | 2.53 | 12.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 17.54 |
Stall cycles | 0.00 |
Front-end | 17.83 |
Dispatch | 12.33 |
Overall L1 | 17.83 |
all | 3% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 9% |
all | 10% |
load | 8% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 10% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
LEA 0x10(%RSP),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
PUSHQ -0x8(%R13) | 2 | 0 | 0 | 0.33 | 0.33 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0.33 | 5-12 | 0.62 |
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RDX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x68,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0xc(%RDI),%ECX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDI,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %ECX,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 6d0f6 <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x676> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x50(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x484(%RDI),%EDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JE 6d0d7 <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x657> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVSXD %EDX,%RSI | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
MOVSXD 0x478(%RDI),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RSI,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %EDX,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 6d058 <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x5d8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x480(%RDI),%EBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%R12),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R10,%R10,2),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x158(%RDI),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xd8(%RDI),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%R14),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %EBX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x100(%RDI),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x1(%RBX),%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV 0x180(%RDI),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
AND $-0x4,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
LEA (%R12,%R10,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R9,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R14,%R13,8),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %EBX,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %R12D,%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %EAX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SHR $0x2,%R13D | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
XOR %R10D,%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (,%R15,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %EDX,-0x44(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SAL $0x5,%R13 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RDI,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %R11D,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
LEA -0x10(%R8),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R12,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R14,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
LEA -0x10(%R9),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
JMP 61ea0 <_ZN11qmcplusplus16DiracDeterminantINS_13DelayedUpdateIddEEE10evaluateGLERNS_11ParticleSetERNS_14ParticleAttribINS_10TinyVectorIdLj3EEESaIS8_EEERNS6_IdSaIdEEEb.part.0> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x468(%RDI),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 8540 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE5startEv@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x470(%RBX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0x150(%RBX),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x478(%RBX),%EDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x47c(%RBX),%ECX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x110(%RBX),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV (%RDI),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
PUSH %R8 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
LEA 0x90(%RBX),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x38(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALLQ 0x28(%RAX) | 3 | 0.70 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.70 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 0 | 2.27 |
MOV 0x468(%RBX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
POP %RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
CALL 8450 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE4stopEv@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
JMP 6cab5 <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x35> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | DiracDeterminantRef.cpp:152-181 |
Module | libqmcwfs.so |
nb instructions | 101 |
nb uops | 107 |
loop length | 385 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 11 |
micro-operation queue | 17.83 cycles |
front end | 17.83 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 3.50 | 2.73 | 12.33 | 12.33 | 11.00 | 2.73 | 3.50 | 11.00 | 11.00 | 11.00 | 2.53 | 12.33 |
cycles | 3.50 | 2.73 | 12.33 | 12.33 | 11.00 | 2.73 | 3.50 | 11.00 | 11.00 | 11.00 | 2.53 | 12.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 17.54 |
Stall cycles | 0.00 |
Front-end | 17.83 |
Dispatch | 12.33 |
Overall L1 | 17.83 |
all | 3% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 9% |
all | 10% |
load | 8% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 10% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
LEA 0x10(%RSP),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
PUSHQ -0x8(%R13) | 2 | 0 | 0 | 0.33 | 0.33 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0.33 | 5-12 | 0.62 |
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RDX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x68,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0xc(%RDI),%ECX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDI,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %ECX,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 6d0f6 <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x676> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x50(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x484(%RDI),%EDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JE 6d0d7 <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x657> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVSXD %EDX,%RSI | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
MOVSXD 0x478(%RDI),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RSI,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %EDX,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 6d058 <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x5d8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x480(%RDI),%EBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%R12),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R10,%R10,2),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x158(%RDI),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xd8(%RDI),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%R14),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %EBX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x100(%RDI),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x1(%RBX),%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV 0x180(%RDI),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
AND $-0x4,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
LEA (%R12,%R10,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R9,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R14,%R13,8),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %EBX,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %R12D,%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %EAX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SHR $0x2,%R13D | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
XOR %R10D,%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (,%R15,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %EDX,-0x44(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SAL $0x5,%R13 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RDI,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %R11D,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
LEA -0x10(%R8),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R12,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R14,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
LEA -0x10(%R9),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
JMP 61ea0 <_ZN11qmcplusplus16DiracDeterminantINS_13DelayedUpdateIddEEE10evaluateGLERNS_11ParticleSetERNS_14ParticleAttribINS_10TinyVectorIdLj3EEESaIS8_EEERNS6_IdSaIdEEEb.part.0> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x468(%RDI),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 8540 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE5startEv@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x470(%RBX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0x150(%RBX),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x478(%RBX),%EDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x47c(%RBX),%ECX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x110(%RBX),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV (%RDI),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
PUSH %R8 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
LEA 0x90(%RBX),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x38(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALLQ 0x28(%RAX) | 3 | 0.70 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.70 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 0 | 2.27 |
MOV 0x468(%RBX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
POP %RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
CALL 8450 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE4stopEv@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
JMP 6cab5 <_ZN16miniqmcreference19DiracDeterminantRefIN11qmcplusplus13DelayedUpdateIddEEE10evaluateGLERNS1_11ParticleSetERNS1_14ParticleAttribINS1_10TinyVectorIdLj3EEESaIS9_EEERNS7_IdSaIdEEEb+0x35> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼miniqmcreference::DiracDeterminantRef | 0.58 | 0.5 |
▼Loop 726 - DiracDeterminantRef.cpp:173-178 - libqmcwfs.so– | 0 | 0 |
○Loop 727 - OperatorTags.h:63-94 - libqmcwfs.so | 0.38 | 0.32 |
○Loop 728 - inner_product.hpp:82-83 - libqmcwfs.so | 0.19 | 0.16 |