Function: qmcplusplus::SoaDistanceTableABOMPTarget<double, 3u, 40>::evaluate(qmcplusplus::ParticleSe ... | Module: exec | Source: SoaDistanceTableABOMPTarget.h:61-233 [...] | Coverage: 9.4% |
---|
Function: qmcplusplus::SoaDistanceTableABOMPTarget<double, 3u, 40>::evaluate(qmcplusplus::ParticleSe ... | Module: exec | Source: SoaDistanceTableABOMPTarget.h:61-233 [...] | Coverage: 9.4% |
---|
/scratch_na/users/xoserete/qaas_runs/171-417-3180/intel/miniqmc/build/miniqmc/src/Utilities/NewTimer.h: 242 - 249 |
-------------------------------------------------------------------------------- |
242: ScopeGuard(TIMER& t) : timer(t) { timer.start(); } |
[...] |
249: ~ScopeGuard() { timer.stop(); } |
/scratch_na/users/xoserete/qaas_runs/171-417-3180/intel/miniqmc/build/miniqmc/src/Particle/Lattice/ParticleBConds3DSoa.h: 274 - 298 |
-------------------------------------------------------------------------------- |
274: const T* restrict pz = R0 + r0_stride * 2; |
[...] |
280: T displ_0 = px[iat] - x0; |
281: T displ_1 = py[iat] - y0; |
282: T displ_2 = pz[iat] - z0; |
283: |
284: T ar_0 = displ_0 * g00 + displ_1 * g10 + displ_2 * g20; |
285: T ar_1 = displ_0 * g01 + displ_1 * g11 + displ_2 * g21; |
286: T ar_2 = displ_0 * g02 + displ_1 * g12 + displ_2 * g22; |
287: |
288: //put them in the box |
289: ar_0 -= round(ar_0); |
290: ar_1 -= round(ar_1); |
291: ar_2 -= round(ar_2); |
292: |
293: //unit2cart |
294: dx[iat] = ar_0 * r00 + ar_1 * r10 + ar_2 * r20; |
295: dy[iat] = ar_0 * r01 + ar_1 * r11 + ar_2 * r21; |
296: dz[iat] = ar_0 * r02 + ar_1 * r12 + ar_2 * r22; |
297: |
298: temp_r[iat] = std::sqrt(dx[iat] * dx[iat] + dy[iat] * dy[iat] + dz[iat] * dz[iat]); |
/scratch_na/users/xoserete/qaas_runs/171-417-3180/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/VectorSoAContainer.h: 151 - 267 |
-------------------------------------------------------------------------------- |
151: mAllocator.deallocate(myData, nAllocated); |
152: nLocal = 0; |
153: nGhosts = 0; |
[...] |
167: if (nAllocated) |
[...] |
174: nLocal = n; |
175: nGhosts = n_padded; |
176: myData = ptr; |
[...] |
267: inline const T* data() const { return myData; } |
/scratch_na/users/xoserete/qaas_runs/171-417-3180/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/TinyVector.h: 169 - 169 |
-------------------------------------------------------------------------------- |
169: inline Type_t& operator[](unsigned int i) { return X[i]; } |
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/stl_construct.h: 98 - 107 |
-------------------------------------------------------------------------------- |
98: { __pointer->~_Tp(); } |
[...] |
107: for (; __first != __last; ++__first) |
/scratch_na/users/xoserete/qaas_runs/171-417-3180/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/OhmmsVector.h: 149 - 248 |
-------------------------------------------------------------------------------- |
149: if (nAllocated) |
[...] |
156: nLocal = n; |
157: nAllocated = 0; |
158: X = ref; |
[...] |
212: mAllocator.deallocate(X, nAllocated); |
213: } |
214: nLocal = 0; |
215: nAllocated = 0; |
[...] |
223: return X[i]; |
[...] |
248: inline pointer data() { return X; } |
/scratch_na/users/xoserete/qaas_runs/171-417-3180/intel/miniqmc/build/miniqmc/src/Platforms/CPU/SIMD/aligned_allocator.hpp: 46 - 46 |
-------------------------------------------------------------------------------- |
46: return ((n + ND - 1) / ND) * ND; |
/scratch_na/users/xoserete/qaas_runs/171-417-3180/intel/miniqmc/build/miniqmc/src/Particle/SoaDistanceTableABOMPTarget.h: 61 - 233 |
-------------------------------------------------------------------------------- |
61: if (num_sources_ * num_targets_ == 0) |
62: return; |
63: if (distances_.size()) |
64: return; |
65: |
66: // initialize memory containers and views |
67: const size_t num_padded = getAlignedSize<T>(num_sources_); |
68: const size_t stride_size = getPerTargetPctlStrideSize(); |
69: r_dr_memorypool_.resize(stride_size * num_targets_); |
70: |
71: distances_.resize(num_targets_); |
72: displacements_.resize(num_targets_); |
73: for (int i = 0; i < num_targets_; ++i) |
74: { |
75: distances_[i].attachReference(r_dr_memorypool_.data() + i * stride_size, num_sources_); |
76: displacements_[i].attachReference(num_sources_, num_padded, |
[...] |
184: { |
185: resize(); |
186: |
187: ScopedTimer local_timer(evaluate_timer_); |
188: // be aware of the sign of Displacement |
189: const int num_targets_local = num_targets_; |
190: const int num_sources_local = num_sources_; |
191: const int num_padded = getAlignedSize<T>(num_sources_); |
192: |
193: target_pos.resize(num_targets_ * D); |
194: for (size_t iat = 0; iat < num_targets_; iat++) |
195: for (size_t idim = 0; idim < D; idim++) |
196: target_pos[iat * D + idim] = P.R[iat][idim]; |
197: |
198: auto* target_pos_ptr = target_pos.data(); |
199: auto* source_pos_ptr = origin_.getCoordinates().getAllParticlePos().data(); |
[...] |
205: const size_t num_teams = (num_sources_ + ChunkSizePerTeam - 1) / ChunkSizePerTeam; |
206: const size_t stride_size = getPerTargetPctlStrideSize(); |
207: |
208: { |
209: ScopedTimer offload(offload_timer_); |
210: PRAGMA_OFFLOAD("omp target teams distribute collapse(2) num_teams(num_targets_*num_teams) \ |
211: map(to: source_pos_ptr[:num_padded*D]) \ |
212: map(always, to: target_pos_ptr[:num_targets_*D]) \ |
213: map(always, from: r_dr_ptr[:num_targets_*stride_size])") |
214: for (int iat = 0; iat < num_targets_local; ++iat) |
215: for (int team_id = 0; team_id < num_teams; team_id++) |
216: { |
217: const int first = ChunkSizePerTeam * team_id; |
218: const int last = omptarget::min(first + ChunkSizePerTeam, num_sources_local); |
219: |
220: T pos[D]; |
221: for (int idim = 0; idim < D; idim++) |
222: pos[idim] = target_pos_ptr[iat * D + idim]; |
223: |
224: auto* r_iat_ptr = r_dr_ptr + iat * stride_size; |
225: auto* dr_iat_ptr = r_iat_ptr + num_padded; |
226: |
227: PRAGMA_OFFLOAD("omp parallel for") |
228: for (int iel = first; iel < last; iel++) |
229: DTD_BConds<T, D, SC>::computeDistancesOffload(pos, source_pos_ptr, num_padded, r_iat_ptr, dr_iat_ptr, |
230: num_padded, iel); |
231: } |
232: } |
233: } |
/scratch_na/users/xoserete/qaas_runs/171-417-3180/intel/miniqmc/build/miniqmc/src/Platforms/CPU/SIMD/Mallocator.hpp: 78 - 78 |
-------------------------------------------------------------------------------- |
78: free(p); |
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/stl_vector.h: 806 - 1660 |
-------------------------------------------------------------------------------- |
806: { return size_type(this->_M_impl._M_finish - this->_M_impl._M_start); } |
[...] |
826: if (__new_size > size()) |
827: _M_default_append(__new_size - size()); |
828: else if (__new_size < size()) |
829: _M_erase_at_end(this->_M_impl._M_start + __new_size); |
[...] |
933: return *(this->_M_impl._M_start + __n); |
[...] |
1656: if (size_type __n = this->_M_impl._M_finish - __pos) |
1657: { |
1658: std::_Destroy(__pos, this->_M_impl._M_finish, |
1659: _M_get_Tp_allocator()); |
1660: this->_M_impl._M_finish = __pos; |
/usr/lib/gcc/x86_64-redhat-linux/8/../../../../include/c++/8/bits/unique_ptr.h: 150 - 150 |
-------------------------------------------------------------------------------- |
150: pointer _M_ptr() const { return std::get<0>(_M_t); } |
0x4ca1e0 PUSH %RBP |
0x4ca1e1 MOV %RSP,%RBP |
0x4ca1e4 PUSH %R15 |
0x4ca1e6 PUSH %R14 |
0x4ca1e8 PUSH %R13 |
0x4ca1ea PUSH %R12 |
0x4ca1ec PUSH %RBX |
0x4ca1ed SUB $0xb8,%RSP |
0x4ca1f4 MOV %RSI,-0x60(%RBP) |
0x4ca1f8 MOV %RDI,%R15 |
0x4ca1fb MOV 0x10(%RDI),%RCX |
0x4ca1ff MOV 0x18(%RDI),%RAX |
0x4ca203 IMUL %RCX,%RAX |
0x4ca207 TEST %RAX,%RAX |
0x4ca20a MOV %RDI,-0x80(%RBP) |
0x4ca20e JE 4ca21e |
0x4ca210 MOV 0x50(%R15),%RAX |
0x4ca214 CMP 0x48(%R15),%RAX |
0x4ca218 JE 4ca2fa |
0x4ca21e MOV 0x1b8(%R15),%RBX |
0x4ca225 MOV %RBX,%RDI |
0x4ca228 VZEROUPPER |
0x4ca22b CALL 48e0f0 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE5startEv> |
0x4ca230 MOV 0x10(%R15),%RAX |
0x4ca234 MOV %RAX,-0x58(%RBP) |
0x4ca238 MOV 0x18(%R15),%R13 |
0x4ca23c LEA 0x180(%R15),%RDI |
0x4ca243 LEA (%R13,%R13,2),%RSI |
0x4ca248 VPXOR %XMM0,%XMM0,%XMM0 |
0x4ca24c MOV %RBX,-0x70(%RBP) |
0x4ca250 CALL 44c7c0 <_ZN11qmcplusplus6VectorIdNS_12OMPallocatorIdNS_10MallocatorIdLm64EEEEEE6resizeEmd> |
0x4ca255 MOV 0x18(%R15),%RCX |
0x4ca259 TEST %RCX,%RCX |
0x4ca25c JE 4ca2dc |
0x4ca25e MOV -0x60(%RBP),%RAX |
0x4ca262 MOV 0x40(%RAX),%RAX |
0x4ca266 MOV 0x198(%R15),%R14 |
0x4ca26d LEA (,%RCX,8),%RDX |
0x4ca275 LEA (%RDX,%RDX,2),%RDX |
0x4ca279 LEA -0x8(%RAX,%RDX,1),%RSI |
0x4ca27e CMP %R14,%RSI |
0x4ca281 JB 4ca2e8 |
0x4ca283 LEA -0x8(%R14,%RDX,1),%RDX |
0x4ca288 CMP %RAX,%RDX |
0x4ca28b JB 4ca2e8 |
0x4ca28d DEC %RCX |
0x4ca290 XOR %ESI,%ESI |
0x4ca292 MOV %R14,%RDX |
0x4ca295 NOPW %CS:(%RAX,%RAX,1) |
(2094) 0x4ca2a0 XOR %EDI,%EDI |
(2094) 0x4ca2a2 NOPW %CS:(%RAX,%RAX,1) |
(2093) 0x4ca2b0 VMOVQ (%RAX,%RDI,8),%XMM0 |
(2093) 0x4ca2b5 VMOVQ %XMM0,(%RDX,%RDI,8) |
(2093) 0x4ca2ba INC %RDI |
(2093) 0x4ca2bd CMP $0x3,%RDI |
(2093) 0x4ca2c1 JNE 4ca2b0 |
(2094) 0x4ca2c3 LEA 0x1(%RSI),%RDI |
(2094) 0x4ca2c7 ADD $0x18,%RAX |
(2094) 0x4ca2cb ADD $0x18,%RDX |
(2094) 0x4ca2cf CMP %RCX,%RSI |
(2094) 0x4ca2d2 MOV %RDI,%RSI |
(2094) 0x4ca2d5 JNE 4ca2a0 |
0x4ca2d7 JMP 4ca42f |
0x4ca2dc MOV 0x198(%R15),%R14 |
0x4ca2e3 JMP 4ca42f |
0x4ca2e8 MOV %ECX,%EDX |
0x4ca2ea AND $0x3,%EDX |
0x4ca2ed CMP $0x4,%RCX |
0x4ca2f1 JAE 4ca366 |
0x4ca2f3 XOR %ESI,%ESI |
0x4ca2f5 JMP 4ca3f3 |
0x4ca2fa MOV %RCX,%R12 |
0x4ca2fd LEA 0x48(%R15),%R13 |
0x4ca301 MOV (%R15),%RAX |
0x4ca304 MOV %R15,%RDI |
0x4ca307 CALLQ 0x88(%RAX) |
0x4ca30d LEA 0x158(%R15),%RDI |
0x4ca314 MOV 0x18(%R15),%RSI |
0x4ca318 MOV %RAX,-0x50(%RBP) |
0x4ca31c IMUL %RAX,%RSI |
0x4ca320 VPXOR %XMM0,%XMM0,%XMM0 |
0x4ca324 CALL 44c7c0 <_ZN11qmcplusplus6VectorIdNS_12OMPallocatorIdNS_10MallocatorIdLm64EEEEEE6resizeEmd> |
0x4ca329 MOV 0x18(%R15),%RAX |
0x4ca32d MOV 0x50(%R15),%RBX |
0x4ca331 MOV (%R13),%RCX |
0x4ca335 MOV %RBX,%RDX |
0x4ca338 SUB %RCX,%RDX |
0x4ca33b SAR $0x3,%RDX |
0x4ca33f MOV $-0x3333333333333333,%RDI |
0x4ca349 IMUL %RDX,%RDI |
0x4ca34d MOV %RAX,%RSI |
0x4ca350 SUB %RDI,%RSI |
0x4ca353 JBE 4ca889 |
0x4ca359 MOV %R13,%RDI |
0x4ca35c CALL 469f00 <_ZNSt6vectorIN11qmcplusplus6VectorIdNS0_10MallocatorIdLm64EEEEESaIS4_EE17_M_default_appendEm> |
0x4ca361 JMP 4ca8ba |
0x4ca366 AND $-0x4,%RCX |
0x4ca36a MOV $0x58,%EDI |
0x4ca36f XOR %ESI,%ESI |
0x4ca371 NOPW %CS:(%RAX,%RAX,1) |
(2091) 0x4ca380 VMOVUPS -0x58(%RAX,%RDI,1),%XMM0 |
(2091) 0x4ca386 VMOVUPS %XMM0,-0x58(%R14,%RDI,1) |
(2091) 0x4ca38d VMOVSD -0x48(%RAX,%RDI,1),%XMM0 |
(2091) 0x4ca393 VMOVSD %XMM0,-0x48(%R14,%RDI,1) |
(2091) 0x4ca39a VMOVUPS -0x40(%RAX,%RDI,1),%XMM0 |
(2091) 0x4ca3a0 VMOVUPS %XMM0,-0x40(%R14,%RDI,1) |
(2091) 0x4ca3a7 VMOVSD -0x30(%RAX,%RDI,1),%XMM0 |
(2091) 0x4ca3ad VMOVSD %XMM0,-0x30(%R14,%RDI,1) |
(2091) 0x4ca3b4 VMOVUPS -0x28(%RAX,%RDI,1),%XMM0 |
(2091) 0x4ca3ba VMOVUPS %XMM0,-0x28(%R14,%RDI,1) |
(2091) 0x4ca3c1 VMOVSD -0x18(%RAX,%RDI,1),%XMM0 |
(2091) 0x4ca3c7 VMOVSD %XMM0,-0x18(%R14,%RDI,1) |
(2091) 0x4ca3ce VMOVUPS -0x10(%RAX,%RDI,1),%XMM0 |
(2091) 0x4ca3d4 VMOVUPS %XMM0,-0x10(%R14,%RDI,1) |
(2091) 0x4ca3db VMOVQ (%RAX,%RDI,1),%XMM0 |
(2091) 0x4ca3e0 VMOVQ %XMM0,(%R14,%RDI,1) |
(2091) 0x4ca3e6 ADD $0x4,%RSI |
(2091) 0x4ca3ea ADD $0x60,%RDI |
(2091) 0x4ca3ee CMP %RSI,%RCX |
(2091) 0x4ca3f1 JNE 4ca380 |
0x4ca3f3 TEST %RDX,%RDX |
0x4ca3f6 JE 4ca42f |
0x4ca3f8 LEA (%RSI,%RSI,2),%RCX |
0x4ca3fc LEA 0x10(%RAX,%RCX,8),%RAX |
0x4ca401 LEA 0x10(%R14,%RCX,8),%RCX |
0x4ca406 SAL $0x3,%EDX |
0x4ca409 LEA (%RDX,%RDX,2),%RDX |
0x4ca40d XOR %ESI,%ESI |
0x4ca40f NOP |
(2092) 0x4ca410 VMOVUPS -0x10(%RAX,%RSI,1),%XMM0 |
(2092) 0x4ca416 VMOVUPS %XMM0,-0x10(%RCX,%RSI,1) |
(2092) 0x4ca41c VMOVQ (%RAX,%RSI,1),%XMM0 |
(2092) 0x4ca421 VMOVQ %XMM0,(%RCX,%RSI,1) |
(2092) 0x4ca426 ADD $0x18,%RSI |
(2092) 0x4ca42a CMP %RSI,%RDX |
(2092) 0x4ca42d JNE 4ca410 |
0x4ca42f MOV 0x8(%R15),%RAX |
0x4ca433 MOV 0x278(%RAX),%RDI |
0x4ca43a MOV (%RDI),%RAX |
0x4ca43d CALLQ 0x48(%RAX) |
0x4ca440 MOV 0x18(%RAX),%RAX |
0x4ca444 MOV %RAX,-0xc0(%RBP) |
0x4ca44b MOV (%R15),%RAX |
0x4ca44e MOV 0x48(%R15),%RCX |
0x4ca452 MOV 0x18(%RCX),%RCX |
0x4ca456 MOV %RCX,-0x88(%RBP) |
0x4ca45d MOV $0x1ff,%R12D |
0x4ca463 ADD 0x10(%R15),%R12 |
0x4ca467 MOV %R15,%RDI |
0x4ca46a CALLQ 0x88(%RAX) |
0x4ca470 MOV %RAX,-0x78(%RBP) |
0x4ca474 MOV %R14,-0xc8(%RBP) |
0x4ca47b MOV 0x1b0(%R15),%RDI |
0x4ca482 MOV %RDI,-0x90(%RBP) |
0x4ca489 CALL 48e0f0 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE5startEv> |
0x4ca48e TEST %R13D,%R13D |
0x4ca491 JLE 4ca49c |
0x4ca493 CMP $0x200,%R12 |
0x4ca49a JAE 4ca4c3 |
0x4ca49c MOV -0x90(%RBP),%RDI |
0x4ca4a3 CALL 48e2a0 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE4stopEv> |
0x4ca4a8 MOV -0x70(%RBP),%RDI |
0x4ca4ac CALL 48e2a0 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE4stopEv> |
0x4ca4b1 ADD $0xb8,%RSP |
0x4ca4b8 POP %RBX |
0x4ca4b9 POP %R12 |
0x4ca4bb POP %R13 |
0x4ca4bd POP %R14 |
0x4ca4bf POP %R15 |
0x4ca4c1 POP %RBP |
0x4ca4c2 RET |
0x4ca4c3 MOV -0x58(%RBP),%RAX |
0x4ca4c7 ADD $0x7,%RAX |
0x4ca4cb AND $-0x8,%RAX |
0x4ca4cf SHR $0x9,%R12 |
0x4ca4d3 MOVSXD %EAX,%RDX |
0x4ca4d6 LEA (%RAX,%RAX,1),%ECX |
0x4ca4d9 SAL $0x20,%RAX |
0x4ca4dd MOVSXD %ECX,%RCX |
0x4ca4e0 MOVSXD %R13D,%RSI |
0x4ca4e3 DEC %RSI |
0x4ca4e6 MOV %RSI,-0xa0(%RBP) |
0x4ca4ed DEC %R12 |
0x4ca4f0 MOV %R12,-0x68(%RBP) |
0x4ca4f4 SAR $0x1f,%RAX |
0x4ca4f8 MOV %RAX,-0x30(%RBP) |
0x4ca4fc MOV %RCX,-0xb0(%RBP) |
0x4ca503 LEA (%RCX,%RDX,1),%RAX |
0x4ca507 MOV %RAX,-0x48(%RBP) |
0x4ca50b MOV -0x78(%RBP),%RAX |
0x4ca50f LEA (,%RAX,8),%RAX |
0x4ca517 MOV %RAX,-0x98(%RBP) |
0x4ca51e XOR %EAX,%EAX |
0x4ca520 VPBROADCASTQ 0x30d17(%RIP),%XMM0 |
0x4ca529 VPBROADCASTQ 0x3748e(%RIP),%XMM1 |
0x4ca532 MOV %RDX,-0xb8(%RBP) |
0x4ca539 MOV %RDX,-0x40(%RBP) |
0x4ca53d MOV -0x88(%RBP),%RCX |
0x4ca544 MOV %RCX,-0x38(%RBP) |
0x4ca548 JMP 4ca58b |
0x4ca54a NOPW (%RAX,%RAX,1) |
(2088) 0x4ca550 MOV -0xa8(%RBP),%RDX |
(2088) 0x4ca557 LEA 0x1(%RDX),%RAX |
(2088) 0x4ca55b MOV -0x78(%RBP),%RCX |
(2088) 0x4ca55f ADD %RCX,-0x48(%RBP) |
(2088) 0x4ca563 ADD %RCX,-0x30(%RBP) |
(2088) 0x4ca567 MOV -0x38(%RBP),%RSI |
(2088) 0x4ca56b ADD -0x98(%RBP),%RSI |
(2088) 0x4ca572 MOV %RSI,-0x38(%RBP) |
(2088) 0x4ca576 ADD %RCX,-0x40(%RBP) |
(2088) 0x4ca57a CMP -0xa0(%RBP),%RDX |
(2088) 0x4ca581 MOV -0x80(%RBP),%R15 |
(2088) 0x4ca585 JE 4ca49c |
(2088) 0x4ca58b VMOVSD 0x110(%R15),%XMM2 |
(2088) 0x4ca594 VMOVSD 0x118(%R15),%XMM3 |
(2088) 0x4ca59d VMOVSD 0x120(%R15),%XMM4 |
(2088) 0x4ca5a6 VMOVSD 0x128(%R15),%XMM5 |
(2088) 0x4ca5af VMOVSD 0x130(%R15),%XMM6 |
(2088) 0x4ca5b8 VMOVSD 0x138(%R15),%XMM7 |
(2088) 0x4ca5c1 VMOVSD 0x140(%R15),%XMM8 |
(2088) 0x4ca5ca VMOVSD 0x148(%R15),%XMM9 |
(2088) 0x4ca5d3 VMOVSD 0x150(%R15),%XMM10 |
(2088) 0x4ca5dc VMOVSD 0xc8(%R15),%XMM11 |
(2088) 0x4ca5e5 VMOVSD 0xd0(%R15),%XMM12 |
(2088) 0x4ca5ee VMOVSD 0xd8(%R15),%XMM13 |
(2088) 0x4ca5f7 VMOVSD 0xe0(%R15),%XMM14 |
(2088) 0x4ca600 VMOVSD 0xe8(%R15),%XMM15 |
(2088) 0x4ca609 VMOVSD 0xf0(%R15),%XMM16 |
(2088) 0x4ca610 VMOVSD 0xf8(%R15),%XMM17 |
(2088) 0x4ca617 VMOVSD 0x100(%R15),%XMM18 |
(2088) 0x4ca61e VMOVSD 0x108(%R15),%XMM19 |
(2088) 0x4ca625 LEA (%RAX,%RAX,2),%ECX |
(2088) 0x4ca628 MOV %RCX,-0x60(%RBP) |
(2088) 0x4ca62c LEA 0x1(%RAX,%RAX,2),%ECX |
(2088) 0x4ca630 MOV %RCX,-0xd8(%RBP) |
(2088) 0x4ca637 MOV %RAX,-0xa8(%RBP) |
(2088) 0x4ca63e LEA 0x2(%RAX,%RAX,2),%EAX |
(2088) 0x4ca642 MOV %RAX,-0xd0(%RBP) |
(2088) 0x4ca649 MOV $0x200,%EAX |
(2088) 0x4ca64e MOV $0x1,%EDX |
(2088) 0x4ca653 MOV $-0x1,%ECX |
(2088) 0x4ca658 XOR %EDI,%EDI |
(2088) 0x4ca65a XOR %R8D,%R8D |
(2088) 0x4ca65d JMP 4ca688 |
0x4ca65f NOP |
(2089) 0x4ca660 LEA 0x1(%R8),%RSI |
(2089) 0x4ca664 ADD $0x200,%EAX |
(2089) 0x4ca669 ADD $0x200,%EDX |
(2089) 0x4ca66f ADD $-0x200,%ECX |
(2089) 0x4ca675 ADD $0x200,%EDI |
(2089) 0x4ca67b CMP -0x68(%RBP),%R8 |
(2089) 0x4ca67f MOV %RSI,%R8 |
(2089) 0x4ca682 JE 4ca550 |
(2089) 0x4ca688 MOV -0x58(%RBP),%R9 |
(2089) 0x4ca68c CMP %R9D,%EAX |
(2089) 0x4ca68f MOV %R9D,%R15D |
(2089) 0x4ca692 CMOVL %EAX,%R15D |
(2089) 0x4ca696 CMP %EDX,%R15D |
(2089) 0x4ca699 CMOVLE %EDX,%R15D |
(2089) 0x4ca69d MOV %R8D,%ESI |
(2089) 0x4ca6a0 SAL $0x9,%ESI |
(2089) 0x4ca6a3 CMP %R9D,%ESI |
(2089) 0x4ca6a6 JGE 4ca660 |
(2089) 0x4ca6a8 MOV %EDI,%R12D |
(2089) 0x4ca6ab MOV -0x48(%RBP),%RSI |
(2089) 0x4ca6af ADD %R12,%RSI |
(2089) 0x4ca6b2 MOV -0x88(%RBP),%R14 |
(2089) 0x4ca6b9 LEA (%R14,%RSI,8),%R9 |
(2089) 0x4ca6bd MOV -0x30(%RBP),%RSI |
(2089) 0x4ca6c1 LEA (%RSI,%R12,1),%RSI |
(2089) 0x4ca6c5 LEA (%R14,%RSI,8),%RSI |
(2089) 0x4ca6c9 MOV -0x38(%RBP),%R10 |
(2089) 0x4ca6cd LEA (%R10,%R12,8),%R11 |
(2089) 0x4ca6d1 MOV -0xb0(%RBP),%R10 |
(2089) 0x4ca6d8 LEA (%R10,%R12,1),%R10 |
(2089) 0x4ca6dc MOV -0xc0(%RBP),%R13 |
(2089) 0x4ca6e3 LEA (%R13,%R10,8),%R10 |
(2089) 0x4ca6e8 MOV -0x40(%RBP),%RBX |
(2089) 0x4ca6ec ADD %R12,%RBX |
(2089) 0x4ca6ef LEA (%R14,%RBX,8),%RBX |
(2089) 0x4ca6f3 MOV -0xb8(%RBP),%R14 |
(2089) 0x4ca6fa ADD %R12,%R14 |
(2089) 0x4ca6fd LEA (%R13,%R14,8),%R14 |
(2089) 0x4ca702 LEA (%R13,%R12,8),%R12 |
(2089) 0x4ca707 ADD %ECX,%R15D |
(2089) 0x4ca70a LEA 0x8(,%R15,8),%R15 |
(2089) 0x4ca712 MOV -0xc8(%RBP),%R13 |
(2089) 0x4ca719 MOV %ECX,-0x50(%RBP) |
(2089) 0x4ca71c MOV -0x60(%RBP),%RCX |
(2089) 0x4ca720 VMOVSD (%R13,%RCX,8),%XMM20 |
(2089) 0x4ca728 MOV -0xd8(%RBP),%RCX |
(2089) 0x4ca72f VMOVSD (%R13,%RCX,8),%XMM21 |
(2089) 0x4ca737 MOV -0xd0(%RBP),%RCX |
(2089) 0x4ca73e VMOVSD (%R13,%RCX,8),%XMM22 |
(2089) 0x4ca746 MOV -0x50(%RBP),%ECX |
(2089) 0x4ca749 XOR %R13D,%R13D |
(2089) 0x4ca74c NOPL (%RAX) |
(2090) 0x4ca750 VMOVSD (%R12,%R13,1),%XMM23 |
(2090) 0x4ca757 VSUBSD %XMM20,%XMM23,%XMM23 |
(2090) 0x4ca75d VMOVSD (%R14,%R13,1),%XMM24 |
(2090) 0x4ca764 VSUBSD %XMM21,%XMM24,%XMM24 |
(2090) 0x4ca76a VMOVSD (%R10,%R13,1),%XMM25 |
(2090) 0x4ca771 VSUBSD %XMM22,%XMM25,%XMM25 |
(2090) 0x4ca777 VMULSD %XMM23,%XMM2,%XMM26 |
(2090) 0x4ca77d VFMADD231SD %XMM24,%XMM3,%XMM26 |
(2090) 0x4ca783 VFMADD231SD %XMM25,%XMM4,%XMM26 |
(2090) 0x4ca789 VMULSD %XMM23,%XMM5,%XMM27 |
(2090) 0x4ca78f VFMADD231SD %XMM24,%XMM6,%XMM27 |
(2090) 0x4ca795 VFMADD231SD %XMM25,%XMM7,%XMM27 |
(2090) 0x4ca79b VMULSD %XMM23,%XMM8,%XMM23 |
(2090) 0x4ca7a1 VFMADD231SD %XMM24,%XMM9,%XMM23 |
(2090) 0x4ca7a7 VFMADD231SD %XMM25,%XMM10,%XMM23 |
(2090) 0x4ca7ad VMOVDQA64 %XMM1,%XMM24 |
(2090) 0x4ca7b3 VPTERNLOGQ $-0x8,%XMM0,%XMM26,%XMM24 |
(2090) 0x4ca7ba VADDSD %XMM24,%XMM26,%XMM24 |
(2090) 0x4ca7c0 VRNDSCALESD $0xb,%XMM24,%XMM24,%XMM24 |
(2090) 0x4ca7c7 VMOVDQA64 %XMM1,%XMM25 |
(2090) 0x4ca7cd VPTERNLOGQ $-0x8,%XMM0,%XMM27,%XMM25 |
(2090) 0x4ca7d4 VADDSD %XMM25,%XMM27,%XMM25 |
(2090) 0x4ca7da VRNDSCALESD $0xb,%XMM25,%XMM25,%XMM25 |
(2090) 0x4ca7e1 VSUBSD %XMM24,%XMM26,%XMM24 |
(2090) 0x4ca7e7 VSUBSD %XMM25,%XMM27,%XMM25 |
(2090) 0x4ca7ed VMOVDQA64 %XMM1,%XMM26 |
(2090) 0x4ca7f3 VPTERNLOGQ $-0x8,%XMM0,%XMM23,%XMM26 |
(2090) 0x4ca7fa VADDSD %XMM26,%XMM23,%XMM26 |
(2090) 0x4ca800 VRNDSCALESD $0xb,%XMM26,%XMM26,%XMM26 |
(2090) 0x4ca807 VSUBSD %XMM26,%XMM23,%XMM23 |
(2090) 0x4ca80d VMULSD %XMM24,%XMM11,%XMM26 |
(2090) 0x4ca813 VFMADD231SD %XMM25,%XMM12,%XMM26 |
(2090) 0x4ca819 VFMADD231SD %XMM13,%XMM23,%XMM26 |
(2090) 0x4ca81f VMOVSD %XMM26,(%RBX,%R13,1) |
(2090) 0x4ca826 VMULSD %XMM24,%XMM14,%XMM27 |
(2090) 0x4ca82c VFMADD231SD %XMM25,%XMM15,%XMM27 |
(2090) 0x4ca832 VFMADD231SD %XMM23,%XMM16,%XMM27 |
(2090) 0x4ca838 VMOVSD %XMM27,(%RSI,%R13,1) |
(2090) 0x4ca83f VMULSD %XMM24,%XMM17,%XMM24 |
(2090) 0x4ca845 VFMADD231SD %XMM25,%XMM18,%XMM24 |
(2090) 0x4ca84b VFMADD231SD %XMM23,%XMM19,%XMM24 |
(2090) 0x4ca851 VMOVSD %XMM24,(%R9,%R13,1) |
(2090) 0x4ca858 VMULSD %XMM26,%XMM26,%XMM23 |
(2090) 0x4ca85e VFMADD231SD %XMM27,%XMM27,%XMM23 |
(2090) 0x4ca864 VFMADD231SD %XMM24,%XMM24,%XMM23 |
(2090) 0x4ca86a VSQRTSD %XMM23,%XMM23,%XMM23 |
(2090) 0x4ca870 VMOVSD %XMM23,(%R11,%R13,1) |
(2090) 0x4ca877 ADD $0x8,%R13 |
(2090) 0x4ca87b CMP %R13,%R15 |
(2090) 0x4ca87e JNE 4ca750 |
(2089) 0x4ca884 JMP 4ca660 |
0x4ca889 JAE 4ca8ba |
0x4ca88b LEA (%RAX,%RAX,4),%RAX |
0x4ca88f LEA (%RCX,%RAX,8),%R14 |
0x4ca893 CMP %R14,%RBX |
0x4ca896 JE 4ca8ba |
0x4ca898 MOV %R13,-0x30(%RBP) |
0x4ca89c MOV %R14,%R13 |
0x4ca89f NOP |
(2096) 0x4ca8a0 MOV (%R13),%RAX |
(2096) 0x4ca8a4 MOV %R13,%RDI |
(2096) 0x4ca8a7 CALLQ (%RAX) |
(2096) 0x4ca8a9 ADD $0x28,%R13 |
(2096) 0x4ca8ad CMP %RBX,%R13 |
(2096) 0x4ca8b0 JNE 4ca8a0 |
0x4ca8b2 MOV %R14,0x50(%R15) |
0x4ca8b6 MOV -0x30(%RBP),%R13 |
0x4ca8ba LEA 0x60(%R15),%RDI |
0x4ca8be MOV 0x18(%R15),%RSI |
0x4ca8c2 MOV %RDI,-0x38(%RBP) |
0x4ca8c6 CALL 4696e0 <_ZNSt6vectorIN11qmcplusplus18VectorSoAContainerIdLj3ENS0_10MallocatorIdLm64EEEEESaIS4_EE6resizeEm> |
0x4ca8cb CMPQ $0,0x18(%R15) |
0x4ca8d0 JE 4ca21e |
0x4ca8d6 ADD $0x7,%R12 |
0x4ca8da MOV %R12,%RAX |
0x4ca8dd AND $-0x8,%RAX |
0x4ca8e1 MOV %RAX,-0x40(%RBP) |
0x4ca8e5 SAL $0x3,%R12 |
0x4ca8e9 AND $-0x40,%R12 |
0x4ca8ed MOV %R12,-0x48(%RBP) |
0x4ca8f1 SALQ $0x3,-0x50(%RBP) |
0x4ca8f6 MOV $0x18,%R14D |
0x4ca8fc XOR %R12D,%R12D |
0x4ca8ff XOR %EAX,%EAX |
0x4ca901 MOV %R13,-0x30(%RBP) |
0x4ca905 JMP 4ca94d |
0x4ca907 NOPW (%RAX,%RAX,1) |
(2095) 0x4ca910 MOV -0x48(%RBP),%RAX |
(2095) 0x4ca914 ADD %R12,%RAX |
(2095) 0x4ca917 ADD %RAX,%R15 |
(2095) 0x4ca91a MOV %RCX,-0x18(%RBX,%R14,1) |
(2095) 0x4ca91f MOV -0x40(%RBP),%RAX |
(2095) 0x4ca923 MOV %RAX,-0x10(%RBX,%R14,1) |
(2095) 0x4ca928 MOV %R15,(%RBX,%R14,1) |
(2095) 0x4ca92c MOV -0x58(%RBP),%RAX |
(2095) 0x4ca930 INC %RAX |
(2095) 0x4ca933 ADD $0x28,%R14 |
(2095) 0x4ca937 ADD -0x50(%RBP),%R12 |
(2095) 0x4ca93b MOV -0x80(%RBP),%R15 |
(2095) 0x4ca93f CMP %RAX,0x18(%R15) |
(2095) 0x4ca943 MOV -0x30(%RBP),%R13 |
(2095) 0x4ca947 JBE 4ca21e |
(2095) 0x4ca94d MOV %RAX,-0x58(%RBP) |
(2095) 0x4ca951 MOV (%R13),%RBX |
(2095) 0x4ca955 MOV 0x10(%R15),%RAX |
(2095) 0x4ca959 MOV 0x170(%R15),%R13 |
(2095) 0x4ca960 CMPQ $0,-0x8(%RBX,%R14,1) |
(2095) 0x4ca966 MOV %R15,%RDX |
(2095) 0x4ca969 MOV %R13,%R15 |
(2095) 0x4ca96c MOV %RAX,%RCX |
(2095) 0x4ca96f JE 4ca9a6 |
(2095) 0x4ca971 MOV (%RBX,%R14,1),%RDI |
(2095) 0x4ca975 MOV %RAX,-0x68(%RBP) |
(2095) 0x4ca979 MOV %RDX,%R15 |
(2095) 0x4ca97c VZEROUPPER |
(2095) 0x4ca97f CALL 403a90 <free@plt> |
(2095) 0x4ca984 MOV -0x68(%RBP),%RAX |
(2095) 0x4ca988 VPXOR %XMM0,%XMM0,%XMM0 |
(2095) 0x4ca98c VMOVDQU %XMM0,-0x10(%RBX,%R14,1) |
(2095) 0x4ca993 MOVQ $0,(%RBX,%R14,1) |
(2095) 0x4ca99b MOV 0x10(%R15),%RCX |
(2095) 0x4ca99f MOV 0x170(%R15),%R15 |
(2095) 0x4ca9a6 MOV %RAX,-0x10(%RBX,%R14,1) |
(2095) 0x4ca9ab MOVQ $0,-0x8(%RBX,%R14,1) |
(2095) 0x4ca9b4 ADD %R12,%R13 |
(2095) 0x4ca9b7 MOV %R13,(%RBX,%R14,1) |
(2095) 0x4ca9bb MOV -0x38(%RBP),%RAX |
(2095) 0x4ca9bf MOV (%RAX),%RBX |
(2095) 0x4ca9c2 CMPQ $0,-0x8(%RBX,%R14,1) |
(2095) 0x4ca9c8 JE 4ca910 |
(2095) 0x4ca9ce MOV (%RBX,%R14,1),%RDI |
(2095) 0x4ca9d2 MOV %RCX,%R13 |
(2095) 0x4ca9d5 VZEROUPPER |
(2095) 0x4ca9d8 CALL 403a90 <free@plt> |
(2095) 0x4ca9dd MOV %R13,%RCX |
(2095) 0x4ca9e0 VPXOR %XMM0,%XMM0,%XMM0 |
(2095) 0x4ca9e4 VMOVDQU %YMM0,-0x18(%RBX,%R14,1) |
(2095) 0x4ca9eb JMP 4ca910 |
0x4ca9f0 MOV %RAX,%RDI |
0x4ca9f3 CALL 40d030 <__clang_call_terminate> |
0x4ca9f8 MOV %RAX,%RDI |
0x4ca9fb CALL 40d030 <__clang_call_terminate> |
0x4caa00 JMP 4caa06 |
0x4caa02 JMP 4caa06 |
0x4caa04 JMP 4caa06 |
0x4caa06 MOV %RAX,%RBX |
0x4caa09 MOV -0x70(%RBP),%RDI |
0x4caa0d CALL 48e2a0 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE4stopEv> |
0x4caa12 MOV %RBX,%RDI |
0x4caa15 CALL 4038c0 <_Unwind_Resume@plt> |
0x4caa1a MOV %RAX,%RDI |
0x4caa1d CALL 40d030 <__clang_call_terminate> |
0x4caa22 NOPW %CS:(%RAX,%RAX,1) |
0x4caa2c NOPL (%RAX) |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►99.64+ | qmcplusplus::ParticleSet::upda[...] | ParticleSet.cpp:242 | exec |
○ | qmcplusplus::NonLocalPP<double[...] | NonLocalPP.hpp:134 | exec |
○ | main.extracted.110 | NewTimer.h:249 | exec |
○ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Path / |
Source file and lines | SoaDistanceTableABOMPTarget.h:61-233 |
Module | exec |
nb instructions | 208 |
nb uops | 230 |
loop length | 861 |
used x86 registers | 12 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 19 |
micro-operation queue | 38.33 cycles |
front end | 38.33 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 12.60 | 12.60 | 16.00 | 16.00 | 24.00 | 12.67 | 12.60 | 24.00 | 24.00 | 24.00 | 12.53 | 16.00 |
cycles | 12.60 | 13.80 | 16.00 | 16.00 | 24.00 | 12.67 | 12.60 | 24.00 | 24.00 | 24.00 | 12.53 | 16.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 36.21 |
Stall cycles | 0.00 |
Front-end | 38.33 |
Dispatch | 24.00 |
Overall L1 | 38.33 |
all | 6% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 17% |
all | 13% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0xb8,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RSI,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x10(%RDI),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RDI),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
IMUL %RCX,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV %RDI,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 4ca21e <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x3e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x50(%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP 0x48(%R15),%RAX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 4ca2fa <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x11a> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x1b8(%R15),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 48e0f0 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE5startEv> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x10(%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x18(%R15),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x180(%R15),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R13,%R13,2),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPXOR %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RBX,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 44c7c0 <_ZN11qmcplusplus6VectorIdNS_12OMPallocatorIdNS_10MallocatorIdLm64EEEEEE6resizeEmd> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x18(%R15),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RCX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 4ca2dc <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0xfc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x60(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x40(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x198(%R15),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (,%RCX,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RDX,%RDX,2),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x8(%RAX,%RDX,1),%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %R14,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4ca2e8 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x108> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x8(%R14,%RDX,1),%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %RAX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4ca2e8 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x108> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
DEC %RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4ca42f <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x24f> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV 0x198(%R15),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4ca42f <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x24f> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %ECX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $0x3,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP $0x4,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 4ca366 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x186> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4ca3f3 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x213> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0x48(%R15),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV (%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALLQ 0x88(%RAX) | 3 | 0.70 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.70 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 0 | 2.27 |
LEA 0x158(%R15),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x18(%R15),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
IMUL %RAX,%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPXOR %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 44c7c0 <_ZN11qmcplusplus6VectorIdNS_12OMPallocatorIdNS_10MallocatorIdLm64EEEEEE6resizeEmd> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x18(%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x50(%R15),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R13),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RCX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SAR $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV $-0x3333333333333333,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
IMUL %RDX,%RDI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RDI,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JBE 4ca889 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x6a9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 469f00 <_ZNSt6vectorIN11qmcplusplus6VectorIdNS0_10MallocatorIdLm64EEEEESaIS4_EE17_M_default_appendEm> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
JMP 4ca8ba <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x6da> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
AND $-0x4,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV $0x58,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 4ca42f <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x24f> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%RSI,%RSI,2),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x10(%RAX,%RCX,8),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA 0x10(%R14,%RCX,8),%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
SAL $0x3,%EDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
LEA (%RDX,%RDX,2),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x8(%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x278(%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDI),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALLQ 0x48(%RAX) | 3 | 0.70 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.70 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 0 | 2.27 |
MOV 0x18(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%R15),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RCX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x1ff,%R12D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD 0x10(%R15),%R12 | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV %R15,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALLQ 0x88(%RAX) | 3 | 0.70 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.70 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 0 | 2.27 |
MOV %RAX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x1b0(%R15),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDI,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 48e0f0 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE5startEv> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
TEST %R13D,%R13D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4ca49c <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x2bc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP $0x200,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 4ca4c3 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x2e3> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x90(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 48e2a0 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE4stopEv> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x70(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 48e2a0 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE4stopEv> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0xb8,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
MOV -0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD $0x7,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x8,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x9,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOVSXD %EAX,%RDX | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
LEA (%RAX,%RAX,1),%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SAL $0x20,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOVSXD %ECX,%RCX | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
MOVSXD %R13D,%RSI | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
DEC %RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RSI,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
DEC %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R12,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SAR $0x1f,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RAX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%RCX,%RDX,1),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x78(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (,%RAX,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPBROADCASTQ 0x30d17(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VPBROADCASTQ 0x3748e(%RIP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
MOV %RDX,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x88(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4ca58b <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x3ab> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JAE 4ca8ba <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x6da> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%RAX,%RAX,4),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RCX,%RAX,8),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R14,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JE 4ca8ba <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x6da> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R13,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,0x50(%R15) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x30(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x60(%R15),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x18(%R15),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 4696e0 <_ZNSt6vectorIN11qmcplusplus18VectorSoAContainerIdLj3ENS0_10MallocatorIdLm64EEEEESaIS4_EE6resizeEm> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
CMPQ $0,0x18(%R15) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 4ca21e <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x3e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x7,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x8,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %RAX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SAL $0x3,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
AND $-0x40,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %R12,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SALQ $0x3,-0x50(%RBP) | 3 | 0.50 | 0 | 0.33 | 0.33 | 0.50 | 0 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0.33 | 0-2 | 0.50 |
MOV $0x18,%R14D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R12D,%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R13,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4ca94d <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x76d> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 40d030 <__clang_call_terminate> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 40d030 <__clang_call_terminate> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
JMP 4caa06 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x826> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
JMP 4caa06 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x826> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
JMP 4caa06 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x826> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x70(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 48e2a0 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE4stopEv> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4038c0 <_Unwind_Resume@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 40d030 <__clang_call_terminate> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | SoaDistanceTableABOMPTarget.h:61-233 |
Module | exec |
nb instructions | 208 |
nb uops | 230 |
loop length | 861 |
used x86 registers | 12 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 19 |
micro-operation queue | 38.33 cycles |
front end | 38.33 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 12.60 | 12.60 | 16.00 | 16.00 | 24.00 | 12.67 | 12.60 | 24.00 | 24.00 | 24.00 | 12.53 | 16.00 |
cycles | 12.60 | 13.80 | 16.00 | 16.00 | 24.00 | 12.67 | 12.60 | 24.00 | 24.00 | 24.00 | 12.53 | 16.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 36.21 |
Stall cycles | 0.00 |
Front-end | 38.33 |
Dispatch | 24.00 |
Overall L1 | 38.33 |
all | 6% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 17% |
all | 13% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0xb8,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RSI,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x10(%RDI),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RDI),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
IMUL %RCX,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV %RDI,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 4ca21e <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x3e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x50(%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP 0x48(%R15),%RAX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 4ca2fa <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x11a> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x1b8(%R15),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 48e0f0 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE5startEv> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x10(%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x18(%R15),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x180(%R15),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R13,%R13,2),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPXOR %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RBX,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 44c7c0 <_ZN11qmcplusplus6VectorIdNS_12OMPallocatorIdNS_10MallocatorIdLm64EEEEEE6resizeEmd> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x18(%R15),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RCX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 4ca2dc <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0xfc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x60(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x40(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x198(%R15),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (,%RCX,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RDX,%RDX,2),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x8(%RAX,%RDX,1),%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %R14,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4ca2e8 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x108> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x8(%R14,%RDX,1),%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %RAX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4ca2e8 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x108> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
DEC %RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4ca42f <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x24f> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV 0x198(%R15),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4ca42f <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x24f> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %ECX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $0x3,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP $0x4,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 4ca366 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x186> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4ca3f3 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x213> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0x48(%R15),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV (%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALLQ 0x88(%RAX) | 3 | 0.70 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.70 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 0 | 2.27 |
LEA 0x158(%R15),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x18(%R15),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
IMUL %RAX,%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPXOR %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 44c7c0 <_ZN11qmcplusplus6VectorIdNS_12OMPallocatorIdNS_10MallocatorIdLm64EEEEEE6resizeEmd> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x18(%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x50(%R15),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R13),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RCX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SAR $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV $-0x3333333333333333,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
IMUL %RDX,%RDI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RDI,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JBE 4ca889 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x6a9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 469f00 <_ZNSt6vectorIN11qmcplusplus6VectorIdNS0_10MallocatorIdLm64EEEEESaIS4_EE17_M_default_appendEm> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
JMP 4ca8ba <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x6da> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
AND $-0x4,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV $0x58,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 4ca42f <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x24f> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%RSI,%RSI,2),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x10(%RAX,%RCX,8),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA 0x10(%R14,%RCX,8),%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
SAL $0x3,%EDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
LEA (%RDX,%RDX,2),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x8(%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x278(%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDI),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALLQ 0x48(%RAX) | 3 | 0.70 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.70 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 0 | 2.27 |
MOV 0x18(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%R15),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RCX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x1ff,%R12D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD 0x10(%R15),%R12 | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV %R15,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALLQ 0x88(%RAX) | 3 | 0.70 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.70 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 0 | 2.27 |
MOV %RAX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x1b0(%R15),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDI,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 48e0f0 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE5startEv> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
TEST %R13D,%R13D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4ca49c <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x2bc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP $0x200,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 4ca4c3 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x2e3> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x90(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 48e2a0 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE4stopEv> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x70(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 48e2a0 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE4stopEv> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0xb8,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
MOV -0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD $0x7,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x8,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x9,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOVSXD %EAX,%RDX | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
LEA (%RAX,%RAX,1),%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SAL $0x20,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOVSXD %ECX,%RCX | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
MOVSXD %R13D,%RSI | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
DEC %RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RSI,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
DEC %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R12,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SAR $0x1f,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RAX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%RCX,%RDX,1),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x78(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (,%RAX,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPBROADCASTQ 0x30d17(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VPBROADCASTQ 0x3748e(%RIP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
MOV %RDX,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x88(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4ca58b <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x3ab> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JAE 4ca8ba <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x6da> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%RAX,%RAX,4),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RCX,%RAX,8),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R14,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JE 4ca8ba <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x6da> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R13,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,0x50(%R15) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x30(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x60(%R15),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x18(%R15),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 4696e0 <_ZNSt6vectorIN11qmcplusplus18VectorSoAContainerIdLj3ENS0_10MallocatorIdLm64EEEEESaIS4_EE6resizeEm> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
CMPQ $0,0x18(%R15) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 4ca21e <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x3e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x7,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x8,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %RAX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SAL $0x3,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
AND $-0x40,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %R12,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SALQ $0x3,-0x50(%RBP) | 3 | 0.50 | 0 | 0.33 | 0.33 | 0.50 | 0 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0.33 | 0-2 | 0.50 |
MOV $0x18,%R14D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R12D,%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R13,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4ca94d <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x76d> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 40d030 <__clang_call_terminate> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 40d030 <__clang_call_terminate> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
JMP 4caa06 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x826> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
JMP 4caa06 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x826> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
JMP 4caa06 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x826> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x70(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 48e2a0 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE4stopEv> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4038c0 <_Unwind_Resume@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 40d030 <__clang_call_terminate> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼qmcplusplus::SoaDistanceTableABOMPTarget | 9.4 | 7.57 |
○Loop 2096 - stl_construct.h:98-107 - exec | 0 | 0 |
▼Loop 2094 - SoaDistanceTableABOMPTarget.h:194-196 - exec– | 0 | 0 |
○Loop 2093 - SoaDistanceTableABOMPTarget.h:195-196 - exec | 0 | 0 |
○Loop 2092 - SoaDistanceTableABOMPTarget.h:194-196 - exec | 0 | 0 |
▼Loop 2088 - SoaDistanceTableABOMPTarget.h:214-228 - exec– | 0 | 0 |
▼Loop 2089 - SoaDistanceTableABOMPTarget.h:215-228 - exec– | 0.01 | 0.01 |
○Loop 2090 - SoaDistanceTableABOMPTarget.h:228-228 - exec | 9.38 | 7.35 |
○Loop 2091 - SoaDistanceTableABOMPTarget.h:194-196 - exec | 0 | 0.01 |
○Loop 2095 - VectorSoAContainer.h:151-176 - exec | 0 | 0 |