Function: _Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buf ... | Module: exec | Source: advec_mom.cpp:180-211 [...] | Coverage: 5.25% |
---|
Function: _Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buf ... | Module: exec | Source: advec_mom.cpp:180-211 [...] | Coverage: 5.25% |
---|
/beegfs/hackathon/users/eoseret/qaas_runs/170-854-8685/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/advec_mom.cpp: 180 - 211 |
-------------------------------------------------------------------------------- |
180: #pragma omp parallel for simd collapse(2) |
181: for (int j = (y_min - 1 + 1); j < (y_max + 1 + 2); j++) { |
182: for (int i = (x_min + 1); i < (x_max + 1 + 2); i++) |
183: ({ |
184: int upwind, donor, downwind, dif; |
185: double sigma, width, limiter, vdiffuw, vdiffdw, auw, adw, wind, advec_vel_s; |
186: if (node_flux(i, j) < 0.0) { |
187: upwind = j + 2; |
188: donor = j + 1; |
189: downwind = j; |
190: dif = donor; |
191: } else { |
192: upwind = j - 1; |
193: donor = j; |
194: downwind = j + 1; |
195: dif = upwind; |
196: } |
197: sigma = std::fabs(node_flux(i, j)) / (node_mass_pre(i, donor)); |
198: width = celldy[j]; |
199: vdiffuw = vel1(i, donor) - vel1(i, upwind); |
200: vdiffdw = vel1(i, downwind) - vel1(i, donor); |
201: limiter = 0.0; |
202: if (vdiffuw * vdiffdw > 0.0) { |
203: auw = std::fabs(vdiffuw); |
204: adw = std::fabs(vdiffdw); |
205: wind = 1.0; |
206: if (vdiffdw <= 0.0) wind = -1.0; |
207: limiter = |
208: wind * std::fmin(std::fmin(width * ((2.0 - sigma) * adw / width + (1.0 + sigma) * auw / celldy[dif]) / 6.0, auw), adw); |
209: } |
210: advec_vel_s = vel1(i, donor) + (1.0 - sigma) * limiter; |
211: mom_flux(i, j) = advec_vel_s * node_flux(i, j); |
/beegfs/hackathon/users/eoseret/qaas_runs/170-854-8685/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/context.h: 46 - 69 |
-------------------------------------------------------------------------------- |
46: T &operator[](size_t i) const { return data[i]; } |
[...] |
69: T &operator()(size_t i, size_t j) const { return data[i + j * sizeX]; } |
0x438f70 PUSH %RBP |
0x438f71 MOV %RSP,%RBP |
0x438f74 PUSH %R15 |
0x438f76 PUSH %R14 |
0x438f78 PUSH %R13 |
0x438f7a PUSH %R12 |
0x438f7c PUSH %RBX |
0x438f7d SUB $0x158,%RSP |
0x438f84 MOV %RCX,%R13 |
0x438f87 MOV %RDX,%R15 |
0x438f8a MOV 0x38(%RBP),%RAX |
0x438f8e MOV 0x28(%RBP),%RBX |
0x438f92 MOV 0x20(%RBP),%RCX |
0x438f96 MOV 0x10(%RBP),%RDX |
0x438f9a MOV %RDX,-0x48(%RBP) |
0x438f9e MOV 0x18(%RBP),%EDX |
0x438fa1 MOV %EDX,-0x2c(%RBP) |
0x438fa4 MOVL $0,-0x34(%RBP) |
0x438fab TEST %RAX,%RAX |
0x438fae JS 439699 |
0x438fb4 MOV %R9,%R14 |
0x438fb7 MOV %R8,%R12 |
0x438fba MOV %RCX,-0x40(%RBP) |
0x438fbe MOV (%RDI),%ESI |
0x438fc0 MOVQ $0,-0x58(%RBP) |
0x438fc8 MOV %RAX,-0x50(%RBP) |
0x438fcc MOVQ $0x1,-0x98(%RBP) |
0x438fd7 SUB $0x8,%RSP |
0x438fdb LEA -0x98(%RBP),%RAX |
0x438fe2 LEA -0x34(%RBP),%RCX |
0x438fe6 LEA -0x58(%RBP),%R8 |
0x438fea LEA -0x50(%RBP),%R9 |
0x438fee MOV $0x4aa8a0,%EDI |
0x438ff3 MOV %ESI,-0x30(%RBP) |
0x438ff6 MOV $0x22,%EDX |
0x438ffb PUSH $0x1 |
0x438ffd PUSH $0x1 |
0x438fff PUSH %RAX |
0x439000 CALL 404240 <__kmpc_for_static_init_8@plt> |
0x439005 ADD $0x20,%RSP |
0x439009 MOV -0x58(%RBP),%RCX |
0x43900d MOV -0x50(%RBP),%RAX |
0x439011 CMP %RAX,%RCX |
0x439014 JA 4396b5 |
0x43901a MOV %RAX,%RSI |
0x43901d MOV -0x40(%RBP),%RAX |
0x439021 SUB %EAX,%EBX |
0x439023 MOV (%R13),%RDX |
0x439027 MOV 0x10(%R13),%R11 |
0x43902b MOV (%R12),%R8 |
0x43902f MOV 0x10(%R12),%RDI |
0x439034 MOV (%R15),%R9 |
0x439037 MOV 0x10(%R15),%R12 |
0x43903b MOV (%R14),%R15 |
0x43903e MOV 0x10(%R14),%R10 |
0x439042 INC %RSI |
0x439045 MOV %RSI,-0x90(%RBP) |
0x43904c SUB %RCX,%RSI |
0x43904f MOV $-0x2,%R13D |
0x439055 AND %RSI,%R13 |
0x439058 MOV %RDI,-0x88(%RBP) |
0x43905f MOV %R9,-0x80(%RBP) |
0x439063 MOV %R15,-0x78(%RBP) |
0x439067 MOV %R10,-0x70(%RBP) |
0x43906b JE 4396d3 |
0x439071 MOV %RSI,-0x60(%RBP) |
0x439075 MOVD %EBX,%XMM0 |
0x439079 PSHUFD $0x44,%XMM0,%XMM1 |
0x43907e MOVD -0x2c(%RBP),%XMM0 |
0x439083 PSHUFD $0x50,%XMM0,%XMM0 |
0x439088 MOVDQA %XMM0,-0x170(%RBP) |
0x439090 MOVQ %RAX,%XMM0 |
0x439095 PSHUFD $0x44,%XMM0,%XMM0 |
0x43909a MOVDQA %XMM0,-0x160(%RBP) |
0x4390a2 MOVQ %RDX,%XMM0 |
0x4390a7 PSHUFD $0x44,%XMM0,%XMM2 |
0x4390ac MOVQ %R11,%XMM0 |
0x4390b1 PSHUFD $0x44,%XMM0,%XMM0 |
0x4390b6 MOVDQA %XMM0,-0x140(%RBP) |
0x4390be MOVQ %R8,%XMM0 |
0x4390c3 PSHUFD $0x44,%XMM0,%XMM0 |
0x4390c8 MOVDQA %XMM0,-0x130(%RBP) |
0x4390d0 MOVQ %RDI,%XMM0 |
0x4390d5 PSHUFD $0x44,%XMM0,%XMM0 |
0x4390da MOVDQA %XMM0,-0x120(%RBP) |
0x4390e2 MOVQ %R9,%XMM0 |
0x4390e7 PSHUFD $0x44,%XMM0,%XMM0 |
0x4390ec MOVDQA %XMM0,-0x110(%RBP) |
0x4390f4 MOV %R12,-0x68(%RBP) |
0x4390f8 MOVQ %R12,%XMM0 |
0x4390fd PSHUFD $0x44,%XMM0,%XMM0 |
0x439102 MOVDQA %XMM0,-0x100(%RBP) |
0x43910a MOVQ %R15,%XMM0 |
0x43910f PSHUFD $0x44,%XMM0,%XMM0 |
0x439114 MOVDQA %XMM0,-0xf0(%RBP) |
0x43911c MOVQ %R10,%XMM0 |
0x439121 PSHUFD $0x44,%XMM0,%XMM0 |
0x439126 MOVDQA %XMM0,-0xe0(%RBP) |
0x43912e MOVQ %RCX,%XMM0 |
0x439133 PSHUFD $0x44,%XMM0,%XMM7 |
0x439138 PADDQ 0x52450(%RIP),%XMM7 |
0x439140 XOR %R10D,%R10D |
0x439143 MOVDQA %XMM1,-0x180(%RBP) |
0x43914b PSHUFD $-0x12,%XMM1,%XMM0 |
0x439150 MOVDQA %XMM0,-0xd0(%RBP) |
0x439158 MOVDQA %XMM2,-0x150(%RBP) |
0x439160 PSRLQ $0x20,%XMM2 |
0x439165 MOVDQA %XMM2,-0xc0(%RBP) |
0x43916d MOV %RDX,%R14 |
0x439170 MOVDQA -0x100(%RBP),%XMM11 |
0x439179 JMP 43925d |
0x43917e XCHG %AX,%AX |
(310) 0x439180 MOVDQA -0xb0(%RBP),%XMM7 |
(310) 0x439188 DIVPD %XMM8,%XMM15 |
(310) 0x43918d ADDPD %XMM9,%XMM15 |
(310) 0x439192 XORPD %XMM8,%XMM8 |
(310) 0x439197 CMPPD $0x1,%XMM3,%XMM8 |
(310) 0x43919d MULPD 0x525cb(%RIP),%XMM5 |
(310) 0x4391a5 MULPD %XMM15,%XMM5 |
(310) 0x4391aa MINPD %XMM4,%XMM0 |
(310) 0x4391ae MINPD %XMM5,%XMM0 |
(310) 0x4391b2 MOVAPD %XMM0,%XMM3 |
(310) 0x4391b6 XORPD 0x525c2(%RIP),%XMM3 |
(310) 0x4391be ANDPD %XMM8,%XMM0 |
(310) 0x4391c3 ANDNPD %XMM3,%XMM8 |
(310) 0x4391c8 ORPD %XMM0,%XMM8 |
(310) 0x4391cd ANDPD %XMM8,%XMM14 |
(310) 0x4391d2 MOVAPD 0x52576(%RIP),%XMM0 |
(310) 0x4391da SUBPD %XMM13,%XMM0 |
(310) 0x4391df MULPD %XMM14,%XMM0 |
(310) 0x4391e4 ADDPD %XMM12,%XMM0 |
(310) 0x4391e9 MULPD %XMM6,%XMM0 |
(310) 0x4391ed MOVDQA -0xf0(%RBP),%XMM5 |
(310) 0x4391f5 MOVDQA %XMM5,%XMM3 |
(310) 0x4391f9 PSRLQ $0x20,%XMM3 |
(310) 0x4391fe PMULUDQ %XMM2,%XMM3 |
(310) 0x439202 MOVDQA %XMM5,%XMM4 |
(310) 0x439206 PMULUDQ %XMM2,%XMM4 |
(310) 0x43920a PSRLQ $0x20,%XMM2 |
(310) 0x43920f PMULUDQ %XMM5,%XMM2 |
(310) 0x439213 PADDQ %XMM3,%XMM2 |
(310) 0x439217 PADDQ %XMM1,%XMM4 |
(310) 0x43921b PSLLQ $0x20,%XMM2 |
(310) 0x439220 PADDQ %XMM2,%XMM4 |
(310) 0x439224 PSLLQ $0x3,%XMM4 |
(310) 0x439229 PADDQ -0xe0(%RBP),%XMM4 |
(310) 0x439231 MOVQ %XMM4,%RAX |
(310) 0x439236 PSHUFD $-0x12,%XMM4,%XMM1 |
(310) 0x43923b MOVQ %XMM1,%RDX |
(310) 0x439240 MOVLPD %XMM0,(%RAX) |
(310) 0x439244 MOVHPD %XMM0,(%RDX) |
(310) 0x439248 PADDQ 0x52360(%RIP),%XMM7 |
(310) 0x439250 ADD $0x2,%R10 |
(310) 0x439254 CMP %R13,%R10 |
(310) 0x439257 JAE 4396ab |
(310) 0x43925d MOV %R8,%R12 |
(310) 0x439260 MOV %R11,%R8 |
(310) 0x439263 MOV %R14,%R11 |
(310) 0x439266 MOVQ %XMM7,%RSI |
(310) 0x43926b MOVDQA -0x180(%RBP),%XMM0 |
(310) 0x439273 MOVQ %XMM0,%R9 |
(310) 0x439278 MOV %RSI,%RAX |
(310) 0x43927b XOR %EDX,%EDX |
(310) 0x43927d DIV %R9 |
(310) 0x439280 MOVQ %RAX,%XMM0 |
(310) 0x439285 MOVDQA %XMM7,-0xb0(%RBP) |
(310) 0x43928d PSHUFD $-0x12,%XMM7,%XMM1 |
(310) 0x439292 MOVQ %XMM1,%RDI |
(310) 0x439297 MOVDQA -0xd0(%RBP),%XMM1 |
(310) 0x43929f MOVQ %XMM1,%R14 |
(310) 0x4392a4 MOV %RDI,%RAX |
(310) 0x4392a7 XOR %EDX,%EDX |
(310) 0x4392a9 DIV %R14 |
(310) 0x4392ac MOVQ %RAX,%XMM1 |
(310) 0x4392b1 PUNPCKLQDQ %XMM1,%XMM0 |
(310) 0x4392b5 PSHUFD $-0x18,%XMM0,%XMM0 |
(310) 0x4392ba PADDD -0x170(%RBP),%XMM0 |
(310) 0x4392c2 MOV %RSI,%RAX |
(310) 0x4392c5 CQTO |
(310) 0x4392c7 IDIV %R9 |
(310) 0x4392ca MOVQ %RDX,%XMM1 |
(310) 0x4392cf MOV %RDI,%RAX |
(310) 0x4392d2 CQTO |
(310) 0x4392d4 IDIV %R14 |
(310) 0x4392d7 MOVQ %RDX,%XMM2 |
(310) 0x4392dc PUNPCKLQDQ %XMM2,%XMM1 |
(310) 0x4392e0 PADDQ -0x160(%RBP),%XMM1 |
(310) 0x4392e8 PSLLQ $0x20,%XMM1 |
(310) 0x4392ed PSHUFD $-0x13,%XMM1,%XMM1 |
(310) 0x4392f2 MOVDQA %XMM1,%XMM2 |
(310) 0x4392f6 PSRAD $0x1f,%XMM2 |
(310) 0x4392fb PUNPCKLDQ %XMM2,%XMM1 |
(310) 0x4392ff PXOR %XMM3,%XMM3 |
(310) 0x439303 PCMPGTD %XMM0,%XMM3 |
(310) 0x439307 MOVDQA %XMM0,%XMM2 |
(310) 0x43930b PUNPCKLDQ %XMM3,%XMM2 |
(310) 0x43930f MOVDQA -0x150(%RBP),%XMM6 |
(310) 0x439317 MOVDQA %XMM6,%XMM4 |
(310) 0x43931b PMULUDQ %XMM2,%XMM4 |
(310) 0x43931f MOVDQA -0xc0(%RBP),%XMM5 |
(310) 0x439327 PMULUDQ %XMM2,%XMM5 |
(310) 0x43932b PSHUFD $-0x2c,%XMM3,%XMM3 |
(310) 0x439330 PMULUDQ %XMM6,%XMM3 |
(310) 0x439334 PADDQ %XMM5,%XMM3 |
(310) 0x439338 PSLLQ $0x20,%XMM3 |
(310) 0x43933d PADDQ %XMM1,%XMM4 |
(310) 0x439341 PADDQ %XMM3,%XMM4 |
(310) 0x439345 PSLLQ $0x3,%XMM4 |
(310) 0x43934a PADDQ -0x140(%RBP),%XMM4 |
(310) 0x439352 MOVQ %XMM4,%RAX |
(310) 0x439357 PSHUFD $-0x12,%XMM4,%XMM3 |
(310) 0x43935c MOVQ %XMM3,%RDX |
(310) 0x439361 MOVSD (%RAX),%XMM6 |
(310) 0x439365 MOVHPD (%RDX),%XMM6 |
(310) 0x439369 MOVAPD %XMM6,%XMM4 |
(310) 0x43936d CMPPD $0x1,0x5147a(%RIP),%XMM4 |
(310) 0x439376 MOVDQA %XMM0,%XMM13 |
(310) 0x43937b PCMPEQD %XMM3,%XMM3 |
(310) 0x43937f PSUBD %XMM3,%XMM13 |
(310) 0x439384 MOVDQA %XMM0,%XMM15 |
(310) 0x439389 PADDD %XMM3,%XMM15 |
(310) 0x43938e PXOR %XMM3,%XMM3 |
(310) 0x439392 PCMPGTD %XMM13,%XMM3 |
(310) 0x439397 MOVDQA %XMM13,%XMM10 |
(310) 0x43939c PUNPCKLDQ %XMM3,%XMM10 |
(310) 0x4393a1 PADDD 0x543b7(%RIP),%XMM0 |
(310) 0x4393a9 MOVAPD %XMM4,%XMM5 |
(310) 0x4393ad ANDNPD %XMM10,%XMM5 |
(310) 0x4393b2 MOVDQA %XMM2,%XMM3 |
(310) 0x4393b6 PAND %XMM4,%XMM3 |
(310) 0x4393ba POR %XMM5,%XMM3 |
(310) 0x4393be MOVDQA %XMM4,%XMM5 |
(310) 0x4393c2 PANDN %XMM2,%XMM5 |
(310) 0x4393c6 PAND %XMM4,%XMM10 |
(310) 0x4393cb POR %XMM5,%XMM10 |
(310) 0x4393d0 MOVDQA %XMM10,%XMM5 |
(310) 0x4393d5 PSRLQ $0x20,%XMM5 |
(310) 0x4393da MOVDQA -0x110(%RBP),%XMM7 |
(310) 0x4393e2 MOVDQA %XMM7,%XMM14 |
(310) 0x4393e7 PSRLQ $0x20,%XMM14 |
(310) 0x4393ed MOVDQA %XMM14,%XMM8 |
(310) 0x4393f2 PMULUDQ %XMM10,%XMM8 |
(310) 0x4393f7 MOVDQA %XMM7,%XMM9 |
(310) 0x4393fc PMULUDQ %XMM5,%XMM9 |
(310) 0x439401 PADDQ %XMM8,%XMM9 |
(310) 0x439406 PSLLQ $0x20,%XMM9 |
(310) 0x43940c MOVDQA %XMM7,%XMM8 |
(310) 0x439411 PMULUDQ %XMM10,%XMM8 |
(310) 0x439416 PADDQ %XMM1,%XMM8 |
(310) 0x43941b PADDQ %XMM9,%XMM8 |
(310) 0x439420 PSLLQ $0x3,%XMM8 |
(310) 0x439426 PADDQ %XMM11,%XMM8 |
(310) 0x43942b MOVQ %XMM8,%RAX |
(310) 0x439430 PSHUFD $-0x12,%XMM8,%XMM8 |
(310) 0x439436 MOVQ %XMM8,%RDX |
(310) 0x43943b PXOR %XMM8,%XMM8 |
(310) 0x439440 PCMPGTD %XMM15,%XMM8 |
(310) 0x439445 MOVDQA %XMM15,%XMM9 |
(310) 0x43944a PUNPCKLDQ %XMM8,%XMM9 |
(310) 0x43944f MOVDQA %XMM4,%XMM8 |
(310) 0x439454 PANDN %XMM9,%XMM8 |
(310) 0x439459 PXOR %XMM9,%XMM9 |
(310) 0x43945e PCMPGTD %XMM0,%XMM9 |
(310) 0x439463 PUNPCKLDQ %XMM9,%XMM0 |
(310) 0x439468 PAND %XMM4,%XMM0 |
(310) 0x43946c POR %XMM8,%XMM0 |
(310) 0x439471 MOVDQA %XMM14,%XMM8 |
(310) 0x439476 PMULUDQ %XMM0,%XMM8 |
(310) 0x43947b MOVDQA %XMM7,%XMM9 |
(310) 0x439480 PMULUDQ %XMM0,%XMM9 |
(310) 0x439485 PSRLQ $0x20,%XMM0 |
(310) 0x43948a PMULUDQ %XMM7,%XMM0 |
(310) 0x43948e PADDQ %XMM8,%XMM0 |
(310) 0x439493 MOVSD (%RAX),%XMM12 |
(310) 0x439498 MOVHPD (%RDX),%XMM12 |
(310) 0x43949d PSLLQ $0x20,%XMM0 |
(310) 0x4394a2 PADDQ %XMM1,%XMM9 |
(310) 0x4394a7 PADDQ %XMM0,%XMM9 |
(310) 0x4394ac PSLLQ $0x3,%XMM9 |
(310) 0x4394b2 PADDQ %XMM11,%XMM9 |
(310) 0x4394b7 MOVQ %XMM9,%RAX |
(310) 0x4394bc PSHUFD $-0x12,%XMM9,%XMM0 |
(310) 0x4394c2 MOVQ %XMM0,%RDX |
(310) 0x4394c7 MOVSD (%RAX),%XMM8 |
(310) 0x4394cc MOVHPD (%RDX),%XMM8 |
(310) 0x4394d1 PMULUDQ %XMM3,%XMM14 |
(310) 0x4394d6 MOVDQA %XMM7,%XMM9 |
(310) 0x4394db PMULUDQ %XMM3,%XMM9 |
(310) 0x4394e0 PSRLQ $0x20,%XMM3 |
(310) 0x4394e5 PMULUDQ %XMM7,%XMM3 |
(310) 0x4394e9 PADDQ %XMM14,%XMM3 |
(310) 0x4394ee MOVAPD %XMM12,%XMM0 |
(310) 0x4394f3 PSLLQ $0x20,%XMM3 |
(310) 0x4394f8 PADDQ %XMM1,%XMM9 |
(310) 0x4394fd PADDQ %XMM3,%XMM9 |
(310) 0x439502 PSLLQ $0x3,%XMM9 |
(310) 0x439508 PADDQ %XMM11,%XMM9 |
(310) 0x43950d MOVQ %XMM9,%RAX |
(310) 0x439512 PSHUFD $-0x12,%XMM9,%XMM3 |
(310) 0x439518 MOVQ %XMM3,%RDX |
(310) 0x43951d MOVSD (%RAX),%XMM3 |
(310) 0x439521 MOVHPD (%RDX),%XMM3 |
(310) 0x439525 SUBPD %XMM8,%XMM0 |
(310) 0x43952a SUBPD %XMM12,%XMM3 |
(310) 0x43952f MOVAPD %XMM3,%XMM8 |
(310) 0x439534 MULPD %XMM0,%XMM8 |
(310) 0x439539 PXOR %XMM14,%XMM14 |
(310) 0x43953e CMPPD $0x1,%XMM8,%XMM14 |
(310) 0x439544 MOVMSKPD %XMM14,%EAX |
(310) 0x439549 TEST %EAX,%EAX |
(310) 0x43954b JE 439557 |
(310) 0x43954d MOV -0x48(%RBP),%RDX |
(310) 0x439551 MOVQ 0x8(%RDX),%XMM9 |
(310) 0x439557 MOVDQA -0x130(%RBP),%XMM7 |
(310) 0x43955f MOVDQA %XMM7,%XMM8 |
(310) 0x439564 PSRLQ $0x20,%XMM8 |
(310) 0x43956a PMULUDQ %XMM10,%XMM8 |
(310) 0x43956f PMULUDQ %XMM7,%XMM5 |
(310) 0x439573 PADDQ %XMM8,%XMM5 |
(310) 0x439578 PSLLQ $0x20,%XMM5 |
(310) 0x43957d PMULUDQ %XMM7,%XMM10 |
(310) 0x439582 PADDQ %XMM1,%XMM10 |
(310) 0x439587 PADDQ %XMM5,%XMM10 |
(310) 0x43958c PSLLQ $0x3,%XMM10 |
(310) 0x439592 PADDQ -0x120(%RBP),%XMM10 |
(310) 0x43959b MOVQ %XMM10,%RDX |
(310) 0x4395a0 PSHUFD $-0x12,%XMM10,%XMM5 |
(310) 0x4395a6 MOVQ %XMM5,%RSI |
(310) 0x4395ab MOVSD (%RDX),%XMM8 |
(310) 0x4395b0 MOVHPD (%RSI),%XMM8 |
(310) 0x4395b5 PSHUFD $0x44,%XMM9,%XMM10 |
(310) 0x4395bb MOVDQA %XMM2,%XMM9 |
(310) 0x4395c0 PSLLQ $0x3,%XMM9 |
(310) 0x4395c6 PADDQ %XMM10,%XMM9 |
(310) 0x4395cb TEST $0x1,%AL |
(310) 0x4395cd JE 4395d8 |
(310) 0x4395cf MOVQ %XMM9,%RDX |
(310) 0x4395d4 MOVSD (%RDX),%XMM5 |
(310) 0x4395d8 TEST $0x2,%AL |
(310) 0x4395da MOV %R11,%R14 |
(310) 0x4395dd MOVAPD 0x5158b(%RIP),%XMM7 |
(310) 0x4395e5 JE 4395f6 |
(310) 0x4395e7 PSHUFD $-0x12,%XMM9,%XMM9 |
(310) 0x4395ed MOVQ %XMM9,%RDX |
(310) 0x4395f2 MOVHPD (%RDX),%XMM5 |
(310) 0x4395f6 MOV %R8,%R11 |
(310) 0x4395f9 MOV %R12,%R8 |
(310) 0x4395fc SHUFPS $-0x18,%XMM4,%XMM4 |
(310) 0x439600 PAND %XMM4,%XMM13 |
(310) 0x439605 PANDN %XMM15,%XMM4 |
(310) 0x43960a POR %XMM13,%XMM4 |
(310) 0x43960f MOVAPD %XMM6,%XMM13 |
(310) 0x439614 ANDPD %XMM7,%XMM13 |
(310) 0x439619 DIVPD %XMM8,%XMM13 |
(310) 0x43961e MOVAPD %XMM13,%XMM15 |
(310) 0x439623 ADDPD 0x52124(%RIP),%XMM15 |
(310) 0x43962c XORPD %XMM8,%XMM8 |
(310) 0x439631 PCMPGTD %XMM4,%XMM8 |
(310) 0x439636 PUNPCKLDQ %XMM8,%XMM4 |
(310) 0x43963b PSLLQ $0x3,%XMM4 |
(310) 0x439640 PADDQ %XMM4,%XMM10 |
(310) 0x439645 TEST $0x1,%AL |
(310) 0x439647 JE 439653 |
(310) 0x439649 MOVQ %XMM10,%RDX |
(310) 0x43964e MOVSD (%RDX),%XMM8 |
(310) 0x439653 ANDPD %XMM7,%XMM0 |
(310) 0x439657 MOVAPD %XMM3,%XMM4 |
(310) 0x43965b ANDPD %XMM7,%XMM4 |
(310) 0x43965f MOVAPD 0x520f8(%RIP),%XMM9 |
(310) 0x439668 SUBPD %XMM13,%XMM9 |
(310) 0x43966d MULPD %XMM4,%XMM9 |
(310) 0x439672 DIVPD %XMM5,%XMM9 |
(310) 0x439677 MULPD %XMM0,%XMM15 |
(310) 0x43967c TEST $0x2,%AL |
(310) 0x43967e JE 439180 |
(310) 0x439684 PSHUFD $-0x12,%XMM10,%XMM10 |
(310) 0x43968a MOVQ %XMM10,%RAX |
(310) 0x43968f MOVHPD (%RAX),%XMM8 |
(310) 0x439694 JMP 439180 |
0x439699 ADD $0x158,%RSP |
0x4396a0 POP %RBX |
0x4396a1 POP %R12 |
0x4396a3 POP %R13 |
0x4396a5 POP %R14 |
0x4396a7 POP %R15 |
0x4396a9 POP %RBP |
0x4396aa RET |
0x4396ab CMP %R13,-0x60(%RBP) |
0x4396af MOV -0x68(%RBP),%R15 |
0x4396b3 JNE 4396db |
0x4396b5 MOV $0x4aa8c0,%EDI |
0x4396ba MOV -0x30(%RBP),%ESI |
0x4396bd ADD $0x158,%RSP |
0x4396c4 POP %RBX |
0x4396c5 POP %R12 |
0x4396c7 POP %R13 |
0x4396c9 POP %R14 |
0x4396cb POP %R15 |
0x4396cd POP %RBP |
0x4396ce JMP 404050 |
0x4396d3 MOV %RDX,%R14 |
0x4396d6 MOV %R12,%R15 |
0x4396d9 JMP 4396de |
0x4396db ADD %R13,%RCX |
0x4396de PXOR %XMM0,%XMM0 |
0x4396e2 MOVAPD 0x51486(%RIP),%XMM1 |
0x4396ea MOVSD 0x5209e(%RIP),%XMM2 |
0x4396f2 MOVSD 0x51416(%RIP),%XMM3 |
0x4396fa MOVSD 0x52096(%RIP),%XMM4 |
0x439702 MOVAPD 0x52076(%RIP),%XMM5 |
0x43970a MOV %RBX,%R13 |
0x43970d JMP 43974e |
0x43970f NOP |
(309) 0x439710 MOVAPD %XMM3,%XMM9 |
(309) 0x439715 SUBSD %XMM7,%XMM9 |
(309) 0x43971a MULSD %XMM11,%XMM9 |
(309) 0x43971f ADDSD %XMM8,%XMM9 |
(309) 0x439724 MULSD %XMM6,%XMM9 |
(309) 0x439729 IMUL -0x78(%RBP),%RDX |
(309) 0x43972e ADD %RAX,%RDX |
(309) 0x439731 MOV -0x70(%RBP),%RAX |
(309) 0x439735 MOVSD %XMM9,(%RAX,%RDX,8) |
(309) 0x43973b INC %RCX |
(309) 0x43973e CMP %RCX,-0x90(%RBP) |
(309) 0x439745 MOV %R13,%RBX |
(309) 0x439748 JE 4396b5 |
(309) 0x43974e MOV %RCX,%RDI |
(309) 0x439751 SHR $0x20,%RDI |
(309) 0x439755 JE 439780 |
(309) 0x439757 MOV %RCX,%RAX |
(309) 0x43975a XOR %EDX,%EDX |
(309) 0x43975c DIV %RBX |
(309) 0x43975f MOV %RAX,%RSI |
(309) 0x439762 TEST %RDI,%RDI |
(309) 0x439765 JE 43978d |
(309) 0x439767 MOV %RCX,%RAX |
(309) 0x43976a CQTO |
(309) 0x43976c IDIV %RBX |
(309) 0x43976f JMP 439793 |
0x439771 NOPW %CS:(%RAX,%RAX,1) |
(309) 0x439780 MOV %ECX,%EAX |
(309) 0x439782 XOR %EDX,%EDX |
(309) 0x439784 DIV %EBX |
(309) 0x439786 MOV %EAX,%ESI |
(309) 0x439788 TEST %RDI,%RDI |
(309) 0x43978b JNE 439767 |
(309) 0x43978d MOV %ECX,%EAX |
(309) 0x43978f XOR %EDX,%EDX |
(309) 0x439791 DIV %EBX |
(309) 0x439793 ADD -0x2c(%RBP),%ESI |
(309) 0x439796 ADD -0x40(%RBP),%EDX |
(309) 0x439799 MOVSXD %EDX,%RAX |
(309) 0x43979c MOVSXD %ESI,%RDX |
(309) 0x43979f MOV %R14,%RDI |
(309) 0x4397a2 IMUL %RDX,%RDI |
(309) 0x4397a6 ADD %RAX,%RDI |
(309) 0x4397a9 MOVSD (%R11,%RDI,8),%XMM6 |
(309) 0x4397af LEA 0x1(%RDX),%EDI |
(309) 0x4397b2 UCOMISD %XMM6,%XMM0 |
(309) 0x4397b6 MOVSXD %EDI,%R10 |
(309) 0x4397b9 JBE 4397d0 |
(309) 0x4397bb ADD $0x2,%ESI |
(309) 0x4397be MOV %RDX,%R12 |
(309) 0x4397c1 JMP 4397da |
0x4397c3 NOPW %CS:(%RAX,%RAX,1) |
(309) 0x4397d0 DEC %ESI |
(309) 0x4397d2 MOV %R10,%R12 |
(309) 0x4397d5 MOV %RDX,%R10 |
(309) 0x4397d8 MOV %ESI,%EDI |
(309) 0x4397da MOVAPD %XMM6,%XMM7 |
(309) 0x4397de ANDPD %XMM1,%XMM7 |
(309) 0x4397e2 MOV %R8,%R9 |
(309) 0x4397e5 IMUL %R10,%R9 |
(309) 0x4397e9 ADD %RAX,%R9 |
(309) 0x4397ec MOV -0x88(%RBP),%RBX |
(309) 0x4397f3 DIVSD (%RBX,%R9,8),%XMM7 |
(309) 0x4397f9 MOV -0x80(%RBP),%R9 |
(309) 0x4397fd IMUL %R9,%R10 |
(309) 0x439801 ADD %RAX,%R10 |
(309) 0x439804 MOVSXD %ESI,%RSI |
(309) 0x439807 IMUL %R9,%RSI |
(309) 0x43980b ADD %RAX,%RSI |
(309) 0x43980e IMUL %R9,%R12 |
(309) 0x439812 ADD %RAX,%R12 |
(309) 0x439815 MOVSD (%R15,%R10,8),%XMM8 |
(309) 0x43981b MOVAPD %XMM8,%XMM9 |
(309) 0x439820 MOVHPD (%R15,%R12,8),%XMM9 |
(309) 0x439826 MOVSD (%R15,%RSI,8),%XMM10 |
(309) 0x43982c UNPCKLPD %XMM8,%XMM10 |
(309) 0x439831 SUBPD %XMM10,%XMM9 |
(309) 0x439836 MOVAPD %XMM9,%XMM10 |
(309) 0x43983b UNPCKHPD %XMM9,%XMM10 |
(309) 0x439840 MOVAPD %XMM10,%XMM12 |
(309) 0x439845 MULSD %XMM9,%XMM12 |
(309) 0x43984a PXOR %XMM11,%XMM11 |
(309) 0x43984f UCOMISD %XMM11,%XMM12 |
(309) 0x439854 JBE 439710 |
(309) 0x43985a MOV -0x48(%RBP),%RSI |
(309) 0x43985e MOV 0x8(%RSI),%RSI |
(309) 0x439862 ANDPD %XMM1,%XMM9 |
(309) 0x439867 MOVAPD %XMM2,%XMM11 |
(309) 0x43986c SUBSD %XMM7,%XMM11 |
(309) 0x439871 MOVAPD %XMM7,%XMM12 |
(309) 0x439876 ADDSD %XMM3,%XMM12 |
(309) 0x43987b UNPCKLPD %XMM11,%XMM12 |
(309) 0x439880 MOVSXD %EDI,%RDI |
(309) 0x439883 MOVSD (%RSI,%RDX,8),%XMM11 |
(309) 0x439889 MULPD %XMM9,%XMM12 |
(309) 0x43988e MOVSD (%RSI,%RDI,8),%XMM13 |
(309) 0x439894 UNPCKLPD %XMM11,%XMM13 |
(309) 0x439899 DIVPD %XMM13,%XMM12 |
(309) 0x43989e MOVAPD %XMM12,%XMM13 |
(309) 0x4398a3 UNPCKHPD %XMM12,%XMM13 |
(309) 0x4398a8 ADDSD %XMM12,%XMM13 |
(309) 0x4398ad MULSD %XMM4,%XMM11 |
(309) 0x4398b2 MULSD %XMM13,%XMM11 |
(309) 0x4398b7 PSHUFD $-0x12,%XMM9,%XMM12 |
(309) 0x4398bd MINSD %XMM9,%XMM12 |
(309) 0x4398c2 MINSD %XMM11,%XMM12 |
(309) 0x4398c7 XORPD %XMM11,%XMM11 |
(309) 0x4398cc CMPSD $0x1,%XMM10,%XMM11 |
(309) 0x4398d2 MOVAPD %XMM11,%XMM9 |
(309) 0x4398d7 ANDPD %XMM12,%XMM9 |
(309) 0x4398dc XORPD %XMM5,%XMM12 |
(309) 0x4398e1 ANDNPD %XMM12,%XMM11 |
(309) 0x4398e6 ORPD %XMM9,%XMM11 |
(309) 0x4398eb JMP 439710 |
Path / |
Source file and lines | advec_mom.cpp:180-211 |
Module | exec |
nb instructions | 148 |
nb uops | 155 |
loop length | 675 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 8 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 33 |
micro-operation queue | 25.83 cycles |
front end | 25.83 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 6.75 | 6.75 | 6.75 | 6.75 | 5.00 | 19.00 | 19.00 | 19.00 | 6.25 | 6.17 | 6.33 | 6.25 | 6.50 | 6.50 |
cycles | 6.75 | 6.75 | 6.75 | 6.75 | 5.00 | 19.00 | 19.00 | 19.00 | 6.25 | 6.17 | 6.33 | 6.25 | 6.50 | 6.50 |
Cycles executing div or sqrt instructions | NA |
Front-end | 25.83 |
Dispatch | 19.00 |
Overall L1 | 25.83 |
all | 37% |
load | 14% |
store | 46% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 11% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 46% |
all | 40% |
load | 40% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 37% |
load | 21% |
store | 46% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 11% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 46% |
all | 16% |
load | 12% |
store | 17% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 13% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 17% |
all | 17% |
load | 17% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 16% |
load | 13% |
store | 17% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 13% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 17% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB $0x158,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RCX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x38(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x28(%RBP),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x20(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RBP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x18(%RBP),%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %EDX,-0x2c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVL $0,-0x34(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
TEST %RAX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JS 439699 <_Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buffer1DIdEES5_iii.extracted.7+0x729> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %R9,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R8,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RCX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVQ $0,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RAX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVQ $0x1,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x98(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x34(%RBP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x58(%RBP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x50(%RBP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x4aa8a0,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %ESI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CALL 404240 <__kmpc_for_static_init_8@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0x58(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %RAX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JA 4396b5 <_Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buffer1DIdEES5_iii.extracted.7+0x745> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %EAX,%EBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%R13),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%R13),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R12),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%R12),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R15),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%R15),%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R14),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%R14),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
INC %RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RSI,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB %RCX,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $-0x2,%R13D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
AND %RSI,%R13 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDI,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R9,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R15,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R10,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
JE 4396d3 <_Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buffer1DIdEES5_iii.extracted.7+0x763> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %RSI,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVD %EBX,%XMM0 | 1 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
PSHUFD $0x44,%XMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVD -0x2c(%RBP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
PSHUFD $0x50,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x170(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %RAX,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x160(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %RDX,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVQ %R11,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x140(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %R8,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x130(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %RDI,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x120(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %R9,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x110(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOV %R12,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVQ %R12,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x100(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %R15,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %R10,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %RCX,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
PADDQ 0x52450(%RIP),%XMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.50 |
XOR %R10D,%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOVDQA %XMM1,-0x180(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
PSHUFD $-0x12,%XMM1,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVDQA %XMM2,-0x150(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
PSRLQ $0x20,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVDQA %XMM2,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOV %RDX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOVDQA -0x100(%RBP),%XMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
JMP 43925d <_Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buffer1DIdEES5_iii.extracted.7+0x2ed> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
ADD $0x158,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %R13,-0x60(%RBP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV -0x68(%RBP),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
JNE 4396db <_Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buffer1DIdEES5_iii.extracted.7+0x76b> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV $0x4aa8c0,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0x30(%RBP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD $0x158,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
JMP 404050 <__kmpc_for_static_fini@plt> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
MOV %RDX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R12,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4396de <_Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buffer1DIdEES5_iii.extracted.7+0x76e> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
ADD %R13,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PXOR %XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOVAPD 0x51486(%RIP),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOVSD 0x5209e(%RIP),%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSD 0x51416(%RIP),%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSD 0x52096(%RIP),%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVAPD 0x52076(%RIP),%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOV %RBX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 43974e <_Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buffer1DIdEES5_iii.extracted.7+0x7de> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
Source file and lines | advec_mom.cpp:180-211 |
Module | exec |
nb instructions | 148 |
nb uops | 155 |
loop length | 675 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 8 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 33 |
micro-operation queue | 25.83 cycles |
front end | 25.83 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 6.75 | 6.75 | 6.75 | 6.75 | 5.00 | 19.00 | 19.00 | 19.00 | 6.25 | 6.17 | 6.33 | 6.25 | 6.50 | 6.50 |
cycles | 6.75 | 6.75 | 6.75 | 6.75 | 5.00 | 19.00 | 19.00 | 19.00 | 6.25 | 6.17 | 6.33 | 6.25 | 6.50 | 6.50 |
Cycles executing div or sqrt instructions | NA |
Front-end | 25.83 |
Dispatch | 19.00 |
Overall L1 | 25.83 |
all | 37% |
load | 14% |
store | 46% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 11% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 46% |
all | 40% |
load | 40% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 37% |
load | 21% |
store | 46% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 11% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 46% |
all | 16% |
load | 12% |
store | 17% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 13% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 17% |
all | 17% |
load | 17% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 16% |
load | 13% |
store | 17% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 13% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 17% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB $0x158,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RCX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x38(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x28(%RBP),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x20(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RBP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x18(%RBP),%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %EDX,-0x2c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVL $0,-0x34(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
TEST %RAX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JS 439699 <_Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buffer1DIdEES5_iii.extracted.7+0x729> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %R9,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R8,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RCX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVQ $0,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RAX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVQ $0x1,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x98(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x34(%RBP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x58(%RBP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x50(%RBP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x4aa8a0,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %ESI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CALL 404240 <__kmpc_for_static_init_8@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0x58(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %RAX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JA 4396b5 <_Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buffer1DIdEES5_iii.extracted.7+0x745> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %EAX,%EBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%R13),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%R13),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R12),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%R12),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R15),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%R15),%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R14),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%R14),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
INC %RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RSI,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB %RCX,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $-0x2,%R13D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
AND %RSI,%R13 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDI,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R9,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R15,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R10,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
JE 4396d3 <_Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buffer1DIdEES5_iii.extracted.7+0x763> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %RSI,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVD %EBX,%XMM0 | 1 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
PSHUFD $0x44,%XMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVD -0x2c(%RBP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
PSHUFD $0x50,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x170(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %RAX,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x160(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %RDX,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVQ %R11,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x140(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %R8,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x130(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %RDI,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x120(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %R9,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x110(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOV %R12,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVQ %R12,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x100(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %R15,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %R10,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %RCX,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
PADDQ 0x52450(%RIP),%XMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.50 |
XOR %R10D,%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOVDQA %XMM1,-0x180(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
PSHUFD $-0x12,%XMM1,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVDQA %XMM2,-0x150(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
PSRLQ $0x20,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVDQA %XMM2,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOV %RDX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOVDQA -0x100(%RBP),%XMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
JMP 43925d <_Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buffer1DIdEES5_iii.extracted.7+0x2ed> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
ADD $0x158,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %R13,-0x60(%RBP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV -0x68(%RBP),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
JNE 4396db <_Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buffer1DIdEES5_iii.extracted.7+0x76b> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV $0x4aa8c0,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0x30(%RBP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD $0x158,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
JMP 404050 <__kmpc_for_static_fini@plt> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
MOV %RDX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R12,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4396de <_Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buffer1DIdEES5_iii.extracted.7+0x76e> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
ADD %R13,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PXOR %XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOVAPD 0x51486(%RIP),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOVSD 0x5209e(%RIP),%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSD 0x51416(%RIP),%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSD 0x52096(%RIP),%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVAPD 0x52076(%RIP),%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOV %RBX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 43974e <_Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buffer1DIdEES5_iii.extracted.7+0x7de> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼_Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buffer1DIdEES5_iii.extracted.7– | 5.25 | 2.88 |
○Loop 310 - advec_mom.cpp:180-211 - exec | 5.25 | 2.88 |
○Loop 309 - advec_mom.cpp:180-211 - exec | 0 | 0 |