Function: _Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buf ... | Module: exec | Source: advec_mom.cpp:108-139 [...] | Coverage: 4.83% |
---|
Function: _Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buf ... | Module: exec | Source: advec_mom.cpp:108-139 [...] | Coverage: 4.83% |
---|
/beegfs/hackathon/users/eoseret/qaas_runs/170-854-8685/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/advec_mom.cpp: 108 - 139 |
-------------------------------------------------------------------------------- |
108: #pragma omp parallel for simd collapse(2) |
109: for (int j = (y_min + 1); j < (y_max + 1 + 2); j++) { |
110: for (int i = (x_min - 1 + 1); i < (x_max + 1 + 2); i++) |
111: ({ |
112: int upwind, donor, downwind, dif; |
113: double sigma, width, limiter, vdiffuw, vdiffdw, auw, adw, wind, advec_vel_s; |
114: if (node_flux(i, j) < 0.0) { |
115: upwind = i + 2; |
116: donor = i + 1; |
117: downwind = i; |
118: dif = donor; |
119: } else { |
120: upwind = i - 1; |
121: donor = i; |
122: downwind = i + 1; |
123: dif = upwind; |
124: } |
125: sigma = std::fabs(node_flux(i, j)) / (node_mass_pre(donor, j)); |
126: width = celldx[i]; |
127: vdiffuw = vel1(donor, j) - vel1(upwind, j); |
128: vdiffdw = vel1(downwind, j) - vel1(donor, j); |
129: limiter = 0.0; |
130: if (vdiffuw * vdiffdw > 0.0) { |
131: auw = std::fabs(vdiffuw); |
132: adw = std::fabs(vdiffdw); |
133: wind = 1.0; |
134: if (vdiffdw <= 0.0) wind = -1.0; |
135: limiter = |
136: wind * std::fmin(std::fmin(width * ((2.0 - sigma) * adw / width + (1.0 + sigma) * auw / celldx[dif]) / 6.0, auw), adw); |
137: } |
138: advec_vel_s = vel1(donor, j) + (1.0 - sigma) * limiter; |
139: mom_flux(i, j) = advec_vel_s * node_flux(i, j); |
/beegfs/hackathon/users/eoseret/qaas_runs/170-854-8685/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/context.h: 46 - 69 |
-------------------------------------------------------------------------------- |
46: T &operator[](size_t i) const { return data[i]; } |
[...] |
69: T &operator()(size_t i, size_t j) const { return data[i + j * sizeX]; } |
0x43aba0 PUSH %RBP |
0x43aba1 MOV %RSP,%RBP |
0x43aba4 PUSH %R15 |
0x43aba6 PUSH %R14 |
0x43aba8 PUSH %R13 |
0x43abaa PUSH %R12 |
0x43abac PUSH %RBX |
0x43abad SUB $0x158,%RSP |
0x43abb4 MOV %RCX,%R13 |
0x43abb7 MOV %RDX,%R15 |
0x43abba MOV 0x38(%RBP),%RAX |
0x43abbe MOV 0x28(%RBP),%RDX |
0x43abc2 MOV 0x20(%RBP),%R14 |
0x43abc6 MOV 0x18(%RBP),%RCX |
0x43abca MOV %RCX,-0x40(%RBP) |
0x43abce MOV 0x10(%RBP),%RCX |
0x43abd2 MOV %RCX,-0x48(%RBP) |
0x43abd6 MOVL $0,-0x30(%RBP) |
0x43abdd TEST %RAX,%RAX |
0x43abe0 JS 43b26a |
0x43abe6 MOV %R8,%R12 |
0x43abe9 MOV %R9,-0x70(%RBP) |
0x43abed MOV (%RDI),%ESI |
0x43abef MOVQ $0,-0x58(%RBP) |
0x43abf7 MOV %RAX,-0x50(%RBP) |
0x43abfb MOVQ $0x1,-0xa8(%RBP) |
0x43ac06 SUB $0x8,%RSP |
0x43ac0a LEA -0xa8(%RBP),%RAX |
0x43ac11 LEA -0x30(%RBP),%RCX |
0x43ac15 LEA -0x58(%RBP),%R8 |
0x43ac19 MOV %RDX,%RBX |
0x43ac1c LEA -0x50(%RBP),%R9 |
0x43ac20 MOV $0x4aaa20,%EDI |
0x43ac25 MOV %ESI,-0x2c(%RBP) |
0x43ac28 MOV $0x22,%EDX |
0x43ac2d PUSH $0x1 |
0x43ac2f PUSH $0x1 |
0x43ac31 PUSH %RAX |
0x43ac32 CALL 404240 <__kmpc_for_static_init_8@plt> |
0x43ac37 ADD $0x20,%RSP |
0x43ac3b MOV -0x58(%RBP),%RCX |
0x43ac3f MOV -0x50(%RBP),%RAX |
0x43ac43 CMP %RAX,%RCX |
0x43ac46 JA 43b286 |
0x43ac4c MOV %RBX,%R9 |
0x43ac4f MOV %RAX,%RDX |
0x43ac52 SUB %R14D,%R9D |
0x43ac55 MOV (%R13),%RAX |
0x43ac59 MOV 0x10(%R13),%R13 |
0x43ac5d MOV (%R12),%R8 |
0x43ac61 MOV 0x10(%R12),%RSI |
0x43ac66 MOV (%R15),%R11 |
0x43ac69 MOV 0x10(%R15),%R15 |
0x43ac6d MOV -0x70(%RBP),%R10 |
0x43ac71 MOV (%R10),%RDI |
0x43ac74 MOV 0x10(%R10),%R10 |
0x43ac78 INC %RDX |
0x43ac7b MOV %RDX,-0xa0(%RBP) |
0x43ac82 SUB %RCX,%RDX |
0x43ac85 MOV $-0x2,%EBX |
0x43ac8a AND %RDX,%RBX |
0x43ac8d MOV %R9,-0x38(%RBP) |
0x43ac91 MOV %RSI,-0x98(%RBP) |
0x43ac98 MOV %R11,-0x90(%RBP) |
0x43ac9f MOV %RDI,-0x88(%RBP) |
0x43aca6 MOV %R10,-0x80(%RBP) |
0x43acaa JE 43b2a4 |
0x43acb0 MOV %RDX,-0x78(%RBP) |
0x43acb4 MOVD %R9D,%XMM0 |
0x43acb9 PSHUFD $0x44,%XMM0,%XMM1 |
0x43acbe MOVQ -0x40(%RBP),%XMM0 |
0x43acc3 PSHUFD $0x44,%XMM0,%XMM0 |
0x43acc8 MOVDQA %XMM0,-0x170(%RBP) |
0x43acd0 MOVD %R14D,%XMM0 |
0x43acd5 PSHUFD $0x50,%XMM0,%XMM0 |
0x43acda MOVDQA %XMM0,-0x160(%RBP) |
0x43ace2 MOVQ %RAX,%XMM0 |
0x43ace7 PSHUFD $0x44,%XMM0,%XMM2 |
0x43acec MOVQ %R13,%XMM0 |
0x43acf1 PSHUFD $0x44,%XMM0,%XMM0 |
0x43acf6 MOVDQA %XMM0,-0x140(%RBP) |
0x43acfe MOVQ %R8,%XMM0 |
0x43ad03 PSHUFD $0x44,%XMM0,%XMM0 |
0x43ad08 MOVDQA %XMM0,-0x130(%RBP) |
0x43ad10 MOVQ %RSI,%XMM0 |
0x43ad15 PSHUFD $0x44,%XMM0,%XMM0 |
0x43ad1a MOVDQA %XMM0,-0x120(%RBP) |
0x43ad22 MOVQ %R11,%XMM0 |
0x43ad27 PSHUFD $0x44,%XMM0,%XMM0 |
0x43ad2c MOVDQA %XMM0,-0x110(%RBP) |
0x43ad34 MOVQ %R15,%XMM0 |
0x43ad39 PSHUFD $0x44,%XMM0,%XMM0 |
0x43ad3e MOVDQA %XMM0,-0x100(%RBP) |
0x43ad46 MOVQ %RDI,%XMM0 |
0x43ad4b PSHUFD $0x44,%XMM0,%XMM0 |
0x43ad50 MOVDQA %XMM0,-0xf0(%RBP) |
0x43ad58 MOVQ %R10,%XMM0 |
0x43ad5d PSHUFD $0x44,%XMM0,%XMM0 |
0x43ad62 MOVDQA %XMM0,-0xe0(%RBP) |
0x43ad6a MOVQ %RCX,%XMM0 |
0x43ad6f PSHUFD $0x44,%XMM0,%XMM9 |
0x43ad75 PADDQ 0x50812(%RIP),%XMM9 |
0x43ad7e XOR %R9D,%R9D |
0x43ad81 MOVDQA %XMM1,-0x180(%RBP) |
0x43ad89 PSHUFD $-0x12,%XMM1,%XMM0 |
0x43ad8e MOVDQA %XMM0,-0xd0(%RBP) |
0x43ad96 MOVDQA %XMM2,-0x150(%RBP) |
0x43ad9e PSRLQ $0x20,%XMM2 |
0x43ada3 MOVDQA %XMM2,-0xc0(%RBP) |
0x43adab MOV %RAX,%R12 |
0x43adae JMP 43ae97 |
0x43adb3 NOPW %CS:(%RAX,%RAX,1) |
(318) 0x43adc0 MOVDQA -0x70(%RBP),%XMM9 |
(318) 0x43adc6 DIVPD %XMM7,%XMM14 |
(318) 0x43adcb ADDPD %XMM8,%XMM14 |
(318) 0x43add0 XORPD %XMM7,%XMM7 |
(318) 0x43add4 CMPPD $0x1,%XMM3,%XMM7 |
(318) 0x43add9 MULPD 0x5098f(%RIP),%XMM6 |
(318) 0x43ade1 MULPD %XMM14,%XMM6 |
(318) 0x43ade6 MINPD %XMM4,%XMM0 |
(318) 0x43adea MINPD %XMM6,%XMM0 |
(318) 0x43adee MOVAPD %XMM0,%XMM3 |
(318) 0x43adf2 XORPD 0x50986(%RIP),%XMM3 |
(318) 0x43adfa ANDPD %XMM7,%XMM0 |
(318) 0x43adfe ANDNPD %XMM3,%XMM7 |
(318) 0x43ae02 ORPD %XMM0,%XMM7 |
(318) 0x43ae06 ANDPD %XMM7,%XMM13 |
(318) 0x43ae0b MOVAPD 0x5093d(%RIP),%XMM0 |
(318) 0x43ae13 SUBPD %XMM5,%XMM0 |
(318) 0x43ae17 MULPD %XMM13,%XMM0 |
(318) 0x43ae1c ADDPD %XMM12,%XMM0 |
(318) 0x43ae21 MULPD %XMM10,%XMM0 |
(318) 0x43ae26 MOVDQA -0xf0(%RBP),%XMM5 |
(318) 0x43ae2e MOVDQA %XMM5,%XMM3 |
(318) 0x43ae32 PSRLQ $0x20,%XMM3 |
(318) 0x43ae37 PMULUDQ %XMM2,%XMM3 |
(318) 0x43ae3b MOVDQA %XMM5,%XMM4 |
(318) 0x43ae3f PMULUDQ %XMM2,%XMM4 |
(318) 0x43ae43 PSRLQ $0x20,%XMM2 |
(318) 0x43ae48 PMULUDQ %XMM5,%XMM2 |
(318) 0x43ae4c PADDQ %XMM3,%XMM2 |
(318) 0x43ae50 PADDQ %XMM1,%XMM4 |
(318) 0x43ae54 PSLLQ $0x20,%XMM2 |
(318) 0x43ae59 PADDQ %XMM2,%XMM4 |
(318) 0x43ae5d PSLLQ $0x3,%XMM4 |
(318) 0x43ae62 PADDQ -0xe0(%RBP),%XMM4 |
(318) 0x43ae6a MOVQ %XMM4,%RAX |
(318) 0x43ae6f PSHUFD $-0x12,%XMM4,%XMM1 |
(318) 0x43ae74 MOVQ %XMM1,%RDX |
(318) 0x43ae79 MOVLPD %XMM0,(%RAX) |
(318) 0x43ae7d MOVHPD %XMM0,(%RDX) |
(318) 0x43ae81 PADDQ 0x50726(%RIP),%XMM9 |
(318) 0x43ae8a ADD $0x2,%R9 |
(318) 0x43ae8e CMP %RBX,%R9 |
(318) 0x43ae91 JAE 43b27c |
(318) 0x43ae97 MOV %R8,%R10 |
(318) 0x43ae9a MOV %R13,%R8 |
(318) 0x43ae9d MOV %R12,%R13 |
(318) 0x43aea0 MOVQ %XMM9,%RSI |
(318) 0x43aea5 MOVDQA -0x180(%RBP),%XMM0 |
(318) 0x43aead MOVQ %XMM0,%R12 |
(318) 0x43aeb2 MOV %RSI,%RAX |
(318) 0x43aeb5 XOR %EDX,%EDX |
(318) 0x43aeb7 DIV %R12 |
(318) 0x43aeba MOVQ %RAX,%XMM6 |
(318) 0x43aebf MOVDQA %XMM9,-0x70(%RBP) |
(318) 0x43aec5 PSHUFD $-0x12,%XMM9,%XMM0 |
(318) 0x43aecb MOVQ %XMM0,%RDI |
(318) 0x43aed0 MOVDQA -0xd0(%RBP),%XMM0 |
(318) 0x43aed8 MOVQ %XMM0,%R11 |
(318) 0x43aedd MOV %RDI,%RAX |
(318) 0x43aee0 XOR %EDX,%EDX |
(318) 0x43aee2 DIV %R11 |
(318) 0x43aee5 MOVQ %RAX,%XMM0 |
(318) 0x43aeea PUNPCKLQDQ %XMM0,%XMM6 |
(318) 0x43aeee PADDQ -0x170(%RBP),%XMM6 |
(318) 0x43aef6 MOV %RSI,%RAX |
(318) 0x43aef9 CQTO |
(318) 0x43aefb IDIV %R12 |
(318) 0x43aefe MOVQ %RDX,%XMM0 |
(318) 0x43af03 MOV %RDI,%RAX |
(318) 0x43af06 CQTO |
(318) 0x43af08 IDIV %R11 |
(318) 0x43af0b MOVQ %RDX,%XMM1 |
(318) 0x43af10 PUNPCKLQDQ %XMM1,%XMM0 |
(318) 0x43af14 PSHUFD $-0x18,%XMM0,%XMM0 |
(318) 0x43af19 PADDD -0x160(%RBP),%XMM0 |
(318) 0x43af21 PXOR %XMM2,%XMM2 |
(318) 0x43af25 PCMPGTD %XMM0,%XMM2 |
(318) 0x43af29 MOVDQA %XMM0,%XMM1 |
(318) 0x43af2d PUNPCKLDQ %XMM2,%XMM1 |
(318) 0x43af31 PSHUFD $-0x18,%XMM6,%XMM2 |
(318) 0x43af36 PSLLQ $0x20,%XMM6 |
(318) 0x43af3b PSRAD $0x1f,%XMM6 |
(318) 0x43af40 PSHUFD $-0x13,%XMM6,%XMM3 |
(318) 0x43af45 PUNPCKLDQ %XMM3,%XMM2 |
(318) 0x43af49 MOVDQA -0x150(%RBP),%XMM5 |
(318) 0x43af51 MOVDQA %XMM5,%XMM3 |
(318) 0x43af55 PMULUDQ %XMM2,%XMM3 |
(318) 0x43af59 MOVDQA -0xc0(%RBP),%XMM4 |
(318) 0x43af61 PMULUDQ %XMM2,%XMM4 |
(318) 0x43af65 PSRLQ $0x20,%XMM6 |
(318) 0x43af6a PMULUDQ %XMM6,%XMM5 |
(318) 0x43af6e PADDQ %XMM4,%XMM5 |
(318) 0x43af72 PSLLQ $0x20,%XMM5 |
(318) 0x43af77 PADDQ %XMM1,%XMM3 |
(318) 0x43af7b PADDQ %XMM5,%XMM3 |
(318) 0x43af7f PSLLQ $0x3,%XMM3 |
(318) 0x43af84 PADDQ -0x140(%RBP),%XMM3 |
(318) 0x43af8c MOVQ %XMM3,%RAX |
(318) 0x43af91 PSHUFD $-0x12,%XMM3,%XMM3 |
(318) 0x43af96 MOVQ %XMM3,%RDX |
(318) 0x43af9b MOVSD (%RAX),%XMM10 |
(318) 0x43afa0 MOVHPD (%RDX),%XMM10 |
(318) 0x43afa5 MOVAPD %XMM10,%XMM4 |
(318) 0x43afaa CMPPD $0x1,0x4f83d(%RIP),%XMM4 |
(318) 0x43afb3 MOVDQA %XMM0,%XMM5 |
(318) 0x43afb7 PCMPEQD %XMM3,%XMM3 |
(318) 0x43afbb PSUBD %XMM3,%XMM5 |
(318) 0x43afbf MOVDQA %XMM0,%XMM14 |
(318) 0x43afc4 PADDD %XMM3,%XMM14 |
(318) 0x43afc9 PXOR %XMM3,%XMM3 |
(318) 0x43afcd PCMPGTD %XMM5,%XMM3 |
(318) 0x43afd1 MOVDQA %XMM5,%XMM15 |
(318) 0x43afd6 PUNPCKLDQ %XMM3,%XMM15 |
(318) 0x43afdb PADDD 0x5277d(%RIP),%XMM0 |
(318) 0x43afe3 MOVAPD %XMM4,%XMM7 |
(318) 0x43afe7 ANDNPD %XMM15,%XMM7 |
(318) 0x43afec MOVDQA %XMM1,%XMM3 |
(318) 0x43aff0 PAND %XMM4,%XMM3 |
(318) 0x43aff4 POR %XMM7,%XMM3 |
(318) 0x43aff8 MOVDQA %XMM4,%XMM7 |
(318) 0x43affc PANDN %XMM1,%XMM7 |
(318) 0x43b000 PAND %XMM4,%XMM15 |
(318) 0x43b005 POR %XMM7,%XMM15 |
(318) 0x43b00a MOVDQA -0x110(%RBP),%XMM13 |
(318) 0x43b013 MOVDQA %XMM13,%XMM7 |
(318) 0x43b018 PMULUDQ %XMM2,%XMM7 |
(318) 0x43b01c MOVDQA %XMM13,%XMM8 |
(318) 0x43b021 PSRLQ $0x20,%XMM8 |
(318) 0x43b027 PMULUDQ %XMM2,%XMM8 |
(318) 0x43b02c PMULUDQ %XMM6,%XMM13 |
(318) 0x43b031 PADDQ %XMM8,%XMM13 |
(318) 0x43b036 PSLLQ $0x20,%XMM13 |
(318) 0x43b03c PADDQ %XMM7,%XMM13 |
(318) 0x43b041 MOVDQA %XMM13,%XMM7 |
(318) 0x43b046 PADDQ %XMM15,%XMM7 |
(318) 0x43b04b PSLLQ $0x3,%XMM7 |
(318) 0x43b050 MOVDQA -0x100(%RBP),%XMM9 |
(318) 0x43b059 PADDQ %XMM9,%XMM7 |
(318) 0x43b05e MOVQ %XMM7,%RAX |
(318) 0x43b063 PSHUFD $-0x12,%XMM7,%XMM7 |
(318) 0x43b068 MOVQ %XMM7,%RDX |
(318) 0x43b06d PXOR %XMM7,%XMM7 |
(318) 0x43b071 PCMPGTD %XMM14,%XMM7 |
(318) 0x43b076 MOVDQA %XMM14,%XMM8 |
(318) 0x43b07b PUNPCKLDQ %XMM7,%XMM8 |
(318) 0x43b080 MOVDQA %XMM4,%XMM7 |
(318) 0x43b084 PANDN %XMM8,%XMM7 |
(318) 0x43b089 PXOR %XMM8,%XMM8 |
(318) 0x43b08e PCMPGTD %XMM0,%XMM8 |
(318) 0x43b093 PUNPCKLDQ %XMM8,%XMM0 |
(318) 0x43b098 MOVSD (%RAX),%XMM12 |
(318) 0x43b09d MOVHPD (%RDX),%XMM12 |
(318) 0x43b0a2 PAND %XMM4,%XMM0 |
(318) 0x43b0a6 POR %XMM7,%XMM0 |
(318) 0x43b0aa PADDQ %XMM13,%XMM0 |
(318) 0x43b0af PSLLQ $0x3,%XMM0 |
(318) 0x43b0b4 PADDQ %XMM9,%XMM0 |
(318) 0x43b0b9 MOVQ %XMM0,%RAX |
(318) 0x43b0be PSHUFD $-0x12,%XMM0,%XMM0 |
(318) 0x43b0c3 MOVQ %XMM0,%RDX |
(318) 0x43b0c8 MOVSD (%RAX),%XMM7 |
(318) 0x43b0cc MOVHPD (%RDX),%XMM7 |
(318) 0x43b0d0 MOVAPD %XMM12,%XMM0 |
(318) 0x43b0d5 PADDQ %XMM3,%XMM13 |
(318) 0x43b0da PSLLQ $0x3,%XMM13 |
(318) 0x43b0e0 PADDQ %XMM9,%XMM13 |
(318) 0x43b0e5 MOVQ %XMM13,%RAX |
(318) 0x43b0ea PSHUFD $-0x12,%XMM13,%XMM3 |
(318) 0x43b0f0 MOVQ %XMM3,%RDX |
(318) 0x43b0f5 MOVSD (%RAX),%XMM3 |
(318) 0x43b0f9 MOVHPD (%RDX),%XMM3 |
(318) 0x43b0fd SUBPD %XMM7,%XMM0 |
(318) 0x43b101 SUBPD %XMM12,%XMM3 |
(318) 0x43b106 MOVAPD %XMM3,%XMM7 |
(318) 0x43b10a MULPD %XMM0,%XMM7 |
(318) 0x43b10e PXOR %XMM13,%XMM13 |
(318) 0x43b113 CMPPD $0x1,%XMM7,%XMM13 |
(318) 0x43b119 MOVMSKPD %XMM13,%EAX |
(318) 0x43b11e TEST %EAX,%EAX |
(318) 0x43b120 JE 43b12b |
(318) 0x43b122 MOV -0x48(%RBP),%RDX |
(318) 0x43b126 MOVQ 0x8(%RDX),%XMM7 |
(318) 0x43b12b MOVDQA -0x130(%RBP),%XMM8 |
(318) 0x43b134 MOVDQA %XMM8,%XMM11 |
(318) 0x43b139 PMULUDQ %XMM2,%XMM11 |
(318) 0x43b13e MOVDQA %XMM8,%XMM9 |
(318) 0x43b143 PSRLQ $0x20,%XMM9 |
(318) 0x43b149 PMULUDQ %XMM2,%XMM9 |
(318) 0x43b14e PMULUDQ %XMM8,%XMM6 |
(318) 0x43b153 PADDQ %XMM9,%XMM6 |
(318) 0x43b158 PSLLQ $0x20,%XMM6 |
(318) 0x43b15d PADDQ %XMM11,%XMM6 |
(318) 0x43b162 PADDQ %XMM15,%XMM6 |
(318) 0x43b167 PSLLQ $0x3,%XMM6 |
(318) 0x43b16c PADDQ -0x120(%RBP),%XMM6 |
(318) 0x43b174 MOVQ %XMM6,%RDX |
(318) 0x43b179 PSHUFD $-0x12,%XMM6,%XMM6 |
(318) 0x43b17e MOVQ %XMM6,%RSI |
(318) 0x43b183 MOVSD (%RDX),%XMM8 |
(318) 0x43b188 MOVHPD (%RSI),%XMM8 |
(318) 0x43b18d PSHUFD $0x44,%XMM7,%XMM15 |
(318) 0x43b193 MOVDQA %XMM1,%XMM7 |
(318) 0x43b197 PSLLQ $0x3,%XMM7 |
(318) 0x43b19c PADDQ %XMM15,%XMM7 |
(318) 0x43b1a1 TEST $0x1,%AL |
(318) 0x43b1a3 JE 43b1ae |
(318) 0x43b1a5 MOVQ %XMM7,%RDX |
(318) 0x43b1aa MOVSD (%RDX),%XMM6 |
(318) 0x43b1ae TEST $0x2,%AL |
(318) 0x43b1b0 MOV %R13,%R12 |
(318) 0x43b1b3 MOVAPD 0x4f9b4(%RIP),%XMM9 |
(318) 0x43b1bc JE 43b1cc |
(318) 0x43b1be PSHUFD $-0x12,%XMM7,%XMM7 |
(318) 0x43b1c3 MOVQ %XMM7,%RDX |
(318) 0x43b1c8 MOVHPD (%RDX),%XMM6 |
(318) 0x43b1cc MOV %R8,%R13 |
(318) 0x43b1cf MOV %R10,%R8 |
(318) 0x43b1d2 SHUFPS $-0x18,%XMM4,%XMM4 |
(318) 0x43b1d6 PAND %XMM4,%XMM5 |
(318) 0x43b1da PANDN %XMM14,%XMM4 |
(318) 0x43b1df POR %XMM5,%XMM4 |
(318) 0x43b1e3 MOVAPD %XMM10,%XMM5 |
(318) 0x43b1e8 ANDPD %XMM9,%XMM5 |
(318) 0x43b1ed DIVPD %XMM8,%XMM5 |
(318) 0x43b1f2 MOVAPD %XMM5,%XMM14 |
(318) 0x43b1f7 ADDPD 0x50550(%RIP),%XMM14 |
(318) 0x43b200 PXOR %XMM7,%XMM7 |
(318) 0x43b204 PCMPGTD %XMM4,%XMM7 |
(318) 0x43b208 PUNPCKLDQ %XMM7,%XMM4 |
(318) 0x43b20c PSLLQ $0x3,%XMM4 |
(318) 0x43b211 PADDQ %XMM4,%XMM15 |
(318) 0x43b216 TEST $0x1,%AL |
(318) 0x43b218 JE 43b223 |
(318) 0x43b21a MOVQ %XMM15,%RDX |
(318) 0x43b21f MOVSD (%RDX),%XMM7 |
(318) 0x43b223 ANDPD %XMM9,%XMM0 |
(318) 0x43b228 MOVAPD %XMM3,%XMM4 |
(318) 0x43b22c ANDPD %XMM9,%XMM4 |
(318) 0x43b231 MOVAPD 0x50526(%RIP),%XMM8 |
(318) 0x43b23a SUBPD %XMM5,%XMM8 |
(318) 0x43b23f MULPD %XMM4,%XMM8 |
(318) 0x43b244 DIVPD %XMM6,%XMM8 |
(318) 0x43b249 MULPD %XMM0,%XMM14 |
(318) 0x43b24e TEST $0x2,%AL |
(318) 0x43b250 JE 43adc0 |
(318) 0x43b256 PSHUFD $-0x12,%XMM15,%XMM9 |
(318) 0x43b25c MOVQ %XMM9,%RAX |
(318) 0x43b261 MOVHPD (%RAX),%XMM7 |
(318) 0x43b265 JMP 43adc0 |
0x43b26a ADD $0x158,%RSP |
0x43b271 POP %RBX |
0x43b272 POP %R12 |
0x43b274 POP %R13 |
0x43b276 POP %R14 |
0x43b278 POP %R15 |
0x43b27a POP %RBP |
0x43b27b RET |
0x43b27c CMP %RBX,-0x78(%RBP) |
0x43b280 MOV -0x38(%RBP),%R9 |
0x43b284 JNE 43b2a9 |
0x43b286 MOV $0x4aaa40,%EDI |
0x43b28b MOV -0x2c(%RBP),%ESI |
0x43b28e ADD $0x158,%RSP |
0x43b295 POP %RBX |
0x43b296 POP %R12 |
0x43b298 POP %R13 |
0x43b29a POP %R14 |
0x43b29c POP %R15 |
0x43b29e POP %RBP |
0x43b29f JMP 404050 |
0x43b2a4 MOV %RAX,%R12 |
0x43b2a7 JMP 43b2ac |
0x43b2a9 ADD %RBX,%RCX |
0x43b2ac PXOR %XMM0,%XMM0 |
0x43b2b0 MOVAPD 0x4f8b8(%RIP),%XMM1 |
0x43b2b8 MOVSD 0x504d0(%RIP),%XMM2 |
0x43b2c0 MOVSD 0x4f848(%RIP),%XMM3 |
0x43b2c8 MOVSD 0x504c8(%RIP),%XMM4 |
0x43b2d0 MOVAPD 0x504a8(%RIP),%XMM5 |
0x43b2d8 MOV %R14,%RBX |
0x43b2db JMP 43b325 |
0x43b2dd NOPL (%RAX) |
(317) 0x43b2e0 MOVAPD %XMM3,%XMM9 |
(317) 0x43b2e5 SUBSD %XMM7,%XMM9 |
(317) 0x43b2ea MULSD %XMM11,%XMM9 |
(317) 0x43b2ef ADDSD %XMM8,%XMM9 |
(317) 0x43b2f4 MULSD %XMM6,%XMM9 |
(317) 0x43b2f9 IMUL -0x88(%RBP),%RSI |
(317) 0x43b301 ADD %RAX,%RSI |
(317) 0x43b304 MOV -0x80(%RBP),%RAX |
(317) 0x43b308 MOVSD %XMM9,(%RAX,%RSI,8) |
(317) 0x43b30e INC %RCX |
(317) 0x43b311 CMP %RCX,-0xa0(%RBP) |
(317) 0x43b318 MOV %RBX,%R14 |
(317) 0x43b31b MOV -0x38(%RBP),%R9 |
(317) 0x43b31f JE 43b286 |
(317) 0x43b325 MOV %RCX,%RDI |
(317) 0x43b328 SHR $0x20,%RDI |
(317) 0x43b32c JE 43b350 |
(317) 0x43b32e MOV %RCX,%RAX |
(317) 0x43b331 XOR %EDX,%EDX |
(317) 0x43b333 DIV %R9 |
(317) 0x43b336 MOV %RAX,%RSI |
(317) 0x43b339 TEST %RDI,%RDI |
(317) 0x43b33c JE 43b35e |
(317) 0x43b33e MOV %RCX,%RAX |
(317) 0x43b341 CQTO |
(317) 0x43b343 IDIV %R9 |
(317) 0x43b346 JMP 43b365 |
0x43b348 NOPL (%RAX,%RAX,1) |
(317) 0x43b350 MOV %ECX,%EAX |
(317) 0x43b352 XOR %EDX,%EDX |
(317) 0x43b354 DIV %R9D |
(317) 0x43b357 MOV %EAX,%ESI |
(317) 0x43b359 TEST %RDI,%RDI |
(317) 0x43b35c JNE 43b33e |
(317) 0x43b35e MOV %ECX,%EAX |
(317) 0x43b360 XOR %EDX,%EDX |
(317) 0x43b362 DIV %R9D |
(317) 0x43b365 ADD -0x40(%RBP),%RSI |
(317) 0x43b369 LEA (%RDX,%R14,1),%EDI |
(317) 0x43b36d MOVSXD %EDI,%RAX |
(317) 0x43b370 MOVSXD %ESI,%RSI |
(317) 0x43b373 MOV %R12,%R9 |
(317) 0x43b376 IMUL %RSI,%R9 |
(317) 0x43b37a ADD %RAX,%R9 |
(317) 0x43b37d MOVSD (%R13,%R9,8),%XMM6 |
(317) 0x43b384 UCOMISD %XMM6,%XMM0 |
(317) 0x43b388 LEA 0x1(%RDX,%R14,1),%EDX |
(317) 0x43b38d MOVSXD %EDX,%R9 |
(317) 0x43b390 JBE 43b3a0 |
(317) 0x43b392 ADD $0x2,%EDI |
(317) 0x43b395 MOV %RAX,%R10 |
(317) 0x43b398 JMP 43b3aa |
0x43b39a NOPW (%RAX,%RAX,1) |
(317) 0x43b3a0 DEC %EDI |
(317) 0x43b3a2 MOV %R9,%R10 |
(317) 0x43b3a5 MOV %RAX,%R9 |
(317) 0x43b3a8 MOV %EDI,%EDX |
(317) 0x43b3aa MOVAPD %XMM6,%XMM7 |
(317) 0x43b3ae ANDPD %XMM1,%XMM7 |
(317) 0x43b3b2 MOV %R8,%R11 |
(317) 0x43b3b5 IMUL %RSI,%R11 |
(317) 0x43b3b9 ADD %R9,%R11 |
(317) 0x43b3bc MOV -0x98(%RBP),%R14 |
(317) 0x43b3c3 DIVSD (%R14,%R11,8),%XMM7 |
(317) 0x43b3c9 MOV -0x90(%RBP),%R11 |
(317) 0x43b3d0 IMUL %RSI,%R11 |
(317) 0x43b3d4 ADD %R11,%R9 |
(317) 0x43b3d7 MOVSXD %EDI,%RDI |
(317) 0x43b3da ADD %R11,%RDI |
(317) 0x43b3dd ADD %R10,%R11 |
(317) 0x43b3e0 MOVSD (%R15,%R9,8),%XMM8 |
(317) 0x43b3e6 MOVAPD %XMM8,%XMM9 |
(317) 0x43b3eb MOVHPD (%R15,%R11,8),%XMM9 |
(317) 0x43b3f1 MOVSD (%R15,%RDI,8),%XMM10 |
(317) 0x43b3f7 UNPCKLPD %XMM8,%XMM10 |
(317) 0x43b3fc SUBPD %XMM10,%XMM9 |
(317) 0x43b401 MOVAPD %XMM9,%XMM10 |
(317) 0x43b406 UNPCKHPD %XMM9,%XMM10 |
(317) 0x43b40b MOVAPD %XMM10,%XMM12 |
(317) 0x43b410 MULSD %XMM9,%XMM12 |
(317) 0x43b415 PXOR %XMM11,%XMM11 |
(317) 0x43b41a UCOMISD %XMM11,%XMM12 |
(317) 0x43b41f JBE 43b2e0 |
(317) 0x43b425 MOV -0x48(%RBP),%RDI |
(317) 0x43b429 MOV 0x8(%RDI),%RDI |
(317) 0x43b42d ANDPD %XMM1,%XMM9 |
(317) 0x43b432 MOVAPD %XMM2,%XMM11 |
(317) 0x43b437 SUBSD %XMM7,%XMM11 |
(317) 0x43b43c MOVAPD %XMM7,%XMM12 |
(317) 0x43b441 ADDSD %XMM3,%XMM12 |
(317) 0x43b446 UNPCKLPD %XMM11,%XMM12 |
(317) 0x43b44b MOVSXD %EDX,%RDX |
(317) 0x43b44e MOVSD (%RDI,%RAX,8),%XMM11 |
(317) 0x43b454 MULPD %XMM9,%XMM12 |
(317) 0x43b459 MOVSD (%RDI,%RDX,8),%XMM13 |
(317) 0x43b45f UNPCKLPD %XMM11,%XMM13 |
(317) 0x43b464 DIVPD %XMM13,%XMM12 |
(317) 0x43b469 MOVAPD %XMM12,%XMM13 |
(317) 0x43b46e UNPCKHPD %XMM12,%XMM13 |
(317) 0x43b473 ADDSD %XMM12,%XMM13 |
(317) 0x43b478 MULSD %XMM4,%XMM11 |
(317) 0x43b47d MULSD %XMM13,%XMM11 |
(317) 0x43b482 PSHUFD $-0x12,%XMM9,%XMM12 |
(317) 0x43b488 MINSD %XMM9,%XMM12 |
(317) 0x43b48d MINSD %XMM11,%XMM12 |
(317) 0x43b492 XORPD %XMM11,%XMM11 |
(317) 0x43b497 CMPSD $0x1,%XMM10,%XMM11 |
(317) 0x43b49d MOVAPD %XMM11,%XMM9 |
(317) 0x43b4a2 ANDPD %XMM12,%XMM9 |
(317) 0x43b4a7 XORPD %XMM5,%XMM12 |
(317) 0x43b4ac ANDNPD %XMM12,%XMM11 |
(317) 0x43b4b1 ORPD %XMM9,%XMM11 |
(317) 0x43b4b6 JMP 43b2e0 |
0x43b4bb NOPL (%RAX,%RAX,1) |
Path / |
Source file and lines | advec_mom.cpp:108-139 |
Module | exec |
nb instructions | 148 |
nb uops | 153 |
loop length | 681 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 7 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 33 |
micro-operation queue | 25.50 cycles |
front end | 25.50 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 7.00 | 7.00 | 7.00 | 7.00 | 5.00 | 18.67 | 18.67 | 18.67 | 6.00 | 5.92 | 6.08 | 6.00 | 6.50 | 6.50 |
cycles | 7.00 | 7.00 | 7.00 | 7.00 | 5.00 | 18.67 | 18.67 | 18.67 | 6.00 | 5.92 | 6.08 | 6.00 | 6.50 | 6.50 |
Cycles executing div or sqrt instructions | NA |
Front-end | 25.50 |
Dispatch | 18.67 |
Overall L1 | 25.50 |
all | 36% |
load | 9% |
store | 46% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 11% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 45% |
all | 40% |
load | 40% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 36% |
load | 18% |
store | 46% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 11% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 45% |
all | 16% |
load | 12% |
store | 17% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 13% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 17% |
all | 17% |
load | 17% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 16% |
load | 14% |
store | 17% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 13% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 17% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB $0x158,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RCX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x38(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x28(%RBP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x20(%RBP),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x18(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVL $0,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
TEST %RAX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JS 43b26a <_Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buffer1DIdEES5_iii.extracted.27+0x6ca> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %R8,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R9,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVQ $0,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RAX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVQ $0x1,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0xa8(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x30(%RBP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x58(%RBP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x50(%RBP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x4aaa20,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %ESI,-0x2c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CALL 404240 <__kmpc_for_static_init_8@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0x58(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %RAX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JA 43b286 <_Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buffer1DIdEES5_iii.extracted.27+0x6e6> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %RBX,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SUB %R14D,%R9D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%R13),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%R13),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R12),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%R12),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R15),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%R15),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x70(%RBP),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R10),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%R10),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
INC %RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDX,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB %RCX,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $-0x2,%EBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
AND %RDX,%RBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R9,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RSI,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R11,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDI,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R10,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
JE 43b2a4 <_Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buffer1DIdEES5_iii.extracted.27+0x704> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %RDX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVD %R9D,%XMM0 | 1 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
PSHUFD $0x44,%XMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVQ -0x40(%RBP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x170(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVD %R14D,%XMM0 | 1 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
PSHUFD $0x50,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x160(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %RAX,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVQ %R13,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x140(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %R8,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x130(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %RSI,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x120(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %R11,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x110(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %R15,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x100(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %RDI,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %R10,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %RCX,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
PADDQ 0x50812(%RIP),%XMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.50 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOVDQA %XMM1,-0x180(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
PSHUFD $-0x12,%XMM1,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVDQA %XMM2,-0x150(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
PSRLQ $0x20,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVDQA %XMM2,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 43ae97 <_Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buffer1DIdEES5_iii.extracted.27+0x2f7> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
ADD $0x158,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %RBX,-0x78(%RBP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV -0x38(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
JNE 43b2a9 <_Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buffer1DIdEES5_iii.extracted.27+0x709> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV $0x4aaa40,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0x2c(%RBP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD $0x158,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
JMP 404050 <__kmpc_for_static_fini@plt> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 43b2ac <_Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buffer1DIdEES5_iii.extracted.27+0x70c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
ADD %RBX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PXOR %XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOVAPD 0x4f8b8(%RIP),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOVSD 0x504d0(%RIP),%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSD 0x4f848(%RIP),%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSD 0x504c8(%RIP),%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVAPD 0x504a8(%RIP),%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOV %R14,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 43b325 <_Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buffer1DIdEES5_iii.extracted.27+0x785> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
Source file and lines | advec_mom.cpp:108-139 |
Module | exec |
nb instructions | 148 |
nb uops | 153 |
loop length | 681 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 7 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 33 |
micro-operation queue | 25.50 cycles |
front end | 25.50 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 7.00 | 7.00 | 7.00 | 7.00 | 5.00 | 18.67 | 18.67 | 18.67 | 6.00 | 5.92 | 6.08 | 6.00 | 6.50 | 6.50 |
cycles | 7.00 | 7.00 | 7.00 | 7.00 | 5.00 | 18.67 | 18.67 | 18.67 | 6.00 | 5.92 | 6.08 | 6.00 | 6.50 | 6.50 |
Cycles executing div or sqrt instructions | NA |
Front-end | 25.50 |
Dispatch | 18.67 |
Overall L1 | 25.50 |
all | 36% |
load | 9% |
store | 46% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 11% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 45% |
all | 40% |
load | 40% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 36% |
load | 18% |
store | 46% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 11% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 45% |
all | 16% |
load | 12% |
store | 17% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 13% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 17% |
all | 17% |
load | 17% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 16% |
load | 14% |
store | 17% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 13% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 17% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB $0x158,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RCX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x38(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x28(%RBP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x20(%RBP),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x18(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVL $0,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
TEST %RAX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JS 43b26a <_Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buffer1DIdEES5_iii.extracted.27+0x6ca> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %R8,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R9,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVQ $0,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RAX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVQ $0x1,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0xa8(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x30(%RBP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x58(%RBP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x50(%RBP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x4aaa20,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %ESI,-0x2c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CALL 404240 <__kmpc_for_static_init_8@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0x58(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %RAX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JA 43b286 <_Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buffer1DIdEES5_iii.extracted.27+0x6e6> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %RBX,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SUB %R14D,%R9D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%R13),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%R13),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R12),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%R12),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R15),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%R15),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x70(%RBP),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R10),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%R10),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
INC %RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDX,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB %RCX,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $-0x2,%EBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
AND %RDX,%RBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R9,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RSI,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R11,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDI,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R10,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
JE 43b2a4 <_Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buffer1DIdEES5_iii.extracted.27+0x704> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %RDX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVD %R9D,%XMM0 | 1 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
PSHUFD $0x44,%XMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVQ -0x40(%RBP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x170(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVD %R14D,%XMM0 | 1 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
PSHUFD $0x50,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x160(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %RAX,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVQ %R13,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x140(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %R8,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x130(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %RSI,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x120(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %R11,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x110(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %R15,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x100(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %RDI,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %R10,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %RCX,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
PADDQ 0x50812(%RIP),%XMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.50 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOVDQA %XMM1,-0x180(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
PSHUFD $-0x12,%XMM1,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVDQA %XMM2,-0x150(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
PSRLQ $0x20,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVDQA %XMM2,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 43ae97 <_Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buffer1DIdEES5_iii.extracted.27+0x2f7> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
ADD $0x158,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %RBX,-0x78(%RBP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV -0x38(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
JNE 43b2a9 <_Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buffer1DIdEES5_iii.extracted.27+0x709> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV $0x4aaa40,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0x2c(%RBP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD $0x158,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
JMP 404050 <__kmpc_for_static_fini@plt> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 43b2ac <_Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buffer1DIdEES5_iii.extracted.27+0x70c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
ADD %RBX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PXOR %XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOVAPD 0x4f8b8(%RIP),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOVSD 0x504d0(%RIP),%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSD 0x4f848(%RIP),%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSD 0x504c8(%RIP),%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVAPD 0x504a8(%RIP),%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOV %R14,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 43b325 <_Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buffer1DIdEES5_iii.extracted.27+0x785> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼_Z16advec_mom_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_RNS_8Buffer1DIdEES5_iii.extracted.27– | 4.83 | 2.65 |
○Loop 318 - advec_mom.cpp:108-139 - exec | 4.83 | 2.65 |
○Loop 317 - advec_mom.cpp:108-139 - exec | 0 | 0 |