Function: _Z17advec_cell_kerneliiiiiiRN6clover8Buffer1DIdEES2_RNS_8Buffer2DIdEES5_S5_S5_S5_S5_S5_S5_ ... | Module: exec | Source: advec_cell.cpp:65-110 [...] | Coverage: 3.37% |
---|
Function: _Z17advec_cell_kerneliiiiiiRN6clover8Buffer1DIdEES2_RNS_8Buffer2DIdEES5_S5_S5_S5_S5_S5_S5_ ... | Module: exec | Source: advec_cell.cpp:65-110 [...] | Coverage: 3.37% |
---|
/beegfs/hackathon/users/eoseret/qaas_runs/170-854-8685/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/advec_cell.cpp: 65 - 110 |
-------------------------------------------------------------------------------- |
65: #pragma omp parallel for simd collapse(2) |
66: for (int j = (y_min + 1); j < (y_max + 2); j++) { |
67: for (int i = (x_min + 1); i < (x_max + 2 + 2); i++) |
68: ({ |
69: int upwind, donor, downwind, dif; |
70: double sigmat, sigma3, sigma4, sigmav, sigmam, diffuw, diffdw, limiter, wind; |
71: if (vol_flux_x(i, j) > 0.0) { |
72: upwind = i - 2; |
73: donor = i - 1; |
74: downwind = i; |
75: dif = donor; |
76: } else { |
77: upwind = std::min(i + 1, x_max + 2); |
78: donor = i; |
79: downwind = i - 1; |
80: dif = upwind; |
81: } |
82: sigmat = std::fabs(vol_flux_x(i, j)) / pre_vol(donor, j); |
83: sigma3 = (1.0 + sigmat) * (vertexdx[i] / vertexdx[dif]); |
84: sigma4 = 2.0 - sigmat; |
85: sigmav = sigmat; |
86: diffuw = density1(donor, j) - density1(upwind, j); |
87: diffdw = density1(downwind, j) - density1(donor, j); |
88: wind = 1.0; |
89: if (diffdw <= 0.0) wind = -1.0; |
90: if (diffuw * diffdw > 0.0) { |
91: limiter = (1.0 - sigmav) * wind * |
92: std::fmin(std::fmin(std::fabs(diffuw), std::fabs(diffdw)), |
93: one_by_six * (sigma3 * std::fabs(diffuw) + sigma4 * std::fabs(diffdw))); |
94: } else { |
95: limiter = 0.0; |
96: } |
97: mass_flux_x(i, j) = vol_flux_x(i, j) * (density1(donor, j) + limiter); |
98: sigmam = std::fabs(mass_flux_x(i, j)) / (density1(donor, j) * pre_vol(donor, j)); |
99: diffuw = energy1(donor, j) - energy1(upwind, j); |
100: diffdw = energy1(downwind, j) - energy1(donor, j); |
101: wind = 1.0; |
102: if (diffdw <= 0.0) wind = -1.0; |
103: if (diffuw * diffdw > 0.0) { |
104: limiter = (1.0 - sigmam) * wind * |
105: std::fmin(std::fmin(std::fabs(diffuw), std::fabs(diffdw)), |
106: one_by_six * (sigma3 * std::fabs(diffuw) + sigma4 * std::fabs(diffdw))); |
107: } else { |
108: limiter = 0.0; |
109: } |
110: ener_flux(i, j) = mass_flux_x(i, j) * (energy1(donor, j) + limiter); |
/beegfs/hackathon/users/eoseret/qaas_runs/170-854-8685/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/context.h: 46 - 69 |
-------------------------------------------------------------------------------- |
46: T &operator[](size_t i) const { return data[i]; } |
[...] |
69: T &operator()(size_t i, size_t j) const { return data[i + j * sizeX]; } |
0x436a30 PUSH %RBP |
0x436a31 MOV %RSP,%RBP |
0x436a34 PUSH %R15 |
0x436a36 PUSH %R14 |
0x436a38 PUSH %R13 |
0x436a3a PUSH %R12 |
0x436a3c PUSH %RBX |
0x436a3d SUB $0x208,%RSP |
0x436a44 MOV %R8,%R12 |
0x436a47 MOV 0x50(%RBP),%RAX |
0x436a4b MOV 0x40(%RBP),%R10 |
0x436a4f MOV 0x38(%RBP),%RSI |
0x436a53 MOV 0x30(%RBP),%R8 |
0x436a57 MOV %R8,-0x90(%RBP) |
0x436a5e MOV 0x28(%RBP),%R13 |
0x436a62 MOV 0x20(%RBP),%R14 |
0x436a66 MOV 0x18(%RBP),%R15 |
0x436a6a MOV 0x10(%RBP),%RBX |
0x436a6e MOVL $0,-0x58(%RBP) |
0x436a75 TEST %RAX,%RAX |
0x436a78 JS 4373fe |
0x436a7e MOV %RCX,-0xb0(%RBP) |
0x436a85 MOV %R9,-0xc0(%RBP) |
0x436a8c MOV %RSI,-0x48(%RBP) |
0x436a90 MOV %R10,-0x30(%RBP) |
0x436a94 MOV %RDX,-0x38(%RBP) |
0x436a98 MOV (%RDI),%ESI |
0x436a9a MOVQ $0,-0xa0(%RBP) |
0x436aa5 MOV %RAX,-0x98(%RBP) |
0x436aac MOVQ $0x1,-0xf0(%RBP) |
0x436ab7 SUB $0x8,%RSP |
0x436abb LEA -0xf0(%RBP),%RAX |
0x436ac2 LEA -0x58(%RBP),%RCX |
0x436ac6 LEA -0xa0(%RBP),%R8 |
0x436acd LEA -0x98(%RBP),%R9 |
0x436ad4 MOV $0x4aa720,%EDI |
0x436ad9 MOV %ESI,-0x54(%RBP) |
0x436adc MOV $0x22,%EDX |
0x436ae1 PUSH $0x1 |
0x436ae3 PUSH $0x1 |
0x436ae5 PUSH %RAX |
0x436ae6 CALL 404240 <__kmpc_for_static_init_8@plt> |
0x436aeb ADD $0x20,%RSP |
0x436aef MOV -0xa0(%RBP),%RCX |
0x436af6 MOV -0x98(%RBP),%RAX |
0x436afd CMP %RAX,%RCX |
0x436b00 JA 437419 |
0x436b06 MOV %RAX,%RDI |
0x436b09 MOV -0x30(%RBP),%RDX |
0x436b0d MOV -0x48(%RBP),%RSI |
0x436b11 SUB %ESI,%EDX |
0x436b13 MOV (%R15),%RAX |
0x436b16 MOV %RAX,-0x68(%RBP) |
0x436b1a MOV 0x10(%R15),%R9 |
0x436b1e MOV (%R14),%RAX |
0x436b21 MOV %RAX,-0x40(%RBP) |
0x436b25 MOV 0x10(%R14),%R8 |
0x436b29 MOV -0xb0(%RBP),%RAX |
0x436b30 MOV 0x8(%RAX),%R10 |
0x436b34 MOV (%R12),%R14 |
0x436b38 MOV 0x10(%R12),%R12 |
0x436b3d MOV (%RBX),%RAX |
0x436b40 MOV %RAX,-0x88(%RBP) |
0x436b47 MOV 0x10(%RBX),%R11 |
0x436b4b MOV -0xc0(%RBP),%RAX |
0x436b52 MOV (%RAX),%RBX |
0x436b55 MOV 0x10(%RAX),%R15 |
0x436b59 MOV (%R13),%RAX |
0x436b5d MOV %RAX,-0x60(%RBP) |
0x436b61 MOV 0x10(%R13),%RAX |
0x436b65 MOV %RAX,-0x80(%RBP) |
0x436b69 MOV -0x38(%RBP),%RAX |
0x436b6d ADD $0x2,%EAX |
0x436b70 INC %RDI |
0x436b73 MOV %RDI,-0xe8(%RBP) |
0x436b7a SUB %RCX,%RDI |
0x436b7d MOV $-0x2,%R13D |
0x436b83 MOV %RDI,-0xc8(%RBP) |
0x436b8a AND %RDI,%R13 |
0x436b8d MOV %RBX,%RDI |
0x436b90 MOV %R11,%RBX |
0x436b93 MOV %R14,%R11 |
0x436b96 MOV %R8,%R14 |
0x436b99 MOV -0x40(%RBP),%R8 |
0x436b9d MOV %RAX,-0x38(%RBP) |
0x436ba1 MOV %RDX,-0x30(%RBP) |
0x436ba5 MOV %R9,-0x78(%RBP) |
0x436ba9 MOV %R14,-0x50(%RBP) |
0x436bad MOV %R11,-0x70(%RBP) |
0x436bb1 MOV %RBX,-0xe0(%RBP) |
0x436bb8 MOV %RDI,-0xd8(%RBP) |
0x436bbf MOV %R10,-0xd0(%RBP) |
0x436bc6 JE 437437 |
0x436bcc MOVD %EDX,%XMM0 |
0x436bd0 PSHUFD $0x44,%XMM0,%XMM0 |
0x436bd5 MOVDQA %XMM0,-0x210(%RBP) |
0x436bdd MOVQ -0x90(%RBP),%XMM0 |
0x436be5 PSHUFD $0x44,%XMM0,%XMM0 |
0x436bea MOVDQA %XMM0,-0x200(%RBP) |
0x436bf2 MOVD %ESI,%XMM0 |
0x436bf6 PSHUFD $0x50,%XMM0,%XMM0 |
0x436bfb MOVDQA %XMM0,-0x1f0(%RBP) |
0x436c03 MOV -0x68(%RBP),%RDX |
0x436c07 MOVQ %RDX,%XMM0 |
0x436c0c PSHUFD $0x44,%XMM0,%XMM0 |
0x436c11 MOVDQA %XMM0,-0x1e0(%RBP) |
0x436c19 MOVQ %R9,%XMM0 |
0x436c1e PSHUFD $0x44,%XMM0,%XMM0 |
0x436c23 MOVDQA %XMM0,-0x1d0(%RBP) |
0x436c2b MOVD %EAX,%XMM0 |
0x436c2f PSHUFD $0x50,%XMM0,%XMM0 |
0x436c34 MOVDQA %XMM0,-0x1c0(%RBP) |
0x436c3c MOVQ %R8,%XMM0 |
0x436c41 PSHUFD $0x44,%XMM0,%XMM0 |
0x436c46 MOVDQA %XMM0,-0x1b0(%RBP) |
0x436c4e MOVQ %R14,%XMM0 |
0x436c53 PSHUFD $0x44,%XMM0,%XMM0 |
0x436c58 MOVDQA %XMM0,-0x1a0(%RBP) |
0x436c60 MOVQ %R10,%XMM0 |
0x436c65 PSHUFD $0x44,%XMM0,%XMM0 |
0x436c6a MOVDQA %XMM0,-0x190(%RBP) |
0x436c72 MOVQ %R11,%XMM0 |
0x436c77 PSHUFD $0x44,%XMM0,%XMM0 |
0x436c7c MOVDQA %XMM0,-0x180(%RBP) |
0x436c84 MOVQ %R12,%XMM0 |
0x436c89 PSHUFD $0x44,%XMM0,%XMM0 |
0x436c8e MOVDQA %XMM0,-0x170(%RBP) |
0x436c96 MOVQ -0x88(%RBP),%XMM0 |
0x436c9e PSHUFD $0x44,%XMM0,%XMM0 |
0x436ca3 MOVDQA %XMM0,-0x160(%RBP) |
0x436cab MOVQ %RBX,%XMM0 |
0x436cb0 PSHUFD $0x44,%XMM0,%XMM0 |
0x436cb5 MOVDQA %XMM0,-0x150(%RBP) |
0x436cbd MOVQ %RDI,%XMM0 |
0x436cc2 PSHUFD $0x44,%XMM0,%XMM0 |
0x436cc7 MOVDQA %XMM0,-0x140(%RBP) |
0x436ccf MOVQ %R15,%XMM0 |
0x436cd4 PSHUFD $0x44,%XMM0,%XMM0 |
0x436cd9 MOVDQA %XMM0,-0x130(%RBP) |
0x436ce1 MOV -0x60(%RBP),%R10 |
0x436ce5 MOVQ %R10,%XMM0 |
0x436cea PSHUFD $0x44,%XMM0,%XMM0 |
0x436cef MOVDQA %XMM0,-0x120(%RBP) |
0x436cf7 MOV -0x80(%RBP),%RAX |
0x436cfb MOVQ %RAX,%XMM0 |
0x436d00 PSHUFD $0x44,%XMM0,%XMM0 |
0x436d05 MOVDQA %XMM0,-0x110(%RBP) |
0x436d0d MOVQ %RCX,%XMM0 |
0x436d12 PSHUFD $0x44,%XMM0,%XMM10 |
0x436d18 PADDQ 0x5486f(%RIP),%XMM10 |
0x436d21 XOR %R9D,%R9D |
0x436d24 MOVAPD 0x53e43(%RIP),%XMM14 |
0x436d2d MOVAPD 0x54a1a(%RIP),%XMM15 |
0x436d36 MOV %RDX,%R14 |
0x436d39 JMP 436e24 |
0x436d3e XCHG %AX,%AX |
(302) 0x436d40 MULPD %XMM9,%XMM13 |
(302) 0x436d45 DIVPD %XMM13,%XMM11 |
(302) 0x436d4a XORPD %XMM2,%XMM2 |
(302) 0x436d4e CMPPD $0x1,%XMM5,%XMM2 |
(302) 0x436d53 MOVAPD %XMM15,%XMM9 |
(302) 0x436d58 SUBPD %XMM11,%XMM9 |
(302) 0x436d5d SUBPD %XMM15,%XMM11 |
(302) 0x436d62 ANDPD %XMM2,%XMM9 |
(302) 0x436d67 ANDNPD %XMM11,%XMM2 |
(302) 0x436d6c ORPD %XMM9,%XMM2 |
(302) 0x436d71 ANDPD %XMM14,%XMM4 |
(302) 0x436d76 MOVAPD %XMM4,%XMM9 |
(302) 0x436d7b MULPD %XMM6,%XMM4 |
(302) 0x436d7f ANDPD %XMM14,%XMM5 |
(302) 0x436d84 MINPD %XMM5,%XMM9 |
(302) 0x436d89 MULPD -0xc0(%RBP),%XMM5 |
(302) 0x436d91 ADDPD %XMM4,%XMM5 |
(302) 0x436d95 MULPD 0x549d3(%RIP),%XMM5 |
(302) 0x436d9d MINPD %XMM9,%XMM5 |
(302) 0x436da2 MULPD %XMM2,%XMM5 |
(302) 0x436da6 ANDPD %XMM5,%XMM0 |
(302) 0x436daa ADDPD %XMM3,%XMM0 |
(302) 0x436dae MULPD %XMM7,%XMM0 |
(302) 0x436db2 MOVDQA -0x120(%RBP),%XMM4 |
(302) 0x436dba MOVDQA %XMM4,%XMM2 |
(302) 0x436dbe PSRLQ $0x20,%XMM2 |
(302) 0x436dc3 PMULUDQ %XMM1,%XMM2 |
(302) 0x436dc7 MOVDQA %XMM4,%XMM3 |
(302) 0x436dcb PMULUDQ %XMM1,%XMM3 |
(302) 0x436dcf PSRLQ $0x20,%XMM1 |
(302) 0x436dd4 PMULUDQ %XMM4,%XMM1 |
(302) 0x436dd8 PADDQ %XMM2,%XMM1 |
(302) 0x436ddc PADDQ %XMM12,%XMM3 |
(302) 0x436de1 PSLLQ $0x20,%XMM1 |
(302) 0x436de6 PADDQ %XMM1,%XMM3 |
(302) 0x436dea PSLLQ $0x3,%XMM3 |
(302) 0x436def PADDQ -0x110(%RBP),%XMM3 |
(302) 0x436df7 MOVQ %XMM3,%RAX |
(302) 0x436dfc PSHUFD $-0x12,%XMM3,%XMM1 |
(302) 0x436e01 MOVQ %XMM1,%RDX |
(302) 0x436e06 MOVLPD %XMM0,(%RAX) |
(302) 0x436e0a MOVHPD %XMM0,(%RDX) |
(302) 0x436e0e PADDQ 0x54799(%RIP),%XMM10 |
(302) 0x436e17 ADD $0x2,%R9 |
(302) 0x436e1b CMP %R13,%R9 |
(302) 0x436e1e JAE 437410 |
(302) 0x436e24 MOVQ %XMM10,%RSI |
(302) 0x436e29 MOVDQA -0x210(%RBP),%XMM2 |
(302) 0x436e31 MOVQ %XMM2,%R8 |
(302) 0x436e36 MOV %RSI,%RAX |
(302) 0x436e39 XOR %EDX,%EDX |
(302) 0x436e3b DIV %R8 |
(302) 0x436e3e MOVQ %RAX,%XMM0 |
(302) 0x436e43 MOVDQA %XMM10,-0x100(%RBP) |
(302) 0x436e4c PSHUFD $-0x12,%XMM10,%XMM1 |
(302) 0x436e52 MOVQ %XMM1,%RDI |
(302) 0x436e57 PSHUFD $-0x12,%XMM2,%XMM1 |
(302) 0x436e5c MOVQ %XMM1,%RBX |
(302) 0x436e61 MOV %RDI,%RAX |
(302) 0x436e64 XOR %EDX,%EDX |
(302) 0x436e66 DIV %RBX |
(302) 0x436e69 MOVQ %RAX,%XMM1 |
(302) 0x436e6e PUNPCKLQDQ %XMM1,%XMM0 |
(302) 0x436e72 PADDQ -0x200(%RBP),%XMM0 |
(302) 0x436e7a MOV %RSI,%RAX |
(302) 0x436e7d CQTO |
(302) 0x436e7f IDIV %R8 |
(302) 0x436e82 MOVQ %RDX,%XMM1 |
(302) 0x436e87 MOV %RDI,%RAX |
(302) 0x436e8a CQTO |
(302) 0x436e8c IDIV %RBX |
(302) 0x436e8f MOVQ %RDX,%XMM3 |
(302) 0x436e94 PUNPCKLQDQ %XMM3,%XMM1 |
(302) 0x436e98 PSHUFD $-0x18,%XMM1,%XMM4 |
(302) 0x436e9d PADDD -0x1f0(%RBP),%XMM4 |
(302) 0x436ea5 PXOR %XMM1,%XMM1 |
(302) 0x436ea9 PCMPGTD %XMM4,%XMM1 |
(302) 0x436ead MOVDQA %XMM4,%XMM2 |
(302) 0x436eb1 PUNPCKLDQ %XMM1,%XMM2 |
(302) 0x436eb5 MOVDQA %XMM2,%XMM6 |
(302) 0x436eb9 PSHUFD $-0x18,%XMM0,%XMM1 |
(302) 0x436ebe PSLLQ $0x20,%XMM0 |
(302) 0x436ec3 PSRAD $0x1f,%XMM0 |
(302) 0x436ec8 PSHUFD $-0x13,%XMM0,%XMM3 |
(302) 0x436ecd PUNPCKLDQ %XMM3,%XMM1 |
(302) 0x436ed1 MOVDQA -0x1e0(%RBP),%XMM8 |
(302) 0x436eda MOVDQA %XMM8,%XMM3 |
(302) 0x436edf PMULUDQ %XMM1,%XMM3 |
(302) 0x436ee3 MOVDQA %XMM8,%XMM5 |
(302) 0x436ee8 PSRLQ $0x20,%XMM5 |
(302) 0x436eed PMULUDQ %XMM1,%XMM5 |
(302) 0x436ef1 PSRLQ $0x20,%XMM0 |
(302) 0x436ef6 PMULUDQ %XMM0,%XMM8 |
(302) 0x436efb PADDQ %XMM5,%XMM8 |
(302) 0x436f00 PSLLQ $0x20,%XMM8 |
(302) 0x436f06 PADDQ %XMM2,%XMM3 |
(302) 0x436f0a PADDQ %XMM8,%XMM3 |
(302) 0x436f0f PSLLQ $0x3,%XMM3 |
(302) 0x436f14 PADDQ -0x1d0(%RBP),%XMM3 |
(302) 0x436f1c MOVQ %XMM3,%RAX |
(302) 0x436f21 PSHUFD $-0x12,%XMM3,%XMM3 |
(302) 0x436f26 MOVQ %XMM3,%RDX |
(302) 0x436f2b MOVSD (%RAX),%XMM2 |
(302) 0x436f2f MOVHPD (%RDX),%XMM2 |
(302) 0x436f33 PXOR %XMM3,%XMM3 |
(302) 0x436f37 CMPPD $0x1,%XMM2,%XMM3 |
(302) 0x436f3c MOVAPD %XMM2,%XMM7 |
(302) 0x436f40 MOVAPD %XMM2,-0xb0(%RBP) |
(302) 0x436f48 MOVDQA %XMM4,%XMM8 |
(302) 0x436f4d PCMPEQD %XMM2,%XMM2 |
(302) 0x436f51 PADDD %XMM2,%XMM8 |
(302) 0x436f56 MOVDQA %XMM4,%XMM5 |
(302) 0x436f5a PSUBD %XMM2,%XMM5 |
(302) 0x436f5e MOVDQA %XMM5,%XMM9 |
(302) 0x436f63 MOVDQA -0x1c0(%RBP),%XMM10 |
(302) 0x436f6c PCMPGTD %XMM10,%XMM9 |
(302) 0x436f71 PAND %XMM9,%XMM10 |
(302) 0x436f76 PANDN %XMM5,%XMM9 |
(302) 0x436f7b POR %XMM10,%XMM9 |
(302) 0x436f80 PXOR %XMM5,%XMM5 |
(302) 0x436f84 PCMPGTD %XMM8,%XMM5 |
(302) 0x436f89 PUNPCKLDQ %XMM5,%XMM8 |
(302) 0x436f8e PXOR %XMM5,%XMM5 |
(302) 0x436f92 PCMPGTD %XMM9,%XMM5 |
(302) 0x436f97 PUNPCKLDQ %XMM5,%XMM9 |
(302) 0x436f9c PADDD 0x5479c(%RIP),%XMM4 |
(302) 0x436fa4 PXOR %XMM5,%XMM5 |
(302) 0x436fa8 PCMPGTD %XMM4,%XMM5 |
(302) 0x436fac PUNPCKLDQ %XMM5,%XMM4 |
(302) 0x436fb0 MOVAPD %XMM3,%XMM10 |
(302) 0x436fb5 ANDNPD %XMM9,%XMM10 |
(302) 0x436fba PAND %XMM3,%XMM4 |
(302) 0x436fbe POR %XMM10,%XMM4 |
(302) 0x436fc3 MOVDQA %XMM3,%XMM9 |
(302) 0x436fc8 PANDN %XMM8,%XMM9 |
(302) 0x436fcd PAND %XMM3,%XMM8 |
(302) 0x436fd2 POR %XMM8,%XMM10 |
(302) 0x436fd7 MOVDQA %XMM6,%XMM2 |
(302) 0x436fdb PAND %XMM3,%XMM2 |
(302) 0x436fdf POR %XMM9,%XMM2 |
(302) 0x436fe4 MOVDQA %XMM2,%XMM5 |
(302) 0x436fe8 MOVDQA %XMM2,-0x230(%RBP) |
(302) 0x436ff0 PANDN %XMM6,%XMM3 |
(302) 0x436ff4 MOVDQA %XMM6,-0x220(%RBP) |
(302) 0x436ffc POR %XMM8,%XMM3 |
(302) 0x437001 MOVAPD %XMM7,%XMM9 |
(302) 0x437006 MOVDQA -0x1b0(%RBP),%XMM13 |
(302) 0x43700f MOVDQA %XMM13,%XMM8 |
(302) 0x437014 PMULUDQ %XMM1,%XMM8 |
(302) 0x437019 MOVDQA %XMM13,%XMM12 |
(302) 0x43701e PSRLQ $0x20,%XMM12 |
(302) 0x437024 PMULUDQ %XMM1,%XMM12 |
(302) 0x437029 PMULUDQ %XMM0,%XMM13 |
(302) 0x43702e PADDQ %XMM12,%XMM13 |
(302) 0x437033 PSLLQ $0x20,%XMM13 |
(302) 0x437039 PADDQ %XMM8,%XMM13 |
(302) 0x43703e PADDQ %XMM3,%XMM13 |
(302) 0x437043 PSLLQ $0x3,%XMM13 |
(302) 0x437049 PADDQ -0x1a0(%RBP),%XMM13 |
(302) 0x437052 MOVQ %XMM13,%RDX |
(302) 0x437057 PSHUFD $-0x12,%XMM13,%XMM8 |
(302) 0x43705d MOVQ %XMM8,%RAX |
(302) 0x437062 MOVSD (%RDX),%XMM8 |
(302) 0x437067 MOVHPD (%RAX),%XMM8 |
(302) 0x43706c ANDPD %XMM14,%XMM9 |
(302) 0x437071 DIVPD %XMM8,%XMM9 |
(302) 0x437076 MOVAPD %XMM9,%XMM12 |
(302) 0x43707b MOVDQA %XMM6,%XMM8 |
(302) 0x437080 PSLLQ $0x3,%XMM8 |
(302) 0x437086 MOVDQA -0x190(%RBP),%XMM2 |
(302) 0x43708e PADDQ %XMM2,%XMM8 |
(302) 0x437093 MOVQ %XMM8,%RSI |
(302) 0x437098 PSHUFD $-0x12,%XMM8,%XMM8 |
(302) 0x43709e MOVQ %XMM8,%RDI |
(302) 0x4370a3 MOVSD (%RSI),%XMM11 |
(302) 0x4370a8 MOVHPD (%RDI),%XMM11 |
(302) 0x4370ad ADDPD %XMM15,%XMM12 |
(302) 0x4370b2 MULPD %XMM12,%XMM11 |
(302) 0x4370b7 PSLLQ $0x3,%XMM10 |
(302) 0x4370bd PADDQ %XMM2,%XMM10 |
(302) 0x4370c2 MOVQ %XMM10,%RSI |
(302) 0x4370c7 PSHUFD $-0x12,%XMM10,%XMM10 |
(302) 0x4370cd MOVQ %XMM10,%RDI |
(302) 0x4370d2 MOVSD (%RSI),%XMM10 |
(302) 0x4370d7 MOVHPD (%RDI),%XMM10 |
(302) 0x4370dc DIVPD %XMM10,%XMM11 |
(302) 0x4370e1 MOVAPD 0x54676(%RIP),%XMM8 |
(302) 0x4370ea MOVDQA -0x180(%RBP),%XMM10 |
(302) 0x4370f3 MOVDQA %XMM10,%XMM13 |
(302) 0x4370f8 PMULUDQ %XMM1,%XMM13 |
(302) 0x4370fd MOVAPD %XMM14,%XMM12 |
(302) 0x437102 MOVDQA %XMM10,%XMM14 |
(302) 0x437107 PSRLQ $0x20,%XMM14 |
(302) 0x43710d PMULUDQ %XMM1,%XMM14 |
(302) 0x437112 PMULUDQ %XMM0,%XMM10 |
(302) 0x437117 PADDQ %XMM14,%XMM10 |
(302) 0x43711c PSLLQ $0x20,%XMM10 |
(302) 0x437122 PADDQ %XMM13,%XMM10 |
(302) 0x437127 MOVDQA %XMM10,%XMM13 |
(302) 0x43712c PADDQ %XMM3,%XMM13 |
(302) 0x437131 PSLLQ $0x3,%XMM13 |
(302) 0x437137 MOVDQA -0x170(%RBP),%XMM2 |
(302) 0x43713f PADDQ %XMM2,%XMM13 |
(302) 0x437144 MOVQ %XMM13,%RDI |
(302) 0x437149 PSHUFD $-0x12,%XMM13,%XMM13 |
(302) 0x43714f MOVQ %XMM13,%RSI |
(302) 0x437154 MOVSD (%RDI),%XMM13 |
(302) 0x437159 MOVHPD (%RSI),%XMM13 |
(302) 0x43715e SUBPD %XMM9,%XMM8 |
(302) 0x437163 MOVDQA %XMM10,%XMM14 |
(302) 0x437168 PADDQ %XMM4,%XMM14 |
(302) 0x43716d PSLLQ $0x3,%XMM14 |
(302) 0x437173 PADDQ %XMM2,%XMM14 |
(302) 0x437178 MOVQ %XMM14,%R8 |
(302) 0x43717d PSHUFD $-0x12,%XMM14,%XMM14 |
(302) 0x437183 MOVQ %XMM14,%RBX |
(302) 0x437188 MOVAPD %XMM15,%XMM6 |
(302) 0x43718d MOVSD (%R8),%XMM15 |
(302) 0x437192 MOVHPD (%RBX),%XMM15 |
(302) 0x437197 MOVAPD %XMM13,%XMM14 |
(302) 0x43719c SUBPD %XMM15,%XMM14 |
(302) 0x4371a1 PADDQ %XMM5,%XMM10 |
(302) 0x4371a6 PSLLQ $0x3,%XMM10 |
(302) 0x4371ac PADDQ %XMM2,%XMM10 |
(302) 0x4371b1 MOVQ %XMM10,%R8 |
(302) 0x4371b6 PSHUFD $-0x12,%XMM10,%XMM10 |
(302) 0x4371bc MOVQ %XMM10,%RBX |
(302) 0x4371c1 MOVSD (%R8),%XMM7 |
(302) 0x4371c6 MOVHPD (%RBX),%XMM7 |
(302) 0x4371ca SUBPD %XMM13,%XMM7 |
(302) 0x4371cf MOVAPD %XMM7,%XMM10 |
(302) 0x4371d4 MULPD %XMM14,%XMM10 |
(302) 0x4371d9 XORPD %XMM15,%XMM15 |
(302) 0x4371de CMPPD $0x1,%XMM10,%XMM15 |
(302) 0x4371e4 XORPD %XMM10,%XMM10 |
(302) 0x4371e9 CMPPD $0x1,%XMM7,%XMM10 |
(302) 0x4371ef MOVAPD %XMM6,%XMM2 |
(302) 0x4371f3 SUBPD %XMM9,%XMM2 |
(302) 0x4371f8 SUBPD %XMM6,%XMM9 |
(302) 0x4371fd MOVAPD 0x5456b(%RIP),%XMM5 |
(302) 0x437205 ANDPD %XMM10,%XMM2 |
(302) 0x43720a ANDNPD %XMM9,%XMM10 |
(302) 0x43720f ORPD %XMM2,%XMM10 |
(302) 0x437214 ANDPD %XMM12,%XMM14 |
(302) 0x437219 ANDPD %XMM12,%XMM7 |
(302) 0x43721e MOVDQA -0x220(%RBP),%XMM12 |
(302) 0x437227 MOVAPD %XMM14,%XMM2 |
(302) 0x43722c MINPD %XMM7,%XMM2 |
(302) 0x437230 MOVAPD %XMM11,%XMM6 |
(302) 0x437235 MULPD %XMM11,%XMM14 |
(302) 0x43723a MOVAPD %XMM8,-0xc0(%RBP) |
(302) 0x437243 MULPD %XMM8,%XMM7 |
(302) 0x437248 ADDPD %XMM14,%XMM7 |
(302) 0x43724d MULPD %XMM5,%XMM7 |
(302) 0x437251 MINPD %XMM2,%XMM7 |
(302) 0x437255 MULPD %XMM10,%XMM7 |
(302) 0x43725a ANDPD %XMM15,%XMM7 |
(302) 0x43725f ADDPD %XMM13,%XMM7 |
(302) 0x437264 MULPD -0xb0(%RBP),%XMM7 |
(302) 0x43726c MOVDQA -0x160(%RBP),%XMM10 |
(302) 0x437275 MOVDQA %XMM10,%XMM2 |
(302) 0x43727a PSRLQ $0x20,%XMM2 |
(302) 0x43727f PMULUDQ %XMM1,%XMM2 |
(302) 0x437283 MOVDQA %XMM10,%XMM9 |
(302) 0x437288 PMULUDQ %XMM0,%XMM9 |
(302) 0x43728d PADDQ %XMM2,%XMM9 |
(302) 0x437292 MOVDQA %XMM10,%XMM2 |
(302) 0x437297 PMULUDQ %XMM1,%XMM2 |
(302) 0x43729b PSLLQ $0x20,%XMM9 |
(302) 0x4372a1 PADDQ %XMM12,%XMM2 |
(302) 0x4372a6 PADDQ %XMM9,%XMM2 |
(302) 0x4372ab PSLLQ $0x3,%XMM2 |
(302) 0x4372b0 PADDQ -0x150(%RBP),%XMM2 |
(302) 0x4372b8 MOVQ %XMM2,%R8 |
(302) 0x4372bd MOVLPD %XMM7,(%R8) |
(302) 0x4372c2 PSHUFD $-0x12,%XMM2,%XMM2 |
(302) 0x4372c7 MOVQ %XMM2,%R8 |
(302) 0x4372cc MOVHPD %XMM7,(%R8) |
(302) 0x4372d1 MOVDQA -0x140(%RBP),%XMM9 |
(302) 0x4372da MOVDQA %XMM9,%XMM2 |
(302) 0x4372df PSRLQ $0x20,%XMM2 |
(302) 0x4372e4 PMULUDQ %XMM1,%XMM2 |
(302) 0x4372e8 PMULUDQ %XMM9,%XMM0 |
(302) 0x4372ed PADDQ %XMM2,%XMM0 |
(302) 0x4372f1 MOVDQA %XMM9,%XMM2 |
(302) 0x4372f6 PMULUDQ %XMM1,%XMM2 |
(302) 0x4372fa PSLLQ $0x20,%XMM0 |
(302) 0x4372ff PADDQ %XMM2,%XMM0 |
(302) 0x437303 PADDQ %XMM0,%XMM3 |
(302) 0x437307 PSLLQ $0x3,%XMM3 |
(302) 0x43730c MOVDQA -0x130(%RBP),%XMM9 |
(302) 0x437315 PADDQ %XMM9,%XMM3 |
(302) 0x43731a MOVQ %XMM3,%R8 |
(302) 0x43731f PSHUFD $-0x12,%XMM3,%XMM2 |
(302) 0x437324 MOVQ %XMM2,%RBX |
(302) 0x437329 MOVSD (%R8),%XMM3 |
(302) 0x43732e MOVHPD (%RBX),%XMM3 |
(302) 0x437332 PADDQ %XMM0,%XMM4 |
(302) 0x437336 PSLLQ $0x3,%XMM4 |
(302) 0x43733b PADDQ %XMM9,%XMM4 |
(302) 0x437340 MOVQ %XMM4,%R8 |
(302) 0x437345 PSHUFD $-0x12,%XMM4,%XMM2 |
(302) 0x43734a MOVQ %XMM2,%RBX |
(302) 0x43734f MOVSD (%R8),%XMM2 |
(302) 0x437354 MOVHPD (%RBX),%XMM2 |
(302) 0x437358 MOVAPD %XMM3,%XMM4 |
(302) 0x43735c PADDQ -0x230(%RBP),%XMM0 |
(302) 0x437364 PSLLQ $0x3,%XMM0 |
(302) 0x437369 PADDQ %XMM9,%XMM0 |
(302) 0x43736e MOVQ %XMM0,%R8 |
(302) 0x437373 PSHUFD $-0x12,%XMM0,%XMM0 |
(302) 0x437378 MOVQ %XMM0,%RBX |
(302) 0x43737d MOVSD (%R8),%XMM5 |
(302) 0x437382 MOVHPD (%RBX),%XMM5 |
(302) 0x437386 SUBPD %XMM2,%XMM4 |
(302) 0x43738a SUBPD %XMM3,%XMM5 |
(302) 0x43738e MOVAPD %XMM5,%XMM2 |
(302) 0x437392 MULPD %XMM4,%XMM2 |
(302) 0x437396 PXOR %XMM0,%XMM0 |
(302) 0x43739a CMPPD $0x1,%XMM2,%XMM0 |
(302) 0x43739f MOVMSKPD %XMM0,%R8D |
(302) 0x4373a4 TEST $0x1,%R8B |
(302) 0x4373a8 JE 4373af |
(302) 0x4373aa MOVSD (%RDI),%XMM9 |
(302) 0x4373af TEST $0x2,%R8B |
(302) 0x4373b3 JE 4373ba |
(302) 0x4373b5 MOVHPD (%RSI),%XMM9 |
(302) 0x4373ba MOVDQA -0x100(%RBP),%XMM10 |
(302) 0x4373c3 MOVAPD 0x537a4(%RIP),%XMM14 |
(302) 0x4373cc MOVAPD 0x5437b(%RIP),%XMM15 |
(302) 0x4373d5 TEST $0x1,%R8B |
(302) 0x4373d9 JE 4373e0 |
(302) 0x4373db MOVSD (%RDX),%XMM13 |
(302) 0x4373e0 MOVAPD %XMM7,%XMM11 |
(302) 0x4373e5 ANDPD %XMM14,%XMM11 |
(302) 0x4373ea TEST $0x2,%R8B |
(302) 0x4373ee JE 436d40 |
(302) 0x4373f4 MOVHPD (%RAX),%XMM13 |
(302) 0x4373f9 JMP 436d40 |
0x4373fe ADD $0x208,%RSP |
0x437405 POP %RBX |
0x437406 POP %R12 |
0x437408 POP %R13 |
0x43740a POP %R14 |
0x43740c POP %R15 |
0x43740e POP %RBP |
0x43740f RET |
0x437410 CMP %R13,-0xc8(%RBP) |
0x437417 JNE 437441 |
0x437419 MOV $0x4aa740,%EDI |
0x43741e MOV -0x54(%RBP),%ESI |
0x437421 ADD $0x208,%RSP |
0x437428 POP %RBX |
0x437429 POP %R12 |
0x43742b POP %R13 |
0x43742d POP %R14 |
0x43742f POP %R15 |
0x437431 POP %RBP |
0x437432 JMP 404050 |
0x437437 MOV -0x68(%RBP),%R14 |
0x43743b MOV -0x60(%RBP),%R10 |
0x43743f JMP 437444 |
0x437441 ADD %R13,%RCX |
0x437444 MOVAPD 0x53724(%RIP),%XMM1 |
0x43744c MOVSD 0x536bc(%RIP),%XMM2 |
0x437454 MOVSD 0x54334(%RIP),%XMM3 |
0x43745c MOVAPD 0x5431c(%RIP),%XMM4 |
0x437464 MOVAPD 0x53704(%RIP),%XMM5 |
0x43746c MOVSD 0x54324(%RIP),%XMM6 |
0x437474 MOV %R14,%R13 |
0x437477 JMP 4374b1 |
0x437479 NOPL (%RAX) |
(301) 0x437480 ADDSD %XMM8,%XMM11 |
(301) 0x437485 MULSD %XMM10,%XMM11 |
(301) 0x43748a MOV %R10,%RDX |
(301) 0x43748d IMUL %R10,%RSI |
(301) 0x437491 ADD %RAX,%RSI |
(301) 0x437494 MOV -0x80(%RBP),%RAX |
(301) 0x437498 MOVSD %XMM11,(%RAX,%RSI,8) |
(301) 0x43749e INC %RCX |
(301) 0x4374a1 CMP %RCX,-0xe8(%RBP) |
(301) 0x4374a8 MOV %R13,%R14 |
(301) 0x4374ab JE 437419 |
(301) 0x4374b1 MOV %RCX,%RDI |
(301) 0x4374b4 SHR $0x20,%RDI |
(301) 0x4374b8 JE 4374e0 |
(301) 0x4374ba MOV %RCX,%RAX |
(301) 0x4374bd XOR %EDX,%EDX |
(301) 0x4374bf MOV -0x30(%RBP),%R8 |
(301) 0x4374c3 DIV %R8 |
(301) 0x4374c6 MOV %RAX,%RSI |
(301) 0x4374c9 MOV -0x48(%RBP),%R11 |
(301) 0x4374cd TEST %RDI,%RDI |
(301) 0x4374d0 JE 4374f6 |
(301) 0x4374d2 MOV %RCX,%RAX |
(301) 0x4374d5 CQTO |
(301) 0x4374d7 IDIV %R8 |
(301) 0x4374da JMP 4374fd |
0x4374dc NOPL (%RAX) |
(301) 0x4374e0 MOV %ECX,%EAX |
(301) 0x4374e2 XOR %EDX,%EDX |
(301) 0x4374e4 MOV -0x30(%RBP),%R8 |
(301) 0x4374e8 DIV %R8D |
(301) 0x4374eb MOV %EAX,%ESI |
(301) 0x4374ed MOV -0x48(%RBP),%R11 |
(301) 0x4374f1 TEST %RDI,%RDI |
(301) 0x4374f4 JNE 4374d2 |
(301) 0x4374f6 MOV %ECX,%EAX |
(301) 0x4374f8 XOR %EDX,%EDX |
(301) 0x4374fa DIV %R8D |
(301) 0x4374fd MOV -0x78(%RBP),%R8 |
(301) 0x437501 ADD -0x90(%RBP),%RSI |
(301) 0x437508 LEA (%RDX,%R11,1),%R9D |
(301) 0x43750c MOVSXD %R9D,%RAX |
(301) 0x43750f MOVSXD %ESI,%RSI |
(301) 0x437512 MOV %R14,%RDI |
(301) 0x437515 IMUL %RSI,%RDI |
(301) 0x437519 ADD %RAX,%RDI |
(301) 0x43751c MOVSD (%R8,%RDI,8),%XMM8 |
(301) 0x437522 PXOR %XMM0,%XMM0 |
(301) 0x437526 UCOMISD %XMM8,%XMM0 |
(301) 0x43752b LEA -0x1(%RDX,%R11,1),%EDX |
(301) 0x437530 JAE 437550 |
(301) 0x437532 ADD $-0x2,%R9D |
(301) 0x437536 MOVSXD %EDX,%R8 |
(301) 0x437539 MOVSXD %R9D,%RDX |
(301) 0x43753c MOV %RAX,%RDI |
(301) 0x43753f MOV %R8,%R11 |
(301) 0x437542 JMP 43756a |
0x437544 NOPW %CS:(%RAX,%RAX,1) |
(301) 0x437550 INC %R9D |
(301) 0x437553 MOV -0x38(%RBP),%RDI |
(301) 0x437557 CMP %R9D,%EDI |
(301) 0x43755a CMOVL %EDI,%R9D |
(301) 0x43755e MOVSXD %EDX,%RDI |
(301) 0x437561 MOVSXD %R9D,%RDX |
(301) 0x437564 MOV %RDX,%R8 |
(301) 0x437567 MOV %RAX,%R11 |
(301) 0x43756a MOV -0x40(%RBP),%R9 |
(301) 0x43756e MOV -0x50(%RBP),%RBX |
(301) 0x437572 MOV -0x70(%RBP),%R14 |
(301) 0x437576 MOVAPD %XMM8,%XMM14 |
(301) 0x43757b ANDPD %XMM1,%XMM14 |
(301) 0x437580 IMUL %RSI,%R9 |
(301) 0x437584 ADD %R11,%R9 |
(301) 0x437587 DIVSD (%RBX,%R9,8),%XMM14 |
(301) 0x43758d MOVAPD %XMM14,%XMM7 |
(301) 0x437592 ADDSD %XMM2,%XMM7 |
(301) 0x437596 MOV -0xd0(%RBP),%RBX |
(301) 0x43759d MULSD (%RBX,%RAX,8),%XMM7 |
(301) 0x4375a2 DIVSD (%RBX,%R8,8),%XMM7 |
(301) 0x4375a8 MOV %R14,%RBX |
(301) 0x4375ab IMUL %RSI,%RBX |
(301) 0x4375af LEA (%RBX,%R11,1),%R8 |
(301) 0x4375b3 MOVSD (%R12,%R8,8),%XMM12 |
(301) 0x4375b9 LEA (%RBX,%RDX,1),%R14 |
(301) 0x4375bd MOVAPD %XMM12,%XMM15 |
(301) 0x4375c2 SUBSD (%R12,%R14,8),%XMM15 |
(301) 0x4375c8 ADD %RDI,%RBX |
(301) 0x4375cb MOVSD (%R12,%RBX,8),%XMM13 |
(301) 0x4375d1 MOVAPD %XMM3,%XMM9 |
(301) 0x4375d6 SUBSD %XMM14,%XMM9 |
(301) 0x4375db SUBSD %XMM12,%XMM13 |
(301) 0x4375e0 MOVAPD %XMM13,%XMM10 |
(301) 0x4375e5 MULSD %XMM15,%XMM10 |
(301) 0x4375ea XORPD %XMM11,%XMM11 |
(301) 0x4375ef UCOMISD %XMM11,%XMM10 |
(301) 0x4375f4 XORPD %XMM10,%XMM10 |
(301) 0x4375f9 JBE 437660 |
(301) 0x4375fb MOVAPD %XMM2,%XMM10 |
(301) 0x437600 SUBSD %XMM14,%XMM10 |
(301) 0x437605 XORPD %XMM14,%XMM14 |
(301) 0x43760a CMPSD $0x1,%XMM13,%XMM14 |
(301) 0x437610 MOVAPD %XMM14,%XMM0 |
(301) 0x437615 ANDPD %XMM10,%XMM0 |
(301) 0x43761a XORPD %XMM4,%XMM10 |
(301) 0x43761f ANDNPD %XMM10,%XMM14 |
(301) 0x437624 ORPD %XMM0,%XMM14 |
(301) 0x437629 ANDPD %XMM5,%XMM15 |
(301) 0x43762e ANDPD %XMM5,%XMM13 |
(301) 0x437633 MOVAPD %XMM15,%XMM0 |
(301) 0x437638 MINSD %XMM13,%XMM0 |
(301) 0x43763d MULSD %XMM7,%XMM15 |
(301) 0x437642 MULSD %XMM9,%XMM13 |
(301) 0x437647 ADDSD %XMM15,%XMM13 |
(301) 0x43764c MULSD %XMM6,%XMM13 |
(301) 0x437651 MINSD %XMM0,%XMM13 |
(301) 0x437656 MULSD %XMM14,%XMM13 |
(301) 0x43765b MOVAPD %XMM13,%XMM10 |
(301) 0x437660 ADDSD %XMM12,%XMM10 |
(301) 0x437665 MULSD %XMM8,%XMM10 |
(301) 0x43766a MOV -0x88(%RBP),%RBX |
(301) 0x437671 IMUL %RSI,%RBX |
(301) 0x437675 ADD %RAX,%RBX |
(301) 0x437678 MOV -0xe0(%RBP),%R14 |
(301) 0x43767f MOVSD %XMM10,(%R14,%RBX,8) |
(301) 0x437685 MOV -0xd8(%RBP),%RBX |
(301) 0x43768c IMUL %RSI,%RBX |
(301) 0x437690 ADD %RBX,%R11 |
(301) 0x437693 MOVSD (%R15,%R11,8),%XMM8 |
(301) 0x437699 ADD %RBX,%RDX |
(301) 0x43769c MOVAPD %XMM8,%XMM13 |
(301) 0x4376a1 SUBSD (%R15,%RDX,8),%XMM13 |
(301) 0x4376a7 ADD %RDI,%RBX |
(301) 0x4376aa MOVSD (%R15,%RBX,8),%XMM12 |
(301) 0x4376b0 SUBSD %XMM8,%XMM12 |
(301) 0x4376b5 MOVAPD %XMM12,%XMM0 |
(301) 0x4376ba MULSD %XMM13,%XMM0 |
(301) 0x4376bf UCOMISD %XMM11,%XMM0 |
(301) 0x4376c4 JBE 437480 |
(301) 0x4376ca MOVAPD %XMM10,%XMM0 |
(301) 0x4376cf ANDPD %XMM5,%XMM0 |
(301) 0x4376d3 MOV -0x50(%RBP),%RDX |
(301) 0x4376d7 MOVSD (%RDX,%R9,8),%XMM11 |
(301) 0x4376dd MULSD (%R12,%R8,8),%XMM11 |
(301) 0x4376e3 DIVSD %XMM11,%XMM0 |
(301) 0x4376e8 MOVAPD %XMM2,%XMM11 |
(301) 0x4376ed SUBSD %XMM0,%XMM11 |
(301) 0x4376f2 XORPD %XMM0,%XMM0 |
(301) 0x4376f6 CMPSD $0x1,%XMM12,%XMM0 |
(301) 0x4376fc MOVAPD %XMM0,%XMM14 |
(301) 0x437701 ANDPD %XMM11,%XMM14 |
(301) 0x437706 XORPD %XMM4,%XMM11 |
(301) 0x43770b ANDNPD %XMM11,%XMM0 |
(301) 0x437710 ORPD %XMM14,%XMM0 |
(301) 0x437715 ANDPD %XMM5,%XMM13 |
(301) 0x43771a ANDPD %XMM5,%XMM12 |
(301) 0x43771f MOVAPD %XMM13,%XMM11 |
(301) 0x437724 MINSD %XMM12,%XMM11 |
(301) 0x437729 MULSD %XMM7,%XMM13 |
(301) 0x43772e MULSD %XMM9,%XMM12 |
(301) 0x437733 ADDSD %XMM13,%XMM12 |
(301) 0x437738 MULSD %XMM6,%XMM12 |
(301) 0x43773d MINSD %XMM11,%XMM12 |
(301) 0x437742 MULSD %XMM0,%XMM12 |
(301) 0x437747 MOVAPD %XMM12,%XMM11 |
(301) 0x43774c JMP 437480 |
0x437751 NOPW %CS:(%RAX,%RAX,1) |
Path / |
Source file and lines | advec_cell.cpp:65-110 |
Module | exec |
nb instructions | 192 |
nb uops | 201 |
loop length | 945 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 10 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 49 |
micro-operation queue | 33.50 cycles |
front end | 33.50 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 7.50 | 7.50 | 7.50 | 7.50 | 5.00 | 30.67 | 30.67 | 30.67 | 8.00 | 8.00 | 8.00 | 8.00 | 8.50 | 8.50 |
cycles | 7.50 | 7.50 | 7.50 | 7.50 | 5.00 | 30.67 | 30.67 | 30.67 | 8.00 | 8.00 | 8.00 | 8.00 | 8.50 | 8.50 |
Cycles executing div or sqrt instructions | NA |
Front-end | 33.50 |
Dispatch | 30.67 |
Overall L1 | 33.50 |
all | 33% |
load | 5% |
store | 39% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 14% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 45% |
all | 62% |
load | 62% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 35% |
load | 22% |
store | 39% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 14% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 45% |
all | 16% |
load | 12% |
store | 16% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 13% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 17% |
all | 20% |
load | 20% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 16% |
load | 14% |
store | 16% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 13% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 17% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB $0x208,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R8,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x50(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x40(%RBP),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x38(%RBP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x30(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R8,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x28(%RBP),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x20(%RBP),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x18(%RBP),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RBP),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVL $0,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
TEST %RAX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JS 4373fe <_Z17advec_cell_kerneliiiiiiRN6clover8Buffer1DIdEES2_RNS_8Buffer2DIdEES5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_.extracted.27+0x9ce> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %RCX,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R9,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RSI,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R10,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVQ $0,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RAX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVQ $0x1,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0xf0(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x58(%RBP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0xa0(%RBP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x98(%RBP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x4aa720,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %ESI,-0x54(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CALL 404240 <__kmpc_for_static_init_8@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0xa0(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x98(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %RAX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JA 437419 <_Z17advec_cell_kerneliiiiiiRN6clover8Buffer1DIdEES2_RNS_8Buffer2DIdEES5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_.extracted.27+0x9e9> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x30(%RBP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x48(%RBP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %ESI,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%R15),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%R15),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R14),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%R14),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0xb0(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x8(%RAX),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R12),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%R12),%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RBX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%RBX),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0xc0(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RAX),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RAX),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R13),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%R13),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD $0x2,%EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
INC %RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDI,-0xe8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB %RCX,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $-0x2,%R13D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDI,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
AND %RDI,%R13 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R11,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R8,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x40(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R9,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R14,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R11,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RBX,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDI,-0xd8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R10,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
JE 437437 <_Z17advec_cell_kerneliiiiiiRN6clover8Buffer1DIdEES2_RNS_8Buffer2DIdEES5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_.extracted.27+0xa07> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOVD %EDX,%XMM0 | 1 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x210(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ -0x90(%RBP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x200(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVD %ESI,%XMM0 | 1 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
PSHUFD $0x50,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x1f0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOV -0x68(%RBP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVQ %RDX,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x1e0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %R9,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x1d0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVD %EAX,%XMM0 | 1 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
PSHUFD $0x50,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x1c0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %R8,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x1b0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %R14,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x1a0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %R10,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x190(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %R11,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x180(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %R12,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x170(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ -0x88(%RBP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x160(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %RBX,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x150(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %RDI,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x140(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %R15,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x130(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOV -0x60(%RBP),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVQ %R10,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x120(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOV -0x80(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVQ %RAX,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x110(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %RCX,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
PADDQ 0x5486f(%RIP),%XMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.50 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOVAPD 0x53e43(%RIP),%XMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOVAPD 0x54a1a(%RIP),%XMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOV %RDX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 436e24 <_Z17advec_cell_kerneliiiiiiRN6clover8Buffer1DIdEES2_RNS_8Buffer2DIdEES5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_.extracted.27+0x3f4> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
ADD $0x208,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %R13,-0xc8(%RBP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
JNE 437441 <_Z17advec_cell_kerneliiiiiiRN6clover8Buffer1DIdEES2_RNS_8Buffer2DIdEES5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_.extracted.27+0xa11> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV $0x4aa740,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0x54(%RBP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD $0x208,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
JMP 404050 <__kmpc_for_static_fini@plt> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
MOV -0x68(%RBP),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x60(%RBP),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
JMP 437444 <_Z17advec_cell_kerneliiiiiiRN6clover8Buffer1DIdEES2_RNS_8Buffer2DIdEES5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_.extracted.27+0xa14> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
ADD %R13,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVAPD 0x53724(%RIP),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOVSD 0x536bc(%RIP),%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSD 0x54334(%RIP),%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVAPD 0x5431c(%RIP),%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOVAPD 0x53704(%RIP),%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOVSD 0x54324(%RIP),%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R14,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4374b1 <_Z17advec_cell_kerneliiiiiiRN6clover8Buffer1DIdEES2_RNS_8Buffer2DIdEES5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_.extracted.27+0xa81> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
Source file and lines | advec_cell.cpp:65-110 |
Module | exec |
nb instructions | 192 |
nb uops | 201 |
loop length | 945 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 10 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 49 |
micro-operation queue | 33.50 cycles |
front end | 33.50 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 7.50 | 7.50 | 7.50 | 7.50 | 5.00 | 30.67 | 30.67 | 30.67 | 8.00 | 8.00 | 8.00 | 8.00 | 8.50 | 8.50 |
cycles | 7.50 | 7.50 | 7.50 | 7.50 | 5.00 | 30.67 | 30.67 | 30.67 | 8.00 | 8.00 | 8.00 | 8.00 | 8.50 | 8.50 |
Cycles executing div or sqrt instructions | NA |
Front-end | 33.50 |
Dispatch | 30.67 |
Overall L1 | 33.50 |
all | 33% |
load | 5% |
store | 39% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 14% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 45% |
all | 62% |
load | 62% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 35% |
load | 22% |
store | 39% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 14% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 45% |
all | 16% |
load | 12% |
store | 16% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 13% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 17% |
all | 20% |
load | 20% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 16% |
load | 14% |
store | 16% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 13% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 17% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB $0x208,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R8,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x50(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x40(%RBP),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x38(%RBP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x30(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R8,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x28(%RBP),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x20(%RBP),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x18(%RBP),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RBP),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVL $0,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
TEST %RAX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JS 4373fe <_Z17advec_cell_kerneliiiiiiRN6clover8Buffer1DIdEES2_RNS_8Buffer2DIdEES5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_.extracted.27+0x9ce> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %RCX,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R9,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RSI,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R10,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVQ $0,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RAX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVQ $0x1,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0xf0(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x58(%RBP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0xa0(%RBP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x98(%RBP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x4aa720,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %ESI,-0x54(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CALL 404240 <__kmpc_for_static_init_8@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0xa0(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x98(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %RAX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JA 437419 <_Z17advec_cell_kerneliiiiiiRN6clover8Buffer1DIdEES2_RNS_8Buffer2DIdEES5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_.extracted.27+0x9e9> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x30(%RBP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x48(%RBP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %ESI,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%R15),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%R15),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R14),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%R14),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0xb0(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x8(%RAX),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R12),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%R12),%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RBX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%RBX),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0xc0(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RAX),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RAX),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R13),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%R13),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD $0x2,%EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
INC %RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDI,-0xe8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB %RCX,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $-0x2,%R13D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDI,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
AND %RDI,%R13 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R11,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R8,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x40(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R9,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R14,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R11,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RBX,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDI,-0xd8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R10,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
JE 437437 <_Z17advec_cell_kerneliiiiiiRN6clover8Buffer1DIdEES2_RNS_8Buffer2DIdEES5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_.extracted.27+0xa07> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOVD %EDX,%XMM0 | 1 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x210(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ -0x90(%RBP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x200(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVD %ESI,%XMM0 | 1 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
PSHUFD $0x50,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x1f0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOV -0x68(%RBP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVQ %RDX,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x1e0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %R9,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x1d0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVD %EAX,%XMM0 | 1 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
PSHUFD $0x50,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x1c0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %R8,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x1b0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %R14,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x1a0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %R10,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x190(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %R11,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x180(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %R12,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x170(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ -0x88(%RBP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x160(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %RBX,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x150(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %RDI,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x140(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %R15,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x130(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOV -0x60(%RBP),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVQ %R10,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x120(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOV -0x80(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVQ %RAX,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
MOVDQA %XMM0,-0x110(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
MOVQ %RCX,%XMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 6 | 1 |
PSHUFD $0x44,%XMM0,%XMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 1 | 0.33 |
PADDQ 0x5486f(%RIP),%XMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.50 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOVAPD 0x53e43(%RIP),%XMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOVAPD 0x54a1a(%RIP),%XMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOV %RDX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 436e24 <_Z17advec_cell_kerneliiiiiiRN6clover8Buffer1DIdEES2_RNS_8Buffer2DIdEES5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_.extracted.27+0x3f4> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
ADD $0x208,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %R13,-0xc8(%RBP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
JNE 437441 <_Z17advec_cell_kerneliiiiiiRN6clover8Buffer1DIdEES2_RNS_8Buffer2DIdEES5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_.extracted.27+0xa11> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV $0x4aa740,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0x54(%RBP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD $0x208,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
JMP 404050 <__kmpc_for_static_fini@plt> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
MOV -0x68(%RBP),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x60(%RBP),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
JMP 437444 <_Z17advec_cell_kerneliiiiiiRN6clover8Buffer1DIdEES2_RNS_8Buffer2DIdEES5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_.extracted.27+0xa14> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
ADD %R13,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVAPD 0x53724(%RIP),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOVSD 0x536bc(%RIP),%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSD 0x54334(%RIP),%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVAPD 0x5431c(%RIP),%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOVAPD 0x53704(%RIP),%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOVSD 0x54324(%RIP),%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R14,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4374b1 <_Z17advec_cell_kerneliiiiiiRN6clover8Buffer1DIdEES2_RNS_8Buffer2DIdEES5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_.extracted.27+0xa81> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼_Z17advec_cell_kerneliiiiiiRN6clover8Buffer1DIdEES2_RNS_8Buffer2DIdEES5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_S5_.extracted.27– | 3.37 | 1.85 |
○Loop 302 - advec_cell.cpp:65-110 - exec | 3.37 | 1.85 |
○Loop 301 - advec_cell.cpp:65-110 - exec | 0 | 0 |