Function: _Z16flux_calc_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_.extracted | Module: exec | Source: flux_calc.cpp:36-40 [...] | Coverage: 0.86% |
---|
Function: _Z16flux_calc_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_.extracted | Module: exec | Source: flux_calc.cpp:36-40 [...] | Coverage: 0.86% |
---|
/home/eoseret/qaas_runs_CPU_9468/171-112-9712/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/context.h: 69 - 69 |
-------------------------------------------------------------------------------- |
69: T &operator()(size_t i, size_t j) const { return data[i + j * sizeX]; } |
/home/eoseret/qaas_runs_CPU_9468/171-112-9712/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/flux_calc.cpp: 36 - 40 |
-------------------------------------------------------------------------------- |
36: #pragma omp parallel for simd collapse(2) |
37: for (int j = (y_min + 1); j < (y_max + 1 + 2); j++) { |
38: for (int i = (x_min + 1); i < (x_max + 1 + 2); i++) { |
39: vol_flux_x(i, j) = 0.25 * dt * xarea(i, j) * (xvel0(i, j) + xvel0(i + 0, j + 1) + xvel1(i, j) + xvel1(i + 0, j + 1)); |
40: vol_flux_y(i, j) = 0.25 * dt * yarea(i, j) * (yvel0(i, j) + yvel0(i + 1, j + 0) + yvel1(i, j) + yvel1(i + 1, j + 0)); |
0x429f20 PUSH %RBP |
0x429f21 MOV %RSP,%RBP |
0x429f24 PUSH %R15 |
0x429f26 PUSH %R14 |
0x429f28 PUSH %R13 |
0x429f2a PUSH %R12 |
0x429f2c PUSH %RBX |
0x429f2d AND $-0x20,%RSP |
0x429f31 SUB $0x120,%RSP |
0x429f38 MOV %R9,%R15 |
0x429f3b MOV %RCX,%R12 |
0x429f3e MOV %RDX,%R13 |
0x429f41 MOV 0x58(%RBP),%RAX |
0x429f45 MOV 0x48(%RBP),%R10 |
0x429f49 MOV 0x40(%RBP),%R11 |
0x429f4d MOV 0x30(%RBP),%RDX |
0x429f51 MOV 0x28(%RBP),%R9 |
0x429f55 MOV 0x20(%RBP),%RSI |
0x429f59 MOV 0x18(%RBP),%R14 |
0x429f5d MOV 0x10(%RBP),%RBX |
0x429f61 MOV 0x38(%RBP),%ECX |
0x429f64 MOV %ECX,0x14(%RSP) |
0x429f68 MOVL $0,0x5c(%RSP) |
0x429f70 TEST %RAX,%RAX |
0x429f73 JS 42a5ea |
0x429f79 MOV %RBX,0x40(%RSP) |
0x429f7e MOV %R9,0x30(%RSP) |
0x429f83 MOV %RSI,0x48(%RSP) |
0x429f88 MOV %RDX,0x20(%RSP) |
0x429f8d MOV %R8,0x28(%RSP) |
0x429f92 MOV (%RDI),%ESI |
0x429f94 MOVQ $0,0x88(%RSP) |
0x429fa0 MOV %RAX,0x80(%RSP) |
0x429fa8 MOVQ $0x1,0xb8(%RSP) |
0x429fb4 SUB $0x8,%RSP |
0x429fb8 LEA 0xc0(%RSP),%RAX |
0x429fc0 LEA 0x64(%RSP),%RCX |
0x429fc5 LEA 0x90(%RSP),%R8 |
0x429fcd LEA 0x88(%RSP),%R9 |
0x429fd5 MOV $0x481080,%EDI |
0x429fda MOV %ESI,0x60(%RSP) |
0x429fde MOV $0x22,%EDX |
0x429fe3 PUSH $0x1 |
0x429fe5 PUSH $0x1 |
0x429fe7 PUSH %RAX |
0x429fe8 MOV %R10,%RBX |
0x429feb MOV %R11,0x38(%RSP) |
0x429ff0 CALL 4031e0 <__kmpc_for_static_init_8@plt> |
0x429ff5 ADD $0x20,%RSP |
0x429ff9 MOV 0x88(%RSP),%RSI |
0x42a001 MOV 0x80(%RSP),%RAX |
0x42a009 MOV %RAX,0x78(%RSP) |
0x42a00e CMP %RAX,%RSI |
0x42a011 JA 42a5cb |
0x42a017 MOV %RBX,%R10 |
0x42a01a VMOVQ %R13,%XMM0 |
0x42a01f VMULSD 0x3a4c9(%RIP),%XMM0,%XMM12 |
0x42a027 SUB 0x18(%RSP),%R10D |
0x42a02c MOV (%R12),%RAX |
0x42a030 MOV %RAX,0x50(%RSP) |
0x42a035 MOV 0x10(%R12),%RAX |
0x42a03a MOV %RAX,0x38(%RSP) |
0x42a03f MOV (%R15),%RAX |
0x42a042 MOV %RAX,0x70(%RSP) |
0x42a047 MOV 0x10(%R15),%RBX |
0x42a04b MOV (%R14),%RAX |
0x42a04e MOV %RAX,0x68(%RSP) |
0x42a053 MOV 0x10(%R14),%RDI |
0x42a057 LEA 0x1(%RSI),%RAX |
0x42a05b MOV 0x78(%RSP),%RCX |
0x42a060 LEA 0x1(%RCX),%R15 |
0x42a064 CMP %R15,%RAX |
0x42a067 CMOVG %RAX,%R15 |
0x42a06b MOV 0x30(%RSP),%RAX |
0x42a070 MOV (%RAX),%RCX |
0x42a073 MOV 0x10(%RAX),%RAX |
0x42a077 MOV %RAX,0x30(%RSP) |
0x42a07c MOV 0x28(%RSP),%RAX |
0x42a081 MOV (%RAX),%R9 |
0x42a084 MOV 0x10(%RAX),%RAX |
0x42a088 MOV %RAX,0x28(%RSP) |
0x42a08d MOV 0x40(%RSP),%RAX |
0x42a092 MOV (%RAX),%R11 |
0x42a095 MOV 0x10(%RAX),%R14 |
0x42a099 MOV 0x48(%RSP),%RAX |
0x42a09e MOV (%RAX),%R13 |
0x42a0a1 MOV 0x10(%RAX),%R12 |
0x42a0a5 MOV 0x20(%RSP),%RAX |
0x42a0aa MOV (%RAX),%RDX |
0x42a0ad MOV 0x10(%RAX),%RAX |
0x42a0b1 SUB %RSI,%R15 |
0x42a0b4 MOV $-0x8,%R8D |
0x42a0ba MOV %R15,0x98(%RSP) |
0x42a0c2 AND %R15,%R8 |
0x42a0c5 MOV 0x70(%RSP),%R15 |
0x42a0ca MOV %R8,0x60(%RSP) |
0x42a0cf MOV 0x68(%RSP),%R8 |
0x42a0d4 MOV %R9,0x48(%RSP) |
0x42a0d9 MOV %R11,0x40(%RSP) |
0x42a0de MOV %R13,0xa8(%RSP) |
0x42a0e6 MOV %RDX,0xa0(%RSP) |
0x42a0ee MOV %RAX,0x20(%RSP) |
0x42a0f3 MOV %RCX,0xb0(%RSP) |
0x42a0fb JE 42a5f9 |
0x42a101 MOV %R10,0x90(%RSP) |
0x42a109 VPBROADCASTQ %R10,%YMM8 |
0x42a10f MOV 0x14(%RSP),%EAX |
0x42a113 VPBROADCASTD %EAX,%YMM0 |
0x42a119 VMOVDQU %YMM0,0xe0(%RSP) |
0x42a122 MOV 0x18(%RSP),%RAX |
0x42a127 VPBROADCASTD %EAX,%YMM0 |
0x42a12d VMOVDQU %YMM0,0xc0(%RSP) |
0x42a136 MOV 0x50(%RSP),%RAX |
0x42a13b VPBROADCASTQ %RAX,%YMM15 |
0x42a141 VBROADCASTSD %XMM12,%YMM16 |
0x42a147 VPBROADCASTQ %R15,%YMM17 |
0x42a14d VPBROADCASTQ %R8,%YMM18 |
0x42a153 VPBROADCASTQ %RCX,%YMM19 |
0x42a159 VPBROADCASTQ %R9,%YMM20 |
0x42a15f VPBROADCASTQ %R11,%YMM21 |
0x42a165 VPBROADCASTQ %R13,%YMM22 |
0x42a16b VPBROADCASTQ %RSI,%YMM0 |
0x42a171 VPADDQ 0x3a507(%RIP),%YMM0,%YMM9 |
0x42a179 VPADDQ 0x3a37f(%RIP),%YMM0,%YMM10 |
0x42a181 VPBROADCASTQ %RDX,%YMM23 |
0x42a187 XOR %R13D,%R13D |
0x42a18a VPCMPEQD %YMM13,%YMM13,%YMM13 |
0x42a18f VPBROADCASTQ 0x3a507(%RIP),%YMM25 |
0x42a199 NOPL (%RAX) |
(227) 0x42a1a0 VMOVDQA %YMM10,%YMM0 |
(227) 0x42a1a4 VMOVDQA %YMM8,%YMM1 |
(227) 0x42a1a8 MOV $0x452aa0,%R15 |
(227) 0x42a1af CALL %R15 |
(227) 0x42a1b2 VMOVDQA %YMM0,%YMM11 |
(227) 0x42a1b6 VMOVDQA %YMM9,%YMM0 |
(227) 0x42a1ba VMOVDQA %YMM8,%YMM1 |
(227) 0x42a1be CALL %R15 |
(227) 0x42a1c1 VPMOVQD %YMM11,%XMM1 |
(227) 0x42a1c7 VPMOVQD %YMM0,%XMM0 |
(227) 0x42a1cd VINSERTI128 $0x1,%XMM0,%YMM1,%YMM0 |
(227) 0x42a1d3 VPADDD 0xe0(%RSP),%YMM0,%YMM26 |
(227) 0x42a1db VMOVDQA %YMM10,%YMM0 |
(227) 0x42a1df VMOVDQA %YMM8,%YMM1 |
(227) 0x42a1e3 MOV $0x452870,%R15 |
(227) 0x42a1ea CALL %R15 |
(227) 0x42a1ed VMOVDQA %YMM0,%YMM11 |
(227) 0x42a1f1 VMOVDQA %YMM9,%YMM0 |
(227) 0x42a1f5 VMOVDQA %YMM8,%YMM1 |
(227) 0x42a1f9 CALL %R15 |
(227) 0x42a1fc MOV 0x28(%RSP),%RCX |
(227) 0x42a201 MOV 0x30(%RSP),%RAX |
(227) 0x42a206 VPMOVQD %YMM11,%XMM2 |
(227) 0x42a20c VPMOVQD %YMM0,%XMM3 |
(227) 0x42a212 VPMOVSXDQ %XMM26,%YMM0 |
(227) 0x42a218 VEXTRACTI32X4 $0x1,%YMM26,%XMM1 |
(227) 0x42a21f VPMOVSXDQ %XMM1,%YMM1 |
(227) 0x42a224 VXORPS %XMM5,%XMM5,%XMM5 |
(227) 0x42a228 VPMULLQ %YMM1,%YMM15,%YMM5 |
(227) 0x42a22e VXORPS %XMM6,%XMM6,%XMM6 |
(227) 0x42a232 VPMULLQ %YMM0,%YMM15,%YMM6 |
(227) 0x42a238 VXORPS %XMM7,%XMM7,%XMM7 |
(227) 0x42a23c VPMULLQ %YMM1,%YMM17,%YMM7 |
(227) 0x42a242 VINSERTI128 $0x1,%XMM3,%YMM2,%YMM2 |
(227) 0x42a248 VPADDD 0xc0(%RSP),%YMM2,%YMM4 |
(227) 0x42a251 VXORPS %XMM3,%XMM3,%XMM3 |
(227) 0x42a255 VPMULLQ %YMM0,%YMM17,%YMM3 |
(227) 0x42a25b VPMOVSXDQ %XMM4,%YMM2 |
(227) 0x42a260 VPSUBD %YMM13,%YMM26,%YMM11 |
(227) 0x42a266 VPMOVSXDQ %XMM11,%YMM26 |
(227) 0x42a26c VPXORD %XMM27,%XMM27,%XMM27 |
(227) 0x42a272 VPMULLQ %YMM26,%YMM17,%YMM27 |
(227) 0x42a278 VPADDQ %YMM2,%YMM3,%YMM3 |
(227) 0x42a27c KXNORW %K0,%K0,%K1 |
(227) 0x42a280 VXORPD %XMM28,%XMM28,%XMM28 |
(227) 0x42a286 VPMULLQ %YMM0,%YMM18,%YMM29 |
(227) 0x42a28c VGATHERQPD (%RBX,%YMM3,8),%YMM28{%K1} |
(227) 0x42a293 VPADDQ %YMM2,%YMM27,%YMM3 |
(227) 0x42a299 VPADDQ %YMM2,%YMM29,%YMM27 |
(227) 0x42a29f KXNORW %K0,%K0,%K1 |
(227) 0x42a2a3 VPXORD %XMM29,%XMM29,%XMM29 |
(227) 0x42a2a9 VGATHERQPD (%RDI,%YMM27,8),%YMM29{%K1} |
(227) 0x42a2b0 KXNORW %K0,%K0,%K1 |
(227) 0x42a2b4 VXORPD %XMM27,%XMM27,%XMM27 |
(227) 0x42a2ba VPMULLQ %YMM26,%YMM18,%YMM26 |
(227) 0x42a2c0 VGATHERQPD (%RBX,%YMM3,8),%YMM27{%K1} |
(227) 0x42a2c7 VEXTRACTI128 $0x1,%YMM4,%XMM3 |
(227) 0x42a2cd VPMOVSXDQ %XMM3,%YMM3 |
(227) 0x42a2d2 VPADDQ %YMM2,%YMM26,%YMM26 |
(227) 0x42a2d8 KXNORW %K0,%K0,%K1 |
(227) 0x42a2dc VXORPD %XMM30,%XMM30,%XMM30 |
(227) 0x42a2e2 VGATHERQPD (%RDI,%YMM26,8),%YMM30{%K1} |
(227) 0x42a2e9 VEXTRACTI128 $0x1,%YMM11,%XMM11 |
(227) 0x42a2ef VPMOVSXDQ %XMM11,%YMM11 |
(227) 0x42a2f4 VPXORD %XMM26,%XMM26,%XMM26 |
(227) 0x42a2fa VPMULLQ %YMM11,%YMM17,%YMM26 |
(227) 0x42a300 VPADDQ %YMM3,%YMM7,%YMM7 |
(227) 0x42a304 KXNORW %K0,%K0,%K1 |
(227) 0x42a308 VXORPD %XMM31,%XMM31,%XMM31 |
(227) 0x42a30e VPMULLQ %YMM1,%YMM18,%YMM24 |
(227) 0x42a314 VGATHERQPD (%RBX,%YMM7,8),%YMM31{%K1} |
(227) 0x42a31b VPADDQ %YMM3,%YMM26,%YMM7 |
(227) 0x42a321 VPADDQ %YMM3,%YMM24,%YMM24 |
(227) 0x42a327 KXNORW %K0,%K0,%K1 |
(227) 0x42a32b VPXORD %XMM26,%XMM26,%XMM26 |
(227) 0x42a331 VGATHERQPD (%RDI,%YMM24,8),%YMM26{%K1} |
(227) 0x42a338 KXNORW %K0,%K0,%K1 |
(227) 0x42a33c VXORPD %XMM24,%XMM24,%XMM24 |
(227) 0x42a342 VPMULLQ %YMM11,%YMM18,%YMM11 |
(227) 0x42a348 VGATHERQPD (%RBX,%YMM7,8),%YMM24{%K1} |
(227) 0x42a34f VPADDQ %YMM3,%YMM11,%YMM7 |
(227) 0x42a353 KXNORW %K0,%K0,%K1 |
(227) 0x42a357 VPXOR %XMM11,%XMM11,%XMM11 |
(227) 0x42a35c VGATHERQPD (%RDI,%YMM7,8),%YMM11{%K1} |
(227) 0x42a363 VPADDQ %YMM2,%YMM6,%YMM6 |
(227) 0x42a367 KXNORW %K0,%K0,%K1 |
(227) 0x42a36b VXORPD %XMM7,%XMM7,%XMM7 |
(227) 0x42a36f MOV 0x38(%RSP),%RDX |
(227) 0x42a374 VGATHERQPD (%RDX,%YMM6,8),%YMM7{%K1} |
(227) 0x42a37b VPADDQ %YMM3,%YMM5,%YMM5 |
(227) 0x42a37f KXNORW %K0,%K0,%K1 |
(227) 0x42a383 VXORPD %XMM6,%XMM6,%XMM6 |
(227) 0x42a387 VGATHERQPD (%RDX,%YMM5,8),%YMM6{%K1} |
(227) 0x42a38e VXORPS %XMM5,%XMM5,%XMM5 |
(227) 0x42a392 VPMULLQ %YMM0,%YMM19,%YMM5 |
(227) 0x42a398 VMULPD %YMM16,%YMM7,%YMM7 |
(227) 0x42a39e VPMULLQ %YMM1,%YMM19,%YMM14 |
(227) 0x42a3a4 VMULPD %YMM16,%YMM6,%YMM6 |
(227) 0x42a3aa VADDPD %YMM29,%YMM28,%YMM28 |
(227) 0x42a3b0 VADDPD %YMM26,%YMM31,%YMM26 |
(227) 0x42a3b6 VPXORD %XMM29,%XMM29,%XMM29 |
(227) 0x42a3bc VPMULLQ %YMM1,%YMM20,%YMM29 |
(227) 0x42a3c2 VADDPD %YMM11,%YMM24,%YMM11 |
(227) 0x42a3c8 VADDPD %YMM30,%YMM27,%YMM24 |
(227) 0x42a3ce VADDPD %YMM28,%YMM24,%YMM24 |
(227) 0x42a3d4 VPXORD %XMM27,%XMM27,%XMM27 |
(227) 0x42a3da VPMULLQ %YMM0,%YMM20,%YMM27 |
(227) 0x42a3e0 VADDPD %YMM26,%YMM11,%YMM11 |
(227) 0x42a3e6 VPADDQ %YMM3,%YMM14,%YMM14 |
(227) 0x42a3ea VPADDQ %YMM2,%YMM5,%YMM5 |
(227) 0x42a3ee VPXORD %XMM26,%XMM26,%XMM26 |
(227) 0x42a3f4 VPMULLQ %YMM1,%YMM21,%YMM26 |
(227) 0x42a3fa VMULPD %YMM24,%YMM7,%YMM7 |
(227) 0x42a400 KXNORW %K0,%K0,%K1 |
(227) 0x42a404 KXNORW %K0,%K0,%K2 |
(227) 0x42a408 VPXORD %XMM24,%XMM24,%XMM24 |
(227) 0x42a40e VPMULLQ %YMM0,%YMM21,%YMM24 |
(227) 0x42a414 VMULPD %YMM6,%YMM11,%YMM6 |
(227) 0x42a418 VPADDQ %YMM2,%YMM24,%YMM11 |
(227) 0x42a41e VSCATTERQPD %YMM7,(%RAX,%YMM5,8){%K1} |
(227) 0x42a425 VPADDQ %YMM3,%YMM26,%YMM5 |
(227) 0x42a42b VSCATTERQPD %YMM6,(%RAX,%YMM14,8){%K2} |
(227) 0x42a432 KXNORW %K0,%K0,%K1 |
(227) 0x42a436 VXORPD %XMM6,%XMM6,%XMM6 |
(227) 0x42a43a KXNORW %K0,%K0,%K2 |
(227) 0x42a43e VXORPD %XMM7,%XMM7,%XMM7 |
(227) 0x42a442 VPSUBD %YMM13,%YMM4,%YMM4 |
(227) 0x42a447 VGATHERQPD (%R14,%YMM5,8),%YMM6{%K1} |
(227) 0x42a44e VEXTRACTI128 $0x1,%YMM4,%XMM5 |
(227) 0x42a454 VPMOVSXDQ %XMM5,%YMM5 |
(227) 0x42a459 VPMOVSXDQ %XMM4,%YMM4 |
(227) 0x42a45e VPADDQ %YMM4,%YMM24,%YMM14 |
(227) 0x42a464 VPADDQ %YMM5,%YMM26,%YMM24 |
(227) 0x42a46a VGATHERQPD (%R14,%YMM11,8),%YMM7{%K2} |
(227) 0x42a471 KXNORW %K0,%K0,%K1 |
(227) 0x42a475 VXORPD %XMM11,%XMM11,%XMM11 |
(227) 0x42a47a VPXORD %XMM26,%XMM26,%XMM26 |
(227) 0x42a480 VPMULLQ %YMM0,%YMM22,%YMM26 |
(227) 0x42a486 VGATHERQPD (%R14,%YMM24,8),%YMM11{%K1} |
(227) 0x42a48d KXNORW %K0,%K0,%K1 |
(227) 0x42a491 VXORPD %XMM24,%XMM24,%XMM24 |
(227) 0x42a497 VPXORD %XMM28,%XMM28,%XMM28 |
(227) 0x42a49d VPMULLQ %YMM1,%YMM22,%YMM28 |
(227) 0x42a4a3 VGATHERQPD (%R14,%YMM14,8),%YMM24{%K1} |
(227) 0x42a4aa VPADDQ %YMM2,%YMM26,%YMM14 |
(227) 0x42a4b0 KXNORW %K0,%K0,%K1 |
(227) 0x42a4b4 VXORPD %XMM30,%XMM30,%XMM30 |
(227) 0x42a4ba VGATHERQPD (%R12,%YMM14,8),%YMM30{%K1} |
(227) 0x42a4c1 VPADDQ %YMM3,%YMM28,%YMM14 |
(227) 0x42a4c7 KXNORW %K0,%K0,%K1 |
(227) 0x42a4cb VXORPD %XMM31,%XMM31,%XMM31 |
(227) 0x42a4d1 VGATHERQPD (%R12,%YMM14,8),%YMM31{%K1} |
(227) 0x42a4d8 VPADDQ %YMM5,%YMM28,%YMM5 |
(227) 0x42a4de KXNORW %K0,%K0,%K1 |
(227) 0x42a4e2 VXORPD %XMM14,%XMM14,%XMM14 |
(227) 0x42a4e7 VGATHERQPD (%R12,%YMM5,8),%YMM14{%K1} |
(227) 0x42a4ee VPADDQ %YMM4,%YMM26,%YMM4 |
(227) 0x42a4f4 KXNORW %K0,%K0,%K1 |
(227) 0x42a4f8 VXORPD %XMM5,%XMM5,%XMM5 |
(227) 0x42a4fc VGATHERQPD (%R12,%YMM4,8),%YMM5{%K1} |
(227) 0x42a503 VPADDQ %YMM3,%YMM29,%YMM4 |
(227) 0x42a509 KXNORW %K0,%K0,%K1 |
(227) 0x42a50d VPXORD %XMM26,%XMM26,%XMM26 |
(227) 0x42a513 VGATHERQPD (%RCX,%YMM4,8),%YMM26{%K1} |
(227) 0x42a51a VPADDQ %YMM2,%YMM27,%YMM4 |
(227) 0x42a520 KXNORW %K0,%K0,%K1 |
(227) 0x42a524 VPXORD %XMM27,%XMM27,%XMM27 |
(227) 0x42a52a VGATHERQPD (%RCX,%YMM4,8),%YMM27{%K1} |
(227) 0x42a531 VMULPD %YMM16,%YMM27,%YMM4 |
(227) 0x42a537 VMULPD %YMM16,%YMM26,%YMM26 |
(227) 0x42a53d VADDPD %YMM6,%YMM11,%YMM6 |
(227) 0x42a541 VADDPD %YMM7,%YMM24,%YMM7 |
(227) 0x42a547 VADDPD %YMM14,%YMM31,%YMM11 |
(227) 0x42a54d VADDPD %YMM6,%YMM11,%YMM6 |
(227) 0x42a551 VADDPD %YMM5,%YMM30,%YMM5 |
(227) 0x42a557 VADDPD %YMM5,%YMM7,%YMM5 |
(227) 0x42a55b VPMULLQ %YMM0,%YMM23,%YMM0 |
(227) 0x42a561 VMULPD %YMM6,%YMM26,%YMM6 |
(227) 0x42a567 VMULPD %YMM5,%YMM4,%YMM4 |
(227) 0x42a56b VPMULLQ %YMM1,%YMM23,%YMM1 |
(227) 0x42a571 VPADDQ %YMM2,%YMM0,%YMM0 |
(227) 0x42a575 VPADDQ %YMM3,%YMM1,%YMM1 |
(227) 0x42a579 KXNORW %K0,%K0,%K1 |
(227) 0x42a57d MOV 0x20(%RSP),%RAX |
(227) 0x42a582 VSCATTERQPD %YMM4,(%RAX,%YMM0,8){%K1} |
(227) 0x42a589 KXNORW %K0,%K0,%K1 |
(227) 0x42a58d VSCATTERQPD %YMM6,(%RAX,%YMM1,8){%K1} |
(227) 0x42a594 VPADDQ %YMM25,%YMM10,%YMM10 |
(227) 0x42a59a VPADDQ %YMM25,%YMM9,%YMM9 |
(227) 0x42a5a0 ADD $0x8,%R13 |
(227) 0x42a5a4 CMP 0x60(%RSP),%R13 |
(227) 0x42a5a9 JB 42a1a0 |
0x42a5af MOV 0x38(%RSP),%R15 |
0x42a5b4 MOV 0x60(%RSP),%RAX |
0x42a5b9 CMP %RAX,0x98(%RSP) |
0x42a5c1 MOV 0x90(%RSP),%R10 |
0x42a5c9 JNE 42a603 |
0x42a5cb MOV $0x4810a0,%EDI |
0x42a5d0 MOV 0x58(%RSP),%ESI |
0x42a5d4 LEA -0x28(%RBP),%RSP |
0x42a5d8 POP %RBX |
0x42a5d9 POP %R12 |
0x42a5db POP %R13 |
0x42a5dd POP %R14 |
0x42a5df POP %R15 |
0x42a5e1 POP %RBP |
0x42a5e2 VZEROUPPER |
0x42a5e5 JMP 403050 |
0x42a5ea LEA -0x28(%RBP),%RSP |
0x42a5ee POP %RBX |
0x42a5ef POP %R12 |
0x42a5f1 POP %R13 |
0x42a5f3 POP %R14 |
0x42a5f5 POP %R15 |
0x42a5f7 POP %RBP |
0x42a5f8 RET |
0x42a5f9 MOV 0x38(%RSP),%R15 |
0x42a5fe JMP 42a728 |
0x42a603 ADD %RAX,%RSI |
0x42a606 JMP 42a728 |
0x42a60b NOPL (%RAX,%RAX,1) |
(226) 0x42a610 MOV %RSI,%RAX |
(226) 0x42a613 CQTO |
(226) 0x42a615 IDIV %R10 |
(226) 0x42a618 MOV 0x18(%RSP),%RAX |
(226) 0x42a61d MOV 0x50(%RSP),%R8 |
(226) 0x42a622 ADD %EAX,%EDX |
(226) 0x42a624 MOVSXD %EDX,%RAX |
(226) 0x42a627 MOVSXD %ECX,%RCX |
(226) 0x42a62a MOV %R8,%RDX |
(226) 0x42a62d IMUL %RCX,%RDX |
(226) 0x42a631 ADD %RAX,%RDX |
(226) 0x42a634 MOV 0x70(%RSP),%R11 |
(226) 0x42a639 MOV %R11,%R8 |
(226) 0x42a63c IMUL %RCX,%R8 |
(226) 0x42a640 ADD %RAX,%R8 |
(226) 0x42a643 LEA 0x1(%RCX),%R9D |
(226) 0x42a647 MOVSXD %R9D,%R9 |
(226) 0x42a64a VMOVSD (%RBX,%R8,8),%XMM0 |
(226) 0x42a650 MOV 0x68(%RSP),%R13 |
(226) 0x42a655 MOV %R13,%R8 |
(226) 0x42a658 IMUL %RCX,%R8 |
(226) 0x42a65c ADD %RAX,%R8 |
(226) 0x42a65f VMOVSD (%RDI,%R8,8),%XMM1 |
(226) 0x42a665 IMUL %R9,%R11 |
(226) 0x42a669 ADD %RAX,%R11 |
(226) 0x42a66c IMUL %R13,%R9 |
(226) 0x42a670 ADD %RAX,%R9 |
(226) 0x42a673 VADDSD (%RBX,%R11,8),%XMM0,%XMM0 |
(226) 0x42a679 VADDSD (%RDI,%R9,8),%XMM1,%XMM1 |
(226) 0x42a67f VMULSD (%R15,%RDX,8),%XMM12,%XMM2 |
(226) 0x42a685 VADDSD %XMM0,%XMM1,%XMM0 |
(226) 0x42a689 VMULSD %XMM2,%XMM0,%XMM0 |
(226) 0x42a68d MOV 0xb0(%RSP),%RDX |
(226) 0x42a695 IMUL %RCX,%RDX |
(226) 0x42a699 ADD %RAX,%RDX |
(226) 0x42a69c MOV 0x30(%RSP),%R8 |
(226) 0x42a6a1 VMOVSD %XMM0,(%R8,%RDX,8) |
(226) 0x42a6a7 MOV 0x40(%RSP),%RDX |
(226) 0x42a6ac IMUL %RCX,%RDX |
(226) 0x42a6b0 LEA 0x1(%RDX,%RAX,1),%R8 |
(226) 0x42a6b5 ADD %RAX,%RDX |
(226) 0x42a6b8 VMOVSD (%R14,%RDX,8),%XMM0 |
(226) 0x42a6be MOV 0xa8(%RSP),%RDX |
(226) 0x42a6c6 IMUL %RCX,%RDX |
(226) 0x42a6ca LEA (%RDX,%RAX,1),%R9 |
(226) 0x42a6ce VMOVSD (%R12,%R9,8),%XMM1 |
(226) 0x42a6d4 VADDSD (%R14,%R8,8),%XMM0,%XMM0 |
(226) 0x42a6da LEA 0x1(%RDX,%RAX,1),%RDX |
(226) 0x42a6df VADDSD (%R12,%RDX,8),%XMM1,%XMM1 |
(226) 0x42a6e5 MOV 0x48(%RSP),%RDX |
(226) 0x42a6ea IMUL %RCX,%RDX |
(226) 0x42a6ee ADD %RAX,%RDX |
(226) 0x42a6f1 MOV 0x28(%RSP),%R8 |
(226) 0x42a6f6 VMULSD (%R8,%RDX,8),%XMM12,%XMM2 |
(226) 0x42a6fc IMUL 0xa0(%RSP),%RCX |
(226) 0x42a705 ADD %RAX,%RCX |
(226) 0x42a708 VADDSD %XMM0,%XMM1,%XMM0 |
(226) 0x42a70c VMULSD %XMM2,%XMM0,%XMM0 |
(226) 0x42a710 MOV 0x20(%RSP),%RAX |
(226) 0x42a715 VMOVSD %XMM0,(%RAX,%RCX,8) |
(226) 0x42a71a INC %RSI |
(226) 0x42a71d CMP 0x78(%RSP),%RSI |
(226) 0x42a722 JG 42a5cb |
(226) 0x42a728 MOV %RSI,%R8 |
(226) 0x42a72b SHR $0x20,%R8 |
(226) 0x42a72f JE 42a750 |
(226) 0x42a731 MOV %RSI,%RAX |
(226) 0x42a734 XOR %EDX,%EDX |
(226) 0x42a736 DIV %R10 |
(226) 0x42a739 MOV %RAX,%RCX |
(226) 0x42a73c ADD 0x14(%RSP),%ECX |
(226) 0x42a740 TEST %R8,%R8 |
(226) 0x42a743 JNE 42a610 |
(226) 0x42a749 JMP 42a766 |
0x42a74b NOPL (%RAX,%RAX,1) |
(226) 0x42a750 MOV %ESI,%EAX |
(226) 0x42a752 XOR %EDX,%EDX |
(226) 0x42a754 DIV %R10D |
(226) 0x42a757 MOV %EAX,%ECX |
(226) 0x42a759 ADD 0x14(%RSP),%ECX |
(226) 0x42a75d TEST %R8,%R8 |
(226) 0x42a760 JNE 42a610 |
(226) 0x42a766 MOV %ESI,%EAX |
(226) 0x42a768 XOR %EDX,%EDX |
(226) 0x42a76a DIV %R10D |
(226) 0x42a76d JMP 42a618 |
0x42a772 NOPW %CS:(%RAX,%RAX,1) |
0x42a77c NOPL (%RAX) |
Path / |
Source file and lines | flux_calc.cpp:36-40 |
Module | exec |
nb instructions | 161 |
nb uops | 163 |
loop length | 756 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 15 |
used zmm registers | 0 |
nb stack references | 36 |
micro-operation queue | 27.17 cycles |
front end | 27.17 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 6.07 | 5.93 | 21.00 | 21.00 | 20.00 | 14.00 | 6.00 | 20.00 | 20.00 | 20.00 | 6.00 | 21.00 |
cycles | 6.07 | 5.93 | 21.00 | 21.00 | 20.00 | 14.00 | 6.00 | 20.00 | 20.00 | 20.00 | 6.00 | 21.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 26.98 |
Stall cycles | 0.00 |
Front-end | 27.17 |
Dispatch | 21.00 |
Overall L1 | 27.17 |
all | 8% |
load | 11% |
store | 6% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 66% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 7% |
all | 0% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | 0% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 8% |
load | 11% |
store | 6% |
mul | 0% |
add-sub | 66% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 7% |
all | 14% |
load | 16% |
store | 13% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 35% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 13% |
all | 12% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | 12% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 14% |
load | 16% |
store | 13% |
mul | 12% |
add-sub | 35% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 13% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x120,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x40(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x28(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RBP),%ECX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %ECX,0x14(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVL $0,0x5c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 42a5ea <_Z16flux_calc_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_.extracted+0x6ca> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RBX,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVQ $0x1,0xb8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0xc0(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x64(%RSP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x90(%RSP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x88(%RSP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x481080,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x22,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %R10,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R11,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 4031e0 <__kmpc_for_static_init_8@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x20,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x88(%RSP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x80(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JA 42a5cb <_Z16flux_calc_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_.extracted+0x6ab> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RBX,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VMOVQ %R13,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VMULSD 0x3a4c9(%RIP),%XMM0,%XMM12 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
SUB 0x18(%RSP),%R10D | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV (%R12),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R12),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R15),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R14),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R14),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%RSI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x78(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%RCX),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %RAX,%R15 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %RSI,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $-0x8,%R8D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R15,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
AND %R15,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV 0x70(%RSP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R8,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x68(%RSP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 42a5f9 <_Z16flux_calc_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_.extracted+0x6d9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R10,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ %R10,%YMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0x14(%RSP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTD %EAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV 0x18(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTD %EAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV 0x50(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %RAX,%YMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM12,%YMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %R15,%YMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %R8,%YMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %RCX,%YMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %R9,%YMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %R11,%YMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %R13,%YMM22 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %RSI,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ 0x3a507(%RIP),%YMM0,%YMM9 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.40 |
VPADDQ 0x3a37f(%RIP),%YMM0,%YMM10 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.40 |
VPBROADCASTQ %RDX,%YMM23 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
XOR %R13D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPCMPEQD %YMM13,%YMM13,%YMM13 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPBROADCASTQ 0x3a507(%RIP),%YMM25 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x38(%RSP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x60(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RAX,0x98(%RSP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV 0x90(%RSP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 42a603 <_Z16flux_calc_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_.extracted+0x6e3> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x4810a0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x58(%RSP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JMP 403050 <__kmpc_for_static_fini@plt> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
MOV 0x38(%RSP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 42a728 <_Z16flux_calc_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_.extracted+0x808> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JMP 42a728 <_Z16flux_calc_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_.extracted+0x808> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | flux_calc.cpp:36-40 |
Module | exec |
nb instructions | 161 |
nb uops | 163 |
loop length | 756 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 15 |
used zmm registers | 0 |
nb stack references | 36 |
micro-operation queue | 27.17 cycles |
front end | 27.17 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 6.07 | 5.93 | 21.00 | 21.00 | 20.00 | 14.00 | 6.00 | 20.00 | 20.00 | 20.00 | 6.00 | 21.00 |
cycles | 6.07 | 5.93 | 21.00 | 21.00 | 20.00 | 14.00 | 6.00 | 20.00 | 20.00 | 20.00 | 6.00 | 21.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 26.98 |
Stall cycles | 0.00 |
Front-end | 27.17 |
Dispatch | 21.00 |
Overall L1 | 27.17 |
all | 8% |
load | 11% |
store | 6% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 66% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 7% |
all | 0% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | 0% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 8% |
load | 11% |
store | 6% |
mul | 0% |
add-sub | 66% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 7% |
all | 14% |
load | 16% |
store | 13% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 35% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 13% |
all | 12% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | 12% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 14% |
load | 16% |
store | 13% |
mul | 12% |
add-sub | 35% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 13% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x120,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x40(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x28(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RBP),%ECX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %ECX,0x14(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVL $0,0x5c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 42a5ea <_Z16flux_calc_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_.extracted+0x6ca> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RBX,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVQ $0x1,0xb8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0xc0(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x64(%RSP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x90(%RSP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x88(%RSP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x481080,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x22,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %R10,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R11,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 4031e0 <__kmpc_for_static_init_8@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x20,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x88(%RSP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x80(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JA 42a5cb <_Z16flux_calc_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_.extracted+0x6ab> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RBX,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VMOVQ %R13,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VMULSD 0x3a4c9(%RIP),%XMM0,%XMM12 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
SUB 0x18(%RSP),%R10D | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV (%R12),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R12),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R15),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R14),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R14),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%RSI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x78(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%RCX),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %RAX,%R15 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %RSI,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $-0x8,%R8D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R15,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
AND %R15,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV 0x70(%RSP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R8,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x68(%RSP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 42a5f9 <_Z16flux_calc_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_.extracted+0x6d9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R10,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ %R10,%YMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0x14(%RSP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTD %EAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV 0x18(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTD %EAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV 0x50(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %RAX,%YMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM12,%YMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %R15,%YMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %R8,%YMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %RCX,%YMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %R9,%YMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %R11,%YMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %R13,%YMM22 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %RSI,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ 0x3a507(%RIP),%YMM0,%YMM9 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.40 |
VPADDQ 0x3a37f(%RIP),%YMM0,%YMM10 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.40 |
VPBROADCASTQ %RDX,%YMM23 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
XOR %R13D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPCMPEQD %YMM13,%YMM13,%YMM13 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VPBROADCASTQ 0x3a507(%RIP),%YMM25 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x38(%RSP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x60(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RAX,0x98(%RSP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV 0x90(%RSP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 42a603 <_Z16flux_calc_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_.extracted+0x6e3> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x4810a0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x58(%RSP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JMP 403050 <__kmpc_for_static_fini@plt> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
MOV 0x38(%RSP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 42a728 <_Z16flux_calc_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_.extracted+0x808> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JMP 42a728 <_Z16flux_calc_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_.extracted+0x808> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼_Z16flux_calc_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_.extracted– | 0.86 | 1.21 |
○Loop 227 - flux_calc.cpp:36-40 - exec | 0.86 | 1.21 |
○Loop 226 - flux_calc.cpp:36-40 - exec | 0 | 0 |