Function: flux_calc_kernel(int, int, int, int, double, clover::Buffer2D<double>&, clover::Buffer2D<d ... | Module: exec | Source: flux_calc.cpp:36-41 [...] | Coverage: 0.88% |
---|
Function: flux_calc_kernel(int, int, int, int, double, clover::Buffer2D<double>&, clover::Buffer2D<d ... | Module: exec | Source: flux_calc.cpp:36-41 [...] | Coverage: 0.88% |
---|
/scratch_na/users/xoserete/qaas_runs/171-415-4969/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/flux_calc.cpp: 36 - 41 |
-------------------------------------------------------------------------------- |
36: #pragma omp parallel for simd collapse(2) |
37: for (int j = (y_min + 1); j < (y_max + 1 + 2); j++) { |
38: for (int i = (x_min + 1); i < (x_max + 1 + 2); i++) { |
39: vol_flux_x(i, j) = 0.25 * dt * xarea(i, j) * (xvel0(i, j) + xvel0(i + 0, j + 1) + xvel1(i, j) + xvel1(i + 0, j + 1)); |
40: vol_flux_y(i, j) = 0.25 * dt * yarea(i, j) * (yvel0(i, j) + yvel0(i + 1, j + 0) + yvel1(i, j) + yvel1(i + 1, j + 0)); |
41: } |
/scratch_na/users/xoserete/qaas_runs/171-415-4969/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/context.h: 69 - 69 |
-------------------------------------------------------------------------------- |
69: T &operator()(size_t i, size_t j) const { return data[i + j * sizeX]; } |
0x42b7d0 PUSH %RBP |
0x42b7d1 MOV %RSP,%RBP |
0x42b7d4 PUSH %R15 |
0x42b7d6 PUSH %R14 |
0x42b7d8 PUSH %R13 |
0x42b7da PUSH %R12 |
0x42b7dc PUSH %RBX |
0x42b7dd AND $-0x20,%RSP |
0x42b7e1 SUB $0x120,%RSP |
0x42b7e8 MOV %R9,%R15 |
0x42b7eb MOV %RCX,%R12 |
0x42b7ee MOV %RDX,%R13 |
0x42b7f1 MOV 0x58(%RBP),%RAX |
0x42b7f5 MOV 0x48(%RBP),%R10 |
0x42b7f9 MOV 0x40(%RBP),%R11 |
0x42b7fd MOV 0x30(%RBP),%RDX |
0x42b801 MOV 0x28(%RBP),%RBX |
0x42b805 MOV 0x20(%RBP),%RSI |
0x42b809 MOV 0x18(%RBP),%R14 |
0x42b80d MOV 0x10(%RBP),%R9 |
0x42b811 MOV 0x38(%RBP),%ECX |
0x42b814 MOV %ECX,0x4(%RSP) |
0x42b818 MOVL $0,0x44(%RSP) |
0x42b820 TEST %RAX,%RAX |
0x42b823 JS 42be8d |
0x42b829 MOV %RBX,0x18(%RSP) |
0x42b82e MOV %R9,0x20(%RSP) |
0x42b833 MOV %RSI,0x28(%RSP) |
0x42b838 MOV %RDX,0x30(%RSP) |
0x42b83d MOV %R8,0x10(%RSP) |
0x42b842 MOV (%RDI),%ESI |
0x42b844 MOVQ $0,0x78(%RSP) |
0x42b84d MOV %RAX,0x70(%RSP) |
0x42b852 MOVQ $0x1,0xa8(%RSP) |
0x42b85e SUB $0x8,%RSP |
0x42b862 LEA 0xb0(%RSP),%RAX |
0x42b86a LEA 0x4c(%RSP),%RCX |
0x42b86f LEA 0x80(%RSP),%R8 |
0x42b877 LEA 0x78(%RSP),%R9 |
0x42b87c MOV $0x683070,%EDI |
0x42b881 MOV %ESI,0x48(%RSP) |
0x42b885 MOV $0x22,%EDX |
0x42b88a PUSH $0x1 |
0x42b88c PUSH $0x1 |
0x42b88e PUSH %RAX |
0x42b88f MOV %R10,%RBX |
0x42b892 MOV %R11,0x28(%RSP) |
0x42b897 CALL 403020 <__kmpc_for_static_init_8@plt> |
0x42b89c ADD $0x20,%RSP |
0x42b8a0 MOV 0x78(%RSP),%RSI |
0x42b8a5 MOV 0x70(%RSP),%RAX |
0x42b8aa MOV %RAX,0x60(%RSP) |
0x42b8af CMP %RAX,%RSI |
0x42b8b2 JA 42be6e |
0x42b8b8 VMOVQ %R13,%XMM0 |
0x42b8bd VMULSD 0x3a82b(%RIP),%XMM0,%XMM3 |
0x42b8c5 SUB 0x8(%RSP),%EBX |
0x42b8c9 MOV (%R12),%RAX |
0x42b8cd MOV %RAX,0x38(%RSP) |
0x42b8d2 MOV 0x10(%R12),%RAX |
0x42b8d7 MOV %RAX,0x68(%RSP) |
0x42b8dc MOV (%R15),%RAX |
0x42b8df MOV %RAX,0x58(%RSP) |
0x42b8e4 MOV 0x10(%R15),%R15 |
0x42b8e8 MOV (%R14),%RAX |
0x42b8eb MOV %RAX,0x50(%RSP) |
0x42b8f0 MOV 0x10(%R14),%R14 |
0x42b8f4 LEA 0x1(%RSI),%RAX |
0x42b8f8 MOV 0x60(%RSP),%RCX |
0x42b8fd LEA 0x1(%RCX),%R10 |
0x42b901 CMP %R10,%RAX |
0x42b904 CMOVG %RAX,%R10 |
0x42b908 MOV 0x18(%RSP),%RAX |
0x42b90d MOV (%RAX),%RCX |
0x42b910 MOV 0x10(%RAX),%RAX |
0x42b914 MOV %RAX,0x18(%RSP) |
0x42b919 MOV 0x10(%RSP),%RAX |
0x42b91e MOV (%RAX),%R9 |
0x42b921 MOV 0x10(%RAX),%RAX |
0x42b925 MOV %RAX,0x10(%RSP) |
0x42b92a MOV 0x20(%RSP),%RAX |
0x42b92f MOV (%RAX),%R11 |
0x42b932 MOV 0x10(%RAX),%RDI |
0x42b936 MOV 0x28(%RSP),%RAX |
0x42b93b MOV (%RAX),%R13 |
0x42b93e MOV 0x10(%RAX),%R12 |
0x42b942 MOV 0x30(%RSP),%RAX |
0x42b947 MOV (%RAX),%RDX |
0x42b94a MOV 0x10(%RAX),%RAX |
0x42b94e SUB %RSI,%R10 |
0x42b951 MOV $-0x8,%R8D |
0x42b957 MOV %R10,0x90(%RSP) |
0x42b95f AND %R10,%R8 |
0x42b962 MOV %R8,%R10 |
0x42b965 MOV 0x58(%RSP),%R8 |
0x42b96a MOV %R9,0x30(%RSP) |
0x42b96f MOV %R11,0x28(%RSP) |
0x42b974 MOV %R13,0x20(%RSP) |
0x42b979 MOV %RDX,0x98(%RSP) |
0x42b981 MOV %RCX,0xa0(%RSP) |
0x42b989 JE 42bfcc |
0x42b98f MOV %RBX,0x88(%RSP) |
0x42b997 VPBROADCASTQ %RBX,%YMM8 |
0x42b99d MOV %RAX,0x48(%RSP) |
0x42b9a2 MOV 0x4(%RSP),%EAX |
0x42b9a6 VPBROADCASTD %EAX,%YMM0 |
0x42b9ac VMOVDQU %YMM0,0xe0(%RSP) |
0x42b9b5 MOV 0x8(%RSP),%RAX |
0x42b9ba VPBROADCASTD %EAX,%YMM0 |
0x42b9c0 VMOVDQU %YMM0,0xc0(%RSP) |
0x42b9c9 MOV 0x38(%RSP),%RAX |
0x42b9ce VPBROADCASTQ %RAX,%YMM15 |
0x42b9d4 VMOVUPD %XMM3,0xb0(%RSP) |
0x42b9dd VBROADCASTSD %XMM3,%YMM16 |
0x42b9e3 VPBROADCASTQ %R8,%YMM17 |
0x42b9e9 MOV 0x50(%RSP),%RAX |
0x42b9ee VPBROADCASTQ %RAX,%YMM18 |
0x42b9f4 VPBROADCASTQ %RCX,%YMM19 |
0x42b9fa VPBROADCASTQ %R9,%YMM20 |
0x42ba00 VPBROADCASTQ %R11,%YMM21 |
0x42ba06 VPBROADCASTQ %R13,%YMM22 |
0x42ba0c MOV %RSI,0x80(%RSP) |
0x42ba14 VPBROADCASTQ %RSI,%YMM0 |
0x42ba1a VPADDQ 0x3a85e(%RIP),%YMM0,%YMM9 |
0x42ba22 VPADDQ 0x3a6d6(%RIP),%YMM0,%YMM10 |
0x42ba2a VPBROADCASTQ %RDX,%YMM23 |
0x42ba30 XOR %R13D,%R13D |
0x42ba33 VPCMPEQD %YMM12,%YMM12,%YMM12 |
0x42ba38 NOPL (%RAX,%RAX,1) |
(178) 0x42ba40 VMOVDQA %YMM10,%YMM0 |
(178) 0x42ba44 VMOVDQA %YMM8,%YMM1 |
(178) 0x42ba48 MOV %R10,%RBX |
(178) 0x42ba4b MOV $0x454690,%RSI |
(178) 0x42ba52 CALL %RSI |
(178) 0x42ba54 VMOVDQA %YMM0,%YMM11 |
(178) 0x42ba58 VMOVDQA %YMM9,%YMM0 |
(178) 0x42ba5c VMOVDQA %YMM8,%YMM1 |
(178) 0x42ba60 CALL %RSI |
(178) 0x42ba62 VPMOVQD %YMM11,%XMM1 |
(178) 0x42ba68 VPMOVQD %YMM0,%XMM0 |
(178) 0x42ba6e VINSERTI128 $0x1,%XMM0,%YMM1,%YMM0 |
(178) 0x42ba74 VPADDD 0xe0(%RSP),%YMM0,%YMM27 |
(178) 0x42ba7c VMOVDQA %YMM10,%YMM0 |
(178) 0x42ba80 VMOVDQA %YMM8,%YMM1 |
(178) 0x42ba84 MOV $0x454460,%RSI |
(178) 0x42ba8b CALL %RSI |
(178) 0x42ba8d VMOVDQA %YMM0,%YMM11 |
(178) 0x42ba91 VMOVDQA %YMM9,%YMM0 |
(178) 0x42ba95 VMOVDQA %YMM8,%YMM1 |
(178) 0x42ba99 CALL %RSI |
(178) 0x42ba9b MOV %RBX,%R10 |
(178) 0x42ba9e MOV 0x10(%RSP),%RCX |
(178) 0x42baa3 MOV 0x18(%RSP),%RAX |
(178) 0x42baa8 VPMOVQD %YMM11,%XMM2 |
(178) 0x42baae VPMOVQD %YMM0,%XMM3 |
(178) 0x42bab4 VPMOVSXDQ %XMM27,%YMM1 |
(178) 0x42baba VEXTRACTI32X4 $0x1,%YMM27,%XMM0 |
(178) 0x42bac1 VPMOVSXDQ %XMM0,%YMM0 |
(178) 0x42bac6 VXORPS %XMM5,%XMM5,%XMM5 |
(178) 0x42baca VPMULLQ %YMM0,%YMM15,%YMM5 |
(178) 0x42bad0 VXORPS %XMM6,%XMM6,%XMM6 |
(178) 0x42bad4 VPMULLQ %YMM1,%YMM15,%YMM6 |
(178) 0x42bada VPMULLQ %YMM0,%YMM17,%YMM26 |
(178) 0x42bae0 VINSERTI128 $0x1,%XMM3,%YMM2,%YMM2 |
(178) 0x42bae6 VPADDD 0xc0(%RSP),%YMM2,%YMM4 |
(178) 0x42baef VXORPS %XMM3,%XMM3,%XMM3 |
(178) 0x42baf3 VPMULLQ %YMM1,%YMM17,%YMM3 |
(178) 0x42baf9 VPMOVSXDQ %XMM4,%YMM2 |
(178) 0x42bafe VPSUBD %YMM12,%YMM27,%YMM27 |
(178) 0x42bb04 VPMOVSXDQ %XMM27,%YMM28 |
(178) 0x42bb0a VXORPS %XMM11,%XMM11,%XMM11 |
(178) 0x42bb0f VPMULLQ %YMM28,%YMM17,%YMM11 |
(178) 0x42bb15 VPADDQ %YMM2,%YMM3,%YMM3 |
(178) 0x42bb19 KXNORW %K0,%K0,%K1 |
(178) 0x42bb1d VXORPD %XMM7,%XMM7,%XMM7 |
(178) 0x42bb21 VPMULLQ %YMM1,%YMM18,%YMM29 |
(178) 0x42bb27 VGATHERQPD (%R15,%YMM3,8),%YMM7{%K1} |
(178) 0x42bb2e VPADDQ %YMM2,%YMM11,%YMM3 |
(178) 0x42bb32 VPADDQ %YMM2,%YMM29,%YMM11 |
(178) 0x42bb38 KXNORW %K0,%K0,%K1 |
(178) 0x42bb3c VPXORD %XMM29,%XMM29,%XMM29 |
(178) 0x42bb42 VGATHERQPD (%R14,%YMM11,8),%YMM29{%K1} |
(178) 0x42bb49 KXNORW %K0,%K0,%K1 |
(178) 0x42bb4d VXORPD %XMM11,%XMM11,%XMM11 |
(178) 0x42bb52 VPMULLQ %YMM28,%YMM18,%YMM28 |
(178) 0x42bb58 VGATHERQPD (%R15,%YMM3,8),%YMM11{%K1} |
(178) 0x42bb5f VEXTRACTI128 $0x1,%YMM4,%XMM3 |
(178) 0x42bb65 VPMOVSXDQ %XMM3,%YMM3 |
(178) 0x42bb6a VPADDQ %YMM2,%YMM28,%YMM28 |
(178) 0x42bb70 KXNORW %K0,%K0,%K1 |
(178) 0x42bb74 VXORPD %XMM30,%XMM30,%XMM30 |
(178) 0x42bb7a VGATHERQPD (%R14,%YMM28,8),%YMM30{%K1} |
(178) 0x42bb81 VEXTRACTI32X4 $0x1,%YMM27,%XMM27 |
(178) 0x42bb88 VPMOVSXDQ %XMM27,%YMM27 |
(178) 0x42bb8e VPXORD %XMM28,%XMM28,%XMM28 |
(178) 0x42bb94 VPMULLQ %YMM27,%YMM17,%YMM28 |
(178) 0x42bb9a VPADDQ %YMM3,%YMM26,%YMM26 |
(178) 0x42bba0 KXNORW %K0,%K0,%K1 |
(178) 0x42bba4 VXORPD %XMM31,%XMM31,%XMM31 |
(178) 0x42bbaa VPMULLQ %YMM0,%YMM18,%YMM24 |
(178) 0x42bbb0 VGATHERQPD (%R15,%YMM26,8),%YMM31{%K1} |
(178) 0x42bbb7 VPADDQ %YMM3,%YMM28,%YMM26 |
(178) 0x42bbbd VPADDQ %YMM3,%YMM24,%YMM24 |
(178) 0x42bbc3 KXNORW %K0,%K0,%K1 |
(178) 0x42bbc7 VPXORD %XMM28,%XMM28,%XMM28 |
(178) 0x42bbcd VGATHERQPD (%R14,%YMM24,8),%YMM28{%K1} |
(178) 0x42bbd4 KXNORW %K0,%K0,%K1 |
(178) 0x42bbd8 VXORPD %XMM24,%XMM24,%XMM24 |
(178) 0x42bbde VPMULLQ %YMM27,%YMM18,%YMM27 |
(178) 0x42bbe4 VGATHERQPD (%R15,%YMM26,8),%YMM24{%K1} |
(178) 0x42bbeb VPADDQ %YMM3,%YMM27,%YMM26 |
(178) 0x42bbf1 KXNORW %K0,%K0,%K1 |
(178) 0x42bbf5 VPXORD %XMM27,%XMM27,%XMM27 |
(178) 0x42bbfb VGATHERQPD (%R14,%YMM26,8),%YMM27{%K1} |
(178) 0x42bc02 VPADDQ %YMM2,%YMM6,%YMM6 |
(178) 0x42bc06 KXNORW %K0,%K0,%K1 |
(178) 0x42bc0a VXORPD %XMM26,%XMM26,%XMM26 |
(178) 0x42bc10 MOV 0x68(%RSP),%RDX |
(178) 0x42bc15 VGATHERQPD (%RDX,%YMM6,8),%YMM26{%K1} |
(178) 0x42bc1c VPADDQ %YMM3,%YMM5,%YMM5 |
(178) 0x42bc20 KXNORW %K0,%K0,%K1 |
(178) 0x42bc24 VXORPD %XMM6,%XMM6,%XMM6 |
(178) 0x42bc28 VGATHERQPD (%RDX,%YMM5,8),%YMM6{%K1} |
(178) 0x42bc2f VPMULLQ %YMM1,%YMM19,%YMM14 |
(178) 0x42bc35 VMULPD %YMM16,%YMM26,%YMM26 |
(178) 0x42bc3b VPMULLQ %YMM0,%YMM19,%YMM13 |
(178) 0x42bc41 VMULPD %YMM16,%YMM6,%YMM25 |
(178) 0x42bc47 VADDPD %YMM29,%YMM7,%YMM6 |
(178) 0x42bc4d VADDPD %YMM28,%YMM31,%YMM7 |
(178) 0x42bc53 VXORPS %XMM5,%XMM5,%XMM5 |
(178) 0x42bc57 VPMULLQ %YMM0,%YMM20,%YMM5 |
(178) 0x42bc5d VADDPD %YMM27,%YMM24,%YMM24 |
(178) 0x42bc63 VADDPD %YMM30,%YMM11,%YMM11 |
(178) 0x42bc69 VADDPD %YMM6,%YMM11,%YMM11 |
(178) 0x42bc6d VXORPS %XMM6,%XMM6,%XMM6 |
(178) 0x42bc71 VPMULLQ %YMM1,%YMM20,%YMM6 |
(178) 0x42bc77 VADDPD %YMM7,%YMM24,%YMM7 |
(178) 0x42bc7d VPADDQ %YMM3,%YMM13,%YMM13 |
(178) 0x42bc81 VPADDQ %YMM2,%YMM14,%YMM14 |
(178) 0x42bc85 VPXORD %XMM24,%XMM24,%XMM24 |
(178) 0x42bc8b VPMULLQ %YMM0,%YMM21,%YMM24 |
(178) 0x42bc91 VMULPD %YMM11,%YMM26,%YMM11 |
(178) 0x42bc97 KXNORW %K0,%K0,%K1 |
(178) 0x42bc9b KXNORW %K0,%K0,%K2 |
(178) 0x42bc9f VPXORD %XMM26,%XMM26,%XMM26 |
(178) 0x42bca5 VPMULLQ %YMM1,%YMM21,%YMM26 |
(178) 0x42bcab VMULPD %YMM7,%YMM25,%YMM7 |
(178) 0x42bcb1 VPADDQ %YMM2,%YMM26,%YMM25 |
(178) 0x42bcb7 VSCATTERQPD %YMM11,(%RAX,%YMM14,8){%K1} |
(178) 0x42bcbe VPADDQ %YMM3,%YMM24,%YMM11 |
(178) 0x42bcc4 VSCATTERQPD %YMM7,(%RAX,%YMM13,8){%K2} |
(178) 0x42bccb KXNORW %K0,%K0,%K1 |
(178) 0x42bccf VXORPD %XMM7,%XMM7,%XMM7 |
(178) 0x42bcd3 KXNORW %K0,%K0,%K2 |
(178) 0x42bcd7 VXORPD %XMM13,%XMM13,%XMM13 |
(178) 0x42bcdc VPSUBD %YMM12,%YMM4,%YMM4 |
(178) 0x42bce1 VGATHERQPD (%RDI,%YMM11,8),%YMM7{%K1} |
(178) 0x42bce8 VEXTRACTI128 $0x1,%YMM4,%XMM11 |
(178) 0x42bcee VPMOVSXDQ %XMM11,%YMM11 |
(178) 0x42bcf3 VPMOVSXDQ %XMM4,%YMM4 |
(178) 0x42bcf8 VPADDQ %YMM4,%YMM26,%YMM14 |
(178) 0x42bcfe VPADDQ %YMM11,%YMM24,%YMM24 |
(178) 0x42bd04 VGATHERQPD (%RDI,%YMM25,8),%YMM13{%K2} |
(178) 0x42bd0b KXNORW %K0,%K0,%K1 |
(178) 0x42bd0f VXORPD %XMM25,%XMM25,%XMM25 |
(178) 0x42bd15 VPXORD %XMM26,%XMM26,%XMM26 |
(178) 0x42bd1b VPMULLQ %YMM1,%YMM22,%YMM26 |
(178) 0x42bd21 VGATHERQPD (%RDI,%YMM24,8),%YMM25{%K1} |
(178) 0x42bd28 KXNORW %K0,%K0,%K1 |
(178) 0x42bd2c VXORPD %XMM24,%XMM24,%XMM24 |
(178) 0x42bd32 VPXORD %XMM27,%XMM27,%XMM27 |
(178) 0x42bd38 VPMULLQ %YMM0,%YMM22,%YMM27 |
(178) 0x42bd3e VGATHERQPD (%RDI,%YMM14,8),%YMM24{%K1} |
(178) 0x42bd45 VPADDQ %YMM2,%YMM26,%YMM14 |
(178) 0x42bd4b KXNORW %K0,%K0,%K1 |
(178) 0x42bd4f VXORPD %XMM28,%XMM28,%XMM28 |
(178) 0x42bd55 VGATHERQPD (%R12,%YMM14,8),%YMM28{%K1} |
(178) 0x42bd5c VPADDQ %YMM3,%YMM27,%YMM14 |
(178) 0x42bd62 KXNORW %K0,%K0,%K1 |
(178) 0x42bd66 VXORPD %XMM29,%XMM29,%XMM29 |
(178) 0x42bd6c VGATHERQPD (%R12,%YMM14,8),%YMM29{%K1} |
(178) 0x42bd73 VPADDQ %YMM11,%YMM27,%YMM11 |
(178) 0x42bd79 KXNORW %K0,%K0,%K1 |
(178) 0x42bd7d VXORPD %XMM14,%XMM14,%XMM14 |
(178) 0x42bd82 VGATHERQPD (%R12,%YMM11,8),%YMM14{%K1} |
(178) 0x42bd89 VPADDQ %YMM4,%YMM26,%YMM4 |
(178) 0x42bd8f KXNORW %K0,%K0,%K1 |
(178) 0x42bd93 VXORPD %XMM11,%XMM11,%XMM11 |
(178) 0x42bd98 VGATHERQPD (%R12,%YMM4,8),%YMM11{%K1} |
(178) 0x42bd9f VPADDQ %YMM3,%YMM5,%YMM4 |
(178) 0x42bda3 KXNORW %K0,%K0,%K1 |
(178) 0x42bda7 VPXOR %XMM5,%XMM5,%XMM5 |
(178) 0x42bdab VGATHERQPD (%RCX,%YMM4,8),%YMM5{%K1} |
(178) 0x42bdb2 VPADDQ %YMM2,%YMM6,%YMM4 |
(178) 0x42bdb6 KXNORW %K0,%K0,%K1 |
(178) 0x42bdba VPXOR %XMM6,%XMM6,%XMM6 |
(178) 0x42bdbe VGATHERQPD (%RCX,%YMM4,8),%YMM6{%K1} |
(178) 0x42bdc5 VMULPD %YMM16,%YMM6,%YMM4 |
(178) 0x42bdcb VMULPD %YMM16,%YMM5,%YMM5 |
(178) 0x42bdd1 VADDPD %YMM7,%YMM25,%YMM6 |
(178) 0x42bdd7 VADDPD %YMM13,%YMM24,%YMM7 |
(178) 0x42bddd VADDPD %YMM14,%YMM29,%YMM13 |
(178) 0x42bde3 VADDPD %YMM6,%YMM13,%YMM6 |
(178) 0x42bde7 VADDPD %YMM11,%YMM28,%YMM11 |
(178) 0x42bded VADDPD %YMM7,%YMM11,%YMM7 |
(178) 0x42bdf1 VPMULLQ %YMM1,%YMM23,%YMM1 |
(178) 0x42bdf7 VMULPD %YMM6,%YMM5,%YMM5 |
(178) 0x42bdfb VMULPD %YMM7,%YMM4,%YMM4 |
(178) 0x42bdff VPMULLQ %YMM0,%YMM23,%YMM0 |
(178) 0x42be05 VPADDQ %YMM2,%YMM1,%YMM1 |
(178) 0x42be09 VPADDQ %YMM3,%YMM0,%YMM0 |
(178) 0x42be0d KXNORW %K0,%K0,%K1 |
(178) 0x42be11 MOV 0x48(%RSP),%RAX |
(178) 0x42be16 VSCATTERQPD %YMM4,(%RAX,%YMM1,8){%K1} |
(178) 0x42be1d KXNORW %K0,%K0,%K1 |
(178) 0x42be21 VSCATTERQPD %YMM5,(%RAX,%YMM0,8){%K1} |
(178) 0x42be28 VPBROADCASTQ 0x3a46f(%RIP),%YMM0 |
(178) 0x42be31 VPADDQ %YMM0,%YMM10,%YMM10 |
(178) 0x42be35 VPADDQ %YMM0,%YMM9,%YMM9 |
(178) 0x42be39 ADD $0x8,%R13 |
(178) 0x42be3d CMP %RBX,%R13 |
(178) 0x42be40 JB 42ba40 |
0x42be46 CMP %R10,0x90(%RSP) |
0x42be4e MOV 0x88(%RSP),%RBX |
0x42be56 MOV 0x48(%RSP),%RAX |
0x42be5b MOV 0x80(%RSP),%RSI |
0x42be63 VMOVUPD 0xb0(%RSP),%XMM3 |
0x42be6c JNE 42be9c |
0x42be6e MOV $0x683090,%EDI |
0x42be73 MOV 0x40(%RSP),%ESI |
0x42be77 LEA -0x28(%RBP),%RSP |
0x42be7b POP %RBX |
0x42be7c POP %R12 |
0x42be7e POP %R13 |
0x42be80 POP %R14 |
0x42be82 POP %R15 |
0x42be84 POP %RBP |
0x42be85 VZEROUPPER |
0x42be88 JMP 402e90 |
0x42be8d LEA -0x28(%RBP),%RSP |
0x42be91 POP %RBX |
0x42be92 POP %R12 |
0x42be94 POP %R13 |
0x42be96 POP %R14 |
0x42be98 POP %R15 |
0x42be9a POP %RBP |
0x42be9b RET |
0x42be9c ADD %R10,%RSI |
0x42be9f JMP 42bfcc |
0x42bea4 NOPW %CS:(%RAX,%RAX,1) |
(177) 0x42beb0 MOV %RSI,%RAX |
(177) 0x42beb3 CQTO |
(177) 0x42beb5 IDIV %RBX |
(177) 0x42beb8 MOV 0x8(%RSP),%RAX |
(177) 0x42bebd MOV 0x38(%RSP),%R8 |
(177) 0x42bec2 ADD 0x4(%RSP),%ECX |
(177) 0x42bec6 ADD %EAX,%EDX |
(177) 0x42bec8 MOVSXD %EDX,%RDX |
(177) 0x42becb MOVSXD %ECX,%RAX |
(177) 0x42bece MOV %R8,%RCX |
(177) 0x42bed1 IMUL %RAX,%RCX |
(177) 0x42bed5 ADD %RDX,%RCX |
(177) 0x42bed8 MOV 0x58(%RSP),%R11 |
(177) 0x42bedd MOV %R11,%R8 |
(177) 0x42bee0 IMUL %RAX,%R8 |
(177) 0x42bee4 ADD %RDX,%R8 |
(177) 0x42bee7 LEA 0x1(%RAX),%R9D |
(177) 0x42beeb MOVSXD %R9D,%R9 |
(177) 0x42beee VMOVSD (%R15,%R8,8),%XMM0 |
(177) 0x42bef4 MOV 0x50(%RSP),%R13 |
(177) 0x42bef9 MOV %R13,%R8 |
(177) 0x42befc IMUL %RAX,%R8 |
(177) 0x42bf00 ADD %RDX,%R8 |
(177) 0x42bf03 VMOVSD (%R14,%R8,8),%XMM1 |
(177) 0x42bf09 IMUL %R9,%R11 |
(177) 0x42bf0d ADD %RDX,%R11 |
(177) 0x42bf10 IMUL %R13,%R9 |
(177) 0x42bf14 ADD %RDX,%R9 |
(177) 0x42bf17 VADDSD (%R15,%R11,8),%XMM0,%XMM0 |
(177) 0x42bf1d VADDSD (%R14,%R9,8),%XMM1,%XMM1 |
(177) 0x42bf23 MOV 0x68(%RSP),%R8 |
(177) 0x42bf28 VMULSD (%R8,%RCX,8),%XMM3,%XMM2 |
(177) 0x42bf2e VADDSD %XMM0,%XMM1,%XMM0 |
(177) 0x42bf32 VMULSD %XMM2,%XMM0,%XMM0 |
(177) 0x42bf36 MOV 0xa0(%RSP),%RCX |
(177) 0x42bf3e IMUL %RAX,%RCX |
(177) 0x42bf42 ADD %RDX,%RCX |
(177) 0x42bf45 MOV 0x18(%RSP),%R8 |
(177) 0x42bf4a VMOVSD %XMM0,(%R8,%RCX,8) |
(177) 0x42bf50 MOV 0x28(%RSP),%RCX |
(177) 0x42bf55 IMUL %RAX,%RCX |
(177) 0x42bf59 LEA 0x1(%RCX,%RDX,1),%R8 |
(177) 0x42bf5e ADD %RDX,%RCX |
(177) 0x42bf61 VMOVSD (%RDI,%RCX,8),%XMM0 |
(177) 0x42bf66 MOV 0x20(%RSP),%RCX |
(177) 0x42bf6b IMUL %RAX,%RCX |
(177) 0x42bf6f LEA (%RCX,%RDX,1),%R9 |
(177) 0x42bf73 VMOVSD (%R12,%R9,8),%XMM1 |
(177) 0x42bf79 VADDSD (%RDI,%R8,8),%XMM0,%XMM0 |
(177) 0x42bf7f LEA 0x1(%RCX,%RDX,1),%RCX |
(177) 0x42bf84 VADDSD (%R12,%RCX,8),%XMM1,%XMM1 |
(177) 0x42bf8a MOV 0x30(%RSP),%RCX |
(177) 0x42bf8f IMUL %RAX,%RCX |
(177) 0x42bf93 ADD %RDX,%RCX |
(177) 0x42bf96 MOV 0x10(%RSP),%R8 |
(177) 0x42bf9b VMULSD (%R8,%RCX,8),%XMM3,%XMM2 |
(177) 0x42bfa1 IMUL 0x98(%RSP),%RAX |
(177) 0x42bfaa ADD %RDX,%RAX |
(177) 0x42bfad VADDSD %XMM0,%XMM1,%XMM0 |
(177) 0x42bfb1 VMULSD %XMM2,%XMM0,%XMM0 |
(177) 0x42bfb5 VMOVSD %XMM0,(%R10,%RAX,8) |
(177) 0x42bfbb MOV %R10,%RAX |
(177) 0x42bfbe INC %RSI |
(177) 0x42bfc1 CMP 0x60(%RSP),%RSI |
(177) 0x42bfc6 JG 42be6e |
(177) 0x42bfcc MOV %RAX,%R10 |
(177) 0x42bfcf MOV %RSI,%R8 |
(177) 0x42bfd2 SHR $0x20,%R8 |
(177) 0x42bfd6 JE 42bff0 |
(177) 0x42bfd8 MOV %RSI,%RAX |
(177) 0x42bfdb XOR %EDX,%EDX |
(177) 0x42bfdd DIV %RBX |
(177) 0x42bfe0 MOV %RAX,%RCX |
(177) 0x42bfe3 TEST %R8,%R8 |
(177) 0x42bfe6 JNE 42beb0 |
(177) 0x42bfec JMP 42c001 |
0x42bfee XCHG %AX,%AX |
(177) 0x42bff0 MOV %ESI,%EAX |
(177) 0x42bff2 XOR %EDX,%EDX |
(177) 0x42bff4 DIV %EBX |
(177) 0x42bff6 MOV %EAX,%ECX |
(177) 0x42bff8 TEST %R8,%R8 |
(177) 0x42bffb JNE 42beb0 |
(177) 0x42c001 MOV %ESI,%EAX |
(177) 0x42c003 XOR %EDX,%EDX |
(177) 0x42c005 DIV %EBX |
(177) 0x42c007 JMP 42beb8 |
0x42c00c NOPL (%RAX) |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►100.00+ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Path / |
Source file and lines | flux_calc.cpp:36-41 |
Module | exec |
nb instructions | 159 |
nb uops | 161 |
loop length | 736 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 14 |
used zmm registers | 0 |
nb stack references | 37 |
micro-operation queue | 26.83 cycles |
front end | 26.83 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 6.07 | 5.93 | 20.67 | 20.67 | 20.50 | 14.00 | 6.00 | 20.50 | 20.50 | 20.50 | 6.00 | 20.67 |
cycles | 6.07 | 5.93 | 20.67 | 20.67 | 20.50 | 14.00 | 6.00 | 20.50 | 20.50 | 20.50 | 6.00 | 20.67 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 26.65 |
Stall cycles | 0.00 |
Front-end | 26.83 |
Dispatch | 20.67 |
Overall L1 | 26.83 |
all | 8% |
load | 14% |
store | 6% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 66% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 8% |
all | 50% |
load | 50% |
store | 100% |
mul | 0% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 11% |
load | 18% |
store | 9% |
mul | 0% |
add-sub | 66% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 7% |
all | 14% |
load | 17% |
store | 13% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 35% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 13% |
all | 18% |
load | 18% |
store | 25% |
mul | 12% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 14% |
load | 17% |
store | 14% |
mul | 12% |
add-sub | 35% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 13% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x120,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x40(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x28(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RBP),%ECX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %ECX,0x4(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVL $0,0x44(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 42be8d <_Z16flux_calc_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_.extracted+0x6bd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RBX,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVQ $0x1,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0xb0(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x4c(%RSP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x80(%RSP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x78(%RSP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x683070,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x22,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %R10,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R11,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 403020 <__kmpc_for_static_init_8@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x20,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x78(%RSP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x70(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JA 42be6e <_Z16flux_calc_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_.extracted+0x69e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ %R13,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VMULSD 0x3a82b(%RIP),%XMM0,%XMM3 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
SUB 0x8(%RSP),%EBX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV (%R12),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R12),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R15),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R14),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R14),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%RSI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x60(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%RCX),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R10,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %RAX,%R10 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV 0x18(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x28(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %RSI,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $-0x8,%R8D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R10,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
AND %R10,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %R8,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x58(%RSP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 42bfcc <_Z16flux_calc_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_.extracted+0x7fc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RBX,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ %RBX,%YMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x4(%RSP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTD %EAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV 0x8(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTD %EAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV 0x38(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %RAX,%YMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %XMM3,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM3,%YMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %R8,%YMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0x50(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %RAX,%YMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %RCX,%YMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %R9,%YMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %R11,%YMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %R13,%YMM22 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RSI,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ %RSI,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ 0x3a85e(%RIP),%YMM0,%YMM9 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.40 |
VPADDQ 0x3a6d6(%RIP),%YMM0,%YMM10 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.40 |
VPBROADCASTQ %RDX,%YMM23 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
XOR %R13D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPCMPEQD %YMM12,%YMM12,%YMM12 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R10,0x90(%RSP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV 0x88(%RSP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x80(%RSP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPD 0xb0(%RSP),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
JNE 42be9c <_Z16flux_calc_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_.extracted+0x6cc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x683090,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x40(%RSP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JMP 402e90 <__kmpc_for_static_fini@plt> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
ADD %R10,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JMP 42bfcc <_Z16flux_calc_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_.extracted+0x7fc> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | flux_calc.cpp:36-41 |
Module | exec |
nb instructions | 159 |
nb uops | 161 |
loop length | 736 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 14 |
used zmm registers | 0 |
nb stack references | 37 |
micro-operation queue | 26.83 cycles |
front end | 26.83 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 6.07 | 5.93 | 20.67 | 20.67 | 20.50 | 14.00 | 6.00 | 20.50 | 20.50 | 20.50 | 6.00 | 20.67 |
cycles | 6.07 | 5.93 | 20.67 | 20.67 | 20.50 | 14.00 | 6.00 | 20.50 | 20.50 | 20.50 | 6.00 | 20.67 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 26.65 |
Stall cycles | 0.00 |
Front-end | 26.83 |
Dispatch | 20.67 |
Overall L1 | 26.83 |
all | 8% |
load | 14% |
store | 6% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 66% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 8% |
all | 50% |
load | 50% |
store | 100% |
mul | 0% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 11% |
load | 18% |
store | 9% |
mul | 0% |
add-sub | 66% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 7% |
all | 14% |
load | 17% |
store | 13% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 35% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 13% |
all | 18% |
load | 18% |
store | 25% |
mul | 12% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 14% |
load | 17% |
store | 14% |
mul | 12% |
add-sub | 35% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 13% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x120,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x40(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x28(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RBP),%ECX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %ECX,0x4(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVL $0,0x44(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 42be8d <_Z16flux_calc_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_.extracted+0x6bd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RBX,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVQ $0x1,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0xb0(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x4c(%RSP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x80(%RSP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x78(%RSP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x683070,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x22,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %R10,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R11,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 403020 <__kmpc_for_static_init_8@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x20,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x78(%RSP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x70(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JA 42be6e <_Z16flux_calc_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_.extracted+0x69e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ %R13,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VMULSD 0x3a82b(%RIP),%XMM0,%XMM3 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
SUB 0x8(%RSP),%EBX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV (%R12),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R12),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R15),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R14),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R14),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%RSI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x60(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%RCX),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R10,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %RAX,%R10 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV 0x18(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x28(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %RSI,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $-0x8,%R8D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R10,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
AND %R10,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %R8,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x58(%RSP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 42bfcc <_Z16flux_calc_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_.extracted+0x7fc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RBX,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ %RBX,%YMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x4(%RSP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTD %EAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV 0x8(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTD %EAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV 0x38(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %RAX,%YMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %XMM3,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM3,%YMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %R8,%YMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0x50(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %RAX,%YMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %RCX,%YMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %R9,%YMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %R11,%YMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %R13,%YMM22 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RSI,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ %RSI,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ 0x3a85e(%RIP),%YMM0,%YMM9 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.40 |
VPADDQ 0x3a6d6(%RIP),%YMM0,%YMM10 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.40 |
VPBROADCASTQ %RDX,%YMM23 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
XOR %R13D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPCMPEQD %YMM12,%YMM12,%YMM12 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R10,0x90(%RSP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV 0x88(%RSP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x80(%RSP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPD 0xb0(%RSP),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
JNE 42be9c <_Z16flux_calc_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_.extracted+0x6cc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x683090,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x40(%RSP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JMP 402e90 <__kmpc_for_static_fini@plt> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
ADD %R10,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JMP 42bfcc <_Z16flux_calc_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_.extracted+0x7fc> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼flux_calc_kernel(int, int, int, int, double, clover::Buffer2D | 0.88 | 1.07 |
○Loop 178 - flux_calc.cpp:37-41 - exec | 0.88 | 1.07 |
○Loop 177 - flux_calc.cpp:37-41 - exec | 0 | 0 |