Function: .omp_outlined..10#0x239680 | Module: exec | Source: advec_mom.cpp:95-100 [...] | Coverage: 2.98% |
---|
Function: .omp_outlined..10#0x239680 | Module: exec | Source: advec_mom.cpp:95-100 [...] | Coverage: 2.98% |
---|
/beegfs/hackathon/users/eoseret/qaas_runs/170-854-8685/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/advec_mom.cpp: 95 - 100 |
-------------------------------------------------------------------------------- |
95: #pragma omp parallel for simd collapse(2) |
96: for (int j = (y_min + 1); j < (y_max + 1 + 2); j++) { |
97: for (int i = (x_min - 1 + 1); i < (x_max + 2 + 2); i++) { |
98: node_mass_post(i, j) = 0.25 * (density1(i + 0, j - 1) * post_vol(i + 0, j - 1) + density1(i, j) * post_vol(i, j) + |
99: density1(i - 1, j - 1) * post_vol(i - 1, j - 1) + density1(i - 1, j + 0) * post_vol(i - 1, j + 0)); |
100: node_mass_pre(i, j) = node_mass_post(i, j) - node_flux(i - 1, j + 0) + node_flux(i, j); |
/beegfs/hackathon/users/eoseret/qaas_runs/170-854-8685/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/context.h: 69 - 69 |
-------------------------------------------------------------------------------- |
69: T &operator()(size_t i, size_t j) const { return data[i + j * sizeX]; } |
0x239680 PUSH %RBP |
0x239681 MOV %RSP,%RBP |
0x239684 PUSH %R15 |
0x239686 PUSH %R14 |
0x239688 PUSH %R13 |
0x23968a PUSH %R12 |
0x23968c PUSH %RBX |
0x23968d SUB $0x78,%RSP |
0x239691 MOV (%RCX),%R15D |
0x239694 MOV (%RDX),%EBX |
0x239696 LEA 0x1(%RBX),%R13D |
0x23969a ADD $0x3,%R15D |
0x23969e SUB %R13D,%R15D |
0x2396a1 JLE 239dfe |
0x2396a7 MOV (%R9),%R12D |
0x2396aa MOV (%R8),%R14D |
0x2396ad ADD $0x4,%R12D |
0x2396b1 CMP %R14D,%R12D |
0x2396b4 JLE 239dfe |
0x2396ba SUB %R14D,%R12D |
0x2396bd MOV (%RDI),%ESI |
0x2396bf MOVQ $0,-0x78(%RBP) |
0x2396c7 MOVQ $0x1,-0xa0(%RBP) |
0x2396d2 MOVL $0,-0x48(%RBP) |
0x2396d9 IMUL %R12,%R15 |
0x2396dd DEC %R15 |
0x2396e0 MOV %R15,-0x40(%RBP) |
0x2396e4 SUB $0x8,%RSP |
0x2396e8 LEA -0x48(%RBP),%RCX |
0x2396ec LEA -0xa0(%RBP),%RAX |
0x2396f3 LEA 0x27676(%RIP),%RDI |
0x2396fa LEA -0x78(%RBP),%R8 |
0x2396fe LEA -0x40(%RBP),%R9 |
0x239702 MOV %ESI,-0x44(%RBP) |
0x239705 MOV $0x22,%EDX |
0x23970a PUSH $0x1 |
0x23970c PUSH $0x1 |
0x23970e PUSH %RAX |
0x23970f CALL 25f740 <@plt_start@+0x530> |
0x239714 ADD $0x20,%RSP |
0x239718 MOV -0x40(%RBP),%RAX |
0x23971c MOV -0x78(%RBP),%RCX |
0x239720 CMP %R15,%RAX |
0x239723 CMOVL %RAX,%R15 |
0x239727 MOV %R15,-0x40(%RBP) |
0x23972b CMP %R15,%RCX |
0x23972e JG 239dec |
0x239734 MOV 0x20(%RBP),%RSI |
0x239738 MOV 0x10(%RBP),%R11 |
0x23973c MOV 0x30(%RBP),%RAX |
0x239740 MOV 0x28(%RBP),%RDX |
0x239744 MOV %R14D,-0x2c(%RBP) |
0x239748 MOV 0x18(%RBP),%R8 |
0x23974c MOV %R12,-0x58(%RBP) |
0x239750 MOV %RBX,-0x68(%RBP) |
0x239754 MOV %R13,-0x60(%RBP) |
0x239758 MOV (%RSI),%R9 |
0x23975b MOV 0x10(%RSI),%R10 |
0x23975f MOV (%R11),%RSI |
0x239762 MOV 0x10(%R11),%R11 |
0x239766 MOV 0x10(%RAX),%R14 |
0x23976a MOV (%R8),%RDI |
0x23976d MOV 0x10(%R8),%R8 |
0x239771 MOV %R11,-0x70(%RBP) |
0x239775 MOV (%RAX),%R11 |
0x239778 MOV (%RDX),%RAX |
0x23977b MOV %RDI,-0x90(%RBP) |
0x239782 MOV %RAX,-0x50(%RBP) |
0x239786 MOV 0x10(%RDX),%RAX |
0x23978a MOV %R11,-0x98(%RBP) |
0x239791 MOV %RAX,-0x38(%RBP) |
0x239795 MOV %R15,%RAX |
0x239798 SUB %RCX,%RAX |
0x23979b INC %RAX |
0x23979e CMP $0x4,%RAX |
0x2397a2 JAE 2397af |
0x2397a4 MOV %R9,%R12 |
0x2397a7 MOV %RSI,%R11 |
0x2397aa JMP 239ceb |
0x2397af VBROADCASTSD -0x27fa0(%RIP),%YMM12 |
0x2397b8 VPBROADCASTQ %RCX,%YMM0 |
0x2397be VPADDQ -0x27dc6(%RIP),%YMM0,%YMM0 |
0x2397c6 VPBROADCASTQ -0x2800f(%RIP),%YMM13 |
0x2397cf MOV -0x58(%RBP),%R12 |
0x2397d3 VPBROADCASTD %R13D,%XMM2 |
0x2397d9 MOV -0x2c(%RBP),%R13D |
0x2397dd MOV %RSI,-0x88(%RBP) |
0x2397e4 VPBROADCASTQ %RSI,%YMM7 |
0x2397ea MOV -0x50(%RBP),%RSI |
0x2397ee MOV %RAX,%RDX |
0x2397f1 AND $-0x4,%RDX |
0x2397f5 VPBROADCASTQ %R11,%YMM8 |
0x2397fb VPBROADCASTD %EBX,%XMM4 |
0x239801 VPBROADCASTQ %RDI,%YMM5 |
0x239807 VPBROADCASTQ %R9,%YMM6 |
0x23980d VPCMPEQD %XMM11,%XMM11,%XMM11 |
0x239812 MOV %RAX,-0x80(%RBP) |
0x239816 ADD %RDX,%RCX |
0x239819 MOV %RDX,%R11 |
0x23981c VPBROADCASTQ %R12,%YMM1 |
0x239822 VPBROADCASTD %R13D,%XMM3 |
0x239828 VPBROADCASTQ %RSI,%YMM9 |
0x23982e MOV %R9,%R12 |
0x239831 MOV %RDX,%R13 |
0x239834 VEXTRACTI128 $0x1,%YMM1,%XMM10 |
0x23983a NOPW (%RAX,%RAX,1) |
(274) 0x239840 VEXTRACTI128 $0x1,%YMM0,%XMM14 |
(274) 0x239846 VPEXTRQ $0x1,%XMM10,%RSI |
(274) 0x23984c VMOVQ %XMM10,%RDI |
(274) 0x239851 VPEXTRQ $0x1,%XMM14,%RAX |
(274) 0x239857 CQTO |
(274) 0x239859 IDIV %RSI |
(274) 0x23985c MOV %RAX,%RSI |
(274) 0x23985f VMOVQ %XMM14,%RAX |
(274) 0x239864 VMOVQ %RSI,%XMM14 |
(274) 0x239869 VPEXTRQ $0x1,%XMM1,%RSI |
(274) 0x23986f CQTO |
(274) 0x239871 IDIV %RDI |
(274) 0x239874 VPEXTRQ $0x1,%XMM0,%RDX |
(274) 0x23987a VMOVQ %XMM1,%RDI |
(274) 0x23987f VMOVQ %RAX,%XMM15 |
(274) 0x239884 MOV %RDX,%RAX |
(274) 0x239887 CQTO |
(274) 0x239889 IDIV %RSI |
(274) 0x23988c VPUNPCKLQDQ %XMM14,%XMM15,%XMM14 |
(274) 0x239891 MOV %RAX,%RSI |
(274) 0x239894 VMOVQ %XMM0,%RAX |
(274) 0x239899 VMOVQ %RSI,%XMM15 |
(274) 0x23989e CQTO |
(274) 0x2398a0 IDIV %RDI |
(274) 0x2398a3 ADD $-0x4,%R13 |
(274) 0x2398a7 VMOVQ %RAX,%XMM16 |
(274) 0x2398ad VPUNPCKLQDQ %XMM15,%XMM16,%XMM15 |
(274) 0x2398b3 VINSERTI128 $0x1,%XMM14,%YMM15,%YMM14 |
(274) 0x2398b9 VPMOVQD %YMM14,%XMM15 |
(274) 0x2398bf VPMULLQ %YMM1,%YMM14,%YMM14 |
(274) 0x2398c5 VPSUBQ %YMM14,%YMM0,%YMM14 |
(274) 0x2398ca VPADDQ %YMM0,%YMM13,%YMM0 |
(274) 0x2398ce VPMOVQD %YMM14,%XMM14 |
(274) 0x2398d4 VPADDD %XMM15,%XMM2,%XMM16 |
(274) 0x2398da VPADDD %XMM14,%XMM3,%XMM17 |
(274) 0x2398e0 VPADDD %XMM4,%XMM15,%XMM14 |
(274) 0x2398e4 VPMOVSXDQ %XMM14,%YMM15 |
(274) 0x2398e9 VPMOVSXDQ %XMM17,%YMM14 |
(274) 0x2398ef VPMULLQ %YMM15,%YMM5,%YMM18 |
(274) 0x2398f5 VPMULLQ %YMM15,%YMM6,%YMM20 |
(274) 0x2398fb VPADDQ %YMM14,%YMM18,%YMM19 |
(274) 0x239901 VPADDQ %YMM14,%YMM20,%YMM15 |
(274) 0x239907 VMOVQ %XMM19,%RDX |
(274) 0x23990d VPEXTRQ $0x1,%XMM19,%RSI |
(274) 0x239914 VEXTRACTI32X4 $0x1,%YMM19,%XMM19 |
(274) 0x23991b VPEXTRQ $0x1,%XMM15,%R9 |
(274) 0x239921 VMOVQ %XMM19,%RDI |
(274) 0x239927 VPEXTRQ $0x1,%XMM19,%RAX |
(274) 0x23992e VMOVSD (%R8,%RDX,8),%XMM19 |
(274) 0x239935 VMOVSD (%R8,%RDI,8),%XMM21 |
(274) 0x23993c VMOVQ %XMM15,%RDI |
(274) 0x239941 VEXTRACTI128 $0x1,%YMM15,%XMM15 |
(274) 0x239947 VMOVHPD (%R8,%RSI,8),%XMM19,%XMM19 |
(274) 0x23994e VMOVQ %XMM15,%RBX |
(274) 0x239953 VPEXTRQ $0x1,%XMM15,%RDX |
(274) 0x239959 VPMOVSXDQ %XMM16,%YMM15 |
(274) 0x23995f VMOVSD (%R10,%RDI,8),%XMM22 |
(274) 0x239966 VMOVHPD (%R8,%RAX,8),%XMM21,%XMM21 |
(274) 0x23996d VMOVHPD (%R10,%R9,8),%XMM22,%XMM22 |
(274) 0x239974 VMOVSD (%R10,%RBX,8),%XMM24 |
(274) 0x23997b VPMULLQ %YMM15,%YMM5,%YMM23 |
(274) 0x239981 VPMULLQ %YMM15,%YMM6,%YMM27 |
(274) 0x239987 VPADDQ %YMM14,%YMM23,%YMM16 |
(274) 0x23998d VMOVQ %XMM16,%RSI |
(274) 0x239993 VPEXTRQ $0x1,%XMM16,%RDI |
(274) 0x23999a VEXTRACTI32X4 $0x1,%YMM16,%XMM16 |
(274) 0x2399a1 VMOVQ %XMM16,%R9 |
(274) 0x2399a7 VMOVSD (%R8,%R9,8),%XMM25 |
(274) 0x2399ae VPEXTRQ $0x1,%XMM16,%R9 |
(274) 0x2399b5 VMOVSD (%R8,%RSI,8),%XMM16 |
(274) 0x2399bc VINSERTF32X4 $0x1,%XMM21,%YMM19,%YMM19 |
(274) 0x2399c3 VMOVHPD (%R8,%RDI,8),%XMM16,%XMM26 |
(274) 0x2399ca VPADDQ %YMM14,%YMM27,%YMM16 |
(274) 0x2399d0 VMOVHPD (%R8,%R9,8),%XMM25,%XMM25 |
(274) 0x2399d7 MOV -0x70(%RBP),%R9 |
(274) 0x2399db VMOVQ %XMM16,%RSI |
(274) 0x2399e1 VPEXTRQ $0x1,%XMM16,%RDI |
(274) 0x2399e8 VEXTRACTI32X4 $0x1,%YMM16,%XMM16 |
(274) 0x2399ef VMOVQ %XMM16,%RAX |
(274) 0x2399f5 VMOVSD (%R10,%RAX,8),%XMM28 |
(274) 0x2399fc VPEXTRQ $0x1,%XMM16,%RAX |
(274) 0x239a03 VMOVSD (%R10,%RSI,8),%XMM16 |
(274) 0x239a0a VMOVHPD (%R10,%RDI,8),%XMM16,%XMM29 |
(274) 0x239a11 VPADDD %XMM11,%XMM17,%XMM16 |
(274) 0x239a17 VMOVHPD (%R10,%RDX,8),%XMM24,%XMM17 |
(274) 0x239a1e VMOVHPD (%R10,%RAX,8),%XMM28,%XMM28 |
(274) 0x239a25 VPMOVSXDQ %XMM16,%YMM16 |
(274) 0x239a2b VPADDQ %YMM16,%YMM18,%YMM18 |
(274) 0x239a31 VPADDQ %YMM16,%YMM20,%YMM20 |
(274) 0x239a37 VPADDQ %YMM16,%YMM23,%YMM23 |
(274) 0x239a3d VMOVQ %XMM18,%RAX |
(274) 0x239a43 VPEXTRQ $0x1,%XMM18,%RDX |
(274) 0x239a4a VEXTRACTI32X4 $0x1,%YMM18,%XMM18 |
(274) 0x239a51 VMOVSD (%R8,%RAX,8),%XMM21 |
(274) 0x239a58 VMOVQ %XMM18,%RSI |
(274) 0x239a5e VPEXTRQ $0x1,%XMM18,%RDI |
(274) 0x239a65 VPEXTRQ $0x1,%XMM20,%RAX |
(274) 0x239a6c VMOVSD (%R8,%RSI,8),%XMM18 |
(274) 0x239a73 VMOVHPD (%R8,%RDX,8),%XMM21,%XMM21 |
(274) 0x239a7a VMOVQ %XMM20,%RDX |
(274) 0x239a80 VEXTRACTI32X4 $0x1,%YMM20,%XMM20 |
(274) 0x239a87 VMOVHPD (%R8,%RDI,8),%XMM18,%XMM18 |
(274) 0x239a8e VMOVQ %XMM20,%RSI |
(274) 0x239a94 VPEXTRQ $0x1,%XMM20,%RDI |
(274) 0x239a9b VMOVSD (%R10,%RSI,8),%XMM24 |
(274) 0x239aa2 VINSERTF32X4 $0x1,%XMM17,%YMM22,%YMM17 |
(274) 0x239aa9 VINSERTF32X4 $0x1,%XMM25,%YMM26,%YMM22 |
(274) 0x239ab0 VMOVSD (%R10,%RDX,8),%XMM25 |
(274) 0x239ab7 VINSERTF32X4 $0x1,%XMM28,%YMM29,%YMM20 |
(274) 0x239abe VPEXTRQ $0x1,%XMM23,%RDX |
(274) 0x239ac5 VMOVHPD (%R10,%RAX,8),%XMM25,%XMM25 |
(274) 0x239acc VMOVHPD (%R10,%RDI,8),%XMM24,%XMM24 |
(274) 0x239ad3 VMOVQ %XMM23,%RAX |
(274) 0x239ad9 VMULPD %YMM20,%YMM22,%YMM20 |
(274) 0x239adf VFMADD231PD %YMM17,%YMM19,%YMM20 |
(274) 0x239ae5 VPMULLQ %YMM15,%YMM8,%YMM19 |
(274) 0x239aeb VINSERTF32X4 $0x1,%XMM18,%YMM21,%YMM18 |
(274) 0x239af2 VEXTRACTI32X4 $0x1,%YMM23,%XMM21 |
(274) 0x239af9 VMOVQ %XMM21,%RSI |
(274) 0x239aff VPEXTRQ $0x1,%XMM21,%RDI |
(274) 0x239b06 VINSERTF32X4 $0x1,%XMM24,%YMM25,%YMM23 |
(274) 0x239b0d VMOVSD (%R8,%RSI,8),%XMM21 |
(274) 0x239b14 VMOVSD (%R8,%RAX,8),%XMM25 |
(274) 0x239b1b VMOVHPD (%R8,%RDI,8),%XMM21,%XMM21 |
(274) 0x239b22 VMOVHPD (%R8,%RDX,8),%XMM25,%XMM22 |
(274) 0x239b29 VFMADD213PD %YMM20,%YMM18,%YMM23 |
(274) 0x239b2f VINSERTF32X4 $0x1,%XMM21,%YMM22,%YMM21 |
(274) 0x239b36 VPADDQ %YMM16,%YMM27,%YMM22 |
(274) 0x239b3c VPADDQ %YMM16,%YMM19,%YMM16 |
(274) 0x239b42 VPADDQ %YMM14,%YMM19,%YMM19 |
(274) 0x239b48 VEXTRACTI32X4 $0x1,%YMM22,%XMM17 |
(274) 0x239b4f VMOVQ %XMM22,%RDX |
(274) 0x239b55 VPEXTRQ $0x1,%XMM22,%RAX |
(274) 0x239b5c VMOVQ %XMM17,%RSI |
(274) 0x239b62 VMOVSD (%R10,%RDX,8),%XMM18 |
(274) 0x239b69 VPEXTRQ $0x1,%XMM17,%RDI |
(274) 0x239b70 VMOVSD (%R10,%RSI,8),%XMM17 |
(274) 0x239b77 VMOVHPD (%R10,%RAX,8),%XMM18,%XMM18 |
(274) 0x239b7e VMOVHPD (%R10,%RDI,8),%XMM17,%XMM17 |
(274) 0x239b85 VINSERTF32X4 $0x1,%XMM17,%YMM18,%YMM17 |
(274) 0x239b8c VPMULLQ %YMM15,%YMM7,%YMM18 |
(274) 0x239b92 VPMULLQ %YMM15,%YMM9,%YMM15 |
(274) 0x239b98 VFMADD213PD %YMM23,%YMM21,%YMM17 |
(274) 0x239b9e VPADDQ %YMM14,%YMM18,%YMM18 |
(274) 0x239ba4 VPADDQ %YMM14,%YMM15,%YMM14 |
(274) 0x239ba9 VMOVQ %XMM18,%RAX |
(274) 0x239baf VPEXTRQ $0x1,%XMM18,%RDX |
(274) 0x239bb6 VEXTRACTI32X4 $0x1,%YMM18,%XMM18 |
(274) 0x239bbd VMOVQ %XMM18,%RSI |
(274) 0x239bc3 VPEXTRQ $0x1,%XMM18,%RDI |
(274) 0x239bca VMULPD %YMM12,%YMM17,%YMM17 |
(274) 0x239bd0 VEXTRACTF32X4 $0x1,%YMM17,%XMM18 |
(274) 0x239bd7 VMOVLPD %XMM17,(%R9,%RAX,8) |
(274) 0x239bde VMOVHPD %XMM17,(%R9,%RDX,8) |
(274) 0x239be5 VMOVQ %XMM16,%RAX |
(274) 0x239beb VPEXTRQ $0x1,%XMM16,%RDX |
(274) 0x239bf2 VEXTRACTI32X4 $0x1,%YMM16,%XMM16 |
(274) 0x239bf9 VMOVLPD %XMM18,(%R9,%RSI,8) |
(274) 0x239c00 VMOVHPD %XMM18,(%R9,%RDI,8) |
(274) 0x239c07 VMOVQ %XMM16,%RSI |
(274) 0x239c0d VPEXTRQ $0x1,%XMM16,%RDI |
(274) 0x239c14 MOV -0x38(%RBP),%R9 |
(274) 0x239c18 VMOVSD (%R14,%RAX,8),%XMM18 |
(274) 0x239c1f VMOVSD (%R14,%RSI,8),%XMM16 |
(274) 0x239c26 VMOVQ %XMM19,%RAX |
(274) 0x239c2c VMOVHPD (%R14,%RDX,8),%XMM18,%XMM18 |
(274) 0x239c33 VMOVHPD (%R14,%RDI,8),%XMM16,%XMM16 |
(274) 0x239c3a VPEXTRQ $0x1,%XMM19,%RDX |
(274) 0x239c41 VEXTRACTI32X4 $0x1,%YMM19,%XMM19 |
(274) 0x239c48 VMOVQ %XMM19,%RDI |
(274) 0x239c4e VPEXTRQ $0x1,%XMM19,%RSI |
(274) 0x239c55 VMOVSD (%R14,%RAX,8),%XMM19 |
(274) 0x239c5c VPEXTRQ $0x1,%XMM14,%RAX |
(274) 0x239c62 VMOVHPD (%R14,%RDX,8),%XMM19,%XMM19 |
(274) 0x239c69 VMOVQ %XMM14,%RDX |
(274) 0x239c6e VEXTRACTI128 $0x1,%YMM14,%XMM14 |
(274) 0x239c74 VINSERTF32X4 $0x1,%XMM16,%YMM18,%YMM16 |
(274) 0x239c7b VMOVSD (%R14,%RDI,8),%XMM18 |
(274) 0x239c82 VPEXTRQ $0x1,%XMM14,%RDI |
(274) 0x239c88 VMOVHPD (%R14,%RSI,8),%XMM18,%XMM18 |
(274) 0x239c8f VMOVQ %XMM14,%RSI |
(274) 0x239c94 VSUBPD %YMM16,%YMM17,%YMM16 |
(274) 0x239c9a VINSERTF32X4 $0x1,%XMM18,%YMM19,%YMM17 |
(274) 0x239ca1 VADDPD %YMM17,%YMM16,%YMM16 |
(274) 0x239ca7 VMOVLPD %XMM16,(%R9,%RDX,8) |
(274) 0x239cae MOV -0x38(%RBP),%R9 |
(274) 0x239cb2 VEXTRACTF32X4 $0x1,%YMM16,%XMM14 |
(274) 0x239cb9 VMOVHPD %XMM16,(%R9,%RAX,8) |
(274) 0x239cc0 VMOVLPD %XMM14,(%R9,%RSI,8) |
(274) 0x239cc6 VMOVHPD %XMM14,(%R9,%RDI,8) |
(274) 0x239ccc JNE 239840 |
0x239cd2 MOV -0x68(%RBP),%RBX |
0x239cd6 MOV -0x60(%RBP),%R13 |
0x239cda CMP %R11,-0x80(%RBP) |
0x239cde MOV -0x88(%RBP),%R11 |
0x239ce5 JE 239dec |
0x239ceb VMOVSD -0x284db(%RIP),%XMM0 |
0x239cf3 NOPW %CS:(%RAX,%RAX,1) |
(275) 0x239d00 MOV %RCX,%RAX |
(275) 0x239d03 CQTO |
(275) 0x239d05 IDIVQ -0x58(%RBP) |
(275) 0x239d09 ADD -0x2c(%RBP),%EDX |
(275) 0x239d0c MOVSXD %EDX,%RDX |
(275) 0x239d0f LEA (%R13,%RAX,1),%ESI |
(275) 0x239d14 MOV -0x90(%RBP),%R13 |
(275) 0x239d1b ADD %EBX,%EAX |
(275) 0x239d1d MOVSXD %EAX,%RDI |
(275) 0x239d20 MOV %R13,%R9 |
(275) 0x239d23 IMUL %RDI,%R9 |
(275) 0x239d27 IMUL %R12,%RDI |
(275) 0x239d2b LEA (%R9,%RDX,1),%RAX |
(275) 0x239d2f LEA -0x1(%R9,%RDX,1),%R9 |
(275) 0x239d34 VMOVSD (%R8,%RAX,8),%XMM1 |
(275) 0x239d3a MOVSXD %ESI,%RAX |
(275) 0x239d3d MOV %R13,%RSI |
(275) 0x239d40 IMUL %RAX,%RSI |
(275) 0x239d44 LEA (%RSI,%RDX,1),%RBX |
(275) 0x239d48 LEA -0x1(%RSI,%RDX,1),%RSI |
(275) 0x239d4d VMOVSD (%R8,%RBX,8),%XMM2 |
(275) 0x239d53 MOV %R12,%RBX |
(275) 0x239d56 IMUL %RAX,%RBX |
(275) 0x239d5a LEA (%RBX,%RDX,1),%R13 |
(275) 0x239d5e VMULSD (%R10,%R13,8),%XMM2,%XMM2 |
(275) 0x239d64 LEA (%RDI,%RDX,1),%R13 |
(275) 0x239d68 LEA -0x1(%RDI,%RDX,1),%RDI |
(275) 0x239d6d VFMADD231SD (%R10,%R13,8),%XMM1,%XMM2 |
(275) 0x239d73 VMOVSD (%R8,%R9,8),%XMM1 |
(275) 0x239d79 MOV -0x60(%RBP),%R13 |
(275) 0x239d7d VFMADD132SD (%R10,%RDI,8),%XMM2,%XMM1 |
(275) 0x239d83 VMOVSD (%R8,%RSI,8),%XMM2 |
(275) 0x239d89 LEA -0x1(%RBX,%RDX,1),%RSI |
(275) 0x239d8e MOV -0x70(%RBP),%RDI |
(275) 0x239d92 MOV -0x68(%RBP),%RBX |
(275) 0x239d96 VFMADD132SD (%R10,%RSI,8),%XMM1,%XMM2 |
(275) 0x239d9c MOV %R11,%RSI |
(275) 0x239d9f IMUL %RAX,%RSI |
(275) 0x239da3 ADD %RDX,%RSI |
(275) 0x239da6 VMULSD %XMM0,%XMM2,%XMM1 |
(275) 0x239daa VMOVSD %XMM1,(%RDI,%RSI,8) |
(275) 0x239daf MOV -0x98(%RBP),%RSI |
(275) 0x239db6 IMUL %RAX,%RSI |
(275) 0x239dba IMUL -0x50(%RBP),%RAX |
(275) 0x239dbf LEA -0x1(%RSI,%RDX,1),%RDI |
(275) 0x239dc4 ADD %RDX,%RSI |
(275) 0x239dc7 VSUBSD (%R14,%RDI,8),%XMM1,%XMM1 |
(275) 0x239dcd ADD %RDX,%RAX |
(275) 0x239dd0 MOV -0x38(%RBP),%RDX |
(275) 0x239dd4 VADDSD (%R14,%RSI,8),%XMM1,%XMM1 |
(275) 0x239dda VMOVSD %XMM1,(%RDX,%RAX,8) |
(275) 0x239ddf CMP %R15,%RCX |
(275) 0x239de2 LEA 0x1(%RCX),%RCX |
(275) 0x239de6 JL 239d00 |
0x239dec MOV -0x44(%RBP),%ESI |
0x239def LEA 0x26f92(%RIP),%RDI |
0x239df6 VZEROUPPER |
0x239df9 CALL 25f750 <@plt_start@+0x540> |
0x239dfe ADD $0x78,%RSP |
0x239e02 POP %RBX |
0x239e03 POP %R12 |
0x239e05 POP %R13 |
0x239e07 POP %R14 |
0x239e09 POP %R15 |
0x239e0b POP %RBP |
0x239e0c RET |
Path / |
Source file and lines | advec_mom.cpp:95-100 |
Module | exec |
nb instructions | 125 |
nb uops | 135 |
loop length | 527 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 6 |
used ymm registers | 9 |
used zmm registers | 0 |
nb stack references | 21 |
micro-operation queue | 22.50 cycles |
front end | 22.50 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 8.25 | 8.25 | 8.00 | 8.00 | 4.50 | 17.67 | 17.67 | 17.67 | 1.00 | 10.00 | 1.00 | 1.00 | 0.00 | 0.00 |
cycles | 8.25 | 8.25 | 8.00 | 8.00 | 4.50 | 17.67 | 17.67 | 17.67 | 1.00 | 10.00 | 1.00 | 1.00 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 22.50 |
Dispatch | 17.67 |
Overall L1 | 22.50 |
all | 7% |
load | 9% |
store | 0% |
mul | 0% |
add-sub | 16% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 13% |
all | 0% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 7% |
load | 7% |
store | 0% |
mul | 0% |
add-sub | 16% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 11% |
load | 13% |
store | 10% |
mul | 12% |
add-sub | 14% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 13% |
all | 12% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 11% |
load | 13% |
store | 10% |
mul | 12% |
add-sub | 14% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 13% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB $0x78,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%RCX),%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RDX),%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
LEA 0x1(%RBX),%R13D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD $0x3,%R15D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB %R13D,%R15D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 239dfe <.omp_outlined..10+0x77e> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV (%R9),%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R8),%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD $0x4,%R12D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP %R14D,%R12D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 239dfe <.omp_outlined..10+0x77e> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
SUB %R14D,%R12D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVQ $0,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVQ $0x1,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVL $0,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
IMUL %R12,%R15 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
DEC %R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R15,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x48(%RBP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0xa0(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x27676(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x78(%RBP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x40(%RBP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %ESI,-0x44(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CALL 25f740 <@plt_start@+0x530> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x78(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %R15,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVL %RAX,%R15 | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CMP %R15,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JG 239dec <.omp_outlined..10+0x76c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV 0x20(%RBP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RBP),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x30(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x28(%RBP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R14D,-0x2c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x18(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R12,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RBX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R13,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RSI),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RSI),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R11),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%R11),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RAX),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%R8),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R11,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RAX),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RDX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDI,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RAX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%RDX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R11,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RAX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SUB %RCX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
INC %RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP $0x4,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JAE 2397af <.omp_outlined..10+0x12f> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %R9,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 239ceb <.omp_outlined..10+0x66b> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
VBROADCASTSD -0x27fa0(%RIP),%YMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VPBROADCASTQ %RCX,%YMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
VPADDQ -0x27dc6(%RIP),%YMM0,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ -0x2800f(%RIP),%YMM13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV -0x58(%RBP),%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VPBROADCASTD %R13D,%XMM2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV -0x2c(%RBP),%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RSI,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VPBROADCASTQ %RSI,%YMM7 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV -0x50(%RBP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
AND $-0x4,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
VPBROADCASTQ %R11,%YMM8 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTD %EBX,%XMM4 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTQ %RDI,%YMM5 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTQ %R9,%YMM6 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
VPCMPEQD %XMM11,%XMM11,%XMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
MOV %RAX,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
ADD %RDX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDX,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPBROADCASTQ %R12,%YMM1 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTD %R13D,%XMM3 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTQ %RSI,%YMM9 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV %R9,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VEXTRACTI128 $0x1,%YMM1,%XMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOV -0x68(%RBP),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x60(%RBP),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %R11,-0x80(%RBP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV -0x88(%RBP),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
JE 239dec <.omp_outlined..10+0x76c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
VMOVSD -0x284db(%RIP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOV -0x44(%RBP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
LEA 0x26f92(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 25f750 <@plt_start@+0x540> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x78,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
Source file and lines | advec_mom.cpp:95-100 |
Module | exec |
nb instructions | 125 |
nb uops | 135 |
loop length | 527 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 6 |
used ymm registers | 9 |
used zmm registers | 0 |
nb stack references | 21 |
micro-operation queue | 22.50 cycles |
front end | 22.50 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 8.25 | 8.25 | 8.00 | 8.00 | 4.50 | 17.67 | 17.67 | 17.67 | 1.00 | 10.00 | 1.00 | 1.00 | 0.00 | 0.00 |
cycles | 8.25 | 8.25 | 8.00 | 8.00 | 4.50 | 17.67 | 17.67 | 17.67 | 1.00 | 10.00 | 1.00 | 1.00 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 22.50 |
Dispatch | 17.67 |
Overall L1 | 22.50 |
all | 7% |
load | 9% |
store | 0% |
mul | 0% |
add-sub | 16% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 13% |
all | 0% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 7% |
load | 7% |
store | 0% |
mul | 0% |
add-sub | 16% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 11% |
load | 13% |
store | 10% |
mul | 12% |
add-sub | 14% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 13% |
all | 12% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 11% |
load | 13% |
store | 10% |
mul | 12% |
add-sub | 14% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 13% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB $0x78,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%RCX),%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RDX),%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
LEA 0x1(%RBX),%R13D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD $0x3,%R15D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB %R13D,%R15D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 239dfe <.omp_outlined..10+0x77e> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV (%R9),%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R8),%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD $0x4,%R12D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP %R14D,%R12D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 239dfe <.omp_outlined..10+0x77e> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
SUB %R14D,%R12D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVQ $0,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVQ $0x1,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVL $0,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
IMUL %R12,%R15 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
DEC %R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R15,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x48(%RBP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0xa0(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x27676(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x78(%RBP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x40(%RBP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %ESI,-0x44(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CALL 25f740 <@plt_start@+0x530> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x78(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %R15,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVL %RAX,%R15 | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CMP %R15,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JG 239dec <.omp_outlined..10+0x76c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV 0x20(%RBP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RBP),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x30(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x28(%RBP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R14D,-0x2c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x18(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R12,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RBX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R13,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RSI),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RSI),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R11),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%R11),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RAX),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%R8),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R11,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RAX),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RDX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDI,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RAX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%RDX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R11,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RAX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SUB %RCX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
INC %RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP $0x4,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JAE 2397af <.omp_outlined..10+0x12f> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %R9,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 239ceb <.omp_outlined..10+0x66b> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
VBROADCASTSD -0x27fa0(%RIP),%YMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VPBROADCASTQ %RCX,%YMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
VPADDQ -0x27dc6(%RIP),%YMM0,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ -0x2800f(%RIP),%YMM13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV -0x58(%RBP),%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VPBROADCASTD %R13D,%XMM2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV -0x2c(%RBP),%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RSI,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VPBROADCASTQ %RSI,%YMM7 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV -0x50(%RBP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
AND $-0x4,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
VPBROADCASTQ %R11,%YMM8 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTD %EBX,%XMM4 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTQ %RDI,%YMM5 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTQ %R9,%YMM6 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
VPCMPEQD %XMM11,%XMM11,%XMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
MOV %RAX,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
ADD %RDX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDX,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPBROADCASTQ %R12,%YMM1 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTD %R13D,%XMM3 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTQ %RSI,%YMM9 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV %R9,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VEXTRACTI128 $0x1,%YMM1,%XMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOV -0x68(%RBP),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x60(%RBP),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %R11,-0x80(%RBP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV -0x88(%RBP),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
JE 239dec <.omp_outlined..10+0x76c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
VMOVSD -0x284db(%RIP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOV -0x44(%RBP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
LEA 0x26f92(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 25f750 <@plt_start@+0x540> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x78,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼.omp_outlined..10#0x239680– | 2.98 | 1.52 |
○Loop 274 - advec_mom.cpp:96-100 - exec | 2.98 | 1.52 |
○Loop 275 - advec_mom.cpp:96-100 - exec | 0 | 0 |