Function: .omp_outlined..2#0x237ce0 | Module: exec | Source: advec_mom.cpp:53-57 [...] | Coverage: 2.9% |
---|
Function: .omp_outlined..2#0x237ce0 | Module: exec | Source: advec_mom.cpp:53-57 [...] | Coverage: 2.9% |
---|
/beegfs/hackathon/users/eoseret/qaas_runs/170-854-8685/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/advec_mom.cpp: 53 - 57 |
-------------------------------------------------------------------------------- |
53: #pragma omp parallel for simd collapse(2) |
54: for (int j = (y_min - 2 + 1); j < (y_max + 2 + 2); j++) { |
55: for (int i = (x_min - 2 + 1); i < (x_max + 2 + 2); i++) { |
56: post_vol(i, j) = volume(i, j) + vol_flux_x(i + 1, j + 0) - vol_flux_x(i, j); |
57: pre_vol(i, j) = post_vol(i, j) + vol_flux_y(i + 0, j + 1) - vol_flux_y(i, j); |
/beegfs/hackathon/users/eoseret/qaas_runs/170-854-8685/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/context.h: 69 - 69 |
-------------------------------------------------------------------------------- |
69: T &operator()(size_t i, size_t j) const { return data[i + j * sizeX]; } |
0x237ce0 PUSH %RBP |
0x237ce1 MOV %RSP,%RBP |
0x237ce4 PUSH %R15 |
0x237ce6 PUSH %R14 |
0x237ce8 PUSH %R13 |
0x237cea PUSH %R12 |
0x237cec PUSH %RBX |
0x237ced SUB $0x88,%RSP |
0x237cf4 MOV (%RCX),%R15D |
0x237cf7 MOV (%RDX),%EAX |
0x237cf9 ADD $0x4,%R15D |
0x237cfd CMP %EAX,%R15D |
0x237d00 JL 23845b |
0x237d06 MOV (%R9),%R13D |
0x237d09 MOV (%R8),%ECX |
0x237d0c ADD $0x4,%R13D |
0x237d10 CMP %ECX,%R13D |
0x237d13 JL 23845b |
0x237d19 LEA -0x1(%RAX),%EBX |
0x237d1c LEA -0x1(%RCX),%R14D |
0x237d20 MOV (%RDI),%ESI |
0x237d22 MOVQ $0,-0x68(%RBP) |
0x237d2a MOVQ $0x1,-0xa8(%RBP) |
0x237d35 MOVL $0,-0x40(%RBP) |
0x237d3c SUB %R14D,%R13D |
0x237d3f SUB %EBX,%R15D |
0x237d42 IMUL %R13,%R15 |
0x237d46 DEC %R15 |
0x237d49 MOV %R15,-0x38(%RBP) |
0x237d4d SUB $0x8,%RSP |
0x237d51 MOV %RCX,%R12 |
0x237d54 LEA -0x40(%RBP),%RCX |
0x237d58 MOV %RAX,-0x60(%RBP) |
0x237d5c LEA -0xa8(%RBP),%RAX |
0x237d63 LEA 0x28ee6(%RIP),%RDI |
0x237d6a LEA -0x68(%RBP),%R8 |
0x237d6e LEA -0x38(%RBP),%R9 |
0x237d72 MOV %ESI,-0x3c(%RBP) |
0x237d75 MOV $0x22,%EDX |
0x237d7a PUSH $0x1 |
0x237d7c PUSH $0x1 |
0x237d7e PUSH %RAX |
0x237d7f CALL 25f740 <@plt_start@+0x530> |
0x237d84 ADD $0x20,%RSP |
0x237d88 MOV -0x38(%RBP),%RAX |
0x237d8c MOV -0x68(%RBP),%RCX |
0x237d90 CMP %R15,%RAX |
0x237d93 CMOVL %RAX,%R15 |
0x237d97 MOV %R15,-0x38(%RBP) |
0x237d9b CMP %R15,%RCX |
0x237d9e JG 238449 |
0x237da4 MOV 0x20(%RBP),%RSI |
0x237da8 MOV 0x18(%RBP),%RDI |
0x237dac MOV 0x30(%RBP),%RAX |
0x237db0 MOV 0x28(%RBP),%RDX |
0x237db4 MOV 0x10(%RBP),%R8 |
0x237db8 MOV %R12,-0x58(%RBP) |
0x237dbc MOV %R14,-0x50(%RBP) |
0x237dc0 MOV %RBX,-0x30(%RBP) |
0x237dc4 MOV %R15,%R10 |
0x237dc7 SUB %RCX,%R10 |
0x237dca INC %R10 |
0x237dcd MOV (%RDI),%R12 |
0x237dd0 MOV 0x10(%RDI),%R9 |
0x237dd4 MOV (%RSI),%RDI |
0x237dd7 MOV 0x10(%RSI),%R11 |
0x237ddb MOV (%R8),%RSI |
0x237dde MOV 0x10(%R8),%R14 |
0x237de2 MOV (%RAX),%R8 |
0x237de5 MOV 0x10(%RAX),%RBX |
0x237de9 MOV (%RDX),%RAX |
0x237dec MOV 0x10(%RDX),%RDX |
0x237df0 MOV %RDX,-0x48(%RBP) |
0x237df4 MOV %RDI,-0xa0(%RBP) |
0x237dfb MOV %R12,-0x98(%RBP) |
0x237e02 MOV %RSI,-0x90(%RBP) |
0x237e09 MOV %RAX,-0x88(%RBP) |
0x237e10 CMP $0x8,%R10 |
0x237e14 JAE 237e22 |
0x237e16 MOV -0x30(%RBP),%R10 |
0x237e1a MOV %R14,%RDX |
0x237e1d JMP 238390 |
0x237e22 MOV %RAX,%RDX |
0x237e25 MOV -0x30(%RBP),%RAX |
0x237e29 VPBROADCASTQ %RCX,%ZMM0 |
0x237e2f VPADDQ -0x261b9(%RIP),%ZMM0,%ZMM0 |
0x237e39 VPBROADCASTQ -0x2663b(%RIP),%ZMM13 |
0x237e43 MOV %R8,-0x80(%RBP) |
0x237e47 VPBROADCASTQ %R8,%ZMM9 |
0x237e4d MOV -0x48(%RBP),%R8 |
0x237e51 VPBROADCASTQ %R13,%ZMM1 |
0x237e57 MOV %R10,-0x78(%RBP) |
0x237e5b AND $-0x8,%R10 |
0x237e5f VPBROADCASTQ %R12,%ZMM4 |
0x237e65 VPBROADCASTQ %RDI,%ZMM6 |
0x237e6b VPBROADCASTQ %RSI,%ZMM7 |
0x237e71 VPBROADCASTQ %RDX,%ZMM10 |
0x237e77 ADD %R10,%RCX |
0x237e7a VEXTRACTI32X4 $0x3,%ZMM1,%XMM11 |
0x237e81 VEXTRACTI32X4 $0x2,%ZMM1,%XMM12 |
0x237e88 MOV %R10,-0x70(%RBP) |
0x237e8c VPBROADCASTD %EAX,%YMM2 |
0x237e92 MOV -0x50(%RBP),%RAX |
0x237e96 VPBROADCASTD %EAX,%YMM3 |
0x237e9c MOV -0x58(%RBP),%RAX |
0x237ea0 VPBROADCASTD %EAX,%YMM5 |
0x237ea6 MOV -0x60(%RBP),%RAX |
0x237eaa VPBROADCASTD %EAX,%YMM8 |
(202) 0x237eb0 VEXTRACTI32X4 $0x3,%ZMM0,%XMM14 |
(202) 0x237eb7 VPEXTRQ $0x1,%XMM11,%RSI |
(202) 0x237ebd VMOVQ %XMM11,%RDI |
(202) 0x237ec2 VPEXTRQ $0x1,%XMM12,%R12 |
(202) 0x237ec8 VEXTRACTI32X4 $0x1,%YMM1,%XMM18 |
(202) 0x237ecf KXNORW %K0,%K0,%K1 |
(202) 0x237ed3 VPEXTRQ $0x1,%XMM14,%RAX |
(202) 0x237ed9 CQTO |
(202) 0x237edb IDIV %RSI |
(202) 0x237ede MOV %RAX,%RSI |
(202) 0x237ee1 VMOVQ %XMM14,%RAX |
(202) 0x237ee6 VEXTRACTI32X4 $0x2,%ZMM0,%XMM14 |
(202) 0x237eed VMOVQ %RSI,%XMM15 |
(202) 0x237ef2 VMOVQ %XMM12,%RSI |
(202) 0x237ef7 CQTO |
(202) 0x237ef9 IDIV %RDI |
(202) 0x237efc MOV %RAX,%RDI |
(202) 0x237eff VPEXTRQ $0x1,%XMM14,%RAX |
(202) 0x237f05 VMOVQ %RDI,%XMM16 |
(202) 0x237f0b VMOVQ %XMM18,%RDI |
(202) 0x237f11 CQTO |
(202) 0x237f13 VPUNPCKLQDQ %XMM15,%XMM16,%XMM15 |
(202) 0x237f19 IDIV %R12 |
(202) 0x237f1c VMOVQ %RAX,%XMM16 |
(202) 0x237f22 VMOVQ %XMM14,%RAX |
(202) 0x237f27 VEXTRACTI128 $0x1,%YMM0,%XMM14 |
(202) 0x237f2d CQTO |
(202) 0x237f2f IDIV %RSI |
(202) 0x237f32 VPEXTRQ $0x1,%XMM18,%RSI |
(202) 0x237f39 VMOVQ %RAX,%XMM17 |
(202) 0x237f3f VPEXTRQ $0x1,%XMM14,%RAX |
(202) 0x237f45 CQTO |
(202) 0x237f47 IDIV %RSI |
(202) 0x237f4a MOV %RAX,%RSI |
(202) 0x237f4d VMOVQ %XMM14,%RAX |
(202) 0x237f52 VPUNPCKLQDQ %XMM16,%XMM17,%XMM14 |
(202) 0x237f58 CQTO |
(202) 0x237f5a VINSERTI128 $0x1,%XMM15,%YMM14,%YMM14 |
(202) 0x237f60 VMOVQ %RSI,%XMM15 |
(202) 0x237f65 VPEXTRQ $0x1,%XMM1,%RSI |
(202) 0x237f6b IDIV %RDI |
(202) 0x237f6e VPEXTRQ $0x1,%XMM0,%RDX |
(202) 0x237f74 VMOVQ %RAX,%XMM16 |
(202) 0x237f7a MOV %RDX,%RAX |
(202) 0x237f7d CQTO |
(202) 0x237f7f IDIV %RSI |
(202) 0x237f82 VMOVQ %XMM1,%RSI |
(202) 0x237f87 VPUNPCKLQDQ %XMM15,%XMM16,%XMM15 |
(202) 0x237f8d VMOVQ %RAX,%XMM17 |
(202) 0x237f93 VMOVQ %XMM0,%RAX |
(202) 0x237f98 CQTO |
(202) 0x237f9a IDIV %RSI |
(202) 0x237f9d ADD $-0x8,%R10 |
(202) 0x237fa1 VMOVQ %RAX,%XMM16 |
(202) 0x237fa7 VPUNPCKLQDQ %XMM17,%XMM16,%XMM16 |
(202) 0x237fad VINSERTI32X4 $0x1,%XMM15,%YMM16,%YMM15 |
(202) 0x237fb4 VINSERTI64X4 $0x1,%YMM14,%ZMM15,%ZMM14 |
(202) 0x237fbb VPMOVQD %ZMM14,%YMM16 |
(202) 0x237fc1 VPMULLQ %ZMM1,%ZMM14,%ZMM14 |
(202) 0x237fc7 VPSUBQ %ZMM14,%ZMM0,%ZMM14 |
(202) 0x237fcd VPADDQ %ZMM13,%ZMM0,%ZMM0 |
(202) 0x237fd3 VPMOVQD %ZMM14,%YMM17 |
(202) 0x237fd9 VPADDD %YMM16,%YMM2,%YMM15 |
(202) 0x237fdf VPADDD %YMM16,%YMM8,%YMM16 |
(202) 0x237fe5 VPMOVSXDQ %YMM15,%ZMM15 |
(202) 0x237feb VPMOVSXDQ %YMM16,%ZMM16 |
(202) 0x237ff1 VPADDD %YMM17,%YMM3,%YMM14 |
(202) 0x237ff7 VPADDD %YMM17,%YMM5,%YMM17 |
(202) 0x237ffd VPMOVSXDQ %YMM14,%ZMM14 |
(202) 0x238003 VPMULLQ %ZMM15,%ZMM4,%ZMM18 |
(202) 0x238009 VPMOVSXDQ %YMM17,%ZMM17 |
(202) 0x23800f VPMULLQ %ZMM15,%ZMM6,%ZMM28 |
(202) 0x238015 VPMULLQ %ZMM16,%ZMM9,%ZMM16 |
(202) 0x23801b VPADDQ %ZMM14,%ZMM18,%ZMM18 |
(202) 0x238021 VPADDQ %ZMM17,%ZMM28,%ZMM17 |
(202) 0x238027 VPADDQ %ZMM14,%ZMM16,%ZMM16 |
(202) 0x23802d VEXTRACTI32X4 $0x3,%ZMM18,%XMM21 |
(202) 0x238034 VEXTRACTI32X4 $0x2,%ZMM18,%XMM20 |
(202) 0x23803b VEXTRACTI32X4 $0x1,%YMM18,%XMM19 |
(202) 0x238042 VEXTRACTI32X4 $0x3,%ZMM17,%XMM25 |
(202) 0x238049 VMOVQ %XMM21,%RAX |
(202) 0x23804f VMOVSD (%R9,%RAX,8),%XMM22 |
(202) 0x238056 VPEXTRQ $0x1,%XMM21,%RAX |
(202) 0x23805d VMOVHPD (%R9,%RAX,8),%XMM22,%XMM21 |
(202) 0x238064 VMOVQ %XMM20,%RAX |
(202) 0x23806a VMOVSD (%R9,%RAX,8),%XMM22 |
(202) 0x238071 VMOVQ %XMM19,%RAX |
(202) 0x238077 VMOVSD (%R9,%RAX,8),%XMM23 |
(202) 0x23807e VMOVQ %XMM18,%RAX |
(202) 0x238084 VMOVSD (%R9,%RAX,8),%XMM24 |
(202) 0x23808b VPEXTRQ $0x1,%XMM20,%RAX |
(202) 0x238092 VMOVHPD (%R9,%RAX,8),%XMM22,%XMM20 |
(202) 0x238099 VPEXTRQ $0x1,%XMM18,%RAX |
(202) 0x2380a0 VEXTRACTI32X4 $0x1,%YMM17,%XMM22 |
(202) 0x2380a7 VMOVHPD (%R9,%RAX,8),%XMM24,%XMM18 |
(202) 0x2380ae VPEXTRQ $0x1,%XMM19,%RAX |
(202) 0x2380b5 VEXTRACTI32X4 $0x2,%ZMM17,%XMM24 |
(202) 0x2380bc VPADDQ %ZMM14,%ZMM28,%ZMM19 |
(202) 0x2380c2 VMOVHPD (%R9,%RAX,8),%XMM23,%XMM23 |
(202) 0x2380c9 VMOVQ %XMM25,%RAX |
(202) 0x2380cf VMOVSD (%R11,%RAX,8),%XMM26 |
(202) 0x2380d6 VPEXTRQ $0x1,%XMM25,%RAX |
(202) 0x2380dd VMOVHPD (%R11,%RAX,8),%XMM26,%XMM25 |
(202) 0x2380e4 VMOVQ %XMM24,%RAX |
(202) 0x2380ea VMOVSD (%R11,%RAX,8),%XMM26 |
(202) 0x2380f1 VPEXTRQ $0x1,%XMM24,%RAX |
(202) 0x2380f8 VMOVHPD (%R11,%RAX,8),%XMM26,%XMM24 |
(202) 0x2380ff VMOVQ %XMM22,%RAX |
(202) 0x238105 VMOVSD (%R11,%RAX,8),%XMM26 |
(202) 0x23810c VPEXTRQ $0x1,%XMM22,%RAX |
(202) 0x238113 VMOVHPD (%R11,%RAX,8),%XMM26,%XMM22 |
(202) 0x23811a VMOVQ %XMM17,%RAX |
(202) 0x238120 VINSERTF32X4 $0x1,%XMM21,%YMM20,%YMM20 |
(202) 0x238127 VEXTRACTI32X4 $0x3,%ZMM19,%XMM26 |
(202) 0x23812e VMOVSD (%R11,%RAX,8),%XMM21 |
(202) 0x238135 VPEXTRQ $0x1,%XMM17,%RAX |
(202) 0x23813c VMOVHPD (%R11,%RAX,8),%XMM21,%XMM17 |
(202) 0x238143 VMOVQ %XMM26,%RAX |
(202) 0x238149 VINSERTF32X4 $0x1,%XMM23,%YMM18,%YMM18 |
(202) 0x238150 VEXTRACTI32X4 $0x2,%ZMM19,%XMM23 |
(202) 0x238157 VEXTRACTI32X4 $0x1,%YMM19,%XMM21 |
(202) 0x23815e VMOVSD (%R11,%RAX,8),%XMM27 |
(202) 0x238165 VPEXTRQ $0x1,%XMM26,%RAX |
(202) 0x23816c VINSERTF64X4 $0x1,%YMM20,%ZMM18,%ZMM18 |
(202) 0x238173 VINSERTF32X4 $0x1,%XMM25,%YMM24,%YMM24 |
(202) 0x23817a VMOVHPD (%R11,%RAX,8),%XMM27,%XMM25 |
(202) 0x238181 VMOVQ %XMM23,%RAX |
(202) 0x238187 VMOVSD (%R11,%RAX,8),%XMM26 |
(202) 0x23818e VPEXTRQ $0x1,%XMM23,%RAX |
(202) 0x238195 VINSERTF32X4 $0x1,%XMM22,%YMM17,%YMM17 |
(202) 0x23819c VMOVHPD (%R11,%RAX,8),%XMM26,%XMM22 |
(202) 0x2381a3 VMOVQ %XMM21,%RAX |
(202) 0x2381a9 VPMULLQ %ZMM15,%ZMM9,%ZMM26 |
(202) 0x2381af VMOVSD (%R11,%RAX,8),%XMM23 |
(202) 0x2381b6 VPEXTRQ $0x1,%XMM21,%RAX |
(202) 0x2381bd VMOVHPD (%R11,%RAX,8),%XMM23,%XMM20 |
(202) 0x2381c4 VMOVQ %XMM19,%RAX |
(202) 0x2381ca VINSERTF64X4 $0x1,%YMM24,%ZMM17,%ZMM17 |
(202) 0x2381d1 VMOVSD (%R11,%RAX,8),%XMM21 |
(202) 0x2381d8 VPEXTRQ $0x1,%XMM19,%RAX |
(202) 0x2381df VMOVHPD (%R11,%RAX,8),%XMM21,%XMM21 |
(202) 0x2381e6 VADDPD %ZMM17,%ZMM18,%ZMM17 |
(202) 0x2381ec VINSERTF32X4 $0x1,%XMM25,%YMM22,%YMM19 |
(202) 0x2381f3 VINSERTF32X4 $0x1,%XMM20,%YMM21,%YMM20 |
(202) 0x2381fa VINSERTF64X4 $0x1,%YMM19,%ZMM20,%ZMM18 |
(202) 0x238201 VPMULLQ %ZMM15,%ZMM7,%ZMM19 |
(202) 0x238207 VEXTRACTI32X4 $0x2,%ZMM16,%XMM20 |
(202) 0x23820e VPMULLQ %ZMM15,%ZMM10,%ZMM15 |
(202) 0x238214 VSUBPD %ZMM18,%ZMM17,%ZMM17 |
(202) 0x23821a VEXTRACTI32X4 $0x1,%YMM16,%XMM18 |
(202) 0x238221 VPADDQ %ZMM14,%ZMM19,%ZMM19 |
(202) 0x238227 VSCATTERQPD %ZMM17,(%R14,%ZMM19,8){%K1} |
(202) 0x23822e VEXTRACTI32X4 $0x3,%ZMM16,%XMM19 |
(202) 0x238235 KXNORW %K0,%K0,%K1 |
(202) 0x238239 VMOVQ %XMM19,%RAX |
(202) 0x23823f VMOVSD (%RBX,%RAX,8),%XMM21 |
(202) 0x238246 VPEXTRQ $0x1,%XMM19,%RAX |
(202) 0x23824d VMOVHPD (%RBX,%RAX,8),%XMM21,%XMM19 |
(202) 0x238254 VMOVQ %XMM20,%RAX |
(202) 0x23825a VMOVSD (%RBX,%RAX,8),%XMM21 |
(202) 0x238261 VPEXTRQ $0x1,%XMM20,%RAX |
(202) 0x238268 VMOVHPD (%RBX,%RAX,8),%XMM21,%XMM20 |
(202) 0x23826f VMOVQ %XMM18,%RAX |
(202) 0x238275 VMOVSD (%RBX,%RAX,8),%XMM21 |
(202) 0x23827c VMOVQ %XMM16,%RAX |
(202) 0x238282 VMOVSD (%RBX,%RAX,8),%XMM22 |
(202) 0x238289 VPEXTRQ $0x1,%XMM18,%RAX |
(202) 0x238290 VMOVHPD (%RBX,%RAX,8),%XMM21,%XMM18 |
(202) 0x238297 VPEXTRQ $0x1,%XMM16,%RAX |
(202) 0x23829e VPADDQ %ZMM14,%ZMM26,%ZMM16 |
(202) 0x2382a4 VPADDQ %ZMM14,%ZMM15,%ZMM14 |
(202) 0x2382aa VEXTRACTI32X4 $0x3,%ZMM16,%XMM24 |
(202) 0x2382b1 VMOVHPD (%RBX,%RAX,8),%XMM22,%XMM22 |
(202) 0x2382b8 VEXTRACTI32X4 $0x2,%ZMM16,%XMM23 |
(202) 0x2382bf VEXTRACTI32X4 $0x1,%YMM16,%XMM21 |
(202) 0x2382c6 VMOVQ %XMM24,%RAX |
(202) 0x2382cc VMOVSD (%RBX,%RAX,8),%XMM25 |
(202) 0x2382d3 VPEXTRQ $0x1,%XMM24,%RAX |
(202) 0x2382da VMOVHPD (%RBX,%RAX,8),%XMM25,%XMM24 |
(202) 0x2382e1 VMOVQ %XMM23,%RAX |
(202) 0x2382e7 VMOVSD (%RBX,%RAX,8),%XMM25 |
(202) 0x2382ee VPEXTRQ $0x1,%XMM23,%RAX |
(202) 0x2382f5 VINSERTF32X4 $0x1,%XMM19,%YMM20,%YMM19 |
(202) 0x2382fc VMOVHPD (%RBX,%RAX,8),%XMM25,%XMM23 |
(202) 0x238303 VMOVQ %XMM21,%RAX |
(202) 0x238309 VMOVSD (%RBX,%RAX,8),%XMM25 |
(202) 0x238310 VPEXTRQ $0x1,%XMM21,%RAX |
(202) 0x238317 VMOVHPD (%RBX,%RAX,8),%XMM25,%XMM21 |
(202) 0x23831e VMOVQ %XMM16,%RAX |
(202) 0x238324 VMOVSD (%RBX,%RAX,8),%XMM25 |
(202) 0x23832b VPEXTRQ $0x1,%XMM16,%RAX |
(202) 0x238332 VINSERTF32X4 $0x1,%XMM18,%YMM22,%YMM18 |
(202) 0x238339 VMOVHPD (%RBX,%RAX,8),%XMM25,%XMM16 |
(202) 0x238340 VINSERTF64X4 $0x1,%YMM19,%ZMM18,%ZMM18 |
(202) 0x238347 VADDPD %ZMM18,%ZMM17,%ZMM17 |
(202) 0x23834d VINSERTF32X4 $0x1,%XMM24,%YMM23,%YMM18 |
(202) 0x238354 VINSERTF32X4 $0x1,%XMM21,%YMM16,%YMM16 |
(202) 0x23835b VINSERTF64X4 $0x1,%YMM18,%ZMM16,%ZMM16 |
(202) 0x238362 VSUBPD %ZMM16,%ZMM17,%ZMM16 |
(202) 0x238368 VSCATTERQPD %ZMM16,(%R8,%ZMM14,8){%K1} |
(202) 0x23836f JNE 237eb0 |
0x238375 MOV -0x70(%RBP),%RAX |
0x238379 MOV -0x30(%RBP),%R10 |
0x23837d MOV -0x80(%RBP),%R8 |
0x238381 MOV %R14,%RDX |
0x238384 CMP %RAX,-0x78(%RBP) |
0x238388 JE 238449 |
0x23838e XCHG %AX,%AX |
(203) 0x238390 MOV %RCX,%RAX |
(203) 0x238393 MOV %RDX,%R14 |
(203) 0x238396 CQTO |
(203) 0x238398 MOV %R13,%R12 |
(203) 0x23839b IDIV %R13 |
(203) 0x23839e MOV %R10,%R13 |
(203) 0x2383a1 MOV -0x50(%RBP),%RSI |
(203) 0x2383a5 ADD %EDX,%ESI |
(203) 0x2383a7 ADD -0x58(%RBP),%EDX |
(203) 0x2383aa MOVSXD %ESI,%RSI |
(203) 0x2383ad MOVSXD %EDX,%RDX |
(203) 0x2383b0 LEA (%R10,%RAX,1),%EDI |
(203) 0x2383b4 MOV -0x98(%RBP),%R10 |
(203) 0x2383bb ADD -0x60(%RBP),%EAX |
(203) 0x2383be MOVSXD %EDI,%RDI |
(203) 0x2383c1 IMUL %RDI,%R10 |
(203) 0x2383c5 CLTQ |
(203) 0x2383c7 IMUL %R8,%RAX |
(203) 0x2383cb ADD %RSI,%R10 |
(203) 0x2383ce VMOVSD (%R9,%R10,8),%XMM0 |
(203) 0x2383d4 MOV -0xa0(%RBP),%R10 |
(203) 0x2383db ADD %RSI,%RAX |
(203) 0x2383de IMUL %RDI,%R10 |
(203) 0x2383e2 ADD %R10,%RDX |
(203) 0x2383e5 ADD %RSI,%R10 |
(203) 0x2383e8 VADDSD (%R11,%RDX,8),%XMM0,%XMM0 |
(203) 0x2383ee MOV -0x90(%RBP),%RDX |
(203) 0x2383f5 VSUBSD (%R11,%R10,8),%XMM0,%XMM0 |
(203) 0x2383fb MOV %R13,%R10 |
(203) 0x2383fe MOV %R12,%R13 |
(203) 0x238401 IMUL %RDI,%RDX |
(203) 0x238405 ADD %RSI,%RDX |
(203) 0x238408 VMOVSD %XMM0,(%R14,%RDX,8) |
(203) 0x23840e MOV %R14,%RDX |
(203) 0x238411 MOV -0x88(%RBP),%R14 |
(203) 0x238418 VADDSD (%RBX,%RAX,8),%XMM0,%XMM0 |
(203) 0x23841d MOV %R8,%RAX |
(203) 0x238420 IMUL %RDI,%RAX |
(203) 0x238424 ADD %RSI,%RAX |
(203) 0x238427 VSUBSD (%RBX,%RAX,8),%XMM0,%XMM0 |
(203) 0x23842c MOV -0x48(%RBP),%RAX |
(203) 0x238430 IMUL %R14,%RDI |
(203) 0x238434 ADD %RSI,%RDI |
(203) 0x238437 VMOVSD %XMM0,(%RAX,%RDI,8) |
(203) 0x23843c CMP %R15,%RCX |
(203) 0x23843f LEA 0x1(%RCX),%RCX |
(203) 0x238443 JL 238390 |
0x238449 MOV -0x3c(%RBP),%ESI |
0x23844c LEA 0x28815(%RIP),%RDI |
0x238453 VZEROUPPER |
0x238456 CALL 25f750 <@plt_start@+0x540> |
0x23845b ADD $0x88,%RSP |
0x238462 POP %RBX |
0x238463 POP %R12 |
0x238465 POP %R13 |
0x238467 POP %R14 |
0x238469 POP %R15 |
0x23846b POP %RBP |
0x23846c RET |
Path / |
Source file and lines | advec_mom.cpp:53-57 |
Module | exec |
nb instructions | 127 |
nb uops | 139 |
loop length | 527 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 4 |
used zmm registers | 8 |
nb stack references | 22 |
micro-operation queue | 23.17 cycles |
front end | 23.17 cycles |
 | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 8.75 | 8.75 | 8.50 | 8.50 | 4.50 | 18.33 | 18.33 | 18.33 | 0.50 | 10.00 | 10.00 | 0.50 | 0.00 | 0.00 |
cycles | 8.75 | 8.75 | 8.50 | 8.50 | 4.50 | 18.67 | 18.67 | 18.67 | 0.50 | 10.00 | 10.00 | 0.50 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 23.17 |
Dispatch | 18.67 |
Overall L1 | 23.17 |
Vectorization ratio |
all | 6% |
load | 9% |
store | 0% |
mul | 0% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Vector efficiency ratio |
all | 12% |
load | 19% |
store | 11% |
mul | 12% |
add-sub | 20% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB $0x88,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%RCX),%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RDX),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD $0x4,%R15D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP %EAX,%R15D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JL 23845b <.omp_outlined..2+0x77b> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV (%R9),%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R8),%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD $0x4,%R13D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP %ECX,%R13D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JL 23845b <.omp_outlined..2+0x77b> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
LEA -0x1(%RAX),%EBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x1(%RCX),%R14D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVQ $0,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVQ $0x1,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVL $0,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB %R14D,%R13D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB %EBX,%R15D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
IMUL %R13,%R15 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
DEC %R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x40(%RBP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
LEA -0xa8(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x28ee6(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x68(%RBP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x38(%RBP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %ESI,-0x3c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CALL 25f740 <@plt_start@+0x530> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x68(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %R15,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVL %RAX,%R15 | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CMP %R15,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JG 238449 <.omp_outlined..2+0x769> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV 0x20(%RBP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x18(%RBP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x30(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x28(%RBP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R12,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R14,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RBX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R15,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SUB %RCX,%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
INC %R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%RDI),%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RDI),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RSI),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RSI),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%R8),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RAX),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RAX),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RDX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RDX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDI,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R12,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RSI,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RAX,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CMP $0x8,%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JAE 237e22 <.omp_outlined..2+0x142> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV -0x30(%RBP),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R14,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 238390 <.omp_outlined..2+0x6b0> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VPBROADCASTQ %RCX,%ZMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
VPADDQ -0x261b9(%RIP),%ZMM0,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 1 |
VPBROADCASTQ -0x2663b(%RIP),%ZMM13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 5 | 0.50 |
MOV %R8,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VPBROADCASTQ %R8,%ZMM9 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
MOV -0x48(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VPBROADCASTQ %R13,%ZMM1 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
MOV %R10,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
AND $-0x8,%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
VPBROADCASTQ %R12,%ZMM4 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTQ %RDI,%ZMM6 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTQ %RSI,%ZMM7 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTQ %RDX,%ZMM10 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
ADD %R10,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
VEXTRACTI32X4 $0x3,%ZMM1,%XMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 4 | 1 |
VEXTRACTI32X4 $0x2,%ZMM1,%XMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 4 | 1 |
MOV %R10,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VPBROADCASTD %EAX,%YMM2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VPBROADCASTD %EAX,%YMM3 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV -0x58(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VPBROADCASTD %EAX,%YMM5 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV -0x60(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VPBROADCASTD %EAX,%YMM8 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV -0x70(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x30(%RBP),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x80(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R14,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RAX,-0x78(%RBP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
JE 238449 <.omp_outlined..2+0x769> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOV -0x3c(%RBP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
LEA 0x28815(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 25f750 <@plt_start@+0x540> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x88,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
Source file and lines | advec_mom.cpp:53-57 |
Module | exec |
nb instructions | 127 |
nb uops | 139 |
loop length | 527 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 4 |
used zmm registers | 8 |
nb stack references | 22 |
micro-operation queue | 23.17 cycles |
front end | 23.17 cycles |
 | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 8.75 | 8.75 | 8.50 | 8.50 | 4.50 | 18.33 | 18.33 | 18.33 | 0.50 | 10.00 | 10.00 | 0.50 | 0.00 | 0.00 |
cycles | 8.75 | 8.75 | 8.50 | 8.50 | 4.50 | 18.67 | 18.67 | 18.67 | 0.50 | 10.00 | 10.00 | 0.50 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 23.17 |
Dispatch | 18.67 |
Overall L1 | 23.17 |
Vectorization ratio |
all | 6% |
load | 9% |
store | 0% |
mul | 0% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Vector efficiency ratio |
all | 12% |
load | 19% |
store | 11% |
mul | 12% |
add-sub | 20% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB $0x88,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%RCX),%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RDX),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD $0x4,%R15D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP %EAX,%R15D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JL 23845b <.omp_outlined..2+0x77b> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV (%R9),%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R8),%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD $0x4,%R13D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP %ECX,%R13D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JL 23845b <.omp_outlined..2+0x77b> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
LEA -0x1(%RAX),%EBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x1(%RCX),%R14D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVQ $0,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVQ $0x1,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVL $0,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB %R14D,%R13D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB %EBX,%R15D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
IMUL %R13,%R15 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
DEC %R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x40(%RBP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
LEA -0xa8(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x28ee6(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x68(%RBP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x38(%RBP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %ESI,-0x3c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CALL 25f740 <@plt_start@+0x530> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x68(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %R15,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVL %RAX,%R15 | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CMP %R15,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JG 238449 <.omp_outlined..2+0x769> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV 0x20(%RBP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x18(%RBP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x30(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x28(%RBP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R12,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R14,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RBX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R15,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SUB %RCX,%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
INC %R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%RDI),%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RDI),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RSI),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RSI),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%R8),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RAX),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RAX),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RDX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RDX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDI,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R12,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RSI,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RAX,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CMP $0x8,%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JAE 237e22 <.omp_outlined..2+0x142> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV -0x30(%RBP),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R14,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 238390 <.omp_outlined..2+0x6b0> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VPBROADCASTQ %RCX,%ZMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
VPADDQ -0x261b9(%RIP),%ZMM0,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 1 |
VPBROADCASTQ -0x2663b(%RIP),%ZMM13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 5 | 0.50 |
MOV %R8,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VPBROADCASTQ %R8,%ZMM9 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
MOV -0x48(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VPBROADCASTQ %R13,%ZMM1 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
MOV %R10,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
AND $-0x8,%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
VPBROADCASTQ %R12,%ZMM4 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTQ %RDI,%ZMM6 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTQ %RSI,%ZMM7 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTQ %RDX,%ZMM10 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
ADD %R10,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
VEXTRACTI32X4 $0x3,%ZMM1,%XMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 4 | 1 |
VEXTRACTI32X4 $0x2,%ZMM1,%XMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 4 | 1 |
MOV %R10,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VPBROADCASTD %EAX,%YMM2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VPBROADCASTD %EAX,%YMM3 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV -0x58(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VPBROADCASTD %EAX,%YMM5 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV -0x60(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VPBROADCASTD %EAX,%YMM8 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV -0x70(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x30(%RBP),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x80(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R14,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RAX,-0x78(%RBP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
JE 238449 <.omp_outlined..2+0x769> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
XCHG %AX,%AX | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOV -0x3c(%RBP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
LEA 0x28815(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 25f750 <@plt_start@+0x540> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x88,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼.omp_outlined..2#0x237ce0– | 2.9 | 1.48 |
○Loop 202 - advec_mom.cpp:54-57 - exec | 2.9 | 1.48 |
○Loop 203 - advec_mom.cpp:54-57 - exec | 0 | 0 |