Function: .omp_outlined..8 | Module: exec | Source: advec_cell.cpp:136-140 [...] | Coverage: 1.46% |
---|
Function: .omp_outlined..8 | Module: exec | Source: advec_cell.cpp:136-140 [...] | Coverage: 1.46% |
---|
/beegfs/hackathon/users/eoseret/qaas_runs/170-854-8685/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/advec_cell.cpp: 136 - 140 |
-------------------------------------------------------------------------------- |
136: #pragma omp parallel for simd collapse(2) |
137: for (int j = (y_min - 2 + 1); j < (y_max + 2 + 2); j++) { |
138: for (int i = (x_min - 2 + 1); i < (x_max + 2 + 2); i++) { |
139: pre_vol(i, j) = volume(i, j) + (vol_flux_y(i + 0, j + 1) - vol_flux_y(i, j) + vol_flux_x(i + 1, j + 0) - vol_flux_x(i, j)); |
140: post_vol(i, j) = pre_vol(i, j) - (vol_flux_y(i + 0, j + 1) - vol_flux_y(i, j)); |
/beegfs/hackathon/users/eoseret/qaas_runs/170-854-8685/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/update_tile_halo_kernel.cpp: 94 - 96 |
-------------------------------------------------------------------------------- |
94: #pragma omp parallel for simd |
95: for (int k = (y_min - depth + 1); k < (y_max + depth + 2); k++) { |
96: for (int j = 0; j < depth; ++j) { |
/beegfs/hackathon/users/eoseret/qaas_runs/170-854-8685/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/context.h: 69 - 69 |
-------------------------------------------------------------------------------- |
69: T &operator()(size_t i, size_t j) const { return data[i + j * sizeX]; } |
0x233bb0 PUSH %RBP |
0x233bb1 MOV %RSP,%RBP |
0x233bb4 PUSH %R15 |
0x233bb6 PUSH %R14 |
0x233bb8 PUSH %R13 |
0x233bba PUSH %R12 |
0x233bbc PUSH %RBX |
0x233bbd AND $-0x40,%RSP |
0x233bc1 SUB $0x1c0,%RSP |
0x233bc8 MOV (%RCX),%R14D |
0x233bcb MOV (%RDX),%R15D |
0x233bce ADD $0x4,%R14D |
0x233bd2 CMP %R15D,%R14D |
0x233bd5 JL 234504 |
0x233bdb MOV (%R9),%R12D |
0x233bde MOV (%R8),%R13D |
0x233be1 ADD $0x4,%R12D |
0x233be5 CMP %R13D,%R12D |
0x233be8 JL 234504 |
0x233bee LEA -0x1(%R13),%EAX |
0x233bf2 LEA -0x1(%R15),%EBX |
0x233bf6 MOV (%RDI),%ESI |
0x233bf8 MOVQ $0,0x58(%RSP) |
0x233c01 MOVQ $0x1,0xf8(%RSP) |
0x233c0d MOVL $0,0x2c(%RSP) |
0x233c15 SUB %EAX,%R12D |
0x233c18 SUB %EBX,%R14D |
0x233c1b MOV %RAX,0x40(%RSP) |
0x233c20 IMUL %R12,%R14 |
0x233c24 DEC %R14 |
0x233c27 MOV %R14,0x20(%RSP) |
0x233c2c SUB $0x8,%RSP |
0x233c30 LEA 0x34(%RSP),%RCX |
0x233c35 LEA 0x100(%RSP),%RAX |
0x233c3d LEA 0x2cea4(%RIP),%RDI |
0x233c44 LEA 0x60(%RSP),%R8 |
0x233c49 LEA 0x28(%RSP),%R9 |
0x233c4e MOV %ESI,0x30(%RSP) |
0x233c52 MOV $0x22,%EDX |
0x233c57 PUSH $0x1 |
0x233c59 PUSH $0x1 |
0x233c5b PUSH %RAX |
0x233c5c CALL 25f740 <@plt_start@+0x530> |
0x233c61 ADD $0x20,%RSP |
0x233c65 MOV 0x20(%RSP),%RAX |
0x233c6a MOV 0x58(%RSP),%RCX |
0x233c6f CMP %R14,%RAX |
0x233c72 CMOVL %RAX,%R14 |
0x233c76 MOV %R14,0x20(%RSP) |
0x233c7b CMP %R14,%RCX |
0x233c7e JG 2344f1 |
0x233c84 MOV 0x18(%RBP),%RDI |
0x233c88 MOV 0x10(%RBP),%R10 |
0x233c8c MOV 0x20(%RBP),%RSI |
0x233c90 MOV 0x30(%RBP),%RAX |
0x233c94 MOV 0x28(%RBP),%RDX |
0x233c98 MOV %R12,0x18(%RSP) |
0x233c9d MOV %RBX,0x38(%RSP) |
0x233ca2 MOV (%RDI),%R8 |
0x233ca5 MOV 0x10(%RDI),%R9 |
0x233ca9 MOV 0x10(%R10),%RDI |
0x233cad MOV (%RSI),%R12 |
0x233cb0 MOV 0x10(%RSI),%R11 |
0x233cb4 MOV (%RDX),%RSI |
0x233cb7 MOV %R8,0x30(%RSP) |
0x233cbc MOV 0x10(%RDX),%R8 |
0x233cc0 MOV (%R10),%RDX |
0x233cc3 MOV %RDI,0x50(%RSP) |
0x233cc8 MOV (%RAX),%R10 |
0x233ccb MOV 0x10(%RAX),%RDI |
0x233ccf MOV %R14,%RAX |
0x233cd2 SUB %RCX,%RAX |
0x233cd5 MOV %R12,0xa0(%RSP) |
0x233cdd MOV %RSI,0x98(%RSP) |
0x233ce5 INC %RAX |
0x233ce8 MOV %RDX,0x90(%RSP) |
0x233cf0 MOV %R10,0x88(%RSP) |
0x233cf8 MOV %RDI,0x48(%RSP) |
0x233cfd CMP $0x8,%RAX |
0x233d01 JAE 233d0d |
0x233d03 MOV 0x18(%RSP),%R12 |
0x233d08 JMP 234410 |
0x233d0d MOV %R14,0x60(%RSP) |
0x233d12 MOV %R15,%R14 |
0x233d15 MOV %RAX,%R15 |
0x233d18 MOV %RAX,0x70(%RSP) |
0x233d1d MOV 0x18(%RSP),%RAX |
0x233d22 VPBROADCASTQ %RCX,%ZMM0 |
0x233d28 VPADDQ -0x221f2(%RIP),%ZMM0,%ZMM0 |
0x233d32 VPBROADCASTQ -0x22534(%RIP),%ZMM13 |
0x233d3c MOV 0x30(%RSP),%RDI |
0x233d41 VPBROADCASTD %EBX,%YMM2 |
0x233d47 AND $-0x8,%R15 |
0x233d4b VPBROADCASTD %R14D,%YMM5 |
0x233d51 VPBROADCASTQ %R12,%ZMM6 |
0x233d57 VPBROADCASTD %R13D,%YMM7 |
0x233d5d VPBROADCASTQ %RSI,%ZMM8 |
0x233d63 VPBROADCASTQ %RDX,%ZMM9 |
0x233d69 VPBROADCASTQ %R10,%ZMM10 |
0x233d6f MOV %R14,0x80(%RSP) |
0x233d77 MOV %R13,0x78(%RSP) |
0x233d7c VMOVDQA %YMM2,0x120(%RSP) |
0x233d85 ADD %R15,%RCX |
0x233d88 MOV %R15,0x68(%RSP) |
0x233d8d VPBROADCASTQ %RAX,%ZMM1 |
0x233d93 MOV 0x40(%RSP),%RAX |
0x233d98 VEXTRACTI32X4 $0x3,%ZMM1,%XMM11 |
0x233d9f VEXTRACTI32X4 $0x2,%ZMM1,%XMM12 |
0x233da6 VPBROADCASTD %EAX,%YMM2 |
0x233dac MOV %R15,%RAX |
0x233daf VMOVDQA %YMM2,0x100(%RSP) |
0x233db8 VPBROADCASTQ %RDI,%ZMM2 |
0x233dbe VMOVDQA64 %ZMM2,0x140(%RSP) |
0x233dc6 NOPW %CS:(%RAX,%RAX,1) |
(260) 0x233dd0 VEXTRACTI32X4 $0x3,%ZMM0,%XMM14 |
(260) 0x233dd7 MOV %RAX,0xf0(%RSP) |
(260) 0x233ddf VPEXTRQ $0x1,%XMM11,%RSI |
(260) 0x233de5 VMOVQ %XMM11,%RDI |
(260) 0x233dea VPEXTRQ $0x1,%XMM12,%R10 |
(260) 0x233df0 VEXTRACTI32X4 $0x1,%YMM1,%XMM18 |
(260) 0x233df7 KXNORW %K0,%K0,%K1 |
(260) 0x233dfb VPEXTRQ $0x1,%XMM14,%RAX |
(260) 0x233e01 CQTO |
(260) 0x233e03 IDIV %RSI |
(260) 0x233e06 MOV %RAX,%RSI |
(260) 0x233e09 VMOVQ %XMM14,%RAX |
(260) 0x233e0e VEXTRACTI32X4 $0x2,%ZMM0,%XMM14 |
(260) 0x233e15 VMOVQ %RSI,%XMM15 |
(260) 0x233e1a VMOVQ %XMM12,%RSI |
(260) 0x233e1f CQTO |
(260) 0x233e21 IDIV %RDI |
(260) 0x233e24 MOV %RAX,%RDI |
(260) 0x233e27 VPEXTRQ $0x1,%XMM14,%RAX |
(260) 0x233e2d VMOVQ %RDI,%XMM16 |
(260) 0x233e33 VMOVQ %XMM18,%RDI |
(260) 0x233e39 CQTO |
(260) 0x233e3b VPUNPCKLQDQ %XMM15,%XMM16,%XMM15 |
(260) 0x233e41 IDIV %R10 |
(260) 0x233e44 VMOVQ %RAX,%XMM16 |
(260) 0x233e4a VMOVQ %XMM14,%RAX |
(260) 0x233e4f VEXTRACTI128 $0x1,%YMM0,%XMM14 |
(260) 0x233e55 CQTO |
(260) 0x233e57 IDIV %RSI |
(260) 0x233e5a VPEXTRQ $0x1,%XMM18,%RSI |
(260) 0x233e61 VMOVQ %RAX,%XMM17 |
(260) 0x233e67 VPEXTRQ $0x1,%XMM14,%RAX |
(260) 0x233e6d CQTO |
(260) 0x233e6f IDIV %RSI |
(260) 0x233e72 MOV %RAX,%RSI |
(260) 0x233e75 VMOVQ %XMM14,%RAX |
(260) 0x233e7a VPUNPCKLQDQ %XMM16,%XMM17,%XMM14 |
(260) 0x233e80 CQTO |
(260) 0x233e82 VINSERTI128 $0x1,%XMM15,%YMM14,%YMM14 |
(260) 0x233e88 VMOVQ %RSI,%XMM15 |
(260) 0x233e8d VPEXTRQ $0x1,%XMM1,%RSI |
(260) 0x233e93 IDIV %RDI |
(260) 0x233e96 VPEXTRQ $0x1,%XMM0,%RDX |
(260) 0x233e9c VMOVQ %XMM1,%RDI |
(260) 0x233ea1 VMOVQ %RAX,%XMM16 |
(260) 0x233ea7 MOV %RDX,%RAX |
(260) 0x233eaa CQTO |
(260) 0x233eac IDIV %RSI |
(260) 0x233eaf VPUNPCKLQDQ %XMM15,%XMM16,%XMM15 |
(260) 0x233eb5 MOV %RAX,%RSI |
(260) 0x233eb8 VMOVQ %XMM0,%RAX |
(260) 0x233ebd VMOVQ %RSI,%XMM16 |
(260) 0x233ec3 CQTO |
(260) 0x233ec5 IDIV %RDI |
(260) 0x233ec8 VMOVQ %RAX,%XMM17 |
(260) 0x233ece VPUNPCKLQDQ %XMM16,%XMM17,%XMM16 |
(260) 0x233ed4 VINSERTI32X4 $0x1,%XMM15,%YMM16,%YMM15 |
(260) 0x233edb VINSERTI64X4 $0x1,%YMM14,%ZMM15,%ZMM14 |
(260) 0x233ee2 VPMOVQD %ZMM14,%YMM16 |
(260) 0x233ee8 VPADDD 0x120(%RSP),%YMM16,%YMM15 |
(260) 0x233ef0 VPMULLQ %ZMM1,%ZMM14,%ZMM14 |
(260) 0x233ef6 VPSUBQ %ZMM14,%ZMM0,%ZMM14 |
(260) 0x233efc VPADDQ %ZMM13,%ZMM0,%ZMM0 |
(260) 0x233f02 VPMOVQD %ZMM14,%YMM17 |
(260) 0x233f08 VPADDD 0x100(%RSP),%YMM17,%YMM14 |
(260) 0x233f10 VPADDD %YMM16,%YMM5,%YMM16 |
(260) 0x233f16 VPMOVSXDQ %YMM16,%ZMM16 |
(260) 0x233f1c VPMOVSXDQ %YMM15,%ZMM15 |
(260) 0x233f22 VPMULLQ 0x140(%RSP),%ZMM15,%ZMM18 |
(260) 0x233f2a VPADDD %YMM17,%YMM7,%YMM17 |
(260) 0x233f30 VPMULLQ %ZMM16,%ZMM6,%ZMM16 |
(260) 0x233f36 VPMOVSXDQ %YMM17,%ZMM17 |
(260) 0x233f3c VPMOVSXDQ %YMM14,%ZMM14 |
(260) 0x233f42 VPMULLQ %ZMM15,%ZMM6,%ZMM28 |
(260) 0x233f48 VPADDQ %ZMM14,%ZMM18,%ZMM18 |
(260) 0x233f4e VEXTRACTI32X4 $0x1,%YMM18,%XMM19 |
(260) 0x233f55 VEXTRACTI32X4 $0x2,%ZMM18,%XMM2 |
(260) 0x233f5c VMOVQ %XMM18,%RSI |
(260) 0x233f62 VPEXTRQ $0x1,%XMM18,%RDX |
(260) 0x233f69 VEXTRACTI32X4 $0x3,%ZMM18,%XMM18 |
(260) 0x233f70 VMOVQ %XMM18,%RBX |
(260) 0x233f76 VPEXTRQ $0x1,%XMM18,%RAX |
(260) 0x233f7d VPEXTRQ $0x1,%XMM2,0xb8(%RSP) |
(260) 0x233f88 VMOVQ %XMM19,%RDI |
(260) 0x233f8e VPEXTRQ $0x1,%XMM19,0xc8(%RSP) |
(260) 0x233f97 VPADDQ %ZMM14,%ZMM16,%ZMM19 |
(260) 0x233f9d VMOVQ %XMM2,%R10 |
(260) 0x233fa2 VMOVSD (%R9,%RSI,8),%XMM18 |
(260) 0x233fa9 VMOVSD (%R9,%RBX,8),%XMM21 |
(260) 0x233fb0 VEXTRACTI32X4 $0x1,%YMM19,%XMM16 |
(260) 0x233fb7 VMOVSD (%R9,%RDI,8),%XMM25 |
(260) 0x233fbe VMOVSD (%R9,%R10,8),%XMM22 |
(260) 0x233fc5 VMOVQ %XMM19,%RBX |
(260) 0x233fcb VEXTRACTI32X4 $0x3,%ZMM19,%XMM2 |
(260) 0x233fd2 VPEXTRQ $0x1,%XMM19,%RSI |
(260) 0x233fd9 VMOVHPD (%R9,%RAX,8),%XMM21,%XMM21 |
(260) 0x233fe0 MOV 0xb8(%RSP),%RAX |
(260) 0x233fe8 VMOVQ %XMM16,%RDI |
(260) 0x233fee VPEXTRQ $0x1,%XMM16,%R15 |
(260) 0x233ff5 VEXTRACTI32X4 $0x2,%ZMM19,%XMM16 |
(260) 0x233ffc VMOVSD (%R11,%RBX,8),%XMM27 |
(260) 0x234003 MOV %RBX,0xd0(%RSP) |
(260) 0x23400b VPEXTRQ $0x1,%XMM2,%R13 |
(260) 0x234011 MOV %RSI,0xc0(%RSP) |
(260) 0x234019 VMOVQ %XMM16,%R10 |
(260) 0x23401f VPEXTRQ $0x1,%XMM16,%R12 |
(260) 0x234026 VMOVHPD (%R9,%RDX,8),%XMM18,%XMM16 |
(260) 0x23402d VPADDQ %ZMM14,%ZMM28,%ZMM18 |
(260) 0x234033 VPMULLQ %ZMM15,%ZMM8,%ZMM28 |
(260) 0x234039 VMOVQ %XMM2,%RDX |
(260) 0x23403e VMOVSD (%R11,%RDI,8),%XMM19 |
(260) 0x234045 VMOVHPD (%R11,%RSI,8),%XMM27,%XMM27 |
(260) 0x23404c MOV %RDI,0xd8(%RSP) |
(260) 0x234054 MOV %R15,%RDI |
(260) 0x234057 MOV %R13,0xb0(%RSP) |
(260) 0x23405f VEXTRACTI32X4 $0x2,%ZMM18,%XMM23 |
(260) 0x234066 VMOVSD (%R11,%R10,8),%XMM24 |
(260) 0x23406d MOV %R10,0xe0(%RSP) |
(260) 0x234075 VMOVHPD (%R11,%R15,8),%XMM19,%XMM19 |
(260) 0x23407c VMOVSD (%R11,%RDX,8),%XMM26 |
(260) 0x234083 MOV %RDX,0xe8(%RSP) |
(260) 0x23408b VEXTRACTI32X4 $0x1,%YMM18,%XMM20 |
(260) 0x234092 VMOVQ %XMM18,%R15 |
(260) 0x234098 MOV %R12,0xa8(%RSP) |
(260) 0x2340a0 VMOVQ %XMM23,%RBX |
(260) 0x2340a6 VPEXTRQ $0x1,%XMM23,%R10 |
(260) 0x2340ad VMOVHPD (%R11,%R13,8),%XMM26,%XMM26 |
(260) 0x2340b4 VMOVHPD (%R11,%R12,8),%XMM24,%XMM24 |
(260) 0x2340bb VMOVQ %XMM20,%R14 |
(260) 0x2340c1 VPEXTRQ $0x1,%XMM20,%RSI |
(260) 0x2340c8 VPEXTRQ $0x1,%XMM18,%R12 |
(260) 0x2340cf MOV 0x50(%RSP),%R13 |
(260) 0x2340d4 VPADDQ %ZMM17,%ZMM28,%ZMM17 |
(260) 0x2340da VPADDQ %ZMM14,%ZMM28,%ZMM28 |
(260) 0x2340e0 VMOVHPD (%R9,%RAX,8),%XMM22,%XMM23 |
(260) 0x2340e7 MOV 0xc8(%RSP),%RAX |
(260) 0x2340ef VEXTRACTI32X4 $0x3,%ZMM17,%XMM31 |
(260) 0x2340f6 VEXTRACTI32X4 $0x2,%ZMM17,%XMM30 |
(260) 0x2340fd VEXTRACTI32X4 $0x1,%YMM17,%XMM29 |
(260) 0x234104 VMOVQ %XMM17,%RDX |
(260) 0x23410a VEXTRACTI32X4 $0x3,%ZMM28,%XMM4 |
(260) 0x234111 VEXTRACTI32X4 $0x3,%ZMM18,%XMM22 |
(260) 0x234118 VMOVHPD (%R9,%RAX,8),%XMM25,%XMM25 |
(260) 0x23411f VMOVQ %XMM31,%RAX |
(260) 0x234125 VINSERTF32X4 $0x1,%XMM19,%YMM27,%YMM19 |
(260) 0x23412c VMOVSD (%R11,%R14,8),%XMM27 |
(260) 0x234133 VMOVSD (%R8,%RAX,8),%XMM2 |
(260) 0x234139 VPEXTRQ $0x1,%XMM31,%RAX |
(260) 0x234140 VINSERTF32X4 $0x1,%XMM26,%YMM24,%YMM24 |
(260) 0x234147 VMOVSD (%R11,%RBX,8),%XMM26 |
(260) 0x23414e VMOVHPD (%R11,%RSI,8),%XMM27,%XMM20 |
(260) 0x234155 VMOVSD (%R11,%R15,8),%XMM27 |
(260) 0x23415c VMOVHPD (%R8,%RAX,8),%XMM2,%XMM2 |
(260) 0x234162 VMOVQ %XMM30,%RAX |
(260) 0x234168 VMOVHPD (%R11,%R12,8),%XMM27,%XMM18 |
(260) 0x23416f VMOVHPD (%R11,%R10,8),%XMM26,%XMM26 |
(260) 0x234176 VMOVSD (%R8,%RAX,8),%XMM31 |
(260) 0x23417d VMOVQ %XMM29,%RAX |
(260) 0x234183 VINSERTF32X4 $0x1,%XMM21,%YMM23,%YMM21 |
(260) 0x23418a VINSERTF64X4 $0x1,%YMM24,%ZMM19,%ZMM19 |
(260) 0x234191 VMOVSD (%R8,%RAX,8),%XMM3 |
(260) 0x234197 VPEXTRQ $0x1,%XMM30,%RAX |
(260) 0x23419e VMOVHPD (%R8,%RAX,8),%XMM31,%XMM30 |
(260) 0x2341a5 VPEXTRQ $0x1,%XMM17,%RAX |
(260) 0x2341ac VMOVSD (%R8,%RDX,8),%XMM17 |
(260) 0x2341b3 VPEXTRQ $0x1,%XMM29,%RDX |
(260) 0x2341ba VEXTRACTI32X4 $0x2,%ZMM28,%XMM31 |
(260) 0x2341c1 VEXTRACTI32X4 $0x1,%YMM28,%XMM29 |
(260) 0x2341c8 VMOVHPD (%R8,%RAX,8),%XMM17,%XMM17 |
(260) 0x2341cf VMOVQ %XMM4,%RAX |
(260) 0x2341d4 VMOVHPD (%R8,%RDX,8),%XMM3,%XMM3 |
(260) 0x2341da VPEXTRQ $0x1,%XMM4,%RDX |
(260) 0x2341e0 VMOVSD (%R8,%RAX,8),%XMM4 |
(260) 0x2341e6 VMOVQ %XMM31,%RAX |
(260) 0x2341ec VMOVHPD (%R8,%RDX,8),%XMM4,%XMM4 |
(260) 0x2341f2 VPEXTRQ $0x1,%XMM31,%RDX |
(260) 0x2341f9 VMOVSD (%R8,%RAX,8),%XMM31 |
(260) 0x234200 VMOVQ %XMM29,%RAX |
(260) 0x234206 VINSERTF32X4 $0x1,%XMM25,%YMM16,%YMM16 |
(260) 0x23420d VMOVHPD (%R8,%RDX,8),%XMM31,%XMM31 |
(260) 0x234214 VPEXTRQ $0x1,%XMM29,%RDX |
(260) 0x23421b VMOVSD (%R8,%RAX,8),%XMM29 |
(260) 0x234222 VMOVQ %XMM28,%RAX |
(260) 0x234228 VMOVHPD (%R8,%RDX,8),%XMM29,%XMM29 |
(260) 0x23422f VMOVSD (%R8,%RAX,8),%XMM23 |
(260) 0x234236 VPEXTRQ $0x1,%XMM28,%RDX |
(260) 0x23423d VMOVQ %XMM22,%RAX |
(260) 0x234243 VINSERTF32X4 $0x1,%XMM20,%YMM18,%YMM18 |
(260) 0x23424a VMOVHPD (%R8,%RDX,8),%XMM23,%XMM23 |
(260) 0x234251 VPEXTRQ $0x1,%XMM22,%RDX |
(260) 0x234258 VMOVSD (%R11,%RAX,8),%XMM22 |
(260) 0x23425f VMOVHPD (%R11,%RDX,8),%XMM22,%XMM22 |
(260) 0x234266 VINSERTF32X4 $0x1,%XMM2,%YMM30,%YMM2 |
(260) 0x23426d VINSERTF32X4 $0x1,%XMM3,%YMM17,%YMM3 |
(260) 0x234274 VINSERTF64X4 $0x1,%YMM2,%ZMM3,%ZMM2 |
(260) 0x23427b VINSERTF32X4 $0x1,%XMM4,%YMM31,%YMM3 |
(260) 0x234282 VINSERTF32X4 $0x1,%XMM29,%YMM23,%YMM4 |
(260) 0x234289 VINSERTF32X4 $0x1,%XMM22,%YMM26,%YMM22 |
(260) 0x234290 VINSERTF64X4 $0x1,%YMM3,%ZMM4,%ZMM3 |
(260) 0x234297 VINSERTF64X4 $0x1,%YMM21,%ZMM16,%ZMM4 |
(260) 0x23429e VINSERTF64X4 $0x1,%YMM22,%ZMM18,%ZMM18 |
(260) 0x2342a5 VSUBPD %ZMM18,%ZMM19,%ZMM18 |
(260) 0x2342ab VADDPD %ZMM2,%ZMM18,%ZMM2 |
(260) 0x2342b1 VSUBPD %ZMM3,%ZMM2,%ZMM2 |
(260) 0x2342b7 VPMULLQ %ZMM15,%ZMM9,%ZMM3 |
(260) 0x2342bd VADDPD %ZMM2,%ZMM4,%ZMM2 |
(260) 0x2342c3 VPADDQ %ZMM14,%ZMM3,%ZMM3 |
(260) 0x2342c9 VSCATTERQPD %ZMM2,(%R13,%ZMM3,8){%K1} |
(260) 0x2342d1 KXNORW %K0,%K0,%K1 |
(260) 0x2342d5 MOV 0xe8(%RSP),%R13 |
(260) 0x2342dd VMOVSD (%R11,%RAX,8),%XMM18 |
(260) 0x2342e4 VMOVSD (%R11,%RBX,8),%XMM19 |
(260) 0x2342eb VMOVSD (%R11,%R14,8),%XMM20 |
(260) 0x2342f2 VMOVSD (%R11,%R15,8),%XMM21 |
(260) 0x2342f9 MOV 0xf0(%RSP),%RAX |
(260) 0x234301 VMOVHPD (%R11,%RDX,8),%XMM18,%XMM18 |
(260) 0x234308 VMOVHPD (%R11,%R10,8),%XMM19,%XMM19 |
(260) 0x23430f VMOVHPD (%R11,%RSI,8),%XMM20,%XMM20 |
(260) 0x234316 VMOVHPD (%R11,%R12,8),%XMM21,%XMM21 |
(260) 0x23431d VMOVSD (%R11,%R13,8),%XMM3 |
(260) 0x234323 MOV 0xb0(%RSP),%R13 |
(260) 0x23432b ADD $-0x8,%RAX |
(260) 0x23432f VMOVHPD (%R11,%R13,8),%XMM3,%XMM3 |
(260) 0x234335 MOV 0xe0(%RSP),%R13 |
(260) 0x23433d VMOVSD (%R11,%R13,8),%XMM4 |
(260) 0x234343 MOV 0xa8(%RSP),%R13 |
(260) 0x23434b VMOVHPD (%R11,%R13,8),%XMM4,%XMM4 |
(260) 0x234351 MOV 0xd8(%RSP),%R13 |
(260) 0x234359 VMOVSD (%R11,%R13,8),%XMM16 |
(260) 0x234360 VMOVHPD (%R11,%RDI,8),%XMM16,%XMM16 |
(260) 0x234367 MOV 0xd0(%RSP),%RDI |
(260) 0x23436f VINSERTF128 $0x1,%XMM3,%YMM4,%YMM3 |
(260) 0x234375 VMOVSD (%R11,%RDI,8),%XMM17 |
(260) 0x23437c MOV 0xc0(%RSP),%RDI |
(260) 0x234384 VMOVHPD (%R11,%RDI,8),%XMM17,%XMM17 |
(260) 0x23438b MOV 0x48(%RSP),%RDI |
(260) 0x234390 VINSERTF32X4 $0x1,%XMM16,%YMM17,%YMM4 |
(260) 0x234397 VINSERTF32X4 $0x1,%XMM18,%YMM19,%YMM17 |
(260) 0x23439e VINSERTF32X4 $0x1,%XMM20,%YMM21,%YMM16 |
(260) 0x2343a5 VINSERTF64X4 $0x1,%YMM3,%ZMM4,%ZMM3 |
(260) 0x2343ac VINSERTF64X4 $0x1,%YMM17,%ZMM16,%ZMM4 |
(260) 0x2343b3 VSUBPD %ZMM4,%ZMM3,%ZMM3 |
(260) 0x2343b9 VPMULLQ %ZMM15,%ZMM10,%ZMM4 |
(260) 0x2343bf VSUBPD %ZMM3,%ZMM2,%ZMM2 |
(260) 0x2343c5 VPADDQ %ZMM14,%ZMM4,%ZMM3 |
(260) 0x2343cb VSCATTERQPD %ZMM2,(%RDI,%ZMM3,8){%K1} |
(260) 0x2343d2 JNE 233dd0 |
0x2343d8 MOV 0x68(%RSP),%RAX |
0x2343dd MOV 0x80(%RSP),%R15 |
0x2343e5 MOV 0x78(%RSP),%R13 |
0x2343ea MOV 0x18(%RSP),%R12 |
0x2343ef MOV 0x38(%RSP),%RBX |
0x2343f4 MOV 0x60(%RSP),%R14 |
0x2343f9 CMP %RAX,0x70(%RSP) |
0x2343fe JE 2344f1 |
0x234404 NOPW %CS:(%RAX,%RAX,1) |
(261) 0x234410 MOV %RCX,%RAX |
(261) 0x234413 CQTO |
(261) 0x234415 IDIV %R12 |
(261) 0x234418 MOV 0xa0(%RSP),%R10 |
(261) 0x234420 MOV 0x40(%RSP),%RSI |
(261) 0x234425 MOV %R13,%R12 |
(261) 0x234428 ADD %EDX,%ESI |
(261) 0x23442a ADD %R13D,%EDX |
(261) 0x23442d MOV %R14,%R13 |
(261) 0x234430 MOV %R15,%R14 |
(261) 0x234433 MOVSXD %ESI,%RSI |
(261) 0x234436 MOVSXD %EDX,%RDX |
(261) 0x234439 LEA (%RBX,%RAX,1),%EDI |
(261) 0x23443c ADD %R15D,%EAX |
(261) 0x23443f MOV 0x98(%RSP),%RBX |
(261) 0x234447 MOV 0x50(%RSP),%R15 |
(261) 0x23444c CLTQ |
(261) 0x23444e MOVSXD %EDI,%RDI |
(261) 0x234451 IMUL %R10,%RAX |
(261) 0x234455 IMUL %RDI,%R10 |
(261) 0x234459 ADD %RSI,%RAX |
(261) 0x23445c IMUL %RDI,%RBX |
(261) 0x234460 ADD %RSI,%R10 |
(261) 0x234463 VMOVSD (%R11,%RAX,8),%XMM0 |
(261) 0x234469 VSUBSD (%R11,%R10,8),%XMM0,%XMM0 |
(261) 0x23446f ADD %RBX,%RDX |
(261) 0x234472 ADD %RSI,%RBX |
(261) 0x234475 VADDSD (%R8,%RDX,8),%XMM0,%XMM0 |
(261) 0x23447b MOV 0x30(%RSP),%RDX |
(261) 0x234480 VSUBSD (%R8,%RBX,8),%XMM0,%XMM0 |
(261) 0x234486 MOV 0x38(%RSP),%RBX |
(261) 0x23448b IMUL %RDI,%RDX |
(261) 0x23448f ADD %RSI,%RDX |
(261) 0x234492 VADDSD (%R9,%RDX,8),%XMM0,%XMM0 |
(261) 0x234498 MOV 0x90(%RSP),%RDX |
(261) 0x2344a0 IMUL %RDI,%RDX |
(261) 0x2344a4 ADD %RSI,%RDX |
(261) 0x2344a7 VMOVSD %XMM0,(%R15,%RDX,8) |
(261) 0x2344ad MOV %R14,%R15 |
(261) 0x2344b0 MOV %R13,%R14 |
(261) 0x2344b3 MOV %R12,%R13 |
(261) 0x2344b6 MOV 0x18(%RSP),%R12 |
(261) 0x2344bb VMOVSD (%R11,%RAX,8),%XMM1 |
(261) 0x2344c1 MOV 0x48(%RSP),%RAX |
(261) 0x2344c6 VSUBSD (%R11,%R10,8),%XMM1,%XMM1 |
(261) 0x2344cc MOV 0x88(%RSP),%R10 |
(261) 0x2344d4 IMUL %R10,%RDI |
(261) 0x2344d8 ADD %RSI,%RDI |
(261) 0x2344db VSUBSD %XMM1,%XMM0,%XMM0 |
(261) 0x2344df VMOVSD %XMM0,(%RAX,%RDI,8) |
(261) 0x2344e4 CMP %R14,%RCX |
(261) 0x2344e7 LEA 0x1(%RCX),%RCX |
(261) 0x2344eb JL 234410 |
0x2344f1 MOV 0x28(%RSP),%ESI |
0x2344f5 LEA 0x2c604(%RIP),%RDI |
0x2344fc VZEROUPPER |
0x2344ff CALL 25f750 <@plt_start@+0x540> |
0x234504 LEA -0x28(%RBP),%RSP |
0x234508 POP %RBX |
0x234509 POP %R12 |
0x23450b POP %R13 |
0x23450d POP %R14 |
0x23450f POP %R15 |
0x234511 POP %RBP |
0x234512 RET |
0x234513 NOPW %CS:(%RAX,%RAX,1) |
0x23967a NOPW (%RAX,%RAX,1) |
0x23df36 NOPW %CS:(%RAX,%RAX,1) |
0x2443be INT $0x3 |
0x2443bf INT $0x3 |
0x2471b3 NOPW %CS:(%RAX,%RAX,1) |
0x24cbad NOPL (%RAX) |
0x2524fd NOPL (%RAX) |
0x25258b NOPL (%RAX,%RAX,1) |
0x2525a1 NOPW %CS:(%RAX,%RAX,1) |
0x252716 NOPW %CS:(%RAX,%RAX,1) |
Path / |
Source file and lines | advec_cell.cpp:136-140 |
Module | exec |
nb instructions | 146 |
nb uops | 147 |
loop length | 714 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 3 |
used zmm registers | 8 |
nb stack references | 30 |
micro-operation queue | 24.50 cycles |
front end | 24.50 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 9.00 | 9.00 | 8.75 | 8.75 | 4.50 | 20.67 | 20.67 | 20.67 | 0.50 | 10.00 | 10.00 | 0.50 | 2.00 | 2.00 |
cycles | 9.00 | 9.00 | 8.75 | 8.75 | 4.50 | 21.00 | 21.00 | 21.00 | 0.50 | 10.00 | 10.00 | 0.50 | 2.00 | 2.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 24.50 |
Dispatch | 21.00 |
Overall L1 | 24.50 |
all | 11% |
load | 10% |
store | 12% |
mul | 0% |
add-sub | 16% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 13% |
all | 15% |
load | 20% |
store | 18% |
mul | 12% |
add-sub | 22% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
AND $-0x40,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB $0x1c0,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%RCX),%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RDX),%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD $0x4,%R14D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP %R15D,%R14D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JL 234504 <.omp_outlined..8+0x954> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV (%R9),%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R8),%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD $0x4,%R12D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP %R13D,%R12D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JL 234504 <.omp_outlined..8+0x954> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
LEA -0x1(%R13),%EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x1(%R15),%EBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVQ $0,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVQ $0x1,0xf8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVL $0,0x2c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB %EAX,%R12D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB %EBX,%R14D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
IMUL %R12,%R14 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
DEC %R14 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R14,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x34(%RSP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x100(%RSP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x2cea4(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x60(%RSP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x28(%RSP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %ESI,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CALL 25f740 <@plt_start@+0x530> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV 0x20(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x58(%RSP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %R14,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVL %RAX,%R14 | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R14,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CMP %R14,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JG 2344f1 <.omp_outlined..8+0x941> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV 0x18(%RBP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RBP),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x20(%RBP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x30(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x28(%RBP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R12,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RBX,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RDI),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RDI),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%R10),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RSI),%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RSI),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RDX),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R8,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%RDX),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R10),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDI,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RAX),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RAX),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SUB %RCX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R12,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RSI,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
INC %RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDX,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R10,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDI,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CMP $0x8,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JAE 233d0d <.omp_outlined..8+0x15d> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV 0x18(%RSP),%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
JMP 234410 <.omp_outlined..8+0x860> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
MOV %R14,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R15,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x18(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VPBROADCASTQ %RCX,%ZMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
VPADDQ -0x221f2(%RIP),%ZMM0,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 1 |
VPBROADCASTQ -0x22534(%RIP),%ZMM13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 5 | 0.50 |
MOV 0x30(%RSP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VPBROADCASTD %EBX,%YMM2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
AND $-0x8,%R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
VPBROADCASTD %R14D,%YMM5 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTQ %R12,%ZMM6 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTD %R13D,%YMM7 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTQ %RSI,%ZMM8 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTQ %RDX,%ZMM9 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTQ %R10,%ZMM10 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
MOV %R14,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R13,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVDQA %YMM2,0x120(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
ADD %R15,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R15,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VPBROADCASTQ %RAX,%ZMM1 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
MOV 0x40(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VEXTRACTI32X4 $0x3,%ZMM1,%XMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 4 | 1 |
VEXTRACTI32X4 $0x2,%ZMM1,%XMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 4 | 1 |
VPBROADCASTD %EAX,%YMM2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDQA %YMM2,0x100(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VPBROADCASTQ %RDI,%ZMM2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
VMOVDQA64 %ZMM2,0x140(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 1 | 1 | 4 | 2 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOV 0x68(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x80(%RSP),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x78(%RSP),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x18(%RSP),%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x38(%RSP),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x60(%RSP),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %RAX,0x70(%RSP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
JE 2344f1 <.omp_outlined..8+0x941> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOV 0x28(%RSP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
LEA 0x2c604(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 25f750 <@plt_start@+0x540> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x28(%RBP),%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
Source file and lines | advec_cell.cpp:136-140 |
Module | exec |
nb instructions | 146 |
nb uops | 147 |
loop length | 714 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 3 |
used zmm registers | 8 |
nb stack references | 30 |
micro-operation queue | 24.50 cycles |
front end | 24.50 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 9.00 | 9.00 | 8.75 | 8.75 | 4.50 | 20.67 | 20.67 | 20.67 | 0.50 | 10.00 | 10.00 | 0.50 | 2.00 | 2.00 |
cycles | 9.00 | 9.00 | 8.75 | 8.75 | 4.50 | 21.00 | 21.00 | 21.00 | 0.50 | 10.00 | 10.00 | 0.50 | 2.00 | 2.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 24.50 |
Dispatch | 21.00 |
Overall L1 | 24.50 |
all | 11% |
load | 10% |
store | 12% |
mul | 0% |
add-sub | 16% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 13% |
all | 15% |
load | 20% |
store | 18% |
mul | 12% |
add-sub | 22% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
AND $-0x40,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB $0x1c0,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%RCX),%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RDX),%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD $0x4,%R14D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP %R15D,%R14D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JL 234504 <.omp_outlined..8+0x954> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV (%R9),%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R8),%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD $0x4,%R12D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP %R13D,%R12D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JL 234504 <.omp_outlined..8+0x954> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
LEA -0x1(%R13),%EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x1(%R15),%EBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVQ $0,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVQ $0x1,0xf8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVL $0,0x2c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB %EAX,%R12D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB %EBX,%R14D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
IMUL %R12,%R14 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
DEC %R14 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R14,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x34(%RSP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x100(%RSP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x2cea4(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x60(%RSP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x28(%RSP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %ESI,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CALL 25f740 <@plt_start@+0x530> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV 0x20(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x58(%RSP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %R14,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVL %RAX,%R14 | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R14,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CMP %R14,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JG 2344f1 <.omp_outlined..8+0x941> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV 0x18(%RBP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RBP),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x20(%RBP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x30(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x28(%RBP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R12,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RBX,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RDI),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RDI),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%R10),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RSI),%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RSI),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RDX),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R8,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%RDX),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R10),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDI,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RAX),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RAX),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SUB %RCX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R12,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RSI,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
INC %RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDX,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R10,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDI,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CMP $0x8,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JAE 233d0d <.omp_outlined..8+0x15d> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV 0x18(%RSP),%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
JMP 234410 <.omp_outlined..8+0x860> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
MOV %R14,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R15,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x18(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VPBROADCASTQ %RCX,%ZMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
VPADDQ -0x221f2(%RIP),%ZMM0,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 1 |
VPBROADCASTQ -0x22534(%RIP),%ZMM13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 5 | 0.50 |
MOV 0x30(%RSP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VPBROADCASTD %EBX,%YMM2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
AND $-0x8,%R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
VPBROADCASTD %R14D,%YMM5 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTQ %R12,%ZMM6 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTD %R13D,%YMM7 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTQ %RSI,%ZMM8 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTQ %RDX,%ZMM9 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTQ %R10,%ZMM10 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
MOV %R14,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R13,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVDQA %YMM2,0x120(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
ADD %R15,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R15,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VPBROADCASTQ %RAX,%ZMM1 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
MOV 0x40(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VEXTRACTI32X4 $0x3,%ZMM1,%XMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 4 | 1 |
VEXTRACTI32X4 $0x2,%ZMM1,%XMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 4 | 1 |
VPBROADCASTD %EAX,%YMM2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDQA %YMM2,0x100(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VPBROADCASTQ %RDI,%ZMM2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
VMOVDQA64 %ZMM2,0x140(%RSP) | 2 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 1 | 1 | 4 | 2 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOV 0x68(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x80(%RSP),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x78(%RSP),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x18(%RSP),%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x38(%RSP),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x60(%RSP),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %RAX,0x70(%RSP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
JE 2344f1 <.omp_outlined..8+0x941> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOV 0x28(%RSP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
LEA 0x2c604(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 25f750 <@plt_start@+0x540> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x28(%RBP),%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
INT $0x3 | |||||||||||||||||
INT $0x3 | |||||||||||||||||
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼.omp_outlined..8– | 1.46 | 0.75 |
○Loop 260 - advec_cell.cpp:137-140 - exec | 1.46 | 0.75 |
○Loop 261 - advec_cell.cpp:137-140 - exec | 0 | 0 |