Function: .omp_outlined.#0x247e10 | Module: exec | Source: PdV.cpp:48-63 [...] | Coverage: 5.4% |
---|
Function: .omp_outlined.#0x247e10 | Module: exec | Source: PdV.cpp:48-63 [...] | Coverage: 5.4% |
---|
/beegfs/hackathon/users/eoseret/qaas_runs/170-854-8685/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/context.h: 69 - 69 |
-------------------------------------------------------------------------------- |
69: T &operator()(size_t i, size_t j) const { return data[i + j * sizeX]; } |
/beegfs/hackathon/users/eoseret/qaas_runs/170-854-8685/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/PdV.cpp: 48 - 63 |
-------------------------------------------------------------------------------- |
48: #pragma omp parallel for simd collapse(2) |
49: for (int j = (y_min + 1); j < (y_max + 2); j++) { |
50: for (int i = (x_min + 1); i < (x_max + 2); i++) { |
51: double left_flux = (xarea(i, j) * (xvel0(i, j) + xvel0(i + 0, j + 1) + xvel0(i, j) + xvel0(i + 0, j + 1))) * 0.25 * dt * 0.5; |
52: double right_flux = |
53: (xarea(i + 1, j + 0) * (xvel0(i + 1, j + 0) + xvel0(i + 1, j + 1) + xvel0(i + 1, j + 0) + xvel0(i + 1, j + 1))) * 0.25 * dt * |
54: 0.5; |
55: double bottom_flux = (yarea(i, j) * (yvel0(i, j) + yvel0(i + 1, j + 0) + yvel0(i, j) + yvel0(i + 1, j + 0))) * 0.25 * dt * 0.5; |
56: double top_flux = (yarea(i + 0, j + 1) * (yvel0(i + 0, j + 1) + yvel0(i + 1, j + 1) + yvel0(i + 0, j + 1) + yvel0(i + 1, j + 1))) * |
57: 0.25 * dt * 0.5; |
58: double total_flux = right_flux - left_flux + top_flux - bottom_flux; |
59: double volume_change_s = volume(i, j) / (volume(i, j) + total_flux); |
60: double recip_volume = 1.0 / volume(i, j); |
61: double energy_change = (pressure(i, j) / density0(i, j) + viscosity(i, j) / density0(i, j)) * total_flux * recip_volume; |
62: energy1(i, j) = energy0(i, j) - energy_change; |
63: density1(i, j) = density0(i, j) * volume_change_s; |
0x247e10 PUSH %RBP |
0x247e11 MOV %RSP,%RBP |
0x247e14 PUSH %R15 |
0x247e16 PUSH %R14 |
0x247e18 PUSH %R13 |
0x247e1a PUSH %R12 |
0x247e1c PUSH %RBX |
0x247e1d AND $-0x20,%RSP |
0x247e21 SUB $0x1a0,%RSP |
0x247e28 MOV (%RDX),%EAX |
0x247e2a MOV (%RCX),%R14D |
0x247e2d INC %EAX |
0x247e2f ADD $0x2,%R14D |
0x247e33 SUB %EAX,%R14D |
0x247e36 JLE 248b5c |
0x247e3c MOV (%R9),%EBX |
0x247e3f MOV (%R8),%R13D |
0x247e42 INC %R13D |
0x247e45 ADD $0x2,%EBX |
0x247e48 CMP %R13D,%EBX |
0x247e4b JLE 248b5c |
0x247e51 SUB %R13D,%EBX |
0x247e54 MOV (%RDI),%ESI |
0x247e56 MOV %RAX,%R15 |
0x247e59 MOVQ $0,0xa8(%RSP) |
0x247e65 MOVQ $0x1,0xe8(%RSP) |
0x247e71 MOVL $0,0x1c(%RSP) |
0x247e79 IMUL %RBX,%R14 |
0x247e7d DEC %R14 |
0x247e80 MOV %R14,0x10(%RSP) |
0x247e85 SUB $0x8,%RSP |
0x247e89 LEA 0x24(%RSP),%RCX |
0x247e8e LEA 0xf0(%RSP),%RAX |
0x247e96 LEA 0x198a3(%RIP),%RDI |
0x247e9d LEA 0xb0(%RSP),%R8 |
0x247ea5 LEA 0x18(%RSP),%R9 |
0x247eaa MOV %ESI,0x20(%RSP) |
0x247eae MOV $0x22,%EDX |
0x247eb3 PUSH $0x1 |
0x247eb5 PUSH $0x1 |
0x247eb7 PUSH %RAX |
0x247eb8 CALL 25f740 <@plt_start@+0x530> |
0x247ebd ADD $0x20,%RSP |
0x247ec1 MOV 0x10(%RSP),%RAX |
0x247ec6 MOV 0xa8(%RSP),%RCX |
0x247ece CMP %R14,%RAX |
0x247ed1 CMOVL %RAX,%R14 |
0x247ed5 MOV %R14,0x10(%RSP) |
0x247eda CMP %R14,%RCX |
0x247edd JG 248b49 |
0x247ee3 MOV 0x10(%RBP),%R8 |
0x247ee7 MOV 0x28(%RBP),%R9 |
0x247eeb MOV %RBX,0x30(%RSP) |
0x247ef0 MOV 0x18(%RBP),%R10 |
0x247ef4 MOV 0x40(%RBP),%RDX |
0x247ef8 MOV 0x30(%RBP),%RDI |
0x247efc MOV 0x48(%RBP),%RAX |
0x247f00 MOV 0x38(%RBP),%RSI |
0x247f04 MOV %R13D,0x4(%RSP) |
0x247f09 MOV %R14,0xe0(%RSP) |
0x247f11 MOV (%R8),%R11 |
0x247f14 MOV (%R9),%RBX |
0x247f17 MOV (%R10),%R12 |
0x247f1a MOV 0x10(%R8),%R8 |
0x247f1e MOV 0x10(%R10),%R10 |
0x247f22 MOV %R11,0x78(%RSP) |
0x247f27 MOV %RBX,0x68(%RSP) |
0x247f2c MOV 0x10(%R9),%RBX |
0x247f30 MOV (%RDI),%R11 |
0x247f33 MOV 0x10(%RDI),%R9 |
0x247f37 MOV (%RDX),%RDI |
0x247f3a MOV 0x10(%RDX),%RDX |
0x247f3e MOV %R12,0x70(%RSP) |
0x247f43 MOV 0x10(%RAX),%R12 |
0x247f47 MOV %R11,0x60(%RSP) |
0x247f4c MOV (%RSI),%R11 |
0x247f4f MOV 0x10(%RSI),%RSI |
0x247f53 MOV %RDX,0x90(%RSP) |
0x247f5b MOV (%RAX),%RDX |
0x247f5e MOV 0x50(%RBP),%RAX |
0x247f62 MOV %RDI,0x50(%RSP) |
0x247f67 MOV %RSI,0xa0(%RSP) |
0x247f6f MOV %RDX,0x48(%RSP) |
0x247f74 MOV (%RAX),%RDX |
0x247f77 MOV 0x10(%RAX),%RSI |
0x247f7b MOV 0x60(%RBP),%RAX |
0x247f7f MOV %R11,0x58(%RSP) |
0x247f84 MOV %RDX,0x40(%RSP) |
0x247f89 MOV (%RAX),%RDX |
0x247f8c MOV 0x10(%RAX),%RDI |
0x247f90 MOV 0x58(%RBP),%RAX |
0x247f94 MOV %RSI,0x88(%RSP) |
0x247f9c MOV %RDX,0x38(%RSP) |
0x247fa1 MOV (%RAX),%RDX |
0x247fa4 MOV 0x10(%RAX),%R11 |
0x247fa8 MOV 0x68(%RBP),%RAX |
0x247fac MOV %RDI,0xd8(%RSP) |
0x247fb4 MOV %RDX,0x28(%RSP) |
0x247fb9 MOV (%RAX),%RDX |
0x247fbc MOV 0x10(%RAX),%RAX |
0x247fc0 MOV %R11,0x80(%RSP) |
0x247fc8 MOV %RDX,0x20(%RSP) |
0x247fcd MOV %R14,%RDX |
0x247fd0 SUB %RCX,%RDX |
0x247fd3 MOV %RAX,0x98(%RSP) |
0x247fdb INC %RDX |
0x247fde CMP $0x4,%RDX |
0x247fe2 JB 2488ca |
0x247fe8 MOV 0x78(%RSP),%RSI |
0x247fed VPBROADCASTD %R15D,%XMM2 |
0x247ff3 MOV 0x70(%RSP),%R11 |
0x247ff8 VBROADCASTSD -0x367ea(%RIP),%YMM16 |
0x248002 VBROADCASTSD -0x367b4(%RIP),%YMM17 |
0x24800c VBROADCASTSD -0x367f6(%RIP),%YMM19 |
0x248016 VPBROADCASTQ %RCX,%YMM0 |
0x24801c VPADDQ -0x36624(%RIP),%YMM0,%YMM0 |
0x248024 VPBROADCASTQ -0x3686e(%RIP),%YMM20 |
0x24802e MOV 0x30(%RSP),%RAX |
0x248033 MOV %RDX,0xc8(%RSP) |
0x24803b AND $-0x4,%RDX |
0x24803f VMOVDQA %XMM2,0xb0(%RSP) |
0x248048 VPBROADCASTD %R13D,%XMM2 |
0x24804e ADD %RDX,%RCX |
0x248051 MOV %RDX,0xc0(%RSP) |
0x248059 VMOVDQA %XMM2,0xf0(%RSP) |
0x248062 VPBROADCASTQ %RSI,%YMM2 |
0x248068 MOV 0x68(%RSP),%RSI |
0x24806d VPBROADCASTQ %R11,%YMM5 |
0x248073 MOV 0x60(%RSP),%R11 |
0x248078 VPBROADCASTQ %RAX,%YMM1 |
0x24807e VMOVDQA %YMM2,0x160(%RSP) |
0x248087 VEXTRACTI128 $0x1,%YMM1,%XMM15 |
0x24808d VPBROADCASTQ %RSI,%YMM6 |
0x248093 MOV 0x58(%RSP),%RSI |
0x248098 VPBROADCASTQ %R11,%YMM7 |
0x24809e MOV 0x50(%RSP),%R11 |
0x2480a3 VPBROADCASTQ %RSI,%YMM2 |
0x2480a9 MOV 0x48(%RSP),%RSI |
0x2480ae VMOVDQA %YMM2,0x140(%RSP) |
0x2480b7 VPBROADCASTQ %R11,%YMM2 |
0x2480bd MOV 0x40(%RSP),%R11 |
0x2480c2 VMOVDQA %YMM2,0x120(%RSP) |
0x2480cb VPBROADCASTQ %RSI,%YMM2 |
0x2480d1 MOV 0x38(%RSP),%RSI |
0x2480d6 VPBROADCASTQ %R11,%YMM11 |
0x2480dc MOV 0x28(%RSP),%R11 |
0x2480e1 VMOVDQA %YMM2,0x100(%RSP) |
0x2480ea VPCMPEQD %XMM2,%XMM2,%XMM2 |
0x2480ee VPBROADCASTQ %RSI,%YMM12 |
0x2480f4 MOV 0x20(%RSP),%RSI |
0x2480f9 VPBROADCASTQ %R11,%YMM13 |
0x2480ff VPBROADCASTQ %RSI,%YMM14 |
0x248105 NOPW %CS:(%RAX,%RAX,1) |
(153) 0x248110 VEXTRACTI32X4 $0x1,%YMM0,%XMM21 |
(153) 0x248117 MOV %RDX,0x8(%RSP) |
(153) 0x24811c VPEXTRQ $0x1,%XMM15,%RSI |
(153) 0x248122 VMOVQ %XMM1,%R14 |
(153) 0x248127 MOV 0x20(%RBP),%R11 |
(153) 0x24812b VPEXTRQ $0x1,%XMM21,%RAX |
(153) 0x248132 CQTO |
(153) 0x248134 IDIV %RSI |
(153) 0x248137 VMOVQ %XMM21,%RDX |
(153) 0x24813d VMOVQ %XMM15,%RSI |
(153) 0x248142 VMOVQ %RAX,%XMM21 |
(153) 0x248148 MOV %RDX,%RAX |
(153) 0x24814b CQTO |
(153) 0x24814d IDIV %RSI |
(153) 0x248150 VPEXTRQ $0x1,%XMM1,%RSI |
(153) 0x248156 VMOVQ %RAX,%XMM22 |
(153) 0x24815c VPEXTRQ $0x1,%XMM0,%RAX |
(153) 0x248162 CQTO |
(153) 0x248164 VPUNPCKLQDQ %XMM21,%XMM22,%XMM21 |
(153) 0x24816a IDIV %RSI |
(153) 0x24816d MOV %RAX,%RSI |
(153) 0x248170 VMOVQ %XMM0,%RAX |
(153) 0x248175 VMOVQ %RSI,%XMM22 |
(153) 0x24817b CQTO |
(153) 0x24817d IDIV %R14 |
(153) 0x248180 VMOVQ %RAX,%XMM23 |
(153) 0x248186 VPUNPCKLQDQ %XMM22,%XMM23,%XMM22 |
(153) 0x24818c VINSERTI32X4 $0x1,%XMM21,%YMM22,%YMM21 |
(153) 0x248193 VPMOVQD %YMM21,%XMM22 |
(153) 0x248199 VPADDD 0xb0(%RSP),%XMM22,%XMM23 |
(153) 0x2481a1 VPMULLQ %YMM1,%YMM21,%YMM21 |
(153) 0x2481a7 VPSUBQ %YMM21,%YMM0,%YMM21 |
(153) 0x2481ad VPADDQ %YMM20,%YMM0,%YMM0 |
(153) 0x2481b3 VPMOVQD %YMM21,%XMM21 |
(153) 0x2481b9 VPADDD 0xf0(%RSP),%XMM21,%XMM25 |
(153) 0x2481c1 VPMOVSXDQ %XMM23,%YMM22 |
(153) 0x2481c7 VPMULLQ 0x160(%RSP),%YMM22,%YMM28 |
(153) 0x2481cf VPSUBD %XMM2,%XMM23,%XMM23 |
(153) 0x2481d5 VPMULLQ %YMM22,%YMM5,%YMM30 |
(153) 0x2481db VPMOVSXDQ %XMM25,%YMM21 |
(153) 0x2481e1 VPSUBD %XMM2,%XMM25,%XMM25 |
(153) 0x2481e7 VPMOVSXDQ %XMM25,%YMM25 |
(153) 0x2481ed VPADDQ %YMM21,%YMM30,%YMM27 |
(153) 0x2481f3 VPADDQ %YMM25,%YMM30,%YMM30 |
(153) 0x2481f9 VPADDQ %YMM21,%YMM28,%YMM24 |
(153) 0x2481ff VPADDQ %YMM25,%YMM28,%YMM28 |
(153) 0x248205 VPEXTRQ $0x1,%XMM24,%RDX |
(153) 0x24820c VMOVQ %XMM24,%RSI |
(153) 0x248212 VEXTRACTI32X4 $0x1,%YMM24,%XMM24 |
(153) 0x248219 VMOVQ %XMM24,%R14 |
(153) 0x24821f VPEXTRQ $0x1,%XMM24,%RAX |
(153) 0x248226 VMOVSD (%R8,%RSI,8),%XMM24 |
(153) 0x24822d VPEXTRQ $0x1,%XMM27,%RSI |
(153) 0x248234 VMOVHPD (%R8,%RDX,8),%XMM24,%XMM26 |
(153) 0x24823b VEXTRACTI32X4 $0x1,%YMM27,%XMM24 |
(153) 0x248242 VMOVSD (%R8,%R14,8),%XMM29 |
(153) 0x248249 VMOVQ %XMM27,%R14 |
(153) 0x24824f VMOVQ %XMM24,%R13 |
(153) 0x248255 VPEXTRQ $0x1,%XMM24,%RDX |
(153) 0x24825c VPMOVSXDQ %XMM23,%YMM24 |
(153) 0x248262 VMOVHPD (%R8,%RAX,8),%XMM29,%XMM29 |
(153) 0x248269 VMOVSD (%R10,%R14,8),%XMM27 |
(153) 0x248270 VMOVQ %XMM28,%RAX |
(153) 0x248276 VMOVSD (%R10,%R13,8),%XMM31 |
(153) 0x24827d VMOVHPD (%R10,%RSI,8),%XMM27,%XMM27 |
(153) 0x248284 VPMULLQ %YMM24,%YMM5,%YMM18 |
(153) 0x24828a VMOVHPD (%R10,%RDX,8),%XMM31,%XMM31 |
(153) 0x248291 VPEXTRQ $0x1,%XMM28,%RDX |
(153) 0x248298 VEXTRACTI32X4 $0x1,%YMM28,%XMM28 |
(153) 0x24829f VPADDQ %YMM21,%YMM18,%YMM23 |
(153) 0x2482a5 VPADDQ %YMM25,%YMM18,%YMM18 |
(153) 0x2482ab VMOVQ %XMM23,%RSI |
(153) 0x2482b1 VPEXTRQ $0x1,%XMM23,%R14 |
(153) 0x2482b8 VEXTRACTI32X4 $0x1,%YMM23,%XMM23 |
(153) 0x2482bf VMOVQ %XMM23,%R13 |
(153) 0x2482c5 VMOVSD (%R10,%RSI,8),%XMM4 |
(153) 0x2482cb VMOVQ %XMM28,%RSI |
(153) 0x2482d1 VMOVSD (%R10,%R13,8),%XMM3 |
(153) 0x2482d7 VPEXTRQ $0x1,%XMM23,%R13 |
(153) 0x2482de VMOVHPD (%R10,%R14,8),%XMM4,%XMM4 |
(153) 0x2482e4 VINSERTF32X4 $0x1,%XMM29,%YMM26,%YMM26 |
(153) 0x2482eb VPMULLQ %YMM22,%YMM6,%YMM29 |
(153) 0x2482f1 VPEXTRQ $0x1,%XMM28,%R14 |
(153) 0x2482f8 VMOVSD (%R8,%RAX,8),%XMM28 |
(153) 0x2482ff VMOVSD (%R8,%RSI,8),%XMM8 |
(153) 0x248305 VMOVQ %XMM30,%RAX |
(153) 0x24830b VPEXTRQ $0x1,%XMM30,%RSI |
(153) 0x248312 VEXTRACTI32X4 $0x1,%YMM30,%XMM30 |
(153) 0x248319 VBROADCASTSD (%R11),%YMM23 |
(153) 0x24831f VMOVHPD (%R10,%R13,8),%XMM3,%XMM3 |
(153) 0x248325 VMOVHPD (%R8,%RDX,8),%XMM28,%XMM28 |
(153) 0x24832c VMOVQ %XMM30,%RDX |
(153) 0x248332 VMOVSD (%R10,%RAX,8),%XMM9 |
(153) 0x248338 VPEXTRQ $0x1,%XMM30,%R13 |
(153) 0x24833f VMOVQ %XMM18,%RAX |
(153) 0x248345 VMOVHPD (%R8,%R14,8),%XMM8,%XMM8 |
(153) 0x24834b VMOVSD (%R10,%RDX,8),%XMM30 |
(153) 0x248352 VPEXTRQ $0x1,%XMM18,%RDX |
(153) 0x248359 VEXTRACTI32X4 $0x1,%YMM18,%XMM18 |
(153) 0x248360 VMOVSD (%R10,%RAX,8),%XMM10 |
(153) 0x248366 VMOVHPD (%R10,%RSI,8),%XMM9,%XMM9 |
(153) 0x24836c VINSERTF32X4 $0x1,%XMM31,%YMM27,%YMM31 |
(153) 0x248373 VPADDQ %YMM21,%YMM29,%YMM29 |
(153) 0x248379 VMOVQ %XMM18,%RSI |
(153) 0x24837f VPEXTRQ $0x1,%XMM18,%R14 |
(153) 0x248386 VMOVHPD (%R10,%RDX,8),%XMM10,%XMM10 |
(153) 0x24838c VMOVHPD (%R10,%R13,8),%XMM30,%XMM30 |
(153) 0x248393 MOV 0xa0(%RSP),%R13 |
(153) 0x24839b VEXTRACTI32X4 $0x1,%YMM29,%XMM27 |
(153) 0x2483a2 VMOVSD (%R10,%RSI,8),%XMM18 |
(153) 0x2483a9 VMOVQ %XMM29,%RDX |
(153) 0x2483af VPEXTRQ $0x1,%XMM29,%RAX |
(153) 0x2483b6 VMOVQ %XMM27,%RSI |
(153) 0x2483bc VMOVHPD (%R10,%R14,8),%XMM18,%XMM18 |
(153) 0x2483c3 VPEXTRQ $0x1,%XMM27,%R14 |
(153) 0x2483ca VMOVSD (%RBX,%RDX,8),%XMM27 |
(153) 0x2483d1 VMOVHPD (%RBX,%RAX,8),%XMM27,%XMM27 |
(153) 0x2483d8 VINSERTF128 $0x1,%XMM3,%YMM4,%YMM3 |
(153) 0x2483de VMOVSD (%RBX,%RSI,8),%XMM4 |
(153) 0x2483e3 VINSERTF32X4 $0x1,%XMM8,%YMM28,%YMM28 |
(153) 0x2483ea VMOVHPD (%RBX,%R14,8),%XMM4,%XMM4 |
(153) 0x2483f0 VINSERTF32X4 $0x1,%XMM30,%YMM9,%YMM9 |
(153) 0x2483f7 VINSERTF32X4 $0x1,%XMM18,%YMM10,%YMM10 |
(153) 0x2483fe VADDPD %YMM10,%YMM9,%YMM29 |
(153) 0x248404 VINSERTF32X4 $0x1,%XMM4,%YMM27,%YMM27 |
(153) 0x24840b VPMULLQ %YMM22,%YMM7,%YMM4 |
(153) 0x248411 VADDPD %YMM29,%YMM9,%YMM9 |
(153) 0x248417 VPADDQ %YMM21,%YMM4,%YMM8 |
(153) 0x24841d VPADDQ %YMM25,%YMM4,%YMM4 |
(153) 0x248423 VADDPD %YMM9,%YMM10,%YMM9 |
(153) 0x248428 VMOVQ %XMM8,%RAX |
(153) 0x24842d VPEXTRQ $0x1,%XMM8,%RDX |
(153) 0x248433 VEXTRACTI128 $0x1,%YMM8,%XMM8 |
(153) 0x248439 VMOVQ %XMM8,%RSI |
(153) 0x24843e VMOVSD (%R9,%RAX,8),%XMM18 |
(153) 0x248445 VPEXTRQ $0x1,%XMM8,%R14 |
(153) 0x24844b VMOVQ %XMM4,%RAX |
(153) 0x248450 VMOVSD (%R9,%RSI,8),%XMM8 |
(153) 0x248456 VMOVHPD (%R9,%RDX,8),%XMM18,%XMM18 |
(153) 0x24845d VPEXTRQ $0x1,%XMM4,%RDX |
(153) 0x248463 VEXTRACTI128 $0x1,%YMM4,%XMM4 |
(153) 0x248469 VMOVSD (%R9,%RAX,8),%XMM30 |
(153) 0x248470 VMULPD %YMM9,%YMM28,%YMM9 |
(153) 0x248476 VMOVHPD (%R9,%R14,8),%XMM8,%XMM8 |
(153) 0x24847c VMOVQ %XMM4,%RSI |
(153) 0x248481 VPEXTRQ $0x1,%XMM4,%R14 |
(153) 0x248487 VMOVHPD (%R9,%RDX,8),%XMM30,%XMM30 |
(153) 0x24848e VMOVSD (%R9,%RSI,8),%XMM4 |
(153) 0x248494 VMOVHPD (%R9,%R14,8),%XMM4,%XMM4 |
(153) 0x24849a VMULPD %YMM16,%YMM9,%YMM9 |
(153) 0x2484a0 VMULPD %YMM9,%YMM23,%YMM9 |
(153) 0x2484a6 VINSERTF32X4 $0x1,%XMM8,%YMM18,%YMM8 |
(153) 0x2484ad VADDPD %YMM3,%YMM31,%YMM18 |
(153) 0x2484b3 VMULPD %YMM17,%YMM9,%YMM9 |
(153) 0x2484b9 VINSERTF32X4 $0x1,%XMM4,%YMM30,%YMM4 |
(153) 0x2484c0 VADDPD %YMM18,%YMM31,%YMM18 |
(153) 0x2484c6 VPMULLQ %YMM24,%YMM6,%YMM31 |
(153) 0x2484cc VPMULLQ %YMM24,%YMM7,%YMM24 |
(153) 0x2484d2 VADDPD %YMM4,%YMM8,%YMM30 |
(153) 0x2484d8 VPADDQ %YMM21,%YMM31,%YMM31 |
(153) 0x2484de VADDPD %YMM18,%YMM3,%YMM3 |
(153) 0x2484e4 VEXTRACTI32X4 $0x1,%YMM31,%XMM29 |
(153) 0x2484eb VMOVQ %XMM31,%RAX |
(153) 0x2484f1 VADDPD %YMM30,%YMM8,%YMM8 |
(153) 0x2484f7 VPEXTRQ $0x1,%XMM31,%RDX |
(153) 0x2484fe VMOVQ %XMM29,%RSI |
(153) 0x248504 VPEXTRQ $0x1,%XMM29,%R14 |
(153) 0x24850b VMOVSD (%RBX,%RAX,8),%XMM30 |
(153) 0x248512 VMOVSD (%RBX,%RSI,8),%XMM29 |
(153) 0x248519 VMOVHPD (%RBX,%RDX,8),%XMM30,%XMM18 |
(153) 0x248520 VMULPD %YMM3,%YMM26,%YMM3 |
(153) 0x248526 VMOVHPD (%RBX,%R14,8),%XMM29,%XMM29 |
(153) 0x24852d VADDPD %YMM4,%YMM8,%YMM4 |
(153) 0x248531 VMULPD %YMM16,%YMM3,%YMM3 |
(153) 0x248537 VMULPD %YMM4,%YMM27,%YMM4 |
(153) 0x24853d VMULPD %YMM3,%YMM23,%YMM3 |
(153) 0x248543 VMULPD %YMM16,%YMM4,%YMM4 |
(153) 0x248549 VINSERTF32X4 $0x1,%XMM29,%YMM18,%YMM18 |
(153) 0x248550 VPADDQ %YMM21,%YMM24,%YMM29 |
(153) 0x248556 VMULPD %YMM17,%YMM3,%YMM3 |
(153) 0x24855c VEXTRACTI32X4 $0x1,%YMM29,%XMM10 |
(153) 0x248563 VMOVQ %XMM29,%RAX |
(153) 0x248569 VPEXTRQ $0x1,%XMM29,%RDX |
(153) 0x248570 VMULPD %YMM4,%YMM23,%YMM4 |
(153) 0x248576 VMOVQ %XMM10,%R14 |
(153) 0x24857b VPEXTRQ $0x1,%XMM10,%RSI |
(153) 0x248581 VMOVSD (%R9,%RAX,8),%XMM10 |
(153) 0x248587 VMOVSD (%R9,%R14,8),%XMM8 |
(153) 0x24858d VMOVHPD (%R9,%RDX,8),%XMM10,%XMM10 |
(153) 0x248593 VSUBPD %YMM3,%YMM9,%YMM3 |
(153) 0x248597 VMOVHPD (%R9,%RSI,8),%XMM8,%XMM8 |
(153) 0x24859d VMULPD %YMM17,%YMM4,%YMM4 |
(153) 0x2485a3 VINSERTF128 $0x1,%XMM8,%YMM10,%YMM8 |
(153) 0x2485a9 VPADDQ %YMM25,%YMM24,%YMM10 |
(153) 0x2485af VMOVQ %XMM10,%RAX |
(153) 0x2485b4 VPEXTRQ $0x1,%XMM10,%RDX |
(153) 0x2485ba VEXTRACTI128 $0x1,%YMM10,%XMM10 |
(153) 0x2485c0 VMOVQ %XMM10,%RSI |
(153) 0x2485c5 VMOVSD (%R9,%RAX,8),%XMM24 |
(153) 0x2485cc VPEXTRQ $0x1,%XMM10,%R14 |
(153) 0x2485d2 VMOVSD (%R9,%RSI,8),%XMM10 |
(153) 0x2485d8 VMOVHPD (%R9,%RDX,8),%XMM24,%XMM24 |
(153) 0x2485df VMOVHPD (%R9,%R14,8),%XMM10,%XMM10 |
(153) 0x2485e5 VINSERTF32X4 $0x1,%XMM10,%YMM24,%YMM10 |
(153) 0x2485ec VADDPD %YMM10,%YMM8,%YMM24 |
(153) 0x2485f2 VADDPD %YMM24,%YMM8,%YMM8 |
(153) 0x2485f8 VADDPD %YMM8,%YMM10,%YMM8 |
(153) 0x2485fd VPMULLQ 0x140(%RSP),%YMM22,%YMM10 |
(153) 0x248605 VMULPD %YMM8,%YMM18,%YMM8 |
(153) 0x24860b VMULPD %YMM16,%YMM8,%YMM8 |
(153) 0x248611 VMULPD %YMM8,%YMM23,%YMM8 |
(153) 0x248617 VPADDQ %YMM21,%YMM10,%YMM10 |
(153) 0x24861d VMOVQ %XMM10,%RAX |
(153) 0x248622 VPEXTRQ $0x1,%XMM10,%RDX |
(153) 0x248628 VEXTRACTI128 $0x1,%YMM10,%XMM10 |
(153) 0x24862e VMOVQ %XMM10,%RSI |
(153) 0x248633 VMOVSD (%R13,%RAX,8),%XMM18 |
(153) 0x24863b VPEXTRQ $0x1,%XMM10,%R14 |
(153) 0x248641 VMULPD %YMM17,%YMM8,%YMM8 |
(153) 0x248647 VMOVSD (%R13,%RSI,8),%XMM10 |
(153) 0x24864e VMOVHPD (%R13,%RDX,8),%XMM18,%XMM18 |
(153) 0x248656 VMOVHPD (%R13,%R14,8),%XMM10,%XMM10 |
(153) 0x24865d MOV 0x90(%RSP),%R13 |
(153) 0x248665 VADDPD %YMM3,%YMM8,%YMM3 |
(153) 0x248669 VSUBPD %YMM4,%YMM3,%YMM3 |
(153) 0x24866d VINSERTF32X4 $0x1,%XMM10,%YMM18,%YMM24 |
(153) 0x248674 VPMULLQ 0x120(%RSP),%YMM22,%YMM10 |
(153) 0x24867c VPADDQ %YMM21,%YMM10,%YMM10 |
(153) 0x248682 VMOVQ %XMM10,%RAX |
(153) 0x248687 VPEXTRQ $0x1,%XMM10,%RDX |
(153) 0x24868d VEXTRACTI128 $0x1,%YMM10,%XMM10 |
(153) 0x248693 VMOVQ %XMM10,%R14 |
(153) 0x248698 VMOVSD (%R13,%RAX,8),%XMM18 |
(153) 0x2486a0 VPEXTRQ $0x1,%XMM10,%RSI |
(153) 0x2486a6 MOV 0x88(%RSP),%RAX |
(153) 0x2486ae VMOVSD (%R13,%R14,8),%XMM10 |
(153) 0x2486b5 VMOVHPD (%R13,%RDX,8),%XMM18,%XMM18 |
(153) 0x2486bd VMOVHPD (%R13,%RSI,8),%XMM10,%XMM10 |
(153) 0x2486c4 VINSERTF32X4 $0x1,%XMM10,%YMM18,%YMM10 |
(153) 0x2486cb VPMULLQ 0x100(%RSP),%YMM22,%YMM18 |
(153) 0x2486d3 VPADDQ %YMM21,%YMM18,%YMM18 |
(153) 0x2486d9 VMOVQ %XMM18,%RDX |
(153) 0x2486df VPEXTRQ $0x1,%XMM18,%R11 |
(153) 0x2486e6 VEXTRACTI32X4 $0x1,%YMM18,%XMM18 |
(153) 0x2486ed VMOVQ %XMM18,%RSI |
(153) 0x2486f3 VMOVSD (%R12,%RDX,8),%XMM23 |
(153) 0x2486fa VPEXTRQ $0x1,%XMM18,%R13 |
(153) 0x248701 VMOVSD (%R12,%RSI,8),%XMM18 |
(153) 0x248708 VMOVHPD (%R12,%R11,8),%XMM23,%XMM23 |
(153) 0x24870f VMOVHPD (%R12,%R13,8),%XMM18,%XMM18 |
(153) 0x248716 VINSERTF32X4 $0x1,%XMM18,%YMM23,%YMM18 |
(153) 0x24871d VPMULLQ %YMM22,%YMM11,%YMM23 |
(153) 0x248723 VDIVPD %YMM18,%YMM10,%YMM10 |
(153) 0x248729 VPADDQ %YMM21,%YMM23,%YMM23 |
(153) 0x24872f VEXTRACTI32X4 $0x1,%YMM23,%XMM25 |
(153) 0x248736 VMOVQ %XMM25,%R14 |
(153) 0x24873c VMOVSD (%RAX,%R14,8),%XMM26 |
(153) 0x248743 VPEXTRQ $0x1,%XMM25,%R14 |
(153) 0x24874a VMOVHPD (%RAX,%R14,8),%XMM26,%XMM25 |
(153) 0x248751 VMOVQ %XMM23,%R14 |
(153) 0x248757 VMOVSD (%RAX,%R14,8),%XMM26 |
(153) 0x24875e VPEXTRQ $0x1,%XMM23,%R14 |
(153) 0x248765 VDIVPD %YMM24,%YMM19,%YMM23 |
(153) 0x24876b VMOVHPD (%RAX,%R14,8),%XMM26,%XMM26 |
(153) 0x248772 MOV 0x80(%RSP),%RAX |
(153) 0x24877a VINSERTF32X4 $0x1,%XMM25,%YMM26,%YMM9 |
(153) 0x248781 VDIVPD %YMM18,%YMM9,%YMM9 |
(153) 0x248787 VADDPD %YMM9,%YMM10,%YMM9 |
(153) 0x24878c VPMULLQ %YMM22,%YMM12,%YMM10 |
(153) 0x248792 VPADDQ %YMM21,%YMM10,%YMM10 |
(153) 0x248798 VMULPD %YMM3,%YMM9,%YMM9 |
(153) 0x24879c VADDPD %YMM3,%YMM24,%YMM3 |
(153) 0x2487a2 VEXTRACTI128 $0x1,%YMM10,%XMM8 |
(153) 0x2487a8 VMOVQ %XMM8,%R14 |
(153) 0x2487ad VMOVSD (%RDI,%R14,8),%XMM18 |
(153) 0x2487b4 VPEXTRQ $0x1,%XMM8,%R14 |
(153) 0x2487ba VMULPD %YMM9,%YMM23,%YMM9 |
(153) 0x2487c0 VDIVPD %YMM3,%YMM24,%YMM3 |
(153) 0x2487c6 VMOVHPD (%RDI,%R14,8),%XMM18,%XMM4 |
(153) 0x2487cd VMOVQ %XMM10,%R14 |
(153) 0x2487d2 VMOVSD (%RDI,%R14,8),%XMM8 |
(153) 0x2487d8 VPEXTRQ $0x1,%XMM10,%R14 |
(153) 0x2487de VMOVHPD (%RDI,%R14,8),%XMM8,%XMM8 |
(153) 0x2487e4 VINSERTF128 $0x1,%XMM4,%YMM8,%YMM4 |
(153) 0x2487ea VPMULLQ %YMM22,%YMM13,%YMM8 |
(153) 0x2487f0 VADDPD %YMM4,%YMM9,%YMM4 |
(153) 0x2487f4 VPADDQ %YMM21,%YMM8,%YMM8 |
(153) 0x2487fa VMOVQ %XMM8,%R14 |
(153) 0x2487ff VMOVLPD %XMM4,(%RAX,%R14,8) |
(153) 0x248805 VPEXTRQ $0x1,%XMM8,%R14 |
(153) 0x24880b VEXTRACTI128 $0x1,%YMM8,%XMM8 |
(153) 0x248811 VMOVHPD %XMM4,(%RAX,%R14,8) |
(153) 0x248817 VEXTRACTF128 $0x1,%YMM4,%XMM4 |
(153) 0x24881d VMOVQ %XMM8,%R14 |
(153) 0x248822 VMOVLPD %XMM4,(%RAX,%R14,8) |
(153) 0x248828 VPEXTRQ $0x1,%XMM8,%R14 |
(153) 0x24882e VMOVHPD %XMM4,(%RAX,%R14,8) |
(153) 0x248834 VMOVSD (%R12,%RDX,8),%XMM8 |
(153) 0x24883a VMOVSD (%R12,%RSI,8),%XMM4 |
(153) 0x248840 MOV 0x98(%RSP),%RDX |
(153) 0x248848 VMOVHPD (%R12,%R13,8),%XMM4,%XMM4 |
(153) 0x24884e VMOVHPD (%R12,%R11,8),%XMM8,%XMM8 |
(153) 0x248854 VINSERTF128 $0x1,%XMM4,%YMM8,%YMM4 |
(153) 0x24885a VMULPD %YMM3,%YMM4,%YMM3 |
(153) 0x24885e VPMULLQ %YMM22,%YMM14,%YMM4 |
(153) 0x248864 VPADDQ %YMM21,%YMM4,%YMM4 |
(153) 0x24886a VMOVQ %XMM4,%RAX |
(153) 0x24886f VMOVLPD %XMM3,(%RDX,%RAX,8) |
(153) 0x248874 VPEXTRQ $0x1,%XMM4,%RAX |
(153) 0x24887a VEXTRACTI128 $0x1,%YMM4,%XMM4 |
(153) 0x248880 VMOVHPD %XMM3,(%RDX,%RAX,8) |
(153) 0x248885 VEXTRACTF128 $0x1,%YMM3,%XMM3 |
(153) 0x24888b VMOVQ %XMM4,%RAX |
(153) 0x248890 VMOVLPD %XMM3,(%RDX,%RAX,8) |
(153) 0x248895 VPEXTRQ $0x1,%XMM4,%RAX |
(153) 0x24889b VMOVHPD %XMM3,(%RDX,%RAX,8) |
(153) 0x2488a0 MOV 0x8(%RSP),%RDX |
(153) 0x2488a5 ADD $-0x4,%RDX |
(153) 0x2488a9 JNE 248110 |
0x2488af MOV 0xc0(%RSP),%RAX |
0x2488b7 MOV 0x4(%RSP),%R13D |
0x2488bc CMP %RAX,0xc8(%RSP) |
0x2488c4 JE 248b49 |
0x2488ca VMOVSD -0x370ba(%RIP),%XMM0 |
0x2488d2 VMOVSD -0x37082(%RIP),%XMM1 |
0x2488da VMOVDDUP -0x370ca(%RIP),%XMM2 |
0x2488e2 VMOVDDUP -0x37092(%RIP),%XMM3 |
0x2488ea VMOVSD -0x370d2(%RIP),%XMM4 |
0x2488f2 MOV %R15,0xd0(%RSP) |
0x2488fa NOPW (%RAX,%RAX,1) |
(152) 0x248900 MOV %RCX,%RAX |
(152) 0x248903 MOV %RCX,0x8(%RSP) |
(152) 0x248908 CQTO |
(152) 0x24890a IDIVQ 0x30(%RSP) |
(152) 0x24890f MOV 0x70(%RSP),%RCX |
(152) 0x248914 ADD %R13D,%EDX |
(152) 0x248917 MOV 0x78(%RSP),%R13 |
(152) 0x24891c MOV %RCX,%RDI |
(152) 0x24891f MOVSXD %EDX,%RDX |
(152) 0x248922 LEA (%R15,%RAX,1),%ESI |
(152) 0x248926 LEA 0x1(%R15,%RAX,1),%EAX |
(152) 0x24892b MOVSXD %ESI,%RSI |
(152) 0x24892e IMUL %RSI,%RDI |
(152) 0x248932 CLTQ |
(152) 0x248934 IMUL %RSI,%R13 |
(152) 0x248938 LEA (%RDI,%RDX,1),%R14 |
(152) 0x24893c LEA (%R13,%RDX,1),%R11 |
(152) 0x248941 VMOVSD (%R10,%R14,8),%XMM5 |
(152) 0x248947 MOV %RCX,%R14 |
(152) 0x24894a IMUL %RAX,%R14 |
(152) 0x24894e LEA 0x1(%RDI,%RDX,1),%RCX |
(152) 0x248953 MOV 0x60(%RSP),%RDI |
(152) 0x248958 MOV %RCX,0xb0(%RSP) |
(152) 0x248960 MOV 0x68(%RSP),%RCX |
(152) 0x248965 LEA (%R14,%RDX,1),%R15 |
(152) 0x248969 VMOVSD (%R10,%R15,8),%XMM6 |
(152) 0x24896f VADDSD %XMM6,%XMM5,%XMM7 |
(152) 0x248973 VADDSD %XMM7,%XMM5,%XMM5 |
(152) 0x248977 VADDSD %XMM5,%XMM6,%XMM5 |
(152) 0x24897b VMULSD (%R8,%R11,8),%XMM5,%XMM5 |
(152) 0x248981 MOV %RDI,%R11 |
(152) 0x248984 IMUL %RSI,%R11 |
(152) 0x248988 LEA (%R11,%RDX,1),%R15 |
(152) 0x24898c LEA 0x1(%R11,%RDX,1),%R11 |
(152) 0x248991 VMOVSD (%R9,%R15,8),%XMM6 |
(152) 0x248997 MOV 0xd0(%RSP),%R15 |
(152) 0x24899f VMOVSD (%R9,%R11,8),%XMM7 |
(152) 0x2489a5 MOV %RCX,%R11 |
(152) 0x2489a8 IMUL %RSI,%R11 |
(152) 0x2489ac ADD %RDX,%R11 |
(152) 0x2489af VMULSD %XMM0,%XMM5,%XMM5 |
(152) 0x2489b3 VADDSD %XMM7,%XMM6,%XMM8 |
(152) 0x2489b7 VADDSD %XMM6,%XMM8,%XMM6 |
(152) 0x2489bb VADDSD %XMM6,%XMM7,%XMM6 |
(152) 0x2489bf VMULSD (%RBX,%R11,8),%XMM6,%XMM6 |
(152) 0x2489c5 MOV %RCX,%R11 |
(152) 0x2489c8 MOV 0xb0(%RSP),%RCX |
(152) 0x2489d0 IMUL %RAX,%R11 |
(152) 0x2489d4 IMUL %RDI,%RAX |
(152) 0x2489d8 LEA 0x1(%RAX,%RDX,1),%RDI |
(152) 0x2489dd ADD %RDX,%RAX |
(152) 0x2489e0 ADD %RDX,%R11 |
(152) 0x2489e3 VMOVSD (%R10,%RCX,8),%XMM7 |
(152) 0x2489e9 MOV 0xd8(%RSP),%RCX |
(152) 0x2489f1 VMOVHPD (%R9,%RAX,8),%XMM7,%XMM7 |
(152) 0x2489f7 LEA 0x1(%R14,%RDX,1),%RAX |
(152) 0x2489fc MOV 0xe0(%RSP),%R14 |
(152) 0x248a04 VMOVSD (%R10,%RAX,8),%XMM8 |
(152) 0x248a0a MOV 0x20(%RBP),%RAX |
(152) 0x248a0e VMOVHPD (%R9,%RDI,8),%XMM8,%XMM8 |
(152) 0x248a14 MOV 0xa0(%RSP),%RDI |
(152) 0x248a1c VMULSD %XMM0,%XMM6,%XMM6 |
(152) 0x248a20 VMOVDDUP (%RAX),%XMM9 |
(152) 0x248a24 LEA 0x1(%R13,%RDX,1),%RAX |
(152) 0x248a29 MOV 0x4(%RSP),%R13D |
(152) 0x248a2e VADDPD %XMM7,%XMM8,%XMM10 |
(152) 0x248a32 VADDPD %XMM7,%XMM10,%XMM7 |
(152) 0x248a36 VMULSD %XMM5,%XMM9,%XMM5 |
(152) 0x248a3a VMULSD %XMM6,%XMM9,%XMM6 |
(152) 0x248a3e VADDPD %XMM7,%XMM8,%XMM7 |
(152) 0x248a42 VMOVSD (%R8,%RAX,8),%XMM8 |
(152) 0x248a48 MOV 0x58(%RSP),%RAX |
(152) 0x248a4d VMOVHPD (%RBX,%R11,8),%XMM8,%XMM8 |
(152) 0x248a53 MOV 0x90(%RSP),%R11 |
(152) 0x248a5b VMULSD %XMM1,%XMM5,%XMM5 |
(152) 0x248a5f VMULSD %XMM1,%XMM6,%XMM6 |
(152) 0x248a63 IMUL %RSI,%RAX |
(152) 0x248a67 ADD %RDX,%RAX |
(152) 0x248a6a VMOVSD (%RDI,%RAX,8),%XMM10 |
(152) 0x248a6f MOV 0x50(%RSP),%RAX |
(152) 0x248a74 VMULPD %XMM7,%XMM8,%XMM7 |
(152) 0x248a78 MOV 0x48(%RSP),%RDI |
(152) 0x248a7d VMULPD %XMM2,%XMM7,%XMM7 |
(152) 0x248a81 IMUL %RSI,%RAX |
(152) 0x248a85 IMUL %RSI,%RDI |
(152) 0x248a89 VMULPD %XMM7,%XMM9,%XMM7 |
(152) 0x248a8d ADD %RDX,%RAX |
(152) 0x248a90 ADD %RDX,%RDI |
(152) 0x248a93 VMOVSD (%R11,%RAX,8),%XMM8 |
(152) 0x248a99 MOV 0x40(%RSP),%RAX |
(152) 0x248a9e MOV 0x88(%RSP),%R11 |
(152) 0x248aa6 VMULPD %XMM3,%XMM7,%XMM7 |
(152) 0x248aaa VSUBSD %XMM5,%XMM7,%XMM5 |
(152) 0x248aae VPERMILPD $0x1,%XMM7,%XMM7 |
(152) 0x248ab4 IMUL %RSI,%RAX |
(152) 0x248ab8 VADDSD %XMM7,%XMM5,%XMM5 |
(152) 0x248abc VDIVSD %XMM10,%XMM4,%XMM7 |
(152) 0x248ac1 ADD %RDX,%RAX |
(152) 0x248ac4 VMOVHPD (%R11,%RAX,8),%XMM8,%XMM8 |
(152) 0x248aca MOV 0x38(%RSP),%RAX |
(152) 0x248acf VSUBSD %XMM6,%XMM5,%XMM5 |
(152) 0x248ad3 MOV 0x80(%RSP),%R11 |
(152) 0x248adb VDIVPD (%R12,%RDI,8){1to2},%XMM8,%XMM8 |
(152) 0x248ae2 IMUL %RSI,%RAX |
(152) 0x248ae6 ADD %RDX,%RAX |
(152) 0x248ae9 VPERMILPD $0x1,%XMM8,%XMM9 |
(152) 0x248aef VADDSD %XMM9,%XMM8,%XMM8 |
(152) 0x248af4 VMULSD %XMM5,%XMM8,%XMM8 |
(152) 0x248af8 VADDSD %XMM5,%XMM10,%XMM5 |
(152) 0x248afc VMULSD %XMM7,%XMM8,%XMM7 |
(152) 0x248b00 VADDSD (%RCX,%RAX,8),%XMM7,%XMM7 |
(152) 0x248b05 MOV 0x28(%RSP),%RAX |
(152) 0x248b0a VDIVSD %XMM5,%XMM10,%XMM5 |
(152) 0x248b0e IMUL %RSI,%RAX |
(152) 0x248b12 IMUL 0x20(%RSP),%RSI |
(152) 0x248b18 ADD %RDX,%RAX |
(152) 0x248b1b VMOVSD %XMM7,(%R11,%RAX,8) |
(152) 0x248b21 MOV 0x8(%RSP),%RAX |
(152) 0x248b26 VMULSD (%R12,%RDI,8),%XMM5,%XMM5 |
(152) 0x248b2c ADD %RDX,%RSI |
(152) 0x248b2f MOV 0x98(%RSP),%RDX |
(152) 0x248b37 LEA 0x1(%RAX),%RCX |
(152) 0x248b3b VMOVSD %XMM5,(%RDX,%RSI,8) |
(152) 0x248b40 CMP %R14,%RAX |
(152) 0x248b43 JL 248900 |
0x248b49 MOV 0x18(%RSP),%ESI |
0x248b4d LEA 0x18c04(%RIP),%RDI |
0x248b54 VZEROUPPER |
0x248b57 CALL 25f750 <@plt_start@+0x540> |
0x248b5c LEA -0x28(%RBP),%RSP |
0x248b60 POP %RBX |
0x248b61 POP %R12 |
0x248b63 POP %R13 |
0x248b65 POP %R14 |
0x248b67 POP %R15 |
0x248b69 POP %RBP |
0x248b6a RET |
Path / |
Source file and lines | PdV.cpp:48-63 |
Module | exec |
nb instructions | 176 |
nb uops | 191 |
loop length | 883 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 6 |
used ymm registers | 14 |
used zmm registers | 0 |
nb stack references | 47 |
micro-operation queue | 31.83 cycles |
front end | 31.83 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 8.50 | 8.50 | 8.50 | 8.50 | 4.00 | 34.33 | 34.33 | 34.33 | 1.00 | 15.00 | 1.00 | 1.00 | 3.00 | 3.00 |
cycles | 8.50 | 8.50 | 8.50 | 8.50 | 4.00 | 34.33 | 34.33 | 34.33 | 1.00 | 15.00 | 1.00 | 1.00 | 3.00 | 3.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 31.83 |
Dispatch | 34.33 |
Overall L1 | 34.33 |
all | 11% |
load | 5% |
store | 17% |
mul | 0% |
add-sub | 14% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 0% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 10% |
load | 3% |
store | 17% |
mul | 0% |
add-sub | 14% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 10% |
all | 14% |
load | 13% |
store | 16% |
mul | 12% |
add-sub | 13% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 13% |
all | 12% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 14% |
load | 12% |
store | 16% |
mul | 12% |
add-sub | 13% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 13% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
AND $-0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB $0x1a0,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%RDX),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RCX),%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
INC %EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD $0x2,%R14D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB %EAX,%R14D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 248b5c <.omp_outlined.+0xd4c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV (%R9),%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R8),%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
INC %R13D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD $0x2,%EBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP %R13D,%EBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 248b5c <.omp_outlined.+0xd4c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
SUB %R13D,%EBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOVQ $0,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVQ $0x1,0xe8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVL $0,0x1c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
IMUL %RBX,%R14 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
DEC %R14 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R14,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x24(%RSP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0xf0(%RSP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x198a3(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0xb0(%RSP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x18(%RSP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %ESI,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CALL 25f740 <@plt_start@+0x530> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV 0x10(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0xa8(%RSP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %R14,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVL %RAX,%R14 | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R14,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CMP %R14,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JG 248b49 <.omp_outlined.+0xd39> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV 0x10(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x28(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RBX,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x18(%RBP),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x40(%RBP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x30(%RBP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x48(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x38(%RBP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R13D,0x4(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R14,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%R8),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R9),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R10),%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%R8),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%R10),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R11,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RBX,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%R9),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RDI),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RDI),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RDX),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RDX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R12,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%RAX),%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R11,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RSI),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RSI),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDX,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x50(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDI,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RSI,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDX,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RAX),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x60(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R11,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDX,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RAX),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x58(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RSI,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDX,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RAX),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x68(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDI,0xd8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDX,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R11,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDX,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R14,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SUB %RCX,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
INC %RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP $0x4,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JB 2488ca <.omp_outlined.+0xaba> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV 0x78(%RSP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VPBROADCASTD %R15D,%XMM2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV 0x70(%RSP),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VBROADCASTSD -0x367ea(%RIP),%YMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD -0x367b4(%RIP),%YMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD -0x367f6(%RIP),%YMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VPBROADCASTQ %RCX,%YMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
VPADDQ -0x36624(%RIP),%YMM0,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ -0x3686e(%RIP),%YMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDX,0xc8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
AND $-0x4,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
VMOVDQA %XMM2,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VPBROADCASTD %R13D,%XMM2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
ADD %RDX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDX,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVDQA %XMM2,0xf0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VPBROADCASTQ %RSI,%YMM2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV 0x68(%RSP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VPBROADCASTQ %R11,%YMM5 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV 0x60(%RSP),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VPBROADCASTQ %RAX,%YMM1 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
VMOVDQA %YMM2,0x160(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VEXTRACTI128 $0x1,%YMM1,%XMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
VPBROADCASTQ %RSI,%YMM6 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV 0x58(%RSP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VPBROADCASTQ %R11,%YMM7 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV 0x50(%RSP),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VPBROADCASTQ %RSI,%YMM2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV 0x48(%RSP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VMOVDQA %YMM2,0x140(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VPBROADCASTQ %R11,%YMM2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV 0x40(%RSP),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VMOVDQA %YMM2,0x120(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VPBROADCASTQ %RSI,%YMM2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV 0x38(%RSP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VPBROADCASTQ %R11,%YMM11 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV 0x28(%RSP),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VMOVDQA %YMM2,0x100(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VPCMPEQD %XMM2,%XMM2,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
VPBROADCASTQ %RSI,%YMM12 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV 0x20(%RSP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VPBROADCASTQ %R11,%YMM13 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTQ %RSI,%YMM14 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOV 0xc0(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x4(%RSP),%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %RAX,0xc8(%RSP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
JE 248b49 <.omp_outlined.+0xd39> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
VMOVSD -0x370ba(%RIP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVSD -0x37082(%RIP),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVDDUP -0x370ca(%RIP),%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVDDUP -0x37092(%RIP),%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVSD -0x370d2(%RIP),%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R15,0xd0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOV 0x18(%RSP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
LEA 0x18c04(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 25f750 <@plt_start@+0x540> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x28(%RBP),%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
Source file and lines | PdV.cpp:48-63 |
Module | exec |
nb instructions | 176 |
nb uops | 191 |
loop length | 883 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 6 |
used ymm registers | 14 |
used zmm registers | 0 |
nb stack references | 47 |
micro-operation queue | 31.83 cycles |
front end | 31.83 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 8.50 | 8.50 | 8.50 | 8.50 | 4.00 | 34.33 | 34.33 | 34.33 | 1.00 | 15.00 | 1.00 | 1.00 | 3.00 | 3.00 |
cycles | 8.50 | 8.50 | 8.50 | 8.50 | 4.00 | 34.33 | 34.33 | 34.33 | 1.00 | 15.00 | 1.00 | 1.00 | 3.00 | 3.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 31.83 |
Dispatch | 34.33 |
Overall L1 | 34.33 |
all | 11% |
load | 5% |
store | 17% |
mul | 0% |
add-sub | 14% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 0% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 10% |
load | 3% |
store | 17% |
mul | 0% |
add-sub | 14% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 10% |
all | 14% |
load | 13% |
store | 16% |
mul | 12% |
add-sub | 13% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 13% |
all | 12% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 14% |
load | 12% |
store | 16% |
mul | 12% |
add-sub | 13% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 13% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
AND $-0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB $0x1a0,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%RDX),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RCX),%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
INC %EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD $0x2,%R14D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB %EAX,%R14D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 248b5c <.omp_outlined.+0xd4c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV (%R9),%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R8),%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
INC %R13D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD $0x2,%EBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP %R13D,%EBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 248b5c <.omp_outlined.+0xd4c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
SUB %R13D,%EBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOVQ $0,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVQ $0x1,0xe8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVL $0,0x1c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
IMUL %RBX,%R14 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
DEC %R14 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R14,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x24(%RSP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0xf0(%RSP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x198a3(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0xb0(%RSP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x18(%RSP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %ESI,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CALL 25f740 <@plt_start@+0x530> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV 0x10(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0xa8(%RSP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %R14,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVL %RAX,%R14 | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R14,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CMP %R14,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JG 248b49 <.omp_outlined.+0xd39> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV 0x10(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x28(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RBX,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x18(%RBP),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x40(%RBP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x30(%RBP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x48(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x38(%RBP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R13D,0x4(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R14,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%R8),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R9),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R10),%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%R8),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%R10),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R11,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RBX,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%R9),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RDI),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RDI),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RDX),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RDX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R12,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%RAX),%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R11,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RSI),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RSI),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDX,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x50(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDI,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RSI,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDX,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RAX),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x60(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R11,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDX,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RAX),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x58(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RSI,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDX,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RAX),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x68(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDI,0xd8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDX,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R11,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDX,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R14,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SUB %RCX,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
INC %RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP $0x4,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JB 2488ca <.omp_outlined.+0xaba> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV 0x78(%RSP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VPBROADCASTD %R15D,%XMM2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV 0x70(%RSP),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VBROADCASTSD -0x367ea(%RIP),%YMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD -0x367b4(%RIP),%YMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD -0x367f6(%RIP),%YMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VPBROADCASTQ %RCX,%YMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
VPADDQ -0x36624(%RIP),%YMM0,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ -0x3686e(%RIP),%YMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDX,0xc8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
AND $-0x4,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
VMOVDQA %XMM2,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VPBROADCASTD %R13D,%XMM2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
ADD %RDX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDX,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVDQA %XMM2,0xf0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VPBROADCASTQ %RSI,%YMM2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV 0x68(%RSP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VPBROADCASTQ %R11,%YMM5 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV 0x60(%RSP),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VPBROADCASTQ %RAX,%YMM1 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
VMOVDQA %YMM2,0x160(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VEXTRACTI128 $0x1,%YMM1,%XMM15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
VPBROADCASTQ %RSI,%YMM6 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV 0x58(%RSP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VPBROADCASTQ %R11,%YMM7 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV 0x50(%RSP),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VPBROADCASTQ %RSI,%YMM2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV 0x48(%RSP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VMOVDQA %YMM2,0x140(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VPBROADCASTQ %R11,%YMM2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV 0x40(%RSP),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VMOVDQA %YMM2,0x120(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VPBROADCASTQ %RSI,%YMM2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV 0x38(%RSP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VPBROADCASTQ %R11,%YMM11 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV 0x28(%RSP),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VMOVDQA %YMM2,0x100(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
VPCMPEQD %XMM2,%XMM2,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
VPBROADCASTQ %RSI,%YMM12 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV 0x20(%RSP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VPBROADCASTQ %R11,%YMM13 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTQ %RSI,%YMM14 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOV 0xc0(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x4(%RSP),%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %RAX,0xc8(%RSP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
JE 248b49 <.omp_outlined.+0xd39> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
VMOVSD -0x370ba(%RIP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVSD -0x37082(%RIP),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVDDUP -0x370ca(%RIP),%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVDDUP -0x37092(%RIP),%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VMOVSD -0x370d2(%RIP),%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R15,0xd0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOV 0x18(%RSP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
LEA 0x18c04(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 25f750 <@plt_start@+0x540> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x28(%RBP),%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼.omp_outlined.#0x247e10– | 5.4 | 2.76 |
○Loop 153 - PdV.cpp:49-63 - exec | 5.4 | 2.75 |
○Loop 152 - PdV.cpp:49-63 - exec | 0 | 0 |