Function: .omp_outlined..8#0x239050 | Module: exec | Source: advec_mom.cpp:85-88 [...] | Coverage: 1.26% |
---|
Function: .omp_outlined..8#0x239050 | Module: exec | Source: advec_mom.cpp:85-88 [...] | Coverage: 1.26% |
---|
/beegfs/hackathon/users/eoseret/qaas_runs/170-854-8685/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/advec_mom.cpp: 85 - 88 |
-------------------------------------------------------------------------------- |
85: #pragma omp parallel for simd collapse(2) |
86: for (int j = (y_min + 1); j < (y_max + 1 + 2); j++) { |
87: for (int i = (x_min - 2 + 1); i < (x_max + 2 + 2); i++) { |
88: node_flux(i, j) = 0.25 * (mass_flux_x(i + 0, j - 1) + mass_flux_x(i, j) + mass_flux_x(i + 1, j - 1) + mass_flux_x(i + 1, j + 0)); |
/beegfs/hackathon/users/eoseret/qaas_runs/170-854-8685/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/context.h: 69 - 69 |
-------------------------------------------------------------------------------- |
69: T &operator()(size_t i, size_t j) const { return data[i + j * sizeX]; } |
0x239050 PUSH %RBP |
0x239051 MOV %RSP,%RBP |
0x239054 PUSH %R15 |
0x239056 PUSH %R14 |
0x239058 PUSH %R13 |
0x23905a PUSH %R12 |
0x23905c PUSH %RBX |
0x23905d SUB $0x68,%RSP |
0x239061 MOV (%RCX),%R15D |
0x239064 MOV (%RDX),%EAX |
0x239066 LEA 0x1(%RAX),%R12D |
0x23906a ADD $0x3,%R15D |
0x23906e SUB %R12D,%R15D |
0x239071 JLE 23966b |
0x239077 MOV (%R9),%EBX |
0x23907a MOV (%R8),%ECX |
0x23907d ADD $0x4,%EBX |
0x239080 CMP %ECX,%EBX |
0x239082 JL 23966b |
0x239088 LEA -0x1(%RCX),%EDX |
0x23908b MOV (%RDI),%ESI |
0x23908d MOVQ $0,-0x58(%RBP) |
0x239095 MOVQ $0x1,-0x88(%RBP) |
0x2390a0 MOVL $0,-0x40(%RBP) |
0x2390a7 SUB %EDX,%EBX |
0x2390a9 MOV %RDX,-0x30(%RBP) |
0x2390ad IMUL %RBX,%R15 |
0x2390b1 DEC %R15 |
0x2390b4 MOV %R15,-0x38(%RBP) |
0x2390b8 SUB $0x8,%RSP |
0x2390bc MOV %RCX,%R13 |
0x2390bf LEA -0x40(%RBP),%RCX |
0x2390c3 MOV %RAX,%R14 |
0x2390c6 LEA -0x88(%RBP),%RAX |
0x2390cd LEA 0x27c54(%RIP),%RDI |
0x2390d4 LEA -0x58(%RBP),%R8 |
0x2390d8 LEA -0x38(%RBP),%R9 |
0x2390dc MOV %ESI,-0x3c(%RBP) |
0x2390df MOV $0x22,%EDX |
0x2390e4 PUSH $0x1 |
0x2390e6 PUSH $0x1 |
0x2390e8 PUSH %RAX |
0x2390e9 CALL 25f740 <@plt_start@+0x530> |
0x2390ee ADD $0x20,%RSP |
0x2390f2 MOV -0x38(%RBP),%RAX |
0x2390f6 MOV -0x58(%RBP),%RCX |
0x2390fa CMP %R15,%RAX |
0x2390fd CMOVL %RAX,%R15 |
0x239101 MOV %R15,-0x38(%RBP) |
0x239105 CMP %R15,%RCX |
0x239108 JG 239659 |
0x23910e MOV %RBX,%RAX |
0x239111 MOV %RAX,-0x48(%RBP) |
0x239115 MOV 0x18(%RBP),%RAX |
0x239119 MOV 0x10(%RBP),%RDX |
0x23911d MOV %R13,%RBX |
0x239120 MOV %R14,%R9 |
0x239123 MOV %R15,%R11 |
0x239126 SUB %RCX,%R11 |
0x239129 MOV %R12,-0x50(%RBP) |
0x23912d INC %R11 |
0x239130 MOV (%RDX),%R8 |
0x239133 MOV (%RAX),%R13 |
0x239136 MOV 0x10(%RAX),%RDI |
0x23913a MOV 0x10(%RDX),%R14 |
0x23913e MOV %R8,-0x80(%RBP) |
0x239142 CMP $0x8,%R11 |
0x239146 JAE 239154 |
0x239148 MOV -0x30(%RBP),%RSI |
0x23914c MOV %R9,%R10 |
0x23914f JMP 2395cf |
0x239154 MOV -0x48(%RBP),%RAX |
0x239158 VBROADCASTSD -0x2794a(%RIP),%ZMM10 |
0x239162 VPBROADCASTQ %RCX,%ZMM0 |
0x239168 VPADDQ -0x27432(%RIP),%ZMM0,%ZMM0 |
0x239172 VPBROADCASTQ -0x27974(%RIP),%ZMM11 |
0x23917c MOV %R11,-0x68(%RBP) |
0x239180 AND $-0x8,%R11 |
0x239184 VPBROADCASTD %R12D,%YMM2 |
0x23918a VPBROADCASTD %R9D,%YMM4 |
0x239190 VPBROADCASTQ %R13,%ZMM5 |
0x239196 VPBROADCASTD %EBX,%YMM6 |
0x23919c VPBROADCASTQ %R8,%ZMM7 |
0x2391a2 MOV %RBX,-0x70(%RBP) |
0x2391a6 MOV %R9,-0x78(%RBP) |
0x2391aa MOV %R13,-0x60(%RBP) |
0x2391ae MOV %R14,%RSI |
0x2391b1 ADD %R11,%RCX |
0x2391b4 MOV %R11,%RBX |
0x2391b7 VPBROADCASTQ %RAX,%ZMM1 |
0x2391bd MOV -0x30(%RBP),%RAX |
0x2391c1 VEXTRACTI32X4 $0x3,%ZMM1,%XMM8 |
0x2391c8 VEXTRACTI32X4 $0x2,%ZMM1,%XMM9 |
0x2391cf VPBROADCASTD %EAX,%YMM3 |
0x2391d5 NOPW %CS:(%RAX,%RAX,1) |
(258) 0x2391e0 VEXTRACTI32X4 $0x3,%ZMM0,%XMM12 |
(258) 0x2391e7 VPEXTRQ $0x1,%XMM8,%R10 |
(258) 0x2391ed KXNORW %K0,%K0,%K1 |
(258) 0x2391f1 VPEXTRQ $0x1,%XMM12,%RAX |
(258) 0x2391f7 CQTO |
(258) 0x2391f9 IDIV %R10 |
(258) 0x2391fc VMOVQ %XMM8,%R10 |
(258) 0x239201 VMOVQ %RAX,%XMM13 |
(258) 0x239206 VMOVQ %XMM12,%RAX |
(258) 0x23920b CQTO |
(258) 0x23920d IDIV %R10 |
(258) 0x239210 VPEXTRQ $0x1,%XMM9,%R10 |
(258) 0x239216 VMOVQ %RAX,%XMM12 |
(258) 0x23921b VPUNPCKLQDQ %XMM13,%XMM12,%XMM12 |
(258) 0x239220 VEXTRACTI32X4 $0x2,%ZMM0,%XMM13 |
(258) 0x239227 VPEXTRQ $0x1,%XMM13,%RAX |
(258) 0x23922d CQTO |
(258) 0x23922f IDIV %R10 |
(258) 0x239232 VMOVQ %XMM9,%R10 |
(258) 0x239237 VMOVQ %RAX,%XMM14 |
(258) 0x23923c VMOVQ %XMM13,%RAX |
(258) 0x239241 CQTO |
(258) 0x239243 IDIV %R10 |
(258) 0x239246 VMOVQ %RAX,%XMM13 |
(258) 0x23924b VPUNPCKLQDQ %XMM14,%XMM13,%XMM13 |
(258) 0x239250 VEXTRACTI128 $0x1,%YMM0,%XMM14 |
(258) 0x239256 VPEXTRQ $0x1,%XMM14,%RAX |
(258) 0x23925c VINSERTI128 $0x1,%XMM12,%YMM13,%YMM12 |
(258) 0x239262 VEXTRACTI128 $0x1,%YMM1,%XMM13 |
(258) 0x239268 VPEXTRQ $0x1,%XMM13,%R10 |
(258) 0x23926e CQTO |
(258) 0x239270 IDIV %R10 |
(258) 0x239273 VMOVQ %XMM13,%R10 |
(258) 0x239278 VMOVQ %RAX,%XMM15 |
(258) 0x23927d VMOVQ %XMM14,%RAX |
(258) 0x239282 CQTO |
(258) 0x239284 IDIV %R10 |
(258) 0x239287 VPEXTRQ $0x1,%XMM1,%R10 |
(258) 0x23928d VMOVQ %RAX,%XMM13 |
(258) 0x239292 VPEXTRQ $0x1,%XMM0,%RAX |
(258) 0x239298 CQTO |
(258) 0x23929a VPUNPCKLQDQ %XMM15,%XMM13,%XMM13 |
(258) 0x23929f IDIV %R10 |
(258) 0x2392a2 VMOVQ %XMM1,%R10 |
(258) 0x2392a7 VMOVQ %RAX,%XMM14 |
(258) 0x2392ac VMOVQ %XMM0,%RAX |
(258) 0x2392b1 CQTO |
(258) 0x2392b3 IDIV %R10 |
(258) 0x2392b6 ADD $-0x8,%R11 |
(258) 0x2392ba VMOVQ %RAX,%XMM15 |
(258) 0x2392bf VPUNPCKLQDQ %XMM14,%XMM15,%XMM14 |
(258) 0x2392c4 VINSERTI128 $0x1,%XMM13,%YMM14,%YMM13 |
(258) 0x2392ca VINSERTI64X4 $0x1,%YMM12,%ZMM13,%ZMM12 |
(258) 0x2392d1 VPMOVQD %ZMM12,%YMM13 |
(258) 0x2392d7 VPMULLQ %ZMM1,%ZMM12,%ZMM12 |
(258) 0x2392dd VPSUBQ %ZMM12,%ZMM0,%ZMM12 |
(258) 0x2392e3 VPADDQ %ZMM11,%ZMM0,%ZMM0 |
(258) 0x2392e9 VPMOVQD %ZMM12,%YMM14 |
(258) 0x2392ef VPADDD %YMM2,%YMM13,%YMM15 |
(258) 0x2392f3 VPADDD %YMM4,%YMM13,%YMM13 |
(258) 0x2392f7 VPMOVSXDQ %YMM13,%ZMM13 |
(258) 0x2392fd VPMOVSXDQ %YMM15,%ZMM21 |
(258) 0x239303 VPADDD %YMM3,%YMM14,%YMM12 |
(258) 0x239307 VPADDD %YMM6,%YMM14,%YMM14 |
(258) 0x23930b VPMOVSXDQ %YMM12,%ZMM12 |
(258) 0x239311 VPMULLQ %ZMM13,%ZMM5,%ZMM16 |
(258) 0x239317 VPMULLQ %ZMM21,%ZMM5,%ZMM15 |
(258) 0x23931d VPMOVSXDQ %YMM14,%ZMM14 |
(258) 0x239323 VPADDQ %ZMM12,%ZMM16,%ZMM13 |
(258) 0x239329 VPADDQ %ZMM14,%ZMM16,%ZMM16 |
(258) 0x23932f VPADDQ %ZMM14,%ZMM15,%ZMM14 |
(258) 0x239335 VEXTRACTI32X4 $0x1,%YMM13,%XMM17 |
(258) 0x23933c VMOVQ %XMM13,%RAX |
(258) 0x239341 VPEXTRQ $0x1,%XMM13,%RDX |
(258) 0x239347 VMOVQ %XMM17,%R10 |
(258) 0x23934d VPEXTRQ $0x1,%XMM17,%R8 |
(258) 0x239354 VEXTRACTI32X4 $0x2,%ZMM13,%XMM17 |
(258) 0x23935b VEXTRACTI32X4 $0x3,%ZMM13,%XMM13 |
(258) 0x239362 VMOVSD (%RDI,%RAX,8),%XMM18 |
(258) 0x239369 VMOVQ %XMM17,%R14 |
(258) 0x23936f VMOVQ %XMM13,%R9 |
(258) 0x239374 VPEXTRQ $0x1,%XMM17,%R12 |
(258) 0x23937b VPEXTRQ $0x1,%XMM13,%R13 |
(258) 0x239381 VMOVHPD (%RDI,%RDX,8),%XMM18,%XMM18 |
(258) 0x239388 VMOVSD (%RDI,%R9,8),%XMM13 |
(258) 0x23938e VMOVSD (%RDI,%R14,8),%XMM17 |
(258) 0x239395 VMOVHPD (%RDI,%R13,8),%XMM13,%XMM13 |
(258) 0x23939b VMOVHPD (%RDI,%R12,8),%XMM17,%XMM17 |
(258) 0x2393a2 VINSERTF32X4 $0x1,%XMM13,%YMM17,%YMM13 |
(258) 0x2393a9 VMOVSD (%RDI,%R10,8),%XMM17 |
(258) 0x2393b0 VMOVHPD (%RDI,%R8,8),%XMM17,%XMM17 |
(258) 0x2393b7 VINSERTF32X4 $0x1,%XMM17,%YMM18,%YMM17 |
(258) 0x2393be VPADDQ %ZMM12,%ZMM15,%ZMM18 |
(258) 0x2393c4 VEXTRACTI128 $0x1,%YMM14,%XMM15 |
(258) 0x2393ca VEXTRACTI32X4 $0x1,%YMM18,%XMM19 |
(258) 0x2393d1 VMOVQ %XMM18,%RDX |
(258) 0x2393d7 VPEXTRQ $0x1,%XMM18,%RAX |
(258) 0x2393de VMOVQ %XMM19,%R8 |
(258) 0x2393e4 VPEXTRQ $0x1,%XMM19,%R9 |
(258) 0x2393eb VEXTRACTI32X4 $0x2,%ZMM18,%XMM19 |
(258) 0x2393f2 VEXTRACTI32X4 $0x3,%ZMM18,%XMM18 |
(258) 0x2393f9 VMOVSD (%RDI,%RDX,8),%XMM20 |
(258) 0x239400 VINSERTF64X4 $0x1,%YMM13,%ZMM17,%ZMM17 |
(258) 0x239407 VMOVQ %XMM16,%RDX |
(258) 0x23940d VPMULLQ %ZMM21,%ZMM7,%ZMM13 |
(258) 0x239413 VMOVQ %XMM19,%R10 |
(258) 0x239419 VMOVQ %XMM18,%R13 |
(258) 0x23941f VPEXTRQ $0x1,%XMM19,%R14 |
(258) 0x239426 VPEXTRQ $0x1,%XMM18,%R12 |
(258) 0x23942d VMOVHPD (%RDI,%RAX,8),%XMM20,%XMM20 |
(258) 0x239434 VPEXTRQ $0x1,%XMM16,%RAX |
(258) 0x23943b VMOVSD (%RDI,%R13,8),%XMM18 |
(258) 0x239442 VMOVSD (%RDI,%R10,8),%XMM19 |
(258) 0x239449 VMOVHPD (%RDI,%R12,8),%XMM18,%XMM18 |
(258) 0x239450 VMOVHPD (%RDI,%R14,8),%XMM19,%XMM19 |
(258) 0x239457 VPADDQ %ZMM12,%ZMM13,%ZMM12 |
(258) 0x23945d VINSERTF32X4 $0x1,%XMM18,%YMM19,%YMM18 |
(258) 0x239464 VMOVSD (%RDI,%R8,8),%XMM19 |
(258) 0x23946b VMOVHPD (%RDI,%R9,8),%XMM19,%XMM19 |
(258) 0x239472 VINSERTF32X4 $0x1,%XMM19,%YMM20,%YMM19 |
(258) 0x239479 VINSERTF64X4 $0x1,%YMM18,%ZMM19,%ZMM18 |
(258) 0x239480 VMOVSD (%RDI,%RDX,8),%XMM19 |
(258) 0x239487 VPEXTRQ $0x1,%XMM14,%RDX |
(258) 0x23948d VMOVHPD (%RDI,%RAX,8),%XMM19,%XMM19 |
(258) 0x239494 VMOVQ %XMM14,%RAX |
(258) 0x239499 VADDPD %ZMM18,%ZMM17,%ZMM17 |
(258) 0x23949f VEXTRACTI32X4 $0x1,%YMM16,%XMM18 |
(258) 0x2394a6 VMOVQ %XMM18,%R8 |
(258) 0x2394ac VPEXTRQ $0x1,%XMM18,%R9 |
(258) 0x2394b3 VEXTRACTI32X4 $0x2,%ZMM16,%XMM18 |
(258) 0x2394ba VEXTRACTI32X4 $0x3,%ZMM16,%XMM16 |
(258) 0x2394c1 VMOVQ %XMM18,%R10 |
(258) 0x2394c7 VMOVQ %XMM16,%R13 |
(258) 0x2394cd VPEXTRQ $0x1,%XMM18,%R14 |
(258) 0x2394d4 VPEXTRQ $0x1,%XMM16,%R12 |
(258) 0x2394db VMOVSD (%RDI,%R13,8),%XMM16 |
(258) 0x2394e2 VMOVSD (%RDI,%R10,8),%XMM18 |
(258) 0x2394e9 VMOVHPD (%RDI,%R12,8),%XMM16,%XMM16 |
(258) 0x2394f0 VMOVHPD (%RDI,%R14,8),%XMM18,%XMM18 |
(258) 0x2394f7 VINSERTF32X4 $0x1,%XMM16,%YMM18,%YMM16 |
(258) 0x2394fe VMOVSD (%RDI,%R8,8),%XMM18 |
(258) 0x239505 VMOVQ %XMM15,%R8 |
(258) 0x23950a VMOVHPD (%RDI,%R9,8),%XMM18,%XMM18 |
(258) 0x239511 VPEXTRQ $0x1,%XMM15,%R9 |
(258) 0x239517 VEXTRACTI32X4 $0x2,%ZMM14,%XMM15 |
(258) 0x23951e VEXTRACTI32X4 $0x3,%ZMM14,%XMM14 |
(258) 0x239525 VMOVQ %XMM15,%R14 |
(258) 0x23952a VMOVQ %XMM14,%R12 |
(258) 0x23952f VPEXTRQ $0x1,%XMM15,%R10 |
(258) 0x239535 VPEXTRQ $0x1,%XMM14,%R13 |
(258) 0x23953b VMOVSD (%RDI,%R12,8),%XMM14 |
(258) 0x239541 VMOVSD (%RDI,%R14,8),%XMM15 |
(258) 0x239547 VMOVHPD (%RDI,%R13,8),%XMM14,%XMM14 |
(258) 0x23954d VMOVHPD (%RDI,%R10,8),%XMM15,%XMM15 |
(258) 0x239553 VINSERTF32X4 $0x1,%XMM18,%YMM19,%YMM18 |
(258) 0x23955a VINSERTF64X4 $0x1,%YMM16,%ZMM18,%ZMM16 |
(258) 0x239561 VINSERTF128 $0x1,%XMM14,%YMM15,%YMM14 |
(258) 0x239567 VMOVSD (%RDI,%R8,8),%XMM15 |
(258) 0x23956d VADDPD %ZMM16,%ZMM17,%ZMM16 |
(258) 0x239573 VMOVSD (%RDI,%RAX,8),%XMM17 |
(258) 0x23957a VMOVHPD (%RDI,%R9,8),%XMM15,%XMM15 |
(258) 0x239580 VMOVHPD (%RDI,%RDX,8),%XMM17,%XMM17 |
(258) 0x239587 VINSERTF32X4 $0x1,%XMM15,%YMM17,%YMM15 |
(258) 0x23958e VINSERTF64X4 $0x1,%YMM14,%ZMM15,%ZMM14 |
(258) 0x239595 VADDPD %ZMM14,%ZMM16,%ZMM14 |
(258) 0x23959b VMULPD %ZMM10,%ZMM14,%ZMM14 |
(258) 0x2395a1 VSCATTERQPD %ZMM14,(%RSI,%ZMM12,8){%K1} |
(258) 0x2395a8 JNE 2391e0 |
0x2395ae MOV %RSI,%R14 |
0x2395b1 MOV -0x78(%RBP),%R10 |
0x2395b5 MOV -0x50(%RBP),%R12 |
0x2395b9 MOV -0x30(%RBP),%RSI |
0x2395bd MOV -0x60(%RBP),%R13 |
0x2395c1 CMP %RBX,-0x68(%RBP) |
0x2395c5 MOV -0x70(%RBP),%RBX |
0x2395c9 JE 239659 |
0x2395cf VMOVSD -0x27dbf(%RIP),%XMM0 |
0x2395d7 NOPW (%RAX,%RAX,1) |
(259) 0x2395e0 MOV %RCX,%RAX |
(259) 0x2395e3 CQTO |
(259) 0x2395e5 IDIVQ -0x48(%RBP) |
(259) 0x2395e9 LEA (%RSI,%RDX,1),%R9D |
(259) 0x2395ed ADD %EBX,%EDX |
(259) 0x2395ef MOVSXD %R9D,%R9 |
(259) 0x2395f2 MOVSXD %EDX,%RDX |
(259) 0x2395f5 LEA (%R12,%RAX,1),%R8D |
(259) 0x2395f9 ADD %R10D,%EAX |
(259) 0x2395fc MOV %R10,%R12 |
(259) 0x2395ff CLTQ |
(259) 0x239601 MOVSXD %R8D,%R8 |
(259) 0x239604 IMUL %R13,%RAX |
(259) 0x239608 LEA (%RAX,%R9,1),%R10 |
(259) 0x23960c ADD %RDX,%RAX |
(259) 0x23960f VMOVSD (%RDI,%R10,8),%XMM1 |
(259) 0x239615 MOV %R13,%R10 |
(259) 0x239618 IMUL %R8,%R10 |
(259) 0x23961c LEA (%R10,%R9,1),%R11 |
(259) 0x239620 ADD %RDX,%R10 |
(259) 0x239623 VADDSD (%RDI,%R11,8),%XMM1,%XMM1 |
(259) 0x239629 VADDSD (%RDI,%RAX,8),%XMM1,%XMM1 |
(259) 0x23962e MOV -0x80(%RBP),%RAX |
(259) 0x239632 VADDSD (%RDI,%R10,8),%XMM1,%XMM1 |
(259) 0x239638 MOV %R12,%R10 |
(259) 0x23963b MOV -0x50(%RBP),%R12 |
(259) 0x23963f IMUL %RAX,%R8 |
(259) 0x239643 ADD %R9,%R8 |
(259) 0x239646 VMULSD %XMM0,%XMM1,%XMM1 |
(259) 0x23964a VMOVSD %XMM1,(%R14,%R8,8) |
(259) 0x239650 CMP %R15,%RCX |
(259) 0x239653 LEA 0x1(%RCX),%RCX |
(259) 0x239657 JL 2395e0 |
0x239659 MOV -0x3c(%RBP),%ESI |
0x23965c LEA 0x276dd(%RIP),%RDI |
0x239663 VZEROUPPER |
0x239666 CALL 25f750 <@plt_start@+0x540> |
0x23966b ADD $0x68,%RSP |
0x23966f POP %RBX |
0x239670 POP %R12 |
0x239672 POP %R13 |
0x239674 POP %R14 |
0x239676 POP %R15 |
0x239678 POP %RBP |
0x239679 RET |
Path / |
Source file and lines | advec_mom.cpp:85-88 |
Module | exec |
nb instructions | 117 |
nb uops | 125 |
loop length | 483 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 4 |
used zmm registers | 6 |
nb stack references | 15 |
micro-operation queue | 20.83 cycles |
front end | 20.83 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 8.50 | 8.50 | 8.25 | 8.25 | 4.50 | 14.33 | 14.33 | 14.33 | 0.50 | 7.50 | 7.50 | 0.50 | 0.00 | 0.00 |
cycles | 8.50 | 8.50 | 8.25 | 8.25 | 4.50 | 14.67 | 14.67 | 14.67 | 0.50 | 7.50 | 7.50 | 0.50 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 20.83 |
Dispatch | 14.67 |
Overall L1 | 20.83 |
all | 6% |
load | 6% |
store | 0% |
mul | 0% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 0% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 6% |
load | 5% |
store | 0% |
mul | 0% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 10% |
all | 12% |
load | 16% |
store | 10% |
mul | 12% |
add-sub | 20% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 12% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 12% |
load | 16% |
store | 10% |
mul | 12% |
add-sub | 20% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB $0x68,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%RCX),%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RDX),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
LEA 0x1(%RAX),%R12D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD $0x3,%R15D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB %R12D,%R15D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 23966b <.omp_outlined..8+0x61b> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV (%R9),%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R8),%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD $0x4,%EBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP %ECX,%EBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JL 23966b <.omp_outlined..8+0x61b> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
LEA -0x1(%RCX),%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVQ $0,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVQ $0x1,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVL $0,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB %EDX,%EBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
IMUL %RBX,%R15 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
DEC %R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RCX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x40(%RBP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x88(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x27c54(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x58(%RBP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x38(%RBP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %ESI,-0x3c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CALL 25f740 <@plt_start@+0x530> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x58(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %R15,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVL %RAX,%R15 | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CMP %R15,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JG 239659 <.omp_outlined..8+0x609> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x18(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RBP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R13,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SUB %RCX,%R11 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R12,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
INC %R11 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%RDX),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RAX),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RAX),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RDX),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R8,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CMP $0x8,%R11 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JAE 239154 <.omp_outlined..8+0x104> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV -0x30(%RBP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R9,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 2395cf <.omp_outlined..8+0x57f> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VBROADCASTSD -0x2794a(%RIP),%ZMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 5 | 1 |
VPBROADCASTQ %RCX,%ZMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
VPADDQ -0x27432(%RIP),%ZMM0,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 1 |
VPBROADCASTQ -0x27974(%RIP),%ZMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 5 | 0.50 |
MOV %R11,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
AND $-0x8,%R11 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
VPBROADCASTD %R12D,%YMM2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTD %R9D,%YMM4 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTQ %R13,%ZMM5 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTD %EBX,%YMM6 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTQ %R8,%ZMM7 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
MOV %RBX,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R9,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R13,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R14,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD %R11,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R11,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPBROADCASTQ %RAX,%ZMM1 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VEXTRACTI32X4 $0x3,%ZMM1,%XMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 4 | 1 |
VEXTRACTI32X4 $0x2,%ZMM1,%XMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 4 | 1 |
VPBROADCASTD %EAX,%YMM3 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOV %RSI,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x78(%RBP),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x50(%RBP),%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x30(%RBP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x60(%RBP),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %RBX,-0x68(%RBP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV -0x70(%RBP),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
JE 239659 <.omp_outlined..8+0x609> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
VMOVSD -0x27dbf(%RIP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOV -0x3c(%RBP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
LEA 0x276dd(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 25f750 <@plt_start@+0x540> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x68,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
Source file and lines | advec_mom.cpp:85-88 |
Module | exec |
nb instructions | 117 |
nb uops | 125 |
loop length | 483 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 4 |
used zmm registers | 6 |
nb stack references | 15 |
micro-operation queue | 20.83 cycles |
front end | 20.83 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 8.50 | 8.50 | 8.25 | 8.25 | 4.50 | 14.33 | 14.33 | 14.33 | 0.50 | 7.50 | 7.50 | 0.50 | 0.00 | 0.00 |
cycles | 8.50 | 8.50 | 8.25 | 8.25 | 4.50 | 14.67 | 14.67 | 14.67 | 0.50 | 7.50 | 7.50 | 0.50 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 20.83 |
Dispatch | 14.67 |
Overall L1 | 20.83 |
all | 6% |
load | 6% |
store | 0% |
mul | 0% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 0% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 6% |
load | 5% |
store | 0% |
mul | 0% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 10% |
all | 12% |
load | 16% |
store | 10% |
mul | 12% |
add-sub | 20% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 12% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 12% |
load | 16% |
store | 10% |
mul | 12% |
add-sub | 20% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB $0x68,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%RCX),%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RDX),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
LEA 0x1(%RAX),%R12D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD $0x3,%R15D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB %R12D,%R15D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 23966b <.omp_outlined..8+0x61b> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV (%R9),%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R8),%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD $0x4,%EBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP %ECX,%EBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JL 23966b <.omp_outlined..8+0x61b> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
LEA -0x1(%RCX),%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVQ $0,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVQ $0x1,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVL $0,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB %EDX,%EBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
IMUL %RBX,%R15 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
DEC %R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RCX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x40(%RBP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x88(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x27c54(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x58(%RBP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x38(%RBP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %ESI,-0x3c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CALL 25f740 <@plt_start@+0x530> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x58(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %R15,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVL %RAX,%R15 | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CMP %R15,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JG 239659 <.omp_outlined..8+0x609> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x18(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RBP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R13,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SUB %RCX,%R11 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R12,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
INC %R11 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%RDX),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RAX),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RAX),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x10(%RDX),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R8,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CMP $0x8,%R11 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JAE 239154 <.omp_outlined..8+0x104> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV -0x30(%RBP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R9,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 2395cf <.omp_outlined..8+0x57f> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VBROADCASTSD -0x2794a(%RIP),%ZMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 5 | 1 |
VPBROADCASTQ %RCX,%ZMM0 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
VPADDQ -0x27432(%RIP),%ZMM0,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 1 |
VPBROADCASTQ -0x27974(%RIP),%ZMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 5 | 0.50 |
MOV %R11,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
AND $-0x8,%R11 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
VPBROADCASTD %R12D,%YMM2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTD %R9D,%YMM4 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTQ %R13,%ZMM5 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTD %EBX,%YMM6 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
VPBROADCASTQ %R8,%ZMM7 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
MOV %RBX,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R9,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R13,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R14,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD %R11,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R11,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPBROADCASTQ %RAX,%ZMM1 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 | 0 | 0 | 0 | 1 | 1 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VEXTRACTI32X4 $0x3,%ZMM1,%XMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 4 | 1 |
VEXTRACTI32X4 $0x2,%ZMM1,%XMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 4 | 1 |
VPBROADCASTD %EAX,%YMM3 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOV %RSI,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x78(%RBP),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x50(%RBP),%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x30(%RBP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x60(%RBP),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %RBX,-0x68(%RBP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV -0x70(%RBP),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
JE 239659 <.omp_outlined..8+0x609> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
VMOVSD -0x27dbf(%RIP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOV -0x3c(%RBP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
LEA 0x276dd(%RIP),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 25f750 <@plt_start@+0x540> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x68,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼.omp_outlined..8#0x239050– | 1.26 | 0.64 |
○Loop 258 - advec_mom.cpp:86-88 - exec | 1.26 | 0.64 |
○Loop 259 - advec_mom.cpp:86-88 - exec | 0 | 0 |