Function: .omp_outlined. | Module: exec | Source: accelerate.cpp:40-53 [...] | Coverage: 5.19% |
---|
Function: .omp_outlined. | Module: exec | Source: accelerate.cpp:40-53 [...] | Coverage: 5.19% |
---|
/beegfs/hackathon/users/eoseret/qaas_runs/170-854-8685/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/accelerate.cpp: 40 - 53 |
-------------------------------------------------------------------------------- |
40: #pragma omp parallel for simd collapse(2) |
41: for (int j = (y_min + 1); j < (y_max + 1 + 2); j++) { |
42: for (int i = (x_min + 1); i < (x_max + 1 + 2); i++) { |
43: double stepbymass_s = halfdt / ((density0(i - 1, j - 1) * volume(i - 1, j - 1) + density0(i - 1, j + 0) * volume(i - 1, j + 0) + |
44: density0(i, j) * volume(i, j) + density0(i + 0, j - 1) * volume(i + 0, j - 1)) * |
45: 0.25); |
46: xvel1(i, j) = xvel0(i, j) - stepbymass_s * (xarea(i, j) * (pressure(i, j) - pressure(i - 1, j + 0)) + |
47: xarea(i + 0, j - 1) * (pressure(i + 0, j - 1) - pressure(i - 1, j - 1))); |
48: yvel1(i, j) = yvel0(i, j) - stepbymass_s * (yarea(i, j) * (pressure(i, j) - pressure(i + 0, j - 1)) + |
49: yarea(i - 1, j + 0) * (pressure(i - 1, j + 0) - pressure(i - 1, j - 1))); |
50: xvel1(i, j) = xvel1(i, j) - stepbymass_s * (xarea(i, j) * (viscosity(i, j) - viscosity(i - 1, j + 0)) + |
51: xarea(i + 0, j - 1) * (viscosity(i + 0, j - 1) - viscosity(i - 1, j - 1))); |
52: yvel1(i, j) = yvel1(i, j) - stepbymass_s * (yarea(i, j) * (viscosity(i, j) - viscosity(i + 0, j - 1)) + |
53: yarea(i - 1, j + 0) * (viscosity(i - 1, j + 0) - viscosity(i - 1, j - 1))); |
/beegfs/hackathon/users/eoseret/qaas_runs/170-854-8685/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/context.h: 69 - 69 |
-------------------------------------------------------------------------------- |
69: T &operator()(size_t i, size_t j) const { return data[i + j * sizeX]; } |
0x231450 PUSH %RBP |
0x231451 MOV %RSP,%RBP |
0x231454 PUSH %R15 |
0x231456 PUSH %R14 |
0x231458 PUSH %R13 |
0x23145a PUSH %R12 |
0x23145c PUSH %RBX |
0x23145d SUB $0x198,%RSP |
0x231464 MOV (%RDX),%EAX |
0x231466 MOV %RAX,-0x90(%RBP) |
0x23146d INC %EAX |
0x23146f MOV (%RCX),%EBX |
0x231471 ADD $0x3,%EBX |
0x231474 MOV %RAX,-0x88(%RBP) |
0x23147b SUB %EAX,%EBX |
0x23147d JLE 231cf9 |
0x231483 MOV (%R8),%EAX |
0x231486 MOV %RAX,-0x150(%RBP) |
0x23148d INC %EAX |
0x23148f MOV (%R9),%R14D |
0x231492 ADD $0x3,%R14D |
0x231496 CMP %EAX,%R14D |
0x231499 JLE 231cf9 |
0x23149f MOV %RAX,-0x48(%RBP) |
0x2314a3 SUB %EAX,%R14D |
0x2314a6 IMUL %R14,%RBX |
0x2314aa DEC %RBX |
0x2314ad MOVQ $0,-0x170(%RBP) |
0x2314b8 MOV %RBX,-0xa8(%RBP) |
0x2314bf MOVQ $0x1,-0x1b8(%RBP) |
0x2314ca MOVL $0,-0xb0(%RBP) |
0x2314d4 MOV (%RDI),%ESI |
0x2314d6 SUB $0x8,%RSP |
0x2314da LEA -0x1b8(%RBP),%RAX |
0x2314e1 LEA -0xb0(%RBP),%RCX |
0x2314e8 LEA -0x170(%RBP),%R8 |
0x2314ef LEA -0xa8(%RBP),%R9 |
0x2314f6 MOV $0x211b20,%EDI |
0x2314fb MOV %ESI,-0xac(%RBP) |
0x231501 MOV $0x22,%EDX |
0x231506 PUSH $0x1 |
0x231508 PUSH $0x1 |
0x23150a PUSH %RAX |
0x23150b CALL 261360 <@plt_start@+0x4f0> |
0x231510 ADD $0x20,%RSP |
0x231514 MOV -0xa8(%RBP),%RAX |
0x23151b CMP %RBX,%RAX |
0x23151e CMOVL %RAX,%RBX |
0x231522 MOV %RBX,-0xa8(%RBP) |
0x231529 MOV -0x170(%RBP),%RCX |
0x231530 MOV %RBX,-0xb8(%RBP) |
0x231537 CMP %RBX,%RCX |
0x23153a JG 231ce9 |
0x231540 MOV 0x50(%RBP),%RAX |
0x231544 MOV %RCX,-0x58(%RBP) |
0x231548 MOV 0x40(%RBP),%RCX |
0x23154c MOV 0x38(%RBP),%RDX |
0x231550 MOV 0x30(%RBP),%RSI |
0x231554 MOV 0x28(%RBP),%RDI |
0x231558 MOV 0x20(%RBP),%R8 |
0x23155c MOV 0x18(%RBP),%R9 |
0x231560 MOV (%R9),%R10 |
0x231563 MOV %R10,-0x140(%RBP) |
0x23156a MOV 0x10(%R9),%R9 |
0x23156e MOV %R9,-0x138(%RBP) |
0x231575 MOV (%R8),%R9 |
0x231578 MOV %R9,-0x130(%RBP) |
0x23157f MOV 0x10(%R8),%R8 |
0x231583 MOV %R8,-0x128(%RBP) |
0x23158a MOV (%RSI),%R8 |
0x23158d MOV %R8,-0x120(%RBP) |
0x231594 MOV 0x10(%RSI),%RSI |
0x231598 MOV %RSI,-0x118(%RBP) |
0x23159f MOV (%RDX),%RSI |
0x2315a2 MOV %RSI,-0x110(%RBP) |
0x2315a9 MOV 0x10(%RDX),%RDX |
0x2315ad MOV %RDX,-0x40(%RBP) |
0x2315b1 MOV (%RCX),%RDX |
0x2315b4 MOV %RDX,-0x108(%RBP) |
0x2315bb MOV 0x10(%RCX),%RCX |
0x2315bf MOV %RCX,-0x100(%RBP) |
0x2315c6 MOV -0x58(%RBP),%RCX |
0x2315ca MOV (%RDI),%RDX |
0x2315cd MOV %RDX,-0xf8(%RBP) |
0x2315d4 MOV 0x10(%RDI),%RDX |
0x2315d8 MOV %RDX,-0x60(%RBP) |
0x2315dc MOV (%RAX),%RDX |
0x2315df MOV %RDX,-0xf0(%RBP) |
0x2315e6 MOV 0x10(%RAX),%RAX |
0x2315ea MOV %RAX,-0xe8(%RBP) |
0x2315f1 MOV 0x58(%RBP),%RAX |
0x2315f5 MOV (%RAX),%RDX |
0x2315f8 MOV %RDX,-0xe0(%RBP) |
0x2315ff MOV 0x10(%RAX),%RAX |
0x231603 MOV %RAX,-0xd8(%RBP) |
0x23160a MOV 0x48(%RBP),%RAX |
0x23160e MOV (%RAX),%RDX |
0x231611 MOV %RDX,-0xd0(%RBP) |
0x231618 MOV 0x10(%RAX),%RAX |
0x23161c MOV %RAX,-0x98(%RBP) |
0x231623 MOV 0x60(%RBP),%RAX |
0x231627 MOV (%RAX),%RDX |
0x23162a MOV %RDX,-0xc8(%RBP) |
0x231631 MOV 0x10(%RAX),%RAX |
0x231635 MOV %RAX,-0xc0(%RBP) |
0x23163c MOV -0xb8(%RBP),%RAX |
0x231643 SUB %RCX,%RAX |
0x231646 INC %RAX |
0x231649 CMP $0x2,%RAX |
0x23164d MOV %R14,-0x148(%RBP) |
0x231654 JB 231fc1 |
0x23165a MOV %RAX,-0x180(%RBP) |
0x231661 MOV %RAX,%RDX |
0x231664 AND $-0x2,%RDX |
0x231668 VMOVAPD -0x2e8f0(%RIP),%XMM0 |
0x231670 MOV %RCX,%RAX |
0x231673 MOV %RDX,-0x178(%RBP) |
0x23167a MOV %RDX,%RSI |
0x23167d JMP 231c69 |
0x231682 NOPW %CS:(%RAX,%RAX,1) |
(139) 0x231690 MOV %RCX,%RAX |
(139) 0x231693 CQTO |
(139) 0x231695 IDIV %R14 |
(139) 0x231698 LEA (%R9,%RDI,1),%R11D |
(139) 0x23169c LEA (%R9,%RAX,1),%R10D |
(139) 0x2316a0 LEA (%RBX,%R8,1),%ECX |
(139) 0x2316a4 MOV %ECX,-0x80(%RBP) |
(139) 0x2316a7 LEA (%RBX,%RDX,1),%ECX |
(139) 0x2316aa MOV %ECX,-0x38(%RBP) |
(139) 0x2316ad MOV -0x150(%RBP),%RBX |
(139) 0x2316b4 ADD %EBX,%R8D |
(139) 0x2316b7 ADD %EBX,%EDX |
(139) 0x2316b9 MOVSXD %R8D,%RBX |
(139) 0x2316bc MOVSXD %EDX,%R14 |
(139) 0x2316bf ADD %ESI,%EDI |
(139) 0x2316c1 ADD %ESI,%EAX |
(139) 0x2316c3 MOVSXD %EDI,%R8 |
(139) 0x2316c6 MOV %R8,-0x50(%RBP) |
(139) 0x2316ca CLTQ |
(139) 0x2316cc MOV %RAX,-0x168(%RBP) |
(139) 0x2316d3 MOV -0x140(%RBP),%R15 |
(139) 0x2316da MOV %R15,%RCX |
(139) 0x2316dd IMUL %R8,%RCX |
(139) 0x2316e1 MOV %R15,%RDX |
(139) 0x2316e4 IMUL %RAX,%RDX |
(139) 0x2316e8 LEA (%RCX,%RBX,1),%RSI |
(139) 0x2316ec LEA (%RDX,%R14,1),%RDI |
(139) 0x2316f0 MOV -0x138(%RBP),%R9 |
(139) 0x2316f7 VMOVSD (%R9,%RSI,8),%XMM1 |
(139) 0x2316fd VMOVHPD (%R9,%RDI,8),%XMM1,%XMM2 |
(139) 0x231703 MOV -0x130(%RBP),%R12 |
(139) 0x23170a MOV %R12,%RSI |
(139) 0x23170d IMUL %R8,%RSI |
(139) 0x231711 MOV %R12,%R8 |
(139) 0x231714 IMUL %RAX,%R8 |
(139) 0x231718 LEA (%RSI,%RBX,1),%RDI |
(139) 0x23171c MOV -0x128(%RBP),%RAX |
(139) 0x231723 VMOVSD (%RAX,%RDI,8),%XMM1 |
(139) 0x231728 LEA (%R8,%R14,1),%RDI |
(139) 0x23172c VMOVHPD (%RAX,%RDI,8),%XMM1,%XMM3 |
(139) 0x231731 MOVSXD %R11D,%RDI |
(139) 0x231734 MOV %RDI,-0x30(%RBP) |
(139) 0x231738 MOV %R15,%R11 |
(139) 0x23173b IMUL %RDI,%R11 |
(139) 0x23173f MOV %RBX,%RDI |
(139) 0x231742 MOV %RBX,-0x160(%RBP) |
(139) 0x231749 ADD %R11,%RBX |
(139) 0x23174c VMOVSD (%R9,%RBX,8),%XMM1 |
(139) 0x231752 MOVSXD %R10D,%R13 |
(139) 0x231755 MOV %R15,%R10 |
(139) 0x231758 IMUL %R13,%R10 |
(139) 0x23175c MOV %R13,-0x158(%RBP) |
(139) 0x231763 MOV %R14,-0xa0(%RBP) |
(139) 0x23176a LEA (%R10,%R14,1),%RBX |
(139) 0x23176e VMOVHPD (%R9,%RBX,8),%XMM1,%XMM4 |
(139) 0x231774 MOV %R12,%RBX |
(139) 0x231777 IMUL -0x30(%RBP),%RBX |
(139) 0x23177c LEA (%RBX,%RDI,1),%R15 |
(139) 0x231780 VMOVSD (%RAX,%R15,8),%XMM1 |
(139) 0x231786 MOV %R12,%R15 |
(139) 0x231789 IMUL %R13,%R15 |
(139) 0x23178d LEA (%R15,%R14,1),%R12 |
(139) 0x231791 VMOVHPD (%RAX,%R12,8),%XMM1,%XMM5 |
(139) 0x231797 MOVSXD -0x80(%RBP),%R14 |
(139) 0x23179b ADD %R14,%R11 |
(139) 0x23179e VMOVSD (%R9,%R11,8),%XMM1 |
(139) 0x2317a4 MOVSXD -0x38(%RBP),%R13 |
(139) 0x2317a8 ADD %R13,%R10 |
(139) 0x2317ab VMOVHPD (%R9,%R10,8),%XMM1,%XMM6 |
(139) 0x2317b1 ADD %R14,%RBX |
(139) 0x2317b4 VMOVSD (%RAX,%RBX,8),%XMM7 |
(139) 0x2317b9 MOV 0x10(%RBP),%RDI |
(139) 0x2317bd VMOVDDUP (%RDI),%XMM1 |
(139) 0x2317c1 VMULPD %XMM3,%XMM2,%XMM2 |
(139) 0x2317c5 VMULPD %XMM5,%XMM4,%XMM3 |
(139) 0x2317c9 ADD %R13,%R15 |
(139) 0x2317cc VMOVHPD (%RAX,%R15,8),%XMM7,%XMM4 |
(139) 0x2317d2 VADDPD %XMM3,%XMM2,%XMM2 |
(139) 0x2317d6 VMULPD %XMM4,%XMM6,%XMM3 |
(139) 0x2317da ADD %R14,%RCX |
(139) 0x2317dd ADD %R13,%RDX |
(139) 0x2317e0 VMOVSD (%R9,%RCX,8),%XMM4 |
(139) 0x2317e6 VMOVHPD (%R9,%RDX,8),%XMM4,%XMM4 |
(139) 0x2317ec ADD %R14,%RSI |
(139) 0x2317ef MOV %R14,%R11 |
(139) 0x2317f2 ADD %R13,%R8 |
(139) 0x2317f5 VMOVSD (%RAX,%RSI,8),%XMM5 |
(139) 0x2317fa VMOVHPD (%RAX,%R8,8),%XMM5,%XMM5 |
(139) 0x231800 VADDPD %XMM2,%XMM3,%XMM2 |
(139) 0x231804 VMULPD %XMM5,%XMM4,%XMM3 |
(139) 0x231808 VADDPD %XMM2,%XMM3,%XMM3 |
(139) 0x23180c MOV -0x120(%RBP),%RCX |
(139) 0x231813 MOV %RCX,%RAX |
(139) 0x231816 MOV -0x30(%RBP),%R9 |
(139) 0x23181a IMUL %R9,%RAX |
(139) 0x23181e MOV -0x158(%RBP),%RDI |
(139) 0x231825 IMUL %RDI,%RCX |
(139) 0x231829 ADD %R14,%RAX |
(139) 0x23182c ADD %R13,%RCX |
(139) 0x23182f MOV -0x118(%RBP),%RDX |
(139) 0x231836 VMOVSD (%RDX,%RAX,8),%XMM2 |
(139) 0x23183b VMOVHPD (%RDX,%RCX,8),%XMM2,%XMM2 |
(139) 0x231840 VMULPD %XMM0,%XMM3,%XMM4 |
(139) 0x231844 MOV -0x110(%RBP),%RBX |
(139) 0x23184b MOV %RBX,%RCX |
(139) 0x23184e IMUL %R9,%RCX |
(139) 0x231852 MOV %RBX,%RDX |
(139) 0x231855 IMUL %RDI,%RDX |
(139) 0x231859 ADD %R14,%RCX |
(139) 0x23185c MOV %RCX,-0x38(%RBP) |
(139) 0x231860 ADD %R13,%RDX |
(139) 0x231863 MOV %RDX,-0x80(%RBP) |
(139) 0x231867 MOV -0x40(%RBP),%RAX |
(139) 0x23186b VMOVSD (%RAX,%RCX,8),%XMM3 |
(139) 0x231870 VMOVHPD (%RAX,%RDX,8),%XMM3,%XMM3 |
(139) 0x231875 MOV -0x108(%RBP),%R8 |
(139) 0x23187c MOV %R8,%R12 |
(139) 0x23187f IMUL %R9,%R12 |
(139) 0x231883 MOV %R8,%R9 |
(139) 0x231886 IMUL %RDI,%R9 |
(139) 0x23188a MOV %RDI,%R14 |
(139) 0x23188d LEA (%R12,%R11,1),%RCX |
(139) 0x231891 MOV %RCX,-0x78(%RBP) |
(139) 0x231895 MOV -0x100(%RBP),%RAX |
(139) 0x23189c VMOVSD (%RAX,%RCX,8),%XMM5 |
(139) 0x2318a1 LEA (%R9,%R13,1),%RCX |
(139) 0x2318a5 MOV %RCX,-0x70(%RBP) |
(139) 0x2318a9 VMOVHPD (%RAX,%RCX,8),%XMM5,%XMM5 |
(139) 0x2318ae MOV -0x160(%RBP),%R15 |
(139) 0x2318b5 ADD %R15,%R12 |
(139) 0x2318b8 MOV -0xa0(%RBP),%R10 |
(139) 0x2318bf ADD %R10,%R9 |
(139) 0x2318c2 VMOVSD (%RAX,%R12,8),%XMM6 |
(139) 0x2318c8 VMOVHPD (%RAX,%R9,8),%XMM6,%XMM6 |
(139) 0x2318ce VDIVPD %XMM4,%XMM1,%XMM1 |
(139) 0x2318d2 VSUBPD %XMM6,%XMM5,%XMM4 |
(139) 0x2318d6 MOV %RBX,%RDI |
(139) 0x2318d9 MOV -0x50(%RBP),%RDX |
(139) 0x2318dd IMUL %RDX,%RDI |
(139) 0x2318e1 MOV -0x168(%RBP),%RSI |
(139) 0x2318e8 IMUL %RSI,%RBX |
(139) 0x2318ec ADD %R11,%RDI |
(139) 0x2318ef MOV %RDI,-0x1a0(%RBP) |
(139) 0x2318f6 ADD %R13,%RBX |
(139) 0x2318f9 MOV -0x40(%RBP),%RCX |
(139) 0x2318fd VMOVSD (%RCX,%RDI,8),%XMM5 |
(139) 0x231902 VMOVHPD (%RCX,%RBX,8),%XMM5,%XMM5 |
(139) 0x231907 MOV %R8,%RDI |
(139) 0x23190a IMUL %RDX,%RDI |
(139) 0x23190e MOV %R8,%RDX |
(139) 0x231911 IMUL %RSI,%RDX |
(139) 0x231915 LEA (%RDI,%R11,1),%RCX |
(139) 0x231919 MOV %RCX,-0x68(%RBP) |
(139) 0x23191d VMOVSD (%RAX,%RCX,8),%XMM6 |
(139) 0x231922 LEA (%RDX,%R13,1),%RCX |
(139) 0x231926 MOV %RCX,-0x188(%RBP) |
(139) 0x23192d VMOVHPD (%RAX,%RCX,8),%XMM6,%XMM6 |
(139) 0x231932 VMULPD %XMM4,%XMM3,%XMM3 |
(139) 0x231936 ADD %R15,%RDI |
(139) 0x231939 ADD %R10,%RDX |
(139) 0x23193c VMOVSD (%RAX,%RDI,8),%XMM4 |
(139) 0x231941 VMOVHPD (%RAX,%RDX,8),%XMM4,%XMM4 |
(139) 0x231946 VSUBPD %XMM4,%XMM6,%XMM4 |
(139) 0x23194a VMULPD %XMM4,%XMM5,%XMM4 |
(139) 0x23194e VADDPD %XMM4,%XMM3,%XMM3 |
(139) 0x231952 VMULPD %XMM3,%XMM1,%XMM3 |
(139) 0x231956 VADDPD %XMM2,%XMM3,%XMM2 |
(139) 0x23195a MOV -0xf8(%RBP),%R10 |
(139) 0x231961 MOV %R10,%RCX |
(139) 0x231964 MOV -0x30(%RBP),%R8 |
(139) 0x231968 IMUL %R8,%RCX |
(139) 0x23196c IMUL %R14,%R10 |
(139) 0x231970 ADD %R11,%RCX |
(139) 0x231973 MOV %RCX,-0x198(%RBP) |
(139) 0x23197a ADD %R13,%R10 |
(139) 0x23197d MOV %R10,-0x190(%RBP) |
(139) 0x231984 MOV -0x60(%RBP),%RSI |
(139) 0x231988 VMOVLPD %XMM2,(%RSI,%RCX,8) |
(139) 0x23198d VMOVHPD %XMM2,(%RSI,%R10,8) |
(139) 0x231993 MOV -0xf0(%RBP),%RSI |
(139) 0x23199a MOV %RSI,%R15 |
(139) 0x23199d IMUL %R8,%R15 |
(139) 0x2319a1 ADD %R11,%R15 |
(139) 0x2319a4 MOV %R11,%R8 |
(139) 0x2319a7 MOV -0xe8(%RBP),%RCX |
(139) 0x2319ae VMOVSD (%RCX,%R15,8),%XMM2 |
(139) 0x2319b4 IMUL %R14,%RSI |
(139) 0x2319b8 ADD %R13,%RSI |
(139) 0x2319bb VMOVHPD (%RCX,%RSI,8),%XMM2,%XMM2 |
(139) 0x2319c0 MOV -0x78(%RBP),%RCX |
(139) 0x2319c4 VMOVSD (%RAX,%RCX,8),%XMM3 |
(139) 0x2319c9 MOV -0x70(%RBP),%RCX |
(139) 0x2319cd VMOVHPD (%RAX,%RCX,8),%XMM3,%XMM3 |
(139) 0x2319d2 MOV -0x68(%RBP),%RCX |
(139) 0x2319d6 VMOVSD (%RAX,%RCX,8),%XMM4 |
(139) 0x2319db MOV -0x188(%RBP),%RCX |
(139) 0x2319e2 VMOVHPD (%RAX,%RCX,8),%XMM4,%XMM4 |
(139) 0x2319e7 VMOVSD (%RAX,%R12,8),%XMM5 |
(139) 0x2319ed VMOVHPD (%RAX,%R9,8),%XMM5,%XMM5 |
(139) 0x2319f3 VMOVSD (%RAX,%RDI,8),%XMM6 |
(139) 0x2319f8 VMOVHPD (%RAX,%RDX,8),%XMM6,%XMM6 |
(139) 0x2319fd MOV -0xe0(%RBP),%R11 |
(139) 0x231a04 MOV %R11,%R10 |
(139) 0x231a07 MOV -0x30(%RBP),%R12 |
(139) 0x231a0b IMUL %R12,%R10 |
(139) 0x231a0f IMUL %R14,%R11 |
(139) 0x231a13 MOV %R8,%RAX |
(139) 0x231a16 LEA (%R10,%R8,1),%RCX |
(139) 0x231a1a MOV %RCX,-0x78(%RBP) |
(139) 0x231a1e MOV -0xd8(%RBP),%RDI |
(139) 0x231a25 VMOVSD (%RDI,%RCX,8),%XMM7 |
(139) 0x231a2a LEA (%R11,%R13,1),%RCX |
(139) 0x231a2e MOV %RCX,-0x70(%RBP) |
(139) 0x231a32 VMOVHPD (%RDI,%RCX,8),%XMM7,%XMM7 |
(139) 0x231a37 VSUBPD %XMM4,%XMM3,%XMM3 |
(139) 0x231a3b VMULPD %XMM3,%XMM7,%XMM3 |
(139) 0x231a3f MOV -0x160(%RBP),%RDX |
(139) 0x231a46 ADD %RDX,%R10 |
(139) 0x231a49 ADD -0xa0(%RBP),%R11 |
(139) 0x231a50 VMOVSD (%RDI,%R10,8),%XMM4 |
(139) 0x231a56 VMOVHPD (%RDI,%R11,8),%XMM4,%XMM4 |
(139) 0x231a5c VSUBPD %XMM6,%XMM5,%XMM5 |
(139) 0x231a60 VMULPD %XMM5,%XMM4,%XMM4 |
(139) 0x231a64 VADDPD %XMM4,%XMM3,%XMM3 |
(139) 0x231a68 VMULPD %XMM3,%XMM1,%XMM3 |
(139) 0x231a6c VADDPD %XMM2,%XMM3,%XMM2 |
(139) 0x231a70 MOV -0xd0(%RBP),%R9 |
(139) 0x231a77 MOV %R9,%R8 |
(139) 0x231a7a IMUL %R12,%R8 |
(139) 0x231a7e MOV %R12,%RSI |
(139) 0x231a81 MOV %R9,%R12 |
(139) 0x231a84 IMUL %R14,%R12 |
(139) 0x231a88 ADD %RAX,%R8 |
(139) 0x231a8b MOV %R8,-0x68(%RBP) |
(139) 0x231a8f MOV %RAX,%RCX |
(139) 0x231a92 ADD %R13,%R12 |
(139) 0x231a95 MOV -0x98(%RBP),%RAX |
(139) 0x231a9c VMOVLPD %XMM2,(%RAX,%R8,8) |
(139) 0x231aa2 VMOVHPD %XMM2,(%RAX,%R12,8) |
(139) 0x231aa8 MOV -0x40(%RBP),%RAX |
(139) 0x231aac MOV -0x38(%RBP),%R15 |
(139) 0x231ab0 VMOVSD (%RAX,%R15,8),%XMM2 |
(139) 0x231ab6 MOV -0x80(%RBP),%R15 |
(139) 0x231aba VMOVHPD (%RAX,%R15,8),%XMM2,%XMM2 |
(139) 0x231ac0 MOV -0x1a0(%RBP),%R15 |
(139) 0x231ac7 VMOVSD (%RAX,%R15,8),%XMM3 |
(139) 0x231acd VMOVHPD (%RAX,%RBX,8),%XMM3,%XMM3 |
(139) 0x231ad2 MOV -0xc8(%RBP),%R15 |
(139) 0x231ad9 MOV %RSI,%R8 |
(139) 0x231adc IMUL %R15,%R8 |
(139) 0x231ae0 LEA (%R8,%RCX,1),%RAX |
(139) 0x231ae4 MOV %RAX,-0x38(%RBP) |
(139) 0x231ae8 ADD %RDX,%R8 |
(139) 0x231aeb MOV %R8,-0x30(%RBP) |
(139) 0x231aef MOV -0x50(%RBP),%RBX |
(139) 0x231af3 IMUL %R15,%RBX |
(139) 0x231af7 ADD %RBX,%RCX |
(139) 0x231afa MOV %RCX,-0x50(%RBP) |
(139) 0x231afe ADD %RDX,%RBX |
(139) 0x231b01 MOV -0x158(%RBP),%RDX |
(139) 0x231b08 IMUL %R15,%RDX |
(139) 0x231b0c LEA (%RDX,%R13,1),%RSI |
(139) 0x231b10 MOV -0xa0(%RBP),%RCX |
(139) 0x231b17 ADD %RCX,%RDX |
(139) 0x231b1a MOV -0x168(%RBP),%RAX |
(139) 0x231b21 IMUL %R15,%RAX |
(139) 0x231b25 ADD %RAX,%R13 |
(139) 0x231b28 ADD %RCX,%RAX |
(139) 0x231b2b MOV -0x60(%RBP),%RCX |
(139) 0x231b2f MOV -0x198(%RBP),%R9 |
(139) 0x231b36 VMOVSD (%RCX,%R9,8),%XMM4 |
(139) 0x231b3c MOV -0x190(%RBP),%R8 |
(139) 0x231b43 VMOVHPD (%RCX,%R8,8),%XMM4,%XMM4 |
(139) 0x231b49 MOV -0xc0(%RBP),%R15 |
(139) 0x231b50 MOV -0x38(%RBP),%R14 |
(139) 0x231b54 VMOVSD (%R15,%R14,8),%XMM5 |
(139) 0x231b5a VMOVHPD (%R15,%RSI,8),%XMM5,%XMM5 |
(139) 0x231b60 MOV %RSI,%R14 |
(139) 0x231b63 MOV -0x30(%RBP),%RSI |
(139) 0x231b67 VMOVSD (%R15,%RSI,8),%XMM6 |
(139) 0x231b6d VMOVHPD (%R15,%RDX,8),%XMM6,%XMM6 |
(139) 0x231b73 VSUBPD %XMM6,%XMM5,%XMM5 |
(139) 0x231b77 VMULPD %XMM5,%XMM2,%XMM2 |
(139) 0x231b7b MOV -0x50(%RBP),%RSI |
(139) 0x231b7f VMOVSD (%R15,%RSI,8),%XMM5 |
(139) 0x231b85 VMOVHPD (%R15,%R13,8),%XMM5,%XMM5 |
(139) 0x231b8b VMOVSD (%R15,%RBX,8),%XMM6 |
(139) 0x231b91 VMOVHPD (%R15,%RAX,8),%XMM6,%XMM6 |
(139) 0x231b97 VSUBPD %XMM6,%XMM5,%XMM5 |
(139) 0x231b9b VMULPD %XMM5,%XMM3,%XMM3 |
(139) 0x231b9f VADDPD %XMM3,%XMM2,%XMM2 |
(139) 0x231ba3 VMULPD %XMM2,%XMM1,%XMM2 |
(139) 0x231ba7 VADDPD %XMM4,%XMM2,%XMM2 |
(139) 0x231bab VMOVLPD %XMM2,(%RCX,%R9,8) |
(139) 0x231bb1 VMOVHPD %XMM2,(%RCX,%R8,8) |
(139) 0x231bb7 MOV -0x78(%RBP),%RCX |
(139) 0x231bbb VMOVSD (%RDI,%RCX,8),%XMM2 |
(139) 0x231bc0 MOV -0x70(%RBP),%RCX |
(139) 0x231bc4 VMOVHPD (%RDI,%RCX,8),%XMM2,%XMM2 |
(139) 0x231bc9 MOV -0x38(%RBP),%RCX |
(139) 0x231bcd VMOVSD (%R15,%RCX,8),%XMM3 |
(139) 0x231bd3 VMOVHPD (%R15,%R14,8),%XMM3,%XMM3 |
(139) 0x231bd9 VMOVSD (%R15,%RSI,8),%XMM4 |
(139) 0x231bdf VMOVHPD (%R15,%R13,8),%XMM4,%XMM4 |
(139) 0x231be5 VMOVSD (%RDI,%R10,8),%XMM5 |
(139) 0x231beb VMOVHPD (%RDI,%R11,8),%XMM5,%XMM5 |
(139) 0x231bf1 MOV -0x30(%RBP),%RCX |
(139) 0x231bf5 VMOVSD (%R15,%RCX,8),%XMM6 |
(139) 0x231bfb VMOVHPD (%R15,%RDX,8),%XMM6,%XMM6 |
(139) 0x231c01 VMOVSD (%R15,%RBX,8),%XMM7 |
(139) 0x231c07 VMOVHPD (%R15,%RAX,8),%XMM7,%XMM7 |
(139) 0x231c0d VSUBPD %XMM4,%XMM3,%XMM3 |
(139) 0x231c11 VMULPD %XMM3,%XMM2,%XMM2 |
(139) 0x231c15 MOV -0x68(%RBP),%RAX |
(139) 0x231c19 MOV -0x98(%RBP),%RCX |
(139) 0x231c20 VMOVSD (%RCX,%RAX,8),%XMM3 |
(139) 0x231c25 VMOVHPD (%RCX,%R12,8),%XMM3,%XMM3 |
(139) 0x231c2b VSUBPD %XMM7,%XMM6,%XMM4 |
(139) 0x231c2f VMULPD %XMM4,%XMM5,%XMM4 |
(139) 0x231c33 VADDPD %XMM4,%XMM2,%XMM2 |
(139) 0x231c37 VMULPD %XMM2,%XMM1,%XMM1 |
(139) 0x231c3b VADDPD %XMM3,%XMM1,%XMM1 |
(139) 0x231c3f VMOVLPD %XMM1,(%RCX,%RAX,8) |
(139) 0x231c44 VMOVHPD %XMM1,(%RCX,%R12,8) |
(139) 0x231c4a MOV -0x1b0(%RBP),%RAX |
(139) 0x231c51 ADD $0x2,%RAX |
(139) 0x231c55 MOV -0x1a8(%RBP),%RSI |
(139) 0x231c5c ADD $-0x2,%RSI |
(139) 0x231c60 MOV -0x148(%RBP),%R14 |
(139) 0x231c67 JE 231cd5 |
(139) 0x231c69 LEA 0x1(%RAX),%RCX |
(139) 0x231c6d MOV %RAX,%RDX |
(139) 0x231c70 SHR $0x20,%RDX |
(139) 0x231c74 MOV %RAX,-0x1b0(%RBP) |
(139) 0x231c7b MOV %RSI,-0x1a8(%RBP) |
(139) 0x231c82 JE 231ca0 |
(139) 0x231c84 CQTO |
(139) 0x231c86 IDIV %R14 |
(139) 0x231c89 MOV %RDX,%R8 |
(139) 0x231c8c MOV %RAX,%RDI |
(139) 0x231c8f JMP 231caa |
0x231c91 NOPW %CS:(%RAX,%RAX,1) |
(139) 0x231ca0 XOR %EDX,%EDX |
(139) 0x231ca2 DIV %R14D |
(139) 0x231ca5 MOV %EDX,%R8D |
(139) 0x231ca8 MOV %EAX,%EDI |
(139) 0x231caa MOV -0x90(%RBP),%RSI |
(139) 0x231cb1 MOV -0x88(%RBP),%R9 |
(139) 0x231cb8 MOV -0x48(%RBP),%RBX |
(139) 0x231cbc MOV %RCX,%RAX |
(139) 0x231cbf SHR $0x20,%RAX |
(139) 0x231cc3 JNE 231690 |
(139) 0x231cc9 MOV %ECX,%EAX |
(139) 0x231ccb XOR %EDX,%EDX |
(139) 0x231ccd DIV %R14D |
(139) 0x231cd0 JMP 231698 |
0x231cd5 MOV -0x178(%RBP),%RAX |
0x231cdc CMP %RAX,-0x180(%RBP) |
0x231ce3 MOV -0x58(%RBP),%RCX |
0x231ce7 JNE 231d0b |
0x231ce9 MOV $0x211b38,%EDI |
0x231cee MOV -0xac(%RBP),%ESI |
0x231cf4 CALL 261370 <@plt_start@+0x500> |
0x231cf9 ADD $0x198,%RSP |
0x231d00 POP %RBX |
0x231d01 POP %R12 |
0x231d03 POP %R13 |
0x231d05 POP %R14 |
0x231d07 POP %R15 |
0x231d09 POP %RBP |
0x231d0a RET |
0x231d0b ADD %RAX,%RCX |
0x231d0e JMP 231fc1 |
0x231d13 NOPW %CS:(%RAX,%RAX,1) |
(138) 0x231d20 MOV %RCX,%RAX |
(138) 0x231d23 CQTO |
(138) 0x231d25 IDIV %R14 |
(138) 0x231d28 MOV -0x48(%RBP),%RSI |
(138) 0x231d2c MOV -0x88(%RBP),%RCX |
(138) 0x231d33 ADD %EAX,%ECX |
(138) 0x231d35 LEA (%RSI,%RDX,1),%EDI |
(138) 0x231d38 MOV 0x10(%RBP),%RSI |
(138) 0x231d3c VMOVSD (%RSI),%XMM0 |
(138) 0x231d40 ADD -0x150(%RBP),%EDX |
(138) 0x231d46 MOVSXD %EDX,%R13 |
(138) 0x231d49 ADD -0x90(%RBP),%EAX |
(138) 0x231d4f MOVSXD %EAX,%RDX |
(138) 0x231d52 MOV -0x140(%RBP),%R10 |
(138) 0x231d59 MOV %R10,%R8 |
(138) 0x231d5c IMUL %RDX,%R8 |
(138) 0x231d60 LEA (%R8,%R13,1),%RSI |
(138) 0x231d64 MOV -0x138(%RBP),%RBX |
(138) 0x231d6b VMOVSD (%RBX,%RSI,8),%XMM1 |
(138) 0x231d70 MOV -0x130(%RBP),%R11 |
(138) 0x231d77 MOV %R11,%R9 |
(138) 0x231d7a IMUL %RDX,%R9 |
(138) 0x231d7e MOVSXD %ECX,%RSI |
(138) 0x231d81 MOV %R10,%RCX |
(138) 0x231d84 IMUL %RSI,%RCX |
(138) 0x231d88 LEA (%RCX,%R13,1),%R10 |
(138) 0x231d8c VMOVSD (%RBX,%R10,8),%XMM2 |
(138) 0x231d92 MOV %R11,%R10 |
(138) 0x231d95 IMUL %RSI,%R10 |
(138) 0x231d99 LEA (%R10,%R13,1),%R11 |
(138) 0x231d9d MOV -0x128(%RBP),%R14 |
(138) 0x231da4 VMULSD (%R14,%R11,8),%XMM2,%XMM2 |
(138) 0x231daa LEA (%R9,%R13,1),%R11 |
(138) 0x231dae VMULSD (%R14,%R11,8),%XMM1,%XMM1 |
(138) 0x231db4 VADDSD %XMM2,%XMM1,%XMM1 |
(138) 0x231db8 MOVSXD %EDI,%RDI |
(138) 0x231dbb ADD %RDI,%RCX |
(138) 0x231dbe VMOVSD (%RBX,%RCX,8),%XMM2 |
(138) 0x231dc3 ADD %RDI,%R10 |
(138) 0x231dc6 VMULSD (%R14,%R10,8),%XMM2,%XMM2 |
(138) 0x231dcc VADDSD %XMM1,%XMM2,%XMM1 |
(138) 0x231dd0 ADD %RDI,%R8 |
(138) 0x231dd3 VMOVSD (%RBX,%R8,8),%XMM2 |
(138) 0x231dd9 ADD %RDI,%R9 |
(138) 0x231ddc VMULSD (%R14,%R9,8),%XMM2,%XMM2 |
(138) 0x231de2 VADDSD %XMM1,%XMM2,%XMM1 |
(138) 0x231de6 VMULSD -0x2f176(%RIP),%XMM1,%XMM1 |
(138) 0x231dee VDIVSD %XMM1,%XMM0,%XMM0 |
(138) 0x231df2 MOV -0x120(%RBP),%R9 |
(138) 0x231df9 IMUL %RSI,%R9 |
(138) 0x231dfd ADD %RDI,%R9 |
(138) 0x231e00 MOV -0x110(%RBP),%R8 |
(138) 0x231e07 MOV %R8,%RCX |
(138) 0x231e0a IMUL %RSI,%RCX |
(138) 0x231e0e MOV -0x108(%RBP),%RBX |
(138) 0x231e15 MOV %RBX,%R10 |
(138) 0x231e18 IMUL %RSI,%R10 |
(138) 0x231e1c LEA (%R10,%RDI,1),%R11 |
(138) 0x231e20 MOV -0x100(%RBP),%R12 |
(138) 0x231e27 VMOVSD (%R12,%R11,8),%XMM1 |
(138) 0x231e2d ADD %R13,%R10 |
(138) 0x231e30 VSUBSD (%R12,%R10,8),%XMM1,%XMM1 |
(138) 0x231e36 IMUL %RDX,%R8 |
(138) 0x231e3a ADD %RDI,%R8 |
(138) 0x231e3d IMUL %RDX,%RBX |
(138) 0x231e41 LEA (%RBX,%RDI,1),%R14 |
(138) 0x231e45 VMOVSD (%R12,%R14,8),%XMM2 |
(138) 0x231e4b ADD %R13,%RBX |
(138) 0x231e4e VSUBSD (%R12,%RBX,8),%XMM2,%XMM2 |
(138) 0x231e54 MOV -0x40(%RBP),%RAX |
(138) 0x231e58 VMULSD (%RAX,%R8,8),%XMM2,%XMM2 |
(138) 0x231e5e ADD %RDI,%RCX |
(138) 0x231e61 VMULSD (%RAX,%RCX,8),%XMM1,%XMM1 |
(138) 0x231e66 VADDSD %XMM2,%XMM1,%XMM1 |
(138) 0x231e6a VMULSD %XMM1,%XMM0,%XMM1 |
(138) 0x231e6e MOV -0x118(%RBP),%R15 |
(138) 0x231e75 VADDSD (%R15,%R9,8),%XMM1,%XMM1 |
(138) 0x231e7b MOV -0xf8(%RBP),%R9 |
(138) 0x231e82 IMUL %RSI,%R9 |
(138) 0x231e86 ADD %RDI,%R9 |
(138) 0x231e89 MOV -0x60(%RBP),%RAX |
(138) 0x231e8d VMOVSD %XMM1,(%RAX,%R9,8) |
(138) 0x231e93 VMOVSD (%R12,%R11,8),%XMM1 |
(138) 0x231e99 MOV -0xf0(%RBP),%R15 |
(138) 0x231ea0 IMUL %RSI,%R15 |
(138) 0x231ea4 VSUBSD (%R12,%R14,8),%XMM1,%XMM1 |
(138) 0x231eaa ADD %RDI,%R15 |
(138) 0x231ead MOV -0xe0(%RBP),%R11 |
(138) 0x231eb4 IMUL %RSI,%R11 |
(138) 0x231eb8 VMOVSD (%R12,%R10,8),%XMM2 |
(138) 0x231ebe LEA (%R11,%RDI,1),%R10 |
(138) 0x231ec2 ADD %R13,%R11 |
(138) 0x231ec5 VSUBSD (%R12,%RBX,8),%XMM2,%XMM2 |
(138) 0x231ecb MOV -0xd8(%RBP),%R12 |
(138) 0x231ed2 VMULSD (%R12,%R11,8),%XMM2,%XMM2 |
(138) 0x231ed8 VMULSD (%R12,%R10,8),%XMM1,%XMM1 |
(138) 0x231ede VADDSD %XMM2,%XMM1,%XMM1 |
(138) 0x231ee2 VMULSD %XMM1,%XMM0,%XMM1 |
(138) 0x231ee6 MOV -0xe8(%RBP),%RBX |
(138) 0x231eed VADDSD (%RBX,%R15,8),%XMM1,%XMM1 |
(138) 0x231ef3 MOV -0xd0(%RBP),%RBX |
(138) 0x231efa IMUL %RSI,%RBX |
(138) 0x231efe ADD %RDI,%RBX |
(138) 0x231f01 MOV -0x98(%RBP),%R15 |
(138) 0x231f08 VMOVSD %XMM1,(%R15,%RBX,8) |
(138) 0x231f0e MOV -0xc8(%RBP),%RAX |
(138) 0x231f15 IMUL %RAX,%RSI |
(138) 0x231f19 LEA (%RSI,%RDI,1),%R14 |
(138) 0x231f1d IMUL %RAX,%RDX |
(138) 0x231f21 ADD %RDX,%RDI |
(138) 0x231f24 MOV -0xc0(%RBP),%RAX |
(138) 0x231f2b VMOVSD (%RAX,%RDI,8),%XMM1 |
(138) 0x231f30 ADD %R13,%RDX |
(138) 0x231f33 VSUBSD (%RAX,%RDX,8),%XMM1,%XMM1 |
(138) 0x231f38 ADD %R13,%RSI |
(138) 0x231f3b MOV -0x40(%RBP),%R13 |
(138) 0x231f3f VMULSD (%R13,%R8,8),%XMM1,%XMM1 |
(138) 0x231f46 VMOVSD (%RAX,%R14,8),%XMM2 |
(138) 0x231f4c VSUBSD (%RAX,%RSI,8),%XMM2,%XMM2 |
(138) 0x231f51 VMULSD (%R13,%RCX,8),%XMM2,%XMM2 |
(138) 0x231f58 VADDSD %XMM1,%XMM2,%XMM1 |
(138) 0x231f5c VMULSD %XMM1,%XMM0,%XMM1 |
(138) 0x231f60 MOV -0x60(%RBP),%RCX |
(138) 0x231f64 VADDSD (%RCX,%R9,8),%XMM1,%XMM1 |
(138) 0x231f6a VMOVSD %XMM1,(%RCX,%R9,8) |
(138) 0x231f70 VMOVSD (%RAX,%R14,8),%XMM1 |
(138) 0x231f76 VSUBSD (%RAX,%RDI,8),%XMM1,%XMM1 |
(138) 0x231f7b VMOVSD (%RAX,%RSI,8),%XMM2 |
(138) 0x231f80 VSUBSD (%RAX,%RDX,8),%XMM2,%XMM2 |
(138) 0x231f85 VMULSD (%R12,%R11,8),%XMM2,%XMM2 |
(138) 0x231f8b VMULSD (%R12,%R10,8),%XMM1,%XMM1 |
(138) 0x231f91 VADDSD %XMM2,%XMM1,%XMM1 |
(138) 0x231f95 VMULSD %XMM1,%XMM0,%XMM0 |
(138) 0x231f99 VADDSD (%R15,%RBX,8),%XMM0,%XMM0 |
(138) 0x231f9f VMOVSD %XMM0,(%R15,%RBX,8) |
(138) 0x231fa5 MOV -0x58(%RBP),%RAX |
(138) 0x231fa9 CMP -0xb8(%RBP),%RAX |
(138) 0x231fb0 LEA 0x1(%RAX),%RCX |
(138) 0x231fb4 MOV -0x148(%RBP),%R14 |
(138) 0x231fbb JGE 231ce9 |
(138) 0x231fc1 MOV %RCX,%RAX |
(138) 0x231fc4 SHR $0x20,%RAX |
(138) 0x231fc8 MOV %RCX,-0x58(%RBP) |
(138) 0x231fcc JNE 231d20 |
(138) 0x231fd2 MOV %ECX,%EAX |
(138) 0x231fd4 XOR %EDX,%EDX |
(138) 0x231fd6 DIV %R14D |
(138) 0x231fd9 JMP 231d28 |
0x231fde INT $0x3 |
0x231fdf INT $0x3 |
Path / |
Source file and lines | accelerate.cpp:40-53 |
Module | exec |
nb instructions | 141 |
nb uops | 138 |
loop length | 668 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 1 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 44 |
micro-operation queue | 23.00 cycles |
front end | 23.00 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 8.50 | 8.50 | 8.50 | 8.50 | 5.00 | 27.00 | 27.00 | 27.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
cycles | 8.50 | 8.50 | 8.50 | 8.50 | 5.00 | 27.00 | 27.00 | 27.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 23.00 |
Dispatch | 27.00 |
Overall L1 | 27.00 |
all | 0% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 0% |
all | 100% |
load | 100% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 1% |
load | 20% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 11% |
load | 9% |
store | 11% |
mul | 12% |
add-sub | 9% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 25% |
load | 25% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 11% |
load | 12% |
store | 11% |
mul | 12% |
add-sub | 9% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 11% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB $0x198,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%RDX),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
INC %EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%RCX),%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD $0x3,%EBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB %EAX,%EBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 231cf9 <.omp_outlined.+0x8a9> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV (%R8),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,-0x150(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
INC %EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%R9),%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD $0x3,%R14D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP %EAX,%R14D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 231cf9 <.omp_outlined.+0x8a9> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB %EAX,%R14D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
IMUL %R14,%RBX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
DEC %RBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVQ $0,-0x170(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RBX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVQ $0x1,-0x1b8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVL $0,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x1b8(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0xb0(%RBP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x170(%RBP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0xa8(%RBP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x211b20,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %ESI,-0xac(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CALL 261360 <@plt_start@+0x4f0> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0xa8(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %RBX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVL %RAX,%RBX | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RBX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV -0x170(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RBX,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CMP %RBX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JG 231ce9 <.omp_outlined.+0x899> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV 0x50(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x40(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x38(%RBP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x30(%RBP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x28(%RBP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x20(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x18(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R9),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R10,-0x140(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%R9),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R9,-0x138(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%R8),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R9,-0x130(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%R8),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R8,-0x128(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RSI),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R8,-0x120(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%RSI),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RSI,-0x118(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RDX),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RSI,-0x110(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%RDX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RCX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDX,-0x108(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%RCX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,-0x100(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV -0x58(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RDI),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDX,-0xf8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%RDI),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDX,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,-0xe8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x58(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDX,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,-0xd8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x48(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDX,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x60(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDX,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV -0xb8(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %RCX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
INC %RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP $0x2,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R14,-0x148(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
JB 231fc1 <.omp_outlined.+0xb71> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %RAX,-0x180(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
AND $-0x2,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
VMOVAPD -0x2e8f0(%RIP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOV %RCX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDX,-0x178(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 231c69 <.omp_outlined.+0x819> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOV -0x178(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %RAX,-0x180(%RBP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV -0x58(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
JNE 231d0b <.omp_outlined.+0x8bb> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV $0x211b38,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0xac(%RBP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CALL 261370 <@plt_start@+0x500> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x198,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD %RAX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JMP 231fc1 <.omp_outlined.+0xb71> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
INT $0x3 | |||||||||||||||||
INT $0x3 |
Source file and lines | accelerate.cpp:40-53 |
Module | exec |
nb instructions | 141 |
nb uops | 138 |
loop length | 668 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 1 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 44 |
micro-operation queue | 23.00 cycles |
front end | 23.00 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 8.50 | 8.50 | 8.50 | 8.50 | 5.00 | 27.00 | 27.00 | 27.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
cycles | 8.50 | 8.50 | 8.50 | 8.50 | 5.00 | 27.00 | 27.00 | 27.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 23.00 |
Dispatch | 27.00 |
Overall L1 | 27.00 |
all | 0% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 0% |
all | 100% |
load | 100% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 1% |
load | 20% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 11% |
load | 9% |
store | 11% |
mul | 12% |
add-sub | 9% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 25% |
load | 25% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | NA (no other vectorizable/vectorized instructions) |
all | 11% |
load | 12% |
store | 11% |
mul | 12% |
add-sub | 9% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 11% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB $0x198,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%RDX),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
INC %EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%RCX),%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD $0x3,%EBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB %EAX,%EBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 231cf9 <.omp_outlined.+0x8a9> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV (%R8),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,-0x150(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
INC %EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%R9),%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD $0x3,%R14D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP %EAX,%R14D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 231cf9 <.omp_outlined.+0x8a9> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB %EAX,%R14D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
IMUL %R14,%RBX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
DEC %RBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVQ $0,-0x170(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RBX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVQ $0x1,-0x1b8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVL $0,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x1b8(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0xb0(%RBP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x170(%RBP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0xa8(%RBP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x211b20,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %ESI,-0xac(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CALL 261360 <@plt_start@+0x4f0> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0xa8(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %RBX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVL %RAX,%RBX | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RBX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV -0x170(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RBX,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CMP %RBX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JG 231ce9 <.omp_outlined.+0x899> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV 0x50(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x40(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x38(%RBP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x30(%RBP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x28(%RBP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x20(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x18(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R9),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R10,-0x140(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%R9),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R9,-0x138(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%R8),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R9,-0x130(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%R8),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R8,-0x128(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RSI),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R8,-0x120(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%RSI),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RSI,-0x118(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RDX),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RSI,-0x110(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%RDX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RCX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDX,-0x108(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%RCX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,-0x100(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV -0x58(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RDI),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDX,-0xf8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%RDI),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDX,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,-0xe8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x58(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDX,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,-0xd8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x48(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDX,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x60(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDX,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV -0xb8(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %RCX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
INC %RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP $0x2,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R14,-0x148(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
JB 231fc1 <.omp_outlined.+0xb71> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %RAX,-0x180(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
AND $-0x2,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
VMOVAPD -0x2e8f0(%RIP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOV %RCX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDX,-0x178(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 231c69 <.omp_outlined.+0x819> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOV -0x178(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %RAX,-0x180(%RBP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV -0x58(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
JNE 231d0b <.omp_outlined.+0x8bb> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV $0x211b38,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0xac(%RBP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CALL 261370 <@plt_start@+0x500> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x198,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD %RAX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JMP 231fc1 <.omp_outlined.+0xb71> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
INT $0x3 | |||||||||||||||||
INT $0x3 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼.omp_outlined.– | 5.19 | 2.63 |
○Loop 139 - accelerate.cpp:41-53 - exec | 5.19 | 2.63 |
○Loop 138 - accelerate.cpp:41-53 - exec | 0 | 0 |