Function: hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3 | Module: exec | Source: csr_matvec.c:178-204 [...] | Coverage: 0.04% |
---|
Function: hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3 | Module: exec | Source: csr_matvec.c:178-204 [...] | Coverage: 0.04% |
---|
/beegfs/hackathon/users/eoseret/qaas_runs/170-859-5251/intel/AMG/build/AMG/AMG/seq_mv/csr_matvec.c: 178 - 204 |
-------------------------------------------------------------------------------- |
178: #pragma omp parallel for private(i,j,jj,m,tempx) HYPRE_SMP_SCHEDULE |
179: #endif |
180: |
181: for (i = 0; i < num_rownnz; i++) |
182: { |
183: m = A_rownnz[i]; |
[...] |
191: if ( num_vectors==1 ) |
192: { |
193: tempx = 0; |
194: for (jj = A_i[m]; jj < A_i[m+1]; jj++) |
195: tempx += A_data[jj] * x_data[A_j[jj]]; |
196: y_data[m] += tempx; |
197: } |
198: else |
199: for ( j=0; j<num_vectors; ++j ) |
200: { |
201: tempx = 0; |
202: for (jj = A_i[m]; jj < A_i[m+1]; jj++) |
203: tempx += A_data[jj] * x_data[ j*vecstride_x + A_j[jj]*idxstride_x ]; |
204: y_data[ j*vecstride_y + m*idxstride_y] += tempx; |
0x53b4f0 PUSH %RBP |
0x53b4f1 MOV %RSP,%RBP |
0x53b4f4 PUSH %R15 |
0x53b4f6 PUSH %R14 |
0x53b4f8 PUSH %R13 |
0x53b4fa PUSH %R12 |
0x53b4fc PUSH %RBX |
0x53b4fd MOV %RDI,%RBX |
0x53b500 SUB $0x38,%RSP |
0x53b504 CALL 4110b0 <omp_get_num_threads@plt> |
0x53b509 MOV %EAX,%R12D |
0x53b50c CALL 4111f0 <omp_get_thread_num@plt> |
0x53b511 MOVSXD %R12D,%RSI |
0x53b514 MOVSXD %EAX,%RCX |
0x53b517 MOV 0x20(%RBX),%RAX |
0x53b51b CQTO |
0x53b51d IDIV %RSI |
0x53b520 CMP %RDX,%RCX |
0x53b523 JL 53b81b |
0x53b529 IMUL %RAX,%RCX |
0x53b52d LEA (%RCX,%RDX,1),%RDI |
0x53b531 ADD %RDI,%RAX |
0x53b534 CMP %RAX,%RDI |
0x53b537 JGE 53b80c |
0x53b53d MOV 0x40(%RBX),%R8 |
0x53b541 MOV 0x30(%RBX),%R10 |
0x53b545 MOV 0x18(%RBX),%R11 |
0x53b549 MOV 0x50(%RBX),%R9 |
0x53b54d MOV 0x58(%RBX),%R13 |
0x53b551 MOV 0x48(%RBX),%R14 |
0x53b555 MOV %R8,-0x50(%RBP) |
0x53b559 MOV 0x38(%RBX),%R12 |
0x53b55d MOV 0x28(%RBX),%RDX |
0x53b561 MOV %R10,-0x40(%RBP) |
0x53b565 LEA (%R11,%RDI,8),%RDI |
0x53b569 MOV 0x10(%RBX),%RCX |
0x53b56d MOV 0x8(%RBX),%R8 |
0x53b571 MOV (%RBX),%RSI |
0x53b574 CMP $0x1,%R9 |
0x53b578 JNE 53b825 |
0x53b57e LEA (%R11,%RAX,8),%R10 |
0x53b582 MOV %RDI,%R15 |
0x53b585 MOV (%RDI),%RAX |
0x53b588 SAL $0x3,%R14 |
0x53b58c MOV %R10,-0x48(%RBP) |
0x53b590 CMP $0x1,%R12 |
0x53b594 JE 53bc57 |
0x53b59a TEST %R12,%R12 |
0x53b59d JLE 53b79d |
(2879) 0x53b5a3 MOV -0x50(%RBP),%R9 |
(2879) 0x53b5a7 MOV (%R8,%RAX,8),%R11 |
(2879) 0x53b5ab MOV %R8,-0x38(%RBP) |
(2879) 0x53b5af XOR %EDI,%EDI |
(2879) 0x53b5b1 MOV 0x8(%R8,%RAX,8),%R10 |
(2879) 0x53b5b6 MOV -0x40(%RBP),%RBX |
(2879) 0x53b5ba IMUL %R9,%RAX |
(2879) 0x53b5be LEA (%RBX,%RAX,8),%R9 |
(2879) 0x53b5c2 XOR %EBX,%EBX |
(2879) 0x53b5c4 NOPL (%RAX) |
(2878) 0x53b5c8 MOV %R11,%RAX |
(2878) 0x53b5cb VXORPD %XMM9,%XMM9,%XMM9 |
(2878) 0x53b5d0 CMP %R11,%R10 |
(2878) 0x53b5d3 JLE 53b76b |
(2878) 0x53b5d9 MOV %R10,%R8 |
(2878) 0x53b5dc SUB %R11,%R8 |
(2878) 0x53b5df AND $0x7,%R8D |
(2878) 0x53b5e3 JE 53b6b8 |
(2878) 0x53b5e9 CMP $0x1,%R8 |
(2878) 0x53b5ed JE 53b699 |
(2878) 0x53b5f3 CMP $0x2,%R8 |
(2878) 0x53b5f7 JE 53b683 |
(2878) 0x53b5fd CMP $0x3,%R8 |
(2878) 0x53b601 JE 53b66d |
(2878) 0x53b603 CMP $0x4,%R8 |
(2878) 0x53b607 JE 53b657 |
(2878) 0x53b609 CMP $0x5,%R8 |
(2878) 0x53b60d JE 53b641 |
(2878) 0x53b60f CMP $0x6,%R8 |
(2878) 0x53b613 JE 53b62b |
(2878) 0x53b615 MOV (%RCX,%R11,8),%RAX |
(2878) 0x53b619 ADD %RDI,%RAX |
(2878) 0x53b61c VMOVSD (%RDX,%RAX,8),%XMM4 |
(2878) 0x53b621 VFMADD231SD (%RSI,%R11,8),%XMM4,%XMM9 |
(2878) 0x53b627 LEA 0x1(%R11),%RAX |
(2878) 0x53b62b MOV (%RCX,%RAX,8),%R8 |
(2878) 0x53b62f ADD %RDI,%R8 |
(2878) 0x53b632 VMOVSD (%RDX,%R8,8),%XMM5 |
(2878) 0x53b638 VFMADD231SD (%RSI,%RAX,8),%XMM5,%XMM9 |
(2878) 0x53b63e INC %RAX |
(2878) 0x53b641 MOV (%RCX,%RAX,8),%R8 |
(2878) 0x53b645 ADD %RDI,%R8 |
(2878) 0x53b648 VMOVSD (%RDX,%R8,8),%XMM7 |
(2878) 0x53b64e VFMADD231SD (%RSI,%RAX,8),%XMM7,%XMM9 |
(2878) 0x53b654 INC %RAX |
(2878) 0x53b657 MOV (%RCX,%RAX,8),%R8 |
(2878) 0x53b65b ADD %RDI,%R8 |
(2878) 0x53b65e VMOVSD (%RDX,%R8,8),%XMM1 |
(2878) 0x53b664 VFMADD231SD (%RSI,%RAX,8),%XMM1,%XMM9 |
(2878) 0x53b66a INC %RAX |
(2878) 0x53b66d MOV (%RCX,%RAX,8),%R8 |
(2878) 0x53b671 ADD %RDI,%R8 |
(2878) 0x53b674 VMOVSD (%RDX,%R8,8),%XMM2 |
(2878) 0x53b67a VFMADD231SD (%RSI,%RAX,8),%XMM2,%XMM9 |
(2878) 0x53b680 INC %RAX |
(2878) 0x53b683 MOV (%RCX,%RAX,8),%R8 |
(2878) 0x53b687 ADD %RDI,%R8 |
(2878) 0x53b68a VMOVSD (%RDX,%R8,8),%XMM6 |
(2878) 0x53b690 VFMADD231SD (%RSI,%RAX,8),%XMM6,%XMM9 |
(2878) 0x53b696 INC %RAX |
(2878) 0x53b699 MOV (%RCX,%RAX,8),%R8 |
(2878) 0x53b69d ADD %RDI,%R8 |
(2878) 0x53b6a0 VMOVSD (%RDX,%R8,8),%XMM3 |
(2878) 0x53b6a6 VFMADD231SD (%RSI,%RAX,8),%XMM3,%XMM9 |
(2878) 0x53b6ac INC %RAX |
(2878) 0x53b6af CMP %R10,%RAX |
(2878) 0x53b6b2 JE 53b76b |
(2880) 0x53b6b8 MOV (%RCX,%RAX,8),%R8 |
(2880) 0x53b6bc ADD %RDI,%R8 |
(2880) 0x53b6bf VMOVSD (%RDX,%R8,8),%XMM10 |
(2880) 0x53b6c5 MOV 0x8(%RCX,%RAX,8),%R8 |
(2880) 0x53b6ca VFMADD231SD (%RSI,%RAX,8),%XMM10,%XMM9 |
(2880) 0x53b6d0 ADD %RDI,%R8 |
(2880) 0x53b6d3 VMOVSD (%RDX,%R8,8),%XMM11 |
(2880) 0x53b6d9 MOV 0x10(%RCX,%RAX,8),%R8 |
(2880) 0x53b6de VFMADD231SD 0x8(%RSI,%RAX,8),%XMM11,%XMM9 |
(2880) 0x53b6e5 ADD %RDI,%R8 |
(2880) 0x53b6e8 VMOVSD (%RDX,%R8,8),%XMM12 |
(2880) 0x53b6ee MOV 0x18(%RCX,%RAX,8),%R8 |
(2880) 0x53b6f3 VFMADD231SD 0x10(%RSI,%RAX,8),%XMM12,%XMM9 |
(2880) 0x53b6fa ADD %RDI,%R8 |
(2880) 0x53b6fd VMOVSD (%RDX,%R8,8),%XMM13 |
(2880) 0x53b703 MOV 0x20(%RCX,%RAX,8),%R8 |
(2880) 0x53b708 VFMADD231SD 0x18(%RSI,%RAX,8),%XMM13,%XMM9 |
(2880) 0x53b70f ADD %RDI,%R8 |
(2880) 0x53b712 VMOVSD (%RDX,%R8,8),%XMM14 |
(2880) 0x53b718 MOV 0x28(%RCX,%RAX,8),%R8 |
(2880) 0x53b71d VFMADD231SD 0x20(%RSI,%RAX,8),%XMM14,%XMM9 |
(2880) 0x53b724 ADD %RDI,%R8 |
(2880) 0x53b727 VMOVSD (%RDX,%R8,8),%XMM15 |
(2880) 0x53b72d MOV 0x30(%RCX,%RAX,8),%R8 |
(2880) 0x53b732 VFMADD231SD 0x28(%RSI,%RAX,8),%XMM15,%XMM9 |
(2880) 0x53b739 ADD %RDI,%R8 |
(2880) 0x53b73c VMOVSD (%RDX,%R8,8),%XMM0 |
(2880) 0x53b742 MOV 0x38(%RCX,%RAX,8),%R8 |
(2880) 0x53b747 VFMADD231SD 0x30(%RSI,%RAX,8),%XMM0,%XMM9 |
(2880) 0x53b74e ADD %RDI,%R8 |
(2880) 0x53b751 VMOVSD (%RDX,%R8,8),%XMM8 |
(2880) 0x53b757 VFMADD231SD 0x38(%RSI,%RAX,8),%XMM8,%XMM9 |
(2880) 0x53b75e ADD $0x8,%RAX |
(2880) 0x53b762 CMP %R10,%RAX |
(2880) 0x53b765 JNE 53b6b8 |
(2878) 0x53b76b VADDSD (%R9),%XMM9,%XMM9 |
(2878) 0x53b770 INC %RBX |
(2878) 0x53b773 ADD %R13,%RDI |
(2878) 0x53b776 VMOVSD %XMM9,(%R9) |
(2878) 0x53b77b ADD %R14,%R9 |
(2878) 0x53b77e CMP %RBX,%R12 |
(2878) 0x53b781 JNE 53b5c8 |
(2879) 0x53b787 MOV -0x38(%RBP),%R8 |
(2879) 0x53b78b ADD $0x8,%R15 |
(2879) 0x53b78f CMP %R15,-0x48(%RBP) |
(2879) 0x53b793 JE 53b80c |
(2879) 0x53b795 MOV (%R15),%RAX |
(2879) 0x53b798 JMP 53b5a3 |
0x53b79d MOV -0x48(%RBP),%RDX |
0x53b7a1 SUB %RDI,%RDX |
0x53b7a4 SUB $0x8,%RDX |
0x53b7a8 SHR $0x3,%RDX |
0x53b7ac INC %RDX |
0x53b7af AND $0x7,%EDX |
0x53b7b2 JE 53b7ff |
0x53b7b4 CMP $0x1,%RDX |
0x53b7b8 JE 53b7f2 |
0x53b7ba CMP $0x2,%RDX |
0x53b7be JE 53b7ee |
0x53b7c0 CMP $0x3,%RDX |
0x53b7c4 JE 53b7ea |
0x53b7c6 CMP $0x4,%RDX |
0x53b7ca JE 53b7e6 |
0x53b7cc CMP $0x5,%RDX |
0x53b7d0 JE 53b7e2 |
0x53b7d2 ADD $0x8,%RDI |
0x53b7d6 CMP $0x6,%RDX |
0x53b7da CMOVNE %RDI,%R15 |
0x53b7de ADD $0x8,%R15 |
0x53b7e2 ADD $0x8,%R15 |
0x53b7e6 ADD $0x8,%R15 |
0x53b7ea ADD $0x8,%R15 |
0x53b7ee ADD $0x8,%R15 |
0x53b7f2 MOV -0x48(%RBP),%RCX |
0x53b7f6 ADD $0x8,%R15 |
0x53b7fa CMP %RCX,%R15 |
0x53b7fd JE 53b80c |
(2877) 0x53b7ff MOV -0x48(%RBP),%RSI |
(2877) 0x53b803 ADD $0x40,%R15 |
(2877) 0x53b807 CMP %RSI,%R15 |
(2877) 0x53b80a JNE 53b7ff |
0x53b80c ADD $0x38,%RSP |
0x53b810 POP %RBX |
0x53b811 POP %R12 |
0x53b813 POP %R13 |
0x53b815 POP %R14 |
0x53b817 POP %R15 |
0x53b819 POP %RBP |
0x53b81a RET |
0x53b81b INC %RAX |
0x53b81e XOR %EDX,%EDX |
0x53b820 JMP 53b529 |
0x53b825 LEA (%R11,%RAX,8),%R15 |
0x53b829 MOV %RDI,%R10 |
0x53b82c LEA (,%R14,8),%RBX |
0x53b834 MOV %R15,-0x38(%RBP) |
0x53b838 MOV (%RDI),%R15 |
0x53b83b CMP $0x1,%R12 |
0x53b83f JE 53bbeb |
0x53b845 TEST %R12,%R12 |
0x53b848 JLE 53be05 |
0x53b84e MOV %R15,%RDI |
0x53b851 MOV %R8,%RAX |
0x53b854 MOV %RBX,%R15 |
0x53b857 MOV %R10,%R8 |
(2873) 0x53b85a MOV -0x50(%RBP),%R14 |
(2873) 0x53b85e MOV (%RAX,%RDI,8),%RBX |
(2873) 0x53b862 MOV %RAX,-0x48(%RBP) |
(2873) 0x53b866 MOV 0x8(%RAX,%RDI,8),%R11 |
(2873) 0x53b86b MOV -0x40(%RBP),%R10 |
(2873) 0x53b86f MOV %R8,-0x58(%RBP) |
(2873) 0x53b873 IMUL %R14,%RDI |
(2873) 0x53b877 XOR %R14D,%R14D |
(2873) 0x53b87a LEA (%R10,%RDI,8),%R10 |
(2873) 0x53b87e XOR %EDI,%EDI |
(2872) 0x53b880 MOV %RBX,%RAX |
(2872) 0x53b883 VXORPD %XMM0,%XMM0,%XMM0 |
(2872) 0x53b887 CMP %R11,%RBX |
(2872) 0x53b88a JGE 53ba50 |
(2872) 0x53b890 MOV %R11,%R8 |
(2872) 0x53b893 SUB %RBX,%R8 |
(2872) 0x53b896 AND $0x7,%R8D |
(2872) 0x53b89a JE 53b985 |
(2872) 0x53b8a0 CMP $0x1,%R8 |
(2872) 0x53b8a4 JE 53b963 |
(2872) 0x53b8aa CMP $0x2,%R8 |
(2872) 0x53b8ae JE 53b94a |
(2872) 0x53b8b4 CMP $0x3,%R8 |
(2872) 0x53b8b8 JE 53b931 |
(2872) 0x53b8ba CMP $0x4,%R8 |
(2872) 0x53b8be JE 53b918 |
(2872) 0x53b8c0 CMP $0x5,%R8 |
(2872) 0x53b8c4 JE 53b8ff |
(2872) 0x53b8c6 CMP $0x6,%R8 |
(2872) 0x53b8ca JE 53b8e6 |
(2872) 0x53b8cc MOV (%RCX,%RBX,8),%RAX |
(2872) 0x53b8d0 VMOVSD (%RSI,%RBX,8),%XMM4 |
(2872) 0x53b8d5 IMUL %R9,%RAX |
(2872) 0x53b8d9 ADD %RDI,%RAX |
(2872) 0x53b8dc VFMADD231SD (%RDX,%RAX,8),%XMM4,%XMM0 |
(2872) 0x53b8e2 LEA 0x1(%RBX),%RAX |
(2872) 0x53b8e6 MOV (%RCX,%RAX,8),%R8 |
(2872) 0x53b8ea VMOVSD (%RSI,%RAX,8),%XMM5 |
(2872) 0x53b8ef INC %RAX |
(2872) 0x53b8f2 IMUL %R9,%R8 |
(2872) 0x53b8f6 ADD %RDI,%R8 |
(2872) 0x53b8f9 VFMADD231SD (%RDX,%R8,8),%XMM5,%XMM0 |
(2872) 0x53b8ff MOV (%RCX,%RAX,8),%R8 |
(2872) 0x53b903 VMOVSD (%RSI,%RAX,8),%XMM7 |
(2872) 0x53b908 INC %RAX |
(2872) 0x53b90b IMUL %R9,%R8 |
(2872) 0x53b90f ADD %RDI,%R8 |
(2872) 0x53b912 VFMADD231SD (%RDX,%R8,8),%XMM7,%XMM0 |
(2872) 0x53b918 MOV (%RCX,%RAX,8),%R8 |
(2872) 0x53b91c VMOVSD (%RSI,%RAX,8),%XMM1 |
(2872) 0x53b921 INC %RAX |
(2872) 0x53b924 IMUL %R9,%R8 |
(2872) 0x53b928 ADD %RDI,%R8 |
(2872) 0x53b92b VFMADD231SD (%RDX,%R8,8),%XMM1,%XMM0 |
(2872) 0x53b931 MOV (%RCX,%RAX,8),%R8 |
(2872) 0x53b935 VMOVSD (%RSI,%RAX,8),%XMM2 |
(2872) 0x53b93a INC %RAX |
(2872) 0x53b93d IMUL %R9,%R8 |
(2872) 0x53b941 ADD %RDI,%R8 |
(2872) 0x53b944 VFMADD231SD (%RDX,%R8,8),%XMM2,%XMM0 |
(2872) 0x53b94a MOV (%RCX,%RAX,8),%R8 |
(2872) 0x53b94e VMOVSD (%RSI,%RAX,8),%XMM6 |
(2872) 0x53b953 INC %RAX |
(2872) 0x53b956 IMUL %R9,%R8 |
(2872) 0x53b95a ADD %RDI,%R8 |
(2872) 0x53b95d VFMADD231SD (%RDX,%R8,8),%XMM6,%XMM0 |
(2872) 0x53b963 MOV (%RCX,%RAX,8),%R8 |
(2872) 0x53b967 VMOVSD (%RSI,%RAX,8),%XMM3 |
(2872) 0x53b96c INC %RAX |
(2872) 0x53b96f IMUL %R9,%R8 |
(2872) 0x53b973 ADD %RDI,%R8 |
(2872) 0x53b976 VFMADD231SD (%RDX,%R8,8),%XMM3,%XMM0 |
(2872) 0x53b97c CMP %R11,%RAX |
(2872) 0x53b97f JE 53ba50 |
(2874) 0x53b985 MOV (%RCX,%RAX,8),%R8 |
(2874) 0x53b989 VMOVSD (%RSI,%RAX,8),%XMM8 |
(2874) 0x53b98e VMOVSD 0x8(%RSI,%RAX,8),%XMM9 |
(2874) 0x53b994 VMOVSD 0x10(%RSI,%RAX,8),%XMM10 |
(2874) 0x53b99a IMUL %R9,%R8 |
(2874) 0x53b99e VMOVSD 0x18(%RSI,%RAX,8),%XMM11 |
(2874) 0x53b9a4 VMOVSD 0x20(%RSI,%RAX,8),%XMM12 |
(2874) 0x53b9aa VMOVSD 0x28(%RSI,%RAX,8),%XMM13 |
(2874) 0x53b9b0 VMOVSD 0x30(%RSI,%RAX,8),%XMM14 |
(2874) 0x53b9b6 VMOVSD 0x38(%RSI,%RAX,8),%XMM15 |
(2874) 0x53b9bc ADD %RDI,%R8 |
(2874) 0x53b9bf VFMADD231SD (%RDX,%R8,8),%XMM8,%XMM0 |
(2874) 0x53b9c5 MOV 0x8(%RCX,%RAX,8),%R8 |
(2874) 0x53b9ca IMUL %R9,%R8 |
(2874) 0x53b9ce ADD %RDI,%R8 |
(2874) 0x53b9d1 VFMADD231SD (%RDX,%R8,8),%XMM9,%XMM0 |
(2874) 0x53b9d7 MOV 0x10(%RCX,%RAX,8),%R8 |
(2874) 0x53b9dc IMUL %R9,%R8 |
(2874) 0x53b9e0 ADD %RDI,%R8 |
(2874) 0x53b9e3 VFMADD231SD (%RDX,%R8,8),%XMM10,%XMM0 |
(2874) 0x53b9e9 MOV 0x18(%RCX,%RAX,8),%R8 |
(2874) 0x53b9ee IMUL %R9,%R8 |
(2874) 0x53b9f2 ADD %RDI,%R8 |
(2874) 0x53b9f5 VFMADD231SD (%RDX,%R8,8),%XMM11,%XMM0 |
(2874) 0x53b9fb MOV 0x20(%RCX,%RAX,8),%R8 |
(2874) 0x53ba00 IMUL %R9,%R8 |
(2874) 0x53ba04 ADD %RDI,%R8 |
(2874) 0x53ba07 VFMADD231SD (%RDX,%R8,8),%XMM12,%XMM0 |
(2874) 0x53ba0d MOV 0x28(%RCX,%RAX,8),%R8 |
(2874) 0x53ba12 IMUL %R9,%R8 |
(2874) 0x53ba16 ADD %RDI,%R8 |
(2874) 0x53ba19 VFMADD231SD (%RDX,%R8,8),%XMM13,%XMM0 |
(2874) 0x53ba1f MOV 0x30(%RCX,%RAX,8),%R8 |
(2874) 0x53ba24 IMUL %R9,%R8 |
(2874) 0x53ba28 ADD %RDI,%R8 |
(2874) 0x53ba2b VFMADD231SD (%RDX,%R8,8),%XMM14,%XMM0 |
(2874) 0x53ba31 MOV 0x38(%RCX,%RAX,8),%R8 |
(2874) 0x53ba36 ADD $0x8,%RAX |
(2874) 0x53ba3a IMUL %R9,%R8 |
(2874) 0x53ba3e ADD %RDI,%R8 |
(2874) 0x53ba41 VFMADD231SD (%RDX,%R8,8),%XMM15,%XMM0 |
(2874) 0x53ba47 CMP %R11,%RAX |
(2874) 0x53ba4a JNE 53b985 |
(2872) 0x53ba50 VADDSD (%R10),%XMM0,%XMM0 |
(2872) 0x53ba55 INC %R14 |
(2872) 0x53ba58 ADD %R13,%RDI |
(2872) 0x53ba5b VMOVSD %XMM0,(%R10) |
(2872) 0x53ba60 ADD %R15,%R10 |
(2872) 0x53ba63 CMP %R14,%R12 |
(2872) 0x53ba66 JNE 53b880 |
(2873) 0x53ba6c MOV -0x58(%RBP),%R8 |
(2873) 0x53ba70 MOV -0x38(%RBP),%RBX |
(2873) 0x53ba74 MOV -0x48(%RBP),%RAX |
(2873) 0x53ba78 ADD $0x8,%R8 |
(2873) 0x53ba7c CMP %RBX,%R8 |
(2873) 0x53ba7f JE 53b80c |
(2873) 0x53ba85 MOV (%R8),%RDI |
(2873) 0x53ba88 JMP 53b85a |
(2869) 0x53ba8d MOV (%RCX,%R13,8),%R11 |
(2869) 0x53ba91 VMOVSD (%RSI,%R13,8),%XMM4 |
(2869) 0x53ba97 INC %R13 |
(2869) 0x53ba9a VFMADD231SD (%RDX,%R11,8),%XMM4,%XMM8 |
(2869) 0x53baa0 MOV (%RCX,%R13,8),%RDI |
(2869) 0x53baa4 VMOVSD (%RSI,%R13,8),%XMM5 |
(2869) 0x53baaa INC %R13 |
(2869) 0x53baad VFMADD231SD (%RDX,%RDI,8),%XMM5,%XMM8 |
(2869) 0x53bab3 MOV (%RCX,%R13,8),%R14 |
(2869) 0x53bab7 VMOVSD (%RSI,%R13,8),%XMM7 |
(2869) 0x53babd INC %R13 |
(2869) 0x53bac0 VFMADD231SD (%RDX,%R14,8),%XMM7,%XMM8 |
(2869) 0x53bac6 MOV (%RCX,%R13,8),%RAX |
(2869) 0x53baca VMOVSD (%RSI,%R13,8),%XMM1 |
(2869) 0x53bad0 INC %R13 |
(2869) 0x53bad3 VFMADD231SD (%RDX,%RAX,8),%XMM1,%XMM8 |
(2869) 0x53bad9 MOV (%RCX,%R13,8),%RBX |
(2869) 0x53badd VMOVSD (%RSI,%R13,8),%XMM2 |
(2869) 0x53bae3 INC %R13 |
(2869) 0x53bae6 VFMADD231SD (%RDX,%RBX,8),%XMM2,%XMM8 |
(2869) 0x53baec MOV (%RCX,%R13,8),%R15 |
(2869) 0x53baf0 VMOVSD (%RSI,%R13,8),%XMM6 |
(2869) 0x53baf6 INC %R13 |
(2869) 0x53baf9 VFMADD231SD (%RDX,%R15,8),%XMM6,%XMM8 |
(2869) 0x53baff MOV (%RCX,%R13,8),%R11 |
(2869) 0x53bb03 VMOVSD (%RSI,%R13,8),%XMM3 |
(2869) 0x53bb09 INC %R13 |
(2869) 0x53bb0c VFMADD231SD (%RDX,%R11,8),%XMM3,%XMM8 |
(2869) 0x53bb12 CMP %R9,%R13 |
(2869) 0x53bb15 JE 53bbc4 |
(2870) 0x53bb1b LEA 0x1(%R13),%R14 |
(2870) 0x53bb1f MOV (%RCX,%R13,8),%RDI |
(2870) 0x53bb23 LEA 0x2(%R13),%R15 |
(2870) 0x53bb27 VMOVSD (%RSI,%R13,8),%XMM9 |
(2870) 0x53bb2d MOV (%RCX,%R14,8),%RAX |
(2870) 0x53bb31 LEA 0x3(%R13),%R11 |
(2870) 0x53bb35 MOV (%RCX,%R15,8),%RBX |
(2870) 0x53bb39 VFMADD231SD (%RDX,%RDI,8),%XMM9,%XMM8 |
(2870) 0x53bb3f VMOVSD (%RSI,%R14,8),%XMM10 |
(2870) 0x53bb45 LEA 0x4(%R13),%R14 |
(2870) 0x53bb49 MOV (%RCX,%R11,8),%RDI |
(2870) 0x53bb4d VFMADD231SD (%RDX,%RAX,8),%XMM10,%XMM8 |
(2870) 0x53bb53 VMOVSD (%RSI,%R15,8),%XMM11 |
(2870) 0x53bb59 MOV (%RCX,%R14,8),%RAX |
(2870) 0x53bb5d LEA 0x5(%R13),%R15 |
(2870) 0x53bb61 VFMADD231SD (%RDX,%RBX,8),%XMM11,%XMM8 |
(2870) 0x53bb67 VMOVSD (%RSI,%R11,8),%XMM12 |
(2870) 0x53bb6d LEA 0x6(%R13),%R11 |
(2870) 0x53bb71 VFMADD231SD (%RDX,%RDI,8),%XMM12,%XMM8 |
(2870) 0x53bb77 MOV (%RCX,%R15,8),%RBX |
(2870) 0x53bb7b VMOVSD (%RSI,%R14,8),%XMM13 |
(2870) 0x53bb81 MOV (%RCX,%R11,8),%RDI |
(2870) 0x53bb85 LEA 0x7(%R13),%R14 |
(2870) 0x53bb89 ADD $0x8,%R13 |
(2870) 0x53bb8d VFMADD231SD (%RDX,%RAX,8),%XMM13,%XMM8 |
(2870) 0x53bb93 VMOVSD (%RSI,%R15,8),%XMM14 |
(2870) 0x53bb99 MOV (%RCX,%R14,8),%RAX |
(2870) 0x53bb9d VFMADD231SD (%RDX,%RBX,8),%XMM14,%XMM8 |
(2870) 0x53bba3 VMOVSD (%RSI,%R11,8),%XMM15 |
(2870) 0x53bba9 VFMADD231SD (%RDX,%RDI,8),%XMM15,%XMM8 |
(2870) 0x53bbaf VMOVSD (%RSI,%R14,8),%XMM0 |
(2870) 0x53bbb5 VFMADD231SD (%RDX,%RAX,8),%XMM0,%XMM8 |
(2870) 0x53bbbb CMP %R9,%R13 |
(2870) 0x53bbbe JNE 53bb1b |
(2869) 0x53bbc4 MOV -0x40(%RBP),%R13 |
(2869) 0x53bbc8 ADD $0x8,%R10 |
(2869) 0x53bbcc ADD %R13,%R12 |
(2869) 0x53bbcf VADDSD (%R12),%XMM8,%XMM8 |
(2869) 0x53bbd5 VMOVSD %XMM8,(%R12) |
(2869) 0x53bbdb MOV -0x38(%RBP),%R12 |
(2869) 0x53bbdf CMP %R12,%R10 |
(2869) 0x53bbe2 JE 53b80c |
(2869) 0x53bbe8 MOV (%R10),%R15 |
(2869) 0x53bbeb LEA (,%R15,8),%R12 |
(2869) 0x53bbf3 MOV (%R8,%R15,8),%R13 |
(2869) 0x53bbf7 VXORPD %XMM8,%XMM8,%XMM8 |
(2869) 0x53bbfc MOV 0x8(%R8,%R12,1),%R9 |
(2869) 0x53bc01 CMP %R9,%R13 |
(2869) 0x53bc04 JGE 53bbc4 |
(2869) 0x53bc06 MOV %R9,%R15 |
(2869) 0x53bc09 SUB %R13,%R15 |
(2869) 0x53bc0c AND $0x7,%R15D |
(2869) 0x53bc10 JE 53bb1b |
(2869) 0x53bc16 CMP $0x1,%R15 |
(2869) 0x53bc1a JE 53baff |
(2869) 0x53bc20 CMP $0x2,%R15 |
(2869) 0x53bc24 JE 53baec |
(2869) 0x53bc2a CMP $0x3,%R15 |
(2869) 0x53bc2e JE 53bad9 |
(2869) 0x53bc34 CMP $0x4,%R15 |
(2869) 0x53bc38 JE 53bac6 |
(2869) 0x53bc3e CMP $0x5,%R15 |
(2869) 0x53bc42 JE 53bab3 |
(2869) 0x53bc48 CMP $0x6,%R15 |
(2869) 0x53bc4c JE 53baa0 |
(2869) 0x53bc52 JMP 53ba8d |
0x53bc57 MOV -0x40(%RBP),%R14 |
0x53bc5b MOV -0x48(%RBP),%R13 |
(2875) 0x53bc5f LEA (,%RAX,8),%R10 |
(2875) 0x53bc67 MOV (%R8,%RAX,8),%R9 |
(2875) 0x53bc6b VXORPD %XMM10,%XMM10,%XMM10 |
(2875) 0x53bc70 MOV 0x8(%R8,%R10,1),%R11 |
(2875) 0x53bc75 CMP %R9,%R11 |
(2875) 0x53bc78 JLE 53bde3 |
(2875) 0x53bc7e MOV %R11,%R12 |
(2875) 0x53bc81 SUB %R9,%R12 |
(2875) 0x53bc84 AND $0x7,%R12D |
(2875) 0x53bc88 JE 53bd3e |
(2875) 0x53bc8e CMP $0x1,%R12 |
(2875) 0x53bc92 JE 53bd23 |
(2875) 0x53bc98 CMP $0x2,%R12 |
(2875) 0x53bc9c JE 53bd11 |
(2875) 0x53bc9e CMP $0x3,%R12 |
(2875) 0x53bca2 JE 53bcff |
(2875) 0x53bca4 CMP $0x4,%R12 |
(2875) 0x53bca8 JE 53bcec |
(2875) 0x53bcaa CMP $0x5,%R12 |
(2875) 0x53bcae JE 53bcda |
(2875) 0x53bcb0 CMP $0x6,%R12 |
(2875) 0x53bcb4 JE 53bcc8 |
(2875) 0x53bcb6 MOV (%RCX,%R9,8),%RDI |
(2875) 0x53bcba VMOVSD (%RDX,%RDI,8),%XMM4 |
(2875) 0x53bcbf VFMADD231SD (%RSI,%R9,8),%XMM4,%XMM10 |
(2875) 0x53bcc5 INC %R9 |
(2875) 0x53bcc8 MOV (%RCX,%R9,8),%RBX |
(2875) 0x53bccc VMOVSD (%RDX,%RBX,8),%XMM5 |
(2875) 0x53bcd1 VFMADD231SD (%RSI,%R9,8),%XMM5,%XMM10 |
(2875) 0x53bcd7 INC %R9 |
(2875) 0x53bcda MOV (%RCX,%R9,8),%RAX |
(2875) 0x53bcde VMOVSD (%RDX,%RAX,8),%XMM7 |
(2875) 0x53bce3 VFMADD231SD (%RSI,%R9,8),%XMM7,%XMM10 |
(2875) 0x53bce9 INC %R9 |
(2875) 0x53bcec MOV (%RCX,%R9,8),%R12 |
(2875) 0x53bcf0 VMOVSD (%RDX,%R12,8),%XMM1 |
(2875) 0x53bcf6 VFMADD231SD (%RSI,%R9,8),%XMM1,%XMM10 |
(2875) 0x53bcfc INC %R9 |
(2875) 0x53bcff MOV (%RCX,%R9,8),%RDI |
(2875) 0x53bd03 VMOVSD (%RDX,%RDI,8),%XMM2 |
(2875) 0x53bd08 VFMADD231SD (%RSI,%R9,8),%XMM2,%XMM10 |
(2875) 0x53bd0e INC %R9 |
(2875) 0x53bd11 MOV (%RCX,%R9,8),%RBX |
(2875) 0x53bd15 VMOVSD (%RDX,%RBX,8),%XMM6 |
(2875) 0x53bd1a VFMADD231SD (%RSI,%R9,8),%XMM6,%XMM10 |
(2875) 0x53bd20 INC %R9 |
(2875) 0x53bd23 MOV (%RCX,%R9,8),%RAX |
(2875) 0x53bd27 VMOVSD (%RDX,%RAX,8),%XMM3 |
(2875) 0x53bd2c VFMADD231SD (%RSI,%R9,8),%XMM3,%XMM10 |
(2875) 0x53bd32 INC %R9 |
(2875) 0x53bd35 CMP %R11,%R9 |
(2875) 0x53bd38 JE 53bde3 |
(2876) 0x53bd3e LEA 0x1(%R9),%RDI |
(2876) 0x53bd42 MOV (%RCX,%R9,8),%R12 |
(2876) 0x53bd46 LEA 0x2(%R9),%RAX |
(2876) 0x53bd4a MOV (%RCX,%RDI,8),%RBX |
(2876) 0x53bd4e VMOVSD (%RDX,%R12,8),%XMM11 |
(2876) 0x53bd54 VFMADD231SD (%RSI,%R9,8),%XMM11,%XMM10 |
(2876) 0x53bd5a MOV (%RCX,%RAX,8),%R12 |
(2876) 0x53bd5e VMOVSD (%RDX,%RBX,8),%XMM12 |
(2876) 0x53bd63 VFMADD231SD (%RSI,%RDI,8),%XMM12,%XMM10 |
(2876) 0x53bd69 LEA 0x3(%R9),%RDI |
(2876) 0x53bd6d MOV (%RCX,%RDI,8),%RBX |
(2876) 0x53bd71 VMOVSD (%RDX,%R12,8),%XMM13 |
(2876) 0x53bd77 VFMADD231SD (%RSI,%RAX,8),%XMM13,%XMM10 |
(2876) 0x53bd7d LEA 0x4(%R9),%RAX |
(2876) 0x53bd81 MOV (%RCX,%RAX,8),%R12 |
(2876) 0x53bd85 VMOVSD (%RDX,%RBX,8),%XMM14 |
(2876) 0x53bd8a VFMADD231SD (%RSI,%RDI,8),%XMM14,%XMM10 |
(2876) 0x53bd90 LEA 0x5(%R9),%RDI |
(2876) 0x53bd94 MOV (%RCX,%RDI,8),%RBX |
(2876) 0x53bd98 VMOVSD (%RDX,%R12,8),%XMM15 |
(2876) 0x53bd9e VFMADD231SD (%RSI,%RAX,8),%XMM15,%XMM10 |
(2876) 0x53bda4 LEA 0x6(%R9),%RAX |
(2876) 0x53bda8 VMOVSD (%RDX,%RBX,8),%XMM0 |
(2876) 0x53bdad MOV (%RCX,%RAX,8),%R12 |
(2876) 0x53bdb1 VFMADD231SD (%RSI,%RDI,8),%XMM0,%XMM10 |
(2876) 0x53bdb7 LEA 0x7(%R9),%RDI |
(2876) 0x53bdbb ADD $0x8,%R9 |
(2876) 0x53bdbf MOV (%RCX,%RDI,8),%RBX |
(2876) 0x53bdc3 VMOVSD (%RDX,%R12,8),%XMM8 |
(2876) 0x53bdc9 VFMADD231SD (%RSI,%RAX,8),%XMM8,%XMM10 |
(2876) 0x53bdcf VMOVSD (%RDX,%RBX,8),%XMM9 |
(2876) 0x53bdd4 VFMADD231SD (%RSI,%RDI,8),%XMM9,%XMM10 |
(2876) 0x53bdda CMP %R11,%R9 |
(2876) 0x53bddd JNE 53bd3e |
(2875) 0x53bde3 ADD %R14,%R10 |
(2875) 0x53bde6 ADD $0x8,%R15 |
(2875) 0x53bdea VADDSD (%R10),%XMM10,%XMM10 |
(2875) 0x53bdef VMOVSD %XMM10,(%R10) |
(2875) 0x53bdf4 CMP %R15,%R13 |
(2875) 0x53bdf7 JE 53b80c |
(2875) 0x53bdfd MOV (%R15),%RAX |
(2875) 0x53be00 JMP 53bc5f |
0x53be05 MOV -0x38(%RBP),%RAX |
0x53be09 SUB %RDI,%RAX |
0x53be0c SUB $0x8,%RAX |
0x53be10 SHR $0x3,%RAX |
0x53be14 INC %RAX |
0x53be17 AND $0x7,%EAX |
0x53be1a JE 53be6b |
0x53be1c CMP $0x1,%RAX |
0x53be20 JE 53be5a |
0x53be22 CMP $0x2,%RAX |
0x53be26 JE 53be56 |
0x53be28 CMP $0x3,%RAX |
0x53be2c JE 53be52 |
0x53be2e CMP $0x4,%RAX |
0x53be32 JE 53be4e |
0x53be34 CMP $0x5,%RAX |
0x53be38 JE 53be4a |
0x53be3a ADD $0x8,%RDI |
0x53be3e CMP $0x6,%RAX |
0x53be42 CMOVNE %RDI,%R10 |
0x53be46 ADD $0x8,%R10 |
0x53be4a ADD $0x8,%R10 |
0x53be4e ADD $0x8,%R10 |
0x53be52 ADD $0x8,%R10 |
0x53be56 ADD $0x8,%R10 |
0x53be5a MOV -0x38(%RBP),%R13 |
0x53be5e ADD $0x8,%R10 |
0x53be62 CMP %R13,%R10 |
0x53be65 JE 53b80c |
(2871) 0x53be6b MOV -0x38(%RBP),%R9 |
(2871) 0x53be6f ADD $0x40,%R10 |
(2871) 0x53be73 CMP %R9,%R10 |
(2871) 0x53be76 JNE 53be6b |
0x53be78 JMP 53b80c |
0x53be7d NOPL (%RAX) |
Path / |
Source file and lines | csr_matvec.c:178-204 |
Module | exec |
nb instructions | 135 |
nb uops | 136 |
loop length | 473 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 4 |
micro-operation queue | 22.67 cycles |
front end | 22.67 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 18.50 | 18.50 | 18.50 | 18.50 | 14.00 | 8.67 | 8.67 | 8.67 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
cycles | 18.50 | 18.50 | 18.50 | 18.50 | 14.00 | 8.67 | 8.67 | 8.67 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | 7.00-12.00 |
Front-end | 22.67 |
Dispatch | 18.50 |
DIV/SQRT | 7.00-12.00 |
Overall L1 | 22.67 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 0% |
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 12% |
other | 12% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SUB $0x38,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CALL 4110b0 <omp_get_num_threads@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %EAX,%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4111f0 <omp_get_thread_num@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVSXD %R12D,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVSXD %EAX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV 0x20(%RBX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CQTO | |||||||||||||||||
IDIV %RSI | 2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 9-19 | 7-12 |
CMP %RDX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JL 53b81b <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x32b> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
IMUL %RAX,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%RCX,%RDX,1),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD %RDI,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP %RAX,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JGE 53b80c <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x31c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV 0x40(%RBX),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x30(%RBX),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x18(%RBX),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x50(%RBX),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x58(%RBX),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x48(%RBX),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R8,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x38(%RBX),%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x28(%RBX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R10,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
LEA (%R11,%RDI,8),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV 0x10(%RBX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x8(%RBX),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RBX),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP $0x1,%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JNE 53b825 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x335> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
LEA (%R11,%RAX,8),%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDI,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV (%RDI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SAL $0x3,%R14 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R10,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CMP $0x1,%R12 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 53bc57 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x767> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
TEST %R12,%R12 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 53b79d <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x2ad> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV -0x48(%RBP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %RDI,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB $0x8,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SHR $0x3,%RDX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
INC %RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
AND $0x7,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 53b7ff <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x30f> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
CMP $0x1,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 53b7f2 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x302> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
CMP $0x2,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 53b7ee <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x2fe> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
CMP $0x3,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 53b7ea <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x2fa> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
CMP $0x4,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 53b7e6 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x2f6> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
CMP $0x5,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 53b7e2 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x2f2> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
ADD $0x8,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP $0x6,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVNE %RDI,%R15 | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD $0x8,%R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD $0x8,%R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD $0x8,%R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD $0x8,%R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD $0x8,%R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0x48(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD $0x8,%R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP %RCX,%R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 53b80c <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x31c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
ADD $0x38,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
INC %RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
JMP 53b529 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x39> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
LEA (%R11,%RAX,8),%R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDI,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (,%R14,8),%RBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RDI),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP $0x1,%R12 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 53bbeb <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x6fb> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
TEST %R12,%R12 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 53be05 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x915> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %R15,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R8,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RBX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R10,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x40(%RBP),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x48(%RBP),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %RDI,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB $0x8,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SHR $0x3,%RAX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
INC %RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
AND $0x7,%EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 53be6b <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x97b> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
CMP $0x1,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 53be5a <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x96a> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
CMP $0x2,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 53be56 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x966> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
CMP $0x3,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 53be52 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x962> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
CMP $0x4,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 53be4e <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x95e> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
CMP $0x5,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 53be4a <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x95a> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
ADD $0x8,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP $0x6,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVNE %RDI,%R10 | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD $0x8,%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD $0x8,%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD $0x8,%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD $0x8,%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD $0x8,%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0x38(%RBP),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD $0x8,%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP %R13,%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 53b80c <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x31c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
JMP 53b80c <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x31c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
Source file and lines | csr_matvec.c:178-204 |
Module | exec |
nb instructions | 135 |
nb uops | 136 |
loop length | 473 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 4 |
micro-operation queue | 22.67 cycles |
front end | 22.67 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 18.50 | 18.50 | 18.50 | 18.50 | 14.00 | 8.67 | 8.67 | 8.67 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
cycles | 18.50 | 18.50 | 18.50 | 18.50 | 14.00 | 8.67 | 8.67 | 8.67 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | 7.00-12.00 |
Front-end | 22.67 |
Dispatch | 18.50 |
DIV/SQRT | 7.00-12.00 |
Overall L1 | 22.67 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 0% |
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 12% |
other | 12% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SUB $0x38,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CALL 4110b0 <omp_get_num_threads@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %EAX,%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4111f0 <omp_get_thread_num@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVSXD %R12D,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVSXD %EAX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV 0x20(%RBX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CQTO | |||||||||||||||||
IDIV %RSI | 2 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 9-19 | 7-12 |
CMP %RDX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JL 53b81b <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x32b> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
IMUL %RAX,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%RCX,%RDX,1),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD %RDI,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP %RAX,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JGE 53b80c <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x31c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV 0x40(%RBX),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x30(%RBX),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x18(%RBX),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x50(%RBX),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x58(%RBX),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x48(%RBX),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R8,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x38(%RBX),%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x28(%RBX),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R10,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
LEA (%R11,%RDI,8),%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV 0x10(%RBX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x8(%RBX),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RBX),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP $0x1,%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JNE 53b825 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x335> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
LEA (%R11,%RAX,8),%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDI,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV (%RDI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SAL $0x3,%R14 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R10,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CMP $0x1,%R12 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 53bc57 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x767> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
TEST %R12,%R12 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 53b79d <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x2ad> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV -0x48(%RBP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %RDI,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB $0x8,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SHR $0x3,%RDX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
INC %RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
AND $0x7,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 53b7ff <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x30f> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
CMP $0x1,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 53b7f2 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x302> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
CMP $0x2,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 53b7ee <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x2fe> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
CMP $0x3,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 53b7ea <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x2fa> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
CMP $0x4,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 53b7e6 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x2f6> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
CMP $0x5,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 53b7e2 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x2f2> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
ADD $0x8,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP $0x6,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVNE %RDI,%R15 | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD $0x8,%R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD $0x8,%R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD $0x8,%R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD $0x8,%R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD $0x8,%R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0x48(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD $0x8,%R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP %RCX,%R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 53b80c <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x31c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
ADD $0x38,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
INC %RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
JMP 53b529 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x39> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
LEA (%R11,%RAX,8),%R15 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDI,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (,%R14,8),%RBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RDI),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP $0x1,%R12 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 53bbeb <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x6fb> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
TEST %R12,%R12 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 53be05 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x915> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %R15,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R8,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RBX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R10,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x40(%RBP),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x48(%RBP),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %RDI,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB $0x8,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SHR $0x3,%RAX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
INC %RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
AND $0x7,%EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 53be6b <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x97b> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
CMP $0x1,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 53be5a <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x96a> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
CMP $0x2,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 53be56 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x966> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
CMP $0x3,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 53be52 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x962> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
CMP $0x4,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 53be4e <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x95e> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
CMP $0x5,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 53be4a <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x95a> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
ADD $0x8,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP $0x6,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVNE %RDI,%R10 | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD $0x8,%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD $0x8,%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD $0x8,%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD $0x8,%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD $0x8,%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0x38(%RBP),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD $0x8,%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP %R13,%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JE 53b80c <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x31c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
JMP 53b80c <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3+0x31c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_CSRMatrixMatvecOutOfPlace._omp_fn.3– | 0.04 | 0.01 |
▼Loop 2875 - csr_matvec.c:183-196 - exec– | 0.01 | 0 |
○Loop 2876 - csr_matvec.c:194-195 - exec | 0.03 | 0 |
▼Loop 2869 - csr_matvec.c:183-196 - exec– | 0 | 0 |
○Loop 2870 - csr_matvec.c:194-195 - exec | 0 | 0 |
▼Loop 2873 - csr_matvec.c:183-204 - exec– | 0 | 0 |
▼Loop 2872 - csr_matvec.c:199-204 - exec– | 0 | 0 |
○Loop 2874 - csr_matvec.c:202-203 - exec | 0 | 0 |
▼Loop 2879 - csr_matvec.c:183-204 - exec– | 0 | 0 |
▼Loop 2878 - csr_matvec.c:199-204 - exec– | 0 | 0 |
○Loop 2880 - csr_matvec.c:202-203 - exec | 0 | 0 |
○Loop 2871 - csr_matvec.c:191-191 - exec | 0 | 0 |
○Loop 2877 - csr_matvec.c:191-191 - exec | 0 | 0 |