Function: hypre_ParTMatmul.extracted | Module: exec | Source: par_csr_matop.c:3454-3640 [...] | Coverage: 0.07% |
---|
Function: hypre_ParTMatmul.extracted | Module: exec | Source: par_csr_matop.c:3454-3640 [...] | Coverage: 0.07% |
---|
/home/eoseret/qaas_runs_CPU_9468/171-147-2675/intel/AMG/build/AMG/AMG/parcsr_mv/par_csr_matop.c: 3454 - 3640 |
-------------------------------------------------------------------------------- |
3454: #pragma omp parallel |
[...] |
3462: HYPRE_Int num_threads = hypre_NumActiveThreads(); |
3463: |
3464: size = num_cols_diag_A/num_threads; |
3465: rest = num_cols_diag_A - size*num_threads; |
3466: ii = hypre_GetThreadNum(); |
3467: if (ii < rest) |
3468: { |
3469: ns = ii*size+ii; |
3470: ne = (ii+1)*size+ii+1; |
3471: } |
3472: else |
3473: { |
3474: ns = ii*size+rest; |
3475: ne = (ii+1)*size+rest; |
3476: } |
3477: |
3478: B_marker = hypre_CTAlloc(HYPRE_Int, num_cols_diag_B); |
3479: B_marker_offd = hypre_CTAlloc(HYPRE_Int, num_cols_offd_C); |
3480: |
3481: for (ik = 0; ik < num_cols_diag_B; ik++) |
3482: B_marker[ik] = -1; |
3483: |
3484: for (ik = 0; ik < num_cols_offd_C; ik++) |
3485: B_marker_offd[ik] = -1; |
3486: |
3487: nnz_d = 0; |
3488: nnz_o = 0; |
3489: for (ik = ns; ik < ne; ik++) |
3490: { |
3491: for (jk = C_tmp_diag_i[ik]; jk < C_tmp_diag_i[ik+1]; jk++) |
3492: { |
3493: jcol = C_tmp_diag_j[jk]; |
3494: B_marker[jcol] = ik; |
3495: nnz_d++; |
3496: } |
3497: for (jk = C_tmp_offd_i[ik]; jk < C_tmp_offd_i[ik+1]; jk++) |
3498: { |
3499: jcol = C_tmp_offd_j[jk]; |
3500: B_marker_offd[jcol] = ik; |
3501: nnz_o++; |
3502: } |
3503: for (jk = 0; jk < num_sends_A; jk++) |
3504: for (j1 = send_map_starts_A[jk]; j1 < send_map_starts_A[jk+1]; j1++) |
3505: if (send_map_elmts_A[j1] == ik) |
3506: { |
3507: for (j2 = C_ext_diag_i[j1]; j2 < C_ext_diag_i[j1+1]; j2++) |
3508: { |
3509: jcol = C_ext_diag_j[j2]; |
3510: if (B_marker[jcol] < ik) |
3511: { |
3512: B_marker[jcol] = ik; |
3513: nnz_d++; |
3514: } |
3515: } |
3516: for (j2 = C_ext_offd_i[j1]; j2 < C_ext_offd_i[j1+1]; j2++) |
3517: { |
3518: jcol = C_ext_offd_j[j2]; |
3519: if (B_marker_offd[jcol] < ik) |
3520: { |
3521: B_marker_offd[jcol] = ik; |
3522: nnz_o++; |
3523: } |
3524: } |
3525: break; |
3526: } |
3527: C_diag_array[ii] = nnz_d; |
3528: C_offd_array[ii] = nnz_o; |
3529: } |
3530: #ifdef HYPRE_USING_OPENMP |
3531: #pragma omp barrier |
3532: #endif |
3533: if (ii == 0) |
3534: { |
3535: nnz_d = 0; |
3536: nnz_o = 0; |
3537: for (ik = 0; ik < num_threads-1; ik++) |
3538: { |
3539: C_diag_array[ik+1] += C_diag_array[ik]; |
3540: C_offd_array[ik+1] += C_offd_array[ik]; |
3541: } |
3542: nnz_d = C_diag_array[num_threads-1]; |
3543: nnz_o = C_offd_array[num_threads-1]; |
3544: C_diag_i[num_cols_diag_A] = nnz_d; |
3545: C_offd_i[num_cols_diag_A] = nnz_o; |
3546: |
3547: C_diag = hypre_CSRMatrixCreate(num_cols_diag_A, num_cols_diag_A, nnz_d); |
3548: C_offd = hypre_CSRMatrixCreate(num_cols_diag_A, num_cols_offd_C, nnz_o); |
3549: hypre_CSRMatrixI(C_diag) = C_diag_i; |
3550: hypre_CSRMatrixInitialize(C_diag); |
3551: C_diag_j = hypre_CSRMatrixJ(C_diag); |
3552: C_diag_data = hypre_CSRMatrixData(C_diag); |
3553: hypre_CSRMatrixI(C_offd) = C_offd_i; |
3554: hypre_CSRMatrixInitialize(C_offd); |
3555: C_offd_j = hypre_CSRMatrixJ(C_offd); |
3556: C_offd_data = hypre_CSRMatrixData(C_offd); |
[...] |
3568: for (ik = 0; ik < num_cols_diag_B; ik++) |
3569: B_marker[ik] = -1; |
3570: |
3571: for (ik = 0; ik < num_cols_offd_C; ik++) |
3572: B_marker_offd[ik] = -1; |
[...] |
3581: if (ii) |
3582: { |
3583: nnz_d = C_diag_array[ii-1]; |
3584: nnz_o = C_offd_array[ii-1]; |
3585: } |
3586: for (ik = ns; ik < ne; ik++) |
3587: { |
3588: C_diag_i[ik] = nnz_d; |
3589: C_offd_i[ik] = nnz_o; |
3590: for (jk = C_tmp_diag_i[ik]; jk < C_tmp_diag_i[ik+1]; jk++) |
3591: { |
3592: jcol = C_tmp_diag_j[jk]; |
3593: C_diag_j[nnz_d] = jcol; |
3594: C_diag_data[nnz_d] = C_tmp_diag_data[jk]; |
3595: B_marker[jcol] = nnz_d; |
3596: nnz_d++; |
3597: } |
3598: for (jk = C_tmp_offd_i[ik]; jk < C_tmp_offd_i[ik+1]; jk++) |
3599: { |
3600: jcol = C_tmp_offd_j[jk]; |
3601: C_offd_j[nnz_o] = jcol; |
3602: C_offd_data[nnz_o] = C_tmp_offd_data[jk]; |
3603: B_marker_offd[jcol] = nnz_o; |
3604: nnz_o++; |
3605: } |
3606: for (jk = 0; jk < num_sends_A; jk++) |
3607: for (j1 = send_map_starts_A[jk]; j1 < send_map_starts_A[jk+1]; j1++) |
3608: if (send_map_elmts_A[j1] == ik) |
3609: { |
3610: for (j2 = C_ext_diag_i[j1]; j2 < C_ext_diag_i[j1+1]; j2++) |
3611: { |
3612: jcol = C_ext_diag_j[j2]; |
3613: if (B_marker[jcol] < C_diag_i[ik]) |
3614: { |
3615: C_diag_j[nnz_d] = jcol; |
3616: C_diag_data[nnz_d] = C_ext_diag_data[j2]; |
3617: B_marker[jcol] = nnz_d; |
3618: nnz_d++; |
3619: } |
3620: else |
3621: C_diag_data[B_marker[jcol]] += C_ext_diag_data[j2]; |
3622: } |
3623: for (j2 = C_ext_offd_i[j1]; j2 < C_ext_offd_i[j1+1]; j2++) |
3624: { |
3625: jcol = C_ext_offd_j[j2]; |
3626: if (B_marker_offd[jcol] < C_offd_i[ik]) |
3627: { |
3628: C_offd_j[nnz_o] = jcol; |
3629: C_offd_data[nnz_o] = C_ext_offd_data[j2]; |
3630: B_marker_offd[jcol] = nnz_o; |
3631: nnz_o++; |
3632: } |
3633: else |
3634: C_offd_data[B_marker_offd[jcol]] += C_ext_offd_data[j2]; |
3635: } |
3636: break; |
3637: } |
3638: } |
3639: hypre_TFree(B_marker); |
3640: hypre_TFree(B_marker_offd); |
0x4c08b0 PUSH %RBP |
0x4c08b1 MOV %RSP,%RBP |
0x4c08b4 PUSH %R15 |
0x4c08b6 PUSH %R14 |
0x4c08b8 PUSH %R13 |
0x4c08ba PUSH %R12 |
0x4c08bc PUSH %RBX |
0x4c08bd SUB $0x128,%RSP |
0x4c08c4 MOV %R9,-0xe8(%RBP) |
0x4c08cb MOV %R8,-0x128(%RBP) |
0x4c08d2 MOV %RCX,-0x100(%RBP) |
0x4c08d9 MOV %RDX,%R15 |
0x4c08dc MOV %RDI,-0xc0(%RBP) |
0x4c08e3 MOV 0xc8(%RBP),%RAX |
0x4c08ea MOV %RAX,-0xd0(%RBP) |
0x4c08f1 MOV 0xc0(%RBP),%RAX |
0x4c08f8 MOV %RAX,-0xc8(%RBP) |
0x4c08ff MOV 0xb8(%RBP),%RAX |
0x4c0906 MOV %RAX,-0x78(%RBP) |
0x4c090a MOV 0xb0(%RBP),%RBX |
0x4c0911 MOV 0xa8(%RBP),%RAX |
0x4c0918 MOV %RAX,-0x50(%RBP) |
0x4c091c MOV 0xa0(%RBP),%RAX |
0x4c0923 MOV %RAX,-0x38(%RBP) |
0x4c0927 MOV 0x98(%RBP),%RAX |
0x4c092e MOV %RAX,-0xf8(%RBP) |
0x4c0935 MOV 0x90(%RBP),%RAX |
0x4c093c MOV %RAX,-0xa8(%RBP) |
0x4c0943 MOV 0x88(%RBP),%RAX |
0x4c094a MOV %RAX,-0xe0(%RBP) |
0x4c0951 MOV 0x80(%RBP),%R13 |
0x4c0958 MOV 0x78(%RBP),%RAX |
0x4c095c MOV %RAX,-0x58(%RBP) |
0x4c0960 MOV 0x70(%RBP),%RAX |
0x4c0964 MOV %RAX,-0x90(%RBP) |
0x4c096b MOV 0x68(%RBP),%R12 |
0x4c096f MOV 0x60(%RBP),%RAX |
0x4c0973 MOV %RAX,-0x60(%RBP) |
0x4c0977 MOV 0x58(%RBP),%RAX |
0x4c097b MOV %RAX,-0x80(%RBP) |
0x4c097f MOV 0x50(%RBP),%RAX |
0x4c0983 MOV %RAX,-0x148(%RBP) |
0x4c098a MOV 0x48(%RBP),%RAX |
0x4c098e MOV %RAX,-0x110(%RBP) |
0x4c0995 MOV 0x40(%RBP),%RAX |
0x4c0999 MOV %RAX,-0xb8(%RBP) |
0x4c09a0 MOV 0x38(%RBP),%RAX |
0x4c09a4 MOV %RAX,-0x140(%RBP) |
0x4c09ab MOV 0x30(%RBP),%RAX |
0x4c09af MOV %RAX,-0x108(%RBP) |
0x4c09b6 MOV 0x28(%RBP),%RAX |
0x4c09ba MOV %RAX,-0xb0(%RBP) |
0x4c09c1 MOV 0x20(%RBP),%RAX |
0x4c09c5 MOV %RAX,-0x120(%RBP) |
0x4c09cc MOV 0x18(%RBP),%RAX |
0x4c09d0 MOV %RAX,-0xf0(%RBP) |
0x4c09d7 MOV 0x10(%RBP),%RAX |
0x4c09db MOV %RAX,-0xa0(%RBP) |
0x4c09e2 CALL 4e8fe0 <hypre_NumActiveThreads> |
0x4c09e7 MOV %RAX,%RCX |
0x4c09ea MOV %R15,%RAX |
0x4c09ed OR %RCX,%RAX |
0x4c09f0 SHR $0x20,%RAX |
0x4c09f4 MOV %R15,-0x130(%RBP) |
0x4c09fb MOV %RCX,-0x118(%RBP) |
0x4c0a02 JE 4c0a14 |
0x4c0a04 MOV %R15,%RAX |
0x4c0a07 CQTO |
0x4c0a09 IDIV %RCX |
0x4c0a0c MOV %RDX,%R15 |
0x4c0a0f MOV %RAX,%R14 |
0x4c0a12 JMP 4c0a21 |
0x4c0a14 MOV %R15D,%EAX |
0x4c0a17 XOR %EDX,%EDX |
0x4c0a19 DIV %ECX |
0x4c0a1b MOV %EDX,%R15D |
0x4c0a1e MOV %EAX,%R14D |
0x4c0a21 CALL 4e8ff0 <hypre_GetThreadNum> |
0x4c0a26 LEA 0x1(%RAX),%RCX |
0x4c0a2a MOV %RCX,%RDX |
0x4c0a2d IMUL %R14,%RDX |
0x4c0a31 CMP %R15,%RAX |
0x4c0a34 MOV %R12,-0x138(%RBP) |
0x4c0a3b MOV %RAX,-0xd8(%RBP) |
0x4c0a42 JGE 4c0a58 |
0x4c0a44 INC %R14 |
0x4c0a47 IMUL %RAX,%R14 |
0x4c0a4b MOV %R14,-0x48(%RBP) |
0x4c0a4f ADD %RDX,%RCX |
0x4c0a52 MOV %RCX,-0x68(%RBP) |
0x4c0a56 JMP 4c0a6a |
0x4c0a58 IMUL %RAX,%R14 |
0x4c0a5c ADD %R15,%R14 |
0x4c0a5f MOV %R14,-0x48(%RBP) |
0x4c0a63 ADD %R15,%RDX |
0x4c0a66 MOV %RDX,-0x68(%RBP) |
0x4c0a6a MOV -0x50(%RBP),%R15 |
0x4c0a6e MOV $0x8,%ESI |
0x4c0a73 MOV -0x100(%RBP),%R12 |
0x4c0a7a MOV %R12,%RDI |
0x4c0a7d CALL 4e72c0 <hypre_CAlloc> |
0x4c0a82 MOV %RAX,%R14 |
0x4c0a85 MOV $0x8,%ESI |
0x4c0a8a MOV -0x78(%RBP),%RDI |
0x4c0a8e CALL 4e72c0 <hypre_CAlloc> |
0x4c0a93 MOV %R12,%RCX |
0x4c0a96 MOV %RAX,%R12 |
0x4c0a99 TEST %RCX,%RCX |
0x4c0a9c JLE 4c0ab3 |
0x4c0a9e LEA (,%RCX,8),%RDX |
0x4c0aa6 MOV %R14,%RDI |
0x4c0aa9 MOV $0xff,%ESI |
0x4c0aae CALL 4f03c0 <_intel_fast_memset> |
0x4c0ab3 MOV -0x78(%RBP),%RAX |
0x4c0ab7 TEST %RAX,%RAX |
0x4c0aba JLE 4c0ad1 |
0x4c0abc LEA (,%RAX,8),%RDX |
0x4c0ac4 MOV %R12,%RDI |
0x4c0ac7 MOV $0xff,%ESI |
0x4c0acc CALL 4f03c0 <_intel_fast_memset> |
0x4c0ad1 MOV -0x48(%RBP),%RAX |
0x4c0ad5 CMP -0x68(%RBP),%RAX |
0x4c0ad9 MOV %RBX,-0x40(%RBP) |
0x4c0add MOV -0x38(%RBP),%R11 |
0x4c0ae1 MOV %R13,-0x88(%RBP) |
0x4c0ae8 MOV -0x60(%RBP),%R9 |
0x4c0aec MOV %R14,-0x30(%RBP) |
0x4c0af0 JGE 4c0e32 |
0x4c0af6 XOR %EAX,%EAX |
0x4c0af8 MOV -0x48(%RBP),%RDX |
0x4c0afc XOR %ECX,%ECX |
0x4c0afe JMP 4c0b2e |
(3670) 0x4c0b00 MOV -0xc8(%RBP),%RDX |
(3670) 0x4c0b07 MOV -0xd8(%RBP),%RSI |
(3670) 0x4c0b0e MOV %RCX,(%RDX,%RSI,8) |
(3670) 0x4c0b12 MOV -0xd0(%RBP),%RDX |
(3670) 0x4c0b19 MOV %RAX,(%RDX,%RSI,8) |
(3670) 0x4c0b1d MOV -0x70(%RBP),%RSI |
(3670) 0x4c0b21 MOV %RSI,%RDX |
(3670) 0x4c0b24 CMP -0x68(%RBP),%RSI |
(3670) 0x4c0b28 JGE 4c0e32 |
(3670) 0x4c0b2e MOV -0x80(%RBP),%RDI |
(3670) 0x4c0b32 MOV (%RDI,%RDX,8),%RSI |
(3670) 0x4c0b36 LEA 0x1(%RDX),%R8 |
(3670) 0x4c0b3a MOV %R8,-0x70(%RBP) |
(3670) 0x4c0b3e CMP 0x8(%RDI,%RDX,8),%RSI |
(3670) 0x4c0b43 JGE 4c0bc0 |
(3670) 0x4c0b45 MOV -0x58(%RBP),%R8 |
(3670) 0x4c0b49 MOV -0x80(%RBP),%R10 |
(3670) 0x4c0b4d MOV -0x70(%RBP),%RBX |
(3670) 0x4c0b51 NOPW %CS:(%RAX,%RAX,1) |
(3677) 0x4c0b60 MOV (%R9,%RSI,8),%RDI |
(3677) 0x4c0b64 MOV %RDX,(%R14,%RDI,8) |
(3677) 0x4c0b68 INC %RCX |
(3677) 0x4c0b6b INC %RSI |
(3677) 0x4c0b6e CMP (%R10,%RBX,8),%RSI |
(3677) 0x4c0b72 JL 4c0b60 |
(3670) 0x4c0b74 MOV -0x90(%RBP),%RDI |
(3670) 0x4c0b7b MOV (%RDI,%RDX,8),%RSI |
(3670) 0x4c0b7f CMP (%RDI,%RBX,8),%RSI |
(3670) 0x4c0b83 JGE 4c0bd9 |
(3670) 0x4c0b85 MOV -0x40(%RBP),%RBX |
(3670) 0x4c0b89 NOPL (%RAX) |
(3669) 0x4c0b90 MOV (%R8,%RSI,8),%RDI |
(3669) 0x4c0b94 MOV %RDX,(%R12,%RDI,8) |
(3669) 0x4c0b98 INC %RAX |
(3669) 0x4c0b9b INC %RSI |
(3669) 0x4c0b9e MOV -0x90(%RBP),%RDI |
(3669) 0x4c0ba5 MOV -0x70(%RBP),%R10 |
(3669) 0x4c0ba9 CMP (%RDI,%R10,8),%RSI |
(3669) 0x4c0bad JL 4c0b90 |
(3670) 0x4c0baf TEST %RBX,%RBX |
(3670) 0x4c0bb2 JG 4c0be6 |
(3670) 0x4c0bb4 JMP 4c0b00 |
0x4c0bb9 NOPL (%RAX) |
(3670) 0x4c0bc0 MOV -0x58(%RBP),%R8 |
(3670) 0x4c0bc4 MOV -0x70(%RBP),%RBX |
(3670) 0x4c0bc8 MOV -0x90(%RBP),%RDI |
(3670) 0x4c0bcf MOV (%RDI,%RDX,8),%RSI |
(3670) 0x4c0bd3 CMP (%RDI,%RBX,8),%RSI |
(3670) 0x4c0bd7 JL 4c0b85 |
(3670) 0x4c0bd9 MOV -0x40(%RBP),%RBX |
(3670) 0x4c0bdd TEST %RBX,%RBX |
(3670) 0x4c0be0 JLE 4c0b00 |
(3670) 0x4c0be6 VPBROADCASTQ %RDX,%YMM0 |
(3670) 0x4c0bec XOR %EDI,%EDI |
(3670) 0x4c0bee JMP 4c0c03 |
(3671) 0x4c0bf0 MOV -0x60(%RBP),%R9 |
(3671) 0x4c0bf4 MOV %RSI,%R11 |
(3671) 0x4c0bf7 INC %RDI |
(3671) 0x4c0bfa CMP %RBX,%RDI |
(3671) 0x4c0bfd JE 4c0b00 |
(3671) 0x4c0c03 MOV (%R11,%RDI,8),%R10 |
(3671) 0x4c0c07 MOV 0x8(%R11,%RDI,8),%R9 |
(3671) 0x4c0c0c MOV %R11,%RSI |
(3671) 0x4c0c0f MOV %R9,%R11 |
(3671) 0x4c0c12 SUB %R10,%R11 |
(3671) 0x4c0c15 JLE 4c0bf0 |
(3671) 0x4c0c17 LEA (%R15,%R10,8),%ESI |
(3671) 0x4c0c1b AND $0x7f,%ESI |
(3671) 0x4c0c1e MOV $0x80,%EBX |
(3671) 0x4c0c23 SUB %ESI,%EBX |
(3671) 0x4c0c25 SHR $0x3,%EBX |
(3671) 0x4c0c28 CMP %RBX,%R11 |
(3671) 0x4c0c2b MOV %RBX,%RSI |
(3671) 0x4c0c2e CMOVB %R11,%RSI |
(3671) 0x4c0c32 TEST %RSI,%RSI |
(3671) 0x4c0c35 JE 4c0c52 |
(3671) 0x4c0c37 MOV %R10,%R8 |
(3671) 0x4c0c3a MOV %RSI,%R14 |
(3671) 0x4c0c3d NOPL (%RAX) |
(3676) 0x4c0c40 CMP %RDX,(%R15,%R8,8) |
(3676) 0x4c0c44 JE 4c0d2e |
(3676) 0x4c0c4a INC %R8 |
(3676) 0x4c0c4d DEC %R14 |
(3676) 0x4c0c50 JNE 4c0c40 |
(3671) 0x4c0c52 CMP %RBX,%R11 |
(3671) 0x4c0c55 JBE 4c0d19 |
(3671) 0x4c0c5b SUB %RSI,%R11 |
(3671) 0x4c0c5e MOV %R11,%RBX |
(3671) 0x4c0c61 AND $-0x10,%RBX |
(3671) 0x4c0c65 JE 4c0cba |
(3671) 0x4c0c67 LEA -0x1(%RBX),%R13 |
(3671) 0x4c0c6b LEA (%R10,%RSI,1),%R8 |
(3671) 0x4c0c6f MOV -0x50(%RBP),%R14 |
(3671) 0x4c0c73 LEA (%R14,%R8,8),%R15 |
(3671) 0x4c0c77 XOR %R14D,%R14D |
(3671) 0x4c0c7a NOPW (%RAX,%RAX,1) |
(3675) 0x4c0c80 VPCMPEQQ 0x20(%R15,%R14,8),%YMM0,%K0 |
(3675) 0x4c0c88 VPCMPEQQ (%R15,%R14,8),%YMM0,%K1 |
(3675) 0x4c0c8f VPCMPEQQ 0x60(%R15,%R14,8),%YMM0,%K2 |
(3675) 0x4c0c97 VPCMPEQQ 0x40(%R15,%R14,8),%YMM0,%K3 |
(3675) 0x4c0c9f KORB %K0,%K1,%K4 |
(3675) 0x4c0ca3 KORB %K2,%K3,%K5 |
(3675) 0x4c0ca7 KORTESTB %K5,%K4 |
(3675) 0x4c0cab JNE 4c0d5c |
(3675) 0x4c0cb1 ADD $0x10,%R14 |
(3675) 0x4c0cb5 CMP %R13,%R14 |
(3675) 0x4c0cb8 JBE 4c0c80 |
(3671) 0x4c0cba CMP %R11,%RBX |
(3671) 0x4c0cbd JAE 4c0d3c |
(3671) 0x4c0cbf ADD %RSI,%R10 |
(3671) 0x4c0cc2 ADD %RBX,%R10 |
(3671) 0x4c0cc5 MOV %R10,%R8 |
(3671) 0x4c0cc8 MOV -0x40(%RBP),%RBX |
(3671) 0x4c0ccc MOV -0x50(%RBP),%R15 |
(3671) 0x4c0cd0 MOV -0x38(%RBP),%R11 |
(3671) 0x4c0cd4 MOV -0x88(%RBP),%R13 |
(3671) 0x4c0cdb MOV -0x48(%RBP),%RSI |
(3671) 0x4c0cdf MOV -0x30(%RBP),%R14 |
(3671) 0x4c0ce3 MOV %RSI,-0x48(%RBP) |
(3671) 0x4c0ce7 NOPW (%RAX,%RAX,1) |
(3674) 0x4c0cf0 CMP %RDX,(%R15,%R8,8) |
(3674) 0x4c0cf4 JE 4c0d99 |
(3674) 0x4c0cfa INC %R8 |
(3674) 0x4c0cfd CMP %R8,%R9 |
(3674) 0x4c0d00 JNE 4c0cf0 |
(3671) 0x4c0d02 NOPW %CS:(%RAX,%RAX,1) |
(3671) 0x4c0d10 MOV -0x60(%RBP),%R9 |
(3671) 0x4c0d14 JMP 4c0bf7 |
(3671) 0x4c0d19 MOV -0x38(%RBP),%R11 |
(3671) 0x4c0d1d MOV -0x60(%RBP),%R9 |
(3671) 0x4c0d21 MOV -0x30(%RBP),%R14 |
(3671) 0x4c0d25 MOV -0x40(%RBP),%RBX |
(3671) 0x4c0d29 JMP 4c0bf7 |
(3671) 0x4c0d2e MOV -0x38(%RBP),%R11 |
(3671) 0x4c0d32 MOV -0x30(%RBP),%R14 |
(3671) 0x4c0d36 MOV -0x40(%RBP),%RBX |
(3671) 0x4c0d3a JMP 4c0d99 |
(3671) 0x4c0d3c MOV -0x40(%RBP),%RBX |
(3671) 0x4c0d40 MOV -0x50(%RBP),%R15 |
(3671) 0x4c0d44 MOV -0x38(%RBP),%R11 |
(3671) 0x4c0d48 MOV -0x88(%RBP),%R13 |
(3671) 0x4c0d4f MOV -0x60(%RBP),%R9 |
(3671) 0x4c0d53 MOV -0x30(%RBP),%R14 |
(3671) 0x4c0d57 JMP 4c0bf7 |
(3671) 0x4c0d5c KSHIFTLB $0x4,%K0,%K0 |
(3671) 0x4c0d62 KORB %K0,%K1,%K0 |
(3671) 0x4c0d66 KSHIFTLB $0x4,%K2,%K1 |
(3671) 0x4c0d6c KORB %K1,%K3,%K1 |
(3671) 0x4c0d70 KUNPCKBW %K0,%K1,%K0 |
(3671) 0x4c0d74 KMOVD %K0,%ESI |
(3671) 0x4c0d78 TZCNT %ESI,%ESI |
(3671) 0x4c0d7c ADD %R14,%R8 |
(3671) 0x4c0d7f ADD %RSI,%R8 |
(3671) 0x4c0d82 MOV -0x40(%RBP),%RBX |
(3671) 0x4c0d86 MOV -0x50(%RBP),%R15 |
(3671) 0x4c0d8a MOV -0x38(%RBP),%R11 |
(3671) 0x4c0d8e MOV -0x88(%RBP),%R13 |
(3671) 0x4c0d95 MOV -0x30(%RBP),%R14 |
(3671) 0x4c0d99 MOV -0xb0(%RBP),%R9 |
(3671) 0x4c0da0 MOV (%R9,%R8,8),%RSI |
(3671) 0x4c0da4 MOV 0x8(%R9,%R8,8),%R9 |
(3671) 0x4c0da9 JMP 4c0db3 |
0x4c0dab NOPL (%RAX,%RAX,1) |
(3673) 0x4c0db0 INC %RSI |
(3673) 0x4c0db3 CMP %R9,%RSI |
(3673) 0x4c0db6 JGE 4c0de0 |
(3673) 0x4c0db8 MOV -0x108(%RBP),%R10 |
(3673) 0x4c0dbf MOV (%R10,%RSI,8),%R10 |
(3673) 0x4c0dc3 CMP %RDX,(%R14,%R10,8) |
(3673) 0x4c0dc7 JGE 4c0db0 |
(3673) 0x4c0dc9 MOV %RDX,(%R14,%R10,8) |
(3673) 0x4c0dcd INC %RCX |
(3673) 0x4c0dd0 MOV -0xb0(%RBP),%R9 |
(3673) 0x4c0dd7 MOV 0x8(%R9,%R8,8),%R9 |
(3673) 0x4c0ddc JMP 4c0db0 |
0x4c0dde XCHG %AX,%AX |
(3671) 0x4c0de0 MOV -0xb8(%RBP),%R9 |
(3671) 0x4c0de7 MOV (%R9,%R8,8),%RSI |
(3671) 0x4c0deb MOV 0x8(%R9,%R8,8),%R9 |
(3671) 0x4c0df0 JMP 4c0e03 |
0x4c0df2 NOPW %CS:(%RAX,%RAX,1) |
(3672) 0x4c0e00 INC %RSI |
(3672) 0x4c0e03 CMP %R9,%RSI |
(3672) 0x4c0e06 JGE 4c0d10 |
(3672) 0x4c0e0c MOV -0x110(%RBP),%R10 |
(3672) 0x4c0e13 MOV (%R10,%RSI,8),%R10 |
(3672) 0x4c0e17 CMP %RDX,(%R12,%R10,8) |
(3672) 0x4c0e1b JGE 4c0e00 |
(3672) 0x4c0e1d MOV %RDX,(%R12,%R10,8) |
(3672) 0x4c0e21 INC %RAX |
(3672) 0x4c0e24 MOV -0xb8(%RBP),%R9 |
(3672) 0x4c0e2b MOV 0x8(%R9,%R8,8),%R9 |
(3672) 0x4c0e30 JMP 4c0e00 |
0x4c0e32 MOV -0xc0(%RBP),%RAX |
0x4c0e39 MOV (%RAX),%ESI |
0x4c0e3b MOV $0x537270,%EDI |
0x4c0e40 VZEROUPPER |
0x4c0e43 CALL 410560 <__kmpc_barrier@plt> |
0x4c0e48 MOV -0xc0(%RBP),%RAX |
0x4c0e4f CMPQ $0,-0xd8(%RBP) |
0x4c0e57 JNE 4c1090 |
0x4c0e5d MOV -0x118(%RBP),%RDI |
0x4c0e64 CMP $0x1,%RDI |
0x4c0e68 MOV -0xd0(%RBP),%R10 |
0x4c0e6f MOV -0xc8(%RBP),%R11 |
0x4c0e76 JLE 4c0fcc |
0x4c0e7c LEA -0x1(%RDI),%RAX |
0x4c0e80 LEA (%R11,%RAX,8),%RCX |
0x4c0e84 CMP %R10,%RCX |
0x4c0e87 JB 4c0ef1 |
0x4c0e89 LEA (%R10,%RAX,8),%RCX |
0x4c0e8d CMP %R11,%RCX |
0x4c0e90 JB 4c0ef1 |
0x4c0e92 LEA (%R10,%RDI,8),%RAX |
0x4c0e96 CMP %R11,%RAX |
0x4c0e99 JBE 4c0f9e |
0x4c0e9f LEA (%R11,%RDI,8),%RAX |
0x4c0ea3 CMP %R10,%RAX |
0x4c0ea6 JBE 4c0f9e |
0x4c0eac MOV $0x1,%EAX |
0x4c0eb1 NOPW %CS:(%RAX,%RAX,1) |
(3668) 0x4c0ec0 MOV -0x8(%R11,%RAX,8),%RCX |
(3668) 0x4c0ec5 LEA (%R11,%RAX,8),%RDX |
(3668) 0x4c0ec9 MOV (%RDX),%RSI |
(3668) 0x4c0ecc ADD %RCX,%RSI |
(3668) 0x4c0ecf MOV %RSI,(%RDX) |
(3668) 0x4c0ed2 MOV -0x8(%R10,%RAX,8),%RCX |
(3668) 0x4c0ed7 LEA (%R10,%RAX,8),%RDX |
(3668) 0x4c0edb MOV (%RDX),%RSI |
(3668) 0x4c0ede ADD %RCX,%RSI |
(3668) 0x4c0ee1 MOV %RSI,(%RDX) |
(3668) 0x4c0ee4 INC %RAX |
(3668) 0x4c0ee7 CMP %RAX,%RDI |
(3668) 0x4c0eea JNE 4c0ec0 |
0x4c0eec JMP 4c0fcc |
0x4c0ef1 MOV %RDI,%RBX |
0x4c0ef4 CMP $0x5,%RDI |
0x4c0ef8 JB 4c0f5d |
0x4c0efa MOV %RAX,%RCX |
0x4c0efd SHR $0x2,%RCX |
0x4c0f01 MOV (%R11),%RDX |
0x4c0f04 MOV (%R10),%RSI |
0x4c0f07 MOV $0x20,%EDI |
0x4c0f0c NOPL (%RAX) |
(3666) 0x4c0f10 LEA (%R11,%RDI,1),%R8 |
(3666) 0x4c0f14 ADD -0x18(%R8),%RDX |
(3666) 0x4c0f18 MOV %RDX,-0x18(%R8) |
(3666) 0x4c0f1c LEA (%R10,%RDI,1),%R9 |
(3666) 0x4c0f20 ADD -0x18(%R9),%RSI |
(3666) 0x4c0f24 MOV %RSI,-0x18(%R9) |
(3666) 0x4c0f28 ADD -0x10(%R8),%RDX |
(3666) 0x4c0f2c MOV %RDX,-0x10(%R8) |
(3666) 0x4c0f30 ADD -0x10(%R9),%RSI |
(3666) 0x4c0f34 MOV %RSI,-0x10(%R9) |
(3666) 0x4c0f38 ADD -0x8(%R8),%RDX |
(3666) 0x4c0f3c MOV %RDX,-0x8(%R8) |
(3666) 0x4c0f40 ADD -0x8(%R9),%RSI |
(3666) 0x4c0f44 MOV %RSI,-0x8(%R9) |
(3666) 0x4c0f48 ADD (%R8),%RDX |
(3666) 0x4c0f4b MOV %RDX,(%R8) |
(3666) 0x4c0f4e ADD (%R9),%RSI |
(3666) 0x4c0f51 MOV %RSI,(%R9) |
(3666) 0x4c0f54 ADD $0x20,%RDI |
(3666) 0x4c0f58 DEC %RCX |
(3666) 0x4c0f5b JNE 4c0f10 |
0x4c0f5d MOV %RAX,%RCX |
0x4c0f60 AND $-0x4,%RCX |
0x4c0f64 CMP %RAX,%RCX |
0x4c0f67 MOV %RBX,%RDI |
0x4c0f6a JAE 4c0fcc |
0x4c0f6c MOV (%R11,%RCX,8),%RAX |
0x4c0f70 MOV (%R10,%RCX,8),%RDX |
0x4c0f74 INC %RCX |
0x4c0f77 NOPW (%RAX,%RAX,1) |
(3665) 0x4c0f80 LEA (%R11,%RCX,8),%RSI |
(3665) 0x4c0f84 ADD (%RSI),%RAX |
(3665) 0x4c0f87 MOV %RAX,(%RSI) |
(3665) 0x4c0f8a LEA (%R10,%RCX,8),%RSI |
(3665) 0x4c0f8e ADD (%RSI),%RDX |
(3665) 0x4c0f91 MOV %RDX,(%RSI) |
(3665) 0x4c0f94 INC %RCX |
(3665) 0x4c0f97 CMP %RCX,%RDI |
(3665) 0x4c0f9a JNE 4c0f80 |
0x4c0f9c JMP 4c0fcc |
0x4c0f9e MOV (%R11),%RAX |
0x4c0fa1 MOV (%R10),%RCX |
0x4c0fa4 MOV $0x1,%EDX |
0x4c0fa9 NOPL (%RAX) |
(3667) 0x4c0fb0 LEA (%R11,%RDX,8),%RSI |
(3667) 0x4c0fb4 ADD (%RSI),%RAX |
(3667) 0x4c0fb7 MOV %RAX,(%RSI) |
(3667) 0x4c0fba LEA (%R10,%RDX,8),%RSI |
(3667) 0x4c0fbe ADD (%RSI),%RCX |
(3667) 0x4c0fc1 MOV %RCX,(%RSI) |
(3667) 0x4c0fc4 INC %RDX |
(3667) 0x4c0fc7 CMP %RDX,%RDI |
(3667) 0x4c0fca JNE 4c0fb0 |
0x4c0fcc MOV -0x8(%R11,%RDI,8),%RDX |
0x4c0fd1 MOV -0x8(%R10,%RDI,8),%RCX |
0x4c0fd6 MOV %RCX,-0x70(%RBP) |
0x4c0fda MOV -0x130(%RBP),%RBX |
0x4c0fe1 MOV -0xa0(%RBP),%RAX |
0x4c0fe8 MOV %RDX,(%RAX,%RBX,8) |
0x4c0fec MOV -0xa8(%RBP),%RAX |
0x4c0ff3 MOV %RCX,(%RAX,%RBX,8) |
0x4c0ff7 MOV %RBX,%RDI |
0x4c0ffa MOV %RBX,%RSI |
0x4c0ffd CALL 4daf70 <hypre_CSRMatrixCreate> |
0x4c1002 MOV %RAX,%R13 |
0x4c1005 MOV -0x128(%RBP),%RAX |
0x4c100c MOV %R13,(%RAX) |
0x4c100f MOV %RBX,%RDI |
0x4c1012 MOV -0x78(%RBP),%RSI |
0x4c1016 MOV -0x70(%RBP),%RDX |
0x4c101a CALL 4daf70 <hypre_CSRMatrixCreate> |
0x4c101f MOV %RAX,%RBX |
0x4c1022 MOV -0x120(%RBP),%RAX |
0x4c1029 MOV %RBX,(%RAX) |
0x4c102c MOV -0xa0(%RBP),%RAX |
0x4c1033 MOV %RAX,(%R13) |
0x4c1037 MOV %R13,%RDI |
0x4c103a CALL 4db050 <hypre_CSRMatrixInitialize> |
0x4c103f MOV 0x8(%R13),%RAX |
0x4c1043 MOV -0xf0(%RBP),%RCX |
0x4c104a MOV %RAX,(%RCX) |
0x4c104d MOV 0x30(%R13),%RAX |
0x4c1051 MOV -0xe8(%RBP),%RCX |
0x4c1058 MOV %RAX,(%RCX) |
0x4c105b MOV -0xa8(%RBP),%RAX |
0x4c1062 MOV %RAX,(%RBX) |
0x4c1065 MOV %RBX,%RDI |
0x4c1068 CALL 4db050 <hypre_CSRMatrixInitialize> |
0x4c106d MOV 0x8(%RBX),%RAX |
0x4c1071 MOV -0xf8(%RBP),%RCX |
0x4c1078 MOV %RAX,(%RCX) |
0x4c107b MOV 0x30(%RBX),%RAX |
0x4c107f MOV -0xe0(%RBP),%RCX |
0x4c1086 MOV %RAX,(%RCX) |
0x4c1089 MOV -0xc0(%RBP),%RAX |
0x4c1090 MOV (%RAX),%ESI |
0x4c1092 MOV $0x537290,%EDI |
0x4c1097 CALL 410560 <__kmpc_barrier@plt> |
0x4c109c MOV -0x100(%RBP),%RDX |
0x4c10a3 TEST %RDX,%RDX |
0x4c10a6 JLE 4c10b9 |
0x4c10a8 SAL $0x3,%RDX |
0x4c10ac MOV %R14,%RDI |
0x4c10af MOV $0xff,%ESI |
0x4c10b4 CALL 4f03c0 <_intel_fast_memset> |
0x4c10b9 MOV -0x78(%RBP),%RDX |
0x4c10bd TEST %RDX,%RDX |
0x4c10c0 JLE 4c10d3 |
0x4c10c2 SAL $0x3,%RDX |
0x4c10c6 MOV %R12,%RDI |
0x4c10c9 MOV $0xff,%ESI |
0x4c10ce CALL 4f03c0 <_intel_fast_memset> |
0x4c10d3 MOV -0xd8(%RBP),%RDX |
0x4c10da TEST %RDX,%RDX |
0x4c10dd JE 4c1109 |
0x4c10df MOV -0xc8(%RBP),%RAX |
0x4c10e6 MOV -0x8(%RAX,%RDX,8),%RAX |
0x4c10eb MOV -0xd0(%RBP),%RCX |
0x4c10f2 MOV -0x8(%RCX,%RDX,8),%RCX |
0x4c10f7 MOV -0x68(%RBP),%RDX |
0x4c10fb MOV -0x48(%RBP),%RSI |
0x4c10ff CMP %RDX,%RSI |
0x4c1102 JL 4c111e |
0x4c1104 JMP 4c155f |
0x4c1109 XOR %EAX,%EAX |
0x4c110b XOR %ECX,%ECX |
0x4c110d MOV -0x68(%RBP),%RDX |
0x4c1111 MOV -0x48(%RBP),%RSI |
0x4c1115 CMP %RDX,%RSI |
0x4c1118 JGE 4c155f |
0x4c111e MOV %R12,-0x98(%RBP) |
0x4c1125 JMP 4c1148 |
0x4c1127 NOPW (%RAX,%RAX,1) |
(3657) 0x4c1130 MOV -0x98(%RBP),%R12 |
(3657) 0x4c1137 MOV -0x68(%RBP),%RDX |
(3657) 0x4c113b MOV -0x48(%RBP),%RSI |
(3657) 0x4c113f CMP %RDX,%RSI |
(3657) 0x4c1142 JGE 4c155f |
(3657) 0x4c1148 MOV %RSI,%RDX |
(3657) 0x4c114b MOV -0xa0(%RBP),%RSI |
(3657) 0x4c1152 MOV %RAX,(%RSI,%RDX,8) |
(3657) 0x4c1156 MOV -0xa8(%RBP),%RSI |
(3657) 0x4c115d MOV %RCX,(%RSI,%RDX,8) |
(3657) 0x4c1161 MOV -0x80(%RBP),%R8 |
(3657) 0x4c1165 MOV (%R8,%RDX,8),%RSI |
(3657) 0x4c1169 LEA 0x1(%RDX),%RDI |
(3657) 0x4c116d MOV %RDI,-0x48(%RBP) |
(3657) 0x4c1171 CMP 0x8(%R8,%RDX,8),%RSI |
(3657) 0x4c1176 JGE 4c1270 |
(3657) 0x4c117c MOV -0xf0(%RBP),%RDI |
(3657) 0x4c1183 MOV (%RDI),%RDI |
(3657) 0x4c1186 MOV -0xe8(%RBP),%R8 |
(3657) 0x4c118d MOV (%R8),%R8 |
(3657) 0x4c1190 MOV -0x138(%RBP),%R10 |
(3657) 0x4c1197 MOV -0x60(%RBP),%R14 |
(3657) 0x4c119b MOV -0x80(%RBP),%RBX |
(3657) 0x4c119f MOV -0x48(%RBP),%R13 |
(3657) 0x4c11a3 MOV -0x30(%RBP),%R11 |
(3657) 0x4c11a7 NOPW (%RAX,%RAX,1) |
(3664) 0x4c11b0 MOV (%R14,%RSI,8),%R9 |
(3664) 0x4c11b4 MOV %R9,(%RDI,%RAX,8) |
(3664) 0x4c11b8 VMOVQ (%R10,%RSI,8),%XMM0 |
(3664) 0x4c11be VMOVQ %XMM0,(%R8,%RAX,8) |
(3664) 0x4c11c4 MOV %RAX,(%R11,%R9,8) |
(3664) 0x4c11c8 INC %RAX |
(3664) 0x4c11cb INC %RSI |
(3664) 0x4c11ce CMP (%RBX,%R13,8),%RSI |
(3664) 0x4c11d2 JL 4c11b0 |
(3657) 0x4c11d4 MOV -0x90(%RBP),%RDI |
(3657) 0x4c11db MOV (%RDI,%RDX,8),%RSI |
(3657) 0x4c11df CMP (%RDI,%R13,8),%RSI |
(3657) 0x4c11e3 JGE 4c1289 |
(3657) 0x4c11e9 MOV -0xf8(%RBP),%RDI |
(3657) 0x4c11f0 MOV (%RDI),%RDI |
(3657) 0x4c11f3 MOV -0xe0(%RBP),%R8 |
(3657) 0x4c11fa MOV (%R8),%R8 |
(3657) 0x4c11fd MOV -0x30(%RBP),%R14 |
(3657) 0x4c1201 MOV -0x88(%RBP),%R13 |
(3657) 0x4c1208 MOV -0x38(%RBP),%R11 |
(3657) 0x4c120c MOV -0x48(%RBP),%R10 |
(3657) 0x4c1210 MOV -0x90(%RBP),%RBX |
(3657) 0x4c1217 MOV -0x58(%RBP),%R12 |
(3657) 0x4c121b MOV -0x98(%RBP),%R15 |
(3657) 0x4c1222 NOPW %CS:(%RAX,%RAX,1) |
(3656) 0x4c1230 MOV (%R12,%RSI,8),%R9 |
(3656) 0x4c1234 MOV %R9,(%RDI,%RCX,8) |
(3656) 0x4c1238 VMOVQ (%R13,%RSI,8),%XMM0 |
(3656) 0x4c123f VMOVQ %XMM0,(%R8,%RCX,8) |
(3656) 0x4c1245 MOV %RCX,(%R15,%R9,8) |
(3656) 0x4c1249 INC %RCX |
(3656) 0x4c124c INC %RSI |
(3656) 0x4c124f CMP (%RBX,%R10,8),%RSI |
(3656) 0x4c1253 JL 4c1230 |
(3657) 0x4c1255 MOV -0x40(%RBP),%RBX |
(3657) 0x4c1259 TEST %RBX,%RBX |
(3657) 0x4c125c JG 4c129e |
(3657) 0x4c125e JMP 4c1130 |
0x4c1263 NOPW %CS:(%RAX,%RAX,1) |
(3657) 0x4c1270 MOV -0x48(%RBP),%R13 |
(3657) 0x4c1274 MOV -0x90(%RBP),%RDI |
(3657) 0x4c127b MOV (%RDI,%RDX,8),%RSI |
(3657) 0x4c127f CMP (%RDI,%R13,8),%RSI |
(3657) 0x4c1283 JL 4c11e9 |
(3657) 0x4c1289 MOV -0x30(%RBP),%R14 |
(3657) 0x4c128d MOV -0x38(%RBP),%R11 |
(3657) 0x4c1291 MOV -0x40(%RBP),%RBX |
(3657) 0x4c1295 TEST %RBX,%RBX |
(3657) 0x4c1298 JLE 4c1130 |
(3657) 0x4c129e VPBROADCASTQ %RDX,%YMM0 |
(3657) 0x4c12a4 XOR %ESI,%ESI |
(3657) 0x4c12a6 MOV -0x58(%RBP),%R10 |
(3657) 0x4c12aa MOV -0x50(%RBP),%R15 |
(3657) 0x4c12ae JMP 4c12c6 |
(3658) 0x4c12b0 MOV %R12,%R10 |
(3658) 0x4c12b3 MOV -0x98(%RBP),%R12 |
(3658) 0x4c12ba INC %RSI |
(3658) 0x4c12bd CMP %RBX,%RSI |
(3658) 0x4c12c0 JE 4c1137 |
(3658) 0x4c12c6 MOV %R10,%R12 |
(3658) 0x4c12c9 MOV (%R11,%RSI,8),%R9 |
(3658) 0x4c12cd MOV 0x8(%R11,%RSI,8),%R8 |
(3658) 0x4c12d2 MOV %R8,%R10 |
(3658) 0x4c12d5 SUB %R9,%R10 |
(3658) 0x4c12d8 JLE 4c12b0 |
(3658) 0x4c12da LEA (%R15,%R9,8),%EDI |
(3658) 0x4c12de AND $0x7f,%EDI |
(3658) 0x4c12e1 MOV $0x80,%EBX |
(3658) 0x4c12e6 SUB %EDI,%EBX |
(3658) 0x4c12e8 SHR $0x3,%EBX |
(3658) 0x4c12eb CMP %RBX,%R10 |
(3658) 0x4c12ee MOV %RBX,%R11 |
(3658) 0x4c12f1 CMOVB %R10,%R11 |
(3658) 0x4c12f5 TEST %R11,%R11 |
(3658) 0x4c12f8 MOV -0x98(%RBP),%R12 |
(3658) 0x4c12ff JE 4c1322 |
(3658) 0x4c1301 MOV %R9,%RDI |
(3658) 0x4c1304 MOV %R11,%R14 |
(3658) 0x4c1307 NOPW (%RAX,%RAX,1) |
(3663) 0x4c1310 CMP %RDX,(%R15,%RDI,8) |
(3663) 0x4c1314 JE 4c141c |
(3663) 0x4c131a INC %RDI |
(3663) 0x4c131d DEC %R14 |
(3663) 0x4c1320 JNE 4c1310 |
(3658) 0x4c1322 CMP %RBX,%R10 |
(3658) 0x4c1325 JBE 4c13c3 |
(3658) 0x4c132b SUB %R11,%R10 |
(3658) 0x4c132e MOV %R10,%RBX |
(3658) 0x4c1331 AND $-0x10,%RBX |
(3658) 0x4c1335 JE 4c1386 |
(3658) 0x4c1337 LEA -0x1(%RBX),%R13 |
(3658) 0x4c133b LEA (%R9,%R11,1),%RDI |
(3658) 0x4c133f MOV -0x50(%RBP),%R14 |
(3658) 0x4c1343 LEA (%R14,%RDI,8),%R15 |
(3658) 0x4c1347 XOR %R14D,%R14D |
(3658) 0x4c134a NOPW (%RAX,%RAX,1) |
(3662) 0x4c1350 VPCMPEQQ 0x20(%R15,%R14,8),%YMM0,%K0 |
(3662) 0x4c1358 VPCMPEQQ (%R15,%R14,8),%YMM0,%K1 |
(3662) 0x4c135f VPCMPEQQ 0x60(%R15,%R14,8),%YMM0,%K2 |
(3662) 0x4c1367 VPCMPEQQ 0x40(%R15,%R14,8),%YMM0,%K3 |
(3662) 0x4c136f KORB %K0,%K1,%K4 |
(3662) 0x4c1373 KORB %K2,%K3,%K5 |
(3662) 0x4c1377 KORTESTB %K5,%K4 |
(3662) 0x4c137b JNE 4c13f1 |
(3662) 0x4c137d ADD $0x10,%R14 |
(3662) 0x4c1381 CMP %R13,%R14 |
(3662) 0x4c1384 JBE 4c1350 |
(3658) 0x4c1386 CMP %R10,%RBX |
(3658) 0x4c1389 JAE 4c13d8 |
(3658) 0x4c138b ADD %R11,%R9 |
(3658) 0x4c138e ADD %RBX,%R9 |
(3658) 0x4c1391 MOV %R9,%RDI |
(3658) 0x4c1394 MOV -0x40(%RBP),%RBX |
(3658) 0x4c1398 MOV -0x50(%RBP),%R15 |
(3658) 0x4c139c MOV -0x38(%RBP),%R11 |
(3658) 0x4c13a0 MOV -0x58(%RBP),%R10 |
(3658) 0x4c13a4 MOV -0x30(%RBP),%R14 |
(3658) 0x4c13a8 NOPL (%RAX,%RAX,1) |
(3661) 0x4c13b0 CMP %RDX,(%R15,%RDI,8) |
(3661) 0x4c13b4 JE 4c1420 |
(3661) 0x4c13b6 INC %RDI |
(3661) 0x4c13b9 CMP %RDI,%R8 |
(3661) 0x4c13bc JNE 4c13b0 |
(3658) 0x4c13be JMP 4c12ba |
(3658) 0x4c13c3 MOV -0x38(%RBP),%R11 |
(3658) 0x4c13c7 MOV -0x58(%RBP),%R10 |
(3658) 0x4c13cb MOV -0x30(%RBP),%R14 |
(3658) 0x4c13cf MOV -0x40(%RBP),%RBX |
(3658) 0x4c13d3 JMP 4c12ba |
(3658) 0x4c13d8 MOV -0x40(%RBP),%RBX |
(3658) 0x4c13dc MOV -0x50(%RBP),%R15 |
(3658) 0x4c13e0 MOV -0x38(%RBP),%R11 |
(3658) 0x4c13e4 MOV -0x58(%RBP),%R10 |
(3658) 0x4c13e8 MOV -0x30(%RBP),%R14 |
(3658) 0x4c13ec JMP 4c12ba |
(3658) 0x4c13f1 KSHIFTLB $0x4,%K0,%K0 |
(3658) 0x4c13f7 KORB %K0,%K1,%K0 |
(3658) 0x4c13fb KSHIFTLB $0x4,%K2,%K1 |
(3658) 0x4c1401 KORB %K1,%K3,%K1 |
(3658) 0x4c1405 KUNPCKBW %K0,%K1,%K0 |
(3658) 0x4c1409 KMOVD %K0,%R8D |
(3658) 0x4c140d TZCNT %R8D,%R8D |
(3658) 0x4c1412 ADD %R14,%RDI |
(3658) 0x4c1415 ADD %R8,%RDI |
(3658) 0x4c1418 MOV -0x50(%RBP),%R15 |
(3658) 0x4c141c MOV -0x30(%RBP),%R14 |
(3658) 0x4c1420 MOV -0xb0(%RBP),%R9 |
(3658) 0x4c1427 MOV (%R9,%RDI,8),%R8 |
(3658) 0x4c142b MOV 0x8(%R9,%RDI,8),%R10 |
(3658) 0x4c1430 CMP %R10,%R8 |
(3658) 0x4c1433 JGE 4c14be |
(3658) 0x4c1439 MOV -0xe8(%RBP),%R9 |
(3658) 0x4c1440 MOV (%R9),%R9 |
(3658) 0x4c1443 JMP 4c1464 |
0x4c1445 NOPW %CS:(%RAX,%RAX,1) |
(3660) 0x4c1450 VADDSD (%R9,%RBX,8),%XMM1,%XMM1 |
(3660) 0x4c1456 VMOVSD %XMM1,(%R9,%RBX,8) |
(3660) 0x4c145c INC %R8 |
(3660) 0x4c145f CMP %R10,%R8 |
(3660) 0x4c1462 JGE 4c14be |
(3660) 0x4c1464 MOV -0x108(%RBP),%R11 |
(3660) 0x4c146b MOV (%R11,%R8,8),%R11 |
(3660) 0x4c146f MOV (%R14,%R11,8),%RBX |
(3660) 0x4c1473 MOV -0x140(%RBP),%R13 |
(3660) 0x4c147a VMOVSD (%R13,%R8,8),%XMM1 |
(3660) 0x4c1481 MOV -0xa0(%RBP),%R13 |
(3660) 0x4c1488 CMP (%R13,%RDX,8),%RBX |
(3660) 0x4c148d JGE 4c1450 |
(3660) 0x4c148f MOV -0xf0(%RBP),%R10 |
(3660) 0x4c1496 MOV (%R10),%R10 |
(3660) 0x4c1499 MOV %R11,(%R10,%RAX,8) |
(3660) 0x4c149d VMOVSD %XMM1,(%R9,%RAX,8) |
(3660) 0x4c14a3 MOV %RAX,(%R14,%R11,8) |
(3660) 0x4c14a7 INC %RAX |
(3660) 0x4c14aa MOV -0xb0(%RBP),%R10 |
(3660) 0x4c14b1 MOV 0x8(%R10,%RDI,8),%R10 |
(3660) 0x4c14b6 INC %R8 |
(3660) 0x4c14b9 CMP %R10,%R8 |
(3660) 0x4c14bc JL 4c1464 |
(3658) 0x4c14be MOV -0xb8(%RBP),%R9 |
(3658) 0x4c14c5 MOV (%R9,%RDI,8),%R8 |
(3658) 0x4c14c9 MOV 0x8(%R9,%RDI,8),%R10 |
(3658) 0x4c14ce CMP %R10,%R8 |
(3658) 0x4c14d1 JGE 4c154e |
(3658) 0x4c14d3 MOV -0xe0(%RBP),%R9 |
(3658) 0x4c14da MOV (%R9),%R9 |
(3658) 0x4c14dd JMP 4c14f4 |
0x4c14df NOP |
(3659) 0x4c14e0 VADDSD (%R9,%RBX,8),%XMM1,%XMM1 |
(3659) 0x4c14e6 VMOVSD %XMM1,(%R9,%RBX,8) |
(3659) 0x4c14ec INC %R8 |
(3659) 0x4c14ef CMP %R10,%R8 |
(3659) 0x4c14f2 JGE 4c154e |
(3659) 0x4c14f4 MOV -0x110(%RBP),%R11 |
(3659) 0x4c14fb MOV (%R11,%R8,8),%R11 |
(3659) 0x4c14ff MOV (%R12,%R11,8),%RBX |
(3659) 0x4c1503 MOV -0x148(%RBP),%R13 |
(3659) 0x4c150a VMOVSD (%R13,%R8,8),%XMM1 |
(3659) 0x4c1511 MOV -0xa8(%RBP),%R13 |
(3659) 0x4c1518 CMP (%R13,%RDX,8),%RBX |
(3659) 0x4c151d JGE 4c14e0 |
(3659) 0x4c151f MOV -0xf8(%RBP),%R10 |
(3659) 0x4c1526 MOV (%R10),%R10 |
(3659) 0x4c1529 MOV %R11,(%R10,%RCX,8) |
(3659) 0x4c152d VMOVSD %XMM1,(%R9,%RCX,8) |
(3659) 0x4c1533 MOV %RCX,(%R12,%R11,8) |
(3659) 0x4c1537 INC %RCX |
(3659) 0x4c153a MOV -0xb8(%RBP),%R10 |
(3659) 0x4c1541 MOV 0x8(%R10,%RDI,8),%R10 |
(3659) 0x4c1546 INC %R8 |
(3659) 0x4c1549 CMP %R10,%R8 |
(3659) 0x4c154c JL 4c14f4 |
(3658) 0x4c154e MOV -0x58(%RBP),%R10 |
(3658) 0x4c1552 MOV -0x40(%RBP),%RBX |
(3658) 0x4c1556 MOV -0x38(%RBP),%R11 |
(3658) 0x4c155a JMP 4c12ba |
0x4c155f MOV %R14,%RDI |
0x4c1562 VZEROUPPER |
0x4c1565 CALL 4e7390 <hypre_Free> |
0x4c156a MOV %R12,%RDI |
0x4c156d ADD $0x128,%RSP |
0x4c1574 POP %RBX |
0x4c1575 POP %R12 |
0x4c1577 POP %R13 |
0x4c1579 POP %R14 |
0x4c157b POP %R15 |
0x4c157d POP %RBP |
0x4c157e JMP 4e7390 |
0x4c1583 NOPW %CS:(%RAX,%RAX,1) |
0x4c158d NOPL (%RAX) |
Path / |
Source file and lines | par_csr_matop.c:3454-3640 |
Module | exec |
nb instructions | 285 |
nb uops | 309 |
loop length | 1283 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 60 |
micro-operation queue | 51.50 cycles |
front end | 51.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 13.50 | 13.40 | 28.00 | 28.00 | 34.50 | 13.40 | 13.30 | 34.50 | 34.50 | 34.50 | 13.40 | 28.00 |
cycles | 13.50 | 16.00 | 28.00 | 28.00 | 34.50 | 13.40 | 13.30 | 34.50 | 34.50 | 34.50 | 13.40 | 28.00 |
Cycles executing div or sqrt instructions | 16.00 |
FE+BE cycles | 48.35-48.40 |
Stall cycles | 0.00 |
Front-end | 51.50 |
Dispatch | 34.50 |
DIV/SQRT | 16.00 |
Overall L1 | 51.50 |
all | 2% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 5% |
all | 12% |
load | 11% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 11% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x128,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,-0xe8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x128(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x100(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xb8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xb0(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x98(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xf8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x90(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x88(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x80(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x78(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x70(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x68(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x60(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x148(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x110(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x140(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x108(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x120(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x18(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 4e8fe0 <hypre_NumActiveThreads> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %RCX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R15,-0x130(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x118(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 4c0a14 <hypre_ParTMatmul.extracted+0x164> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %RCX | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 4c0a21 <hypre_ParTMatmul.extracted+0x171> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %R15D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %ECX | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV %EDX,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %EAX,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4e8ff0 <hypre_GetThreadNum> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x1(%RAX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RCX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %R15,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R12,-0x138(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,-0xd8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4c0a58 <hypre_ParTMatmul.extracted+0x1a8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INC %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %RAX,%R14 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R14,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RDX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c0a6a <hypre_ParTMatmul.extracted+0x1ba> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
IMUL %RAX,%R14 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R14,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %R15,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x50(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x100(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4e72c0 <hypre_CAlloc> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x78(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 4e72c0 <hypre_CAlloc> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R12,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
TEST %RCX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4c0ab3 <hypre_ParTMatmul.extracted+0x203> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (,%RCX,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4f03c0 <_intel_fast_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x78(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4c0ad1 <hypre_ParTMatmul.extracted+0x221> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (,%RAX,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4f03c0 <_intel_fast_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP -0x68(%RBP),%RAX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV %RBX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x38(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x60(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4c0e32 <hypre_ParTMatmul.extracted+0x582> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x48(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4c0b2e <hypre_ParTMatmul.extracted+0x27e> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0xc0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x537270,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 410560 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0xc0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMPQ $0,-0xd8(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JNE 4c1090 <hypre_ParTMatmul.extracted+0x7e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x118(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x1,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0xd0(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xc8(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4c0fcc <hypre_ParTMatmul.extracted+0x71c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RDI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R11,%RAX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R10,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4c0ef1 <hypre_ParTMatmul.extracted+0x641> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R10,%RAX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R11,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4c0ef1 <hypre_ParTMatmul.extracted+0x641> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R10,%RDI,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R11,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JBE 4c0f9e <hypre_ParTMatmul.extracted+0x6ee> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R11,%RDI,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R10,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JBE 4c0f9e <hypre_ParTMatmul.extracted+0x6ee> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x1,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4c0fcc <hypre_ParTMatmul.extracted+0x71c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP $0x5,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4c0f5d <hypre_ParTMatmul.extracted+0x6ad> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x2,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV (%R11),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x20,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JAE 4c0fcc <hypre_ParTMatmul.extracted+0x71c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R11,%RCX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10,%RCX,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
INC %RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4c0fcc <hypre_ParTMatmul.extracted+0x71c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV (%R11),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x8(%R11,%RDI,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%R10,%RDI,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x130(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,(%RAX,%RBX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xa8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,(%RAX,%RBX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RBX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4daf70 <hypre_CSRMatrixCreate> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x128(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,(%RAX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x78(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x70(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 4daf70 <hypre_CSRMatrixCreate> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x120(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,(%RAX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%R13) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4db050 <hypre_CSRMatrixInitialize> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x8(%R13),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xf0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%R13),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xe8(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xa8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RBX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4db050 <hypre_CSRMatrixInitialize> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x8(%RBX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xf8(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RBX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xe0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xc0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x537290,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 410560 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x100(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4c10b9 <hypre_ParTMatmul.extracted+0x809> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4f03c0 <_intel_fast_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x78(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4c10d3 <hypre_ParTMatmul.extracted+0x823> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4f03c0 <_intel_fast_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0xd8(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 4c1109 <hypre_ParTMatmul.extracted+0x859> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xc8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%RAX,%RDX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xd0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%RCX,%RDX,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x68(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x48(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 4c111e <hypre_ParTMatmul.extracted+0x86e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4c155f <hypre_ParTMatmul.extracted+0xcaf> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x68(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x48(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c155f <hypre_ParTMatmul.extracted+0xcaf> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c1148 <hypre_ParTMatmul.extracted+0x898> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4e7390 <hypre_Free> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
ADD $0x128,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
JMP 4e7390 <hypre_Free> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | par_csr_matop.c:3454-3640 |
Module | exec |
nb instructions | 285 |
nb uops | 309 |
loop length | 1283 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 60 |
micro-operation queue | 51.50 cycles |
front end | 51.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 13.50 | 13.40 | 28.00 | 28.00 | 34.50 | 13.40 | 13.30 | 34.50 | 34.50 | 34.50 | 13.40 | 28.00 |
cycles | 13.50 | 16.00 | 28.00 | 28.00 | 34.50 | 13.40 | 13.30 | 34.50 | 34.50 | 34.50 | 13.40 | 28.00 |
Cycles executing div or sqrt instructions | 16.00 |
FE+BE cycles | 48.35-48.40 |
Stall cycles | 0.00 |
Front-end | 51.50 |
Dispatch | 34.50 |
DIV/SQRT | 16.00 |
Overall L1 | 51.50 |
all | 2% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 5% |
all | 12% |
load | 11% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 11% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x128,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,-0xe8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x128(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x100(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xb8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xb0(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x98(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xf8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x90(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x88(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x80(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x78(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x70(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x68(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x60(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x148(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x110(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x140(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x108(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x120(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x18(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 4e8fe0 <hypre_NumActiveThreads> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %RCX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R15,-0x130(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x118(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 4c0a14 <hypre_ParTMatmul.extracted+0x164> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %RCX | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 4c0a21 <hypre_ParTMatmul.extracted+0x171> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %R15D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %ECX | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV %EDX,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %EAX,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4e8ff0 <hypre_GetThreadNum> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x1(%RAX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RCX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %R15,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R12,-0x138(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,-0xd8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4c0a58 <hypre_ParTMatmul.extracted+0x1a8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INC %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %RAX,%R14 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R14,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RDX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c0a6a <hypre_ParTMatmul.extracted+0x1ba> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
IMUL %RAX,%R14 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R14,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %R15,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x50(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x100(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4e72c0 <hypre_CAlloc> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x78(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 4e72c0 <hypre_CAlloc> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R12,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
TEST %RCX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4c0ab3 <hypre_ParTMatmul.extracted+0x203> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (,%RCX,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4f03c0 <_intel_fast_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x78(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4c0ad1 <hypre_ParTMatmul.extracted+0x221> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (,%RAX,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4f03c0 <_intel_fast_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP -0x68(%RBP),%RAX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV %RBX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x38(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x60(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4c0e32 <hypre_ParTMatmul.extracted+0x582> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x48(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4c0b2e <hypre_ParTMatmul.extracted+0x27e> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0xc0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x537270,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 410560 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0xc0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMPQ $0,-0xd8(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JNE 4c1090 <hypre_ParTMatmul.extracted+0x7e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x118(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x1,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0xd0(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xc8(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4c0fcc <hypre_ParTMatmul.extracted+0x71c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RDI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R11,%RAX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R10,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4c0ef1 <hypre_ParTMatmul.extracted+0x641> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R10,%RAX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R11,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4c0ef1 <hypre_ParTMatmul.extracted+0x641> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R10,%RDI,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R11,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JBE 4c0f9e <hypre_ParTMatmul.extracted+0x6ee> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R11,%RDI,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R10,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JBE 4c0f9e <hypre_ParTMatmul.extracted+0x6ee> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x1,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4c0fcc <hypre_ParTMatmul.extracted+0x71c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP $0x5,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4c0f5d <hypre_ParTMatmul.extracted+0x6ad> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x2,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV (%R11),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x20,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JAE 4c0fcc <hypre_ParTMatmul.extracted+0x71c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R11,%RCX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10,%RCX,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
INC %RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4c0fcc <hypre_ParTMatmul.extracted+0x71c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV (%R11),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x8(%R11,%RDI,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%R10,%RDI,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x130(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,(%RAX,%RBX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xa8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,(%RAX,%RBX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RBX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4daf70 <hypre_CSRMatrixCreate> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x128(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,(%RAX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x78(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x70(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 4daf70 <hypre_CSRMatrixCreate> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x120(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,(%RAX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%R13) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4db050 <hypre_CSRMatrixInitialize> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x8(%R13),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xf0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%R13),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xe8(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xa8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RBX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4db050 <hypre_CSRMatrixInitialize> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x8(%RBX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xf8(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RBX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xe0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xc0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x537290,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 410560 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x100(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4c10b9 <hypre_ParTMatmul.extracted+0x809> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4f03c0 <_intel_fast_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x78(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4c10d3 <hypre_ParTMatmul.extracted+0x823> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4f03c0 <_intel_fast_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0xd8(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 4c1109 <hypre_ParTMatmul.extracted+0x859> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xc8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%RAX,%RDX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xd0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%RCX,%RDX,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x68(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x48(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 4c111e <hypre_ParTMatmul.extracted+0x86e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4c155f <hypre_ParTMatmul.extracted+0xcaf> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x68(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x48(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c155f <hypre_ParTMatmul.extracted+0xcaf> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c1148 <hypre_ParTMatmul.extracted+0x898> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4e7390 <hypre_Free> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
ADD $0x128,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
JMP 4e7390 <hypre_Free> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_ParTMatmul.extracted– | 0.07 | 0.01 |
○Loop 3668 - par_csr_matop.c:3537-3540 - exec | 0 | 0 |
○Loop 3667 - par_csr_matop.c:3537-3540 - exec | 0 | 0 |
▼Loop 3657 - par_csr_matop.c:3467-3634 - exec– | 0 | 0 |
○Loop 3664 - par_csr_matop.c:3590-3596 - exec | 0.01 | 0.01 |
○Loop 3656 - par_csr_matop.c:3598-3604 - exec | 0 | 0 |
▼Loop 3658 - par_csr_matop.c:3467-3634 - exec– | 0 | 0 |
○Loop 3662 - par_csr_matop.c:3505-3608 - exec | 0.02 | 0.01 |
○Loop 3661 - par_csr_matop.c:3607-3608 - exec | 0 | 0 |
○Loop 3663 - par_csr_matop.c:3607-3608 - exec | 0 | 0 |
○Loop 3659 - par_csr_matop.c:3623-3634 - exec | 0 | 0 |
○Loop 3660 - par_csr_matop.c:3610-3621 - exec | 0 | 0 |
○Loop 3666 - par_csr_matop.c:3537-3540 - exec | 0 | 0 |
○Loop 3665 - par_csr_matop.c:3537-3540 - exec | 0 | 0 |
▼Loop 3670 - par_csr_matop.c:3467-3528 - exec– | 0 | 0 |
○Loop 3677 - par_csr_matop.c:3491-3495 - exec | 0.01 | 0 |
▼Loop 3671 - par_csr_matop.c:3467-3522 - exec– | 0 | 0 |
○Loop 3675 - par_csr_matop.c:3504-3505 - exec | 0.03 | 0.01 |
○Loop 3673 - par_csr_matop.c:3507-3513 - exec | 0 | 0 |
○Loop 3672 - par_csr_matop.c:3516-3522 - exec | 0 | 0 |
○Loop 3676 - par_csr_matop.c:3504-3505 - exec | 0 | 0 |
○Loop 3674 - par_csr_matop.c:3504-3505 - exec | 0 | 0 |
○Loop 3669 - par_csr_matop.c:3497-3501 - exec | 0 | 0 |