Function: hypre_ParTMatmul.extracted | Module: libparcsr_mv.so | Source: par_csr_matop.c:3454-3640 [...] | Coverage: 0.06% |
---|
Function: hypre_ParTMatmul.extracted | Module: libparcsr_mv.so | Source: par_csr_matop.c:3454-3640 [...] | Coverage: 0.06% |
---|
/home/eoseret/qaas_runs_CPU_9468/171-147-2675/intel/AMG/build/AMG/AMG/parcsr_mv/par_csr_matop.c: 3454 - 3640 |
-------------------------------------------------------------------------------- |
3454: #pragma omp parallel |
[...] |
3462: HYPRE_Int num_threads = hypre_NumActiveThreads(); |
3463: |
3464: size = num_cols_diag_A/num_threads; |
3465: rest = num_cols_diag_A - size*num_threads; |
3466: ii = hypre_GetThreadNum(); |
3467: if (ii < rest) |
3468: { |
3469: ns = ii*size+ii; |
3470: ne = (ii+1)*size+ii+1; |
3471: } |
3472: else |
3473: { |
3474: ns = ii*size+rest; |
3475: ne = (ii+1)*size+rest; |
3476: } |
3477: |
3478: B_marker = hypre_CTAlloc(HYPRE_Int, num_cols_diag_B); |
3479: B_marker_offd = hypre_CTAlloc(HYPRE_Int, num_cols_offd_C); |
3480: |
3481: for (ik = 0; ik < num_cols_diag_B; ik++) |
3482: B_marker[ik] = -1; |
3483: |
3484: for (ik = 0; ik < num_cols_offd_C; ik++) |
3485: B_marker_offd[ik] = -1; |
3486: |
3487: nnz_d = 0; |
3488: nnz_o = 0; |
3489: for (ik = ns; ik < ne; ik++) |
3490: { |
3491: for (jk = C_tmp_diag_i[ik]; jk < C_tmp_diag_i[ik+1]; jk++) |
3492: { |
3493: jcol = C_tmp_diag_j[jk]; |
3494: B_marker[jcol] = ik; |
3495: nnz_d++; |
3496: } |
3497: for (jk = C_tmp_offd_i[ik]; jk < C_tmp_offd_i[ik+1]; jk++) |
3498: { |
3499: jcol = C_tmp_offd_j[jk]; |
3500: B_marker_offd[jcol] = ik; |
3501: nnz_o++; |
3502: } |
3503: for (jk = 0; jk < num_sends_A; jk++) |
3504: for (j1 = send_map_starts_A[jk]; j1 < send_map_starts_A[jk+1]; j1++) |
3505: if (send_map_elmts_A[j1] == ik) |
3506: { |
3507: for (j2 = C_ext_diag_i[j1]; j2 < C_ext_diag_i[j1+1]; j2++) |
3508: { |
3509: jcol = C_ext_diag_j[j2]; |
3510: if (B_marker[jcol] < ik) |
3511: { |
3512: B_marker[jcol] = ik; |
3513: nnz_d++; |
3514: } |
3515: } |
3516: for (j2 = C_ext_offd_i[j1]; j2 < C_ext_offd_i[j1+1]; j2++) |
3517: { |
3518: jcol = C_ext_offd_j[j2]; |
3519: if (B_marker_offd[jcol] < ik) |
3520: { |
3521: B_marker_offd[jcol] = ik; |
3522: nnz_o++; |
3523: } |
3524: } |
3525: break; |
3526: } |
3527: C_diag_array[ii] = nnz_d; |
3528: C_offd_array[ii] = nnz_o; |
3529: } |
3530: #ifdef HYPRE_USING_OPENMP |
3531: #pragma omp barrier |
3532: #endif |
3533: if (ii == 0) |
3534: { |
3535: nnz_d = 0; |
3536: nnz_o = 0; |
3537: for (ik = 0; ik < num_threads-1; ik++) |
3538: { |
3539: C_diag_array[ik+1] += C_diag_array[ik]; |
3540: C_offd_array[ik+1] += C_offd_array[ik]; |
3541: } |
3542: nnz_d = C_diag_array[num_threads-1]; |
3543: nnz_o = C_offd_array[num_threads-1]; |
3544: C_diag_i[num_cols_diag_A] = nnz_d; |
3545: C_offd_i[num_cols_diag_A] = nnz_o; |
3546: |
3547: C_diag = hypre_CSRMatrixCreate(num_cols_diag_A, num_cols_diag_A, nnz_d); |
3548: C_offd = hypre_CSRMatrixCreate(num_cols_diag_A, num_cols_offd_C, nnz_o); |
3549: hypre_CSRMatrixI(C_diag) = C_diag_i; |
3550: hypre_CSRMatrixInitialize(C_diag); |
3551: C_diag_j = hypre_CSRMatrixJ(C_diag); |
3552: C_diag_data = hypre_CSRMatrixData(C_diag); |
3553: hypre_CSRMatrixI(C_offd) = C_offd_i; |
3554: hypre_CSRMatrixInitialize(C_offd); |
3555: C_offd_j = hypre_CSRMatrixJ(C_offd); |
3556: C_offd_data = hypre_CSRMatrixData(C_offd); |
[...] |
3568: for (ik = 0; ik < num_cols_diag_B; ik++) |
3569: B_marker[ik] = -1; |
3570: |
3571: for (ik = 0; ik < num_cols_offd_C; ik++) |
3572: B_marker_offd[ik] = -1; |
[...] |
3581: if (ii) |
3582: { |
3583: nnz_d = C_diag_array[ii-1]; |
3584: nnz_o = C_offd_array[ii-1]; |
3585: } |
3586: for (ik = ns; ik < ne; ik++) |
3587: { |
3588: C_diag_i[ik] = nnz_d; |
3589: C_offd_i[ik] = nnz_o; |
3590: for (jk = C_tmp_diag_i[ik]; jk < C_tmp_diag_i[ik+1]; jk++) |
3591: { |
3592: jcol = C_tmp_diag_j[jk]; |
3593: C_diag_j[nnz_d] = jcol; |
3594: C_diag_data[nnz_d] = C_tmp_diag_data[jk]; |
3595: B_marker[jcol] = nnz_d; |
3596: nnz_d++; |
3597: } |
3598: for (jk = C_tmp_offd_i[ik]; jk < C_tmp_offd_i[ik+1]; jk++) |
3599: { |
3600: jcol = C_tmp_offd_j[jk]; |
3601: C_offd_j[nnz_o] = jcol; |
3602: C_offd_data[nnz_o] = C_tmp_offd_data[jk]; |
3603: B_marker_offd[jcol] = nnz_o; |
3604: nnz_o++; |
3605: } |
3606: for (jk = 0; jk < num_sends_A; jk++) |
3607: for (j1 = send_map_starts_A[jk]; j1 < send_map_starts_A[jk+1]; j1++) |
3608: if (send_map_elmts_A[j1] == ik) |
3609: { |
3610: for (j2 = C_ext_diag_i[j1]; j2 < C_ext_diag_i[j1+1]; j2++) |
3611: { |
3612: jcol = C_ext_diag_j[j2]; |
3613: if (B_marker[jcol] < C_diag_i[ik]) |
3614: { |
3615: C_diag_j[nnz_d] = jcol; |
3616: C_diag_data[nnz_d] = C_ext_diag_data[j2]; |
3617: B_marker[jcol] = nnz_d; |
3618: nnz_d++; |
3619: } |
3620: else |
3621: C_diag_data[B_marker[jcol]] += C_ext_diag_data[j2]; |
3622: } |
3623: for (j2 = C_ext_offd_i[j1]; j2 < C_ext_offd_i[j1+1]; j2++) |
3624: { |
3625: jcol = C_ext_offd_j[j2]; |
3626: if (B_marker_offd[jcol] < C_offd_i[ik]) |
3627: { |
3628: C_offd_j[nnz_o] = jcol; |
3629: C_offd_data[nnz_o] = C_ext_offd_data[j2]; |
3630: B_marker_offd[jcol] = nnz_o; |
3631: nnz_o++; |
3632: } |
3633: else |
3634: C_offd_data[B_marker_offd[jcol]] += C_ext_offd_data[j2]; |
3635: } |
3636: break; |
3637: } |
3638: } |
3639: hypre_TFree(B_marker); |
3640: hypre_TFree(B_marker_offd); |
0x14680 PUSH %RBP |
0x14681 MOV %RSP,%RBP |
0x14684 PUSH %R15 |
0x14686 PUSH %R14 |
0x14688 PUSH %R13 |
0x1468a PUSH %R12 |
0x1468c PUSH %RBX |
0x1468d SUB $0x128,%RSP |
0x14694 MOV %R9,-0x98(%RBP) |
0x1469b MOV %R8,%R15 |
0x1469e MOV %RCX,-0xf8(%RBP) |
0x146a5 MOV %RDX,%R13 |
0x146a8 MOV %RDI,%R14 |
0x146ab MOV 0xc8(%RBP),%RAX |
0x146b2 MOV %RAX,-0xc8(%RBP) |
0x146b9 MOV 0xc0(%RBP),%RAX |
0x146c0 MOV %RAX,-0xc0(%RBP) |
0x146c7 MOV 0xb8(%RBP),%RAX |
0x146ce MOV %RAX,-0x78(%RBP) |
0x146d2 MOV 0xb0(%RBP),%RAX |
0x146d9 MOV %RAX,-0x38(%RBP) |
0x146dd MOV 0xa8(%RBP),%RAX |
0x146e4 MOV %RAX,-0x50(%RBP) |
0x146e8 MOV 0xa0(%RBP),%RAX |
0x146ef MOV %RAX,-0x108(%RBP) |
0x146f6 MOV 0x98(%RBP),%RAX |
0x146fd MOV %RAX,-0xe8(%RBP) |
0x14704 MOV 0x90(%RBP),%RAX |
0x1470b MOV %RAX,-0xa8(%RBP) |
0x14712 MOV 0x88(%RBP),%RAX |
0x14719 MOV %RAX,-0x90(%RBP) |
0x14720 MOV 0x80(%RBP),%RAX |
0x14727 MOV %RAX,-0x148(%RBP) |
0x1472e MOV 0x78(%RBP),%RAX |
0x14732 MOV %RAX,-0x60(%RBP) |
0x14736 MOV 0x70(%RBP),%RAX |
0x1473a MOV %RAX,-0xd8(%RBP) |
0x14741 MOV 0x68(%RBP),%R12 |
0x14745 MOV 0x60(%RBP),%RAX |
0x14749 MOV %RAX,-0x100(%RBP) |
0x14750 MOV 0x58(%RBP),%RAX |
0x14754 MOV %RAX,-0x80(%RBP) |
0x14758 MOV 0x50(%RBP),%RAX |
0x1475c MOV %RAX,-0x118(%RBP) |
0x14763 MOV 0x48(%RBP),%RAX |
0x14767 MOV %RAX,-0x40(%RBP) |
0x1476b MOV 0x40(%RBP),%RAX |
0x1476f MOV %RAX,-0xb8(%RBP) |
0x14776 MOV 0x38(%RBP),%RAX |
0x1477a MOV %RAX,-0x110(%RBP) |
0x14781 MOV 0x30(%RBP),%RBX |
0x14785 MOV 0x28(%RBP),%RAX |
0x14789 MOV %RAX,-0xb0(%RBP) |
0x14790 MOV 0x20(%RBP),%RAX |
0x14794 MOV %RAX,-0x130(%RBP) |
0x1479b MOV 0x18(%RBP),%RAX |
0x1479f MOV %RAX,-0xe0(%RBP) |
0x147a6 MOV 0x10(%RBP),%RAX |
0x147aa MOV %RAX,-0xa0(%RBP) |
0x147b1 CALL 5500 <hypre_NumActiveThreads@plt> |
0x147b6 MOV %RAX,%RSI |
0x147b9 MOV %R13,%RAX |
0x147bc OR %RSI,%RAX |
0x147bf SHR $0x20,%RAX |
0x147c3 MOV %R14,-0xf0(%RBP) |
0x147ca MOV %R15,-0x138(%RBP) |
0x147d1 MOV %R13,-0x128(%RBP) |
0x147d8 MOV %RSI,-0x120(%RBP) |
0x147df JE 147f1 |
0x147e1 MOV %R13,%RAX |
0x147e4 CQTO |
0x147e6 IDIV %RSI |
0x147e9 MOV %RDX,%R15 |
0x147ec MOV %RAX,%R14 |
0x147ef JMP 147fe |
0x147f1 MOV %R13D,%EAX |
0x147f4 XOR %EDX,%EDX |
0x147f6 DIV %ESI |
0x147f8 MOV %EDX,%R15D |
0x147fb MOV %EAX,%R14D |
0x147fe MOV %RBX,%R13 |
0x14801 CALL 50d0 <hypre_GetThreadNum@plt> |
0x14806 MOV %RAX,%RCX |
0x14809 INC %RAX |
0x1480c CMP %R15,%RCX |
0x1480f MOV %RCX,-0xd0(%RBP) |
0x14816 JGE 14829 |
0x14818 INC %R14 |
0x1481b IMUL %R14,%RCX |
0x1481f MOV %RCX,-0x58(%RBP) |
0x14823 IMUL %R14,%RAX |
0x14827 JMP 1483b |
0x14829 IMUL %R14,%RCX |
0x1482d ADD %R15,%RCX |
0x14830 MOV %RCX,-0x58(%RBP) |
0x14834 IMUL %R14,%RAX |
0x14838 ADD %R15,%RAX |
0x1483b MOV %RAX,-0x70(%RBP) |
0x1483f MOV $0x8,%ESI |
0x14844 MOV -0xf8(%RBP),%R14 |
0x1484b MOV %R14,%RDI |
0x1484e CALL 55c0 <hypre_CAlloc@plt> |
0x14853 MOV %RAX,%RBX |
0x14856 MOV -0x78(%RBP),%RAX |
0x1485a MOV (%RAX),%RDI |
0x1485d MOV $0x8,%ESI |
0x14862 CALL 55c0 <hypre_CAlloc@plt> |
0x14867 MOV %RAX,%R15 |
0x1486a TEST %R14,%R14 |
0x1486d JLE 14884 |
0x1486f LEA (,%R14,8),%RDX |
0x14877 MOV %RBX,%RDI |
0x1487a MOV $0xff,%ESI |
0x1487f CALL 51d0 <__intel_avx_rep_memset@plt> |
0x14884 MOV -0x78(%RBP),%RDX |
0x14888 CMPQ $0,(%RDX) |
0x1488c MOV -0x70(%RBP),%RCX |
0x14890 JLE 148b0 |
0x14892 XOR %EAX,%EAX |
0x14894 NOPW %CS:(%RAX,%RAX,1) |
(364) 0x148a0 MOVQ $-0x1,(%R15,%RAX,8) |
(364) 0x148a8 INC %RAX |
(364) 0x148ab CMP (%RDX),%RAX |
(364) 0x148ae JL 148a0 |
0x148b0 CMP %RCX,-0x58(%RBP) |
0x148b4 MOV -0x60(%RBP),%R8 |
0x148b8 MOV %R12,-0x140(%RBP) |
0x148bf MOV -0x40(%RBP),%R14 |
0x148c3 MOV %R13,-0x68(%RBP) |
0x148c7 MOV -0x38(%RBP),%R13 |
0x148cb MOV %RBX,-0x30(%RBP) |
0x148cf MOV %R15,-0x88(%RBP) |
0x148d6 JGE 14c09 |
0x148dc XOR %EAX,%EAX |
0x148de MOV -0x58(%RBP),%RDX |
0x148e2 XOR %ECX,%ECX |
0x148e4 JMP 1491a |
0x148e6 NOPW %CS:(%RAX,%RAX,1) |
(355) 0x148f0 MOV -0xc0(%RBP),%RDX |
(355) 0x148f7 MOV -0xd0(%RBP),%RSI |
(355) 0x148fe MOV %RCX,(%RDX,%RSI,8) |
(355) 0x14902 MOV -0xc8(%RBP),%RDX |
(355) 0x14909 MOV %RAX,(%RDX,%RSI,8) |
(355) 0x1490d MOV %R11,%RDX |
(355) 0x14910 CMP -0x70(%RBP),%R11 |
(355) 0x14914 JGE 14c09 |
(355) 0x1491a MOV -0x80(%RBP),%RDI |
(355) 0x1491e MOV (%RDI,%RDX,8),%RSI |
(355) 0x14922 LEA 0x1(%RDX),%R11 |
(355) 0x14926 CMP 0x8(%RDI,%RDX,8),%RSI |
(355) 0x1492b JGE 14954 |
(355) 0x1492d MOV -0x100(%RBP),%R9 |
(355) 0x14934 MOV -0x80(%RBP),%R10 |
(355) 0x14938 NOPL (%RAX,%RAX,1) |
(363) 0x14940 MOV (%R9,%RSI,8),%RDI |
(363) 0x14944 MOV %RDX,(%RBX,%RDI,8) |
(363) 0x14948 INC %RCX |
(363) 0x1494b INC %RSI |
(363) 0x1494e CMP (%R10,%R11,8),%RSI |
(363) 0x14952 JL 14940 |
(355) 0x14954 MOV -0xd8(%RBP),%RDI |
(355) 0x1495b MOV (%RDI,%RDX,8),%RSI |
(355) 0x1495f CMP (%RDI,%R11,8),%RSI |
(355) 0x14963 JGE 1498b |
(355) 0x14965 NOPW %CS:(%RAX,%RAX,1) |
(362) 0x14970 MOV (%R8,%RSI,8),%RDI |
(362) 0x14974 MOV %RDX,(%R15,%RDI,8) |
(362) 0x14978 INC %RAX |
(362) 0x1497b INC %RSI |
(362) 0x1497e MOV -0xd8(%RBP),%RDI |
(362) 0x14985 CMP (%RDI,%R11,8),%RSI |
(362) 0x14989 JL 14970 |
(355) 0x1498b TEST %R13,%R13 |
(355) 0x1498e JLE 148f0 |
(355) 0x14994 VPBROADCASTQ %RDX,%YMM0 |
(355) 0x1499a XOR %EDI,%EDI |
(355) 0x1499c MOV %R11,-0x48(%RBP) |
(355) 0x149a0 JMP 149d0 |
(356) 0x149a2 MOV %R12,%R13 |
(356) 0x149a5 MOV %R15,%R14 |
(356) 0x149a8 MOV -0x60(%RBP),%R8 |
(356) 0x149ac MOV -0x30(%RBP),%RBX |
(356) 0x149b0 MOV -0x88(%RBP),%R15 |
(356) 0x149b7 NOPW (%RAX,%RAX,1) |
(356) 0x149c0 MOV -0x48(%RBP),%R11 |
(356) 0x149c4 INC %RDI |
(356) 0x149c7 CMP %R13,%RDI |
(356) 0x149ca JE 148f0 |
(356) 0x149d0 MOV -0x108(%RBP),%RSI |
(356) 0x149d7 MOV (%RSI,%RDI,8),%R10 |
(356) 0x149db MOV 0x8(%RSI,%RDI,8),%R9 |
(356) 0x149e0 MOV %R9,%R11 |
(356) 0x149e3 SUB %R10,%R11 |
(356) 0x149e6 JLE 149c0 |
(356) 0x149e8 MOV %R14,%R15 |
(356) 0x149eb MOV %R13,%R12 |
(356) 0x149ee MOV -0x50(%RBP),%RSI |
(356) 0x149f2 LEA (%RSI,%R10,8),%ESI |
(356) 0x149f6 AND $0x7f,%ESI |
(356) 0x149f9 MOV $0x80,%EBX |
(356) 0x149fe SUB %ESI,%EBX |
(356) 0x14a00 SHR $0x3,%EBX |
(356) 0x14a03 CMP %RBX,%R11 |
(356) 0x14a06 MOV %RBX,%RSI |
(356) 0x14a09 CMOVB %R11,%RSI |
(356) 0x14a0d TEST %RSI,%RSI |
(356) 0x14a10 JE 14a37 |
(356) 0x14a12 MOV %R10,%R8 |
(356) 0x14a15 MOV %RSI,%R14 |
(356) 0x14a18 NOPL (%RAX,%RAX,1) |
(361) 0x14a20 MOV -0x50(%RBP),%R13 |
(361) 0x14a24 CMP %RDX,(%R13,%R8,8) |
(361) 0x14a29 JE 14ae7 |
(361) 0x14a2f INC %R8 |
(361) 0x14a32 DEC %R14 |
(361) 0x14a35 JNE 14a20 |
(356) 0x14a37 CMP %RBX,%R11 |
(356) 0x14a3a JBE 149a2 |
(356) 0x14a40 SUB %RSI,%R11 |
(356) 0x14a43 MOV %R11,%RBX |
(356) 0x14a46 AND $-0x10,%RBX |
(356) 0x14a4a MOV -0x88(%RBP),%R15 |
(356) 0x14a51 JE 14aa6 |
(356) 0x14a53 LEA -0x1(%RBX),%R13 |
(356) 0x14a57 LEA (%R10,%RSI,1),%R8 |
(356) 0x14a5b MOV -0x50(%RBP),%R14 |
(356) 0x14a5f LEA (%R14,%R8,8),%R14 |
(356) 0x14a63 XOR %R12D,%R12D |
(356) 0x14a66 NOPW %CS:(%RAX,%RAX,1) |
(360) 0x14a70 VPCMPEQQ 0x20(%R14,%R12,8),%YMM0,%K0 |
(360) 0x14a78 VPCMPEQQ (%R14,%R12,8),%YMM0,%K1 |
(360) 0x14a7f VPCMPEQQ 0x60(%R14,%R12,8),%YMM0,%K2 |
(360) 0x14a87 VPCMPEQQ 0x40(%R14,%R12,8),%YMM0,%K3 |
(360) 0x14a8f KORB %K2,%K3,%K4 |
(360) 0x14a93 KORB %K0,%K1,%K5 |
(360) 0x14a97 KORTESTB %K4,%K5 |
(360) 0x14a9b JNE 14b13 |
(360) 0x14a9d ADD $0x10,%R12 |
(360) 0x14aa1 CMP %R13,%R12 |
(360) 0x14aa4 JBE 14a70 |
(356) 0x14aa6 CMP %R11,%RBX |
(356) 0x14aa9 JAE 14afe |
(356) 0x14aab ADD %RSI,%R10 |
(356) 0x14aae ADD %RBX,%R10 |
(356) 0x14ab1 MOV %R10,%R8 |
(356) 0x14ab4 MOV -0x38(%RBP),%R13 |
(356) 0x14ab8 MOV -0x40(%RBP),%R14 |
(356) 0x14abc MOV -0x68(%RBP),%R11 |
(356) 0x14ac0 MOV -0x30(%RBP),%RBX |
(356) 0x14ac4 NOPW %CS:(%RAX,%RAX,1) |
(359) 0x14ad0 MOV -0x50(%RBP),%RSI |
(359) 0x14ad4 CMP %RDX,(%RSI,%R8,8) |
(359) 0x14ad8 JE 14b4e |
(359) 0x14ada INC %R8 |
(359) 0x14add CMP %R8,%R9 |
(359) 0x14ae0 JNE 14ad0 |
(356) 0x14ae2 JMP 14bf7 |
(356) 0x14ae7 MOV -0x68(%RBP),%R11 |
(356) 0x14aeb MOV -0x30(%RBP),%RBX |
(356) 0x14aef MOV %R12,%R13 |
(356) 0x14af2 MOV -0x88(%RBP),%R10 |
(356) 0x14af9 MOV %R15,%R14 |
(356) 0x14afc JMP 14b60 |
(356) 0x14afe MOV -0x38(%RBP),%R13 |
(356) 0x14b02 MOV -0x60(%RBP),%R8 |
(356) 0x14b06 MOV -0x40(%RBP),%R14 |
(356) 0x14b0a MOV -0x30(%RBP),%RBX |
(356) 0x14b0e JMP 149c0 |
(356) 0x14b13 MOV %R15,%R10 |
(356) 0x14b16 KSHIFTLB $0x4,%K0,%K0 |
(356) 0x14b1c KORB %K0,%K1,%K0 |
(356) 0x14b20 KSHIFTLB $0x4,%K2,%K1 |
(356) 0x14b26 KORB %K1,%K3,%K1 |
(356) 0x14b2a KUNPCKBW %K0,%K1,%K0 |
(356) 0x14b2e KMOVD %K0,%ESI |
(356) 0x14b32 TZCNT %ESI,%ESI |
(356) 0x14b36 ADD %R12,%R8 |
(356) 0x14b39 ADD %RSI,%R8 |
(356) 0x14b3c MOV -0x38(%RBP),%R13 |
(356) 0x14b40 MOV -0x40(%RBP),%R14 |
(356) 0x14b44 MOV -0x68(%RBP),%R11 |
(356) 0x14b48 MOV -0x30(%RBP),%RBX |
(356) 0x14b4c JMP 14b60 |
(356) 0x14b4e MOV %R15,%R10 |
(356) 0x14b51 NOPW %CS:(%RAX,%RAX,1) |
(356) 0x14b60 MOV -0xb0(%RBP),%R9 |
(356) 0x14b67 MOV (%R9,%R8,8),%RSI |
(356) 0x14b6b MOV 0x8(%R9,%R8,8),%R9 |
(356) 0x14b70 MOV %R10,%R15 |
(356) 0x14b73 JMP 14b83 |
0x14b75 NOPW %CS:(%RAX,%RAX,1) |
(358) 0x14b80 INC %RSI |
(358) 0x14b83 CMP %R9,%RSI |
(358) 0x14b86 JGE 14bb0 |
(358) 0x14b88 MOV (%R11,%RSI,8),%R10 |
(358) 0x14b8c CMP %RDX,(%RBX,%R10,8) |
(358) 0x14b90 JGE 14b80 |
(358) 0x14b92 MOV %RDX,(%RBX,%R10,8) |
(358) 0x14b96 INC %RCX |
(358) 0x14b99 MOV -0xb0(%RBP),%R9 |
(358) 0x14ba0 MOV 0x8(%R9,%R8,8),%R9 |
(358) 0x14ba5 JMP 14b80 |
0x14ba7 NOPW (%RAX,%RAX,1) |
(356) 0x14bb0 MOV -0xb8(%RBP),%R9 |
(356) 0x14bb7 MOV (%R9,%R8,8),%RSI |
(356) 0x14bbb MOV 0x8(%R9,%R8,8),%R9 |
(356) 0x14bc0 CMP %R9,%RSI |
(356) 0x14bc3 JGE 14bf7 |
(356) 0x14bc5 MOV -0x48(%RBP),%R11 |
(356) 0x14bc9 JMP 14bd8 |
0x14bcb NOPL (%RAX,%RAX,1) |
(357) 0x14bd0 INC %RSI |
(357) 0x14bd3 CMP %R9,%RSI |
(357) 0x14bd6 JGE 14c00 |
(357) 0x14bd8 MOV (%R14,%RSI,8),%R10 |
(357) 0x14bdc CMP %RDX,(%R15,%R10,8) |
(357) 0x14be0 JGE 14bd0 |
(357) 0x14be2 MOV %RDX,(%R15,%R10,8) |
(357) 0x14be6 INC %RAX |
(357) 0x14be9 MOV -0xb8(%RBP),%R9 |
(357) 0x14bf0 MOV 0x8(%R9,%R8,8),%R9 |
(357) 0x14bf5 JMP 14bd0 |
(356) 0x14bf7 MOV -0x60(%RBP),%R8 |
(356) 0x14bfb JMP 149c0 |
(356) 0x14c00 MOV -0x60(%RBP),%R8 |
(356) 0x14c04 JMP 149c4 |
0x14c09 MOV -0xf0(%RBP),%R14 |
0x14c10 MOV (%R14),%ESI |
0x14c13 LEA 0xd8a6(%RIP),%RDI |
0x14c1a VZEROUPPER |
0x14c1d CALL 55e0 <__kmpc_barrier@plt> |
0x14c22 CMPQ $0,-0xd0(%RBP) |
0x14c2a MOV -0x58(%RBP),%R12 |
0x14c2e JNE 14f36 |
0x14c34 MOV -0x120(%RBP),%R8 |
0x14c3b CMP $0x2,%R8 |
0x14c3f MOV -0xc8(%RBP),%R10 |
0x14c46 MOV -0xc0(%RBP),%R11 |
0x14c4d JL 14e6c |
0x14c53 LEA -0x1(%R8),%RAX |
0x14c57 LEA (%R10,%R8,8),%RCX |
0x14c5b CMP %R11,%RCX |
0x14c5e JBE 14cc1 |
0x14c60 LEA (%R11,%R8,8),%RCX |
0x14c64 CMP %R10,%RCX |
0x14c67 JBE 14cc1 |
0x14c69 LEA (%R11,%RAX,8),%RCX |
0x14c6d CMP %R10,%RCX |
0x14c70 JB 14dc1 |
0x14c76 LEA (%R10,%RAX,8),%RCX |
0x14c7a CMP %R11,%RCX |
0x14c7d JB 14dc1 |
0x14c83 MOV $0x1,%EAX |
0x14c88 NOPL (%RAX,%RAX,1) |
(354) 0x14c90 MOV -0x8(%R11,%RAX,8),%RCX |
(354) 0x14c95 LEA (%R11,%RAX,8),%RDX |
(354) 0x14c99 MOV (%RDX),%RSI |
(354) 0x14c9c ADD %RCX,%RSI |
(354) 0x14c9f MOV %RSI,(%RDX) |
(354) 0x14ca2 MOV -0x8(%R10,%RAX,8),%RCX |
(354) 0x14ca7 LEA (%R10,%RAX,8),%RDX |
(354) 0x14cab MOV (%RDX),%RSI |
(354) 0x14cae ADD %RCX,%RSI |
(354) 0x14cb1 MOV %RSI,(%RDX) |
(354) 0x14cb4 INC %RAX |
(354) 0x14cb7 CMP %RAX,%R8 |
(354) 0x14cba JNE 14c90 |
0x14cbc JMP 14e6c |
0x14cc1 MOV (%R11),%RCX |
0x14cc4 MOV (%R10),%RDX |
0x14cc7 LEA (%R11,%RAX,8),%RSI |
0x14ccb LEA 0x8(%R10),%RDI |
0x14ccf CMP %RDI,%RSI |
0x14cd2 JB 14d11 |
0x14cd4 LEA 0x8(%R11),%RSI |
0x14cd8 LEA (%R10,%RAX,8),%RDI |
0x14cdc CMP %RSI,%RDI |
0x14cdf JB 14d11 |
0x14ce1 MOV $0x1,%EAX |
0x14ce6 NOPW %CS:(%RAX,%RAX,1) |
(351) 0x14cf0 LEA (%R11,%RAX,8),%RSI |
(351) 0x14cf4 ADD (%RSI),%RCX |
(351) 0x14cf7 MOV %RCX,(%RSI) |
(351) 0x14cfa LEA (%R10,%RAX,8),%RSI |
(351) 0x14cfe ADD (%RSI),%RDX |
(351) 0x14d01 MOV %RDX,(%RSI) |
(351) 0x14d04 INC %RAX |
(351) 0x14d07 CMP %RAX,%R8 |
(351) 0x14d0a JNE 14cf0 |
0x14d0c JMP 14e6c |
0x14d11 MOV %R8,%RBX |
0x14d14 CMP $0x5,%R8 |
0x14d18 JB 14d7d |
0x14d1a MOV %RAX,%RSI |
0x14d1d SHR $0x2,%RSI |
0x14d21 MOV $0x20,%EDI |
0x14d26 NOPW %CS:(%RAX,%RAX,1) |
(350) 0x14d30 LEA (%R11,%RDI,1),%R8 |
(350) 0x14d34 ADD -0x18(%R8),%RCX |
(350) 0x14d38 MOV %RCX,-0x18(%R8) |
(350) 0x14d3c LEA (%R10,%RDI,1),%R9 |
(350) 0x14d40 ADD -0x18(%R9),%RDX |
(350) 0x14d44 MOV %RDX,-0x18(%R9) |
(350) 0x14d48 ADD -0x10(%R8),%RCX |
(350) 0x14d4c MOV %RCX,-0x10(%R8) |
(350) 0x14d50 ADD -0x10(%R9),%RDX |
(350) 0x14d54 MOV %RDX,-0x10(%R9) |
(350) 0x14d58 ADD -0x8(%R8),%RCX |
(350) 0x14d5c MOV %RCX,-0x8(%R8) |
(350) 0x14d60 ADD -0x8(%R9),%RDX |
(350) 0x14d64 MOV %RDX,-0x8(%R9) |
(350) 0x14d68 ADD (%R8),%RCX |
(350) 0x14d6b MOV %RCX,(%R8) |
(350) 0x14d6e ADD (%R9),%RDX |
(350) 0x14d71 MOV %RDX,(%R9) |
(350) 0x14d74 ADD $0x20,%RDI |
(350) 0x14d78 DEC %RSI |
(350) 0x14d7b JNE 14d30 |
0x14d7d MOV %RAX,%RSI |
0x14d80 AND $-0x4,%RSI |
0x14d84 CMP %RAX,%RSI |
0x14d87 MOV %RBX,%R8 |
0x14d8a JAE 14e6c |
0x14d90 INC %RSI |
0x14d93 NOPW %CS:(%RAX,%RAX,1) |
(349) 0x14da0 LEA (%R11,%RSI,8),%RAX |
(349) 0x14da4 ADD (%RAX),%RCX |
(349) 0x14da7 MOV %RCX,(%RAX) |
(349) 0x14daa LEA (%R10,%RSI,8),%RAX |
(349) 0x14dae ADD (%RAX),%RDX |
(349) 0x14db1 MOV %RDX,(%RAX) |
(349) 0x14db4 INC %RSI |
(349) 0x14db7 CMP %RSI,%R8 |
(349) 0x14dba JNE 14da0 |
0x14dbc JMP 14e6c |
0x14dc1 MOV %R8,%RBX |
0x14dc4 CMP $0x5,%R8 |
0x14dc8 JB 14e2d |
0x14dca MOV %RAX,%RCX |
0x14dcd SHR $0x2,%RCX |
0x14dd1 MOV (%R11),%RDX |
0x14dd4 MOV (%R10),%RSI |
0x14dd7 MOV $0x20,%EDI |
0x14ddc NOPL (%RAX) |
(353) 0x14de0 LEA (%R11,%RDI,1),%R8 |
(353) 0x14de4 ADD -0x18(%R8),%RDX |
(353) 0x14de8 MOV %RDX,-0x18(%R8) |
(353) 0x14dec LEA (%R10,%RDI,1),%R9 |
(353) 0x14df0 ADD -0x18(%R9),%RSI |
(353) 0x14df4 MOV %RSI,-0x18(%R9) |
(353) 0x14df8 ADD -0x10(%R8),%RDX |
(353) 0x14dfc MOV %RDX,-0x10(%R8) |
(353) 0x14e00 ADD -0x10(%R9),%RSI |
(353) 0x14e04 MOV %RSI,-0x10(%R9) |
(353) 0x14e08 ADD -0x8(%R8),%RDX |
(353) 0x14e0c MOV %RDX,-0x8(%R8) |
(353) 0x14e10 ADD -0x8(%R9),%RSI |
(353) 0x14e14 MOV %RSI,-0x8(%R9) |
(353) 0x14e18 ADD (%R8),%RDX |
(353) 0x14e1b MOV %RDX,(%R8) |
(353) 0x14e1e ADD (%R9),%RSI |
(353) 0x14e21 MOV %RSI,(%R9) |
(353) 0x14e24 ADD $0x20,%RDI |
(353) 0x14e28 DEC %RCX |
(353) 0x14e2b JNE 14de0 |
0x14e2d MOV %RAX,%RCX |
0x14e30 AND $-0x4,%RCX |
0x14e34 CMP %RAX,%RCX |
0x14e37 MOV %RBX,%R8 |
0x14e3a JAE 14e6c |
0x14e3c MOV (%R11,%RCX,8),%RAX |
0x14e40 MOV (%R10,%RCX,8),%RDX |
0x14e44 INC %RCX |
0x14e47 NOPW (%RAX,%RAX,1) |
(352) 0x14e50 LEA (%R11,%RCX,8),%RSI |
(352) 0x14e54 ADD (%RSI),%RAX |
(352) 0x14e57 MOV %RAX,(%RSI) |
(352) 0x14e5a LEA (%R10,%RCX,8),%RSI |
(352) 0x14e5e ADD (%RSI),%RDX |
(352) 0x14e61 MOV %RDX,(%RSI) |
(352) 0x14e64 INC %RCX |
(352) 0x14e67 CMP %RCX,%R8 |
(352) 0x14e6a JNE 14e50 |
0x14e6c MOV -0x8(%R11,%R8,8),%RDX |
0x14e71 MOV -0x8(%R10,%R8,8),%RCX |
0x14e76 MOV %RCX,-0x48(%RBP) |
0x14e7a MOV -0x128(%RBP),%RBX |
0x14e81 MOV -0xa0(%RBP),%RAX |
0x14e88 MOV %RDX,(%RAX,%RBX,8) |
0x14e8c MOV -0xa8(%RBP),%RAX |
0x14e93 MOV %RCX,(%RAX,%RBX,8) |
0x14e97 MOV %RBX,%RDI |
0x14e9a MOV %RBX,%RSI |
0x14e9d CALL 5670 <hypre_CSRMatrixCreate@plt> |
0x14ea2 MOV -0x138(%RBP),%R14 |
0x14ea9 MOV %RAX,(%R14) |
0x14eac MOV -0x78(%RBP),%RAX |
0x14eb0 MOV (%RAX),%RSI |
0x14eb3 MOV %RBX,%RDI |
0x14eb6 MOV -0x48(%RBP),%RDX |
0x14eba CALL 5670 <hypre_CSRMatrixCreate@plt> |
0x14ebf MOV -0x130(%RBP),%RBX |
0x14ec6 MOV %RAX,(%RBX) |
0x14ec9 MOV (%R14),%RDI |
0x14ecc MOV -0xa0(%RBP),%RAX |
0x14ed3 MOV %RAX,(%RDI) |
0x14ed6 CALL 53c0 <hypre_CSRMatrixInitialize@plt> |
0x14edb MOV (%R14),%RAX |
0x14ede MOV 0x8(%RAX),%RCX |
0x14ee2 MOV -0xe0(%RBP),%RDX |
0x14ee9 MOV %RCX,(%RDX) |
0x14eec MOV 0x30(%RAX),%RAX |
0x14ef0 MOV -0x98(%RBP),%RCX |
0x14ef7 MOV %RAX,(%RCX) |
0x14efa MOV (%RBX),%RDI |
0x14efd MOV -0xa8(%RBP),%RAX |
0x14f04 MOV %RAX,(%RDI) |
0x14f07 CALL 53c0 <hypre_CSRMatrixInitialize@plt> |
0x14f0c MOV (%RBX),%RAX |
0x14f0f MOV 0x8(%RAX),%RCX |
0x14f13 MOV -0xe8(%RBP),%RDX |
0x14f1a MOV %RCX,(%RDX) |
0x14f1d MOV 0x30(%RAX),%RAX |
0x14f21 MOV -0x90(%RBP),%RCX |
0x14f28 MOV %RAX,(%RCX) |
0x14f2b MOV -0x30(%RBP),%RBX |
0x14f2f MOV -0xf0(%RBP),%R14 |
0x14f36 MOV (%R14),%ESI |
0x14f39 LEA 0xd5a0(%RIP),%RDI |
0x14f40 CALL 55e0 <__kmpc_barrier@plt> |
0x14f45 MOV -0xf8(%RBP),%RDX |
0x14f4c TEST %RDX,%RDX |
0x14f4f JLE 14f62 |
0x14f51 SAL $0x3,%RDX |
0x14f55 MOV %RBX,%RDI |
0x14f58 MOV $0xff,%ESI |
0x14f5d CALL 51d0 <__intel_avx_rep_memset@plt> |
0x14f62 MOV -0x78(%RBP),%RCX |
0x14f66 CMPQ $0,(%RCX) |
0x14f6a MOV -0xd0(%RBP),%RSI |
0x14f71 JLE 14f90 |
0x14f73 XOR %EAX,%EAX |
0x14f75 NOPW %CS:(%RAX,%RAX,1) |
(348) 0x14f80 MOVQ $-0x1,(%R15,%RAX,8) |
(348) 0x14f88 INC %RAX |
(348) 0x14f8b CMP (%RCX),%RAX |
(348) 0x14f8e JL 14f80 |
0x14f90 TEST %RSI,%RSI |
0x14f93 MOV -0x70(%RBP),%RDX |
0x14f97 JE 14fb3 |
0x14f99 MOV -0xc0(%RBP),%RAX |
0x14fa0 MOV -0x8(%RAX,%RSI,8),%RAX |
0x14fa5 MOV -0xc8(%RBP),%RCX |
0x14fac MOV -0x8(%RCX,%RSI,8),%RCX |
0x14fb1 JMP 14fcc |
0x14fb3 XOR %EAX,%EAX |
0x14fb5 XOR %ECX,%ECX |
0x14fb7 JMP 14fcc |
0x14fb9 NOPL (%RAX) |
(339) 0x14fc0 MOV -0x30(%RBP),%RBX |
(339) 0x14fc4 MOV -0x70(%RBP),%RDX |
(339) 0x14fc8 MOV -0x58(%RBP),%R12 |
(339) 0x14fcc CMP %RDX,%R12 |
(339) 0x14fcf JGE 15378 |
(339) 0x14fd5 MOV %R12,%RDX |
(339) 0x14fd8 MOV -0xa0(%RBP),%RSI |
(339) 0x14fdf MOV %RAX,(%RSI,%R12,8) |
(339) 0x14fe3 MOV -0xa8(%RBP),%RSI |
(339) 0x14fea MOV %RCX,(%RSI,%R12,8) |
(339) 0x14fee MOV -0x80(%RBP),%RDI |
(339) 0x14ff2 MOV (%RDI,%R12,8),%RSI |
(339) 0x14ff6 LEA 0x1(%R12),%RBX |
(339) 0x14ffb CMP 0x8(%RDI,%R12,8),%RSI |
(339) 0x15000 JGE 15054 |
(339) 0x15002 MOV -0xe0(%RBP),%RDI |
(339) 0x15009 MOV (%RDI),%RDI |
(339) 0x1500c MOV -0x98(%RBP),%R8 |
(339) 0x15013 MOV (%R8),%R8 |
(339) 0x15016 MOV -0x100(%RBP),%R10 |
(339) 0x1501d MOV -0x80(%RBP),%R11 |
(339) 0x15021 MOV -0x30(%RBP),%R14 |
(339) 0x15025 MOV -0x140(%RBP),%R15 |
(339) 0x1502c NOPL (%RAX) |
(347) 0x15030 MOV (%R10,%RSI,8),%R9 |
(347) 0x15034 MOV %R9,(%RDI,%RAX,8) |
(347) 0x15038 VMOVQ (%R15,%RSI,8),%XMM0 |
(347) 0x1503e VMOVQ %XMM0,(%R8,%RAX,8) |
(347) 0x15044 MOV %RAX,(%R14,%R9,8) |
(347) 0x15048 INC %RAX |
(347) 0x1504b INC %RSI |
(347) 0x1504e CMP (%R11,%RBX,8),%RSI |
(347) 0x15052 JL 15030 |
(339) 0x15054 MOV -0xd8(%RBP),%R12 |
(339) 0x1505b MOV (%R12,%RDX,8),%RSI |
(339) 0x1505f MOV %RBX,-0x58(%RBP) |
(339) 0x15063 CMP (%R12,%RBX,8),%RSI |
(339) 0x15067 MOV -0x88(%RBP),%R15 |
(339) 0x1506e JGE 150c4 |
(339) 0x15070 MOV -0xe8(%RBP),%RDI |
(339) 0x15077 MOV (%RDI),%RDI |
(339) 0x1507a MOV -0x90(%RBP),%R8 |
(339) 0x15081 MOV (%R8),%R8 |
(339) 0x15084 MOV -0x148(%RBP),%R10 |
(339) 0x1508b MOV -0x60(%RBP),%R11 |
(339) 0x1508f MOV -0x58(%RBP),%RBX |
(339) 0x15093 NOPW %CS:(%RAX,%RAX,1) |
(346) 0x150a0 MOV (%R11,%RSI,8),%R9 |
(346) 0x150a4 MOV %R9,(%RDI,%RCX,8) |
(346) 0x150a8 VMOVQ (%R10,%RSI,8),%XMM0 |
(346) 0x150ae VMOVQ %XMM0,(%R8,%RCX,8) |
(346) 0x150b4 MOV %RCX,(%R15,%R9,8) |
(346) 0x150b8 INC %RCX |
(346) 0x150bb INC %RSI |
(346) 0x150be CMP (%R12,%RBX,8),%RSI |
(346) 0x150c2 JL 150a0 |
(339) 0x150c4 TEST %R13,%R13 |
(339) 0x150c7 JLE 14fc0 |
(339) 0x150cd VPBROADCASTQ %RDX,%YMM0 |
(339) 0x150d3 XOR %ESI,%ESI |
(339) 0x150d5 MOV -0x40(%RBP),%R12 |
(339) 0x150d9 MOV -0x30(%RBP),%RBX |
(339) 0x150dd JMP 150f3 |
(340) 0x150df MOV -0x30(%RBP),%RBX |
(340) 0x150e3 MOV -0x38(%RBP),%R13 |
(340) 0x150e7 INC %RSI |
(340) 0x150ea CMP %R13,%RSI |
(340) 0x150ed JE 14fc4 |
(340) 0x150f3 MOV -0x108(%RBP),%RDI |
(340) 0x150fa MOV (%RDI,%RSI,8),%R9 |
(340) 0x150fe MOV 0x8(%RDI,%RSI,8),%R8 |
(340) 0x15103 MOV %R8,%R10 |
(340) 0x15106 SUB %R9,%R10 |
(340) 0x15109 JLE 150e7 |
(340) 0x1510b MOV -0x50(%RBP),%RDI |
(340) 0x1510f LEA (%RDI,%R9,8),%EDI |
(340) 0x15113 AND $0x7f,%EDI |
(340) 0x15116 MOV $0x80,%EBX |
(340) 0x1511b SUB %EDI,%EBX |
(340) 0x1511d SHR $0x3,%EBX |
(340) 0x15120 CMP %RBX,%R10 |
(340) 0x15123 MOV %RBX,%R11 |
(340) 0x15126 CMOVB %R10,%R11 |
(340) 0x1512a TEST %R11,%R11 |
(340) 0x1512d JE 15157 |
(340) 0x1512f MOV %R9,%RDI |
(340) 0x15132 MOV %R11,%R14 |
(340) 0x15135 NOPW %CS:(%RAX,%RAX,1) |
(345) 0x15140 MOV -0x50(%RBP),%R13 |
(345) 0x15144 CMP %RDX,(%R13,%RDI,8) |
(345) 0x15149 JE 15223 |
(345) 0x1514f INC %RDI |
(345) 0x15152 DEC %R14 |
(345) 0x15155 JNE 15140 |
(340) 0x15157 CMP %RBX,%R10 |
(340) 0x1515a JBE 150df |
(340) 0x1515c SUB %R11,%R10 |
(340) 0x1515f MOV %R10,%RBX |
(340) 0x15162 AND $-0x10,%RBX |
(340) 0x15166 JE 151b6 |
(340) 0x15168 LEA -0x1(%RBX),%R13 |
(340) 0x1516c LEA (%R9,%R11,1),%RDI |
(340) 0x15170 MOV -0x50(%RBP),%R14 |
(340) 0x15174 LEA (%R14,%RDI,8),%R14 |
(340) 0x15178 XOR %R12D,%R12D |
(340) 0x1517b NOPL (%RAX,%RAX,1) |
(344) 0x15180 VPCMPEQQ 0x20(%R14,%R12,8),%YMM0,%K0 |
(344) 0x15188 VPCMPEQQ (%R14,%R12,8),%YMM0,%K1 |
(344) 0x1518f VPCMPEQQ 0x60(%R14,%R12,8),%YMM0,%K2 |
(344) 0x15197 VPCMPEQQ 0x40(%R14,%R12,8),%YMM0,%K3 |
(344) 0x1519f KORB %K2,%K3,%K4 |
(344) 0x151a3 KORB %K0,%K1,%K5 |
(344) 0x151a7 KORTESTB %K4,%K5 |
(344) 0x151ab JNE 151f8 |
(344) 0x151ad ADD $0x10,%R12 |
(344) 0x151b1 CMP %R13,%R12 |
(344) 0x151b4 JBE 15180 |
(340) 0x151b6 CMP %R10,%RBX |
(340) 0x151b9 JAE 151e7 |
(340) 0x151bb ADD %R11,%R9 |
(340) 0x151be ADD %RBX,%R9 |
(340) 0x151c1 MOV %R9,%RDI |
(340) 0x151c4 MOV -0x40(%RBP),%R12 |
(340) 0x151c8 MOV -0x68(%RBP),%R13 |
(340) 0x151cc MOV -0x30(%RBP),%RBX |
(343) 0x151d0 MOV -0x50(%RBP),%R9 |
(343) 0x151d4 CMP %RDX,(%R9,%RDI,8) |
(343) 0x151d8 JE 1522b |
(343) 0x151da INC %RDI |
(343) 0x151dd CMP %RDI,%R8 |
(343) 0x151e0 JNE 151d0 |
(340) 0x151e2 JMP 150e3 |
(340) 0x151e7 MOV -0x38(%RBP),%R13 |
(340) 0x151eb MOV -0x40(%RBP),%R12 |
(340) 0x151ef MOV -0x30(%RBP),%RBX |
(340) 0x151f3 JMP 150e7 |
(340) 0x151f8 KSHIFTLB $0x4,%K0,%K0 |
(340) 0x151fe KORB %K0,%K1,%K0 |
(340) 0x15202 KSHIFTLB $0x4,%K2,%K1 |
(340) 0x15208 KORB %K1,%K3,%K1 |
(340) 0x1520c KUNPCKBW %K0,%K1,%K0 |
(340) 0x15210 KMOVD %K0,%R8D |
(340) 0x15214 TZCNT %R8D,%R8D |
(340) 0x15219 ADD %R12,%RDI |
(340) 0x1521c ADD %R8,%RDI |
(340) 0x1521f MOV -0x40(%RBP),%R12 |
(340) 0x15223 MOV -0x68(%RBP),%R13 |
(340) 0x15227 MOV -0x30(%RBP),%RBX |
(340) 0x1522b MOV -0xb0(%RBP),%R9 |
(340) 0x15232 MOV (%R9,%RDI,8),%R8 |
(340) 0x15236 MOV 0x8(%R9,%RDI,8),%R9 |
(340) 0x1523b JMP 1526e |
0x1523d NOPL (%RAX) |
(342) 0x15240 MOV -0x98(%RBP),%R10 |
(342) 0x15247 MOV (%R10),%R10 |
(342) 0x1524a VMOVSD (%R10,%R11,8),%XMM1 |
(342) 0x15250 MOV -0x110(%RBP),%R13 |
(342) 0x15257 VADDSD (%R13,%R8,8),%XMM1,%XMM1 |
(342) 0x1525e MOV -0x68(%RBP),%R13 |
(342) 0x15262 VMOVSD %XMM1,(%R10,%R11,8) |
(342) 0x15268 MOV %R14,%RBX |
(342) 0x1526b INC %R8 |
(342) 0x1526e CMP %R9,%R8 |
(342) 0x15271 JGE 152d0 |
(342) 0x15273 MOV (%R13,%R8,8),%R10 |
(342) 0x15278 MOV (%RBX,%R10,8),%R11 |
(342) 0x1527c MOV %RBX,%R14 |
(342) 0x1527f MOV -0xa0(%RBP),%RBX |
(342) 0x15286 CMP (%RBX,%RDX,8),%R11 |
(342) 0x1528a JGE 15240 |
(342) 0x1528c MOV -0xe0(%RBP),%R9 |
(342) 0x15293 MOV (%R9),%R9 |
(342) 0x15296 MOV %R10,(%R9,%RAX,8) |
(342) 0x1529a MOV -0x110(%RBP),%R9 |
(342) 0x152a1 VMOVSD (%R9,%R8,8),%XMM1 |
(342) 0x152a7 MOV -0x98(%RBP),%R9 |
(342) 0x152ae MOV (%R9),%R9 |
(342) 0x152b1 VMOVSD %XMM1,(%R9,%RAX,8) |
(342) 0x152b7 MOV %RAX,(%R14,%R10,8) |
(342) 0x152bb INC %RAX |
(342) 0x152be MOV -0xb0(%RBP),%R9 |
(342) 0x152c5 MOV 0x8(%R9,%RDI,8),%R9 |
(342) 0x152ca JMP 15268 |
0x152cc NOPL (%RAX) |
(340) 0x152d0 MOV -0xb8(%RBP),%R9 |
(340) 0x152d7 MOV (%R9,%RDI,8),%R8 |
(340) 0x152db MOV 0x8(%R9,%RDI,8),%R9 |
(340) 0x152e0 CMP %R9,%R8 |
(340) 0x152e3 JGE 150e3 |
(340) 0x152e9 MOV -0x38(%RBP),%R13 |
(340) 0x152ed JMP 15323 |
0x152ef NOP |
(341) 0x152f0 MOV -0x90(%RBP),%R10 |
(341) 0x152f7 MOV (%R10),%R10 |
(341) 0x152fa VMOVSD (%R10,%R11,8),%XMM1 |
(341) 0x15300 MOV -0x118(%RBP),%R12 |
(341) 0x15307 VADDSD (%R12,%R8,8),%XMM1,%XMM1 |
(341) 0x1530d MOV -0x40(%RBP),%R12 |
(341) 0x15311 VMOVSD %XMM1,(%R10,%R11,8) |
(341) 0x15317 INC %R8 |
(341) 0x1531a CMP %R9,%R8 |
(341) 0x1531d JGE 150e7 |
(341) 0x15323 MOV (%R12,%R8,8),%R10 |
(341) 0x15327 MOV (%R15,%R10,8),%R11 |
(341) 0x1532b MOV -0xa8(%RBP),%R14 |
(341) 0x15332 CMP (%R14,%RDX,8),%R11 |
(341) 0x15336 JGE 152f0 |
(341) 0x15338 MOV -0xe8(%RBP),%R9 |
(341) 0x1533f MOV (%R9),%R9 |
(341) 0x15342 MOV %R10,(%R9,%RCX,8) |
(341) 0x15346 MOV -0x118(%RBP),%R9 |
(341) 0x1534d VMOVSD (%R9,%R8,8),%XMM1 |
(341) 0x15353 MOV -0x90(%RBP),%R9 |
(341) 0x1535a MOV (%R9),%R9 |
(341) 0x1535d VMOVSD %XMM1,(%R9,%RCX,8) |
(341) 0x15363 MOV %RCX,(%R15,%R10,8) |
(341) 0x15367 INC %RCX |
(341) 0x1536a MOV -0xb8(%RBP),%R9 |
(341) 0x15371 MOV 0x8(%R9,%RDI,8),%R9 |
(341) 0x15376 JMP 15317 |
0x15378 MOV %RBX,%RDI |
0x1537b VZEROUPPER |
0x1537e CALL 5310 <hypre_Free@plt> |
0x15383 MOV %R15,%RDI |
0x15386 ADD $0x128,%RSP |
0x1538d POP %RBX |
0x1538e POP %R12 |
0x15390 POP %R13 |
0x15392 POP %R14 |
0x15394 POP %R15 |
0x15396 POP %RBP |
0x15397 JMP 5310 |
0x1539c NOPL (%RAX) |
Path / |
Source file and lines | par_csr_matop.c:3454-3640 |
Module | libparcsr_mv.so |
nb instructions | 300 |
nb uops | 322 |
loop length | 1334 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 60 |
micro-operation queue | 53.67 cycles |
front end | 53.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 13.90 | 13.80 | 30.00 | 30.00 | 33.00 | 13.80 | 13.70 | 33.00 | 33.00 | 33.00 | 13.80 | 30.00 |
cycles | 13.90 | 16.80 | 30.00 | 30.00 | 33.00 | 13.80 | 13.70 | 33.00 | 33.00 | 33.00 | 13.80 | 30.00 |
Cycles executing div or sqrt instructions | 16.00 |
FE+BE cycles | 50.84-50.89 |
Stall cycles | 0.00 |
Front-end | 53.67 |
Dispatch | 33.00 |
DIV/SQRT | 16.00 |
Overall L1 | 53.67 |
all | 2% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 7% |
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 13% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x128,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,-0xf8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0xc8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xb8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xb0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x108(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x98(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xe8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x90(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x88(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x80(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x148(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x78(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x70(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xd8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x68(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x60(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x100(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x118(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x110(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x28(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x130(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x18(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 5500 <hypre_NumActiveThreads@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R13,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %RSI,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R14,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x138(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,-0x128(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x120(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 147f1 <hypre_ParTMatmul.extracted+0x171> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R13,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %RSI | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 147fe <hypre_ParTMatmul.extracted+0x17e> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %R13D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %ESI | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV %EDX,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %EAX,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RBX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 50d0 <hypre_GetThreadNum@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
INC %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %R15,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 14829 <hypre_ParTMatmul.extracted+0x1a9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INC %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RCX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
IMUL %R14,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JMP 1483b <hypre_ParTMatmul.extracted+0x1bb> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
IMUL %R14,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %R15,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
IMUL %R14,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %R15,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0xf8(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 55c0 <hypre_CAlloc@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x78(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 55c0 <hypre_CAlloc@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 14884 <hypre_ParTMatmul.extracted+0x204> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (,%R14,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 51d0 <__intel_avx_rep_memset@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x78(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMPQ $0,(%RDX) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV -0x70(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 148b0 <hypre_ParTMatmul.extracted+0x230> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RCX,-0x58(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV -0x60(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,-0x140(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x40(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x38(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 14c09 <hypre_ParTMatmul.extracted+0x589> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x58(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 1491a <hypre_ParTMatmul.extracted+0x29a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0xf0(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R14),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0xd8a6(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 55e0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
CMPQ $0,-0xd0(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV -0x58(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 14f36 <hypre_ParTMatmul.extracted+0x8b6> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x120(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x2,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0xc8(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xc0(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JL 14e6c <hypre_ParTMatmul.extracted+0x7ec> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%R8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R10,%R8,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R11,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JBE 14cc1 <hypre_ParTMatmul.extracted+0x641> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R11,%R8,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R10,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JBE 14cc1 <hypre_ParTMatmul.extracted+0x641> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R11,%RAX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R10,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 14dc1 <hypre_ParTMatmul.extracted+0x741> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R10,%RAX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R11,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 14dc1 <hypre_ParTMatmul.extracted+0x741> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x1,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 14e6c <hypre_ParTMatmul.extracted+0x7ec> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV (%R11),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R11,%RAX,8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x8(%R10),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDI,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 14d11 <hypre_ParTMatmul.extracted+0x691> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA 0x8(%R11),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R10,%RAX,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RSI,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 14d11 <hypre_ParTMatmul.extracted+0x691> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x1,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 14e6c <hypre_ParTMatmul.extracted+0x7ec> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R8,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP $0x5,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 14d7d <hypre_ParTMatmul.extracted+0x6fd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x2,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV $0x20,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JAE 14e6c <hypre_ParTMatmul.extracted+0x7ec> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INC %RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 14e6c <hypre_ParTMatmul.extracted+0x7ec> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R8,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP $0x5,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 14e2d <hypre_ParTMatmul.extracted+0x7ad> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x2,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV (%R11),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x20,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JAE 14e6c <hypre_ParTMatmul.extracted+0x7ec> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R11,%RCX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10,%RCX,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
INC %RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x8(%R11,%R8,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%R10,%R8,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x128(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,(%RAX,%RBX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xa8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,(%RAX,%RBX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RBX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 5670 <hypre_CSRMatrixCreate@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x138(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%R14) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x78(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x48(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 5670 <hypre_CSRMatrixCreate@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x130(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RBX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%R14),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RDI) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 53c0 <hypre_CSRMatrixInitialize@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%R14),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xe0(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,(%RDX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x98(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RBX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xa8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RDI) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 53c0 <hypre_CSRMatrixInitialize@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%RBX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xe8(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,(%RDX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x90(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x30(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xf0(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R14),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0xd5a0(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 55e0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0xf8(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 14f62 <hypre_ParTMatmul.extracted+0x8e2> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 51d0 <__intel_avx_rep_memset@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x78(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMPQ $0,(%RCX) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV -0xd0(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 14f90 <hypre_ParTMatmul.extracted+0x910> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %RSI,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV -0x70(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JE 14fb3 <hypre_ParTMatmul.extracted+0x933> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xc0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%RAX,%RSI,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xc8(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%RCX,%RSI,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 14fcc <hypre_ParTMatmul.extracted+0x94c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 14fcc <hypre_ParTMatmul.extracted+0x94c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 5310 <hypre_Free@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R15,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
ADD $0x128,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
JMP 5310 <hypre_Free@plt> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | par_csr_matop.c:3454-3640 |
Module | libparcsr_mv.so |
nb instructions | 300 |
nb uops | 322 |
loop length | 1334 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 60 |
micro-operation queue | 53.67 cycles |
front end | 53.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 13.90 | 13.80 | 30.00 | 30.00 | 33.00 | 13.80 | 13.70 | 33.00 | 33.00 | 33.00 | 13.80 | 30.00 |
cycles | 13.90 | 16.80 | 30.00 | 30.00 | 33.00 | 13.80 | 13.70 | 33.00 | 33.00 | 33.00 | 13.80 | 30.00 |
Cycles executing div or sqrt instructions | 16.00 |
FE+BE cycles | 50.84-50.89 |
Stall cycles | 0.00 |
Front-end | 53.67 |
Dispatch | 33.00 |
DIV/SQRT | 16.00 |
Overall L1 | 53.67 |
all | 2% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 7% |
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 13% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x128,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,-0xf8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0xc8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xb8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xb0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x108(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x98(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xe8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x90(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x88(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x80(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x148(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x78(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x70(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xd8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x68(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x60(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x100(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x118(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x110(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x28(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x130(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x18(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 5500 <hypre_NumActiveThreads@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R13,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %RSI,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R14,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x138(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,-0x128(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x120(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 147f1 <hypre_ParTMatmul.extracted+0x171> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R13,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %RSI | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 147fe <hypre_ParTMatmul.extracted+0x17e> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %R13D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %ESI | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV %EDX,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %EAX,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RBX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 50d0 <hypre_GetThreadNum@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
INC %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %R15,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 14829 <hypre_ParTMatmul.extracted+0x1a9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INC %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RCX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
IMUL %R14,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JMP 1483b <hypre_ParTMatmul.extracted+0x1bb> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
IMUL %R14,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %R15,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
IMUL %R14,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %R15,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0xf8(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 55c0 <hypre_CAlloc@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x78(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 55c0 <hypre_CAlloc@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 14884 <hypre_ParTMatmul.extracted+0x204> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (,%R14,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 51d0 <__intel_avx_rep_memset@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x78(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMPQ $0,(%RDX) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV -0x70(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 148b0 <hypre_ParTMatmul.extracted+0x230> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RCX,-0x58(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV -0x60(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,-0x140(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x40(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x38(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 14c09 <hypre_ParTMatmul.extracted+0x589> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x58(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 1491a <hypre_ParTMatmul.extracted+0x29a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0xf0(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R14),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0xd8a6(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 55e0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
CMPQ $0,-0xd0(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV -0x58(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 14f36 <hypre_ParTMatmul.extracted+0x8b6> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x120(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x2,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0xc8(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xc0(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JL 14e6c <hypre_ParTMatmul.extracted+0x7ec> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%R8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R10,%R8,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R11,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JBE 14cc1 <hypre_ParTMatmul.extracted+0x641> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R11,%R8,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R10,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JBE 14cc1 <hypre_ParTMatmul.extracted+0x641> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R11,%RAX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R10,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 14dc1 <hypre_ParTMatmul.extracted+0x741> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R10,%RAX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R11,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 14dc1 <hypre_ParTMatmul.extracted+0x741> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x1,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 14e6c <hypre_ParTMatmul.extracted+0x7ec> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV (%R11),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R11,%RAX,8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x8(%R10),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDI,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 14d11 <hypre_ParTMatmul.extracted+0x691> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA 0x8(%R11),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R10,%RAX,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RSI,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 14d11 <hypre_ParTMatmul.extracted+0x691> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x1,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 14e6c <hypre_ParTMatmul.extracted+0x7ec> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R8,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP $0x5,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 14d7d <hypre_ParTMatmul.extracted+0x6fd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x2,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV $0x20,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JAE 14e6c <hypre_ParTMatmul.extracted+0x7ec> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INC %RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 14e6c <hypre_ParTMatmul.extracted+0x7ec> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R8,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP $0x5,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 14e2d <hypre_ParTMatmul.extracted+0x7ad> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x2,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV (%R11),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x20,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JAE 14e6c <hypre_ParTMatmul.extracted+0x7ec> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R11,%RCX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10,%RCX,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
INC %RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x8(%R11,%R8,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%R10,%R8,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x128(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,(%RAX,%RBX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xa8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,(%RAX,%RBX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RBX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 5670 <hypre_CSRMatrixCreate@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x138(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%R14) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x78(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x48(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 5670 <hypre_CSRMatrixCreate@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x130(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RBX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%R14),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RDI) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 53c0 <hypre_CSRMatrixInitialize@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%R14),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xe0(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,(%RDX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x98(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RBX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xa8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RDI) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 53c0 <hypre_CSRMatrixInitialize@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%RBX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xe8(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,(%RDX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x90(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x30(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xf0(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R14),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0xd5a0(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 55e0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0xf8(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 14f62 <hypre_ParTMatmul.extracted+0x8e2> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 51d0 <__intel_avx_rep_memset@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x78(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMPQ $0,(%RCX) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV -0xd0(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 14f90 <hypre_ParTMatmul.extracted+0x910> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST %RSI,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV -0x70(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JE 14fb3 <hypre_ParTMatmul.extracted+0x933> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xc0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%RAX,%RSI,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xc8(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%RCX,%RSI,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 14fcc <hypre_ParTMatmul.extracted+0x94c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 14fcc <hypre_ParTMatmul.extracted+0x94c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 5310 <hypre_Free@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R15,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
ADD $0x128,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
JMP 5310 <hypre_Free@plt> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_ParTMatmul.extracted– | 0.06 | 0.01 |
○Loop 364 - par_csr_matop.c:3484-3485 - libparcsr_mv.so | 0 | 0 |
○Loop 348 - par_csr_matop.c:3571-3572 - libparcsr_mv.so | 0 | 0 |
▼Loop 339 - par_csr_matop.c:3467-3634 - libparcsr_mv.so– | 0 | 0 |
○Loop 347 - par_csr_matop.c:3590-3596 - libparcsr_mv.so | 0.01 | 0.01 |
○Loop 346 - par_csr_matop.c:3598-3604 - libparcsr_mv.so | 0 | 0 |
▼Loop 340 - par_csr_matop.c:3467-3634 - libparcsr_mv.so– | 0 | 0 |
○Loop 344 - par_csr_matop.c:3505-3608 - libparcsr_mv.so | 0.02 | 0.01 |
○Loop 345 - par_csr_matop.c:3505-3608 - libparcsr_mv.so | 0 | 0 |
○Loop 341 - par_csr_matop.c:3623-3634 - libparcsr_mv.so | 0 | 0 |
○Loop 343 - par_csr_matop.c:3505-3608 - libparcsr_mv.so | 0 | 0 |
○Loop 342 - par_csr_matop.c:3610-3621 - libparcsr_mv.so | 0 | 0 |
○Loop 351 - par_csr_matop.c:3537-3540 - libparcsr_mv.so | 0 | 0 |
○Loop 354 - par_csr_matop.c:3537-3540 - libparcsr_mv.so | 0 | 0 |
▼Loop 355 - par_csr_matop.c:3467-3528 - libparcsr_mv.so– | 0 | 0 |
○Loop 363 - par_csr_matop.c:3491-3495 - libparcsr_mv.so | 0.01 | 0.01 |
▼Loop 356 - par_csr_matop.c:3467-3522 - libparcsr_mv.so– | 0 | 0 |
○Loop 360 - par_csr_matop.c:3504-3505 - libparcsr_mv.so | 0.02 | 0.01 |
○Loop 358 - par_csr_matop.c:3507-3513 - libparcsr_mv.so | 0 | 0 |
○Loop 357 - par_csr_matop.c:3516-3522 - libparcsr_mv.so | 0 | 0 |
○Loop 359 - par_csr_matop.c:3504-3505 - libparcsr_mv.so | 0 | 0 |
○Loop 361 - par_csr_matop.c:3467-3505 - libparcsr_mv.so | 0 | 0 |
○Loop 362 - par_csr_matop.c:3497-3501 - libparcsr_mv.so | 0 | 0 |
○Loop 350 - par_csr_matop.c:3537-3540 - libparcsr_mv.so | 0 | 0 |
○Loop 353 - par_csr_matop.c:3537-3540 - libparcsr_mv.so | 0 | 0 |
○Loop 349 - par_csr_matop.c:3537-3540 - libparcsr_mv.so | 0 | 0 |
○Loop 352 - par_csr_matop.c:3537-3540 - libparcsr_mv.so | 0 | 0 |