Function: hypre_ParTMatmul.extracted | Module: exec | Source: par_csr_matop.c:3454-3640 [...] | Coverage: 0.06% |
---|
Function: hypre_ParTMatmul.extracted | Module: exec | Source: par_csr_matop.c:3454-3640 [...] | Coverage: 0.06% |
---|
/scratch_na/users/xoserete/qaas_runs/171-172-8218/intel/AMG/build/AMG/AMG/parcsr_mv/par_csr_matop.c: 3454 - 3640 |
-------------------------------------------------------------------------------- |
3454: #pragma omp parallel |
[...] |
3462: HYPRE_Int num_threads = hypre_NumActiveThreads(); |
3463: |
3464: size = num_cols_diag_A/num_threads; |
3465: rest = num_cols_diag_A - size*num_threads; |
3466: ii = hypre_GetThreadNum(); |
3467: if (ii < rest) |
3468: { |
3469: ns = ii*size+ii; |
3470: ne = (ii+1)*size+ii+1; |
3471: } |
3472: else |
3473: { |
3474: ns = ii*size+rest; |
3475: ne = (ii+1)*size+rest; |
3476: } |
3477: |
3478: B_marker = hypre_CTAlloc(HYPRE_Int, num_cols_diag_B); |
3479: B_marker_offd = hypre_CTAlloc(HYPRE_Int, num_cols_offd_C); |
3480: |
3481: for (ik = 0; ik < num_cols_diag_B; ik++) |
3482: B_marker[ik] = -1; |
3483: |
3484: for (ik = 0; ik < num_cols_offd_C; ik++) |
3485: B_marker_offd[ik] = -1; |
3486: |
3487: nnz_d = 0; |
3488: nnz_o = 0; |
3489: for (ik = ns; ik < ne; ik++) |
3490: { |
3491: for (jk = C_tmp_diag_i[ik]; jk < C_tmp_diag_i[ik+1]; jk++) |
3492: { |
3493: jcol = C_tmp_diag_j[jk]; |
3494: B_marker[jcol] = ik; |
3495: nnz_d++; |
3496: } |
3497: for (jk = C_tmp_offd_i[ik]; jk < C_tmp_offd_i[ik+1]; jk++) |
3498: { |
3499: jcol = C_tmp_offd_j[jk]; |
3500: B_marker_offd[jcol] = ik; |
3501: nnz_o++; |
3502: } |
3503: for (jk = 0; jk < num_sends_A; jk++) |
3504: for (j1 = send_map_starts_A[jk]; j1 < send_map_starts_A[jk+1]; j1++) |
3505: if (send_map_elmts_A[j1] == ik) |
3506: { |
3507: for (j2 = C_ext_diag_i[j1]; j2 < C_ext_diag_i[j1+1]; j2++) |
3508: { |
3509: jcol = C_ext_diag_j[j2]; |
3510: if (B_marker[jcol] < ik) |
3511: { |
3512: B_marker[jcol] = ik; |
3513: nnz_d++; |
3514: } |
3515: } |
3516: for (j2 = C_ext_offd_i[j1]; j2 < C_ext_offd_i[j1+1]; j2++) |
3517: { |
3518: jcol = C_ext_offd_j[j2]; |
3519: if (B_marker_offd[jcol] < ik) |
3520: { |
3521: B_marker_offd[jcol] = ik; |
3522: nnz_o++; |
3523: } |
3524: } |
3525: break; |
3526: } |
3527: C_diag_array[ii] = nnz_d; |
3528: C_offd_array[ii] = nnz_o; |
3529: } |
3530: #ifdef HYPRE_USING_OPENMP |
3531: #pragma omp barrier |
3532: #endif |
3533: if (ii == 0) |
3534: { |
3535: nnz_d = 0; |
3536: nnz_o = 0; |
3537: for (ik = 0; ik < num_threads-1; ik++) |
3538: { |
3539: C_diag_array[ik+1] += C_diag_array[ik]; |
3540: C_offd_array[ik+1] += C_offd_array[ik]; |
3541: } |
3542: nnz_d = C_diag_array[num_threads-1]; |
3543: nnz_o = C_offd_array[num_threads-1]; |
3544: C_diag_i[num_cols_diag_A] = nnz_d; |
3545: C_offd_i[num_cols_diag_A] = nnz_o; |
3546: |
3547: C_diag = hypre_CSRMatrixCreate(num_cols_diag_A, num_cols_diag_A, nnz_d); |
3548: C_offd = hypre_CSRMatrixCreate(num_cols_diag_A, num_cols_offd_C, nnz_o); |
3549: hypre_CSRMatrixI(C_diag) = C_diag_i; |
3550: hypre_CSRMatrixInitialize(C_diag); |
3551: C_diag_j = hypre_CSRMatrixJ(C_diag); |
3552: C_diag_data = hypre_CSRMatrixData(C_diag); |
3553: hypre_CSRMatrixI(C_offd) = C_offd_i; |
3554: hypre_CSRMatrixInitialize(C_offd); |
3555: C_offd_j = hypre_CSRMatrixJ(C_offd); |
3556: C_offd_data = hypre_CSRMatrixData(C_offd); |
[...] |
3568: for (ik = 0; ik < num_cols_diag_B; ik++) |
3569: B_marker[ik] = -1; |
3570: |
3571: for (ik = 0; ik < num_cols_offd_C; ik++) |
3572: B_marker_offd[ik] = -1; |
[...] |
3581: if (ii) |
3582: { |
3583: nnz_d = C_diag_array[ii-1]; |
3584: nnz_o = C_offd_array[ii-1]; |
3585: } |
3586: for (ik = ns; ik < ne; ik++) |
3587: { |
3588: C_diag_i[ik] = nnz_d; |
3589: C_offd_i[ik] = nnz_o; |
3590: for (jk = C_tmp_diag_i[ik]; jk < C_tmp_diag_i[ik+1]; jk++) |
3591: { |
3592: jcol = C_tmp_diag_j[jk]; |
3593: C_diag_j[nnz_d] = jcol; |
3594: C_diag_data[nnz_d] = C_tmp_diag_data[jk]; |
3595: B_marker[jcol] = nnz_d; |
3596: nnz_d++; |
3597: } |
3598: for (jk = C_tmp_offd_i[ik]; jk < C_tmp_offd_i[ik+1]; jk++) |
3599: { |
3600: jcol = C_tmp_offd_j[jk]; |
3601: C_offd_j[nnz_o] = jcol; |
3602: C_offd_data[nnz_o] = C_tmp_offd_data[jk]; |
3603: B_marker_offd[jcol] = nnz_o; |
3604: nnz_o++; |
3605: } |
3606: for (jk = 0; jk < num_sends_A; jk++) |
3607: for (j1 = send_map_starts_A[jk]; j1 < send_map_starts_A[jk+1]; j1++) |
3608: if (send_map_elmts_A[j1] == ik) |
3609: { |
3610: for (j2 = C_ext_diag_i[j1]; j2 < C_ext_diag_i[j1+1]; j2++) |
3611: { |
3612: jcol = C_ext_diag_j[j2]; |
3613: if (B_marker[jcol] < C_diag_i[ik]) |
3614: { |
3615: C_diag_j[nnz_d] = jcol; |
3616: C_diag_data[nnz_d] = C_ext_diag_data[j2]; |
3617: B_marker[jcol] = nnz_d; |
3618: nnz_d++; |
3619: } |
3620: else |
3621: C_diag_data[B_marker[jcol]] += C_ext_diag_data[j2]; |
3622: } |
3623: for (j2 = C_ext_offd_i[j1]; j2 < C_ext_offd_i[j1+1]; j2++) |
3624: { |
3625: jcol = C_ext_offd_j[j2]; |
3626: if (B_marker_offd[jcol] < C_offd_i[ik]) |
3627: { |
3628: C_offd_j[nnz_o] = jcol; |
3629: C_offd_data[nnz_o] = C_ext_offd_data[j2]; |
3630: B_marker_offd[jcol] = nnz_o; |
3631: nnz_o++; |
3632: } |
3633: else |
3634: C_offd_data[B_marker_offd[jcol]] += C_ext_offd_data[j2]; |
3635: } |
3636: break; |
3637: } |
3638: } |
3639: hypre_TFree(B_marker); |
3640: hypre_TFree(B_marker_offd); |
0x4c0370 PUSH %RBP |
0x4c0371 MOV %RSP,%RBP |
0x4c0374 PUSH %R15 |
0x4c0376 PUSH %R14 |
0x4c0378 PUSH %R13 |
0x4c037a PUSH %R12 |
0x4c037c PUSH %RBX |
0x4c037d SUB $0x128,%RSP |
0x4c0384 MOV %R9,-0xe8(%RBP) |
0x4c038b MOV %R8,-0x128(%RBP) |
0x4c0392 MOV %RCX,-0x100(%RBP) |
0x4c0399 MOV %RDX,%R15 |
0x4c039c MOV %RDI,-0xc0(%RBP) |
0x4c03a3 MOV 0xc8(%RBP),%RAX |
0x4c03aa MOV %RAX,-0xd0(%RBP) |
0x4c03b1 MOV 0xc0(%RBP),%RAX |
0x4c03b8 MOV %RAX,-0xc8(%RBP) |
0x4c03bf MOV 0xb8(%RBP),%RAX |
0x4c03c6 MOV %RAX,-0x78(%RBP) |
0x4c03ca MOV 0xb0(%RBP),%RBX |
0x4c03d1 MOV 0xa8(%RBP),%RAX |
0x4c03d8 MOV %RAX,-0x50(%RBP) |
0x4c03dc MOV 0xa0(%RBP),%RAX |
0x4c03e3 MOV %RAX,-0x38(%RBP) |
0x4c03e7 MOV 0x98(%RBP),%RAX |
0x4c03ee MOV %RAX,-0xf8(%RBP) |
0x4c03f5 MOV 0x90(%RBP),%RAX |
0x4c03fc MOV %RAX,-0xa8(%RBP) |
0x4c0403 MOV 0x88(%RBP),%RAX |
0x4c040a MOV %RAX,-0xe0(%RBP) |
0x4c0411 MOV 0x80(%RBP),%R13 |
0x4c0418 MOV 0x78(%RBP),%RAX |
0x4c041c MOV %RAX,-0x58(%RBP) |
0x4c0420 MOV 0x70(%RBP),%RAX |
0x4c0424 MOV %RAX,-0x90(%RBP) |
0x4c042b MOV 0x68(%RBP),%R12 |
0x4c042f MOV 0x60(%RBP),%RAX |
0x4c0433 MOV %RAX,-0x60(%RBP) |
0x4c0437 MOV 0x58(%RBP),%RAX |
0x4c043b MOV %RAX,-0x80(%RBP) |
0x4c043f MOV 0x50(%RBP),%RAX |
0x4c0443 MOV %RAX,-0x148(%RBP) |
0x4c044a MOV 0x48(%RBP),%RAX |
0x4c044e MOV %RAX,-0x110(%RBP) |
0x4c0455 MOV 0x40(%RBP),%RAX |
0x4c0459 MOV %RAX,-0xb8(%RBP) |
0x4c0460 MOV 0x38(%RBP),%RAX |
0x4c0464 MOV %RAX,-0x140(%RBP) |
0x4c046b MOV 0x30(%RBP),%RAX |
0x4c046f MOV %RAX,-0x108(%RBP) |
0x4c0476 MOV 0x28(%RBP),%RAX |
0x4c047a MOV %RAX,-0xb0(%RBP) |
0x4c0481 MOV 0x20(%RBP),%RAX |
0x4c0485 MOV %RAX,-0x120(%RBP) |
0x4c048c MOV 0x18(%RBP),%RAX |
0x4c0490 MOV %RAX,-0xf0(%RBP) |
0x4c0497 MOV 0x10(%RBP),%RAX |
0x4c049b MOV %RAX,-0xa0(%RBP) |
0x4c04a2 CALL 4e8aa0 <hypre_NumActiveThreads> |
0x4c04a7 MOV %RAX,%RCX |
0x4c04aa MOV %R15,%RAX |
0x4c04ad OR %RCX,%RAX |
0x4c04b0 SHR $0x20,%RAX |
0x4c04b4 MOV %R15,-0x130(%RBP) |
0x4c04bb MOV %RCX,-0x118(%RBP) |
0x4c04c2 JE 4c04d4 |
0x4c04c4 MOV %R15,%RAX |
0x4c04c7 CQTO |
0x4c04c9 IDIV %RCX |
0x4c04cc MOV %RDX,%R15 |
0x4c04cf MOV %RAX,%R14 |
0x4c04d2 JMP 4c04e1 |
0x4c04d4 MOV %R15D,%EAX |
0x4c04d7 XOR %EDX,%EDX |
0x4c04d9 DIV %ECX |
0x4c04db MOV %EDX,%R15D |
0x4c04de MOV %EAX,%R14D |
0x4c04e1 CALL 4e8ab0 <hypre_GetThreadNum> |
0x4c04e6 LEA 0x1(%RAX),%RCX |
0x4c04ea MOV %RCX,%RDX |
0x4c04ed IMUL %R14,%RDX |
0x4c04f1 CMP %R15,%RAX |
0x4c04f4 MOV %R12,-0x138(%RBP) |
0x4c04fb MOV %RAX,-0xd8(%RBP) |
0x4c0502 JGE 4c0518 |
0x4c0504 INC %R14 |
0x4c0507 IMUL %RAX,%R14 |
0x4c050b MOV %R14,-0x48(%RBP) |
0x4c050f ADD %RDX,%RCX |
0x4c0512 MOV %RCX,-0x68(%RBP) |
0x4c0516 JMP 4c052a |
0x4c0518 IMUL %RAX,%R14 |
0x4c051c ADD %R15,%R14 |
0x4c051f MOV %R14,-0x48(%RBP) |
0x4c0523 ADD %R15,%RDX |
0x4c0526 MOV %RDX,-0x68(%RBP) |
0x4c052a MOV -0x50(%RBP),%R15 |
0x4c052e MOV $0x8,%ESI |
0x4c0533 MOV -0x100(%RBP),%R12 |
0x4c053a MOV %R12,%RDI |
0x4c053d CALL 4e6d80 <hypre_CAlloc> |
0x4c0542 MOV %RAX,%R14 |
0x4c0545 MOV $0x8,%ESI |
0x4c054a MOV -0x78(%RBP),%RDI |
0x4c054e CALL 4e6d80 <hypre_CAlloc> |
0x4c0553 MOV %R12,%RCX |
0x4c0556 MOV %RAX,%R12 |
0x4c0559 TEST %RCX,%RCX |
0x4c055c JLE 4c0573 |
0x4c055e LEA (,%RCX,8),%RDX |
0x4c0566 MOV %R14,%RDI |
0x4c0569 MOV $0xff,%ESI |
0x4c056e CALL 4efe80 <_intel_fast_memset> |
0x4c0573 MOV -0x78(%RBP),%RAX |
0x4c0577 TEST %RAX,%RAX |
0x4c057a JLE 4c0591 |
0x4c057c LEA (,%RAX,8),%RDX |
0x4c0584 MOV %R12,%RDI |
0x4c0587 MOV $0xff,%ESI |
0x4c058c CALL 4efe80 <_intel_fast_memset> |
0x4c0591 MOV -0x48(%RBP),%RAX |
0x4c0595 CMP -0x68(%RBP),%RAX |
0x4c0599 MOV %RBX,-0x40(%RBP) |
0x4c059d MOV -0x38(%RBP),%R11 |
0x4c05a1 MOV %R13,-0x88(%RBP) |
0x4c05a8 MOV -0x60(%RBP),%R9 |
0x4c05ac MOV %R14,-0x30(%RBP) |
0x4c05b0 JGE 4c08f2 |
0x4c05b6 XOR %EAX,%EAX |
0x4c05b8 MOV -0x48(%RBP),%RDX |
0x4c05bc XOR %ECX,%ECX |
0x4c05be JMP 4c05ee |
(3670) 0x4c05c0 MOV -0xc8(%RBP),%RDX |
(3670) 0x4c05c7 MOV -0xd8(%RBP),%RSI |
(3670) 0x4c05ce MOV %RCX,(%RDX,%RSI,8) |
(3670) 0x4c05d2 MOV -0xd0(%RBP),%RDX |
(3670) 0x4c05d9 MOV %RAX,(%RDX,%RSI,8) |
(3670) 0x4c05dd MOV -0x70(%RBP),%RSI |
(3670) 0x4c05e1 MOV %RSI,%RDX |
(3670) 0x4c05e4 CMP -0x68(%RBP),%RSI |
(3670) 0x4c05e8 JGE 4c08f2 |
(3670) 0x4c05ee MOV -0x80(%RBP),%RDI |
(3670) 0x4c05f2 MOV (%RDI,%RDX,8),%RSI |
(3670) 0x4c05f6 LEA 0x1(%RDX),%R8 |
(3670) 0x4c05fa MOV %R8,-0x70(%RBP) |
(3670) 0x4c05fe CMP 0x8(%RDI,%RDX,8),%RSI |
(3670) 0x4c0603 JGE 4c0680 |
(3670) 0x4c0605 MOV -0x58(%RBP),%R8 |
(3670) 0x4c0609 MOV -0x80(%RBP),%R10 |
(3670) 0x4c060d MOV -0x70(%RBP),%RBX |
(3670) 0x4c0611 NOPW %CS:(%RAX,%RAX,1) |
(3677) 0x4c0620 MOV (%R9,%RSI,8),%RDI |
(3677) 0x4c0624 MOV %RDX,(%R14,%RDI,8) |
(3677) 0x4c0628 INC %RCX |
(3677) 0x4c062b INC %RSI |
(3677) 0x4c062e CMP (%R10,%RBX,8),%RSI |
(3677) 0x4c0632 JL 4c0620 |
(3670) 0x4c0634 MOV -0x90(%RBP),%RDI |
(3670) 0x4c063b MOV (%RDI,%RDX,8),%RSI |
(3670) 0x4c063f CMP (%RDI,%RBX,8),%RSI |
(3670) 0x4c0643 JGE 4c0699 |
(3670) 0x4c0645 MOV -0x40(%RBP),%RBX |
(3670) 0x4c0649 NOPL (%RAX) |
(3669) 0x4c0650 MOV (%R8,%RSI,8),%RDI |
(3669) 0x4c0654 MOV %RDX,(%R12,%RDI,8) |
(3669) 0x4c0658 INC %RAX |
(3669) 0x4c065b INC %RSI |
(3669) 0x4c065e MOV -0x90(%RBP),%RDI |
(3669) 0x4c0665 MOV -0x70(%RBP),%R10 |
(3669) 0x4c0669 CMP (%RDI,%R10,8),%RSI |
(3669) 0x4c066d JL 4c0650 |
(3670) 0x4c066f TEST %RBX,%RBX |
(3670) 0x4c0672 JG 4c06a6 |
(3670) 0x4c0674 JMP 4c05c0 |
0x4c0679 NOPL (%RAX) |
(3670) 0x4c0680 MOV -0x58(%RBP),%R8 |
(3670) 0x4c0684 MOV -0x70(%RBP),%RBX |
(3670) 0x4c0688 MOV -0x90(%RBP),%RDI |
(3670) 0x4c068f MOV (%RDI,%RDX,8),%RSI |
(3670) 0x4c0693 CMP (%RDI,%RBX,8),%RSI |
(3670) 0x4c0697 JL 4c0645 |
(3670) 0x4c0699 MOV -0x40(%RBP),%RBX |
(3670) 0x4c069d TEST %RBX,%RBX |
(3670) 0x4c06a0 JLE 4c05c0 |
(3670) 0x4c06a6 VPBROADCASTQ %RDX,%YMM0 |
(3670) 0x4c06ac XOR %EDI,%EDI |
(3670) 0x4c06ae JMP 4c06c3 |
(3671) 0x4c06b0 MOV -0x60(%RBP),%R9 |
(3671) 0x4c06b4 MOV %RSI,%R11 |
(3671) 0x4c06b7 INC %RDI |
(3671) 0x4c06ba CMP %RBX,%RDI |
(3671) 0x4c06bd JE 4c05c0 |
(3671) 0x4c06c3 MOV (%R11,%RDI,8),%R10 |
(3671) 0x4c06c7 MOV 0x8(%R11,%RDI,8),%R9 |
(3671) 0x4c06cc MOV %R11,%RSI |
(3671) 0x4c06cf MOV %R9,%R11 |
(3671) 0x4c06d2 SUB %R10,%R11 |
(3671) 0x4c06d5 JLE 4c06b0 |
(3671) 0x4c06d7 LEA (%R15,%R10,8),%ESI |
(3671) 0x4c06db AND $0x7f,%ESI |
(3671) 0x4c06de MOV $0x80,%EBX |
(3671) 0x4c06e3 SUB %ESI,%EBX |
(3671) 0x4c06e5 SHR $0x3,%EBX |
(3671) 0x4c06e8 CMP %RBX,%R11 |
(3671) 0x4c06eb MOV %RBX,%RSI |
(3671) 0x4c06ee CMOVB %R11,%RSI |
(3671) 0x4c06f2 TEST %RSI,%RSI |
(3671) 0x4c06f5 JE 4c0712 |
(3671) 0x4c06f7 MOV %R10,%R8 |
(3671) 0x4c06fa MOV %RSI,%R14 |
(3671) 0x4c06fd NOPL (%RAX) |
(3676) 0x4c0700 CMP %RDX,(%R15,%R8,8) |
(3676) 0x4c0704 JE 4c07ee |
(3676) 0x4c070a INC %R8 |
(3676) 0x4c070d DEC %R14 |
(3676) 0x4c0710 JNE 4c0700 |
(3671) 0x4c0712 CMP %RBX,%R11 |
(3671) 0x4c0715 JBE 4c07d9 |
(3671) 0x4c071b SUB %RSI,%R11 |
(3671) 0x4c071e MOV %R11,%RBX |
(3671) 0x4c0721 AND $-0x10,%RBX |
(3671) 0x4c0725 JE 4c077a |
(3671) 0x4c0727 LEA -0x1(%RBX),%R13 |
(3671) 0x4c072b LEA (%R10,%RSI,1),%R8 |
(3671) 0x4c072f MOV -0x50(%RBP),%R14 |
(3671) 0x4c0733 LEA (%R14,%R8,8),%R15 |
(3671) 0x4c0737 XOR %R14D,%R14D |
(3671) 0x4c073a NOPW (%RAX,%RAX,1) |
(3675) 0x4c0740 VPCMPEQQ 0x20(%R15,%R14,8),%YMM0,%K0 |
(3675) 0x4c0748 VPCMPEQQ (%R15,%R14,8),%YMM0,%K1 |
(3675) 0x4c074f VPCMPEQQ 0x60(%R15,%R14,8),%YMM0,%K2 |
(3675) 0x4c0757 VPCMPEQQ 0x40(%R15,%R14,8),%YMM0,%K3 |
(3675) 0x4c075f KORB %K0,%K1,%K4 |
(3675) 0x4c0763 KORB %K2,%K3,%K5 |
(3675) 0x4c0767 KORTESTB %K5,%K4 |
(3675) 0x4c076b JNE 4c081c |
(3675) 0x4c0771 ADD $0x10,%R14 |
(3675) 0x4c0775 CMP %R13,%R14 |
(3675) 0x4c0778 JBE 4c0740 |
(3671) 0x4c077a CMP %R11,%RBX |
(3671) 0x4c077d JAE 4c07fc |
(3671) 0x4c077f ADD %RSI,%R10 |
(3671) 0x4c0782 ADD %RBX,%R10 |
(3671) 0x4c0785 MOV %R10,%R8 |
(3671) 0x4c0788 MOV -0x40(%RBP),%RBX |
(3671) 0x4c078c MOV -0x50(%RBP),%R15 |
(3671) 0x4c0790 MOV -0x38(%RBP),%R11 |
(3671) 0x4c0794 MOV -0x88(%RBP),%R13 |
(3671) 0x4c079b MOV -0x48(%RBP),%RSI |
(3671) 0x4c079f MOV -0x30(%RBP),%R14 |
(3671) 0x4c07a3 MOV %RSI,-0x48(%RBP) |
(3671) 0x4c07a7 NOPW (%RAX,%RAX,1) |
(3674) 0x4c07b0 CMP %RDX,(%R15,%R8,8) |
(3674) 0x4c07b4 JE 4c0859 |
(3674) 0x4c07ba INC %R8 |
(3674) 0x4c07bd CMP %R8,%R9 |
(3674) 0x4c07c0 JNE 4c07b0 |
(3671) 0x4c07c2 NOPW %CS:(%RAX,%RAX,1) |
(3671) 0x4c07d0 MOV -0x60(%RBP),%R9 |
(3671) 0x4c07d4 JMP 4c06b7 |
(3671) 0x4c07d9 MOV -0x38(%RBP),%R11 |
(3671) 0x4c07dd MOV -0x60(%RBP),%R9 |
(3671) 0x4c07e1 MOV -0x30(%RBP),%R14 |
(3671) 0x4c07e5 MOV -0x40(%RBP),%RBX |
(3671) 0x4c07e9 JMP 4c06b7 |
(3671) 0x4c07ee MOV -0x38(%RBP),%R11 |
(3671) 0x4c07f2 MOV -0x30(%RBP),%R14 |
(3671) 0x4c07f6 MOV -0x40(%RBP),%RBX |
(3671) 0x4c07fa JMP 4c0859 |
(3671) 0x4c07fc MOV -0x40(%RBP),%RBX |
(3671) 0x4c0800 MOV -0x50(%RBP),%R15 |
(3671) 0x4c0804 MOV -0x38(%RBP),%R11 |
(3671) 0x4c0808 MOV -0x88(%RBP),%R13 |
(3671) 0x4c080f MOV -0x60(%RBP),%R9 |
(3671) 0x4c0813 MOV -0x30(%RBP),%R14 |
(3671) 0x4c0817 JMP 4c06b7 |
(3671) 0x4c081c KSHIFTLB $0x4,%K0,%K0 |
(3671) 0x4c0822 KORB %K0,%K1,%K0 |
(3671) 0x4c0826 KSHIFTLB $0x4,%K2,%K1 |
(3671) 0x4c082c KORB %K1,%K3,%K1 |
(3671) 0x4c0830 KUNPCKBW %K0,%K1,%K0 |
(3671) 0x4c0834 KMOVD %K0,%ESI |
(3671) 0x4c0838 TZCNT %ESI,%ESI |
(3671) 0x4c083c ADD %R14,%R8 |
(3671) 0x4c083f ADD %RSI,%R8 |
(3671) 0x4c0842 MOV -0x40(%RBP),%RBX |
(3671) 0x4c0846 MOV -0x50(%RBP),%R15 |
(3671) 0x4c084a MOV -0x38(%RBP),%R11 |
(3671) 0x4c084e MOV -0x88(%RBP),%R13 |
(3671) 0x4c0855 MOV -0x30(%RBP),%R14 |
(3671) 0x4c0859 MOV -0xb0(%RBP),%R9 |
(3671) 0x4c0860 MOV (%R9,%R8,8),%RSI |
(3671) 0x4c0864 MOV 0x8(%R9,%R8,8),%R9 |
(3671) 0x4c0869 JMP 4c0873 |
0x4c086b NOPL (%RAX,%RAX,1) |
(3673) 0x4c0870 INC %RSI |
(3673) 0x4c0873 CMP %R9,%RSI |
(3673) 0x4c0876 JGE 4c08a0 |
(3673) 0x4c0878 MOV -0x108(%RBP),%R10 |
(3673) 0x4c087f MOV (%R10,%RSI,8),%R10 |
(3673) 0x4c0883 CMP %RDX,(%R14,%R10,8) |
(3673) 0x4c0887 JGE 4c0870 |
(3673) 0x4c0889 MOV %RDX,(%R14,%R10,8) |
(3673) 0x4c088d INC %RCX |
(3673) 0x4c0890 MOV -0xb0(%RBP),%R9 |
(3673) 0x4c0897 MOV 0x8(%R9,%R8,8),%R9 |
(3673) 0x4c089c JMP 4c0870 |
0x4c089e XCHG %AX,%AX |
(3671) 0x4c08a0 MOV -0xb8(%RBP),%R9 |
(3671) 0x4c08a7 MOV (%R9,%R8,8),%RSI |
(3671) 0x4c08ab MOV 0x8(%R9,%R8,8),%R9 |
(3671) 0x4c08b0 JMP 4c08c3 |
0x4c08b2 NOPW %CS:(%RAX,%RAX,1) |
(3672) 0x4c08c0 INC %RSI |
(3672) 0x4c08c3 CMP %R9,%RSI |
(3672) 0x4c08c6 JGE 4c07d0 |
(3672) 0x4c08cc MOV -0x110(%RBP),%R10 |
(3672) 0x4c08d3 MOV (%R10,%RSI,8),%R10 |
(3672) 0x4c08d7 CMP %RDX,(%R12,%R10,8) |
(3672) 0x4c08db JGE 4c08c0 |
(3672) 0x4c08dd MOV %RDX,(%R12,%R10,8) |
(3672) 0x4c08e1 INC %RAX |
(3672) 0x4c08e4 MOV -0xb8(%RBP),%R9 |
(3672) 0x4c08eb MOV 0x8(%R9,%R8,8),%R9 |
(3672) 0x4c08f0 JMP 4c08c0 |
0x4c08f2 MOV -0xc0(%RBP),%RAX |
0x4c08f9 MOV (%RAX),%ESI |
0x4c08fb MOV $0x736270,%EDI |
0x4c0900 VZEROUPPER |
0x4c0903 CALL 410020 <__kmpc_barrier@plt> |
0x4c0908 MOV -0xc0(%RBP),%RAX |
0x4c090f CMPQ $0,-0xd8(%RBP) |
0x4c0917 JNE 4c0b50 |
0x4c091d MOV -0x118(%RBP),%RDI |
0x4c0924 CMP $0x1,%RDI |
0x4c0928 MOV -0xd0(%RBP),%R10 |
0x4c092f MOV -0xc8(%RBP),%R11 |
0x4c0936 JLE 4c0a8c |
0x4c093c LEA -0x1(%RDI),%RAX |
0x4c0940 LEA (%R11,%RAX,8),%RCX |
0x4c0944 CMP %R10,%RCX |
0x4c0947 JB 4c09b1 |
0x4c0949 LEA (%R10,%RAX,8),%RCX |
0x4c094d CMP %R11,%RCX |
0x4c0950 JB 4c09b1 |
0x4c0952 LEA (%R10,%RDI,8),%RAX |
0x4c0956 CMP %R11,%RAX |
0x4c0959 JBE 4c0a5e |
0x4c095f LEA (%R11,%RDI,8),%RAX |
0x4c0963 CMP %R10,%RAX |
0x4c0966 JBE 4c0a5e |
0x4c096c MOV $0x1,%EAX |
0x4c0971 NOPW %CS:(%RAX,%RAX,1) |
(3668) 0x4c0980 MOV -0x8(%R11,%RAX,8),%RCX |
(3668) 0x4c0985 LEA (%R11,%RAX,8),%RDX |
(3668) 0x4c0989 MOV (%RDX),%RSI |
(3668) 0x4c098c ADD %RCX,%RSI |
(3668) 0x4c098f MOV %RSI,(%RDX) |
(3668) 0x4c0992 MOV -0x8(%R10,%RAX,8),%RCX |
(3668) 0x4c0997 LEA (%R10,%RAX,8),%RDX |
(3668) 0x4c099b MOV (%RDX),%RSI |
(3668) 0x4c099e ADD %RCX,%RSI |
(3668) 0x4c09a1 MOV %RSI,(%RDX) |
(3668) 0x4c09a4 INC %RAX |
(3668) 0x4c09a7 CMP %RAX,%RDI |
(3668) 0x4c09aa JNE 4c0980 |
0x4c09ac JMP 4c0a8c |
0x4c09b1 MOV %RDI,%RBX |
0x4c09b4 CMP $0x5,%RDI |
0x4c09b8 JB 4c0a1d |
0x4c09ba MOV %RAX,%RCX |
0x4c09bd SHR $0x2,%RCX |
0x4c09c1 MOV (%R11),%RDX |
0x4c09c4 MOV (%R10),%RSI |
0x4c09c7 MOV $0x20,%EDI |
0x4c09cc NOPL (%RAX) |
(3666) 0x4c09d0 LEA (%R11,%RDI,1),%R8 |
(3666) 0x4c09d4 ADD -0x18(%R8),%RDX |
(3666) 0x4c09d8 MOV %RDX,-0x18(%R8) |
(3666) 0x4c09dc LEA (%R10,%RDI,1),%R9 |
(3666) 0x4c09e0 ADD -0x18(%R9),%RSI |
(3666) 0x4c09e4 MOV %RSI,-0x18(%R9) |
(3666) 0x4c09e8 ADD -0x10(%R8),%RDX |
(3666) 0x4c09ec MOV %RDX,-0x10(%R8) |
(3666) 0x4c09f0 ADD -0x10(%R9),%RSI |
(3666) 0x4c09f4 MOV %RSI,-0x10(%R9) |
(3666) 0x4c09f8 ADD -0x8(%R8),%RDX |
(3666) 0x4c09fc MOV %RDX,-0x8(%R8) |
(3666) 0x4c0a00 ADD -0x8(%R9),%RSI |
(3666) 0x4c0a04 MOV %RSI,-0x8(%R9) |
(3666) 0x4c0a08 ADD (%R8),%RDX |
(3666) 0x4c0a0b MOV %RDX,(%R8) |
(3666) 0x4c0a0e ADD (%R9),%RSI |
(3666) 0x4c0a11 MOV %RSI,(%R9) |
(3666) 0x4c0a14 ADD $0x20,%RDI |
(3666) 0x4c0a18 DEC %RCX |
(3666) 0x4c0a1b JNE 4c09d0 |
0x4c0a1d MOV %RAX,%RCX |
0x4c0a20 AND $-0x4,%RCX |
0x4c0a24 CMP %RAX,%RCX |
0x4c0a27 MOV %RBX,%RDI |
0x4c0a2a JAE 4c0a8c |
0x4c0a2c MOV (%R11,%RCX,8),%RAX |
0x4c0a30 MOV (%R10,%RCX,8),%RDX |
0x4c0a34 INC %RCX |
0x4c0a37 NOPW (%RAX,%RAX,1) |
(3665) 0x4c0a40 LEA (%R11,%RCX,8),%RSI |
(3665) 0x4c0a44 ADD (%RSI),%RAX |
(3665) 0x4c0a47 MOV %RAX,(%RSI) |
(3665) 0x4c0a4a LEA (%R10,%RCX,8),%RSI |
(3665) 0x4c0a4e ADD (%RSI),%RDX |
(3665) 0x4c0a51 MOV %RDX,(%RSI) |
(3665) 0x4c0a54 INC %RCX |
(3665) 0x4c0a57 CMP %RCX,%RDI |
(3665) 0x4c0a5a JNE 4c0a40 |
0x4c0a5c JMP 4c0a8c |
0x4c0a5e MOV (%R11),%RAX |
0x4c0a61 MOV (%R10),%RCX |
0x4c0a64 MOV $0x1,%EDX |
0x4c0a69 NOPL (%RAX) |
(3667) 0x4c0a70 LEA (%R11,%RDX,8),%RSI |
(3667) 0x4c0a74 ADD (%RSI),%RAX |
(3667) 0x4c0a77 MOV %RAX,(%RSI) |
(3667) 0x4c0a7a LEA (%R10,%RDX,8),%RSI |
(3667) 0x4c0a7e ADD (%RSI),%RCX |
(3667) 0x4c0a81 MOV %RCX,(%RSI) |
(3667) 0x4c0a84 INC %RDX |
(3667) 0x4c0a87 CMP %RDX,%RDI |
(3667) 0x4c0a8a JNE 4c0a70 |
0x4c0a8c MOV -0x8(%R11,%RDI,8),%RDX |
0x4c0a91 MOV -0x8(%R10,%RDI,8),%RCX |
0x4c0a96 MOV %RCX,-0x70(%RBP) |
0x4c0a9a MOV -0x130(%RBP),%RBX |
0x4c0aa1 MOV -0xa0(%RBP),%RAX |
0x4c0aa8 MOV %RDX,(%RAX,%RBX,8) |
0x4c0aac MOV -0xa8(%RBP),%RAX |
0x4c0ab3 MOV %RCX,(%RAX,%RBX,8) |
0x4c0ab7 MOV %RBX,%RDI |
0x4c0aba MOV %RBX,%RSI |
0x4c0abd CALL 4daa30 <hypre_CSRMatrixCreate> |
0x4c0ac2 MOV %RAX,%R13 |
0x4c0ac5 MOV -0x128(%RBP),%RAX |
0x4c0acc MOV %R13,(%RAX) |
0x4c0acf MOV %RBX,%RDI |
0x4c0ad2 MOV -0x78(%RBP),%RSI |
0x4c0ad6 MOV -0x70(%RBP),%RDX |
0x4c0ada CALL 4daa30 <hypre_CSRMatrixCreate> |
0x4c0adf MOV %RAX,%RBX |
0x4c0ae2 MOV -0x120(%RBP),%RAX |
0x4c0ae9 MOV %RBX,(%RAX) |
0x4c0aec MOV -0xa0(%RBP),%RAX |
0x4c0af3 MOV %RAX,(%R13) |
0x4c0af7 MOV %R13,%RDI |
0x4c0afa CALL 4dab10 <hypre_CSRMatrixInitialize> |
0x4c0aff MOV 0x8(%R13),%RAX |
0x4c0b03 MOV -0xf0(%RBP),%RCX |
0x4c0b0a MOV %RAX,(%RCX) |
0x4c0b0d MOV 0x30(%R13),%RAX |
0x4c0b11 MOV -0xe8(%RBP),%RCX |
0x4c0b18 MOV %RAX,(%RCX) |
0x4c0b1b MOV -0xa8(%RBP),%RAX |
0x4c0b22 MOV %RAX,(%RBX) |
0x4c0b25 MOV %RBX,%RDI |
0x4c0b28 CALL 4dab10 <hypre_CSRMatrixInitialize> |
0x4c0b2d MOV 0x8(%RBX),%RAX |
0x4c0b31 MOV -0xf8(%RBP),%RCX |
0x4c0b38 MOV %RAX,(%RCX) |
0x4c0b3b MOV 0x30(%RBX),%RAX |
0x4c0b3f MOV -0xe0(%RBP),%RCX |
0x4c0b46 MOV %RAX,(%RCX) |
0x4c0b49 MOV -0xc0(%RBP),%RAX |
0x4c0b50 MOV (%RAX),%ESI |
0x4c0b52 MOV $0x736290,%EDI |
0x4c0b57 CALL 410020 <__kmpc_barrier@plt> |
0x4c0b5c MOV -0x100(%RBP),%RDX |
0x4c0b63 TEST %RDX,%RDX |
0x4c0b66 JLE 4c0b79 |
0x4c0b68 SAL $0x3,%RDX |
0x4c0b6c MOV %R14,%RDI |
0x4c0b6f MOV $0xff,%ESI |
0x4c0b74 CALL 4efe80 <_intel_fast_memset> |
0x4c0b79 MOV -0x78(%RBP),%RDX |
0x4c0b7d TEST %RDX,%RDX |
0x4c0b80 JLE 4c0b93 |
0x4c0b82 SAL $0x3,%RDX |
0x4c0b86 MOV %R12,%RDI |
0x4c0b89 MOV $0xff,%ESI |
0x4c0b8e CALL 4efe80 <_intel_fast_memset> |
0x4c0b93 MOV -0xd8(%RBP),%RDX |
0x4c0b9a TEST %RDX,%RDX |
0x4c0b9d JE 4c0bc9 |
0x4c0b9f MOV -0xc8(%RBP),%RAX |
0x4c0ba6 MOV -0x8(%RAX,%RDX,8),%RAX |
0x4c0bab MOV -0xd0(%RBP),%RCX |
0x4c0bb2 MOV -0x8(%RCX,%RDX,8),%RCX |
0x4c0bb7 MOV -0x68(%RBP),%RDX |
0x4c0bbb MOV -0x48(%RBP),%RSI |
0x4c0bbf CMP %RDX,%RSI |
0x4c0bc2 JL 4c0bde |
0x4c0bc4 JMP 4c101f |
0x4c0bc9 XOR %EAX,%EAX |
0x4c0bcb XOR %ECX,%ECX |
0x4c0bcd MOV -0x68(%RBP),%RDX |
0x4c0bd1 MOV -0x48(%RBP),%RSI |
0x4c0bd5 CMP %RDX,%RSI |
0x4c0bd8 JGE 4c101f |
0x4c0bde MOV %R12,-0x98(%RBP) |
0x4c0be5 JMP 4c0c08 |
0x4c0be7 NOPW (%RAX,%RAX,1) |
(3657) 0x4c0bf0 MOV -0x98(%RBP),%R12 |
(3657) 0x4c0bf7 MOV -0x68(%RBP),%RDX |
(3657) 0x4c0bfb MOV -0x48(%RBP),%RSI |
(3657) 0x4c0bff CMP %RDX,%RSI |
(3657) 0x4c0c02 JGE 4c101f |
(3657) 0x4c0c08 MOV %RSI,%RDX |
(3657) 0x4c0c0b MOV -0xa0(%RBP),%RSI |
(3657) 0x4c0c12 MOV %RAX,(%RSI,%RDX,8) |
(3657) 0x4c0c16 MOV -0xa8(%RBP),%RSI |
(3657) 0x4c0c1d MOV %RCX,(%RSI,%RDX,8) |
(3657) 0x4c0c21 MOV -0x80(%RBP),%R8 |
(3657) 0x4c0c25 MOV (%R8,%RDX,8),%RSI |
(3657) 0x4c0c29 LEA 0x1(%RDX),%RDI |
(3657) 0x4c0c2d MOV %RDI,-0x48(%RBP) |
(3657) 0x4c0c31 CMP 0x8(%R8,%RDX,8),%RSI |
(3657) 0x4c0c36 JGE 4c0d30 |
(3657) 0x4c0c3c MOV -0xf0(%RBP),%RDI |
(3657) 0x4c0c43 MOV (%RDI),%RDI |
(3657) 0x4c0c46 MOV -0xe8(%RBP),%R8 |
(3657) 0x4c0c4d MOV (%R8),%R8 |
(3657) 0x4c0c50 MOV -0x138(%RBP),%R10 |
(3657) 0x4c0c57 MOV -0x60(%RBP),%R14 |
(3657) 0x4c0c5b MOV -0x80(%RBP),%RBX |
(3657) 0x4c0c5f MOV -0x48(%RBP),%R13 |
(3657) 0x4c0c63 MOV -0x30(%RBP),%R11 |
(3657) 0x4c0c67 NOPW (%RAX,%RAX,1) |
(3664) 0x4c0c70 MOV (%R14,%RSI,8),%R9 |
(3664) 0x4c0c74 MOV %R9,(%RDI,%RAX,8) |
(3664) 0x4c0c78 VMOVQ (%R10,%RSI,8),%XMM0 |
(3664) 0x4c0c7e VMOVQ %XMM0,(%R8,%RAX,8) |
(3664) 0x4c0c84 MOV %RAX,(%R11,%R9,8) |
(3664) 0x4c0c88 INC %RAX |
(3664) 0x4c0c8b INC %RSI |
(3664) 0x4c0c8e CMP (%RBX,%R13,8),%RSI |
(3664) 0x4c0c92 JL 4c0c70 |
(3657) 0x4c0c94 MOV -0x90(%RBP),%RDI |
(3657) 0x4c0c9b MOV (%RDI,%RDX,8),%RSI |
(3657) 0x4c0c9f CMP (%RDI,%R13,8),%RSI |
(3657) 0x4c0ca3 JGE 4c0d49 |
(3657) 0x4c0ca9 MOV -0xf8(%RBP),%RDI |
(3657) 0x4c0cb0 MOV (%RDI),%RDI |
(3657) 0x4c0cb3 MOV -0xe0(%RBP),%R8 |
(3657) 0x4c0cba MOV (%R8),%R8 |
(3657) 0x4c0cbd MOV -0x30(%RBP),%R14 |
(3657) 0x4c0cc1 MOV -0x88(%RBP),%R13 |
(3657) 0x4c0cc8 MOV -0x38(%RBP),%R11 |
(3657) 0x4c0ccc MOV -0x48(%RBP),%R10 |
(3657) 0x4c0cd0 MOV -0x90(%RBP),%RBX |
(3657) 0x4c0cd7 MOV -0x58(%RBP),%R12 |
(3657) 0x4c0cdb MOV -0x98(%RBP),%R15 |
(3657) 0x4c0ce2 NOPW %CS:(%RAX,%RAX,1) |
(3656) 0x4c0cf0 MOV (%R12,%RSI,8),%R9 |
(3656) 0x4c0cf4 MOV %R9,(%RDI,%RCX,8) |
(3656) 0x4c0cf8 VMOVQ (%R13,%RSI,8),%XMM0 |
(3656) 0x4c0cff VMOVQ %XMM0,(%R8,%RCX,8) |
(3656) 0x4c0d05 MOV %RCX,(%R15,%R9,8) |
(3656) 0x4c0d09 INC %RCX |
(3656) 0x4c0d0c INC %RSI |
(3656) 0x4c0d0f CMP (%RBX,%R10,8),%RSI |
(3656) 0x4c0d13 JL 4c0cf0 |
(3657) 0x4c0d15 MOV -0x40(%RBP),%RBX |
(3657) 0x4c0d19 TEST %RBX,%RBX |
(3657) 0x4c0d1c JG 4c0d5e |
(3657) 0x4c0d1e JMP 4c0bf0 |
0x4c0d23 NOPW %CS:(%RAX,%RAX,1) |
(3657) 0x4c0d30 MOV -0x48(%RBP),%R13 |
(3657) 0x4c0d34 MOV -0x90(%RBP),%RDI |
(3657) 0x4c0d3b MOV (%RDI,%RDX,8),%RSI |
(3657) 0x4c0d3f CMP (%RDI,%R13,8),%RSI |
(3657) 0x4c0d43 JL 4c0ca9 |
(3657) 0x4c0d49 MOV -0x30(%RBP),%R14 |
(3657) 0x4c0d4d MOV -0x38(%RBP),%R11 |
(3657) 0x4c0d51 MOV -0x40(%RBP),%RBX |
(3657) 0x4c0d55 TEST %RBX,%RBX |
(3657) 0x4c0d58 JLE 4c0bf0 |
(3657) 0x4c0d5e VPBROADCASTQ %RDX,%YMM0 |
(3657) 0x4c0d64 XOR %ESI,%ESI |
(3657) 0x4c0d66 MOV -0x58(%RBP),%R10 |
(3657) 0x4c0d6a MOV -0x50(%RBP),%R15 |
(3657) 0x4c0d6e JMP 4c0d86 |
(3658) 0x4c0d70 MOV %R12,%R10 |
(3658) 0x4c0d73 MOV -0x98(%RBP),%R12 |
(3658) 0x4c0d7a INC %RSI |
(3658) 0x4c0d7d CMP %RBX,%RSI |
(3658) 0x4c0d80 JE 4c0bf7 |
(3658) 0x4c0d86 MOV %R10,%R12 |
(3658) 0x4c0d89 MOV (%R11,%RSI,8),%R9 |
(3658) 0x4c0d8d MOV 0x8(%R11,%RSI,8),%R8 |
(3658) 0x4c0d92 MOV %R8,%R10 |
(3658) 0x4c0d95 SUB %R9,%R10 |
(3658) 0x4c0d98 JLE 4c0d70 |
(3658) 0x4c0d9a LEA (%R15,%R9,8),%EDI |
(3658) 0x4c0d9e AND $0x7f,%EDI |
(3658) 0x4c0da1 MOV $0x80,%EBX |
(3658) 0x4c0da6 SUB %EDI,%EBX |
(3658) 0x4c0da8 SHR $0x3,%EBX |
(3658) 0x4c0dab CMP %RBX,%R10 |
(3658) 0x4c0dae MOV %RBX,%R11 |
(3658) 0x4c0db1 CMOVB %R10,%R11 |
(3658) 0x4c0db5 TEST %R11,%R11 |
(3658) 0x4c0db8 MOV -0x98(%RBP),%R12 |
(3658) 0x4c0dbf JE 4c0de2 |
(3658) 0x4c0dc1 MOV %R9,%RDI |
(3658) 0x4c0dc4 MOV %R11,%R14 |
(3658) 0x4c0dc7 NOPW (%RAX,%RAX,1) |
(3663) 0x4c0dd0 CMP %RDX,(%R15,%RDI,8) |
(3663) 0x4c0dd4 JE 4c0edc |
(3663) 0x4c0dda INC %RDI |
(3663) 0x4c0ddd DEC %R14 |
(3663) 0x4c0de0 JNE 4c0dd0 |
(3658) 0x4c0de2 CMP %RBX,%R10 |
(3658) 0x4c0de5 JBE 4c0e83 |
(3658) 0x4c0deb SUB %R11,%R10 |
(3658) 0x4c0dee MOV %R10,%RBX |
(3658) 0x4c0df1 AND $-0x10,%RBX |
(3658) 0x4c0df5 JE 4c0e46 |
(3658) 0x4c0df7 LEA -0x1(%RBX),%R13 |
(3658) 0x4c0dfb LEA (%R9,%R11,1),%RDI |
(3658) 0x4c0dff MOV -0x50(%RBP),%R14 |
(3658) 0x4c0e03 LEA (%R14,%RDI,8),%R15 |
(3658) 0x4c0e07 XOR %R14D,%R14D |
(3658) 0x4c0e0a NOPW (%RAX,%RAX,1) |
(3662) 0x4c0e10 VPCMPEQQ 0x20(%R15,%R14,8),%YMM0,%K0 |
(3662) 0x4c0e18 VPCMPEQQ (%R15,%R14,8),%YMM0,%K1 |
(3662) 0x4c0e1f VPCMPEQQ 0x60(%R15,%R14,8),%YMM0,%K2 |
(3662) 0x4c0e27 VPCMPEQQ 0x40(%R15,%R14,8),%YMM0,%K3 |
(3662) 0x4c0e2f KORB %K0,%K1,%K4 |
(3662) 0x4c0e33 KORB %K2,%K3,%K5 |
(3662) 0x4c0e37 KORTESTB %K5,%K4 |
(3662) 0x4c0e3b JNE 4c0eb1 |
(3662) 0x4c0e3d ADD $0x10,%R14 |
(3662) 0x4c0e41 CMP %R13,%R14 |
(3662) 0x4c0e44 JBE 4c0e10 |
(3658) 0x4c0e46 CMP %R10,%RBX |
(3658) 0x4c0e49 JAE 4c0e98 |
(3658) 0x4c0e4b ADD %R11,%R9 |
(3658) 0x4c0e4e ADD %RBX,%R9 |
(3658) 0x4c0e51 MOV %R9,%RDI |
(3658) 0x4c0e54 MOV -0x40(%RBP),%RBX |
(3658) 0x4c0e58 MOV -0x50(%RBP),%R15 |
(3658) 0x4c0e5c MOV -0x38(%RBP),%R11 |
(3658) 0x4c0e60 MOV -0x58(%RBP),%R10 |
(3658) 0x4c0e64 MOV -0x30(%RBP),%R14 |
(3658) 0x4c0e68 NOPL (%RAX,%RAX,1) |
(3661) 0x4c0e70 CMP %RDX,(%R15,%RDI,8) |
(3661) 0x4c0e74 JE 4c0ee0 |
(3661) 0x4c0e76 INC %RDI |
(3661) 0x4c0e79 CMP %RDI,%R8 |
(3661) 0x4c0e7c JNE 4c0e70 |
(3658) 0x4c0e7e JMP 4c0d7a |
(3658) 0x4c0e83 MOV -0x38(%RBP),%R11 |
(3658) 0x4c0e87 MOV -0x58(%RBP),%R10 |
(3658) 0x4c0e8b MOV -0x30(%RBP),%R14 |
(3658) 0x4c0e8f MOV -0x40(%RBP),%RBX |
(3658) 0x4c0e93 JMP 4c0d7a |
(3658) 0x4c0e98 MOV -0x40(%RBP),%RBX |
(3658) 0x4c0e9c MOV -0x50(%RBP),%R15 |
(3658) 0x4c0ea0 MOV -0x38(%RBP),%R11 |
(3658) 0x4c0ea4 MOV -0x58(%RBP),%R10 |
(3658) 0x4c0ea8 MOV -0x30(%RBP),%R14 |
(3658) 0x4c0eac JMP 4c0d7a |
(3658) 0x4c0eb1 KSHIFTLB $0x4,%K0,%K0 |
(3658) 0x4c0eb7 KORB %K0,%K1,%K0 |
(3658) 0x4c0ebb KSHIFTLB $0x4,%K2,%K1 |
(3658) 0x4c0ec1 KORB %K1,%K3,%K1 |
(3658) 0x4c0ec5 KUNPCKBW %K0,%K1,%K0 |
(3658) 0x4c0ec9 KMOVD %K0,%R8D |
(3658) 0x4c0ecd TZCNT %R8D,%R8D |
(3658) 0x4c0ed2 ADD %R14,%RDI |
(3658) 0x4c0ed5 ADD %R8,%RDI |
(3658) 0x4c0ed8 MOV -0x50(%RBP),%R15 |
(3658) 0x4c0edc MOV -0x30(%RBP),%R14 |
(3658) 0x4c0ee0 MOV -0xb0(%RBP),%R9 |
(3658) 0x4c0ee7 MOV (%R9,%RDI,8),%R8 |
(3658) 0x4c0eeb MOV 0x8(%R9,%RDI,8),%R10 |
(3658) 0x4c0ef0 CMP %R10,%R8 |
(3658) 0x4c0ef3 JGE 4c0f7e |
(3658) 0x4c0ef9 MOV -0xe8(%RBP),%R9 |
(3658) 0x4c0f00 MOV (%R9),%R9 |
(3658) 0x4c0f03 JMP 4c0f24 |
0x4c0f05 NOPW %CS:(%RAX,%RAX,1) |
(3660) 0x4c0f10 VADDSD (%R9,%RBX,8),%XMM1,%XMM1 |
(3660) 0x4c0f16 VMOVSD %XMM1,(%R9,%RBX,8) |
(3660) 0x4c0f1c INC %R8 |
(3660) 0x4c0f1f CMP %R10,%R8 |
(3660) 0x4c0f22 JGE 4c0f7e |
(3660) 0x4c0f24 MOV -0x108(%RBP),%R11 |
(3660) 0x4c0f2b MOV (%R11,%R8,8),%R11 |
(3660) 0x4c0f2f MOV (%R14,%R11,8),%RBX |
(3660) 0x4c0f33 MOV -0x140(%RBP),%R13 |
(3660) 0x4c0f3a VMOVSD (%R13,%R8,8),%XMM1 |
(3660) 0x4c0f41 MOV -0xa0(%RBP),%R13 |
(3660) 0x4c0f48 CMP (%R13,%RDX,8),%RBX |
(3660) 0x4c0f4d JGE 4c0f10 |
(3660) 0x4c0f4f MOV -0xf0(%RBP),%R10 |
(3660) 0x4c0f56 MOV (%R10),%R10 |
(3660) 0x4c0f59 MOV %R11,(%R10,%RAX,8) |
(3660) 0x4c0f5d VMOVSD %XMM1,(%R9,%RAX,8) |
(3660) 0x4c0f63 MOV %RAX,(%R14,%R11,8) |
(3660) 0x4c0f67 INC %RAX |
(3660) 0x4c0f6a MOV -0xb0(%RBP),%R10 |
(3660) 0x4c0f71 MOV 0x8(%R10,%RDI,8),%R10 |
(3660) 0x4c0f76 INC %R8 |
(3660) 0x4c0f79 CMP %R10,%R8 |
(3660) 0x4c0f7c JL 4c0f24 |
(3658) 0x4c0f7e MOV -0xb8(%RBP),%R9 |
(3658) 0x4c0f85 MOV (%R9,%RDI,8),%R8 |
(3658) 0x4c0f89 MOV 0x8(%R9,%RDI,8),%R10 |
(3658) 0x4c0f8e CMP %R10,%R8 |
(3658) 0x4c0f91 JGE 4c100e |
(3658) 0x4c0f93 MOV -0xe0(%RBP),%R9 |
(3658) 0x4c0f9a MOV (%R9),%R9 |
(3658) 0x4c0f9d JMP 4c0fb4 |
0x4c0f9f NOP |
(3659) 0x4c0fa0 VADDSD (%R9,%RBX,8),%XMM1,%XMM1 |
(3659) 0x4c0fa6 VMOVSD %XMM1,(%R9,%RBX,8) |
(3659) 0x4c0fac INC %R8 |
(3659) 0x4c0faf CMP %R10,%R8 |
(3659) 0x4c0fb2 JGE 4c100e |
(3659) 0x4c0fb4 MOV -0x110(%RBP),%R11 |
(3659) 0x4c0fbb MOV (%R11,%R8,8),%R11 |
(3659) 0x4c0fbf MOV (%R12,%R11,8),%RBX |
(3659) 0x4c0fc3 MOV -0x148(%RBP),%R13 |
(3659) 0x4c0fca VMOVSD (%R13,%R8,8),%XMM1 |
(3659) 0x4c0fd1 MOV -0xa8(%RBP),%R13 |
(3659) 0x4c0fd8 CMP (%R13,%RDX,8),%RBX |
(3659) 0x4c0fdd JGE 4c0fa0 |
(3659) 0x4c0fdf MOV -0xf8(%RBP),%R10 |
(3659) 0x4c0fe6 MOV (%R10),%R10 |
(3659) 0x4c0fe9 MOV %R11,(%R10,%RCX,8) |
(3659) 0x4c0fed VMOVSD %XMM1,(%R9,%RCX,8) |
(3659) 0x4c0ff3 MOV %RCX,(%R12,%R11,8) |
(3659) 0x4c0ff7 INC %RCX |
(3659) 0x4c0ffa MOV -0xb8(%RBP),%R10 |
(3659) 0x4c1001 MOV 0x8(%R10,%RDI,8),%R10 |
(3659) 0x4c1006 INC %R8 |
(3659) 0x4c1009 CMP %R10,%R8 |
(3659) 0x4c100c JL 4c0fb4 |
(3658) 0x4c100e MOV -0x58(%RBP),%R10 |
(3658) 0x4c1012 MOV -0x40(%RBP),%RBX |
(3658) 0x4c1016 MOV -0x38(%RBP),%R11 |
(3658) 0x4c101a JMP 4c0d7a |
0x4c101f MOV %R14,%RDI |
0x4c1022 VZEROUPPER |
0x4c1025 CALL 4e6e50 <hypre_Free> |
0x4c102a MOV %R12,%RDI |
0x4c102d ADD $0x128,%RSP |
0x4c1034 POP %RBX |
0x4c1035 POP %R12 |
0x4c1037 POP %R13 |
0x4c1039 POP %R14 |
0x4c103b POP %R15 |
0x4c103d POP %RBP |
0x4c103e JMP 4e6e50 |
0x4c1043 NOPW %CS:(%RAX,%RAX,1) |
0x4c104d NOPL (%RAX) |
Path / |
Source file and lines | par_csr_matop.c:3454-3640 |
Module | exec |
nb instructions | 285 |
nb uops | 309 |
loop length | 1283 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 60 |
micro-operation queue | 51.50 cycles |
front end | 51.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 13.50 | 13.40 | 28.00 | 28.00 | 34.50 | 13.40 | 13.30 | 34.50 | 34.50 | 34.50 | 13.40 | 28.00 |
cycles | 13.50 | 16.00 | 28.00 | 28.00 | 34.50 | 13.40 | 13.30 | 34.50 | 34.50 | 34.50 | 13.40 | 28.00 |
Cycles executing div or sqrt instructions | 16.00 |
FE+BE cycles | 48.35-48.40 |
Stall cycles | 0.00 |
Front-end | 51.50 |
Dispatch | 34.50 |
DIV/SQRT | 16.00 |
Overall L1 | 51.50 |
all | 2% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 5% |
all | 12% |
load | 11% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 11% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x128,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,-0xe8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x128(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x100(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xb8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xb0(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x98(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xf8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x90(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x88(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x80(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x78(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x70(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x68(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x60(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x148(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x110(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x140(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x108(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x120(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x18(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 4e8aa0 <hypre_NumActiveThreads> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %RCX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R15,-0x130(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x118(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 4c04d4 <hypre_ParTMatmul.extracted+0x164> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %RCX | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 4c04e1 <hypre_ParTMatmul.extracted+0x171> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %R15D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %ECX | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV %EDX,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %EAX,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4e8ab0 <hypre_GetThreadNum> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x1(%RAX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RCX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %R15,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R12,-0x138(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,-0xd8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4c0518 <hypre_ParTMatmul.extracted+0x1a8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INC %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %RAX,%R14 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R14,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RDX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c052a <hypre_ParTMatmul.extracted+0x1ba> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
IMUL %RAX,%R14 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R14,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %R15,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x50(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x100(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4e6d80 <hypre_CAlloc> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x78(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 4e6d80 <hypre_CAlloc> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R12,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
TEST %RCX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4c0573 <hypre_ParTMatmul.extracted+0x203> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (,%RCX,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4efe80 <_intel_fast_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x78(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4c0591 <hypre_ParTMatmul.extracted+0x221> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (,%RAX,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4efe80 <_intel_fast_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP -0x68(%RBP),%RAX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV %RBX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x38(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x60(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4c08f2 <hypre_ParTMatmul.extracted+0x582> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x48(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4c05ee <hypre_ParTMatmul.extracted+0x27e> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0xc0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x736270,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 410020 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0xc0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMPQ $0,-0xd8(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JNE 4c0b50 <hypre_ParTMatmul.extracted+0x7e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x118(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x1,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0xd0(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xc8(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4c0a8c <hypre_ParTMatmul.extracted+0x71c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RDI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R11,%RAX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R10,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4c09b1 <hypre_ParTMatmul.extracted+0x641> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R10,%RAX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R11,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4c09b1 <hypre_ParTMatmul.extracted+0x641> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R10,%RDI,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R11,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JBE 4c0a5e <hypre_ParTMatmul.extracted+0x6ee> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R11,%RDI,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R10,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JBE 4c0a5e <hypre_ParTMatmul.extracted+0x6ee> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x1,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4c0a8c <hypre_ParTMatmul.extracted+0x71c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP $0x5,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4c0a1d <hypre_ParTMatmul.extracted+0x6ad> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x2,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV (%R11),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x20,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JAE 4c0a8c <hypre_ParTMatmul.extracted+0x71c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R11,%RCX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10,%RCX,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
INC %RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4c0a8c <hypre_ParTMatmul.extracted+0x71c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV (%R11),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x8(%R11,%RDI,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%R10,%RDI,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x130(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,(%RAX,%RBX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xa8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,(%RAX,%RBX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RBX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4daa30 <hypre_CSRMatrixCreate> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x128(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,(%RAX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x78(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x70(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 4daa30 <hypre_CSRMatrixCreate> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x120(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,(%RAX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%R13) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4dab10 <hypre_CSRMatrixInitialize> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x8(%R13),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xf0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%R13),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xe8(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xa8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RBX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4dab10 <hypre_CSRMatrixInitialize> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x8(%RBX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xf8(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RBX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xe0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xc0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x736290,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 410020 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x100(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4c0b79 <hypre_ParTMatmul.extracted+0x809> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4efe80 <_intel_fast_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x78(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4c0b93 <hypre_ParTMatmul.extracted+0x823> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4efe80 <_intel_fast_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0xd8(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 4c0bc9 <hypre_ParTMatmul.extracted+0x859> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xc8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%RAX,%RDX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xd0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%RCX,%RDX,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x68(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x48(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 4c0bde <hypre_ParTMatmul.extracted+0x86e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4c101f <hypre_ParTMatmul.extracted+0xcaf> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x68(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x48(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c101f <hypre_ParTMatmul.extracted+0xcaf> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c0c08 <hypre_ParTMatmul.extracted+0x898> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4e6e50 <hypre_Free> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
ADD $0x128,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
JMP 4e6e50 <hypre_Free> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | par_csr_matop.c:3454-3640 |
Module | exec |
nb instructions | 285 |
nb uops | 309 |
loop length | 1283 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 60 |
micro-operation queue | 51.50 cycles |
front end | 51.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 13.50 | 13.40 | 28.00 | 28.00 | 34.50 | 13.40 | 13.30 | 34.50 | 34.50 | 34.50 | 13.40 | 28.00 |
cycles | 13.50 | 16.00 | 28.00 | 28.00 | 34.50 | 13.40 | 13.30 | 34.50 | 34.50 | 34.50 | 13.40 | 28.00 |
Cycles executing div or sqrt instructions | 16.00 |
FE+BE cycles | 48.35-48.40 |
Stall cycles | 0.00 |
Front-end | 51.50 |
Dispatch | 34.50 |
DIV/SQRT | 16.00 |
Overall L1 | 51.50 |
all | 2% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 5% |
all | 12% |
load | 11% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 11% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x128,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,-0xe8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x128(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x100(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xb8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xb0(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x98(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xf8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x90(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x88(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x80(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x78(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x70(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x68(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x60(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x148(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x110(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x140(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x108(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x120(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x18(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 4e8aa0 <hypre_NumActiveThreads> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %RCX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R15,-0x130(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x118(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 4c04d4 <hypre_ParTMatmul.extracted+0x164> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %RCX | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 4c04e1 <hypre_ParTMatmul.extracted+0x171> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %R15D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %ECX | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV %EDX,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %EAX,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4e8ab0 <hypre_GetThreadNum> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x1(%RAX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RCX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %R15,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R12,-0x138(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,-0xd8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4c0518 <hypre_ParTMatmul.extracted+0x1a8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INC %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %RAX,%R14 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R14,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RDX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c052a <hypre_ParTMatmul.extracted+0x1ba> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
IMUL %RAX,%R14 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R14,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %R15,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x50(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x100(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4e6d80 <hypre_CAlloc> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x78(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 4e6d80 <hypre_CAlloc> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R12,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
TEST %RCX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4c0573 <hypre_ParTMatmul.extracted+0x203> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (,%RCX,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4efe80 <_intel_fast_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x78(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4c0591 <hypre_ParTMatmul.extracted+0x221> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (,%RAX,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4efe80 <_intel_fast_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP -0x68(%RBP),%RAX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV %RBX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x38(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x60(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4c08f2 <hypre_ParTMatmul.extracted+0x582> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x48(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4c05ee <hypre_ParTMatmul.extracted+0x27e> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0xc0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x736270,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 410020 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0xc0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMPQ $0,-0xd8(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JNE 4c0b50 <hypre_ParTMatmul.extracted+0x7e0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x118(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x1,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0xd0(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xc8(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4c0a8c <hypre_ParTMatmul.extracted+0x71c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RDI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R11,%RAX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R10,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4c09b1 <hypre_ParTMatmul.extracted+0x641> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R10,%RAX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R11,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4c09b1 <hypre_ParTMatmul.extracted+0x641> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R10,%RDI,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R11,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JBE 4c0a5e <hypre_ParTMatmul.extracted+0x6ee> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R11,%RDI,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R10,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JBE 4c0a5e <hypre_ParTMatmul.extracted+0x6ee> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x1,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4c0a8c <hypre_ParTMatmul.extracted+0x71c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP $0x5,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4c0a1d <hypre_ParTMatmul.extracted+0x6ad> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x2,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV (%R11),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x20,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JAE 4c0a8c <hypre_ParTMatmul.extracted+0x71c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R11,%RCX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10,%RCX,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
INC %RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4c0a8c <hypre_ParTMatmul.extracted+0x71c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV (%R11),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x8(%R11,%RDI,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%R10,%RDI,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x130(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,(%RAX,%RBX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xa8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,(%RAX,%RBX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RBX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4daa30 <hypre_CSRMatrixCreate> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x128(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,(%RAX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x78(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x70(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 4daa30 <hypre_CSRMatrixCreate> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x120(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,(%RAX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%R13) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4dab10 <hypre_CSRMatrixInitialize> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x8(%R13),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xf0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%R13),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xe8(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xa8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RBX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4dab10 <hypre_CSRMatrixInitialize> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x8(%RBX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xf8(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RBX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xe0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xc0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x736290,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 410020 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x100(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4c0b79 <hypre_ParTMatmul.extracted+0x809> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4efe80 <_intel_fast_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x78(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4c0b93 <hypre_ParTMatmul.extracted+0x823> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4efe80 <_intel_fast_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0xd8(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 4c0bc9 <hypre_ParTMatmul.extracted+0x859> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xc8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%RAX,%RDX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xd0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x8(%RCX,%RDX,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x68(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x48(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 4c0bde <hypre_ParTMatmul.extracted+0x86e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4c101f <hypre_ParTMatmul.extracted+0xcaf> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x68(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x48(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c101f <hypre_ParTMatmul.extracted+0xcaf> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c0c08 <hypre_ParTMatmul.extracted+0x898> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4e6e50 <hypre_Free> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
ADD $0x128,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
JMP 4e6e50 <hypre_Free> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_ParTMatmul.extracted– | 0.06 | 0.01 |
○Loop 3668 - par_csr_matop.c:3537-3540 - exec | 0 | 0 |
○Loop 3667 - par_csr_matop.c:3537-3540 - exec | 0 | 0 |
▼Loop 3657 - par_csr_matop.c:3467-3634 - exec– | 0 | 0 |
○Loop 3664 - par_csr_matop.c:3590-3596 - exec | 0.01 | 0.01 |
○Loop 3656 - par_csr_matop.c:3598-3604 - exec | 0 | 0 |
▼Loop 3658 - par_csr_matop.c:3467-3634 - exec– | 0 | 0 |
○Loop 3662 - par_csr_matop.c:3505-3608 - exec | 0.02 | 0.01 |
○Loop 3661 - par_csr_matop.c:3607-3608 - exec | 0 | 0 |
○Loop 3663 - par_csr_matop.c:3607-3608 - exec | 0 | 0 |
○Loop 3659 - par_csr_matop.c:3623-3634 - exec | 0 | 0 |
○Loop 3660 - par_csr_matop.c:3610-3621 - exec | 0 | 0 |
○Loop 3666 - par_csr_matop.c:3537-3540 - exec | 0 | 0 |
○Loop 3665 - par_csr_matop.c:3537-3540 - exec | 0 | 0 |
▼Loop 3670 - par_csr_matop.c:3467-3528 - exec– | 0 | 0 |
○Loop 3669 - par_csr_matop.c:3497-3501 - exec | 0 | 0 |
▼Loop 3671 - par_csr_matop.c:3467-3522 - exec– | 0 | 0 |
○Loop 3675 - par_csr_matop.c:3504-3505 - exec | 0.02 | 0.01 |
○Loop 3673 - par_csr_matop.c:3507-3513 - exec | 0 | 0 |
○Loop 3672 - par_csr_matop.c:3516-3522 - exec | 0 | 0 |
○Loop 3676 - par_csr_matop.c:3504-3505 - exec | 0 | 0 |
○Loop 3674 - par_csr_matop.c:3504-3505 - exec | 0 | 0 |
○Loop 3677 - par_csr_matop.c:3491-3495 - exec | 0 | 0.01 |