Function: hypre_IJMatrixSetValuesOMPParCSR.extracted.28 | Module: libIJ_mv.so | Source: IJMatrix_parcsr.c:3240-3484 [...] | Coverage: 0.81% |
---|
Function: hypre_IJMatrixSetValuesOMPParCSR.extracted.28 | Module: libIJ_mv.so | Source: IJMatrix_parcsr.c:3240-3484 [...] | Coverage: 0.81% |
---|
/home/eoseret/qaas_runs_CPU_9468/171-147-2675/intel/AMG/build/AMG/AMG/IJ_mv/IJMatrix_parcsr.c: 3240 - 3484 |
-------------------------------------------------------------------------------- |
3240: #pragma omp parallel |
[...] |
3256: num_threads = hypre_NumActiveThreads(); |
3257: my_thread_num = hypre_GetThreadNum(); |
3258: |
3259: len = nrows/num_threads; |
3260: rest = nrows - len*num_threads; |
3261: |
3262: if (my_thread_num < rest) |
3263: { |
3264: ns = my_thread_num*(len+1); |
3265: ne = (my_thread_num+1)*(len+1); |
3266: } |
3267: else |
3268: { |
3269: ns = my_thread_num*len+rest; |
3270: ne = (my_thread_num+1)*len+rest; |
3271: } |
3272: |
3273: value_start[my_thread_num] = 0; |
3274: for (ii=ns; ii < ne; ii++) |
3275: value_start[my_thread_num] += ncols[ii]; |
3276: |
3277: #ifdef HYPRE_USING_OPENMP |
3278: #pragma omp barrier |
3279: #endif |
3280: if (my_thread_num == 0) |
3281: { |
3282: for (i=0; i < max_num_threads; i++) |
3283: value_start[i+1] += value_start[i]; |
[...] |
3289: if (my_thread_num) |
3290: indx = value_start[my_thread_num-1]; |
3291: for (ii=ns; ii < ne; ii++) |
3292: { |
3293: row = rows[ii]; |
3294: n = ncols[ii]; |
3295: /* processor owns the row */ |
3296: if (row >= row_partitioning[pstart] && row < row_partitioning[pstart+1]) |
3297: { |
3298: row_local = row - row_partitioning[pstart]; |
3299: /* compute local row number */ |
3300: if (need_aux) |
3301: { |
3302: local_j = aux_j[row_local]; |
3303: local_data = aux_data[row_local]; |
3304: space = row_space[row_local]; |
3305: old_size = row_length[row_local]; |
3306: size = space - old_size; |
3307: if (size < n) |
3308: { |
3309: size = n - size; |
3310: tmp_j = hypre_CTAlloc(HYPRE_Int,size); |
3311: tmp_data = hypre_CTAlloc(HYPRE_Complex,size); |
3312: } |
3313: tmp_indx = 0; |
3314: not_found = 1; |
3315: size = old_size; |
3316: for (i=0; i < n; i++) |
3317: { |
3318: for (j=0; j < old_size; j++) |
3319: { |
3320: if (local_j[j] == cols[indx]) |
3321: { |
3322: local_data[j] = values[indx]; |
[...] |
3329: if (size < space) |
3330: { |
3331: local_j[size] = cols[indx]; |
3332: local_data[size++] = values[indx]; |
3333: } |
3334: else |
3335: { |
3336: tmp_j[tmp_indx] = cols[indx]; |
3337: tmp_data[tmp_indx++] = values[indx]; |
[...] |
3344: row_length[row_local] = size+tmp_indx; |
3345: |
3346: if (tmp_indx) |
3347: { |
3348: aux_j[row_local] = hypre_TReAlloc(aux_j[row_local],HYPRE_Int, |
3349: size+tmp_indx); |
3350: aux_data[row_local] = hypre_TReAlloc(aux_data[row_local], |
3351: HYPRE_Complex,size+tmp_indx); |
3352: row_space[row_local] = size+tmp_indx; |
3353: local_j = aux_j[row_local]; |
[...] |
3359: for (i=0; i < tmp_indx; i++) |
3360: { |
3361: local_j[cnt] = tmp_j[i]; |
3362: local_data[cnt++] = tmp_data[i]; |
3363: } |
3364: |
3365: if (tmp_j) |
3366: { |
3367: hypre_TFree(tmp_j); |
3368: hypre_TFree(tmp_data); |
[...] |
3376: offd_indx = hypre_AuxParCSRMatrixIndxOffd(aux_matrix)[row_local]; |
3377: diag_indx = hypre_AuxParCSRMatrixIndxDiag(aux_matrix)[row_local]; |
3378: cnt_diag = diag_indx; |
3379: cnt_offd = offd_indx; |
3380: diag_space = diag_i[row_local+1]; |
3381: offd_space = offd_i[row_local+1]; |
3382: not_found = 1; |
3383: for (i=0; i < n; i++) |
3384: { |
3385: if (cols[indx] < col_0 || cols[indx] > col_n) |
3386: /* insert into offd */ |
3387: { |
3388: for (j=offd_i[row_local]; j < offd_indx; j++) |
3389: { |
3390: if (offd_j[j] == cols[indx]) |
3391: { |
3392: offd_data[j] = values[indx]; |
[...] |
3399: if (cnt_offd < offd_space) |
3400: { |
3401: offd_j[cnt_offd] = cols[indx]; |
3402: offd_data[cnt_offd++] = values[indx]; |
3403: } |
3404: else |
3405: { |
3406: hypre_error(HYPRE_ERROR_GENERIC); |
3407: #ifdef HYPRE_USING_OPENMP |
3408: #pragma omp atomic |
3409: #endif |
3410: error_flag++; |
3411: if (print_level) |
3412: hypre_printf("Error in row %d ! Too many elements!\n", |
[...] |
3422: for (j=diag_i[row_local]; j < diag_indx; j++) |
3423: { |
3424: if (diag_j[j] == cols[indx]) |
3425: { |
3426: diag_data[j] = values[indx]; |
[...] |
3433: if (cnt_diag < diag_space) |
3434: { |
3435: diag_j[cnt_diag] = cols[indx]; |
3436: diag_data[cnt_diag++] = values[indx]; |
3437: } |
3438: else |
3439: { |
3440: hypre_error(HYPRE_ERROR_GENERIC); |
3441: #ifdef HYPRE_USING_OPENMP |
3442: #pragma omp atomic |
3443: #endif |
3444: error_flag++; |
3445: if (print_level) |
3446: hypre_printf("Error in row %d ! Too many elements !\n", |
[...] |
3454: indx++; |
3455: } |
3456: |
3457: hypre_AuxParCSRMatrixIndxDiag(aux_matrix)[row_local] = cnt_diag; |
3458: hypre_AuxParCSRMatrixIndxOffd(aux_matrix)[row_local] = cnt_offd; |
[...] |
3466: indx += n; |
3467: if (aux_matrix) |
3468: { |
3469: col_indx = 0; |
3470: for (i=0; i < off_proc_i_indx; i=i+2) |
3471: { |
3472: row_len = off_proc_i[i+1]; |
3473: if (off_proc_i[i] == row) |
3474: { |
3475: for (j=0; j < n; j++) |
3476: { |
3477: cnt1 = col_indx; |
3478: for (k=0; k < row_len; k++) |
3479: { |
3480: if (off_proc_j[cnt1] == cols[j]) |
3481: { |
3482: off_proc_j[cnt1++] = -1; |
3483: /*cancel_indx++;*/ |
3484: offproc_cnt[my_thread_num]++; |
0xe510 PUSH %RBP |
0xe511 MOV %RSP,%RBP |
0xe514 PUSH %R15 |
0xe516 PUSH %R14 |
0xe518 PUSH %R13 |
0xe51a PUSH %R12 |
0xe51c PUSH %RBX |
0xe51d SUB $0x88,%RSP |
0xe524 MOV %R9,%RBX |
0xe527 MOV %R8,-0xa0(%RBP) |
0xe52e MOV %RCX,-0x38(%RBP) |
0xe532 MOV %RDX,%R15 |
0xe535 MOV %RDI,%R14 |
0xe538 CALL 3300 <hypre_NumActiveThreads@plt> |
0xe53d MOV %RAX,%R13 |
0xe540 CALL 30c0 <hypre_GetThreadNum@plt> |
0xe545 MOV %RAX,%R12 |
0xe548 MOV %R13,%RAX |
0xe54b OR %R15,%RAX |
0xe54e SHR $0x20,%RAX |
0xe552 JE e55e |
0xe554 MOV %R15,%RAX |
0xe557 CQTO |
0xe559 IDIV %R13 |
0xe55c JMP e566 |
0xe55e MOV %R15D,%EAX |
0xe561 XOR %EDX,%EDX |
0xe563 DIV %R13D |
0xe566 MOV -0x38(%RBP),%R8 |
0xe56a MOV 0xb8(%RBP),%R15 |
0xe571 LEA 0x1(%R12),%RCX |
0xe576 CMP %RDX,%R12 |
0xe579 JGE e58c |
0xe57b LEA 0x1(%RAX),%RDI |
0xe57f MOV %RDI,%RSI |
0xe582 IMUL %R12,%RSI |
0xe586 IMUL %RCX,%RDI |
0xe58a JMP e5a0 |
0xe58c MOV %RAX,%RSI |
0xe58f IMUL %R12,%RSI |
0xe593 ADD %RDX,%RSI |
0xe596 IMUL %RAX,%RCX |
0xe59a ADD %RDX,%RCX |
0xe59d MOV %RCX,%RDI |
0xe5a0 MOVQ $0,(%R15,%R12,8) |
0xe5a8 MOV %RSI,%R13 |
0xe5ab CMP %RDI,%RSI |
0xe5ae MOV %RDI,-0x30(%RBP) |
0xe5b2 JGE e68f |
0xe5b8 LEA (%R15,%R12,8),%RCX |
0xe5bc LEA -0x8(%R8,%RDI,8),%RDI |
0xe5c1 CMP %RDX,%R12 |
0xe5c4 CMOVL %R12,%RDX |
0xe5c8 IMUL %R12,%RAX |
0xe5cc LEA (%RDX,%RAX,1),%RSI |
0xe5d0 CMP %RCX,%RDI |
0xe5d3 JB e604 |
0xe5d5 LEA (%R8,%RSI,8),%RDI |
0xe5d9 CMP %RDI,%RCX |
0xe5dc JB e604 |
0xe5de XOR %EAX,%EAX |
0xe5e0 MOV %R13,%RDX |
0xe5e3 MOV -0x30(%RBP),%RSI |
0xe5e7 NOPW (%RAX,%RAX,1) |
(217) 0xe5f0 ADD (%R8,%RDX,8),%RAX |
(217) 0xe5f4 MOV %RAX,(%RCX) |
(217) 0xe5f7 INC %RDX |
(217) 0xe5fa CMP %RDX,%RSI |
(217) 0xe5fd JNE e5f0 |
0xe5ff JMP e68f |
0xe604 MOV -0x30(%RBP),%R8 |
0xe608 SUB %RSI,%R8 |
0xe60b MOV %R8,%RSI |
0xe60e AND $-0x4,%RSI |
0xe612 JE e666 |
0xe614 LEA -0x1(%RSI),%RDI |
0xe618 MOV -0x38(%RBP),%R9 |
0xe61c LEA (%R9,%R13,8),%R9 |
0xe620 VPXOR %XMM0,%XMM0,%XMM0 |
0xe624 XOR %R10D,%R10D |
0xe627 NOPW (%RAX,%RAX,1) |
(216) 0xe630 VPADDQ (%R9,%R10,8),%YMM0,%YMM0 |
(216) 0xe636 ADD $0x4,%R10 |
(216) 0xe63a CMP %RDI,%R10 |
(216) 0xe63d JBE e630 |
0xe63f VEXTRACTI128 $0x1,%YMM0,%XMM1 |
0xe645 VPADDQ %XMM1,%XMM0,%XMM0 |
0xe649 VPSHUFD $-0x12,%XMM0,%XMM1 |
0xe64e VPADDQ %XMM1,%XMM0,%XMM0 |
0xe652 VMOVQ %XMM0,%RDI |
0xe657 CMP %RSI,%R8 |
0xe65a MOV -0x38(%RBP),%R8 |
0xe65e MOV -0x30(%RBP),%R9 |
0xe662 JNE e672 |
0xe664 JMP e68c |
0xe666 XOR %ESI,%ESI |
0xe668 XOR %EDI,%EDI |
0xe66a MOV -0x38(%RBP),%R8 |
0xe66e MOV -0x30(%RBP),%R9 |
0xe672 ADD %RDX,%RSI |
0xe675 ADD %RAX,%RSI |
0xe678 NOPL (%RAX,%RAX,1) |
(215) 0xe680 ADD (%R8,%RSI,8),%RDI |
(215) 0xe684 INC %RSI |
(215) 0xe687 CMP %RSI,%R9 |
(215) 0xe68a JNE e680 |
0xe68c MOV %RDI,(%RCX) |
0xe68f MOV (%R14),%ESI |
0xe692 LEA 0xabf7(%RIP),%RDI |
0xe699 VZEROUPPER |
0xe69c CALL 3390 <__kmpc_barrier@plt> |
0xe6a1 TEST %R12,%R12 |
0xe6a4 JNE e744 |
0xe6aa MOV 0xc8(%RBP),%RAX |
0xe6b1 TEST %RAX,%RAX |
0xe6b4 JLE e744 |
0xe6ba MOV (%R15),%RCX |
0xe6bd CMP $0x8,%RAX |
0xe6c1 JB e717 |
0xe6c3 MOV %RAX,%RDX |
0xe6c6 SHR $0x3,%RDX |
0xe6ca LEA 0x40(%R15),%RSI |
0xe6ce XCHG %AX,%AX |
(214) 0xe6d0 ADD -0x38(%RSI),%RCX |
(214) 0xe6d4 MOV %RCX,-0x38(%RSI) |
(214) 0xe6d8 ADD -0x30(%RSI),%RCX |
(214) 0xe6dc MOV %RCX,-0x30(%RSI) |
(214) 0xe6e0 ADD -0x28(%RSI),%RCX |
(214) 0xe6e4 MOV %RCX,-0x28(%RSI) |
(214) 0xe6e8 ADD -0x20(%RSI),%RCX |
(214) 0xe6ec MOV %RCX,-0x20(%RSI) |
(214) 0xe6f0 ADD -0x18(%RSI),%RCX |
(214) 0xe6f4 MOV %RCX,-0x18(%RSI) |
(214) 0xe6f8 ADD -0x10(%RSI),%RCX |
(214) 0xe6fc MOV %RCX,-0x10(%RSI) |
(214) 0xe700 ADD -0x8(%RSI),%RCX |
(214) 0xe704 MOV %RCX,-0x8(%RSI) |
(214) 0xe708 ADD (%RSI),%RCX |
(214) 0xe70b MOV %RCX,(%RSI) |
(214) 0xe70e ADD $0x40,%RSI |
(214) 0xe712 DEC %RDX |
(214) 0xe715 JNE e6d0 |
0xe717 MOV %RAX,%RDX |
0xe71a AND $-0x8,%RDX |
0xe71e CMP %RAX,%RDX |
0xe721 JAE e744 |
0xe723 NOPW %CS:(%RAX,%RAX,1) |
(213) 0xe730 LEA (%R15,%RDX,8),%RSI |
(213) 0xe734 INC %RDX |
(213) 0xe737 ADD 0x8(%RSI),%RCX |
(213) 0xe73b MOV %RCX,0x8(%RSI) |
(213) 0xe73f CMP %RDX,%RAX |
(213) 0xe742 JNE e730 |
0xe744 MOV (%R14),%ESI |
0xe747 LEA 0xab62(%RIP),%RDI |
0xe74e CALL 3390 <__kmpc_barrier@plt> |
0xe753 TEST %R12,%R12 |
0xe756 JE e763 |
0xe758 MOV -0x8(%R15,%R12,8),%RAX |
0xe75d MOV %RAX,-0x40(%RBP) |
0xe761 JMP e76b |
0xe763 MOVQ $0,-0x40(%RBP) |
0xe76b MOV -0x38(%RBP),%RDX |
0xe76f MOV %R13,%RSI |
0xe772 MOV -0x30(%RBP),%RDI |
0xe776 CMP %RDI,%R13 |
0xe779 JGE f320 |
0xe77f MOV 0xb0(%RBP),%RAX |
0xe786 MOV 0xa8(%RBP),%RCX |
0xe78d MOV 0x98(%RBP),%R8 |
0xe794 LEA (%RAX,%R12,8),%R15 |
0xe798 MOV 0x20(%RBP),%RAX |
0xe79c ADD $0x18,%RCX |
0xe7a0 MOV %RCX,-0xa8(%RBP) |
0xe7a7 MOV %RAX,%RCX |
0xe7aa MOVQ $0,-0x70(%RBP) |
0xe7b2 JMP e815 |
(192) 0xe7b4 SAL $0x3,%R14 |
(192) 0xe7b8 MOV %R11,%RSI |
(192) 0xe7bb MOV %R14,%RDX |
(192) 0xe7be CALL 3350 <__intel_avx_rep_memcpy@plt> |
(192) 0xe7c3 MOV %R12,%RDI |
(192) 0xe7c6 MOV -0x70(%RBP),%RSI |
(192) 0xe7ca MOV %R14,%RDX |
(192) 0xe7cd CALL 3350 <__intel_avx_rep_memcpy@plt> |
(192) 0xe7d2 MOV -0x68(%RBP),%R11 |
(192) 0xe7d6 MOV %R11,%RDI |
(192) 0xe7d9 VZEROUPPER |
(192) 0xe7dc CALL 31c0 <hypre_Free@plt> |
(192) 0xe7e1 MOV -0x70(%RBP),%RDI |
(192) 0xe7e5 CALL 31c0 <hypre_Free@plt> |
(192) 0xe7ea MOVQ $0,-0x70(%RBP) |
(192) 0xe7f2 MOV -0x38(%RBP),%RDX |
(192) 0xe7f6 MOV -0x48(%RBP),%RSI |
(192) 0xe7fa MOV -0x30(%RBP),%RDI |
(192) 0xe7fe MOV 0x98(%RBP),%R8 |
(192) 0xe805 MOV 0x20(%RBP),%RCX |
(192) 0xe809 INC %RSI |
(192) 0xe80c CMP %RDI,%RSI |
(192) 0xe80f JGE f320 |
(192) 0xe815 MOV -0xa0(%RBP),%RAX |
(192) 0xe81c MOV (%RAX,%RSI,8),%R10 |
(192) 0xe820 MOV (%RDX,%RSI,8),%R14 |
(192) 0xe824 MOV %R10,-0x80(%RBP) |
(192) 0xe828 SUB (%RCX),%R10 |
(192) 0xe82b JL e8c0 |
(192) 0xe831 MOV -0x80(%RBP),%RAX |
(192) 0xe835 CMP 0x8(%RCX),%RAX |
(192) 0xe839 JGE e8c0 |
(192) 0xe83f CMPQ $0,0x58(%RBP) |
(192) 0xe844 MOV %R10,-0x50(%RBP) |
(192) 0xe848 JE eaef |
(192) 0xe84e MOV 0x38(%RBP),%RAX |
(192) 0xe852 MOV (%RAX,%R10,8),%R12 |
(192) 0xe856 MOV 0x40(%RBP),%RAX |
(192) 0xe85a MOV (%RAX,%R10,8),%RAX |
(192) 0xe85e MOV %RAX,-0x58(%RBP) |
(192) 0xe862 MOV 0x50(%RBP),%RAX |
(192) 0xe866 MOV (%RAX,%R10,8),%RCX |
(192) 0xe86a MOV 0x48(%RBP),%RAX |
(192) 0xe86e MOV (%RAX,%R10,8),%R13 |
(192) 0xe872 MOV %RCX,-0x88(%RBP) |
(192) 0xe879 MOV %RCX,%RAX |
(192) 0xe87c SUB %R13,%RAX |
(192) 0xe87f MOV %R14,-0x78(%RBP) |
(192) 0xe883 SUB %RAX,%R14 |
(192) 0xe886 MOV %RSI,-0x48(%RBP) |
(192) 0xe88a JLE eb5d |
(192) 0xe890 MOV $0x8,%ESI |
(192) 0xe895 MOV %R14,%RDI |
(192) 0xe898 VZEROUPPER |
(192) 0xe89b CALL 3360 <hypre_CAlloc@plt> |
(192) 0xe8a0 MOV %RAX,-0x68(%RBP) |
(192) 0xe8a4 MOV $0x8,%ESI |
(192) 0xe8a9 MOV %R14,%RDI |
(192) 0xe8ac CALL 3360 <hypre_CAlloc@plt> |
(192) 0xe8b1 MOV -0x68(%RBP),%R11 |
(192) 0xe8b5 MOV %RAX,-0x70(%RBP) |
(192) 0xe8b9 JMP eb60 |
0xe8be XCHG %AX,%AX |
(192) 0xe8c0 MOV -0x40(%RBP),%RAX |
(192) 0xe8c4 ADD %R14,%RAX |
(192) 0xe8c7 MOV 0x18(%RBP),%R9 |
(192) 0xe8cb CMPQ $0,(%R9) |
(192) 0xe8cf MOV %RAX,-0x40(%RBP) |
(192) 0xe8d3 JE e809 |
(192) 0xe8d9 TEST %R8,%R8 |
(192) 0xe8dc JLE e809 |
(192) 0xe8e2 MOV %RSI,-0x48(%RBP) |
(192) 0xe8e6 LEA -0x1(%R8),%RAX |
(192) 0xe8ea SHR $0x1,%RAX |
(192) 0xe8ed MOV %RAX,-0x60(%RBP) |
(192) 0xe8f1 LEA -0x1(%R14),%RCX |
(192) 0xe8f5 MOV %R14,-0x78(%RBP) |
(192) 0xe8f9 LEA -0x8(%RBX,%R14,8),%RAX |
(192) 0xe8fe MOV %RAX,-0x88(%RBP) |
(192) 0xe905 XOR %EDI,%EDI |
(192) 0xe907 XOR %ESI,%ESI |
(192) 0xe909 JMP e921 |
0xe90b NOPL (%RAX,%RAX,1) |
(193) 0xe910 LEA 0x1(%RSI),%RAX |
(193) 0xe914 CMP -0x60(%RBP),%RSI |
(193) 0xe918 MOV %RAX,%RSI |
(193) 0xe91b JE e7f2 |
(193) 0xe921 MOV %RDI,%R10 |
(193) 0xe924 MOV %RSI,%RAX |
(193) 0xe927 SAL $0x4,%RAX |
(193) 0xe92b MOV 0xa0(%RBP),%RDX |
(193) 0xe932 MOV 0x8(%RDX,%RAX,1),%R8 |
(193) 0xe937 ADD %R8,%RDI |
(193) 0xe93a MOV -0x80(%RBP),%R9 |
(193) 0xe93e CMP %R9,(%RDX,%RAX,1) |
(193) 0xe942 JNE e910 |
(193) 0xe944 CMPQ $0,-0x78(%RBP) |
(193) 0xe949 JLE e910 |
(193) 0xe94b MOV 0xa8(%RBP),%RDX |
(193) 0xe952 LEA -0x8(%RDX,%RDI,8),%RAX |
(193) 0xe957 CMP %R15,%RAX |
(193) 0xe95a SETAE %R12B |
(193) 0xe95e LEA (%RDX,%R10,8),%R9 |
(193) 0xe962 CMP %R9,%R15 |
(193) 0xe965 SETAE %R13B |
(193) 0xe969 CMP %RBX,%RAX |
(193) 0xe96c SETB %DL |
(193) 0xe96f MOV -0x88(%RBP),%RAX |
(193) 0xe976 CMP %R9,%RAX |
(193) 0xe979 SETB %R14B |
(193) 0xe97d CMP %R15,%RAX |
(193) 0xe980 SETB %AL |
(193) 0xe983 CMP %RBX,%R15 |
(193) 0xe986 SETB %R11B |
(193) 0xe98a TEST %R13B,%R12B |
(193) 0xe98d JNE eaa0 |
(193) 0xe993 OR %R14B,%DL |
(193) 0xe996 JE eaa0 |
(193) 0xe99c OR %R11B,%AL |
(193) 0xe99f JE eaa0 |
(193) 0xe9a5 MOV -0xa8(%RBP),%RAX |
(193) 0xe9ac LEA (%RAX,%R10,8),%RAX |
(193) 0xe9b0 MOV %R8,%RDX |
(193) 0xe9b3 SHR $0x2,%RDX |
(193) 0xe9b7 MOV %R8,%R14 |
(193) 0xe9ba AND $-0x4,%R14 |
(193) 0xe9be XOR %R13D,%R13D |
(193) 0xe9c1 JMP e9e0 |
0xe9c3 NOPW %CS:(%RAX,%RAX,1) |
(196) 0xe9d0 LEA 0x1(%R13),%R10 |
(196) 0xe9d4 CMP %RCX,%R13 |
(196) 0xe9d7 MOV %R10,%R13 |
(196) 0xe9da JE e910 |
(196) 0xe9e0 TEST %R8,%R8 |
(196) 0xe9e3 JLE e9d0 |
(196) 0xe9e5 MOV (%RBX,%R13,8),%R12 |
(196) 0xe9e9 CMP $0x4,%R8 |
(196) 0xe9ed JAE ea20 |
(196) 0xe9ef CMP %R8,%R14 |
(196) 0xe9f2 JAE e9d0 |
(196) 0xe9f4 MOV %R14,%R10 |
(196) 0xe9f7 JMP ea08 |
0xe9f9 NOPL (%RAX) |
(197) 0xea00 INC %R10 |
(197) 0xea03 CMP %R10,%R8 |
(197) 0xea06 JE e9d0 |
(197) 0xea08 CMP %R12,(%R9,%R10,8) |
(197) 0xea0c JNE ea00 |
(197) 0xea0e MOVQ $-0x1,(%R9,%R10,8) |
(197) 0xea16 INCQ (%R15) |
(197) 0xea19 JMP ea00 |
0xea1b NOPL (%RAX,%RAX,1) |
(196) 0xea20 MOV %RDX,%R11 |
(196) 0xea23 MOV %RAX,%R10 |
(196) 0xea26 JMP ea39 |
0xea28 NOPL (%RAX,%RAX,1) |
(198) 0xea30 ADD $0x20,%R10 |
(198) 0xea34 DEC %R11 |
(198) 0xea37 JE e9ef |
(198) 0xea39 CMP %R12,-0x18(%R10) |
(198) 0xea3d JNE ea70 |
(198) 0xea3f MOVQ $-0x1,-0x18(%R10) |
(198) 0xea47 INCQ (%R15) |
(198) 0xea4a CMP %R12,-0x10(%R10) |
(198) 0xea4e JE ea76 |
(198) 0xea50 CMP %R12,-0x8(%R10) |
(198) 0xea54 JNE ea87 |
(198) 0xea56 MOVQ $-0x1,-0x8(%R10) |
(198) 0xea5e INCQ (%R15) |
(198) 0xea61 CMP %R12,(%R10) |
(198) 0xea64 JNE ea30 |
(198) 0xea66 JMP ea8c |
0xea68 NOPL (%RAX,%RAX,1) |
(198) 0xea70 CMP %R12,-0x10(%R10) |
(198) 0xea74 JNE ea50 |
(198) 0xea76 MOVQ $-0x1,-0x10(%R10) |
(198) 0xea7e INCQ (%R15) |
(198) 0xea81 CMP %R12,-0x8(%R10) |
(198) 0xea85 JE ea56 |
(198) 0xea87 CMP %R12,(%R10) |
(198) 0xea8a JNE ea30 |
(198) 0xea8c MOVQ $-0x1,(%R10) |
(198) 0xea93 INCQ (%R15) |
(198) 0xea96 JMP ea30 |
0xea98 NOPL (%RAX,%RAX,1) |
(193) 0xeaa0 XOR %EAX,%EAX |
(193) 0xeaa2 JMP eac0 |
0xeaa4 NOPW %CS:(%RAX,%RAX,1) |
(194) 0xeab0 LEA 0x1(%RAX),%RDX |
(194) 0xeab4 CMP %RCX,%RAX |
(194) 0xeab7 MOV %RDX,%RAX |
(194) 0xeaba JE e910 |
(194) 0xeac0 TEST %R8,%R8 |
(194) 0xeac3 JLE eab0 |
(194) 0xeac5 XOR %EDX,%EDX |
(194) 0xeac7 JMP ead8 |
0xeac9 NOPL (%RAX) |
(195) 0xead0 INC %RDX |
(195) 0xead3 CMP %RDX,%R8 |
(195) 0xead6 JE eab0 |
(195) 0xead8 MOV (%R9,%RDX,8),%R10 |
(195) 0xeadc CMP (%RBX,%RAX,8),%R10 |
(195) 0xeae0 JNE ead0 |
(195) 0xeae2 MOVQ $-0x1,(%R9,%RDX,8) |
(195) 0xeaea INCQ (%R15) |
(195) 0xeaed JMP ead0 |
(192) 0xeaef MOV 0x18(%RBP),%RAX |
(192) 0xeaf3 MOV (%RAX),%RAX |
(192) 0xeaf6 MOV 0x38(%RAX),%RCX |
(192) 0xeafa MOV 0x40(%RAX),%RAX |
(192) 0xeafe MOV (%RAX,%R10,8),%R9 |
(192) 0xeb02 MOV (%RCX,%R10,8),%RCX |
(192) 0xeb06 TEST %R14,%R14 |
(192) 0xeb09 JLE ee97 |
(192) 0xeb0f MOV %RSI,-0x48(%RBP) |
(192) 0xeb13 MOV 0x60(%RBP),%RAX |
(192) 0xeb17 MOV 0x8(%RAX,%R10,8),%RAX |
(192) 0xeb1c MOV %RAX,-0x68(%RBP) |
(192) 0xeb20 MOV 0x78(%RBP),%RAX |
(192) 0xeb24 MOV 0x8(%RAX,%R10,8),%RAX |
(192) 0xeb29 MOV %RAX,-0x90(%RBP) |
(192) 0xeb30 MOV -0x40(%RBP),%RAX |
(192) 0xeb34 MOV %R14,-0x78(%RBP) |
(192) 0xeb38 LEA (%RAX,%R14,1),%RDX |
(192) 0xeb3c MOV %RDX,-0x98(%RBP) |
(192) 0xeb43 XOR %R8D,%R8D |
(192) 0xeb46 MOV %R9,-0x60(%RBP) |
(192) 0xeb4a MOV %R9,-0x58(%RBP) |
(192) 0xeb4e MOV %RCX,-0x88(%RBP) |
(192) 0xeb55 MOV %RCX,%R14 |
(192) 0xeb58 JMP eef6 |
(192) 0xeb5d XOR %R11D,%R11D |
(192) 0xeb60 MOV -0x78(%RBP),%RAX |
(192) 0xeb64 TEST %RAX,%RAX |
(192) 0xeb67 JLE ee7d |
(192) 0xeb6d DEC %RAX |
(192) 0xeb70 MOV %RAX,-0x80(%RBP) |
(192) 0xeb74 MOV %R12D,%EAX |
(192) 0xeb77 AND $0x7f,%EAX |
(192) 0xeb7a MOV $0x80,%ECX |
(192) 0xeb7f SUB %EAX,%ECX |
(192) 0xeb81 SHR $0x3,%ECX |
(192) 0xeb84 CMP %RCX,%R13 |
(192) 0xeb87 CMOVB %R13,%RCX |
(192) 0xeb8b LEA (%R12,%RCX,8),%RDX |
(192) 0xeb8f MOV %R13,%RAX |
(192) 0xeb92 SUB %RCX,%RAX |
(192) 0xeb95 AND $-0x10,%RAX |
(192) 0xeb99 ADD %RCX,%RAX |
(192) 0xeb9c MOV %RAX,-0x90(%RBP) |
(192) 0xeba3 MOV %R13,%R14 |
(192) 0xeba6 MOVQ $0,-0x60(%RBP) |
(192) 0xebae XOR %EDI,%EDI |
(192) 0xebb0 MOV %R11,-0x68(%RBP) |
(192) 0xebb4 JMP ebf3 |
0xebb6 NOPW %CS:(%RAX,%RAX,1) |
(209) 0xebc0 MOV -0x60(%RBP),%R8 |
(209) 0xebc4 MOV %RSI,(%R11,%R8,8) |
(209) 0xebc8 MOV 0x10(%RBP),%RSI |
(209) 0xebcc VMOVQ (%RSI,%RAX,8),%XMM0 |
(209) 0xebd1 MOV -0x70(%RBP),%RAX |
(209) 0xebd5 VMOVQ %XMM0,(%RAX,%R8,8) |
(209) 0xebdb INC %R8 |
(209) 0xebde MOV %R8,-0x60(%RBP) |
(209) 0xebe2 LEA 0x1(%RDI),%RAX |
(209) 0xebe6 CMP -0x80(%RBP),%RDI |
(209) 0xebea MOV %RAX,%RDI |
(209) 0xebed JE ed4a |
(209) 0xebf3 TEST %R13,%R13 |
(209) 0xebf6 JLE ecd0 |
(209) 0xebfc MOV -0x40(%RBP),%RAX |
(209) 0xec00 LEA (%RAX,%RDI,1),%R8 |
(209) 0xec04 MOV (%RBX,%R8,8),%R9 |
(209) 0xec08 MOV %R12D,%EAX |
(209) 0xec0b AND $0x7f,%EAX |
(209) 0xec0e MOV $0x80,%ESI |
(209) 0xec13 SUB %EAX,%ESI |
(209) 0xec15 SHR $0x3,%ESI |
(209) 0xec18 CMP %RSI,%R13 |
(209) 0xec1b MOV %RSI,%RAX |
(209) 0xec1e CMOVB %R13,%RAX |
(209) 0xec22 TEST %RAX,%RAX |
(209) 0xec25 JE ec42 |
(209) 0xec27 XOR %R10D,%R10D |
(209) 0xec2a NOPW (%RAX,%RAX,1) |
(212) 0xec30 CMP %R9,(%R12,%R10,8) |
(212) 0xec34 JE ed31 |
(212) 0xec3a INC %R10 |
(212) 0xec3d CMP %R10,%RCX |
(212) 0xec40 JNE ec30 |
(209) 0xec42 CMP %RSI,%R13 |
(209) 0xec45 JBE ecd0 |
(209) 0xec4b MOV %R13,%R11 |
(209) 0xec4e SUB %RAX,%R11 |
(209) 0xec51 MOV %R11,%RSI |
(209) 0xec54 AND $-0x10,%RSI |
(209) 0xec58 JE eca6 |
(209) 0xec5a LEA -0x1(%RSI),%RAX |
(209) 0xec5e VPBROADCASTQ %R9,%YMM0 |
(209) 0xec64 XOR %R10D,%R10D |
(209) 0xec67 NOPW (%RAX,%RAX,1) |
(211) 0xec70 VPCMPEQQ 0x20(%RDX,%R10,8),%YMM0,%K0 |
(211) 0xec78 VPCMPEQQ (%RDX,%R10,8),%YMM0,%K1 |
(211) 0xec7f VPCMPEQQ 0x60(%RDX,%R10,8),%YMM0,%K2 |
(211) 0xec87 VPCMPEQQ 0x40(%RDX,%R10,8),%YMM0,%K3 |
(211) 0xec8f KORB %K2,%K3,%K4 |
(211) 0xec93 KORB %K0,%K1,%K5 |
(211) 0xec97 KORTESTB %K4,%K5 |
(211) 0xec9b JNE ed07 |
(211) 0xec9d ADD $0x10,%R10 |
(211) 0xeca1 CMP %RAX,%R10 |
(211) 0xeca4 JBE ec70 |
(209) 0xeca6 CMP %R11,%RSI |
(209) 0xeca9 MOV -0x68(%RBP),%R11 |
(209) 0xecad JAE ecd0 |
(209) 0xecaf MOV -0x90(%RBP),%R10 |
(209) 0xecb6 NOPW %CS:(%RAX,%RAX,1) |
(210) 0xecc0 CMP %R9,(%R12,%R10,8) |
(210) 0xecc4 JE ed31 |
(210) 0xecc6 INC %R10 |
(210) 0xecc9 CMP %R10,%R13 |
(210) 0xeccc JNE ecc0 |
(209) 0xecce XCHG %AX,%AX |
(209) 0xecd0 MOV -0x40(%RBP),%RAX |
(209) 0xecd4 ADD %RDI,%RAX |
(209) 0xecd7 MOV (%RBX,%RAX,8),%RSI |
(209) 0xecdb CMP -0x88(%RBP),%R14 |
(209) 0xece2 JGE ebc0 |
(209) 0xece8 MOV %RSI,(%R12,%R14,8) |
(209) 0xecec MOV 0x10(%RBP),%RSI |
(209) 0xecf0 VMOVQ (%RSI,%RAX,8),%XMM0 |
(209) 0xecf5 MOV -0x58(%RBP),%RAX |
(209) 0xecf9 VMOVQ %XMM0,(%RAX,%R14,8) |
(209) 0xecff INC %R14 |
(209) 0xed02 JMP ebe2 |
(209) 0xed07 KSHIFTLB $0x4,%K0,%K0 |
(209) 0xed0d KORB %K0,%K1,%K0 |
(209) 0xed11 KSHIFTLB $0x4,%K2,%K1 |
(209) 0xed17 KORB %K1,%K3,%K1 |
(209) 0xed1b KUNPCKBW %K0,%K1,%K0 |
(209) 0xed1f KMOVD %K0,%EAX |
(209) 0xed23 TZCNT %EAX,%EAX |
(209) 0xed27 ADD %RCX,%R10 |
(209) 0xed2a ADD %RAX,%R10 |
(209) 0xed2d MOV -0x68(%RBP),%R11 |
(209) 0xed31 MOV 0x10(%RBP),%RAX |
(209) 0xed35 VMOVQ (%RAX,%R8,8),%XMM0 |
(209) 0xed3b MOV -0x58(%RBP),%RAX |
(209) 0xed3f VMOVQ %XMM0,(%RAX,%R10,8) |
(209) 0xed45 JMP ebe2 |
(192) 0xed4a MOV -0x40(%RBP),%RAX |
(192) 0xed4e ADD -0x78(%RBP),%RAX |
(192) 0xed52 MOV -0x60(%RBP),%R13 |
(192) 0xed56 LEA (%R14,%R13,1),%RDX |
(192) 0xed5a MOV 0x48(%RBP),%RCX |
(192) 0xed5e MOV -0x50(%RBP),%R12 |
(192) 0xed62 MOV %RDX,(%RCX,%R12,8) |
(192) 0xed66 TEST %R13,%R13 |
(192) 0xed69 MOV %RAX,-0x40(%RBP) |
(192) 0xed6d JE ee89 |
(192) 0xed73 MOV 0x38(%RBP),%RAX |
(192) 0xed77 MOV (%RAX,%R12,8),%RDI |
(192) 0xed7b LEA (,%RDX,8),%RSI |
(192) 0xed83 MOV %RSI,-0x78(%RBP) |
(192) 0xed87 MOV %RDX,-0x80(%RBP) |
(192) 0xed8b VZEROUPPER |
(192) 0xed8e CALL 30e0 <hypre_ReAlloc@plt> |
(192) 0xed93 MOV 0x38(%RBP),%RCX |
(192) 0xed97 MOV %RAX,(%RCX,%R12,8) |
(192) 0xed9b MOV 0x40(%RBP),%RAX |
(192) 0xed9f MOV (%RAX,%R12,8),%RDI |
(192) 0xeda3 MOV -0x78(%RBP),%RSI |
(192) 0xeda7 CALL 30e0 <hypre_ReAlloc@plt> |
(192) 0xedac MOV -0x80(%RBP),%R9 |
(192) 0xedb0 MOV 0x40(%RBP),%RCX |
(192) 0xedb4 MOV %RAX,(%RCX,%R12,8) |
(192) 0xedb8 MOV 0x50(%RBP),%RCX |
(192) 0xedbc MOV %R9,(%RCX,%R12,8) |
(192) 0xedc0 TEST %R13,%R13 |
(192) 0xedc3 JLE f1fb |
(192) 0xedc9 MOV 0x38(%RBP),%RCX |
(192) 0xedcd MOV (%RCX,%R12,8),%RCX |
(192) 0xedd1 MOV -0x68(%RBP),%R11 |
(192) 0xedd5 LEA -0x8(%R11,%R13,8),%RDX |
(192) 0xedda LEA (%RCX,%R14,8),%RDI |
(192) 0xedde CMP %RDI,%RDX |
(192) 0xede1 SETAE %DL |
(192) 0xede4 LEA -0x8(%RCX,%R9,8),%RCX |
(192) 0xede9 CMP %R11,%RCX |
(192) 0xedec SETAE %SIL |
(192) 0xedf0 MOV -0x70(%RBP),%R8 |
(192) 0xedf4 LEA -0x8(%R8,%R13,8),%RCX |
(192) 0xedf9 LEA (%RAX,%R14,8),%R12 |
(192) 0xedfd CMP %R12,%RCX |
(192) 0xee00 SETB %CL |
(192) 0xee03 LEA -0x8(%RAX,%R9,8),%RAX |
(192) 0xee08 CMP %R8,%RAX |
(192) 0xee0b SETB %AL |
(192) 0xee0e TEST %SIL,%DL |
(192) 0xee11 JNE f20d |
(192) 0xee17 OR %AL,%CL |
(192) 0xee19 JE f20d |
(192) 0xee1f MOV -0x60(%RBP),%R14 |
(192) 0xee23 CMP $0xd,%R14 |
(192) 0xee27 JAE e7b4 |
(192) 0xee2d MOV %R14,%RAX |
(192) 0xee30 AND $-0x4,%RAX |
(192) 0xee34 JE f2fa |
(192) 0xee3a LEA -0x1(%RAX),%RCX |
(192) 0xee3e XOR %EDX,%EDX |
(192) 0xee40 MOV -0x70(%RBP),%RSI |
(192) 0xee44 NOPW %CS:(%RAX,%RAX,1) |
(208) 0xee50 VMOVUPS (%R11,%RDX,8),%YMM0 |
(208) 0xee56 VMOVUPS %YMM0,(%RDI,%RDX,8) |
(208) 0xee5b VMOVDQU (%RSI,%RDX,8),%YMM0 |
(208) 0xee60 VMOVDQU %YMM0,(%R12,%RDX,8) |
(208) 0xee66 ADD $0x4,%RDX |
(208) 0xee6a CMP %RCX,%RDX |
(208) 0xee6d JLE ee50 |
(192) 0xee6f CMP %RAX,%R14 |
(192) 0xee72 JE e7d6 |
(192) 0xee78 JMP f2fc |
(192) 0xee7d MOV 0x48(%RBP),%RAX |
(192) 0xee81 MOV -0x50(%RBP),%RCX |
(192) 0xee85 MOV %R13,(%RAX,%RCX,8) |
(192) 0xee89 TEST %R11,%R11 |
(192) 0xee8c JNE e7d6 |
(192) 0xee92 JMP e7f2 |
(192) 0xee97 MOV %RCX,%R14 |
(192) 0xee9a JMP f2de |
(199) 0xee9f KSHIFTLB $0x4,%K0,%K0 |
(199) 0xeea5 KORB %K0,%K1,%K0 |
(199) 0xeea9 KSHIFTLB $0x4,%K2,%K1 |
(199) 0xeeaf KORB %K1,%K3,%K1 |
(199) 0xeeb3 KUNPCKBW %K0,%K1,%K0 |
(199) 0xeeb7 KMOVD %K0,%EAX |
(199) 0xeebb TZCNT %EAX,%EAX |
(199) 0xeebf ADD %RDX,%R13 |
(199) 0xeec2 ADD %RAX,%R13 |
(199) 0xeec5 MOV -0x30(%RBP),%RDI |
(199) 0xeec9 MOV %RCX,%RAX |
(199) 0xeecc MOV 0x10(%RBP),%RCX |
(199) 0xeed0 VMOVQ (%RCX,%RAX,8),%XMM0 |
(199) 0xeed5 MOV 0x88(%RBP),%RCX |
(199) 0xeedc VMOVQ %XMM0,(%RCX,%R13,8) |
(199) 0xeee2 MOV -0x50(%RBP),%R10 |
(199) 0xeee6 INC %RAX |
(199) 0xeee9 INC %R8 |
(199) 0xeeec CMP -0x78(%RBP),%R8 |
(199) 0xeef0 JE f1dc |
(199) 0xeef6 MOV (%RBX,%RAX,8),%R9 |
(199) 0xeefa CMP 0x28(%RBP),%R9 |
(199) 0xeefe JL f050 |
(199) 0xef04 CMP 0x30(%RBP),%R9 |
(199) 0xef08 JG f050 |
(199) 0xef0e MOV 0x60(%RBP),%RCX |
(199) 0xef12 MOV (%RCX,%R10,8),%R10 |
(199) 0xef16 MOV -0x88(%RBP),%R11 |
(199) 0xef1d SUB %R10,%R11 |
(199) 0xef20 JLE f020 |
(199) 0xef26 MOV %RAX,%RCX |
(199) 0xef29 MOV 0x68(%RBP),%RSI |
(199) 0xef2d LEA (%RSI,%R10,8),%EAX |
(199) 0xef31 AND $0x7f,%EAX |
(199) 0xef34 MOV $0x80,%EDX |
(199) 0xef39 SUB %EAX,%EDX |
(199) 0xef3b SHR $0x3,%EDX |
(199) 0xef3e CMP %RDX,%R11 |
(199) 0xef41 MOV %RDX,%R12 |
(199) 0xef44 CMOVB %R11,%R12 |
(199) 0xef48 TEST %R12,%R12 |
(199) 0xef4b JE ef72 |
(199) 0xef4d MOV %R10,%R13 |
(199) 0xef50 MOV %R12,%RAX |
(199) 0xef53 NOPW %CS:(%RAX,%RAX,1) |
(205) 0xef60 CMP %R9,(%RSI,%R13,8) |
(205) 0xef64 JE f1c7 |
(205) 0xef6a INC %R13 |
(205) 0xef6d DEC %RAX |
(205) 0xef70 JNE ef60 |
(199) 0xef72 CMP %RDX,%R11 |
(199) 0xef75 MOV %RCX,%RAX |
(199) 0xef78 JBE f020 |
(199) 0xef7e SUB %R12,%R11 |
(199) 0xef81 MOV %R11,%RSI |
(199) 0xef84 AND $-0x10,%RSI |
(199) 0xef88 JE efea |
(199) 0xef8a LEA -0x1(%RSI),%RDI |
(199) 0xef8e LEA (%R10,%R12,1),%R13 |
(199) 0xef92 MOV 0x68(%RBP),%RAX |
(199) 0xef96 LEA (%RAX,%R13,8),%RAX |
(199) 0xef9a VPBROADCASTQ %R9,%YMM0 |
(199) 0xefa0 XOR %EDX,%EDX |
(199) 0xefa2 NOPW %CS:(%RAX,%RAX,1) |
(204) 0xefb0 VPCMPEQQ 0x20(%RAX,%RDX,8),%YMM0,%K0 |
(204) 0xefb8 VPCMPEQQ (%RAX,%RDX,8),%YMM0,%K1 |
(204) 0xefbf VPCMPEQQ 0x60(%RAX,%RDX,8),%YMM0,%K2 |
(204) 0xefc7 VPCMPEQQ 0x40(%RAX,%RDX,8),%YMM0,%K3 |
(204) 0xefcf KORB %K2,%K3,%K4 |
(204) 0xefd3 KORB %K0,%K1,%K5 |
(204) 0xefd7 KORTESTB %K4,%K5 |
(204) 0xefdb JNE f19d |
(204) 0xefe1 ADD $0x10,%RDX |
(204) 0xefe5 CMP %RDI,%RDX |
(204) 0xefe8 JBE efb0 |
(199) 0xefea CMP %R11,%RSI |
(199) 0xefed MOV -0x30(%RBP),%RDI |
(199) 0xeff1 MOV %RCX,%RAX |
(199) 0xeff4 JAE f020 |
(199) 0xeff6 ADD %R12,%R10 |
(199) 0xeff9 ADD %RSI,%R10 |
(199) 0xeffc MOV %R10,%R13 |
(199) 0xefff NOP |
(203) 0xf000 MOV 0x68(%RBP),%RCX |
(203) 0xf004 CMP %R9,(%RCX,%R13,8) |
(203) 0xf008 JE f1ca |
(203) 0xf00e INC %R13 |
(203) 0xf011 CMP %R13,-0x88(%RBP) |
(203) 0xf018 JNE f000 |
(199) 0xf01a NOPW (%RAX,%RAX,1) |
(199) 0xf020 CMP -0x68(%RBP),%R14 |
(199) 0xf024 JGE f240 |
(199) 0xf02a MOV 0x68(%RBP),%RCX |
(199) 0xf02e MOV %R9,(%RCX,%R14,8) |
(199) 0xf032 MOV 0x10(%RBP),%RCX |
(199) 0xf036 VMOVQ (%RCX,%RAX,8),%XMM0 |
(199) 0xf03b MOV 0x70(%RBP),%RCX |
(199) 0xf03f VMOVQ %XMM0,(%RCX,%R14,8) |
(199) 0xf045 INC %R14 |
(199) 0xf048 JMP eee2 |
0xf04d NOPL (%RAX) |
(199) 0xf050 MOV 0x78(%RBP),%RCX |
(199) 0xf054 MOV (%RCX,%R10,8),%R10 |
(199) 0xf058 MOV -0x60(%RBP),%R11 |
(199) 0xf05c SUB %R10,%R11 |
(199) 0xf05f JLE f160 |
(199) 0xf065 MOV %RAX,%RCX |
(199) 0xf068 MOV 0x80(%RBP),%RAX |
(199) 0xf06f LEA (%RAX,%R10,8),%EAX |
(199) 0xf073 AND $0x7f,%EAX |
(199) 0xf076 MOV $0x80,%EDX |
(199) 0xf07b SUB %EAX,%EDX |
(199) 0xf07d SHR $0x3,%EDX |
(199) 0xf080 CMP %RDX,%R11 |
(199) 0xf083 MOV %RDX,%R12 |
(199) 0xf086 CMOVB %R11,%R12 |
(199) 0xf08a TEST %R12,%R12 |
(199) 0xf08d JE f0b9 |
(199) 0xf08f MOV %R10,%R13 |
(199) 0xf092 MOV %R12,%RAX |
(199) 0xf095 NOPW %CS:(%RAX,%RAX,1) |
(202) 0xf0a0 MOV 0x80(%RBP),%RSI |
(202) 0xf0a7 CMP %R9,(%RSI,%R13,8) |
(202) 0xf0ab JE eec9 |
(202) 0xf0b1 INC %R13 |
(202) 0xf0b4 DEC %RAX |
(202) 0xf0b7 JNE f0a0 |
(199) 0xf0b9 CMP %RDX,%R11 |
(199) 0xf0bc MOV %RCX,%RAX |
(199) 0xf0bf JBE f160 |
(199) 0xf0c5 SUB %R12,%R11 |
(199) 0xf0c8 MOV %R11,%RSI |
(199) 0xf0cb AND $-0x10,%RSI |
(199) 0xf0cf JE f12a |
(199) 0xf0d1 LEA -0x1(%RSI),%RDI |
(199) 0xf0d5 LEA (%R10,%R12,1),%R13 |
(199) 0xf0d9 MOV 0x80(%RBP),%RAX |
(199) 0xf0e0 LEA (%RAX,%R13,8),%RAX |
(199) 0xf0e4 VPBROADCASTQ %R9,%YMM0 |
(199) 0xf0ea XOR %EDX,%EDX |
(199) 0xf0ec NOPL (%RAX) |
(201) 0xf0f0 VPCMPEQQ 0x20(%RAX,%RDX,8),%YMM0,%K0 |
(201) 0xf0f8 VPCMPEQQ (%RAX,%RDX,8),%YMM0,%K1 |
(201) 0xf0ff VPCMPEQQ 0x60(%RAX,%RDX,8),%YMM0,%K2 |
(201) 0xf107 VPCMPEQQ 0x40(%RAX,%RDX,8),%YMM0,%K3 |
(201) 0xf10f KORB %K2,%K3,%K4 |
(201) 0xf113 KORB %K0,%K1,%K5 |
(201) 0xf117 KORTESTB %K4,%K5 |
(201) 0xf11b JNE ee9f |
(201) 0xf121 ADD $0x10,%RDX |
(201) 0xf125 CMP %RDI,%RDX |
(201) 0xf128 JBE f0f0 |
(199) 0xf12a CMP %R11,%RSI |
(199) 0xf12d MOV -0x30(%RBP),%RDI |
(199) 0xf131 MOV %RCX,%RAX |
(199) 0xf134 JAE f160 |
(199) 0xf136 ADD %R12,%R10 |
(199) 0xf139 ADD %RSI,%R10 |
(199) 0xf13c MOV %R10,%R13 |
(199) 0xf13f NOP |
(200) 0xf140 MOV 0x80(%RBP),%RCX |
(200) 0xf147 CMP %R9,(%RCX,%R13,8) |
(200) 0xf14b JE eecc |
(200) 0xf151 INC %R13 |
(200) 0xf154 CMP %R13,-0x60(%RBP) |
(200) 0xf158 JNE f140 |
(199) 0xf15a NOPW (%RAX,%RAX,1) |
(199) 0xf160 MOV -0x58(%RBP),%RDX |
(199) 0xf164 CMP -0x90(%RBP),%RDX |
(199) 0xf16b JGE f27d |
(199) 0xf171 MOV 0x80(%RBP),%RCX |
(199) 0xf178 MOV %R9,(%RCX,%RDX,8) |
(199) 0xf17c MOV 0x10(%RBP),%RCX |
(199) 0xf180 VMOVQ (%RCX,%RAX,8),%XMM0 |
(199) 0xf185 MOV 0x88(%RBP),%RCX |
(199) 0xf18c VMOVQ %XMM0,(%RCX,%RDX,8) |
(199) 0xf191 INC %RDX |
(199) 0xf194 MOV %RDX,-0x58(%RBP) |
(199) 0xf198 JMP eee2 |
(199) 0xf19d KSHIFTLB $0x4,%K0,%K0 |
(199) 0xf1a3 KORB %K0,%K1,%K0 |
(199) 0xf1a7 KSHIFTLB $0x4,%K2,%K1 |
(199) 0xf1ad KORB %K1,%K3,%K1 |
(199) 0xf1b1 KUNPCKBW %K0,%K1,%K0 |
(199) 0xf1b5 KMOVD %K0,%EAX |
(199) 0xf1b9 TZCNT %EAX,%EAX |
(199) 0xf1bd ADD %RDX,%R13 |
(199) 0xf1c0 ADD %RAX,%R13 |
(199) 0xf1c3 MOV -0x30(%RBP),%RDI |
(199) 0xf1c7 MOV %RCX,%RAX |
(199) 0xf1ca MOV 0x10(%RBP),%RCX |
(199) 0xf1ce VMOVQ (%RCX,%RAX,8),%XMM0 |
(199) 0xf1d3 MOV 0x70(%RBP),%RCX |
(199) 0xf1d7 JMP eedc |
(192) 0xf1dc MOV -0x98(%RBP),%RAX |
(192) 0xf1e3 MOV %RAX,-0x40(%RBP) |
(192) 0xf1e7 MOV -0x38(%RBP),%RDX |
(192) 0xf1eb MOV -0x48(%RBP),%RSI |
(192) 0xf1ef MOV 0x98(%RBP),%R8 |
(192) 0xf1f6 JMP f2da |
(192) 0xf1fb MOV -0x68(%RBP),%R11 |
(192) 0xf1ff TEST %R11,%R11 |
(192) 0xf202 JNE e7d6 |
(192) 0xf208 JMP e7f2 |
(192) 0xf20d XOR %EAX,%EAX |
(192) 0xf20f MOV -0x70(%RBP),%RDX |
(192) 0xf213 MOV -0x60(%RBP),%RSI |
(192) 0xf217 NOPW (%RAX,%RAX,1) |
(206) 0xf220 MOV (%R11,%RAX,8),%RCX |
(206) 0xf224 MOV %RCX,(%RDI,%RAX,8) |
(206) 0xf228 VMOVQ (%RDX,%RAX,8),%XMM0 |
(206) 0xf22d VMOVQ %XMM0,(%R12,%RAX,8) |
(206) 0xf233 INC %RAX |
(206) 0xf236 CMP %RAX,%RSI |
(206) 0xf239 JNE f220 |
(192) 0xf23b JMP e7d6 |
(192) 0xf240 MOV %RAX,-0x40(%RBP) |
(192) 0xf244 MOV $0xd70,%ESI |
(192) 0xf249 MOV $0x1,%EDX |
(192) 0xf24e LEA 0x501e(%RIP),%RDI |
(192) 0xf255 XOR %ECX,%ECX |
(192) 0xf257 VZEROUPPER |
(192) 0xf25a CALL 3420 <hypre_error_handler@plt> |
(192) 0xf25f MOV 0xd0(%RBP),%RAX |
(192) 0xf266 LOCK INCQ (%RAX) |
(192) 0xf26a CMPQ $0,0xc0(%RBP) |
(192) 0xf272 JE f2c3 |
(192) 0xf274 LEA 0x5176(%RIP),%RDI |
(192) 0xf27b JMP f2b8 |
(192) 0xf27d MOV %RAX,-0x40(%RBP) |
(192) 0xf281 MOV $0xd4e,%ESI |
(192) 0xf286 MOV $0x1,%EDX |
(192) 0xf28b LEA 0x4fe1(%RIP),%RDI |
(192) 0xf292 XOR %ECX,%ECX |
(192) 0xf294 VZEROUPPER |
(192) 0xf297 CALL 3420 <hypre_error_handler@plt> |
(192) 0xf29c MOV 0xd0(%RBP),%RAX |
(192) 0xf2a3 LOCK INCQ (%RAX) |
(192) 0xf2a7 CMPQ $0,0xc0(%RBP) |
(192) 0xf2af JE f2c3 |
(192) 0xf2b1 LEA 0x5113(%RIP),%RDI |
(192) 0xf2b8 MOV -0x80(%RBP),%RSI |
(192) 0xf2bc XOR %EAX,%EAX |
(192) 0xf2be CALL 3410 <hypre_printf@plt> |
(192) 0xf2c3 MOV -0x38(%RBP),%RDX |
(192) 0xf2c7 MOV -0x48(%RBP),%RSI |
(192) 0xf2cb MOV -0x30(%RBP),%RDI |
(192) 0xf2cf MOV 0x98(%RBP),%R8 |
(192) 0xf2d6 MOV -0x50(%RBP),%R10 |
(192) 0xf2da MOV -0x58(%RBP),%R9 |
(192) 0xf2de MOV 0x18(%RBP),%RAX |
(192) 0xf2e2 MOV (%RAX),%RAX |
(192) 0xf2e5 MOV 0x38(%RAX),%RCX |
(192) 0xf2e9 MOV %R14,(%RCX,%R10,8) |
(192) 0xf2ed MOV 0x40(%RAX),%RAX |
(192) 0xf2f1 MOV %R9,(%RAX,%R10,8) |
(192) 0xf2f5 JMP e805 |
(192) 0xf2fa XOR %EAX,%EAX |
(192) 0xf2fc MOV -0x70(%RBP),%RDX |
(207) 0xf300 MOV (%R11,%RAX,8),%RCX |
(207) 0xf304 MOV %RCX,(%RDI,%RAX,8) |
(207) 0xf308 VMOVQ (%RDX,%RAX,8),%XMM0 |
(207) 0xf30d VMOVQ %XMM0,(%R12,%RAX,8) |
(207) 0xf313 INC %RAX |
(207) 0xf316 CMP %RAX,%R14 |
(207) 0xf319 JNE f300 |
(192) 0xf31b JMP e7d6 |
0xf320 ADD $0x88,%RSP |
0xf327 POP %RBX |
0xf328 POP %R12 |
0xf32a POP %R13 |
0xf32c POP %R14 |
0xf32e POP %R15 |
0xf330 POP %RBP |
0xf331 VZEROUPPER |
0xf334 RET |
0xf335 NOPW %CS:(%RAX,%RAX,1) |
0xf33f NOP |
Path / |
Source file and lines | IJMatrix_parcsr.c:3240-3484 |
Module | libIJ_mv.so |
nb instructions | 162 |
nb uops | 175 |
loop length | 663 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 1 |
used zmm registers | 0 |
nb stack references | 12 |
micro-operation queue | 29.17 cycles |
front end | 29.17 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 11.30 | 12.00 | 9.00 | 9.00 | 9.50 | 11.20 | 11.30 | 9.50 | 9.50 | 9.50 | 11.20 | 9.00 |
cycles | 11.30 | 16.40 | 9.00 | 9.00 | 9.50 | 11.20 | 11.30 | 9.50 | 9.50 | 9.50 | 11.20 | 9.00 |
Cycles executing div or sqrt instructions | 16.00 |
FE+BE cycles | 27.84-27.91 |
Stall cycles | 0.00 |
Front-end | 29.17 |
Dispatch | 16.40 |
DIV/SQRT | 16.00 |
Overall L1 | 29.17 |
all | 20% |
load | NA (no load vectorizable/vectorized instructions) |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 100% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 23% |
all | 14% |
load | NA (no load vectorizable/vectorized instructions) |
store | 10% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 25% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 15% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x88,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R8,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 3300 <hypre_NumActiveThreads@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 30c0 <hypre_GetThreadNum@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R13,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %R15,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE e55e <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x4e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %R13 | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
JMP e566 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x56> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %R15D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %R13D | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV -0x38(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xb8(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%R12),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE e58c <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x7c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA 0x1(%RAX),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R12,%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
IMUL %RCX,%RDI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JMP e5a0 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x90> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R12,%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
IMUL %RAX,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RDX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOVQ $0,(%R15,%R12,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RDI,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE e68f <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x17f> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R15,%R12,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x8(%R8,%RDI,8),%RDI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %RDX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVL %R12,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IMUL %R12,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%RDX,%RAX,1),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RCX,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB e604 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xf4> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R8,%RSI,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDI,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB e604 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xf4> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x30(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP e68f <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x17f> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x30(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %RSI,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R8,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE e666 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x156> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RSI),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x38(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R9,%R13,8),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPXOR %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R10D,%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VEXTRACTI128 $0x1,%YMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %XMM1,%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VPSHUFD $-0x12,%XMM0,%XMM1 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %XMM1,%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VMOVQ %XMM0,%RDI | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
CMP %RSI,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x38(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE e672 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x162> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP e68c <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x17c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x38(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%R14),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0xabf7(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 3390 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE e744 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x234> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xc8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE e744 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x234> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R15),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x8,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB e717 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x207> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
LEA 0x40(%R15),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x8,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RAX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE e744 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x234> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV (%R14),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0xab62(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 3390 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE e763 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x253> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x8(%R15,%R12,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP e76b <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x25b> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOVQ $0,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x38(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x30(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDI,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE f320 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xe10> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xb0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x98(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RAX,%R12,8),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD $0x18,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOVQ $0,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP e815 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x305> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD $0x88,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | IJMatrix_parcsr.c:3240-3484 |
Module | libIJ_mv.so |
nb instructions | 162 |
nb uops | 175 |
loop length | 663 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 1 |
used zmm registers | 0 |
nb stack references | 12 |
micro-operation queue | 29.17 cycles |
front end | 29.17 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 11.30 | 12.00 | 9.00 | 9.00 | 9.50 | 11.20 | 11.30 | 9.50 | 9.50 | 9.50 | 11.20 | 9.00 |
cycles | 11.30 | 16.40 | 9.00 | 9.00 | 9.50 | 11.20 | 11.30 | 9.50 | 9.50 | 9.50 | 11.20 | 9.00 |
Cycles executing div or sqrt instructions | 16.00 |
FE+BE cycles | 27.84-27.91 |
Stall cycles | 0.00 |
Front-end | 29.17 |
Dispatch | 16.40 |
DIV/SQRT | 16.00 |
Overall L1 | 29.17 |
all | 20% |
load | NA (no load vectorizable/vectorized instructions) |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 100% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 23% |
all | 14% |
load | NA (no load vectorizable/vectorized instructions) |
store | 10% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 25% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 15% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x88,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R8,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 3300 <hypre_NumActiveThreads@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 30c0 <hypre_GetThreadNum@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R13,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %R15,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE e55e <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x4e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %R13 | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
JMP e566 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x56> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %R15D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %R13D | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV -0x38(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xb8(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%R12),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE e58c <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x7c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA 0x1(%RAX),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R12,%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
IMUL %RCX,%RDI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JMP e5a0 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x90> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R12,%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
IMUL %RAX,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RDX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOVQ $0,(%R15,%R12,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RDI,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE e68f <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x17f> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R15,%R12,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x8(%R8,%RDI,8),%RDI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %RDX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVL %R12,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IMUL %R12,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%RDX,%RAX,1),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RCX,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB e604 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xf4> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R8,%RSI,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDI,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB e604 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xf4> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x30(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP e68f <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x17f> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x30(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %RSI,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R8,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE e666 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x156> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RSI),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x38(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R9,%R13,8),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPXOR %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R10D,%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VEXTRACTI128 $0x1,%YMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %XMM1,%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VPSHUFD $-0x12,%XMM0,%XMM1 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %XMM1,%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VMOVQ %XMM0,%RDI | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
CMP %RSI,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x38(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE e672 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x162> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP e68c <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x17c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x38(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%R14),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0xabf7(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 3390 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE e744 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x234> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xc8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE e744 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x234> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R15),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x8,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB e717 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x207> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
LEA 0x40(%R15),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x8,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RAX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE e744 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x234> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV (%R14),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0xab62(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 3390 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE e763 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x253> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x8(%R15,%R12,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP e76b <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x25b> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOVQ $0,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x38(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x30(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDI,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE f320 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xe10> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xb0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x98(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RAX,%R12,8),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD $0x18,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOVQ $0,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP e815 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x305> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD $0x88,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_IJMatrixSetValuesOMPParCSR.extracted.28– | 0.81 | 0.17 |
○Loop 217 - IJMatrix_parcsr.c:3274-3275 - libIJ_mv.so | 0.35 | 0.07 |
▼Loop 192 - IJMatrix_parcsr.c:3262-3484 - libIJ_mv.so– | 0.14 | 0.03 |
▼Loop 199 - IJMatrix_parcsr.c:3262-3454 - libIJ_mv.so– | 0.66 | 0.12 |
○Loop 205 - IJMatrix_parcsr.c:3422-3424 - libIJ_mv.so | 0 | 0 |
○Loop 204 - IJMatrix_parcsr.c:3422-3424 - libIJ_mv.so | 0 | 0 |
○Loop 201 - IJMatrix_parcsr.c:3388-3424 - libIJ_mv.so | 0 | 0 |
○Loop 202 - IJMatrix_parcsr.c:3388-3390 - libIJ_mv.so | 0 | 0 |
○Loop 200 - IJMatrix_parcsr.c:3388-3390 - libIJ_mv.so | 0 | 0 |
○Loop 203 - IJMatrix_parcsr.c:3422-3424 - libIJ_mv.so | 0 | 0 |
▼Loop 193 - IJMatrix_parcsr.c:3262-3484 - libIJ_mv.so– | 0 | 0 |
▼Loop 194 - IJMatrix_parcsr.c:3475-3484 - libIJ_mv.so– | 0 | 0 |
○Loop 195 - IJMatrix_parcsr.c:3478-3484 - libIJ_mv.so | 0 | 0 |
▼Loop 196 - IJMatrix_parcsr.c:3475-3484 - libIJ_mv.so– | 0 | 0 |
○Loop 197 - IJMatrix_parcsr.c:3478-3484 - libIJ_mv.so | 0 | 0 |
○Loop 198 - IJMatrix_parcsr.c:3478-3484 - libIJ_mv.so | 0 | 0 |
○Loop 208 - IJMatrix_parcsr.c:3359-3362 - libIJ_mv.so | 0 | 0 |
▼Loop 209 - IJMatrix_parcsr.c:3262-3337 - libIJ_mv.so– | 0 | 0 |
○Loop 211 - IJMatrix_parcsr.c:3318-3320 - libIJ_mv.so | 0.15 | 0.03 |
○Loop 212 - IJMatrix_parcsr.c:3318-3320 - libIJ_mv.so | 0 | 0 |
○Loop 210 - IJMatrix_parcsr.c:3318-3320 - libIJ_mv.so | 0 | 0 |
○Loop 207 - IJMatrix_parcsr.c:3359-3362 - libIJ_mv.so | 0 | 0 |
○Loop 206 - IJMatrix_parcsr.c:3359-3362 - libIJ_mv.so | 0 | 0 |
○Loop 216 - IJMatrix_parcsr.c:3274-3275 - libIJ_mv.so | 0.01 | 0 |
○Loop 214 - IJMatrix_parcsr.c:3282-3283 - libIJ_mv.so | 0 | 0 |
○Loop 215 - IJMatrix_parcsr.c:3274-3275 - libIJ_mv.so | 0 | 0 |
○Loop 213 - IJMatrix_parcsr.c:3282-3283 - libIJ_mv.so | 0 | 0 |