Function: hypre_ParMatmul_RowSizes.extracted | Module: exec | Source: par_csr_matop.c:102-276 [...] | Coverage: 2.36% |
---|
Function: hypre_ParMatmul_RowSizes.extracted | Module: exec | Source: par_csr_matop.c:102-276 [...] | Coverage: 2.36% |
---|
/home/eoseret/qaas_runs_CPU_9468/171-112-7443/intel/AMG/build/AMG/AMG/parcsr_mv/par_csr_matop.c: 102 - 276 |
-------------------------------------------------------------------------------- |
102: #pragma omp parallel private(ii, i1, jj_row_begin_diag, jj_row_begin_offd, jj_count_diag, jj_count_offd, jj2, i2, jj3, i3) |
[...] |
108: ii = hypre_GetThreadNum(); |
109: if (ii < rest) |
110: { |
111: ns = ii*size+ii; |
112: ne = (ii+1)*size+ii+1; |
113: } |
114: else |
115: { |
116: ns = ii*size+rest; |
117: ne = (ii+1)*size+rest; |
118: } |
119: jj_count_diag = start_indexing; |
120: jj_count_offd = start_indexing; |
121: |
122: if (num_cols_diag_B || num_cols_offd_C) |
123: B_marker = hypre_CTAlloc(HYPRE_Int, num_cols_diag_B+num_cols_offd_C); |
124: for (i1 = 0; i1 < num_cols_diag_B+num_cols_offd_C; i1++) |
125: B_marker[i1] = -1; |
126: |
127: for (i1 = ns; i1 < ne; i1++) |
[...] |
135: if ( allsquare ) { |
136: B_marker[i1] = jj_count_diag; |
137: jj_count_diag++; |
[...] |
144: if (num_cols_offd_A) |
145: { |
146: for (jj2 = A_offd_i[i1]; jj2 < A_offd_i[i1+1]; jj2++) |
147: { |
148: i2 = A_offd_j[jj2]; |
[...] |
154: for (jj3 = B_ext_offd_i[i2]; jj3 < B_ext_offd_i[i2+1]; jj3++) |
[...] |
164: if (B_marker[i3] < jj_row_begin_offd) |
165: { |
166: B_marker[i3] = jj_count_offd; |
167: jj_count_offd++; |
168: } |
169: } |
170: for (jj3 = B_ext_diag_i[i2]; jj3 < B_ext_diag_i[i2+1]; jj3++) |
171: { |
172: i3 = B_ext_diag_j[jj3]; |
173: |
174: if (B_marker[i3] < jj_row_begin_diag) |
175: { |
176: B_marker[i3] = jj_count_diag; |
177: jj_count_diag++; |
[...] |
187: for (jj2 = A_diag_i[i1]; jj2 < A_diag_i[i1+1]; jj2++) |
188: { |
189: i2 = A_diag_j[jj2]; |
[...] |
195: for (jj3 = B_diag_i[i2]; jj3 < B_diag_i[i2+1]; jj3++) |
196: { |
197: i3 = B_diag_j[jj3]; |
[...] |
205: if (B_marker[i3] < jj_row_begin_diag) |
206: { |
207: B_marker[i3] = jj_count_diag; |
208: jj_count_diag++; |
[...] |
216: if (num_cols_offd_B) |
217: { |
218: for (jj3 = B_offd_i[i2]; jj3 < B_offd_i[i2+1]; jj3++) |
219: { |
220: i3 = num_cols_diag_B+map_B_to_C[B_offd_j[jj3]]; |
[...] |
228: if (B_marker[i3] < jj_row_begin_offd) |
229: { |
230: B_marker[i3] = jj_count_offd; |
231: jj_count_offd++; |
[...] |
241: (*C_diag_i)[i1] = jj_row_begin_diag; |
242: (*C_offd_i)[i1] = jj_row_begin_offd; |
243: |
244: } |
245: jj_count_diag_array[ii] = jj_count_diag; |
246: jj_count_offd_array[ii] = jj_count_offd; |
247: |
248: hypre_TFree(B_marker); |
249: #ifdef HYPRE_USING_OPENMP |
250: #pragma omp barrier |
251: #endif |
252: |
253: if (ii) |
254: { |
255: jj_count_diag = jj_count_diag_array[0]; |
256: jj_count_offd = jj_count_offd_array[0]; |
257: for (i1 = 1; i1 < ii; i1++) |
258: { |
259: jj_count_diag += jj_count_diag_array[i1]; |
260: jj_count_offd += jj_count_offd_array[i1]; |
261: } |
262: |
263: for (i1 = ns; i1 < ne; i1++) |
264: { |
265: (*C_diag_i)[i1] += jj_count_diag; |
266: (*C_offd_i)[i1] += jj_count_offd; |
267: } |
268: } |
269: else |
270: { |
271: (*C_diag_i)[num_rows_diag_A] = 0; |
272: (*C_offd_i)[num_rows_diag_A] = 0; |
273: for (i1 = 0; i1 < num_threads; i1++) |
274: { |
275: (*C_diag_i)[num_rows_diag_A] += jj_count_diag_array[i1]; |
276: (*C_offd_i)[num_rows_diag_A] += jj_count_offd_array[i1]; |
0x4bc4a0 PUSH %RBP |
0x4bc4a1 MOV %RSP,%RBP |
0x4bc4a4 PUSH %R15 |
0x4bc4a6 PUSH %R14 |
0x4bc4a8 PUSH %R13 |
0x4bc4aa PUSH %R12 |
0x4bc4ac PUSH %RBX |
0x4bc4ad SUB $0xb8,%RSP |
0x4bc4b4 MOV %R9,-0x88(%RBP) |
0x4bc4bb MOV %R8,-0xb8(%RBP) |
0x4bc4c2 MOV %RCX,-0x58(%RBP) |
0x4bc4c6 MOV %RDX,-0x50(%RBP) |
0x4bc4ca MOV %RDI,-0x90(%RBP) |
0x4bc4d1 MOV 0xc0(%RBP),%R14 |
0x4bc4d8 MOV 0xb8(%RBP),%R13 |
0x4bc4df MOV 0x90(%RBP),%R12 |
0x4bc4e6 MOV 0x80(%RBP),%R15 |
0x4bc4ed CALL 4e8ff0 <hypre_GetThreadNum> |
0x4bc4f2 MOV %RAX,%RCX |
0x4bc4f5 LEA 0x1(%RAX),%RBX |
0x4bc4f9 MOV %RBX,%RAX |
0x4bc4fc IMUL %R14,%RAX |
0x4bc500 CMP %R13,%RCX |
0x4bc503 JGE 4bc648 |
0x4bc509 LEA 0x1(%R14),%RDX |
0x4bc50d IMUL %RCX,%RDX |
0x4bc511 ADD %RAX,%RBX |
0x4bc514 MOV %R15,%RAX |
0x4bc517 OR %R12,%RAX |
0x4bc51a MOV %RCX,-0x60(%RBP) |
0x4bc51e JE 4bc668 |
0x4bc524 MOV %RDX,%R13 |
0x4bc527 LEA (%R12,%R15,1),%RDI |
0x4bc52b MOV $0x8,%ESI |
0x4bc530 CALL 4e72c0 <hypre_CAlloc> |
0x4bc535 MOV %RAX,%R14 |
0x4bc538 ADD %R15,%R12 |
0x4bc53b JLE 4bc551 |
0x4bc53d SAL $0x3,%R12 |
0x4bc541 MOV %R14,%RDI |
0x4bc544 MOV $0xff,%ESI |
0x4bc549 MOV %R12,%RDX |
0x4bc54c CALL 4f03c0 <_intel_fast_memset> |
0x4bc551 MOV -0x60(%RBP),%RCX |
0x4bc555 MOV %R13,%RDX |
0x4bc558 MOV %RDX,-0x40(%RBP) |
0x4bc55c CMP %RBX,%RDX |
0x4bc55f MOV %RBX,-0x48(%RBP) |
0x4bc563 JL 4bc67c |
0x4bc569 XOR %EBX,%EBX |
0x4bc56b XOR %EDX,%EDX |
0x4bc56d MOV 0xa8(%RBP),%R15 |
0x4bc574 MOV -0x60(%RBP),%R12 |
0x4bc578 MOV %RBX,(%R15,%R12,8) |
0x4bc57c MOV 0xb0(%RBP),%RBX |
0x4bc583 MOV %RDX,(%RBX,%R12,8) |
0x4bc587 MOV %R14,%RDI |
0x4bc58a CALL 4e7390 <hypre_Free> |
0x4bc58f MOV -0x90(%RBP),%RAX |
0x4bc596 MOV (%RAX),%ESI |
0x4bc598 MOV $0x537190,%EDI |
0x4bc59d CALL 410560 <__kmpc_barrier@plt> |
0x4bc5a2 TEST %R12,%R12 |
0x4bc5a5 JE 4bcfaa |
0x4bc5ab MOV %R12,%RDI |
0x4bc5ae MOV (%R15),%RAX |
0x4bc5b1 MOV (%RBX),%RCX |
0x4bc5b4 CMP $0x1,%R12 |
0x4bc5b8 JLE 4bd0e3 |
0x4bc5be LEA -0x1(%RDI),%RSI |
0x4bc5c2 MOV %RSI,%RDX |
0x4bc5c5 AND $-0x4,%RDX |
0x4bc5c9 JE 4bd0f4 |
0x4bc5cf VMOVQ %RAX,%XMM1 |
0x4bc5d4 VMOVQ %RCX,%XMM0 |
0x4bc5d9 LEA -0x1(%RDX),%RAX |
0x4bc5dd XOR %ECX,%ECX |
0x4bc5df MOV -0x48(%RBP),%R11 |
0x4bc5e3 MOV 0xc0(%RBP),%R14 |
0x4bc5ea NOPW (%RAX,%RAX,1) |
(3557) 0x4bc5f0 VPADDQ 0x8(%R15,%RCX,8),%YMM1,%YMM1 |
(3557) 0x4bc5f7 VPADDQ 0x8(%RBX,%RCX,8),%YMM0,%YMM0 |
(3557) 0x4bc5fd ADD $0x4,%RCX |
(3557) 0x4bc601 CMP %RAX,%RCX |
(3557) 0x4bc604 JLE 4bc5f0 |
0x4bc606 VEXTRACTI128 $0x1,%YMM1,%XMM2 |
0x4bc60c VPADDQ %XMM2,%XMM1,%XMM1 |
0x4bc610 VPSHUFD $-0x12,%XMM1,%XMM2 |
0x4bc615 VPADDQ %XMM2,%XMM1,%XMM1 |
0x4bc619 VMOVQ %XMM1,%RAX |
0x4bc61e VEXTRACTI128 $0x1,%YMM0,%XMM1 |
0x4bc624 VPADDQ %XMM1,%XMM0,%XMM0 |
0x4bc628 VPSHUFD $-0x12,%XMM0,%XMM1 |
0x4bc62d VPADDQ %XMM1,%XMM0,%XMM0 |
0x4bc631 VMOVQ %XMM0,%RCX |
0x4bc636 CMP %RDX,%RSI |
0x4bc639 MOV -0x40(%RBP),%RSI |
0x4bc63d JNE 4bd105 |
0x4bc643 JMP 4bd120 |
0x4bc648 MOV %RCX,%RDX |
0x4bc64b IMUL %R14,%RDX |
0x4bc64f ADD %R13,%RDX |
0x4bc652 ADD %R13,%RAX |
0x4bc655 MOV %RAX,%RBX |
0x4bc658 MOV %R15,%RAX |
0x4bc65b OR %R12,%RAX |
0x4bc65e MOV %RCX,-0x60(%RBP) |
0x4bc662 JNE 4bc524 |
0x4bc668 XOR %R14D,%R14D |
0x4bc66b MOV %RDX,-0x40(%RBP) |
0x4bc66f CMP %RBX,%RDX |
0x4bc672 MOV %RBX,-0x48(%RBP) |
0x4bc676 JGE 4bc569 |
0x4bc67c MOV 0x60(%RBP),%RSI |
0x4bc680 MOV 0x58(%RBP),%RDX |
0x4bc684 MOV 0x48(%RBP),%RDI |
0x4bc688 MOV 0x38(%RBP),%R8 |
0x4bc68c MOV 0x28(%RBP),%R9 |
0x4bc690 MOV 0xb8(%RBP),%RAX |
0x4bc697 CMP %RAX,%RCX |
0x4bc69a CMOVL %RCX,%RAX |
0x4bc69e IMUL 0xc0(%RBP),%RCX |
0x4bc6a6 ADD %RAX,%RCX |
0x4bc6a9 MOV %RCX,-0xb0(%RBP) |
0x4bc6b0 NOT %RCX |
0x4bc6b3 ADD %RBX,%RCX |
0x4bc6b6 MOV %RCX,-0xa8(%RBP) |
0x4bc6bd MOV -0x50(%RBP),%RAX |
0x4bc6c1 MOV (%RAX),%RAX |
0x4bc6c4 MOV %RAX,-0xa0(%RBP) |
0x4bc6cb MOV -0x58(%RBP),%RAX |
0x4bc6cf MOV (%RAX),%RAX |
0x4bc6d2 MOV %RAX,-0x98(%RBP) |
0x4bc6d9 LEA 0x38(%RDX),%RAX |
0x4bc6dd MOV %RAX,-0xd8(%RBP) |
0x4bc6e4 LEA 0x38(%RDI),%RAX |
0x4bc6e8 MOV %RAX,-0xd0(%RBP) |
0x4bc6ef LEA 0x38(%R9),%RAX |
0x4bc6f3 MOV %RAX,-0x80(%RBP) |
0x4bc6f7 LEA 0x18(%R8),%RAX |
0x4bc6fb MOV %RAX,-0xc8(%RBP) |
0x4bc702 XOR %EDI,%EDI |
0x4bc704 XOR %R10D,%R10D |
0x4bc707 XOR %R8D,%R8D |
0x4bc70a MOV %R8,%RBX |
0x4bc70d JMP 4bc748 |
0x4bc70f NOP |
(3558) 0x4bc710 MOV -0xa0(%RBP),%RAX |
(3558) 0x4bc717 MOV -0x78(%RBP),%RCX |
(3558) 0x4bc71b MOV %R8,(%RAX,%RCX,8) |
(3558) 0x4bc71f MOV -0x98(%RBP),%RAX |
(3558) 0x4bc726 MOV %R10,(%RAX,%RCX,8) |
(3558) 0x4bc72a MOV -0xc0(%RBP),%RCX |
(3558) 0x4bc731 LEA 0x1(%RCX),%RDI |
(3558) 0x4bc735 MOV %RDX,%R10 |
(3558) 0x4bc738 MOV %RBX,%R8 |
(3558) 0x4bc73b CMP -0xa8(%RBP),%RCX |
(3558) 0x4bc742 JE 4bc56d |
(3558) 0x4bc748 MOV 0x78(%RBP),%RAX |
(3558) 0x4bc74c TEST %RAX,%RAX |
(3558) 0x4bc74f MOV -0xb0(%RBP),%RCX |
(3558) 0x4bc756 JE 4bc764 |
(3558) 0x4bc758 LEA (%RCX,%RDI,1),%RAX |
(3558) 0x4bc75c MOV %R8,(%R14,%RAX,8) |
(3558) 0x4bc760 LEA 0x1(%R8),%RBX |
(3558) 0x4bc764 ADD %RDI,%RCX |
(3558) 0x4bc767 CMPQ $0,0x70(%RBP) |
(3558) 0x4bc76c MOV %RCX,-0x78(%RBP) |
(3558) 0x4bc770 MOV %RDI,-0xc0(%RBP) |
(3558) 0x4bc777 JE 4bcb30 |
(3558) 0x4bc77d MOV 0x10(%RBP),%RAX |
(3558) 0x4bc781 MOV (%RAX,%RCX,8),%R13 |
(3558) 0x4bc785 MOV 0x8(%RAX,%RCX,8),%RDX |
(3558) 0x4bc78a LEA 0x1(%RCX),%R9 |
(3558) 0x4bc78e CMP %RDX,%R13 |
(3558) 0x4bc791 JGE 4bcb34 |
(3558) 0x4bc797 MOV %R13,%RAX |
(3558) 0x4bc79a NOT %RAX |
(3558) 0x4bc79d ADD %RAX,%RDX |
(3558) 0x4bc7a0 MOV %RDX,-0x30(%RBP) |
(3558) 0x4bc7a4 XOR %EAX,%EAX |
(3558) 0x4bc7a6 MOV %R10,%RDX |
(3558) 0x4bc7a9 MOV %R9,-0x38(%RBP) |
(3558) 0x4bc7ad MOV %R13,-0x68(%RBP) |
(3558) 0x4bc7b1 JMP 4bc7da |
0x4bc7b3 NOPW %CS:(%RAX,%RAX,1) |
(3567) 0x4bc7c0 MOV -0x68(%RBP),%R13 |
(3567) 0x4bc7c4 MOV -0x70(%RBP),%RCX |
(3567) 0x4bc7c8 LEA 0x1(%RCX),%RAX |
(3567) 0x4bc7cc CMP -0x30(%RBP),%RCX |
(3567) 0x4bc7d0 MOV -0x38(%RBP),%R9 |
(3567) 0x4bc7d4 JE 4bcb40 |
(3567) 0x4bc7da MOV %RAX,-0x70(%RBP) |
(3567) 0x4bc7de ADD %R13,%RAX |
(3567) 0x4bc7e1 MOV 0x18(%RBP),%RCX |
(3567) 0x4bc7e5 MOV (%RCX,%RAX,8),%RAX |
(3567) 0x4bc7e9 MOV 0x50(%RBP),%RCX |
(3567) 0x4bc7ed MOV (%RCX,%RAX,8),%R13 |
(3567) 0x4bc7f1 MOV 0x8(%RCX,%RAX,8),%RDI |
(3567) 0x4bc7f6 MOV %RDI,%R11 |
(3567) 0x4bc7f9 SUB %R13,%R11 |
(3567) 0x4bc7fc JLE 4bc840 |
(3567) 0x4bc7fe CMP $0x8,%R11 |
(3567) 0x4bc802 JAE 4bc8a0 |
(3567) 0x4bc808 MOV %R11,%RCX |
(3567) 0x4bc80b AND $-0x8,%RCX |
(3567) 0x4bc80f CMP %R11,%RCX |
(3567) 0x4bc812 JAE 4bc840 |
(3567) 0x4bc814 ADD %RCX,%R13 |
(3567) 0x4bc817 MOV 0x58(%RBP),%R9 |
(3567) 0x4bc81b JMP 4bc828 |
0x4bc81d NOPL (%RAX) |
(3570) 0x4bc820 INC %R13 |
(3570) 0x4bc823 CMP %R13,%RDI |
(3570) 0x4bc826 JE 4bc840 |
(3570) 0x4bc828 MOV (%R9,%R13,8),%RCX |
(3570) 0x4bc82c ADD %R15,%RCX |
(3570) 0x4bc82f CMP %R10,(%R14,%RCX,8) |
(3570) 0x4bc833 JGE 4bc820 |
(3570) 0x4bc835 MOV %RDX,(%R14,%RCX,8) |
(3570) 0x4bc839 INC %RDX |
(3570) 0x4bc83c JMP 4bc820 |
0x4bc83e XCHG %AX,%AX |
(3567) 0x4bc840 MOV 0x40(%RBP),%RCX |
(3567) 0x4bc844 MOV (%RCX,%RAX,8),%RDI |
(3567) 0x4bc848 MOV 0x8(%RCX,%RAX,8),%RAX |
(3567) 0x4bc84d MOV %RAX,%R9 |
(3567) 0x4bc850 SUB %RDI,%R9 |
(3567) 0x4bc853 JLE 4bc7c0 |
(3567) 0x4bc859 CMP $0x8,%R9 |
(3567) 0x4bc85d JAE 4bca20 |
(3567) 0x4bc863 MOV -0x68(%RBP),%R13 |
(3567) 0x4bc867 MOV %R9,%RCX |
(3567) 0x4bc86a AND $-0x8,%RCX |
(3567) 0x4bc86e CMP %R9,%RCX |
(3567) 0x4bc871 JAE 4bc7c4 |
(3567) 0x4bc877 ADD %RCX,%RDI |
(3567) 0x4bc87a MOV 0x48(%RBP),%R9 |
(3567) 0x4bc87e JMP 4bc88c |
(3568) 0x4bc880 INC %RDI |
(3568) 0x4bc883 CMP %RDI,%RAX |
(3568) 0x4bc886 JE 4bc7c4 |
(3568) 0x4bc88c MOV (%R9,%RDI,8),%RCX |
(3568) 0x4bc890 CMP %R8,(%R14,%RCX,8) |
(3568) 0x4bc894 JGE 4bc880 |
(3568) 0x4bc896 MOV %RBX,(%R14,%RCX,8) |
(3568) 0x4bc89a INC %RBX |
(3568) 0x4bc89d JMP 4bc880 |
0x4bc89f NOP |
(3567) 0x4bc8a0 MOV %R11,%R9 |
(3567) 0x4bc8a3 SHR $0x3,%R9 |
(3567) 0x4bc8a7 MOV -0xd8(%RBP),%RCX |
(3567) 0x4bc8ae LEA (%RCX,%R13,8),%RCX |
(3567) 0x4bc8b2 JMP 4bc8cd |
0x4bc8b4 NOPW %CS:(%RAX,%RAX,1) |
(3571) 0x4bc8c0 ADD $0x40,%RCX |
(3571) 0x4bc8c4 DEC %R9 |
(3571) 0x4bc8c7 JE 4bc808 |
(3571) 0x4bc8cd MOV -0x38(%RCX),%R12 |
(3571) 0x4bc8d1 ADD %R15,%R12 |
(3571) 0x4bc8d4 CMP %R10,(%R14,%R12,8) |
(3571) 0x4bc8d8 JGE 4bc980 |
(3571) 0x4bc8de MOV %RDX,(%R14,%R12,8) |
(3571) 0x4bc8e2 INC %RDX |
(3571) 0x4bc8e5 MOV -0x30(%RCX),%R12 |
(3571) 0x4bc8e9 ADD %R15,%R12 |
(3571) 0x4bc8ec CMP %R10,(%R14,%R12,8) |
(3571) 0x4bc8f0 JL 4bc991 |
(3571) 0x4bc8f6 MOV -0x28(%RCX),%R12 |
(3571) 0x4bc8fa ADD %R15,%R12 |
(3571) 0x4bc8fd CMP %R10,(%R14,%R12,8) |
(3571) 0x4bc901 JGE 4bc9a9 |
(3571) 0x4bc907 MOV %RDX,(%R14,%R12,8) |
(3571) 0x4bc90b INC %RDX |
(3571) 0x4bc90e MOV -0x20(%RCX),%R12 |
(3571) 0x4bc912 ADD %R15,%R12 |
(3571) 0x4bc915 CMP %R10,(%R14,%R12,8) |
(3571) 0x4bc919 JL 4bc9ba |
(3571) 0x4bc91f MOV -0x18(%RCX),%R12 |
(3571) 0x4bc923 ADD %R15,%R12 |
(3571) 0x4bc926 CMP %R10,(%R14,%R12,8) |
(3571) 0x4bc92a JGE 4bc9d2 |
(3571) 0x4bc930 MOV %RDX,(%R14,%R12,8) |
(3571) 0x4bc934 INC %RDX |
(3571) 0x4bc937 MOV -0x10(%RCX),%R12 |
(3571) 0x4bc93b ADD %R15,%R12 |
(3571) 0x4bc93e CMP %R10,(%R14,%R12,8) |
(3571) 0x4bc942 JL 4bc9e3 |
(3571) 0x4bc948 MOV -0x8(%RCX),%R12 |
(3571) 0x4bc94c ADD %R15,%R12 |
(3571) 0x4bc94f CMP %R10,(%R14,%R12,8) |
(3571) 0x4bc953 JGE 4bc9fb |
(3571) 0x4bc959 MOV %RDX,(%R14,%R12,8) |
(3571) 0x4bc95d INC %RDX |
(3571) 0x4bc960 MOV (%RCX),%R12 |
(3571) 0x4bc963 ADD %R15,%R12 |
(3571) 0x4bc966 CMP %R10,(%R14,%R12,8) |
(3571) 0x4bc96a JGE 4bc8c0 |
(3571) 0x4bc970 JMP 4bca0b |
0x4bc975 NOPW %CS:(%RAX,%RAX,1) |
(3571) 0x4bc980 MOV -0x30(%RCX),%R12 |
(3571) 0x4bc984 ADD %R15,%R12 |
(3571) 0x4bc987 CMP %R10,(%R14,%R12,8) |
(3571) 0x4bc98b JGE 4bc8f6 |
(3571) 0x4bc991 MOV %RDX,(%R14,%R12,8) |
(3571) 0x4bc995 INC %RDX |
(3571) 0x4bc998 MOV -0x28(%RCX),%R12 |
(3571) 0x4bc99c ADD %R15,%R12 |
(3571) 0x4bc99f CMP %R10,(%R14,%R12,8) |
(3571) 0x4bc9a3 JL 4bc907 |
(3571) 0x4bc9a9 MOV -0x20(%RCX),%R12 |
(3571) 0x4bc9ad ADD %R15,%R12 |
(3571) 0x4bc9b0 CMP %R10,(%R14,%R12,8) |
(3571) 0x4bc9b4 JGE 4bc91f |
(3571) 0x4bc9ba MOV %RDX,(%R14,%R12,8) |
(3571) 0x4bc9be INC %RDX |
(3571) 0x4bc9c1 MOV -0x18(%RCX),%R12 |
(3571) 0x4bc9c5 ADD %R15,%R12 |
(3571) 0x4bc9c8 CMP %R10,(%R14,%R12,8) |
(3571) 0x4bc9cc JL 4bc930 |
(3571) 0x4bc9d2 MOV -0x10(%RCX),%R12 |
(3571) 0x4bc9d6 ADD %R15,%R12 |
(3571) 0x4bc9d9 CMP %R10,(%R14,%R12,8) |
(3571) 0x4bc9dd JGE 4bc948 |
(3571) 0x4bc9e3 MOV %RDX,(%R14,%R12,8) |
(3571) 0x4bc9e7 INC %RDX |
(3571) 0x4bc9ea MOV -0x8(%RCX),%R12 |
(3571) 0x4bc9ee ADD %R15,%R12 |
(3571) 0x4bc9f1 CMP %R10,(%R14,%R12,8) |
(3571) 0x4bc9f5 JL 4bc959 |
(3571) 0x4bc9fb MOV (%RCX),%R12 |
(3571) 0x4bc9fe ADD %R15,%R12 |
(3571) 0x4bca01 CMP %R10,(%R14,%R12,8) |
(3571) 0x4bca05 JGE 4bc8c0 |
(3571) 0x4bca0b MOV %RDX,(%R14,%R12,8) |
(3571) 0x4bca0f INC %RDX |
(3571) 0x4bca12 JMP 4bc8c0 |
0x4bca17 NOPW (%RAX,%RAX,1) |
(3567) 0x4bca20 MOV %R9,%RCX |
(3567) 0x4bca23 SHR $0x3,%RCX |
(3567) 0x4bca27 MOV -0xd0(%RBP),%R11 |
(3567) 0x4bca2e LEA (%R11,%RDI,8),%R11 |
(3567) 0x4bca32 MOV -0x68(%RBP),%R13 |
(3567) 0x4bca36 JMP 4bca4d |
0x4bca38 NOPL (%RAX,%RAX,1) |
(3569) 0x4bca40 ADD $0x40,%R11 |
(3569) 0x4bca44 DEC %RCX |
(3569) 0x4bca47 JE 4bc867 |
(3569) 0x4bca4d MOV -0x38(%R11),%R12 |
(3569) 0x4bca51 CMP %R8,(%R14,%R12,8) |
(3569) 0x4bca55 JGE 4bcac0 |
(3569) 0x4bca57 MOV %RBX,(%R14,%R12,8) |
(3569) 0x4bca5b INC %RBX |
(3569) 0x4bca5e MOV -0x30(%R11),%R12 |
(3569) 0x4bca62 CMP %R8,(%R14,%R12,8) |
(3569) 0x4bca66 JL 4bcaca |
(3569) 0x4bca68 MOV -0x28(%R11),%R12 |
(3569) 0x4bca6c CMP %R8,(%R14,%R12,8) |
(3569) 0x4bca70 JGE 4bcadb |
(3569) 0x4bca72 MOV %RBX,(%R14,%R12,8) |
(3569) 0x4bca76 INC %RBX |
(3569) 0x4bca79 MOV -0x20(%R11),%R12 |
(3569) 0x4bca7d CMP %R8,(%R14,%R12,8) |
(3569) 0x4bca81 JL 4bcae5 |
(3569) 0x4bca83 MOV -0x18(%R11),%R12 |
(3569) 0x4bca87 CMP %R8,(%R14,%R12,8) |
(3569) 0x4bca8b JGE 4bcaf6 |
(3569) 0x4bca8d MOV %RBX,(%R14,%R12,8) |
(3569) 0x4bca91 INC %RBX |
(3569) 0x4bca94 MOV -0x10(%R11),%R12 |
(3569) 0x4bca98 CMP %R8,(%R14,%R12,8) |
(3569) 0x4bca9c JL 4bcb00 |
(3569) 0x4bca9e MOV -0x8(%R11),%R12 |
(3569) 0x4bcaa2 CMP %R8,(%R14,%R12,8) |
(3569) 0x4bcaa6 JGE 4bcb11 |
(3569) 0x4bcaa8 MOV %RBX,(%R14,%R12,8) |
(3569) 0x4bcaac INC %RBX |
(3569) 0x4bcaaf MOV (%R11),%R12 |
(3569) 0x4bcab2 CMP %R8,(%R14,%R12,8) |
(3569) 0x4bcab6 JGE 4bca40 |
(3569) 0x4bcab8 JMP 4bcb1e |
0x4bcaba NOPW (%RAX,%RAX,1) |
(3569) 0x4bcac0 MOV -0x30(%R11),%R12 |
(3569) 0x4bcac4 CMP %R8,(%R14,%R12,8) |
(3569) 0x4bcac8 JGE 4bca68 |
(3569) 0x4bcaca MOV %RBX,(%R14,%R12,8) |
(3569) 0x4bcace INC %RBX |
(3569) 0x4bcad1 MOV -0x28(%R11),%R12 |
(3569) 0x4bcad5 CMP %R8,(%R14,%R12,8) |
(3569) 0x4bcad9 JL 4bca72 |
(3569) 0x4bcadb MOV -0x20(%R11),%R12 |
(3569) 0x4bcadf CMP %R8,(%R14,%R12,8) |
(3569) 0x4bcae3 JGE 4bca83 |
(3569) 0x4bcae5 MOV %RBX,(%R14,%R12,8) |
(3569) 0x4bcae9 INC %RBX |
(3569) 0x4bcaec MOV -0x18(%R11),%R12 |
(3569) 0x4bcaf0 CMP %R8,(%R14,%R12,8) |
(3569) 0x4bcaf4 JL 4bca8d |
(3569) 0x4bcaf6 MOV -0x10(%R11),%R12 |
(3569) 0x4bcafa CMP %R8,(%R14,%R12,8) |
(3569) 0x4bcafe JGE 4bca9e |
(3569) 0x4bcb00 MOV %RBX,(%R14,%R12,8) |
(3569) 0x4bcb04 INC %RBX |
(3569) 0x4bcb07 MOV -0x8(%R11),%R12 |
(3569) 0x4bcb0b CMP %R8,(%R14,%R12,8) |
(3569) 0x4bcb0f JL 4bcaa8 |
(3569) 0x4bcb11 MOV (%R11),%R12 |
(3569) 0x4bcb14 CMP %R8,(%R14,%R12,8) |
(3569) 0x4bcb18 JGE 4bca40 |
(3569) 0x4bcb1e MOV %RBX,(%R14,%R12,8) |
(3569) 0x4bcb22 INC %RBX |
(3569) 0x4bcb25 JMP 4bca40 |
0x4bcb2a NOPW (%RAX,%RAX,1) |
(3558) 0x4bcb30 LEA 0x1(%RCX),%R9 |
(3558) 0x4bcb34 MOV %R10,%RDX |
(3558) 0x4bcb37 JMP 4bcb44 |
0x4bcb39 NOPL (%RAX) |
(3558) 0x4bcb40 MOV -0x78(%RBP),%RCX |
(3558) 0x4bcb44 MOV -0xb8(%RBP),%RAX |
(3558) 0x4bcb4b MOV (%RAX,%RCX,8),%R11 |
(3558) 0x4bcb4f MOV (%RAX,%R9,8),%RCX |
(3558) 0x4bcb53 CMP %RCX,%R11 |
(3558) 0x4bcb56 JGE 4bc710 |
(3558) 0x4bcb5c MOV %R11,%RAX |
(3558) 0x4bcb5f NOT %RAX |
(3558) 0x4bcb62 ADD %RAX,%RCX |
(3558) 0x4bcb65 MOV %RCX,-0x38(%RBP) |
(3558) 0x4bcb69 CMPQ $0,0x88(%RBP) |
(3558) 0x4bcb71 MOV %R11,-0x30(%RBP) |
(3558) 0x4bcb75 JE 4bce1a |
(3558) 0x4bcb7b XOR %EAX,%EAX |
(3558) 0x4bcb7d JMP 4bcb99 |
0x4bcb7f NOP |
(3562) 0x4bcb80 MOV -0x30(%RBP),%R11 |
(3562) 0x4bcb84 MOV -0x70(%RBP),%RDI |
(3562) 0x4bcb88 LEA 0x1(%RDI),%RAX |
(3562) 0x4bcb8c MOV -0x38(%RBP),%RCX |
(3562) 0x4bcb90 CMP %RCX,%RDI |
(3562) 0x4bcb93 JE 4bc710 |
(3562) 0x4bcb99 MOV %RAX,-0x70(%RBP) |
(3562) 0x4bcb9d ADD %R11,%RAX |
(3562) 0x4bcba0 MOV -0x88(%RBP),%RCX |
(3562) 0x4bcba7 MOV (%RCX,%RAX,8),%RDI |
(3562) 0x4bcbab MOV 0x20(%RBP),%RCX |
(3562) 0x4bcbaf MOV (%RCX,%RDI,8),%RAX |
(3562) 0x4bcbb3 MOV 0x8(%RCX,%RDI,8),%R13 |
(3562) 0x4bcbb8 MOV %R13,%R9 |
(3562) 0x4bcbbb SUB %RAX,%R9 |
(3562) 0x4bcbbe JLE 4bcd24 |
(3562) 0x4bcbc4 CMP $0x8,%R9 |
(3562) 0x4bcbc8 JAE 4bcc10 |
(3562) 0x4bcbca MOV %R9,%RCX |
(3562) 0x4bcbcd AND $-0x8,%RCX |
(3562) 0x4bcbd1 CMP %R9,%RCX |
(3562) 0x4bcbd4 JAE 4bcd20 |
(3562) 0x4bcbda ADD %RCX,%RAX |
(3562) 0x4bcbdd MOV 0x28(%RBP),%R9 |
(3562) 0x4bcbe1 MOV -0x30(%RBP),%R11 |
(3562) 0x4bcbe5 JMP 4bcbfc |
0x4bcbe7 NOPW (%RAX,%RAX,1) |
(3565) 0x4bcbf0 INC %RAX |
(3565) 0x4bcbf3 CMP %RAX,%R13 |
(3565) 0x4bcbf6 JE 4bcd24 |
(3565) 0x4bcbfc MOV (%R9,%RAX,8),%RCX |
(3565) 0x4bcc00 CMP %R8,(%R14,%RCX,8) |
(3565) 0x4bcc04 JGE 4bcbf0 |
(3565) 0x4bcc06 MOV %RBX,(%R14,%RCX,8) |
(3565) 0x4bcc0a INC %RBX |
(3565) 0x4bcc0d JMP 4bcbf0 |
0x4bcc0f NOP |
(3562) 0x4bcc10 MOV %R9,%RCX |
(3562) 0x4bcc13 SHR $0x3,%RCX |
(3562) 0x4bcc17 MOV -0x80(%RBP),%R11 |
(3562) 0x4bcc1b LEA (%R11,%RAX,8),%R11 |
(3562) 0x4bcc1f JMP 4bcc39 |
0x4bcc21 NOPW %CS:(%RAX,%RAX,1) |
(3566) 0x4bcc30 ADD $0x40,%R11 |
(3566) 0x4bcc34 DEC %RCX |
(3566) 0x4bcc37 JE 4bcbca |
(3566) 0x4bcc39 MOV -0x38(%R11),%R12 |
(3566) 0x4bcc3d CMP %R8,(%R14,%R12,8) |
(3566) 0x4bcc41 JGE 4bccb0 |
(3566) 0x4bcc43 MOV %RBX,(%R14,%R12,8) |
(3566) 0x4bcc47 INC %RBX |
(3566) 0x4bcc4a MOV -0x30(%R11),%R12 |
(3566) 0x4bcc4e CMP %R8,(%R14,%R12,8) |
(3566) 0x4bcc52 JL 4bccba |
(3566) 0x4bcc54 MOV -0x28(%R11),%R12 |
(3566) 0x4bcc58 CMP %R8,(%R14,%R12,8) |
(3566) 0x4bcc5c JGE 4bcccb |
(3566) 0x4bcc5e MOV %RBX,(%R14,%R12,8) |
(3566) 0x4bcc62 INC %RBX |
(3566) 0x4bcc65 MOV -0x20(%R11),%R12 |
(3566) 0x4bcc69 CMP %R8,(%R14,%R12,8) |
(3566) 0x4bcc6d JL 4bccd5 |
(3566) 0x4bcc6f MOV -0x18(%R11),%R12 |
(3566) 0x4bcc73 CMP %R8,(%R14,%R12,8) |
(3566) 0x4bcc77 JGE 4bcce6 |
(3566) 0x4bcc79 MOV %RBX,(%R14,%R12,8) |
(3566) 0x4bcc7d INC %RBX |
(3566) 0x4bcc80 MOV -0x10(%R11),%R12 |
(3566) 0x4bcc84 CMP %R8,(%R14,%R12,8) |
(3566) 0x4bcc88 JL 4bccf0 |
(3566) 0x4bcc8a MOV -0x8(%R11),%R12 |
(3566) 0x4bcc8e CMP %R8,(%R14,%R12,8) |
(3566) 0x4bcc92 JGE 4bcd01 |
(3566) 0x4bcc94 MOV %RBX,(%R14,%R12,8) |
(3566) 0x4bcc98 INC %RBX |
(3566) 0x4bcc9b MOV (%R11),%R12 |
(3566) 0x4bcc9e CMP %R8,(%R14,%R12,8) |
(3566) 0x4bcca2 JGE 4bcc30 |
(3566) 0x4bcca4 JMP 4bcd0e |
0x4bcca6 NOPW %CS:(%RAX,%RAX,1) |
(3566) 0x4bccb0 MOV -0x30(%R11),%R12 |
(3566) 0x4bccb4 CMP %R8,(%R14,%R12,8) |
(3566) 0x4bccb8 JGE 4bcc54 |
(3566) 0x4bccba MOV %RBX,(%R14,%R12,8) |
(3566) 0x4bccbe INC %RBX |
(3566) 0x4bccc1 MOV -0x28(%R11),%R12 |
(3566) 0x4bccc5 CMP %R8,(%R14,%R12,8) |
(3566) 0x4bccc9 JL 4bcc5e |
(3566) 0x4bcccb MOV -0x20(%R11),%R12 |
(3566) 0x4bcccf CMP %R8,(%R14,%R12,8) |
(3566) 0x4bccd3 JGE 4bcc6f |
(3566) 0x4bccd5 MOV %RBX,(%R14,%R12,8) |
(3566) 0x4bccd9 INC %RBX |
(3566) 0x4bccdc MOV -0x18(%R11),%R12 |
(3566) 0x4bcce0 CMP %R8,(%R14,%R12,8) |
(3566) 0x4bcce4 JL 4bcc79 |
(3566) 0x4bcce6 MOV -0x10(%R11),%R12 |
(3566) 0x4bccea CMP %R8,(%R14,%R12,8) |
(3566) 0x4bccee JGE 4bcc8a |
(3566) 0x4bccf0 MOV %RBX,(%R14,%R12,8) |
(3566) 0x4bccf4 INC %RBX |
(3566) 0x4bccf7 MOV -0x8(%R11),%R12 |
(3566) 0x4bccfb CMP %R8,(%R14,%R12,8) |
(3566) 0x4bccff JL 4bcc94 |
(3566) 0x4bcd01 MOV (%R11),%R12 |
(3566) 0x4bcd04 CMP %R8,(%R14,%R12,8) |
(3566) 0x4bcd08 JGE 4bcc30 |
(3566) 0x4bcd0e MOV %RBX,(%R14,%R12,8) |
(3566) 0x4bcd12 INC %RBX |
(3566) 0x4bcd15 JMP 4bcc30 |
0x4bcd1a NOPW (%RAX,%RAX,1) |
(3562) 0x4bcd20 MOV -0x30(%RBP),%R11 |
(3562) 0x4bcd24 MOV 0x30(%RBP),%RCX |
(3562) 0x4bcd28 MOV (%RCX,%RDI,8),%RAX |
(3562) 0x4bcd2c MOV 0x8(%RCX,%RDI,8),%RCX |
(3562) 0x4bcd31 MOV %RCX,%RDI |
(3562) 0x4bcd34 SUB %RAX,%RDI |
(3562) 0x4bcd37 JLE 4bcb84 |
(3562) 0x4bcd3d CMP $0x4,%RDI |
(3562) 0x4bcd41 JAE 4bcd90 |
(3562) 0x4bcd43 MOV %RDI,%R9 |
(3562) 0x4bcd46 AND $-0x4,%R9 |
(3562) 0x4bcd4a CMP %RDI,%R9 |
(3562) 0x4bcd4d JAE 4bcb80 |
(3562) 0x4bcd53 ADD %R9,%RAX |
(3562) 0x4bcd56 MOV 0x38(%RBP),%R9 |
(3562) 0x4bcd5a MOV -0x30(%RBP),%R11 |
(3562) 0x4bcd5e JMP 4bcd6c |
(3563) 0x4bcd60 INC %RAX |
(3563) 0x4bcd63 CMP %RAX,%RCX |
(3563) 0x4bcd66 JE 4bcb84 |
(3563) 0x4bcd6c MOV (%R9,%RAX,8),%RDI |
(3563) 0x4bcd70 MOV (%RSI,%RDI,8),%RDI |
(3563) 0x4bcd74 ADD %R15,%RDI |
(3563) 0x4bcd77 CMP %R10,(%R14,%RDI,8) |
(3563) 0x4bcd7b JGE 4bcd60 |
(3563) 0x4bcd7d MOV %RDX,(%R14,%RDI,8) |
(3563) 0x4bcd81 INC %RDX |
(3563) 0x4bcd84 JMP 4bcd60 |
0x4bcd86 NOPW %CS:(%RAX,%RAX,1) |
(3562) 0x4bcd90 MOV %RDI,%R9 |
(3562) 0x4bcd93 SHR $0x2,%R9 |
(3562) 0x4bcd97 MOV -0xc8(%RBP),%R11 |
(3562) 0x4bcd9e LEA (%R11,%RAX,8),%R11 |
(3562) 0x4bcda2 JMP 4bcdb9 |
0x4bcda4 NOPW %CS:(%RAX,%RAX,1) |
(3564) 0x4bcdb0 ADD $0x20,%R11 |
(3564) 0x4bcdb4 DEC %R9 |
(3564) 0x4bcdb7 JE 4bcd43 |
(3564) 0x4bcdb9 MOV -0x18(%R11),%R12 |
(3564) 0x4bcdbd MOV (%RSI,%R12,8),%R13 |
(3564) 0x4bcdc1 ADD %R15,%R13 |
(3564) 0x4bcdc4 CMP %R10,(%R14,%R13,8) |
(3564) 0x4bcdc8 JGE 4bcdd1 |
(3564) 0x4bcdca MOV %RDX,(%R14,%R13,8) |
(3564) 0x4bcdce INC %RDX |
(3564) 0x4bcdd1 MOV -0x10(%R11),%R12 |
(3564) 0x4bcdd5 MOV (%RSI,%R12,8),%R13 |
(3564) 0x4bcdd9 ADD %R15,%R13 |
(3564) 0x4bcddc CMP %R10,(%R14,%R13,8) |
(3564) 0x4bcde0 JGE 4bcde9 |
(3564) 0x4bcde2 MOV %RDX,(%R14,%R13,8) |
(3564) 0x4bcde6 INC %RDX |
(3564) 0x4bcde9 MOV -0x8(%R11),%R12 |
(3564) 0x4bcded MOV (%RSI,%R12,8),%R13 |
(3564) 0x4bcdf1 ADD %R15,%R13 |
(3564) 0x4bcdf4 CMP %R10,(%R14,%R13,8) |
(3564) 0x4bcdf8 JGE 4bce01 |
(3564) 0x4bcdfa MOV %RDX,(%R14,%R13,8) |
(3564) 0x4bcdfe INC %RDX |
(3564) 0x4bce01 MOV (%R11),%R12 |
(3564) 0x4bce04 MOV (%RSI,%R12,8),%R13 |
(3564) 0x4bce08 ADD %R15,%R13 |
(3564) 0x4bce0b CMP %R10,(%R14,%R13,8) |
(3564) 0x4bce0f JGE 4bcdb0 |
(3564) 0x4bce11 MOV %RDX,(%R14,%R13,8) |
(3564) 0x4bce15 INC %RDX |
(3564) 0x4bce18 JMP 4bcdb0 |
(3558) 0x4bce1a XOR %R12D,%R12D |
(3558) 0x4bce1d JMP 4bce39 |
0x4bce1f NOP |
(3559) 0x4bce20 MOV -0x30(%RBP),%R11 |
(3559) 0x4bce24 LEA 0x1(%R12),%RAX |
(3559) 0x4bce29 MOV -0x38(%RBP),%RCX |
(3559) 0x4bce2d CMP %RCX,%R12 |
(3559) 0x4bce30 MOV %RAX,%R12 |
(3559) 0x4bce33 JE 4bc710 |
(3559) 0x4bce39 LEA (%R11,%R12,1),%RAX |
(3559) 0x4bce3d MOV -0x88(%RBP),%RCX |
(3559) 0x4bce44 MOV (%RCX,%RAX,8),%RAX |
(3559) 0x4bce48 MOV 0x20(%RBP),%RCX |
(3559) 0x4bce4c MOV (%RCX,%RAX,8),%RDI |
(3559) 0x4bce50 MOV 0x8(%RCX,%RAX,8),%RAX |
(3559) 0x4bce55 MOV %RAX,%R9 |
(3559) 0x4bce58 SUB %RDI,%R9 |
(3559) 0x4bce5b JLE 4bce24 |
(3559) 0x4bce5d CMP $0x8,%R9 |
(3559) 0x4bce61 JAE 4bcea0 |
(3559) 0x4bce63 MOV %R9,%RCX |
(3559) 0x4bce66 AND $-0x8,%RCX |
(3559) 0x4bce6a CMP %R9,%RCX |
(3559) 0x4bce6d JAE 4bce20 |
(3559) 0x4bce6f ADD %RCX,%RDI |
(3559) 0x4bce72 MOV 0x28(%RBP),%R9 |
(3559) 0x4bce76 MOV -0x30(%RBP),%R11 |
(3559) 0x4bce7a JMP 4bce88 |
0x4bce7c NOPL (%RAX) |
(3560) 0x4bce80 INC %RDI |
(3560) 0x4bce83 CMP %RDI,%RAX |
(3560) 0x4bce86 JE 4bce24 |
(3560) 0x4bce88 MOV (%R9,%RDI,8),%RCX |
(3560) 0x4bce8c CMP %R8,(%R14,%RCX,8) |
(3560) 0x4bce90 JGE 4bce80 |
(3560) 0x4bce92 MOV %RBX,(%R14,%RCX,8) |
(3560) 0x4bce96 INC %RBX |
(3560) 0x4bce99 JMP 4bce80 |
0x4bce9b NOPL (%RAX,%RAX,1) |
(3559) 0x4bcea0 MOV %R9,%RCX |
(3559) 0x4bcea3 SHR $0x3,%RCX |
(3559) 0x4bcea7 MOV -0x80(%RBP),%R11 |
(3559) 0x4bceab LEA (%R11,%RDI,8),%R11 |
(3559) 0x4bceaf JMP 4bcec9 |
0x4bceb1 NOPW %CS:(%RAX,%RAX,1) |
(3561) 0x4bcec0 ADD $0x40,%R11 |
(3561) 0x4bcec4 DEC %RCX |
(3561) 0x4bcec7 JE 4bce63 |
(3561) 0x4bcec9 MOV -0x38(%R11),%R13 |
(3561) 0x4bcecd CMP %R8,(%R14,%R13,8) |
(3561) 0x4bced1 JGE 4bcf40 |
(3561) 0x4bced3 MOV %RBX,(%R14,%R13,8) |
(3561) 0x4bced7 INC %RBX |
(3561) 0x4bceda MOV -0x30(%R11),%R13 |
(3561) 0x4bcede CMP %R8,(%R14,%R13,8) |
(3561) 0x4bcee2 JL 4bcf4a |
(3561) 0x4bcee4 MOV -0x28(%R11),%R13 |
(3561) 0x4bcee8 CMP %R8,(%R14,%R13,8) |
(3561) 0x4bceec JGE 4bcf5b |
(3561) 0x4bceee MOV %RBX,(%R14,%R13,8) |
(3561) 0x4bcef2 INC %RBX |
(3561) 0x4bcef5 MOV -0x20(%R11),%R13 |
(3561) 0x4bcef9 CMP %R8,(%R14,%R13,8) |
(3561) 0x4bcefd JL 4bcf65 |
(3561) 0x4bceff MOV -0x18(%R11),%R13 |
(3561) 0x4bcf03 CMP %R8,(%R14,%R13,8) |
(3561) 0x4bcf07 JGE 4bcf76 |
(3561) 0x4bcf09 MOV %RBX,(%R14,%R13,8) |
(3561) 0x4bcf0d INC %RBX |
(3561) 0x4bcf10 MOV -0x10(%R11),%R13 |
(3561) 0x4bcf14 CMP %R8,(%R14,%R13,8) |
(3561) 0x4bcf18 JL 4bcf80 |
(3561) 0x4bcf1a MOV -0x8(%R11),%R13 |
(3561) 0x4bcf1e CMP %R8,(%R14,%R13,8) |
(3561) 0x4bcf22 JGE 4bcf91 |
(3561) 0x4bcf24 MOV %RBX,(%R14,%R13,8) |
(3561) 0x4bcf28 INC %RBX |
(3561) 0x4bcf2b MOV (%R11),%R13 |
(3561) 0x4bcf2e CMP %R8,(%R14,%R13,8) |
(3561) 0x4bcf32 JGE 4bcec0 |
(3561) 0x4bcf34 JMP 4bcf9e |
0x4bcf36 NOPW %CS:(%RAX,%RAX,1) |
(3561) 0x4bcf40 MOV -0x30(%R11),%R13 |
(3561) 0x4bcf44 CMP %R8,(%R14,%R13,8) |
(3561) 0x4bcf48 JGE 4bcee4 |
(3561) 0x4bcf4a MOV %RBX,(%R14,%R13,8) |
(3561) 0x4bcf4e INC %RBX |
(3561) 0x4bcf51 MOV -0x28(%R11),%R13 |
(3561) 0x4bcf55 CMP %R8,(%R14,%R13,8) |
(3561) 0x4bcf59 JL 4bceee |
(3561) 0x4bcf5b MOV -0x20(%R11),%R13 |
(3561) 0x4bcf5f CMP %R8,(%R14,%R13,8) |
(3561) 0x4bcf63 JGE 4bceff |
(3561) 0x4bcf65 MOV %RBX,(%R14,%R13,8) |
(3561) 0x4bcf69 INC %RBX |
(3561) 0x4bcf6c MOV -0x18(%R11),%R13 |
(3561) 0x4bcf70 CMP %R8,(%R14,%R13,8) |
(3561) 0x4bcf74 JL 4bcf09 |
(3561) 0x4bcf76 MOV -0x10(%R11),%R13 |
(3561) 0x4bcf7a CMP %R8,(%R14,%R13,8) |
(3561) 0x4bcf7e JGE 4bcf1a |
(3561) 0x4bcf80 MOV %RBX,(%R14,%R13,8) |
(3561) 0x4bcf84 INC %RBX |
(3561) 0x4bcf87 MOV -0x8(%R11),%R13 |
(3561) 0x4bcf8b CMP %R8,(%R14,%R13,8) |
(3561) 0x4bcf8f JL 4bcf24 |
(3561) 0x4bcf91 MOV (%R11),%R13 |
(3561) 0x4bcf94 CMP %R8,(%R14,%R13,8) |
(3561) 0x4bcf98 JGE 4bcec0 |
(3561) 0x4bcf9e MOV %RBX,(%R14,%R13,8) |
(3561) 0x4bcfa2 INC %RBX |
(3561) 0x4bcfa5 JMP 4bcec0 |
0x4bcfaa MOV 0xa0(%RBP),%RAX |
0x4bcfb1 MOV 0x68(%RBP),%RDX |
0x4bcfb5 MOV -0x50(%RBP),%RCX |
0x4bcfb9 MOV (%RCX),%RSI |
0x4bcfbc MOVQ $0,(%RSI,%RDX,8) |
0x4bcfc4 MOV -0x58(%RBP),%RCX |
0x4bcfc8 MOV (%RCX),%RDI |
0x4bcfcb MOVQ $0,(%RDI,%RDX,8) |
0x4bcfd3 TEST %RAX,%RAX |
0x4bcfd6 JLE 4bd2a6 |
0x4bcfdc LEA (%RSI,%RDX,8),%RCX |
0x4bcfe0 LEA (%RDI,%RDX,8),%RDX |
0x4bcfe4 LEA -0x8(%R15,%RAX,8),%R8 |
0x4bcfe9 CMP %RCX,%R8 |
0x4bcfec MOV %R15,%R9 |
0x4bcfef SETAE %R15B |
0x4bcff3 CMP %R9,%RCX |
0x4bcff6 SETAE %R12B |
0x4bcffa CMP %RDX,%R8 |
0x4bcffd MOV %RBX,%R10 |
0x4bd000 SETB %BL |
0x4bd003 CMP %R9,%RDX |
0x4bd006 SETB %R14B |
0x4bd00a CMP %R10,%RCX |
0x4bd00d SETB %R8B |
0x4bd011 LEA -0x8(%R10,%RAX,8),%R9 |
0x4bd016 CMP %RCX,%R9 |
0x4bd019 SETB %R11B |
0x4bd01d CMP %RDX,%R9 |
0x4bd020 SETB %R9B |
0x4bd024 CMP %R10,%RDX |
0x4bd027 SETB %R10B |
0x4bd02b TEST %R12B,%R15B |
0x4bd02e JNE 4bd201 |
0x4bd034 OR %R14B,%BL |
0x4bd037 JE 4bd201 |
0x4bd03d CMP %RSI,%RDI |
0x4bd040 JE 4bd201 |
0x4bd046 OR %R11B,%R8B |
0x4bd049 JE 4bd201 |
0x4bd04f OR %R10B,%R9B |
0x4bd052 JE 4bd201 |
0x4bd058 MOV %RAX,%RSI |
0x4bd05b AND $-0x4,%RSI |
0x4bd05f JE 4bd274 |
0x4bd065 LEA -0x1(%RSI),%RDI |
0x4bd069 VPXOR %XMM0,%XMM0,%XMM0 |
0x4bd06d XOR %R8D,%R8D |
0x4bd070 VPXOR %XMM1,%XMM1,%XMM1 |
0x4bd074 MOV 0xb0(%RBP),%R9 |
0x4bd07b MOV 0xa8(%RBP),%R10 |
0x4bd082 NOPW %CS:(%RAX,%RAX,1) |
(3552) 0x4bd090 VPADDQ (%R10,%R8,8),%YMM1,%YMM1 |
(3552) 0x4bd096 VPADDQ (%R9,%R8,8),%YMM0,%YMM0 |
(3552) 0x4bd09c ADD $0x4,%R8 |
(3552) 0x4bd0a0 CMP %RDI,%R8 |
(3552) 0x4bd0a3 JLE 4bd090 |
0x4bd0a5 VEXTRACTI128 $0x1,%YMM1,%XMM2 |
0x4bd0ab VPADDQ %XMM2,%XMM1,%XMM1 |
0x4bd0af VPSHUFD $-0x12,%XMM1,%XMM2 |
0x4bd0b4 VPADDQ %XMM2,%XMM1,%XMM1 |
0x4bd0b8 VMOVQ %XMM1,%RDI |
0x4bd0bd VEXTRACTI128 $0x1,%YMM0,%XMM1 |
0x4bd0c3 VPADDQ %XMM1,%XMM0,%XMM0 |
0x4bd0c7 VPSHUFD $-0x12,%XMM0,%XMM1 |
0x4bd0cc VPADDQ %XMM1,%XMM0,%XMM0 |
0x4bd0d0 VMOVQ %XMM0,%R8 |
0x4bd0d5 CMP %RAX,%RSI |
0x4bd0d8 JNE 4bd290 |
0x4bd0de JMP 4bd2a0 |
0x4bd0e3 MOV -0x48(%RBP),%R11 |
0x4bd0e7 MOV 0xc0(%RBP),%R14 |
0x4bd0ee MOV -0x40(%RBP),%RSI |
0x4bd0f2 JMP 4bd120 |
0x4bd0f4 XOR %EDX,%EDX |
0x4bd0f6 MOV -0x48(%RBP),%R11 |
0x4bd0fa MOV 0xc0(%RBP),%R14 |
0x4bd101 MOV -0x40(%RBP),%RSI |
0x4bd105 INC %RDX |
0x4bd108 NOPL (%RAX,%RAX,1) |
(3556) 0x4bd110 ADD (%R15,%RDX,8),%RAX |
(3556) 0x4bd114 ADD (%RBX,%RDX,8),%RCX |
(3556) 0x4bd118 INC %RDX |
(3556) 0x4bd11b CMP %RDX,%RDI |
(3556) 0x4bd11e JNE 4bd110 |
0x4bd120 CMP %R11,%RSI |
0x4bd123 JGE 4bd2a6 |
0x4bd129 MOV -0x50(%RBP),%RDX |
0x4bd12d MOV (%RDX),%RDX |
0x4bd130 MOV -0x58(%RBP),%RSI |
0x4bd134 MOV (%RSI),%RSI |
0x4bd137 LEA -0x8(%RDX,%R11,8),%R10 |
0x4bd13c MOV 0xb8(%RBP),%R12 |
0x4bd143 CMP %R12,%RDI |
0x4bd146 CMOVL %RDI,%R12 |
0x4bd14a IMUL %RDI,%R14 |
0x4bd14e LEA (%R12,%R14,1),%RDI |
0x4bd152 LEA (%RSI,%RDI,8),%R8 |
0x4bd156 LEA (%RDX,%RDI,8),%R9 |
0x4bd15a CMP %R8,%R10 |
0x4bd15d JB 4bd197 |
0x4bd15f LEA -0x8(%RSI,%R11,8),%R10 |
0x4bd164 CMP %R9,%R10 |
0x4bd167 JB 4bd197 |
0x4bd169 NOPL (%RAX) |
(3555) 0x4bd170 LEA (%RDX,%RDI,8),%R8 |
(3555) 0x4bd174 MOV (%R8),%R9 |
(3555) 0x4bd177 ADD %RAX,%R9 |
(3555) 0x4bd17a MOV %R9,(%R8) |
(3555) 0x4bd17d LEA (%RSI,%RDI,8),%R8 |
(3555) 0x4bd181 MOV (%R8),%R9 |
(3555) 0x4bd184 ADD %RCX,%R9 |
(3555) 0x4bd187 MOV %R9,(%R8) |
(3555) 0x4bd18a INC %RDI |
(3555) 0x4bd18d CMP %RDI,%R11 |
(3555) 0x4bd190 JNE 4bd170 |
0x4bd192 JMP 4bd2a6 |
0x4bd197 MOV %R11,%R10 |
0x4bd19a SUB %RDI,%R10 |
0x4bd19d MOV %R10,%RDI |
0x4bd1a0 AND $-0x4,%RDI |
0x4bd1a4 JE 4bd244 |
0x4bd1aa MOV %R14,%R15 |
0x4bd1ad MOV %R11,%R14 |
0x4bd1b0 LEA -0x1(%RDI),%R11 |
0x4bd1b4 VPBROADCASTQ %RAX,%YMM0 |
0x4bd1ba VPBROADCASTQ %RCX,%YMM1 |
0x4bd1c0 XOR %EBX,%EBX |
0x4bd1c2 NOPW %CS:(%RAX,%RAX,1) |
(3554) 0x4bd1d0 VPADDQ (%R9,%RBX,8),%YMM0,%YMM2 |
(3554) 0x4bd1d6 VMOVDQU %YMM2,(%R9,%RBX,8) |
(3554) 0x4bd1dc VPADDQ (%R8,%RBX,8),%YMM1,%YMM2 |
(3554) 0x4bd1e2 VMOVDQU %YMM2,(%R8,%RBX,8) |
(3554) 0x4bd1e8 ADD $0x4,%RBX |
(3554) 0x4bd1ec CMP %R11,%RBX |
(3554) 0x4bd1ef JBE 4bd1d0 |
0x4bd1f1 CMP %RDI,%R10 |
0x4bd1f4 MOV %R14,%R11 |
0x4bd1f7 MOV %R15,%R14 |
0x4bd1fa JNE 4bd246 |
0x4bd1fc JMP 4bd2a6 |
0x4bd201 XOR %ESI,%ESI |
0x4bd203 MOV 0xb0(%RBP),%R9 |
0x4bd20a MOV 0xa8(%RBP),%R10 |
0x4bd211 NOPW %CS:(%RAX,%RAX,1) |
(3550) 0x4bd220 MOV (%R10,%RSI,8),%RDI |
(3550) 0x4bd224 MOV (%RCX),%R8 |
(3550) 0x4bd227 ADD %RDI,%R8 |
(3550) 0x4bd22a MOV %R8,(%RCX) |
(3550) 0x4bd22d MOV (%R9,%RSI,8),%RDI |
(3550) 0x4bd231 MOV (%RDX),%R8 |
(3550) 0x4bd234 ADD %RDI,%R8 |
(3550) 0x4bd237 MOV %R8,(%RDX) |
(3550) 0x4bd23a INC %RSI |
(3550) 0x4bd23d CMP %RSI,%RAX |
(3550) 0x4bd240 JNE 4bd220 |
0x4bd242 JMP 4bd2a6 |
0x4bd244 XOR %EDI,%EDI |
0x4bd246 ADD %R12,%RDI |
0x4bd249 ADD %R14,%RDI |
0x4bd24c NOPL (%RAX) |
(3553) 0x4bd250 LEA (%RDX,%RDI,8),%R8 |
(3553) 0x4bd254 MOV (%R8),%R9 |
(3553) 0x4bd257 ADD %RAX,%R9 |
(3553) 0x4bd25a MOV %R9,(%R8) |
(3553) 0x4bd25d LEA (%RSI,%RDI,8),%R8 |
(3553) 0x4bd261 MOV (%R8),%R9 |
(3553) 0x4bd264 ADD %RCX,%R9 |
(3553) 0x4bd267 MOV %R9,(%R8) |
(3553) 0x4bd26a INC %RDI |
(3553) 0x4bd26d CMP %RDI,%R11 |
(3553) 0x4bd270 JNE 4bd250 |
0x4bd272 JMP 4bd2a6 |
0x4bd274 XOR %R8D,%R8D |
0x4bd277 XOR %EDI,%EDI |
0x4bd279 XOR %ESI,%ESI |
0x4bd27b MOV 0xb0(%RBP),%R9 |
0x4bd282 MOV 0xa8(%RBP),%R10 |
0x4bd289 NOPL (%RAX) |
(3551) 0x4bd290 ADD (%R10,%RSI,8),%RDI |
(3551) 0x4bd294 ADD (%R9,%RSI,8),%R8 |
(3551) 0x4bd298 INC %RSI |
(3551) 0x4bd29b CMP %RSI,%RAX |
(3551) 0x4bd29e JNE 4bd290 |
0x4bd2a0 ADD %RDI,(%RCX) |
0x4bd2a3 MOV %R8,(%RDX) |
0x4bd2a6 ADD $0xb8,%RSP |
0x4bd2ad POP %RBX |
0x4bd2ae POP %R12 |
0x4bd2b0 POP %R13 |
0x4bd2b2 POP %R14 |
0x4bd2b4 POP %R15 |
0x4bd2b6 POP %RBP |
0x4bd2b7 VZEROUPPER |
0x4bd2ba RET |
0x4bd2bb NOPL (%RAX,%RAX,1) |
Path / |
Source file and lines | par_csr_matop.c:102-276 |
Module | exec |
nb instructions | 307 |
nb uops | 314 |
loop length | 1381 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 2 |
used zmm registers | 0 |
nb stack references | 29 |
micro-operation queue | 52.33 cycles |
front end | 52.33 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 23.10 | 23.30 | 19.00 | 19.00 | 18.00 | 23.30 | 23.10 | 18.00 | 18.00 | 18.00 | 23.20 | 19.00 |
cycles | 23.10 | 23.30 | 19.00 | 19.00 | 18.00 | 23.30 | 23.10 | 18.00 | 18.00 | 18.00 | 23.20 | 19.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 51.66-51.65 |
Stall cycles | 0.00 |
Front-end | 52.33 |
Dispatch | 23.30 |
Overall L1 | 52.33 |
all | 24% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 100% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 25% |
all | 15% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 25% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0xb8,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc0(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xb8(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x90(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x80(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 4e8ff0 <hypre_GetThreadNum> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0x1(%RAX),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %R13,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4bc648 <hypre_ParMatmul_RowSizes.extracted+0x1a8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA 0x1(%R14),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
IMUL %RCX,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RAX,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %RCX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 4bc668 <hypre_ParMatmul_RowSizes.extracted+0x1c8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA (%R12,%R15,1),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4e72c0 <hypre_CAlloc> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
ADD %R15,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4bc551 <hypre_ParMatmul_RowSizes.extracted+0xb1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SAL $0x3,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R12,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4f03c0 <_intel_fast_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x60(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %RBX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JL 4bc67c <hypre_ParMatmul_RowSizes.extracted+0x1dc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xa8(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x60(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,(%R15,%R12,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xb0(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,(%RBX,%R12,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4e7390 <hypre_Free> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x90(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x537190,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 410560 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 4bcfaa <hypre_ParMatmul_RowSizes.extracted+0xb0a> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV (%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x1,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4bd0e3 <hypre_ParMatmul_RowSizes.extracted+0xc43> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RDI),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bd0f4 <hypre_ParMatmul_RowSizes.extracted+0xc54> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ %RAX,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VMOVQ %RCX,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
LEA -0x1(%RDX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x48(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xc0(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VEXTRACTI128 $0x1,%YMM1,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %XMM2,%XMM1,%XMM1 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VPSHUFD $-0x12,%XMM1,%XMM2 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %XMM2,%XMM1,%XMM1 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VMOVQ %XMM1,%RAX | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VEXTRACTI128 $0x1,%YMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %XMM1,%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VPSHUFD $-0x12,%XMM0,%XMM1 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %XMM1,%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VMOVQ %XMM0,%RCX | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
CMP %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x40(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 4bd105 <hypre_ParMatmul_RowSizes.extracted+0xc65> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4bd120 <hypre_ParMatmul_RowSizes.extracted+0xc80> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %RCX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %R13,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %R13,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %RCX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JNE 4bc524 <hypre_ParMatmul_RowSizes.extracted+0x84> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %R14D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %RBX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4bc569 <hypre_ParMatmul_RowSizes.extracted+0xc9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x60(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x58(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x28(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xb8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVL %RCX,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IMUL 0xc0(%RBP),%RCX | 1 | 0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
ADD %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
NOT %RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RBX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x38(%RDX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0xd8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x38(%RDI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x38(%R9),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x18(%R8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R10D,%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R8,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 4bc748 <hypre_ParMatmul_RowSizes.extracted+0x2a8> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x68(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x50(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,(%RSI,%RDX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x58(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,(%RDI,%RDX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4bd2a6 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%RSI,%RDX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RDI,%RDX,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x8(%R15,%RAX,8),%R8 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %RCX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R15,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SETAE %R15B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %R9,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETAE %R12B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %RDX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SETB %BL | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %R9,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %R14B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %R10,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %R8B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LEA -0x8(%R10,%RAX,8),%R9 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %RCX,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %R11B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %RDX,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %R9B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %R10,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %R10B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %R12B,%R15B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 4bd201 <hypre_ParMatmul_RowSizes.extracted+0xd61> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
OR %R14B,%BL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bd201 <hypre_ParMatmul_RowSizes.extracted+0xd61> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JE 4bd201 <hypre_ParMatmul_RowSizes.extracted+0xd61> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
OR %R11B,%R8B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bd201 <hypre_ParMatmul_RowSizes.extracted+0xd61> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
OR %R10B,%R9B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bd201 <hypre_ParMatmul_RowSizes.extracted+0xd61> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bd274 <hypre_ParMatmul_RowSizes.extracted+0xdd4> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RSI),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPXOR %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPXOR %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xb0(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VEXTRACTI128 $0x1,%YMM1,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %XMM2,%XMM1,%XMM1 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VPSHUFD $-0x12,%XMM1,%XMM2 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %XMM2,%XMM1,%XMM1 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VMOVQ %XMM1,%RDI | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VEXTRACTI128 $0x1,%YMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %XMM1,%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VPSHUFD $-0x12,%XMM0,%XMM1 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %XMM1,%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VMOVQ %XMM0,%R8 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
CMP %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4bd290 <hypre_ParMatmul_RowSizes.extracted+0xdf0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4bd2a0 <hypre_ParMatmul_RowSizes.extracted+0xe00> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x48(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xc0(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x40(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4bd120 <hypre_ParMatmul_RowSizes.extracted+0xc80> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x48(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xc0(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x40(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
INC %RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R11,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4bd2a6 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x50(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x58(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x8(%RDX,%R11,8),%R10 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0xb8(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R12,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVL %RDI,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IMUL %RDI,%R14 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%R12,%R14,1),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RSI,%RDI,8),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RDX,%RDI,8),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R8,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4bd197 <hypre_ParMatmul_RowSizes.extracted+0xcf7> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x8(%RSI,%R11,8),%R10 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %R9,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4bd197 <hypre_ParMatmul_RowSizes.extracted+0xcf7> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4bd2a6 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R11,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RDI,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R10,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bd244 <hypre_ParMatmul_RowSizes.extracted+0xda4> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R14,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R11,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x1(%RDI),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPBROADCASTQ %RAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %RCX,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDI,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R14,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R15,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JNE 4bd246 <hypre_ParMatmul_RowSizes.extracted+0xda6> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4bd2a6 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xb0(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4bd2a6 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD %R12,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %R14,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4bd2a6 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xb0(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD %RDI,(%RCX) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
MOV %R8,(%RDX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $0xb8,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | par_csr_matop.c:102-276 |
Module | exec |
nb instructions | 307 |
nb uops | 314 |
loop length | 1381 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 2 |
used zmm registers | 0 |
nb stack references | 29 |
micro-operation queue | 52.33 cycles |
front end | 52.33 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 23.10 | 23.30 | 19.00 | 19.00 | 18.00 | 23.30 | 23.10 | 18.00 | 18.00 | 18.00 | 23.20 | 19.00 |
cycles | 23.10 | 23.30 | 19.00 | 19.00 | 18.00 | 23.30 | 23.10 | 18.00 | 18.00 | 18.00 | 23.20 | 19.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 51.66-51.65 |
Stall cycles | 0.00 |
Front-end | 52.33 |
Dispatch | 23.30 |
Overall L1 | 52.33 |
all | 24% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 100% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 25% |
all | 15% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 25% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0xb8,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc0(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xb8(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x90(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x80(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 4e8ff0 <hypre_GetThreadNum> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0x1(%RAX),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %R13,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4bc648 <hypre_ParMatmul_RowSizes.extracted+0x1a8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA 0x1(%R14),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
IMUL %RCX,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RAX,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %RCX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 4bc668 <hypre_ParMatmul_RowSizes.extracted+0x1c8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA (%R12,%R15,1),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4e72c0 <hypre_CAlloc> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
ADD %R15,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4bc551 <hypre_ParMatmul_RowSizes.extracted+0xb1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SAL $0x3,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R12,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4f03c0 <_intel_fast_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x60(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %RBX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JL 4bc67c <hypre_ParMatmul_RowSizes.extracted+0x1dc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xa8(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x60(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,(%R15,%R12,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xb0(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,(%RBX,%R12,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4e7390 <hypre_Free> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x90(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x537190,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 410560 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 4bcfaa <hypre_ParMatmul_RowSizes.extracted+0xb0a> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV (%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x1,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4bd0e3 <hypre_ParMatmul_RowSizes.extracted+0xc43> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RDI),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bd0f4 <hypre_ParMatmul_RowSizes.extracted+0xc54> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ %RAX,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VMOVQ %RCX,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
LEA -0x1(%RDX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x48(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xc0(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VEXTRACTI128 $0x1,%YMM1,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %XMM2,%XMM1,%XMM1 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VPSHUFD $-0x12,%XMM1,%XMM2 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %XMM2,%XMM1,%XMM1 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VMOVQ %XMM1,%RAX | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VEXTRACTI128 $0x1,%YMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %XMM1,%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VPSHUFD $-0x12,%XMM0,%XMM1 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %XMM1,%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VMOVQ %XMM0,%RCX | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
CMP %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x40(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 4bd105 <hypre_ParMatmul_RowSizes.extracted+0xc65> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4bd120 <hypre_ParMatmul_RowSizes.extracted+0xc80> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %RCX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %R13,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %R13,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %RCX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JNE 4bc524 <hypre_ParMatmul_RowSizes.extracted+0x84> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %R14D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %RBX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4bc569 <hypre_ParMatmul_RowSizes.extracted+0xc9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x60(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x58(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x28(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xb8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVL %RCX,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IMUL 0xc0(%RBP),%RCX | 1 | 0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
ADD %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
NOT %RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RBX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x38(%RDX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0xd8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x38(%RDI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x38(%R9),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x18(%R8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R10D,%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R8,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 4bc748 <hypre_ParMatmul_RowSizes.extracted+0x2a8> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x68(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x50(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,(%RSI,%RDX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x58(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,(%RDI,%RDX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4bd2a6 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%RSI,%RDX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RDI,%RDX,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x8(%R15,%RAX,8),%R8 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %RCX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R15,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SETAE %R15B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %R9,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETAE %R12B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %RDX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SETB %BL | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %R9,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %R14B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %R10,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %R8B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LEA -0x8(%R10,%RAX,8),%R9 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %RCX,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %R11B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %RDX,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %R9B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %R10,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %R10B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %R12B,%R15B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 4bd201 <hypre_ParMatmul_RowSizes.extracted+0xd61> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
OR %R14B,%BL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bd201 <hypre_ParMatmul_RowSizes.extracted+0xd61> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JE 4bd201 <hypre_ParMatmul_RowSizes.extracted+0xd61> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
OR %R11B,%R8B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bd201 <hypre_ParMatmul_RowSizes.extracted+0xd61> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
OR %R10B,%R9B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bd201 <hypre_ParMatmul_RowSizes.extracted+0xd61> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bd274 <hypre_ParMatmul_RowSizes.extracted+0xdd4> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RSI),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPXOR %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPXOR %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xb0(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VEXTRACTI128 $0x1,%YMM1,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %XMM2,%XMM1,%XMM1 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VPSHUFD $-0x12,%XMM1,%XMM2 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %XMM2,%XMM1,%XMM1 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VMOVQ %XMM1,%RDI | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VEXTRACTI128 $0x1,%YMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %XMM1,%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VPSHUFD $-0x12,%XMM0,%XMM1 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %XMM1,%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VMOVQ %XMM0,%R8 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
CMP %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4bd290 <hypre_ParMatmul_RowSizes.extracted+0xdf0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4bd2a0 <hypre_ParMatmul_RowSizes.extracted+0xe00> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x48(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xc0(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x40(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4bd120 <hypre_ParMatmul_RowSizes.extracted+0xc80> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x48(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xc0(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x40(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
INC %RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R11,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4bd2a6 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x50(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x58(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x8(%RDX,%R11,8),%R10 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0xb8(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R12,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVL %RDI,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IMUL %RDI,%R14 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%R12,%R14,1),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RSI,%RDI,8),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RDX,%RDI,8),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R8,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4bd197 <hypre_ParMatmul_RowSizes.extracted+0xcf7> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x8(%RSI,%R11,8),%R10 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %R9,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4bd197 <hypre_ParMatmul_RowSizes.extracted+0xcf7> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4bd2a6 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R11,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RDI,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R10,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bd244 <hypre_ParMatmul_RowSizes.extracted+0xda4> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R14,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R11,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x1(%RDI),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPBROADCASTQ %RAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %RCX,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDI,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R14,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R15,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JNE 4bd246 <hypre_ParMatmul_RowSizes.extracted+0xda6> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4bd2a6 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xb0(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4bd2a6 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD %R12,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %R14,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4bd2a6 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xb0(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD %RDI,(%RCX) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
MOV %R8,(%RDX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $0xb8,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_ParMatmul_RowSizes.extracted– | 2.36 | 0.3 |
▼Loop 3558 - par_csr_matop.c:109-242 - exec– | 0.07 | 0.01 |
▼Loop 3562 - par_csr_matop.c:109-231 - exec– | 0.95 | 0.1 |
○Loop 3565 - par_csr_matop.c:195-208 - exec | 1.26 | 0.13 |
○Loop 3566 - par_csr_matop.c:195-208 - exec | 0.05 | 0.01 |
○Loop 3563 - par_csr_matop.c:218-231 - exec | 0.01 | 0.01 |
○Loop 3564 - par_csr_matop.c:218-231 - exec | 0 | 0 |
▼Loop 3559 - par_csr_matop.c:109-231 - exec– | 0 | 0 |
○Loop 3561 - par_csr_matop.c:195-208 - exec | 0 | 0 |
○Loop 3560 - par_csr_matop.c:195-208 - exec | 0 | 0 |
▼Loop 3567 - par_csr_matop.c:109-177 - exec– | 0 | 0 |
○Loop 3569 - par_csr_matop.c:170-177 - exec | 0 | 0 |
○Loop 3568 - par_csr_matop.c:170-177 - exec | 0 | 0 |
○Loop 3571 - par_csr_matop.c:154-167 - exec | 0 | 0 |
○Loop 3570 - par_csr_matop.c:154-167 - exec | 0 | 0 |
○Loop 3554 - par_csr_matop.c:263-266 - exec | 0.01 | 0 |
○Loop 3557 - par_csr_matop.c:257-260 - exec | 0 | 0 |
○Loop 3553 - par_csr_matop.c:263-266 - exec | 0 | 0 |
○Loop 3550 - par_csr_matop.c:273-276 - exec | 0 | 0 |
○Loop 3552 - par_csr_matop.c:109-273 - exec | 0 | 0 |
○Loop 3555 - par_csr_matop.c:263-266 - exec | 0 | 0 |
○Loop 3556 - par_csr_matop.c:257-260 - exec | 0 | 0 |
○Loop 3551 - par_csr_matop.c:109-273 - exec | 0 | 0 |