Function: hypre_ParMatmul_RowSizes.extracted | Module: exec | Source: par_csr_matop.c:102-276 [...] | Coverage: 1.51% |
---|
Function: hypre_ParMatmul_RowSizes.extracted | Module: exec | Source: par_csr_matop.c:102-276 [...] | Coverage: 1.51% |
---|
/scratch_na/users/xoserete/qaas_runs/171-172-8218/intel/AMG/build/AMG/AMG/parcsr_mv/par_csr_matop.c: 102 - 276 |
-------------------------------------------------------------------------------- |
102: #pragma omp parallel private(ii, i1, jj_row_begin_diag, jj_row_begin_offd, jj_count_diag, jj_count_offd, jj2, i2, jj3, i3) |
[...] |
108: ii = hypre_GetThreadNum(); |
109: if (ii < rest) |
110: { |
111: ns = ii*size+ii; |
112: ne = (ii+1)*size+ii+1; |
113: } |
114: else |
115: { |
116: ns = ii*size+rest; |
117: ne = (ii+1)*size+rest; |
118: } |
119: jj_count_diag = start_indexing; |
120: jj_count_offd = start_indexing; |
121: |
122: if (num_cols_diag_B || num_cols_offd_C) |
123: B_marker = hypre_CTAlloc(HYPRE_Int, num_cols_diag_B+num_cols_offd_C); |
124: for (i1 = 0; i1 < num_cols_diag_B+num_cols_offd_C; i1++) |
125: B_marker[i1] = -1; |
126: |
127: for (i1 = ns; i1 < ne; i1++) |
[...] |
135: if ( allsquare ) { |
136: B_marker[i1] = jj_count_diag; |
137: jj_count_diag++; |
[...] |
144: if (num_cols_offd_A) |
145: { |
146: for (jj2 = A_offd_i[i1]; jj2 < A_offd_i[i1+1]; jj2++) |
147: { |
148: i2 = A_offd_j[jj2]; |
[...] |
154: for (jj3 = B_ext_offd_i[i2]; jj3 < B_ext_offd_i[i2+1]; jj3++) |
[...] |
164: if (B_marker[i3] < jj_row_begin_offd) |
165: { |
166: B_marker[i3] = jj_count_offd; |
167: jj_count_offd++; |
168: } |
169: } |
170: for (jj3 = B_ext_diag_i[i2]; jj3 < B_ext_diag_i[i2+1]; jj3++) |
171: { |
172: i3 = B_ext_diag_j[jj3]; |
173: |
174: if (B_marker[i3] < jj_row_begin_diag) |
175: { |
176: B_marker[i3] = jj_count_diag; |
177: jj_count_diag++; |
[...] |
187: for (jj2 = A_diag_i[i1]; jj2 < A_diag_i[i1+1]; jj2++) |
188: { |
189: i2 = A_diag_j[jj2]; |
[...] |
195: for (jj3 = B_diag_i[i2]; jj3 < B_diag_i[i2+1]; jj3++) |
196: { |
197: i3 = B_diag_j[jj3]; |
[...] |
205: if (B_marker[i3] < jj_row_begin_diag) |
206: { |
207: B_marker[i3] = jj_count_diag; |
208: jj_count_diag++; |
[...] |
216: if (num_cols_offd_B) |
217: { |
218: for (jj3 = B_offd_i[i2]; jj3 < B_offd_i[i2+1]; jj3++) |
219: { |
220: i3 = num_cols_diag_B+map_B_to_C[B_offd_j[jj3]]; |
[...] |
228: if (B_marker[i3] < jj_row_begin_offd) |
229: { |
230: B_marker[i3] = jj_count_offd; |
231: jj_count_offd++; |
[...] |
241: (*C_diag_i)[i1] = jj_row_begin_diag; |
242: (*C_offd_i)[i1] = jj_row_begin_offd; |
243: |
244: } |
245: jj_count_diag_array[ii] = jj_count_diag; |
246: jj_count_offd_array[ii] = jj_count_offd; |
247: |
248: hypre_TFree(B_marker); |
249: #ifdef HYPRE_USING_OPENMP |
250: #pragma omp barrier |
251: #endif |
252: |
253: if (ii) |
254: { |
255: jj_count_diag = jj_count_diag_array[0]; |
256: jj_count_offd = jj_count_offd_array[0]; |
257: for (i1 = 1; i1 < ii; i1++) |
258: { |
259: jj_count_diag += jj_count_diag_array[i1]; |
260: jj_count_offd += jj_count_offd_array[i1]; |
261: } |
262: |
263: for (i1 = ns; i1 < ne; i1++) |
264: { |
265: (*C_diag_i)[i1] += jj_count_diag; |
266: (*C_offd_i)[i1] += jj_count_offd; |
267: } |
268: } |
269: else |
270: { |
271: (*C_diag_i)[num_rows_diag_A] = 0; |
272: (*C_offd_i)[num_rows_diag_A] = 0; |
273: for (i1 = 0; i1 < num_threads; i1++) |
274: { |
275: (*C_diag_i)[num_rows_diag_A] += jj_count_diag_array[i1]; |
276: (*C_offd_i)[num_rows_diag_A] += jj_count_offd_array[i1]; |
0x4bbf60 PUSH %RBP |
0x4bbf61 MOV %RSP,%RBP |
0x4bbf64 PUSH %R15 |
0x4bbf66 PUSH %R14 |
0x4bbf68 PUSH %R13 |
0x4bbf6a PUSH %R12 |
0x4bbf6c PUSH %RBX |
0x4bbf6d SUB $0xb8,%RSP |
0x4bbf74 MOV %R9,-0x88(%RBP) |
0x4bbf7b MOV %R8,-0xb8(%RBP) |
0x4bbf82 MOV %RCX,-0x58(%RBP) |
0x4bbf86 MOV %RDX,-0x50(%RBP) |
0x4bbf8a MOV %RDI,-0x90(%RBP) |
0x4bbf91 MOV 0xc0(%RBP),%R14 |
0x4bbf98 MOV 0xb8(%RBP),%R13 |
0x4bbf9f MOV 0x90(%RBP),%R12 |
0x4bbfa6 MOV 0x80(%RBP),%R15 |
0x4bbfad CALL 4e8ab0 <hypre_GetThreadNum> |
0x4bbfb2 MOV %RAX,%RCX |
0x4bbfb5 LEA 0x1(%RAX),%RBX |
0x4bbfb9 MOV %RBX,%RAX |
0x4bbfbc IMUL %R14,%RAX |
0x4bbfc0 CMP %R13,%RCX |
0x4bbfc3 JGE 4bc108 |
0x4bbfc9 LEA 0x1(%R14),%RDX |
0x4bbfcd IMUL %RCX,%RDX |
0x4bbfd1 ADD %RAX,%RBX |
0x4bbfd4 MOV %R15,%RAX |
0x4bbfd7 OR %R12,%RAX |
0x4bbfda MOV %RCX,-0x60(%RBP) |
0x4bbfde JE 4bc128 |
0x4bbfe4 MOV %RDX,%R13 |
0x4bbfe7 LEA (%R12,%R15,1),%RDI |
0x4bbfeb MOV $0x8,%ESI |
0x4bbff0 CALL 4e6d80 <hypre_CAlloc> |
0x4bbff5 MOV %RAX,%R14 |
0x4bbff8 ADD %R15,%R12 |
0x4bbffb JLE 4bc011 |
0x4bbffd SAL $0x3,%R12 |
0x4bc001 MOV %R14,%RDI |
0x4bc004 MOV $0xff,%ESI |
0x4bc009 MOV %R12,%RDX |
0x4bc00c CALL 4efe80 <_intel_fast_memset> |
0x4bc011 MOV -0x60(%RBP),%RCX |
0x4bc015 MOV %R13,%RDX |
0x4bc018 MOV %RDX,-0x40(%RBP) |
0x4bc01c CMP %RBX,%RDX |
0x4bc01f MOV %RBX,-0x48(%RBP) |
0x4bc023 JL 4bc13c |
0x4bc029 XOR %EBX,%EBX |
0x4bc02b XOR %EDX,%EDX |
0x4bc02d MOV 0xa8(%RBP),%R15 |
0x4bc034 MOV -0x60(%RBP),%R12 |
0x4bc038 MOV %RBX,(%R15,%R12,8) |
0x4bc03c MOV 0xb0(%RBP),%RBX |
0x4bc043 MOV %RDX,(%RBX,%R12,8) |
0x4bc047 MOV %R14,%RDI |
0x4bc04a CALL 4e6e50 <hypre_Free> |
0x4bc04f MOV -0x90(%RBP),%RAX |
0x4bc056 MOV (%RAX),%ESI |
0x4bc058 MOV $0x736190,%EDI |
0x4bc05d CALL 410020 <__kmpc_barrier@plt> |
0x4bc062 TEST %R12,%R12 |
0x4bc065 JE 4bca6a |
0x4bc06b MOV %R12,%RDI |
0x4bc06e MOV (%R15),%RAX |
0x4bc071 MOV (%RBX),%RCX |
0x4bc074 CMP $0x1,%R12 |
0x4bc078 JLE 4bcba3 |
0x4bc07e LEA -0x1(%RDI),%RSI |
0x4bc082 MOV %RSI,%RDX |
0x4bc085 AND $-0x4,%RDX |
0x4bc089 JE 4bcbb4 |
0x4bc08f VMOVQ %RAX,%XMM1 |
0x4bc094 VMOVQ %RCX,%XMM0 |
0x4bc099 LEA -0x1(%RDX),%RAX |
0x4bc09d XOR %ECX,%ECX |
0x4bc09f MOV -0x48(%RBP),%R11 |
0x4bc0a3 MOV 0xc0(%RBP),%R14 |
0x4bc0aa NOPW (%RAX,%RAX,1) |
(3557) 0x4bc0b0 VPADDQ 0x8(%R15,%RCX,8),%YMM1,%YMM1 |
(3557) 0x4bc0b7 VPADDQ 0x8(%RBX,%RCX,8),%YMM0,%YMM0 |
(3557) 0x4bc0bd ADD $0x4,%RCX |
(3557) 0x4bc0c1 CMP %RAX,%RCX |
(3557) 0x4bc0c4 JLE 4bc0b0 |
0x4bc0c6 VEXTRACTI128 $0x1,%YMM1,%XMM2 |
0x4bc0cc VPADDQ %XMM2,%XMM1,%XMM1 |
0x4bc0d0 VPSHUFD $-0x12,%XMM1,%XMM2 |
0x4bc0d5 VPADDQ %XMM2,%XMM1,%XMM1 |
0x4bc0d9 VMOVQ %XMM1,%RAX |
0x4bc0de VEXTRACTI128 $0x1,%YMM0,%XMM1 |
0x4bc0e4 VPADDQ %XMM1,%XMM0,%XMM0 |
0x4bc0e8 VPSHUFD $-0x12,%XMM0,%XMM1 |
0x4bc0ed VPADDQ %XMM1,%XMM0,%XMM0 |
0x4bc0f1 VMOVQ %XMM0,%RCX |
0x4bc0f6 CMP %RDX,%RSI |
0x4bc0f9 MOV -0x40(%RBP),%RSI |
0x4bc0fd JNE 4bcbc5 |
0x4bc103 JMP 4bcbe0 |
0x4bc108 MOV %RCX,%RDX |
0x4bc10b IMUL %R14,%RDX |
0x4bc10f ADD %R13,%RDX |
0x4bc112 ADD %R13,%RAX |
0x4bc115 MOV %RAX,%RBX |
0x4bc118 MOV %R15,%RAX |
0x4bc11b OR %R12,%RAX |
0x4bc11e MOV %RCX,-0x60(%RBP) |
0x4bc122 JNE 4bbfe4 |
0x4bc128 XOR %R14D,%R14D |
0x4bc12b MOV %RDX,-0x40(%RBP) |
0x4bc12f CMP %RBX,%RDX |
0x4bc132 MOV %RBX,-0x48(%RBP) |
0x4bc136 JGE 4bc029 |
0x4bc13c MOV 0x60(%RBP),%RSI |
0x4bc140 MOV 0x58(%RBP),%RDX |
0x4bc144 MOV 0x48(%RBP),%RDI |
0x4bc148 MOV 0x38(%RBP),%R8 |
0x4bc14c MOV 0x28(%RBP),%R9 |
0x4bc150 MOV 0xb8(%RBP),%RAX |
0x4bc157 CMP %RAX,%RCX |
0x4bc15a CMOVL %RCX,%RAX |
0x4bc15e IMUL 0xc0(%RBP),%RCX |
0x4bc166 ADD %RAX,%RCX |
0x4bc169 MOV %RCX,-0xb0(%RBP) |
0x4bc170 NOT %RCX |
0x4bc173 ADD %RBX,%RCX |
0x4bc176 MOV %RCX,-0xa8(%RBP) |
0x4bc17d MOV -0x50(%RBP),%RAX |
0x4bc181 MOV (%RAX),%RAX |
0x4bc184 MOV %RAX,-0xa0(%RBP) |
0x4bc18b MOV -0x58(%RBP),%RAX |
0x4bc18f MOV (%RAX),%RAX |
0x4bc192 MOV %RAX,-0x98(%RBP) |
0x4bc199 LEA 0x38(%RDX),%RAX |
0x4bc19d MOV %RAX,-0xd8(%RBP) |
0x4bc1a4 LEA 0x38(%RDI),%RAX |
0x4bc1a8 MOV %RAX,-0xd0(%RBP) |
0x4bc1af LEA 0x38(%R9),%RAX |
0x4bc1b3 MOV %RAX,-0x80(%RBP) |
0x4bc1b7 LEA 0x18(%R8),%RAX |
0x4bc1bb MOV %RAX,-0xc8(%RBP) |
0x4bc1c2 XOR %EDI,%EDI |
0x4bc1c4 XOR %R10D,%R10D |
0x4bc1c7 XOR %R8D,%R8D |
0x4bc1ca MOV %R8,%RBX |
0x4bc1cd JMP 4bc208 |
0x4bc1cf NOP |
(3558) 0x4bc1d0 MOV -0xa0(%RBP),%RAX |
(3558) 0x4bc1d7 MOV -0x78(%RBP),%RCX |
(3558) 0x4bc1db MOV %R8,(%RAX,%RCX,8) |
(3558) 0x4bc1df MOV -0x98(%RBP),%RAX |
(3558) 0x4bc1e6 MOV %R10,(%RAX,%RCX,8) |
(3558) 0x4bc1ea MOV -0xc0(%RBP),%RCX |
(3558) 0x4bc1f1 LEA 0x1(%RCX),%RDI |
(3558) 0x4bc1f5 MOV %RDX,%R10 |
(3558) 0x4bc1f8 MOV %RBX,%R8 |
(3558) 0x4bc1fb CMP -0xa8(%RBP),%RCX |
(3558) 0x4bc202 JE 4bc02d |
(3558) 0x4bc208 MOV 0x78(%RBP),%RAX |
(3558) 0x4bc20c TEST %RAX,%RAX |
(3558) 0x4bc20f MOV -0xb0(%RBP),%RCX |
(3558) 0x4bc216 JE 4bc224 |
(3558) 0x4bc218 LEA (%RCX,%RDI,1),%RAX |
(3558) 0x4bc21c MOV %R8,(%R14,%RAX,8) |
(3558) 0x4bc220 LEA 0x1(%R8),%RBX |
(3558) 0x4bc224 ADD %RDI,%RCX |
(3558) 0x4bc227 CMPQ $0,0x70(%RBP) |
(3558) 0x4bc22c MOV %RCX,-0x78(%RBP) |
(3558) 0x4bc230 MOV %RDI,-0xc0(%RBP) |
(3558) 0x4bc237 JE 4bc5f0 |
(3558) 0x4bc23d MOV 0x10(%RBP),%RAX |
(3558) 0x4bc241 MOV (%RAX,%RCX,8),%R13 |
(3558) 0x4bc245 MOV 0x8(%RAX,%RCX,8),%RDX |
(3558) 0x4bc24a LEA 0x1(%RCX),%R9 |
(3558) 0x4bc24e CMP %RDX,%R13 |
(3558) 0x4bc251 JGE 4bc5f4 |
(3558) 0x4bc257 MOV %R13,%RAX |
(3558) 0x4bc25a NOT %RAX |
(3558) 0x4bc25d ADD %RAX,%RDX |
(3558) 0x4bc260 MOV %RDX,-0x30(%RBP) |
(3558) 0x4bc264 XOR %EAX,%EAX |
(3558) 0x4bc266 MOV %R10,%RDX |
(3558) 0x4bc269 MOV %R9,-0x38(%RBP) |
(3558) 0x4bc26d MOV %R13,-0x68(%RBP) |
(3558) 0x4bc271 JMP 4bc29a |
0x4bc273 NOPW %CS:(%RAX,%RAX,1) |
(3567) 0x4bc280 MOV -0x68(%RBP),%R13 |
(3567) 0x4bc284 MOV -0x70(%RBP),%RCX |
(3567) 0x4bc288 LEA 0x1(%RCX),%RAX |
(3567) 0x4bc28c CMP -0x30(%RBP),%RCX |
(3567) 0x4bc290 MOV -0x38(%RBP),%R9 |
(3567) 0x4bc294 JE 4bc600 |
(3567) 0x4bc29a MOV %RAX,-0x70(%RBP) |
(3567) 0x4bc29e ADD %R13,%RAX |
(3567) 0x4bc2a1 MOV 0x18(%RBP),%RCX |
(3567) 0x4bc2a5 MOV (%RCX,%RAX,8),%RAX |
(3567) 0x4bc2a9 MOV 0x50(%RBP),%RCX |
(3567) 0x4bc2ad MOV (%RCX,%RAX,8),%R13 |
(3567) 0x4bc2b1 MOV 0x8(%RCX,%RAX,8),%RDI |
(3567) 0x4bc2b6 MOV %RDI,%R11 |
(3567) 0x4bc2b9 SUB %R13,%R11 |
(3567) 0x4bc2bc JLE 4bc300 |
(3567) 0x4bc2be CMP $0x8,%R11 |
(3567) 0x4bc2c2 JAE 4bc360 |
(3567) 0x4bc2c8 MOV %R11,%RCX |
(3567) 0x4bc2cb AND $-0x8,%RCX |
(3567) 0x4bc2cf CMP %R11,%RCX |
(3567) 0x4bc2d2 JAE 4bc300 |
(3567) 0x4bc2d4 ADD %RCX,%R13 |
(3567) 0x4bc2d7 MOV 0x58(%RBP),%R9 |
(3567) 0x4bc2db JMP 4bc2e8 |
0x4bc2dd NOPL (%RAX) |
(3570) 0x4bc2e0 INC %R13 |
(3570) 0x4bc2e3 CMP %R13,%RDI |
(3570) 0x4bc2e6 JE 4bc300 |
(3570) 0x4bc2e8 MOV (%R9,%R13,8),%RCX |
(3570) 0x4bc2ec ADD %R15,%RCX |
(3570) 0x4bc2ef CMP %R10,(%R14,%RCX,8) |
(3570) 0x4bc2f3 JGE 4bc2e0 |
(3570) 0x4bc2f5 MOV %RDX,(%R14,%RCX,8) |
(3570) 0x4bc2f9 INC %RDX |
(3570) 0x4bc2fc JMP 4bc2e0 |
0x4bc2fe XCHG %AX,%AX |
(3567) 0x4bc300 MOV 0x40(%RBP),%RCX |
(3567) 0x4bc304 MOV (%RCX,%RAX,8),%RDI |
(3567) 0x4bc308 MOV 0x8(%RCX,%RAX,8),%RAX |
(3567) 0x4bc30d MOV %RAX,%R9 |
(3567) 0x4bc310 SUB %RDI,%R9 |
(3567) 0x4bc313 JLE 4bc280 |
(3567) 0x4bc319 CMP $0x8,%R9 |
(3567) 0x4bc31d JAE 4bc4e0 |
(3567) 0x4bc323 MOV -0x68(%RBP),%R13 |
(3567) 0x4bc327 MOV %R9,%RCX |
(3567) 0x4bc32a AND $-0x8,%RCX |
(3567) 0x4bc32e CMP %R9,%RCX |
(3567) 0x4bc331 JAE 4bc284 |
(3567) 0x4bc337 ADD %RCX,%RDI |
(3567) 0x4bc33a MOV 0x48(%RBP),%R9 |
(3567) 0x4bc33e JMP 4bc34c |
(3568) 0x4bc340 INC %RDI |
(3568) 0x4bc343 CMP %RDI,%RAX |
(3568) 0x4bc346 JE 4bc284 |
(3568) 0x4bc34c MOV (%R9,%RDI,8),%RCX |
(3568) 0x4bc350 CMP %R8,(%R14,%RCX,8) |
(3568) 0x4bc354 JGE 4bc340 |
(3568) 0x4bc356 MOV %RBX,(%R14,%RCX,8) |
(3568) 0x4bc35a INC %RBX |
(3568) 0x4bc35d JMP 4bc340 |
0x4bc35f NOP |
(3567) 0x4bc360 MOV %R11,%R9 |
(3567) 0x4bc363 SHR $0x3,%R9 |
(3567) 0x4bc367 MOV -0xd8(%RBP),%RCX |
(3567) 0x4bc36e LEA (%RCX,%R13,8),%RCX |
(3567) 0x4bc372 JMP 4bc38d |
0x4bc374 NOPW %CS:(%RAX,%RAX,1) |
(3571) 0x4bc380 ADD $0x40,%RCX |
(3571) 0x4bc384 DEC %R9 |
(3571) 0x4bc387 JE 4bc2c8 |
(3571) 0x4bc38d MOV -0x38(%RCX),%R12 |
(3571) 0x4bc391 ADD %R15,%R12 |
(3571) 0x4bc394 CMP %R10,(%R14,%R12,8) |
(3571) 0x4bc398 JGE 4bc440 |
(3571) 0x4bc39e MOV %RDX,(%R14,%R12,8) |
(3571) 0x4bc3a2 INC %RDX |
(3571) 0x4bc3a5 MOV -0x30(%RCX),%R12 |
(3571) 0x4bc3a9 ADD %R15,%R12 |
(3571) 0x4bc3ac CMP %R10,(%R14,%R12,8) |
(3571) 0x4bc3b0 JL 4bc451 |
(3571) 0x4bc3b6 MOV -0x28(%RCX),%R12 |
(3571) 0x4bc3ba ADD %R15,%R12 |
(3571) 0x4bc3bd CMP %R10,(%R14,%R12,8) |
(3571) 0x4bc3c1 JGE 4bc469 |
(3571) 0x4bc3c7 MOV %RDX,(%R14,%R12,8) |
(3571) 0x4bc3cb INC %RDX |
(3571) 0x4bc3ce MOV -0x20(%RCX),%R12 |
(3571) 0x4bc3d2 ADD %R15,%R12 |
(3571) 0x4bc3d5 CMP %R10,(%R14,%R12,8) |
(3571) 0x4bc3d9 JL 4bc47a |
(3571) 0x4bc3df MOV -0x18(%RCX),%R12 |
(3571) 0x4bc3e3 ADD %R15,%R12 |
(3571) 0x4bc3e6 CMP %R10,(%R14,%R12,8) |
(3571) 0x4bc3ea JGE 4bc492 |
(3571) 0x4bc3f0 MOV %RDX,(%R14,%R12,8) |
(3571) 0x4bc3f4 INC %RDX |
(3571) 0x4bc3f7 MOV -0x10(%RCX),%R12 |
(3571) 0x4bc3fb ADD %R15,%R12 |
(3571) 0x4bc3fe CMP %R10,(%R14,%R12,8) |
(3571) 0x4bc402 JL 4bc4a3 |
(3571) 0x4bc408 MOV -0x8(%RCX),%R12 |
(3571) 0x4bc40c ADD %R15,%R12 |
(3571) 0x4bc40f CMP %R10,(%R14,%R12,8) |
(3571) 0x4bc413 JGE 4bc4bb |
(3571) 0x4bc419 MOV %RDX,(%R14,%R12,8) |
(3571) 0x4bc41d INC %RDX |
(3571) 0x4bc420 MOV (%RCX),%R12 |
(3571) 0x4bc423 ADD %R15,%R12 |
(3571) 0x4bc426 CMP %R10,(%R14,%R12,8) |
(3571) 0x4bc42a JGE 4bc380 |
(3571) 0x4bc430 JMP 4bc4cb |
0x4bc435 NOPW %CS:(%RAX,%RAX,1) |
(3571) 0x4bc440 MOV -0x30(%RCX),%R12 |
(3571) 0x4bc444 ADD %R15,%R12 |
(3571) 0x4bc447 CMP %R10,(%R14,%R12,8) |
(3571) 0x4bc44b JGE 4bc3b6 |
(3571) 0x4bc451 MOV %RDX,(%R14,%R12,8) |
(3571) 0x4bc455 INC %RDX |
(3571) 0x4bc458 MOV -0x28(%RCX),%R12 |
(3571) 0x4bc45c ADD %R15,%R12 |
(3571) 0x4bc45f CMP %R10,(%R14,%R12,8) |
(3571) 0x4bc463 JL 4bc3c7 |
(3571) 0x4bc469 MOV -0x20(%RCX),%R12 |
(3571) 0x4bc46d ADD %R15,%R12 |
(3571) 0x4bc470 CMP %R10,(%R14,%R12,8) |
(3571) 0x4bc474 JGE 4bc3df |
(3571) 0x4bc47a MOV %RDX,(%R14,%R12,8) |
(3571) 0x4bc47e INC %RDX |
(3571) 0x4bc481 MOV -0x18(%RCX),%R12 |
(3571) 0x4bc485 ADD %R15,%R12 |
(3571) 0x4bc488 CMP %R10,(%R14,%R12,8) |
(3571) 0x4bc48c JL 4bc3f0 |
(3571) 0x4bc492 MOV -0x10(%RCX),%R12 |
(3571) 0x4bc496 ADD %R15,%R12 |
(3571) 0x4bc499 CMP %R10,(%R14,%R12,8) |
(3571) 0x4bc49d JGE 4bc408 |
(3571) 0x4bc4a3 MOV %RDX,(%R14,%R12,8) |
(3571) 0x4bc4a7 INC %RDX |
(3571) 0x4bc4aa MOV -0x8(%RCX),%R12 |
(3571) 0x4bc4ae ADD %R15,%R12 |
(3571) 0x4bc4b1 CMP %R10,(%R14,%R12,8) |
(3571) 0x4bc4b5 JL 4bc419 |
(3571) 0x4bc4bb MOV (%RCX),%R12 |
(3571) 0x4bc4be ADD %R15,%R12 |
(3571) 0x4bc4c1 CMP %R10,(%R14,%R12,8) |
(3571) 0x4bc4c5 JGE 4bc380 |
(3571) 0x4bc4cb MOV %RDX,(%R14,%R12,8) |
(3571) 0x4bc4cf INC %RDX |
(3571) 0x4bc4d2 JMP 4bc380 |
0x4bc4d7 NOPW (%RAX,%RAX,1) |
(3567) 0x4bc4e0 MOV %R9,%RCX |
(3567) 0x4bc4e3 SHR $0x3,%RCX |
(3567) 0x4bc4e7 MOV -0xd0(%RBP),%R11 |
(3567) 0x4bc4ee LEA (%R11,%RDI,8),%R11 |
(3567) 0x4bc4f2 MOV -0x68(%RBP),%R13 |
(3567) 0x4bc4f6 JMP 4bc50d |
0x4bc4f8 NOPL (%RAX,%RAX,1) |
(3569) 0x4bc500 ADD $0x40,%R11 |
(3569) 0x4bc504 DEC %RCX |
(3569) 0x4bc507 JE 4bc327 |
(3569) 0x4bc50d MOV -0x38(%R11),%R12 |
(3569) 0x4bc511 CMP %R8,(%R14,%R12,8) |
(3569) 0x4bc515 JGE 4bc580 |
(3569) 0x4bc517 MOV %RBX,(%R14,%R12,8) |
(3569) 0x4bc51b INC %RBX |
(3569) 0x4bc51e MOV -0x30(%R11),%R12 |
(3569) 0x4bc522 CMP %R8,(%R14,%R12,8) |
(3569) 0x4bc526 JL 4bc58a |
(3569) 0x4bc528 MOV -0x28(%R11),%R12 |
(3569) 0x4bc52c CMP %R8,(%R14,%R12,8) |
(3569) 0x4bc530 JGE 4bc59b |
(3569) 0x4bc532 MOV %RBX,(%R14,%R12,8) |
(3569) 0x4bc536 INC %RBX |
(3569) 0x4bc539 MOV -0x20(%R11),%R12 |
(3569) 0x4bc53d CMP %R8,(%R14,%R12,8) |
(3569) 0x4bc541 JL 4bc5a5 |
(3569) 0x4bc543 MOV -0x18(%R11),%R12 |
(3569) 0x4bc547 CMP %R8,(%R14,%R12,8) |
(3569) 0x4bc54b JGE 4bc5b6 |
(3569) 0x4bc54d MOV %RBX,(%R14,%R12,8) |
(3569) 0x4bc551 INC %RBX |
(3569) 0x4bc554 MOV -0x10(%R11),%R12 |
(3569) 0x4bc558 CMP %R8,(%R14,%R12,8) |
(3569) 0x4bc55c JL 4bc5c0 |
(3569) 0x4bc55e MOV -0x8(%R11),%R12 |
(3569) 0x4bc562 CMP %R8,(%R14,%R12,8) |
(3569) 0x4bc566 JGE 4bc5d1 |
(3569) 0x4bc568 MOV %RBX,(%R14,%R12,8) |
(3569) 0x4bc56c INC %RBX |
(3569) 0x4bc56f MOV (%R11),%R12 |
(3569) 0x4bc572 CMP %R8,(%R14,%R12,8) |
(3569) 0x4bc576 JGE 4bc500 |
(3569) 0x4bc578 JMP 4bc5de |
0x4bc57a NOPW (%RAX,%RAX,1) |
(3569) 0x4bc580 MOV -0x30(%R11),%R12 |
(3569) 0x4bc584 CMP %R8,(%R14,%R12,8) |
(3569) 0x4bc588 JGE 4bc528 |
(3569) 0x4bc58a MOV %RBX,(%R14,%R12,8) |
(3569) 0x4bc58e INC %RBX |
(3569) 0x4bc591 MOV -0x28(%R11),%R12 |
(3569) 0x4bc595 CMP %R8,(%R14,%R12,8) |
(3569) 0x4bc599 JL 4bc532 |
(3569) 0x4bc59b MOV -0x20(%R11),%R12 |
(3569) 0x4bc59f CMP %R8,(%R14,%R12,8) |
(3569) 0x4bc5a3 JGE 4bc543 |
(3569) 0x4bc5a5 MOV %RBX,(%R14,%R12,8) |
(3569) 0x4bc5a9 INC %RBX |
(3569) 0x4bc5ac MOV -0x18(%R11),%R12 |
(3569) 0x4bc5b0 CMP %R8,(%R14,%R12,8) |
(3569) 0x4bc5b4 JL 4bc54d |
(3569) 0x4bc5b6 MOV -0x10(%R11),%R12 |
(3569) 0x4bc5ba CMP %R8,(%R14,%R12,8) |
(3569) 0x4bc5be JGE 4bc55e |
(3569) 0x4bc5c0 MOV %RBX,(%R14,%R12,8) |
(3569) 0x4bc5c4 INC %RBX |
(3569) 0x4bc5c7 MOV -0x8(%R11),%R12 |
(3569) 0x4bc5cb CMP %R8,(%R14,%R12,8) |
(3569) 0x4bc5cf JL 4bc568 |
(3569) 0x4bc5d1 MOV (%R11),%R12 |
(3569) 0x4bc5d4 CMP %R8,(%R14,%R12,8) |
(3569) 0x4bc5d8 JGE 4bc500 |
(3569) 0x4bc5de MOV %RBX,(%R14,%R12,8) |
(3569) 0x4bc5e2 INC %RBX |
(3569) 0x4bc5e5 JMP 4bc500 |
0x4bc5ea NOPW (%RAX,%RAX,1) |
(3558) 0x4bc5f0 LEA 0x1(%RCX),%R9 |
(3558) 0x4bc5f4 MOV %R10,%RDX |
(3558) 0x4bc5f7 JMP 4bc604 |
0x4bc5f9 NOPL (%RAX) |
(3558) 0x4bc600 MOV -0x78(%RBP),%RCX |
(3558) 0x4bc604 MOV -0xb8(%RBP),%RAX |
(3558) 0x4bc60b MOV (%RAX,%RCX,8),%R11 |
(3558) 0x4bc60f MOV (%RAX,%R9,8),%RCX |
(3558) 0x4bc613 CMP %RCX,%R11 |
(3558) 0x4bc616 JGE 4bc1d0 |
(3558) 0x4bc61c MOV %R11,%RAX |
(3558) 0x4bc61f NOT %RAX |
(3558) 0x4bc622 ADD %RAX,%RCX |
(3558) 0x4bc625 MOV %RCX,-0x38(%RBP) |
(3558) 0x4bc629 CMPQ $0,0x88(%RBP) |
(3558) 0x4bc631 MOV %R11,-0x30(%RBP) |
(3558) 0x4bc635 JE 4bc8da |
(3558) 0x4bc63b XOR %EAX,%EAX |
(3558) 0x4bc63d JMP 4bc659 |
0x4bc63f NOP |
(3562) 0x4bc640 MOV -0x30(%RBP),%R11 |
(3562) 0x4bc644 MOV -0x70(%RBP),%RDI |
(3562) 0x4bc648 LEA 0x1(%RDI),%RAX |
(3562) 0x4bc64c MOV -0x38(%RBP),%RCX |
(3562) 0x4bc650 CMP %RCX,%RDI |
(3562) 0x4bc653 JE 4bc1d0 |
(3562) 0x4bc659 MOV %RAX,-0x70(%RBP) |
(3562) 0x4bc65d ADD %R11,%RAX |
(3562) 0x4bc660 MOV -0x88(%RBP),%RCX |
(3562) 0x4bc667 MOV (%RCX,%RAX,8),%RDI |
(3562) 0x4bc66b MOV 0x20(%RBP),%RCX |
(3562) 0x4bc66f MOV (%RCX,%RDI,8),%RAX |
(3562) 0x4bc673 MOV 0x8(%RCX,%RDI,8),%R13 |
(3562) 0x4bc678 MOV %R13,%R9 |
(3562) 0x4bc67b SUB %RAX,%R9 |
(3562) 0x4bc67e JLE 4bc7e4 |
(3562) 0x4bc684 CMP $0x8,%R9 |
(3562) 0x4bc688 JAE 4bc6d0 |
(3562) 0x4bc68a MOV %R9,%RCX |
(3562) 0x4bc68d AND $-0x8,%RCX |
(3562) 0x4bc691 CMP %R9,%RCX |
(3562) 0x4bc694 JAE 4bc7e0 |
(3562) 0x4bc69a ADD %RCX,%RAX |
(3562) 0x4bc69d MOV 0x28(%RBP),%R9 |
(3562) 0x4bc6a1 MOV -0x30(%RBP),%R11 |
(3562) 0x4bc6a5 JMP 4bc6bc |
0x4bc6a7 NOPW (%RAX,%RAX,1) |
(3565) 0x4bc6b0 INC %RAX |
(3565) 0x4bc6b3 CMP %RAX,%R13 |
(3565) 0x4bc6b6 JE 4bc7e4 |
(3565) 0x4bc6bc MOV (%R9,%RAX,8),%RCX |
(3565) 0x4bc6c0 CMP %R8,(%R14,%RCX,8) |
(3565) 0x4bc6c4 JGE 4bc6b0 |
(3565) 0x4bc6c6 MOV %RBX,(%R14,%RCX,8) |
(3565) 0x4bc6ca INC %RBX |
(3565) 0x4bc6cd JMP 4bc6b0 |
0x4bc6cf NOP |
(3562) 0x4bc6d0 MOV %R9,%RCX |
(3562) 0x4bc6d3 SHR $0x3,%RCX |
(3562) 0x4bc6d7 MOV -0x80(%RBP),%R11 |
(3562) 0x4bc6db LEA (%R11,%RAX,8),%R11 |
(3562) 0x4bc6df JMP 4bc6f9 |
0x4bc6e1 NOPW %CS:(%RAX,%RAX,1) |
(3566) 0x4bc6f0 ADD $0x40,%R11 |
(3566) 0x4bc6f4 DEC %RCX |
(3566) 0x4bc6f7 JE 4bc68a |
(3566) 0x4bc6f9 MOV -0x38(%R11),%R12 |
(3566) 0x4bc6fd CMP %R8,(%R14,%R12,8) |
(3566) 0x4bc701 JGE 4bc770 |
(3566) 0x4bc703 MOV %RBX,(%R14,%R12,8) |
(3566) 0x4bc707 INC %RBX |
(3566) 0x4bc70a MOV -0x30(%R11),%R12 |
(3566) 0x4bc70e CMP %R8,(%R14,%R12,8) |
(3566) 0x4bc712 JL 4bc77a |
(3566) 0x4bc714 MOV -0x28(%R11),%R12 |
(3566) 0x4bc718 CMP %R8,(%R14,%R12,8) |
(3566) 0x4bc71c JGE 4bc78b |
(3566) 0x4bc71e MOV %RBX,(%R14,%R12,8) |
(3566) 0x4bc722 INC %RBX |
(3566) 0x4bc725 MOV -0x20(%R11),%R12 |
(3566) 0x4bc729 CMP %R8,(%R14,%R12,8) |
(3566) 0x4bc72d JL 4bc795 |
(3566) 0x4bc72f MOV -0x18(%R11),%R12 |
(3566) 0x4bc733 CMP %R8,(%R14,%R12,8) |
(3566) 0x4bc737 JGE 4bc7a6 |
(3566) 0x4bc739 MOV %RBX,(%R14,%R12,8) |
(3566) 0x4bc73d INC %RBX |
(3566) 0x4bc740 MOV -0x10(%R11),%R12 |
(3566) 0x4bc744 CMP %R8,(%R14,%R12,8) |
(3566) 0x4bc748 JL 4bc7b0 |
(3566) 0x4bc74a MOV -0x8(%R11),%R12 |
(3566) 0x4bc74e CMP %R8,(%R14,%R12,8) |
(3566) 0x4bc752 JGE 4bc7c1 |
(3566) 0x4bc754 MOV %RBX,(%R14,%R12,8) |
(3566) 0x4bc758 INC %RBX |
(3566) 0x4bc75b MOV (%R11),%R12 |
(3566) 0x4bc75e CMP %R8,(%R14,%R12,8) |
(3566) 0x4bc762 JGE 4bc6f0 |
(3566) 0x4bc764 JMP 4bc7ce |
0x4bc766 NOPW %CS:(%RAX,%RAX,1) |
(3566) 0x4bc770 MOV -0x30(%R11),%R12 |
(3566) 0x4bc774 CMP %R8,(%R14,%R12,8) |
(3566) 0x4bc778 JGE 4bc714 |
(3566) 0x4bc77a MOV %RBX,(%R14,%R12,8) |
(3566) 0x4bc77e INC %RBX |
(3566) 0x4bc781 MOV -0x28(%R11),%R12 |
(3566) 0x4bc785 CMP %R8,(%R14,%R12,8) |
(3566) 0x4bc789 JL 4bc71e |
(3566) 0x4bc78b MOV -0x20(%R11),%R12 |
(3566) 0x4bc78f CMP %R8,(%R14,%R12,8) |
(3566) 0x4bc793 JGE 4bc72f |
(3566) 0x4bc795 MOV %RBX,(%R14,%R12,8) |
(3566) 0x4bc799 INC %RBX |
(3566) 0x4bc79c MOV -0x18(%R11),%R12 |
(3566) 0x4bc7a0 CMP %R8,(%R14,%R12,8) |
(3566) 0x4bc7a4 JL 4bc739 |
(3566) 0x4bc7a6 MOV -0x10(%R11),%R12 |
(3566) 0x4bc7aa CMP %R8,(%R14,%R12,8) |
(3566) 0x4bc7ae JGE 4bc74a |
(3566) 0x4bc7b0 MOV %RBX,(%R14,%R12,8) |
(3566) 0x4bc7b4 INC %RBX |
(3566) 0x4bc7b7 MOV -0x8(%R11),%R12 |
(3566) 0x4bc7bb CMP %R8,(%R14,%R12,8) |
(3566) 0x4bc7bf JL 4bc754 |
(3566) 0x4bc7c1 MOV (%R11),%R12 |
(3566) 0x4bc7c4 CMP %R8,(%R14,%R12,8) |
(3566) 0x4bc7c8 JGE 4bc6f0 |
(3566) 0x4bc7ce MOV %RBX,(%R14,%R12,8) |
(3566) 0x4bc7d2 INC %RBX |
(3566) 0x4bc7d5 JMP 4bc6f0 |
0x4bc7da NOPW (%RAX,%RAX,1) |
(3562) 0x4bc7e0 MOV -0x30(%RBP),%R11 |
(3562) 0x4bc7e4 MOV 0x30(%RBP),%RCX |
(3562) 0x4bc7e8 MOV (%RCX,%RDI,8),%RAX |
(3562) 0x4bc7ec MOV 0x8(%RCX,%RDI,8),%RCX |
(3562) 0x4bc7f1 MOV %RCX,%RDI |
(3562) 0x4bc7f4 SUB %RAX,%RDI |
(3562) 0x4bc7f7 JLE 4bc644 |
(3562) 0x4bc7fd CMP $0x4,%RDI |
(3562) 0x4bc801 JAE 4bc850 |
(3562) 0x4bc803 MOV %RDI,%R9 |
(3562) 0x4bc806 AND $-0x4,%R9 |
(3562) 0x4bc80a CMP %RDI,%R9 |
(3562) 0x4bc80d JAE 4bc640 |
(3562) 0x4bc813 ADD %R9,%RAX |
(3562) 0x4bc816 MOV 0x38(%RBP),%R9 |
(3562) 0x4bc81a MOV -0x30(%RBP),%R11 |
(3562) 0x4bc81e JMP 4bc82c |
(3563) 0x4bc820 INC %RAX |
(3563) 0x4bc823 CMP %RAX,%RCX |
(3563) 0x4bc826 JE 4bc644 |
(3563) 0x4bc82c MOV (%R9,%RAX,8),%RDI |
(3563) 0x4bc830 MOV (%RSI,%RDI,8),%RDI |
(3563) 0x4bc834 ADD %R15,%RDI |
(3563) 0x4bc837 CMP %R10,(%R14,%RDI,8) |
(3563) 0x4bc83b JGE 4bc820 |
(3563) 0x4bc83d MOV %RDX,(%R14,%RDI,8) |
(3563) 0x4bc841 INC %RDX |
(3563) 0x4bc844 JMP 4bc820 |
0x4bc846 NOPW %CS:(%RAX,%RAX,1) |
(3562) 0x4bc850 MOV %RDI,%R9 |
(3562) 0x4bc853 SHR $0x2,%R9 |
(3562) 0x4bc857 MOV -0xc8(%RBP),%R11 |
(3562) 0x4bc85e LEA (%R11,%RAX,8),%R11 |
(3562) 0x4bc862 JMP 4bc879 |
0x4bc864 NOPW %CS:(%RAX,%RAX,1) |
(3564) 0x4bc870 ADD $0x20,%R11 |
(3564) 0x4bc874 DEC %R9 |
(3564) 0x4bc877 JE 4bc803 |
(3564) 0x4bc879 MOV -0x18(%R11),%R12 |
(3564) 0x4bc87d MOV (%RSI,%R12,8),%R13 |
(3564) 0x4bc881 ADD %R15,%R13 |
(3564) 0x4bc884 CMP %R10,(%R14,%R13,8) |
(3564) 0x4bc888 JGE 4bc891 |
(3564) 0x4bc88a MOV %RDX,(%R14,%R13,8) |
(3564) 0x4bc88e INC %RDX |
(3564) 0x4bc891 MOV -0x10(%R11),%R12 |
(3564) 0x4bc895 MOV (%RSI,%R12,8),%R13 |
(3564) 0x4bc899 ADD %R15,%R13 |
(3564) 0x4bc89c CMP %R10,(%R14,%R13,8) |
(3564) 0x4bc8a0 JGE 4bc8a9 |
(3564) 0x4bc8a2 MOV %RDX,(%R14,%R13,8) |
(3564) 0x4bc8a6 INC %RDX |
(3564) 0x4bc8a9 MOV -0x8(%R11),%R12 |
(3564) 0x4bc8ad MOV (%RSI,%R12,8),%R13 |
(3564) 0x4bc8b1 ADD %R15,%R13 |
(3564) 0x4bc8b4 CMP %R10,(%R14,%R13,8) |
(3564) 0x4bc8b8 JGE 4bc8c1 |
(3564) 0x4bc8ba MOV %RDX,(%R14,%R13,8) |
(3564) 0x4bc8be INC %RDX |
(3564) 0x4bc8c1 MOV (%R11),%R12 |
(3564) 0x4bc8c4 MOV (%RSI,%R12,8),%R13 |
(3564) 0x4bc8c8 ADD %R15,%R13 |
(3564) 0x4bc8cb CMP %R10,(%R14,%R13,8) |
(3564) 0x4bc8cf JGE 4bc870 |
(3564) 0x4bc8d1 MOV %RDX,(%R14,%R13,8) |
(3564) 0x4bc8d5 INC %RDX |
(3564) 0x4bc8d8 JMP 4bc870 |
(3558) 0x4bc8da XOR %R12D,%R12D |
(3558) 0x4bc8dd JMP 4bc8f9 |
0x4bc8df NOP |
(3559) 0x4bc8e0 MOV -0x30(%RBP),%R11 |
(3559) 0x4bc8e4 LEA 0x1(%R12),%RAX |
(3559) 0x4bc8e9 MOV -0x38(%RBP),%RCX |
(3559) 0x4bc8ed CMP %RCX,%R12 |
(3559) 0x4bc8f0 MOV %RAX,%R12 |
(3559) 0x4bc8f3 JE 4bc1d0 |
(3559) 0x4bc8f9 LEA (%R11,%R12,1),%RAX |
(3559) 0x4bc8fd MOV -0x88(%RBP),%RCX |
(3559) 0x4bc904 MOV (%RCX,%RAX,8),%RAX |
(3559) 0x4bc908 MOV 0x20(%RBP),%RCX |
(3559) 0x4bc90c MOV (%RCX,%RAX,8),%RDI |
(3559) 0x4bc910 MOV 0x8(%RCX,%RAX,8),%RAX |
(3559) 0x4bc915 MOV %RAX,%R9 |
(3559) 0x4bc918 SUB %RDI,%R9 |
(3559) 0x4bc91b JLE 4bc8e4 |
(3559) 0x4bc91d CMP $0x8,%R9 |
(3559) 0x4bc921 JAE 4bc960 |
(3559) 0x4bc923 MOV %R9,%RCX |
(3559) 0x4bc926 AND $-0x8,%RCX |
(3559) 0x4bc92a CMP %R9,%RCX |
(3559) 0x4bc92d JAE 4bc8e0 |
(3559) 0x4bc92f ADD %RCX,%RDI |
(3559) 0x4bc932 MOV 0x28(%RBP),%R9 |
(3559) 0x4bc936 MOV -0x30(%RBP),%R11 |
(3559) 0x4bc93a JMP 4bc948 |
0x4bc93c NOPL (%RAX) |
(3560) 0x4bc940 INC %RDI |
(3560) 0x4bc943 CMP %RDI,%RAX |
(3560) 0x4bc946 JE 4bc8e4 |
(3560) 0x4bc948 MOV (%R9,%RDI,8),%RCX |
(3560) 0x4bc94c CMP %R8,(%R14,%RCX,8) |
(3560) 0x4bc950 JGE 4bc940 |
(3560) 0x4bc952 MOV %RBX,(%R14,%RCX,8) |
(3560) 0x4bc956 INC %RBX |
(3560) 0x4bc959 JMP 4bc940 |
0x4bc95b NOPL (%RAX,%RAX,1) |
(3559) 0x4bc960 MOV %R9,%RCX |
(3559) 0x4bc963 SHR $0x3,%RCX |
(3559) 0x4bc967 MOV -0x80(%RBP),%R11 |
(3559) 0x4bc96b LEA (%R11,%RDI,8),%R11 |
(3559) 0x4bc96f JMP 4bc989 |
0x4bc971 NOPW %CS:(%RAX,%RAX,1) |
(3561) 0x4bc980 ADD $0x40,%R11 |
(3561) 0x4bc984 DEC %RCX |
(3561) 0x4bc987 JE 4bc923 |
(3561) 0x4bc989 MOV -0x38(%R11),%R13 |
(3561) 0x4bc98d CMP %R8,(%R14,%R13,8) |
(3561) 0x4bc991 JGE 4bca00 |
(3561) 0x4bc993 MOV %RBX,(%R14,%R13,8) |
(3561) 0x4bc997 INC %RBX |
(3561) 0x4bc99a MOV -0x30(%R11),%R13 |
(3561) 0x4bc99e CMP %R8,(%R14,%R13,8) |
(3561) 0x4bc9a2 JL 4bca0a |
(3561) 0x4bc9a4 MOV -0x28(%R11),%R13 |
(3561) 0x4bc9a8 CMP %R8,(%R14,%R13,8) |
(3561) 0x4bc9ac JGE 4bca1b |
(3561) 0x4bc9ae MOV %RBX,(%R14,%R13,8) |
(3561) 0x4bc9b2 INC %RBX |
(3561) 0x4bc9b5 MOV -0x20(%R11),%R13 |
(3561) 0x4bc9b9 CMP %R8,(%R14,%R13,8) |
(3561) 0x4bc9bd JL 4bca25 |
(3561) 0x4bc9bf MOV -0x18(%R11),%R13 |
(3561) 0x4bc9c3 CMP %R8,(%R14,%R13,8) |
(3561) 0x4bc9c7 JGE 4bca36 |
(3561) 0x4bc9c9 MOV %RBX,(%R14,%R13,8) |
(3561) 0x4bc9cd INC %RBX |
(3561) 0x4bc9d0 MOV -0x10(%R11),%R13 |
(3561) 0x4bc9d4 CMP %R8,(%R14,%R13,8) |
(3561) 0x4bc9d8 JL 4bca40 |
(3561) 0x4bc9da MOV -0x8(%R11),%R13 |
(3561) 0x4bc9de CMP %R8,(%R14,%R13,8) |
(3561) 0x4bc9e2 JGE 4bca51 |
(3561) 0x4bc9e4 MOV %RBX,(%R14,%R13,8) |
(3561) 0x4bc9e8 INC %RBX |
(3561) 0x4bc9eb MOV (%R11),%R13 |
(3561) 0x4bc9ee CMP %R8,(%R14,%R13,8) |
(3561) 0x4bc9f2 JGE 4bc980 |
(3561) 0x4bc9f4 JMP 4bca5e |
0x4bc9f6 NOPW %CS:(%RAX,%RAX,1) |
(3561) 0x4bca00 MOV -0x30(%R11),%R13 |
(3561) 0x4bca04 CMP %R8,(%R14,%R13,8) |
(3561) 0x4bca08 JGE 4bc9a4 |
(3561) 0x4bca0a MOV %RBX,(%R14,%R13,8) |
(3561) 0x4bca0e INC %RBX |
(3561) 0x4bca11 MOV -0x28(%R11),%R13 |
(3561) 0x4bca15 CMP %R8,(%R14,%R13,8) |
(3561) 0x4bca19 JL 4bc9ae |
(3561) 0x4bca1b MOV -0x20(%R11),%R13 |
(3561) 0x4bca1f CMP %R8,(%R14,%R13,8) |
(3561) 0x4bca23 JGE 4bc9bf |
(3561) 0x4bca25 MOV %RBX,(%R14,%R13,8) |
(3561) 0x4bca29 INC %RBX |
(3561) 0x4bca2c MOV -0x18(%R11),%R13 |
(3561) 0x4bca30 CMP %R8,(%R14,%R13,8) |
(3561) 0x4bca34 JL 4bc9c9 |
(3561) 0x4bca36 MOV -0x10(%R11),%R13 |
(3561) 0x4bca3a CMP %R8,(%R14,%R13,8) |
(3561) 0x4bca3e JGE 4bc9da |
(3561) 0x4bca40 MOV %RBX,(%R14,%R13,8) |
(3561) 0x4bca44 INC %RBX |
(3561) 0x4bca47 MOV -0x8(%R11),%R13 |
(3561) 0x4bca4b CMP %R8,(%R14,%R13,8) |
(3561) 0x4bca4f JL 4bc9e4 |
(3561) 0x4bca51 MOV (%R11),%R13 |
(3561) 0x4bca54 CMP %R8,(%R14,%R13,8) |
(3561) 0x4bca58 JGE 4bc980 |
(3561) 0x4bca5e MOV %RBX,(%R14,%R13,8) |
(3561) 0x4bca62 INC %RBX |
(3561) 0x4bca65 JMP 4bc980 |
0x4bca6a MOV 0xa0(%RBP),%RAX |
0x4bca71 MOV 0x68(%RBP),%RDX |
0x4bca75 MOV -0x50(%RBP),%RCX |
0x4bca79 MOV (%RCX),%RSI |
0x4bca7c MOVQ $0,(%RSI,%RDX,8) |
0x4bca84 MOV -0x58(%RBP),%RCX |
0x4bca88 MOV (%RCX),%RDI |
0x4bca8b MOVQ $0,(%RDI,%RDX,8) |
0x4bca93 TEST %RAX,%RAX |
0x4bca96 JLE 4bcd66 |
0x4bca9c LEA (%RSI,%RDX,8),%RCX |
0x4bcaa0 LEA (%RDI,%RDX,8),%RDX |
0x4bcaa4 LEA -0x8(%R15,%RAX,8),%R8 |
0x4bcaa9 CMP %RCX,%R8 |
0x4bcaac MOV %R15,%R9 |
0x4bcaaf SETAE %R15B |
0x4bcab3 CMP %R9,%RCX |
0x4bcab6 SETAE %R12B |
0x4bcaba CMP %RDX,%R8 |
0x4bcabd MOV %RBX,%R10 |
0x4bcac0 SETB %BL |
0x4bcac3 CMP %R9,%RDX |
0x4bcac6 SETB %R14B |
0x4bcaca CMP %R10,%RCX |
0x4bcacd SETB %R8B |
0x4bcad1 LEA -0x8(%R10,%RAX,8),%R9 |
0x4bcad6 CMP %RCX,%R9 |
0x4bcad9 SETB %R11B |
0x4bcadd CMP %RDX,%R9 |
0x4bcae0 SETB %R9B |
0x4bcae4 CMP %R10,%RDX |
0x4bcae7 SETB %R10B |
0x4bcaeb TEST %R12B,%R15B |
0x4bcaee JNE 4bccc1 |
0x4bcaf4 OR %R14B,%BL |
0x4bcaf7 JE 4bccc1 |
0x4bcafd CMP %RSI,%RDI |
0x4bcb00 JE 4bccc1 |
0x4bcb06 OR %R11B,%R8B |
0x4bcb09 JE 4bccc1 |
0x4bcb0f OR %R10B,%R9B |
0x4bcb12 JE 4bccc1 |
0x4bcb18 MOV %RAX,%RSI |
0x4bcb1b AND $-0x4,%RSI |
0x4bcb1f JE 4bcd34 |
0x4bcb25 LEA -0x1(%RSI),%RDI |
0x4bcb29 VPXOR %XMM0,%XMM0,%XMM0 |
0x4bcb2d XOR %R8D,%R8D |
0x4bcb30 VPXOR %XMM1,%XMM1,%XMM1 |
0x4bcb34 MOV 0xb0(%RBP),%R9 |
0x4bcb3b MOV 0xa8(%RBP),%R10 |
0x4bcb42 NOPW %CS:(%RAX,%RAX,1) |
(3552) 0x4bcb50 VPADDQ (%R10,%R8,8),%YMM1,%YMM1 |
(3552) 0x4bcb56 VPADDQ (%R9,%R8,8),%YMM0,%YMM0 |
(3552) 0x4bcb5c ADD $0x4,%R8 |
(3552) 0x4bcb60 CMP %RDI,%R8 |
(3552) 0x4bcb63 JLE 4bcb50 |
0x4bcb65 VEXTRACTI128 $0x1,%YMM1,%XMM2 |
0x4bcb6b VPADDQ %XMM2,%XMM1,%XMM1 |
0x4bcb6f VPSHUFD $-0x12,%XMM1,%XMM2 |
0x4bcb74 VPADDQ %XMM2,%XMM1,%XMM1 |
0x4bcb78 VMOVQ %XMM1,%RDI |
0x4bcb7d VEXTRACTI128 $0x1,%YMM0,%XMM1 |
0x4bcb83 VPADDQ %XMM1,%XMM0,%XMM0 |
0x4bcb87 VPSHUFD $-0x12,%XMM0,%XMM1 |
0x4bcb8c VPADDQ %XMM1,%XMM0,%XMM0 |
0x4bcb90 VMOVQ %XMM0,%R8 |
0x4bcb95 CMP %RAX,%RSI |
0x4bcb98 JNE 4bcd50 |
0x4bcb9e JMP 4bcd60 |
0x4bcba3 MOV -0x48(%RBP),%R11 |
0x4bcba7 MOV 0xc0(%RBP),%R14 |
0x4bcbae MOV -0x40(%RBP),%RSI |
0x4bcbb2 JMP 4bcbe0 |
0x4bcbb4 XOR %EDX,%EDX |
0x4bcbb6 MOV -0x48(%RBP),%R11 |
0x4bcbba MOV 0xc0(%RBP),%R14 |
0x4bcbc1 MOV -0x40(%RBP),%RSI |
0x4bcbc5 INC %RDX |
0x4bcbc8 NOPL (%RAX,%RAX,1) |
(3556) 0x4bcbd0 ADD (%R15,%RDX,8),%RAX |
(3556) 0x4bcbd4 ADD (%RBX,%RDX,8),%RCX |
(3556) 0x4bcbd8 INC %RDX |
(3556) 0x4bcbdb CMP %RDX,%RDI |
(3556) 0x4bcbde JNE 4bcbd0 |
0x4bcbe0 CMP %R11,%RSI |
0x4bcbe3 JGE 4bcd66 |
0x4bcbe9 MOV -0x50(%RBP),%RDX |
0x4bcbed MOV (%RDX),%RDX |
0x4bcbf0 MOV -0x58(%RBP),%RSI |
0x4bcbf4 MOV (%RSI),%RSI |
0x4bcbf7 LEA -0x8(%RDX,%R11,8),%R10 |
0x4bcbfc MOV 0xb8(%RBP),%R12 |
0x4bcc03 CMP %R12,%RDI |
0x4bcc06 CMOVL %RDI,%R12 |
0x4bcc0a IMUL %RDI,%R14 |
0x4bcc0e LEA (%R12,%R14,1),%RDI |
0x4bcc12 LEA (%RSI,%RDI,8),%R8 |
0x4bcc16 LEA (%RDX,%RDI,8),%R9 |
0x4bcc1a CMP %R8,%R10 |
0x4bcc1d JB 4bcc57 |
0x4bcc1f LEA -0x8(%RSI,%R11,8),%R10 |
0x4bcc24 CMP %R9,%R10 |
0x4bcc27 JB 4bcc57 |
0x4bcc29 NOPL (%RAX) |
(3555) 0x4bcc30 LEA (%RDX,%RDI,8),%R8 |
(3555) 0x4bcc34 MOV (%R8),%R9 |
(3555) 0x4bcc37 ADD %RAX,%R9 |
(3555) 0x4bcc3a MOV %R9,(%R8) |
(3555) 0x4bcc3d LEA (%RSI,%RDI,8),%R8 |
(3555) 0x4bcc41 MOV (%R8),%R9 |
(3555) 0x4bcc44 ADD %RCX,%R9 |
(3555) 0x4bcc47 MOV %R9,(%R8) |
(3555) 0x4bcc4a INC %RDI |
(3555) 0x4bcc4d CMP %RDI,%R11 |
(3555) 0x4bcc50 JNE 4bcc30 |
0x4bcc52 JMP 4bcd66 |
0x4bcc57 MOV %R11,%R10 |
0x4bcc5a SUB %RDI,%R10 |
0x4bcc5d MOV %R10,%RDI |
0x4bcc60 AND $-0x4,%RDI |
0x4bcc64 JE 4bcd04 |
0x4bcc6a MOV %R14,%R15 |
0x4bcc6d MOV %R11,%R14 |
0x4bcc70 LEA -0x1(%RDI),%R11 |
0x4bcc74 VPBROADCASTQ %RAX,%YMM0 |
0x4bcc7a VPBROADCASTQ %RCX,%YMM1 |
0x4bcc80 XOR %EBX,%EBX |
0x4bcc82 NOPW %CS:(%RAX,%RAX,1) |
(3554) 0x4bcc90 VPADDQ (%R9,%RBX,8),%YMM0,%YMM2 |
(3554) 0x4bcc96 VMOVDQU %YMM2,(%R9,%RBX,8) |
(3554) 0x4bcc9c VPADDQ (%R8,%RBX,8),%YMM1,%YMM2 |
(3554) 0x4bcca2 VMOVDQU %YMM2,(%R8,%RBX,8) |
(3554) 0x4bcca8 ADD $0x4,%RBX |
(3554) 0x4bccac CMP %R11,%RBX |
(3554) 0x4bccaf JBE 4bcc90 |
0x4bccb1 CMP %RDI,%R10 |
0x4bccb4 MOV %R14,%R11 |
0x4bccb7 MOV %R15,%R14 |
0x4bccba JNE 4bcd06 |
0x4bccbc JMP 4bcd66 |
0x4bccc1 XOR %ESI,%ESI |
0x4bccc3 MOV 0xb0(%RBP),%R9 |
0x4bccca MOV 0xa8(%RBP),%R10 |
0x4bccd1 NOPW %CS:(%RAX,%RAX,1) |
(3550) 0x4bcce0 MOV (%R10,%RSI,8),%RDI |
(3550) 0x4bcce4 MOV (%RCX),%R8 |
(3550) 0x4bcce7 ADD %RDI,%R8 |
(3550) 0x4bccea MOV %R8,(%RCX) |
(3550) 0x4bcced MOV (%R9,%RSI,8),%RDI |
(3550) 0x4bccf1 MOV (%RDX),%R8 |
(3550) 0x4bccf4 ADD %RDI,%R8 |
(3550) 0x4bccf7 MOV %R8,(%RDX) |
(3550) 0x4bccfa INC %RSI |
(3550) 0x4bccfd CMP %RSI,%RAX |
(3550) 0x4bcd00 JNE 4bcce0 |
0x4bcd02 JMP 4bcd66 |
0x4bcd04 XOR %EDI,%EDI |
0x4bcd06 ADD %R12,%RDI |
0x4bcd09 ADD %R14,%RDI |
0x4bcd0c NOPL (%RAX) |
(3553) 0x4bcd10 LEA (%RDX,%RDI,8),%R8 |
(3553) 0x4bcd14 MOV (%R8),%R9 |
(3553) 0x4bcd17 ADD %RAX,%R9 |
(3553) 0x4bcd1a MOV %R9,(%R8) |
(3553) 0x4bcd1d LEA (%RSI,%RDI,8),%R8 |
(3553) 0x4bcd21 MOV (%R8),%R9 |
(3553) 0x4bcd24 ADD %RCX,%R9 |
(3553) 0x4bcd27 MOV %R9,(%R8) |
(3553) 0x4bcd2a INC %RDI |
(3553) 0x4bcd2d CMP %RDI,%R11 |
(3553) 0x4bcd30 JNE 4bcd10 |
0x4bcd32 JMP 4bcd66 |
0x4bcd34 XOR %R8D,%R8D |
0x4bcd37 XOR %EDI,%EDI |
0x4bcd39 XOR %ESI,%ESI |
0x4bcd3b MOV 0xb0(%RBP),%R9 |
0x4bcd42 MOV 0xa8(%RBP),%R10 |
0x4bcd49 NOPL (%RAX) |
(3551) 0x4bcd50 ADD (%R10,%RSI,8),%RDI |
(3551) 0x4bcd54 ADD (%R9,%RSI,8),%R8 |
(3551) 0x4bcd58 INC %RSI |
(3551) 0x4bcd5b CMP %RSI,%RAX |
(3551) 0x4bcd5e JNE 4bcd50 |
0x4bcd60 ADD %RDI,(%RCX) |
0x4bcd63 MOV %R8,(%RDX) |
0x4bcd66 ADD $0xb8,%RSP |
0x4bcd6d POP %RBX |
0x4bcd6e POP %R12 |
0x4bcd70 POP %R13 |
0x4bcd72 POP %R14 |
0x4bcd74 POP %R15 |
0x4bcd76 POP %RBP |
0x4bcd77 VZEROUPPER |
0x4bcd7a RET |
0x4bcd7b NOPL (%RAX,%RAX,1) |
Path / |
Source file and lines | par_csr_matop.c:102-276 |
Module | exec |
nb instructions | 307 |
nb uops | 314 |
loop length | 1381 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 2 |
used zmm registers | 0 |
nb stack references | 29 |
micro-operation queue | 52.33 cycles |
front end | 52.33 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 23.10 | 23.30 | 19.00 | 19.00 | 18.00 | 23.30 | 23.10 | 18.00 | 18.00 | 18.00 | 23.20 | 19.00 |
cycles | 23.10 | 23.30 | 19.00 | 19.00 | 18.00 | 23.30 | 23.10 | 18.00 | 18.00 | 18.00 | 23.20 | 19.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 51.66-51.65 |
Stall cycles | 0.00 |
Front-end | 52.33 |
Dispatch | 23.30 |
Overall L1 | 52.33 |
all | 24% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 100% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 25% |
all | 15% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 25% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0xb8,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc0(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xb8(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x90(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x80(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 4e8ab0 <hypre_GetThreadNum> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0x1(%RAX),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %R13,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4bc108 <hypre_ParMatmul_RowSizes.extracted+0x1a8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA 0x1(%R14),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
IMUL %RCX,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RAX,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %RCX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 4bc128 <hypre_ParMatmul_RowSizes.extracted+0x1c8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA (%R12,%R15,1),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4e6d80 <hypre_CAlloc> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
ADD %R15,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4bc011 <hypre_ParMatmul_RowSizes.extracted+0xb1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SAL $0x3,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R12,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4efe80 <_intel_fast_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x60(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %RBX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JL 4bc13c <hypre_ParMatmul_RowSizes.extracted+0x1dc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xa8(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x60(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,(%R15,%R12,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xb0(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,(%RBX,%R12,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4e6e50 <hypre_Free> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x90(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x736190,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 410020 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 4bca6a <hypre_ParMatmul_RowSizes.extracted+0xb0a> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV (%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x1,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4bcba3 <hypre_ParMatmul_RowSizes.extracted+0xc43> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RDI),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bcbb4 <hypre_ParMatmul_RowSizes.extracted+0xc54> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ %RAX,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VMOVQ %RCX,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
LEA -0x1(%RDX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x48(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xc0(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VEXTRACTI128 $0x1,%YMM1,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %XMM2,%XMM1,%XMM1 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VPSHUFD $-0x12,%XMM1,%XMM2 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %XMM2,%XMM1,%XMM1 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VMOVQ %XMM1,%RAX | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VEXTRACTI128 $0x1,%YMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %XMM1,%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VPSHUFD $-0x12,%XMM0,%XMM1 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %XMM1,%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VMOVQ %XMM0,%RCX | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
CMP %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x40(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 4bcbc5 <hypre_ParMatmul_RowSizes.extracted+0xc65> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4bcbe0 <hypre_ParMatmul_RowSizes.extracted+0xc80> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %RCX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %R13,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %R13,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %RCX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JNE 4bbfe4 <hypre_ParMatmul_RowSizes.extracted+0x84> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %R14D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %RBX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4bc029 <hypre_ParMatmul_RowSizes.extracted+0xc9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x60(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x58(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x28(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xb8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVL %RCX,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IMUL 0xc0(%RBP),%RCX | 1 | 0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
ADD %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
NOT %RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RBX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x38(%RDX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0xd8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x38(%RDI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x38(%R9),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x18(%R8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R10D,%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R8,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 4bc208 <hypre_ParMatmul_RowSizes.extracted+0x2a8> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x68(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x50(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,(%RSI,%RDX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x58(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,(%RDI,%RDX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4bcd66 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%RSI,%RDX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RDI,%RDX,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x8(%R15,%RAX,8),%R8 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %RCX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R15,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SETAE %R15B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %R9,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETAE %R12B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %RDX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SETB %BL | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %R9,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %R14B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %R10,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %R8B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LEA -0x8(%R10,%RAX,8),%R9 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %RCX,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %R11B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %RDX,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %R9B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %R10,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %R10B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %R12B,%R15B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 4bccc1 <hypre_ParMatmul_RowSizes.extracted+0xd61> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
OR %R14B,%BL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bccc1 <hypre_ParMatmul_RowSizes.extracted+0xd61> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JE 4bccc1 <hypre_ParMatmul_RowSizes.extracted+0xd61> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
OR %R11B,%R8B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bccc1 <hypre_ParMatmul_RowSizes.extracted+0xd61> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
OR %R10B,%R9B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bccc1 <hypre_ParMatmul_RowSizes.extracted+0xd61> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bcd34 <hypre_ParMatmul_RowSizes.extracted+0xdd4> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RSI),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPXOR %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPXOR %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xb0(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VEXTRACTI128 $0x1,%YMM1,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %XMM2,%XMM1,%XMM1 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VPSHUFD $-0x12,%XMM1,%XMM2 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %XMM2,%XMM1,%XMM1 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VMOVQ %XMM1,%RDI | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VEXTRACTI128 $0x1,%YMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %XMM1,%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VPSHUFD $-0x12,%XMM0,%XMM1 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %XMM1,%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VMOVQ %XMM0,%R8 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
CMP %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4bcd50 <hypre_ParMatmul_RowSizes.extracted+0xdf0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4bcd60 <hypre_ParMatmul_RowSizes.extracted+0xe00> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x48(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xc0(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x40(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4bcbe0 <hypre_ParMatmul_RowSizes.extracted+0xc80> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x48(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xc0(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x40(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
INC %RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R11,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4bcd66 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x50(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x58(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x8(%RDX,%R11,8),%R10 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0xb8(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R12,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVL %RDI,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IMUL %RDI,%R14 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%R12,%R14,1),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RSI,%RDI,8),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RDX,%RDI,8),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R8,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4bcc57 <hypre_ParMatmul_RowSizes.extracted+0xcf7> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x8(%RSI,%R11,8),%R10 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %R9,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4bcc57 <hypre_ParMatmul_RowSizes.extracted+0xcf7> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4bcd66 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R11,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RDI,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R10,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bcd04 <hypre_ParMatmul_RowSizes.extracted+0xda4> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R14,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R11,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x1(%RDI),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPBROADCASTQ %RAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %RCX,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDI,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R14,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R15,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JNE 4bcd06 <hypre_ParMatmul_RowSizes.extracted+0xda6> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4bcd66 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xb0(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4bcd66 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD %R12,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %R14,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4bcd66 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xb0(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD %RDI,(%RCX) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
MOV %R8,(%RDX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $0xb8,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | par_csr_matop.c:102-276 |
Module | exec |
nb instructions | 307 |
nb uops | 314 |
loop length | 1381 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 2 |
used zmm registers | 0 |
nb stack references | 29 |
micro-operation queue | 52.33 cycles |
front end | 52.33 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 23.10 | 23.30 | 19.00 | 19.00 | 18.00 | 23.30 | 23.10 | 18.00 | 18.00 | 18.00 | 23.20 | 19.00 |
cycles | 23.10 | 23.30 | 19.00 | 19.00 | 18.00 | 23.30 | 23.10 | 18.00 | 18.00 | 18.00 | 23.20 | 19.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 51.66-51.65 |
Stall cycles | 0.00 |
Front-end | 52.33 |
Dispatch | 23.30 |
Overall L1 | 52.33 |
all | 24% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 100% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 25% |
all | 15% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 25% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0xb8,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc0(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xb8(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x90(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x80(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 4e8ab0 <hypre_GetThreadNum> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0x1(%RAX),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %R13,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4bc108 <hypre_ParMatmul_RowSizes.extracted+0x1a8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA 0x1(%R14),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
IMUL %RCX,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RAX,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %RCX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 4bc128 <hypre_ParMatmul_RowSizes.extracted+0x1c8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA (%R12,%R15,1),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4e6d80 <hypre_CAlloc> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
ADD %R15,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4bc011 <hypre_ParMatmul_RowSizes.extracted+0xb1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
SAL $0x3,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV $0xff,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R12,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4efe80 <_intel_fast_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x60(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %RBX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JL 4bc13c <hypre_ParMatmul_RowSizes.extracted+0x1dc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xa8(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x60(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,(%R15,%R12,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xb0(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,(%RBX,%R12,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4e6e50 <hypre_Free> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x90(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x736190,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 410020 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 4bca6a <hypre_ParMatmul_RowSizes.extracted+0xb0a> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV (%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x1,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4bcba3 <hypre_ParMatmul_RowSizes.extracted+0xc43> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RDI),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bcbb4 <hypre_ParMatmul_RowSizes.extracted+0xc54> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVQ %RAX,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VMOVQ %RCX,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
LEA -0x1(%RDX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x48(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xc0(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VEXTRACTI128 $0x1,%YMM1,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %XMM2,%XMM1,%XMM1 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VPSHUFD $-0x12,%XMM1,%XMM2 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %XMM2,%XMM1,%XMM1 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VMOVQ %XMM1,%RAX | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VEXTRACTI128 $0x1,%YMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %XMM1,%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VPSHUFD $-0x12,%XMM0,%XMM1 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %XMM1,%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VMOVQ %XMM0,%RCX | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
CMP %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x40(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 4bcbc5 <hypre_ParMatmul_RowSizes.extracted+0xc65> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4bcbe0 <hypre_ParMatmul_RowSizes.extracted+0xc80> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %RCX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %R13,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %R13,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %RCX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JNE 4bbfe4 <hypre_ParMatmul_RowSizes.extracted+0x84> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %R14D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %RBX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4bc029 <hypre_ParMatmul_RowSizes.extracted+0xc9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x60(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x58(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x28(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xb8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVL %RCX,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IMUL 0xc0(%RBP),%RCX | 1 | 0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
ADD %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
NOT %RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RBX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x38(%RDX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0xd8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x38(%RDI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x38(%R9),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x18(%R8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R10D,%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R8,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 4bc208 <hypre_ParMatmul_RowSizes.extracted+0x2a8> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x68(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x50(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,(%RSI,%RDX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x58(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,(%RDI,%RDX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4bcd66 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%RSI,%RDX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RDI,%RDX,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x8(%R15,%RAX,8),%R8 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %RCX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R15,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SETAE %R15B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %R9,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETAE %R12B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %RDX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SETB %BL | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %R9,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %R14B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %R10,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %R8B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LEA -0x8(%R10,%RAX,8),%R9 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %RCX,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %R11B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %RDX,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %R9B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP %R10,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %R10B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %R12B,%R15B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 4bccc1 <hypre_ParMatmul_RowSizes.extracted+0xd61> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
OR %R14B,%BL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bccc1 <hypre_ParMatmul_RowSizes.extracted+0xd61> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JE 4bccc1 <hypre_ParMatmul_RowSizes.extracted+0xd61> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
OR %R11B,%R8B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bccc1 <hypre_ParMatmul_RowSizes.extracted+0xd61> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
OR %R10B,%R9B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bccc1 <hypre_ParMatmul_RowSizes.extracted+0xd61> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bcd34 <hypre_ParMatmul_RowSizes.extracted+0xdd4> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RSI),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPXOR %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPXOR %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xb0(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VEXTRACTI128 $0x1,%YMM1,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %XMM2,%XMM1,%XMM1 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VPSHUFD $-0x12,%XMM1,%XMM2 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %XMM2,%XMM1,%XMM1 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VMOVQ %XMM1,%RDI | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VEXTRACTI128 $0x1,%YMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %XMM1,%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VPSHUFD $-0x12,%XMM0,%XMM1 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %XMM1,%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VMOVQ %XMM0,%R8 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
CMP %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4bcd50 <hypre_ParMatmul_RowSizes.extracted+0xdf0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4bcd60 <hypre_ParMatmul_RowSizes.extracted+0xe00> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x48(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xc0(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x40(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4bcbe0 <hypre_ParMatmul_RowSizes.extracted+0xc80> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x48(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xc0(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x40(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
INC %RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R11,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4bcd66 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x50(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x58(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x8(%RDX,%R11,8),%R10 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0xb8(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R12,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVL %RDI,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IMUL %RDI,%R14 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%R12,%R14,1),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RSI,%RDI,8),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RDX,%RDI,8),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R8,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4bcc57 <hypre_ParMatmul_RowSizes.extracted+0xcf7> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x8(%RSI,%R11,8),%R10 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %R9,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4bcc57 <hypre_ParMatmul_RowSizes.extracted+0xcf7> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4bcd66 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R11,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RDI,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R10,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4bcd04 <hypre_ParMatmul_RowSizes.extracted+0xda4> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R14,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R11,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x1(%RDI),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPBROADCASTQ %RAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %RCX,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
XOR %EBX,%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDI,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R14,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R15,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JNE 4bcd06 <hypre_ParMatmul_RowSizes.extracted+0xda6> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4bcd66 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xb0(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4bcd66 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD %R12,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %R14,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4bcd66 <hypre_ParMatmul_RowSizes.extracted+0xe06> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xb0(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD %RDI,(%RCX) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
MOV %R8,(%RDX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $0xb8,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_ParMatmul_RowSizes.extracted– | 1.51 | 0.33 |
▼Loop 3558 - par_csr_matop.c:109-242 - exec– | 0.04 | 0.01 |
▼Loop 3562 - par_csr_matop.c:109-231 - exec– | 0.6 | 0.12 |
○Loop 3565 - par_csr_matop.c:195-208 - exec | 0.8 | 0.16 |
○Loop 3566 - par_csr_matop.c:195-208 - exec | 0.04 | 0.01 |
○Loop 3564 - par_csr_matop.c:218-231 - exec | 0 | 0 |
○Loop 3563 - par_csr_matop.c:218-231 - exec | 0 | 0.01 |
▼Loop 3559 - par_csr_matop.c:109-231 - exec– | 0 | 0 |
○Loop 3561 - par_csr_matop.c:195-208 - exec | 0 | 0 |
○Loop 3560 - par_csr_matop.c:195-208 - exec | 0 | 0 |
▼Loop 3567 - par_csr_matop.c:109-177 - exec– | 0 | 0 |
○Loop 3569 - par_csr_matop.c:170-177 - exec | 0 | 0 |
○Loop 3568 - par_csr_matop.c:170-177 - exec | 0 | 0 |
○Loop 3571 - par_csr_matop.c:154-167 - exec | 0 | 0 |
○Loop 3570 - par_csr_matop.c:154-167 - exec | 0 | 0 |
○Loop 3554 - par_csr_matop.c:263-266 - exec | 0.02 | 0 |
○Loop 3557 - par_csr_matop.c:257-260 - exec | 0 | 0 |
○Loop 3553 - par_csr_matop.c:263-266 - exec | 0 | 0 |
○Loop 3550 - par_csr_matop.c:273-276 - exec | 0 | 0 |
○Loop 3552 - par_csr_matop.c:109-273 - exec | 0 | 0 |
○Loop 3555 - par_csr_matop.c:263-266 - exec | 0 | 0 |
○Loop 3556 - par_csr_matop.c:257-260 - exec | 0 | 0 |
○Loop 3551 - par_csr_matop.c:109-273 - exec | 0 | 0 |