Function: hypre_CSRMatrixTranspose.extracted | Module: exec | Source: csr_matop.c:380-560 [...] | Coverage: 0.18% |
---|
Function: hypre_CSRMatrixTranspose.extracted | Module: exec | Source: csr_matop.c:380-560 [...] | Coverage: 0.18% |
---|
/scratch_na/users/xoserete/qaas_runs/171-172-8217/intel/AMG/build/AMG/AMG/seq_mv/csr_matop.c: 380 - 560 |
-------------------------------------------------------------------------------- |
380: return idx%dim1*dim2 + idx/dim1; |
[...] |
463: #pragma omp parallel |
464: #endif |
465: { |
466: HYPRE_Int num_threads = hypre_NumActiveThreads(); |
467: HYPRE_Int my_thread_num = hypre_GetThreadNum(); |
468: |
469: HYPRE_Int iBegin = hypre_CSRMatrixGetLoadBalancedPartitionBegin(A); |
470: HYPRE_Int iEnd = hypre_CSRMatrixGetLoadBalancedPartitionEnd(A); |
471: hypre_assert(iBegin <= iEnd); |
472: hypre_assert(iBegin >= 0 && iBegin <= num_rowsA); |
473: hypre_assert(iEnd >= 0 && iEnd <= num_rowsA); |
474: |
475: HYPRE_Int i, j; |
476: memset(bucket + my_thread_num*num_colsA, 0, sizeof(HYPRE_Int)*num_colsA); |
[...] |
483: for (j = A_i[iBegin]; j < A_i[iEnd]; ++j) { |
484: HYPRE_Int idx = A_j[j]; |
485: bucket[my_thread_num*num_colsA + idx]++; |
[...] |
496: for (i = my_thread_num*num_colsA + 1; i < (my_thread_num + 1)*num_colsA; ++i) { |
497: HYPRE_Int transpose_i = transpose_idx(i, num_threads, num_colsA); |
498: HYPRE_Int transpose_i_minus_1 = transpose_idx(i - 1, num_threads, num_colsA); |
499: |
500: bucket[transpose_i] += bucket[transpose_i_minus_1]; |
501: } |
502: |
503: #ifdef HYPRE_USING_OPENMP |
504: #pragma omp barrier |
505: #pragma omp master |
506: #endif |
507: { |
508: for (i = 1; i < num_threads; ++i) { |
509: HYPRE_Int j0 = num_colsA*i - 1, j1 = num_colsA*(i + 1) - 1; |
510: HYPRE_Int transpose_j0 = transpose_idx(j0, num_threads, num_colsA); |
511: HYPRE_Int transpose_j1 = transpose_idx(j1, num_threads, num_colsA); |
512: |
513: bucket[transpose_j1] += bucket[transpose_j0]; |
[...] |
520: if (my_thread_num > 0) { |
521: HYPRE_Int transpose_i0 = transpose_idx(num_colsA*my_thread_num - 1, num_threads, num_colsA); |
522: HYPRE_Int offset = bucket[transpose_i0]; |
523: |
524: for (i = my_thread_num*num_colsA; i < (my_thread_num + 1)*num_colsA - 1; ++i) { |
525: HYPRE_Int transpose_i = transpose_idx(i, num_threads, num_colsA); |
526: |
527: bucket[transpose_i] += offset; |
[...] |
539: if (data) { |
540: for (i = iEnd - 1; i >= iBegin; --i) { |
541: for (j = A_i[i + 1] - 1; j >= A_i[i]; --j) { |
542: HYPRE_Int idx = A_j[j]; |
543: --bucket[my_thread_num*num_colsA + idx]; |
544: |
545: HYPRE_Int offset = bucket[my_thread_num*num_colsA + idx]; |
546: |
547: AT_data[offset] = A_data[j]; |
548: AT_j[offset] = i; |
549: } |
550: } |
551: } |
552: else { |
553: for (i = iEnd - 1; i >= iBegin; --i) { |
554: for (j = A_i[i + 1] - 1; j >= A_i[i]; --j) { |
555: HYPRE_Int idx = A_j[j]; |
556: --bucket[my_thread_num*num_colsA + idx]; |
557: |
558: HYPRE_Int offset = bucket[my_thread_num*num_colsA + idx]; |
559: |
560: AT_j[offset] = i; |
0x4c9ea0 PUSH %RBP |
0x4c9ea1 MOV %RSP,%RBP |
0x4c9ea4 PUSH %R15 |
0x4c9ea6 PUSH %R14 |
0x4c9ea8 PUSH %R13 |
0x4c9eaa PUSH %R12 |
0x4c9eac PUSH %RBX |
0x4c9ead SUB $0x38,%RSP |
0x4c9eb1 MOV %R9,%RBX |
0x4c9eb4 MOV %R8,-0x50(%RBP) |
0x4c9eb8 MOV %RCX,-0x60(%RBP) |
0x4c9ebc MOV %RDX,%R13 |
0x4c9ebf MOV %RDI,-0x30(%RBP) |
0x4c9ec3 CALL 4d7300 <hypre_NumActiveThreads> |
0x4c9ec8 MOV %RAX,%R15 |
0x4c9ecb CALL 4d7310 <hypre_GetThreadNum> |
0x4c9ed0 MOV %RAX,%R14 |
0x4c9ed3 MOV %R13,%RDI |
0x4c9ed6 CALL 4cbd60 <hypre_CSRMatrixGetLoadBalancedPartitionBegin> |
0x4c9edb MOV %RAX,%R12 |
0x4c9ede MOV %R13,%RDI |
0x4c9ee1 CALL 4cbde0 <hypre_CSRMatrixGetLoadBalancedPartitionEnd> |
0x4c9ee6 MOV %RAX,%RCX |
0x4c9ee9 CMP %R12,%RAX |
0x4c9eec MOV %R12,%RAX |
0x4c9eef MOV %R12,-0x40(%RBP) |
0x4c9ef3 MOV %RCX,-0x38(%RBP) |
0x4c9ef7 JGE 4c9f2f |
0x4c9ef9 MOV 0x250d00(%RIP),%RDI |
0x4c9f00 MOV $0x4f4525,%ESI |
0x4c9f05 MOV $0x4f653b,%EDX |
0x4c9f0a XOR %EAX,%EAX |
0x4c9f0c CALL 4d58d0 <hypre_fprintf> |
0x4c9f11 MOV $0x4f64b4,%EDI |
0x4c9f16 MOV $0x1d7,%ESI |
0x4c9f1b MOV $0x1,%EDX |
0x4c9f20 XOR %ECX,%ECX |
0x4c9f22 CALL 4d8210 <hypre_error_handler> |
0x4c9f27 MOV -0x38(%RBP),%RCX |
0x4c9f2b MOV -0x40(%RBP),%R12 |
0x4c9f2f MOV 0x18(%RBP),%RAX |
0x4c9f33 TEST %R12,%R12 |
0x4c9f36 JS 4c9f3d |
0x4c9f38 CMP %RAX,%R12 |
0x4c9f3b JLE 4c9f75 |
0x4c9f3d MOV 0x250cbc(%RIP),%RDI |
0x4c9f44 MOV $0x4f4525,%ESI |
0x4c9f49 MOV $0x4f654a,%EDX |
0x4c9f4e MOV %RAX,%R12 |
0x4c9f51 XOR %EAX,%EAX |
0x4c9f53 CALL 4d58d0 <hypre_fprintf> |
0x4c9f58 MOV $0x4f64b4,%EDI |
0x4c9f5d MOV $0x1d8,%ESI |
0x4c9f62 MOV $0x1,%EDX |
0x4c9f67 XOR %ECX,%ECX |
0x4c9f69 CALL 4d8210 <hypre_error_handler> |
0x4c9f6e MOV %R12,%RAX |
0x4c9f71 MOV -0x38(%RBP),%RCX |
0x4c9f75 MOV 0x38(%RBP),%R13 |
0x4c9f79 MOV 0x20(%RBP),%R12 |
0x4c9f7d TEST %RCX,%RCX |
0x4c9f80 JS 4c9f87 |
0x4c9f82 CMP %RAX,%RCX |
0x4c9f85 JLE 4c9fb5 |
0x4c9f87 MOV 0x250c72(%RIP),%RDI |
0x4c9f8e MOV $0x4f4525,%ESI |
0x4c9f93 MOV $0x4f656d,%EDX |
0x4c9f98 XOR %EAX,%EAX |
0x4c9f9a CALL 4d58d0 <hypre_fprintf> |
0x4c9f9f MOV $0x4f64b4,%EDI |
0x4c9fa4 MOV $0x1d9,%ESI |
0x4c9fa9 MOV $0x1,%EDX |
0x4c9fae XOR %ECX,%ECX |
0x4c9fb0 CALL 4d8210 <hypre_error_handler> |
0x4c9fb5 MOV (%R12),%RDX |
0x4c9fb9 MOV %RDX,%RAX |
0x4c9fbc IMUL %R14,%RAX |
0x4c9fc0 LEA (%R13,%RAX,8),%RDI |
0x4c9fc5 SAL $0x3,%RDX |
0x4c9fc9 XOR %ESI,%ESI |
0x4c9fcb CALL 4e0430 <__intel_avx_rep_memset> |
0x4c9fd0 MOV -0x38(%RBP),%RSI |
0x4c9fd4 MOV 0x10(%RBP),%RDX |
0x4c9fd8 MOV -0x40(%RBP),%RAX |
0x4c9fdc MOV (%RBX,%RAX,8),%RAX |
0x4c9fe0 CMP (%RBX,%RSI,8),%RAX |
0x4c9fe4 JGE 4ca00d |
0x4c9fe6 NOPW %CS:(%RAX,%RAX,1) |
(3958) 0x4c9ff0 MOV (%R12),%RCX |
(3958) 0x4c9ff4 IMUL %R14,%RCX |
(3958) 0x4c9ff8 ADD (%RDX,%RAX,8),%RCX |
(3958) 0x4c9ffc LEA (%R13,%RCX,8),%RCX |
(3958) 0x4ca001 INCQ (%RCX) |
(3958) 0x4ca004 INC %RAX |
(3958) 0x4ca007 CMP (%RBX,%RSI,8),%RAX |
(3958) 0x4ca00b JL 4c9ff0 |
0x4ca00d MOV -0x30(%RBP),%RAX |
0x4ca011 MOV (%RAX),%ESI |
0x4ca013 MOV $0x719ab0,%EDI |
0x4ca018 CALL 40fed0 <__kmpc_barrier@plt> |
0x4ca01d MOV (%R12),%R9 |
0x4ca021 MOV %R9,%RCX |
0x4ca024 IMUL %R14,%RCX |
0x4ca028 LEA 0x1(%R14),%R11 |
0x4ca02c LEA 0x1(%RCX),%RAX |
0x4ca030 MOV %R9,%RDX |
0x4ca033 IMUL %R11,%RDX |
0x4ca037 CMP %RDX,%RAX |
0x4ca03a JL 4ca16b |
0x4ca040 MOV %R11,-0x58(%RBP) |
0x4ca044 MOV -0x30(%RBP),%RAX |
0x4ca048 MOV (%RAX),%ESI |
0x4ca04a MOV $0x719ad0,%EDI |
0x4ca04f CALL 40fed0 <__kmpc_barrier@plt> |
0x4ca054 MOV -0x30(%RBP),%RAX |
0x4ca058 MOV (%RAX),%ESI |
0x4ca05a MOV $0x719af0,%EDI |
0x4ca05f XOR %EDX,%EDX |
0x4ca061 CALL 410040 <__kmpc_masked@plt> |
0x4ca066 CMP $0x1,%EAX |
0x4ca069 JNE 4ca2c3 |
0x4ca06f CMP $0x1,%R15 |
0x4ca073 MOV -0x30(%RBP),%R9 |
0x4ca077 JLE 4ca2b6 |
0x4ca07d LEA -0x1(%R15),%RAX |
0x4ca081 MOV %RAX,-0x48(%RBP) |
0x4ca085 CMP $0x4,%RAX |
0x4ca089 JAE 4ca55a |
0x4ca08f MOV -0x48(%RBP),%RAX |
0x4ca093 MOV %RAX,%R8 |
0x4ca096 AND $-0x4,%R8 |
0x4ca09a CMP %RAX,%R8 |
0x4ca09d MOV -0x30(%RBP),%R9 |
0x4ca0a1 JAE 4ca2b6 |
0x4ca0a7 INC %R8 |
0x4ca0aa JMP 4ca0d6 |
0x4ca0ac NOPL (%RAX) |
(3955) 0x4ca0b0 CQTO |
(3955) 0x4ca0b2 IDIV %R15 |
(3955) 0x4ca0b5 IMUL %RDI,%RCX |
(3955) 0x4ca0b9 ADD %RSI,%RCX |
(3955) 0x4ca0bc MOV (%R13,%RCX,8),%RCX |
(3955) 0x4ca0c1 IMUL %RDI,%RDX |
(3955) 0x4ca0c5 ADD %RAX,%RDX |
(3955) 0x4ca0c8 ADD %RCX,(%R13,%RDX,8) |
(3955) 0x4ca0cd CMP %R8,%R15 |
(3955) 0x4ca0d0 JE 4ca2b6 |
(3955) 0x4ca0d6 MOV (%R12),%RDI |
(3955) 0x4ca0da MOV %RDI,%RAX |
(3955) 0x4ca0dd IMUL %R8,%RAX |
(3955) 0x4ca0e1 DEC %RAX |
(3955) 0x4ca0e4 MOV %RAX,%RCX |
(3955) 0x4ca0e7 OR %R15,%RCX |
(3955) 0x4ca0ea SHR $0x20,%RCX |
(3955) 0x4ca0ee JE 4ca100 |
(3955) 0x4ca0f0 CQTO |
(3955) 0x4ca0f2 IDIV %R15 |
(3955) 0x4ca0f5 MOV %RDX,%RCX |
(3955) 0x4ca0f8 MOV %RAX,%RSI |
(3955) 0x4ca0fb JMP 4ca109 |
0x4ca0fd NOPL (%RAX) |
(3955) 0x4ca100 XOR %EDX,%EDX |
(3955) 0x4ca102 DIV %R15D |
(3955) 0x4ca105 MOV %EDX,%ECX |
(3955) 0x4ca107 MOV %EAX,%ESI |
(3955) 0x4ca109 INC %R8 |
(3955) 0x4ca10c MOV %RDI,%RAX |
(3955) 0x4ca10f IMUL %R8,%RAX |
(3955) 0x4ca113 DEC %RAX |
(3955) 0x4ca116 MOV %RAX,%RDX |
(3955) 0x4ca119 OR %R15,%RDX |
(3955) 0x4ca11c SHR $0x20,%RDX |
(3955) 0x4ca120 JNE 4ca0b0 |
(3955) 0x4ca122 XOR %EDX,%EDX |
(3955) 0x4ca124 DIV %R15D |
(3955) 0x4ca127 JMP 4ca0b5 |
0x4ca129 NOPL (%RAX) |
(3957) 0x4ca130 MOV %R8,%RAX |
(3957) 0x4ca133 CQTO |
(3957) 0x4ca135 IDIV %R15 |
(3957) 0x4ca138 IMUL %R9,%RDI |
(3957) 0x4ca13c ADD %RDI,%RSI |
(3957) 0x4ca13f MOV (%R13,%RSI,8),%RSI |
(3957) 0x4ca144 IMUL %R9,%RDX |
(3957) 0x4ca148 ADD %RAX,%RDX |
(3957) 0x4ca14b ADD %RSI,(%R13,%RDX,8) |
(3957) 0x4ca150 MOV (%R12),%R9 |
(3957) 0x4ca154 MOV %R11,%RAX |
(3957) 0x4ca157 IMUL %R9,%RAX |
(3957) 0x4ca15b ADD $0x5,%RCX |
(3957) 0x4ca15f CMP %RAX,%RCX |
(3957) 0x4ca162 MOV %R8,%RCX |
(3957) 0x4ca165 JGE 4ca040 |
(3957) 0x4ca16b LEA 0x1(%RCX),%RAX |
(3957) 0x4ca16f MOV %RAX,%RDX |
(3957) 0x4ca172 OR %R15,%RDX |
(3957) 0x4ca175 SHR $0x20,%RDX |
(3957) 0x4ca179 JE 4ca190 |
(3957) 0x4ca17b CQTO |
(3957) 0x4ca17d IDIV %R15 |
(3957) 0x4ca180 MOV %RDX,%RDI |
(3957) 0x4ca183 MOV %RAX,%RSI |
(3957) 0x4ca186 JMP 4ca199 |
0x4ca188 NOPL (%RAX,%RAX,1) |
(3957) 0x4ca190 XOR %EDX,%EDX |
(3957) 0x4ca192 DIV %R15D |
(3957) 0x4ca195 MOV %EDX,%EDI |
(3957) 0x4ca197 MOV %EAX,%ESI |
(3957) 0x4ca199 MOV %RCX,%RAX |
(3957) 0x4ca19c OR %R15,%RAX |
(3957) 0x4ca19f SHR $0x20,%RAX |
(3957) 0x4ca1a3 JE 4ca1b0 |
(3957) 0x4ca1a5 MOV %RCX,%RAX |
(3957) 0x4ca1a8 CQTO |
(3957) 0x4ca1aa IDIV %R15 |
(3957) 0x4ca1ad JMP 4ca1b7 |
0x4ca1af NOP |
(3957) 0x4ca1b0 MOV %ECX,%EAX |
(3957) 0x4ca1b2 XOR %EDX,%EDX |
(3957) 0x4ca1b4 DIV %R15D |
(3957) 0x4ca1b7 IMUL %R9,%RDX |
(3957) 0x4ca1bb ADD %RAX,%RDX |
(3957) 0x4ca1be MOV (%R13,%RDX,8),%RAX |
(3957) 0x4ca1c3 IMUL %RDI,%R9 |
(3957) 0x4ca1c7 ADD %RSI,%R9 |
(3957) 0x4ca1ca ADD %RAX,(%R13,%R9,8) |
(3957) 0x4ca1cf MOV (%R12),%R10 |
(3957) 0x4ca1d3 LEA 0x2(%RCX),%RAX |
(3957) 0x4ca1d7 MOV %R11,%RDX |
(3957) 0x4ca1da IMUL %R10,%RDX |
(3957) 0x4ca1de CMP %RDX,%RAX |
(3957) 0x4ca1e1 JGE 4ca040 |
(3957) 0x4ca1e7 MOV %RAX,%RDX |
(3957) 0x4ca1ea OR %R15,%RDX |
(3957) 0x4ca1ed SHR $0x20,%RDX |
(3957) 0x4ca1f1 JE 4ca200 |
(3957) 0x4ca1f3 CQTO |
(3957) 0x4ca1f5 IDIV %R15 |
(3957) 0x4ca1f8 MOV %RDX,%R9 |
(3957) 0x4ca1fb MOV %RAX,%R8 |
(3957) 0x4ca1fe JMP 4ca20b |
(3957) 0x4ca200 XOR %EDX,%EDX |
(3957) 0x4ca202 DIV %R15D |
(3957) 0x4ca205 MOV %EDX,%R9D |
(3957) 0x4ca208 MOV %EAX,%R8D |
(3957) 0x4ca20b IMUL %R10,%RDI |
(3957) 0x4ca20f ADD %RDI,%RSI |
(3957) 0x4ca212 MOV (%R13,%RSI,8),%RAX |
(3957) 0x4ca217 IMUL %R9,%R10 |
(3957) 0x4ca21b ADD %R8,%R10 |
(3957) 0x4ca21e ADD %RAX,(%R13,%R10,8) |
(3957) 0x4ca223 MOV (%R12),%R10 |
(3957) 0x4ca227 LEA 0x3(%RCX),%RAX |
(3957) 0x4ca22b MOV %R11,%RDX |
(3957) 0x4ca22e IMUL %R10,%RDX |
(3957) 0x4ca232 CMP %RDX,%RAX |
(3957) 0x4ca235 JGE 4ca040 |
(3957) 0x4ca23b MOV %RAX,%RDX |
(3957) 0x4ca23e OR %R15,%RDX |
(3957) 0x4ca241 SHR $0x20,%RDX |
(3957) 0x4ca245 JE 4ca260 |
(3957) 0x4ca247 CQTO |
(3957) 0x4ca249 IDIV %R15 |
(3957) 0x4ca24c MOV %RDX,%RDI |
(3957) 0x4ca24f MOV %RAX,%RSI |
(3957) 0x4ca252 JMP 4ca269 |
0x4ca254 NOPW %CS:(%RAX,%RAX,1) |
(3957) 0x4ca260 XOR %EDX,%EDX |
(3957) 0x4ca262 DIV %R15D |
(3957) 0x4ca265 MOV %EDX,%EDI |
(3957) 0x4ca267 MOV %EAX,%ESI |
(3957) 0x4ca269 IMUL %R10,%R9 |
(3957) 0x4ca26d ADD %R9,%R8 |
(3957) 0x4ca270 MOV (%R13,%R8,8),%RAX |
(3957) 0x4ca275 IMUL %RDI,%R10 |
(3957) 0x4ca279 ADD %RSI,%R10 |
(3957) 0x4ca27c ADD %RAX,(%R13,%R10,8) |
(3957) 0x4ca281 MOV (%R12),%R9 |
(3957) 0x4ca285 LEA 0x4(%RCX),%R8 |
(3957) 0x4ca289 MOV %R11,%RAX |
(3957) 0x4ca28c IMUL %R9,%RAX |
(3957) 0x4ca290 CMP %RAX,%R8 |
(3957) 0x4ca293 JGE 4ca040 |
(3957) 0x4ca299 MOV %R8,%RAX |
(3957) 0x4ca29c OR %R15,%RAX |
(3957) 0x4ca29f SHR $0x20,%RAX |
(3957) 0x4ca2a3 JNE 4ca130 |
(3957) 0x4ca2a9 MOV %R8D,%EAX |
(3957) 0x4ca2ac XOR %EDX,%EDX |
(3957) 0x4ca2ae DIV %R15D |
(3957) 0x4ca2b1 JMP 4ca138 |
0x4ca2b6 MOV (%R9),%ESI |
0x4ca2b9 MOV $0x719b10,%EDI |
0x4ca2be CALL 40fe60 <__kmpc_end_masked@plt> |
0x4ca2c3 MOV -0x30(%RBP),%RAX |
0x4ca2c7 MOV (%RAX),%ESI |
0x4ca2c9 MOV $0x719b30,%EDI |
0x4ca2ce CALL 40fed0 <__kmpc_barrier@plt> |
0x4ca2d3 TEST %R14,%R14 |
0x4ca2d6 MOV -0x58(%RBP),%R8 |
0x4ca2da JLE 4ca452 |
0x4ca2e0 MOV (%R12),%RDI |
0x4ca2e4 MOV %R14,%RCX |
0x4ca2e7 IMUL %RDI,%RCX |
0x4ca2eb LEA -0x1(%RCX),%RAX |
0x4ca2ef MOV %RAX,%RDX |
0x4ca2f2 OR %R15,%RDX |
0x4ca2f5 SHR $0x20,%RDX |
0x4ca2f9 JE 4ca302 |
0x4ca2fb CQTO |
0x4ca2fd IDIV %R15 |
0x4ca300 JMP 4ca307 |
0x4ca302 XOR %EDX,%EDX |
0x4ca304 DIV %R15D |
0x4ca307 MOV %RDI,%RSI |
0x4ca30a IMUL %R8,%RSI |
0x4ca30e DEC %RSI |
0x4ca311 CMP %RSI,%RCX |
0x4ca314 JGE 4ca452 |
0x4ca31a IMUL %RDI,%RDX |
0x4ca31e ADD %RAX,%RDX |
0x4ca321 MOV (%R13,%RDX,8),%RSI |
0x4ca326 JMP 4ca35c |
0x4ca328 NOPL (%RAX,%RAX,1) |
(3954) 0x4ca330 CQTO |
(3954) 0x4ca332 IDIV %R15 |
(3954) 0x4ca335 IMUL %RDX,%RDI |
(3954) 0x4ca339 ADD %RAX,%RDI |
(3954) 0x4ca33c ADD %RSI,(%R13,%RDI,8) |
(3954) 0x4ca341 MOV (%R12),%RDI |
(3954) 0x4ca345 MOV %R8,%RAX |
(3954) 0x4ca348 IMUL %RDI,%RAX |
(3954) 0x4ca34c DEC %RAX |
(3954) 0x4ca34f ADD $0x4,%RCX |
(3954) 0x4ca353 CMP %RAX,%RCX |
(3954) 0x4ca356 JGE 4ca452 |
(3954) 0x4ca35c MOV %RCX,%RAX |
(3954) 0x4ca35f OR %R15,%RAX |
(3954) 0x4ca362 SHR $0x20,%RAX |
(3954) 0x4ca366 JE 4ca380 |
(3954) 0x4ca368 MOV %RCX,%RAX |
(3954) 0x4ca36b CQTO |
(3954) 0x4ca36d IDIV %R15 |
(3954) 0x4ca370 JMP 4ca387 |
0x4ca372 NOPW %CS:(%RAX,%RAX,1) |
(3954) 0x4ca380 MOV %ECX,%EAX |
(3954) 0x4ca382 XOR %EDX,%EDX |
(3954) 0x4ca384 DIV %R15D |
(3954) 0x4ca387 IMUL %RDX,%RDI |
(3954) 0x4ca38b ADD %RAX,%RDI |
(3954) 0x4ca38e ADD %RSI,(%R13,%RDI,8) |
(3954) 0x4ca393 MOV (%R12),%RDI |
(3954) 0x4ca397 LEA 0x1(%RCX),%RAX |
(3954) 0x4ca39b MOV %R8,%RDX |
(3954) 0x4ca39e IMUL %RDI,%RDX |
(3954) 0x4ca3a2 DEC %RDX |
(3954) 0x4ca3a5 CMP %RDX,%RAX |
(3954) 0x4ca3a8 JGE 4ca452 |
(3954) 0x4ca3ae MOV %RAX,%RDX |
(3954) 0x4ca3b1 OR %R15,%RDX |
(3954) 0x4ca3b4 SHR $0x20,%RDX |
(3954) 0x4ca3b8 JE 4ca3d0 |
(3954) 0x4ca3ba CQTO |
(3954) 0x4ca3bc IDIV %R15 |
(3954) 0x4ca3bf JMP 4ca3d5 |
0x4ca3c1 NOPW %CS:(%RAX,%RAX,1) |
(3954) 0x4ca3d0 XOR %EDX,%EDX |
(3954) 0x4ca3d2 DIV %R15D |
(3954) 0x4ca3d5 IMUL %RDX,%RDI |
(3954) 0x4ca3d9 ADD %RAX,%RDI |
(3954) 0x4ca3dc ADD %RSI,(%R13,%RDI,8) |
(3954) 0x4ca3e1 MOV (%R12),%RDI |
(3954) 0x4ca3e5 LEA 0x2(%RCX),%RAX |
(3954) 0x4ca3e9 MOV %R8,%RDX |
(3954) 0x4ca3ec IMUL %RDI,%RDX |
(3954) 0x4ca3f0 DEC %RDX |
(3954) 0x4ca3f3 CMP %RDX,%RAX |
(3954) 0x4ca3f6 JGE 4ca452 |
(3954) 0x4ca3f8 MOV %RAX,%RDX |
(3954) 0x4ca3fb OR %R15,%RDX |
(3954) 0x4ca3fe SHR $0x20,%RDX |
(3954) 0x4ca402 JE 4ca410 |
(3954) 0x4ca404 CQTO |
(3954) 0x4ca406 IDIV %R15 |
(3954) 0x4ca409 JMP 4ca415 |
0x4ca40b NOPL (%RAX,%RAX,1) |
(3954) 0x4ca410 XOR %EDX,%EDX |
(3954) 0x4ca412 DIV %R15D |
(3954) 0x4ca415 IMUL %RDX,%RDI |
(3954) 0x4ca419 ADD %RAX,%RDI |
(3954) 0x4ca41c ADD %RSI,(%R13,%RDI,8) |
(3954) 0x4ca421 MOV (%R12),%RDI |
(3954) 0x4ca425 LEA 0x3(%RCX),%RAX |
(3954) 0x4ca429 MOV %R8,%RDX |
(3954) 0x4ca42c IMUL %RDI,%RDX |
(3954) 0x4ca430 DEC %RDX |
(3954) 0x4ca433 CMP %RDX,%RAX |
(3954) 0x4ca436 JGE 4ca452 |
(3954) 0x4ca438 MOV %RAX,%RDX |
(3954) 0x4ca43b OR %R15,%RDX |
(3954) 0x4ca43e SHR $0x20,%RDX |
(3954) 0x4ca442 JNE 4ca330 |
(3954) 0x4ca448 XOR %EDX,%EDX |
(3954) 0x4ca44a DIV %R15D |
(3954) 0x4ca44d JMP 4ca335 |
0x4ca452 MOV 0x30(%RBP),%R15 |
0x4ca456 MOV -0x30(%RBP),%RAX |
0x4ca45a MOV (%RAX),%ESI |
0x4ca45c MOV $0x719b50,%EDI |
0x4ca461 CALL 40fed0 <__kmpc_barrier@plt> |
0x4ca466 CMPQ $0,-0x60(%RBP) |
0x4ca46b JE 4ca4ad |
0x4ca46d MOV -0x40(%RBP),%R9 |
0x4ca471 MOV -0x38(%RBP),%RSI |
0x4ca475 CMP %R9,%RSI |
0x4ca478 MOV 0x10(%RBP),%R10 |
0x4ca47c MOV -0x50(%RBP),%R11 |
0x4ca480 JLE 4ca899 |
0x4ca486 MOV 0x28(%RBP),%RAX |
0x4ca48a MOV (%RBX,%RSI,8),%RDX |
0x4ca48e MOV %ESI,%ECX |
0x4ca490 SUB %R9D,%ECX |
0x4ca493 LEA 0x1(%R9),%R8 |
0x4ca497 TEST $0x1,%CL |
0x4ca49a JNE 4ca4e0 |
0x4ca49c MOV %RSI,%RCX |
0x4ca49f CMP %R8,%RSI |
0x4ca4a2 JNE 4ca8b5 |
0x4ca4a8 JMP 4ca899 |
0x4ca4ad MOV -0x40(%RBP),%R8 |
0x4ca4b1 MOV -0x38(%RBP),%R10 |
0x4ca4b5 CMP %R8,%R10 |
0x4ca4b8 MOV 0x10(%RBP),%R9 |
0x4ca4bc JLE 4ca899 |
0x4ca4c2 MOV (%RBX,%R10,8),%RCX |
0x4ca4c6 MOV %R10D,%EAX |
0x4ca4c9 SUB %R8D,%EAX |
0x4ca4cc LEA 0x1(%R8),%RDX |
0x4ca4d0 TEST $0x1,%AL |
0x4ca4d2 JNE 4ca78c |
0x4ca4d8 MOV %R10,%RAX |
0x4ca4db JMP 4ca7ce |
0x4ca4e0 LEA -0x1(%RSI),%RCX |
0x4ca4e4 MOV -0x8(%RBX,%RSI,8),%RDI |
0x4ca4e9 CMP %RDI,%RDX |
0x4ca4ec JLE 4ca88d |
0x4ca4f2 MOV %R8,-0x30(%RBP) |
0x4ca4f6 MOV -0x38(%RBP),%RSI |
0x4ca4fa NOPW (%RAX,%RAX,1) |
(3953) 0x4ca500 MOV -0x8(%R10,%RDX,8),%RDI |
(3953) 0x4ca505 MOV (%R12),%R8 |
(3953) 0x4ca509 IMUL %R14,%R8 |
(3953) 0x4ca50d ADD %RDI,%R8 |
(3953) 0x4ca510 LEA (%R13,%R8,8),%R8 |
(3953) 0x4ca515 DECQ (%R8) |
(3953) 0x4ca518 MOV (%R12),%R8 |
(3953) 0x4ca51c IMUL %R14,%R8 |
(3953) 0x4ca520 ADD %RDI,%R8 |
(3953) 0x4ca523 VMOVSD -0x8(%R11,%RDX,8),%XMM0 |
(3953) 0x4ca52a DEC %RDX |
(3953) 0x4ca52d MOV (%R13,%R8,8),%RDI |
(3953) 0x4ca532 VMOVSD %XMM0,(%RAX,%RDI,8) |
(3953) 0x4ca537 MOV %RCX,(%R15,%RDI,8) |
(3953) 0x4ca53b MOV -0x8(%RBX,%RSI,8),%RDI |
(3953) 0x4ca540 CMP %RDI,%RDX |
(3953) 0x4ca543 JG 4ca500 |
0x4ca545 MOV %RDI,%RDX |
0x4ca548 MOV -0x30(%RBP),%R8 |
0x4ca54c CMP %R8,%RSI |
0x4ca54f JNE 4ca8b5 |
0x4ca555 JMP 4ca899 |
0x4ca55a MOV -0x48(%RBP),%R8 |
0x4ca55e SHR $0x2,%R8 |
0x4ca562 XOR %R9D,%R9D |
0x4ca565 JMP 4ca599 |
0x4ca567 NOPW (%RAX,%RAX,1) |
(3956) 0x4ca570 CQTO |
(3956) 0x4ca572 IDIV %R15 |
(3956) 0x4ca575 IMUL %R10,%RCX |
(3956) 0x4ca579 ADD %RSI,%RCX |
(3956) 0x4ca57c MOV (%R13,%RCX,8),%RCX |
(3956) 0x4ca581 IMUL %R10,%RDX |
(3956) 0x4ca585 ADD %RAX,%RDX |
(3956) 0x4ca588 ADD %RCX,(%R13,%RDX,8) |
(3956) 0x4ca58d INC %R9 |
(3956) 0x4ca590 CMP %R9,%R8 |
(3956) 0x4ca593 JE 4ca08f |
(3956) 0x4ca599 MOV (%R12),%R10 |
(3956) 0x4ca59d MOV %R10,%R11 |
(3956) 0x4ca5a0 IMUL %R9,%R11 |
(3956) 0x4ca5a4 LEA -0x1(%R10,%R11,4),%RAX |
(3956) 0x4ca5a9 MOV %RAX,%RCX |
(3956) 0x4ca5ac OR %R15,%RCX |
(3956) 0x4ca5af SHR $0x20,%RCX |
(3956) 0x4ca5b3 JE 4ca5d0 |
(3956) 0x4ca5b5 CQTO |
(3956) 0x4ca5b7 IDIV %R15 |
(3956) 0x4ca5ba MOV %RDX,%RCX |
(3956) 0x4ca5bd MOV %RAX,%RSI |
(3956) 0x4ca5c0 JMP 4ca5d9 |
0x4ca5c2 NOPW %CS:(%RAX,%RAX,1) |
(3956) 0x4ca5d0 XOR %EDX,%EDX |
(3956) 0x4ca5d2 DIV %R15D |
(3956) 0x4ca5d5 MOV %EDX,%ECX |
(3956) 0x4ca5d7 MOV %EAX,%ESI |
(3956) 0x4ca5d9 SAL $0x2,%R11 |
(3956) 0x4ca5dd LEA -0x1(%R11,%R10,2),%RAX |
(3956) 0x4ca5e2 MOV %RAX,%RDX |
(3956) 0x4ca5e5 OR %R15,%RDX |
(3956) 0x4ca5e8 SHR $0x20,%RDX |
(3956) 0x4ca5ec JE 4ca600 |
(3956) 0x4ca5ee CQTO |
(3956) 0x4ca5f0 IDIV %R15 |
(3956) 0x4ca5f3 JMP 4ca605 |
0x4ca5f5 NOPW %CS:(%RAX,%RAX,1) |
(3956) 0x4ca600 XOR %EDX,%EDX |
(3956) 0x4ca602 DIV %R15D |
(3956) 0x4ca605 IMUL %R10,%RCX |
(3956) 0x4ca609 ADD %RSI,%RCX |
(3956) 0x4ca60c MOV (%R13,%RCX,8),%RCX |
(3956) 0x4ca611 IMUL %R10,%RDX |
(3956) 0x4ca615 ADD %RAX,%RDX |
(3956) 0x4ca618 ADD %RCX,(%R13,%RDX,8) |
(3956) 0x4ca61d MOV (%R12),%R10 |
(3956) 0x4ca621 MOV %R10,%R11 |
(3956) 0x4ca624 IMUL %R9,%R11 |
(3956) 0x4ca628 SAL $0x2,%R11 |
(3956) 0x4ca62c LEA -0x1(%R11,%R10,2),%RAX |
(3956) 0x4ca631 MOV %RAX,%RCX |
(3956) 0x4ca634 OR %R15,%RCX |
(3956) 0x4ca637 SHR $0x20,%RCX |
(3956) 0x4ca63b JE 4ca650 |
(3956) 0x4ca63d CQTO |
(3956) 0x4ca63f IDIV %R15 |
(3956) 0x4ca642 MOV %RDX,%RCX |
(3956) 0x4ca645 MOV %RAX,%RSI |
(3956) 0x4ca648 JMP 4ca659 |
0x4ca64a NOPW (%RAX,%RAX,1) |
(3956) 0x4ca650 XOR %EDX,%EDX |
(3956) 0x4ca652 DIV %R15D |
(3956) 0x4ca655 MOV %EDX,%ECX |
(3956) 0x4ca657 MOV %EAX,%ESI |
(3956) 0x4ca659 LEA (%R10,%R10,2),%RAX |
(3956) 0x4ca65d LEA -0x1(%R11,%RAX,1),%RAX |
(3956) 0x4ca662 MOV %RAX,%RDX |
(3956) 0x4ca665 OR %R15,%RDX |
(3956) 0x4ca668 SHR $0x20,%RDX |
(3956) 0x4ca66c JE 4ca680 |
(3956) 0x4ca66e CQTO |
(3956) 0x4ca670 IDIV %R15 |
(3956) 0x4ca673 JMP 4ca685 |
0x4ca675 NOPW %CS:(%RAX,%RAX,1) |
(3956) 0x4ca680 XOR %EDX,%EDX |
(3956) 0x4ca682 DIV %R15D |
(3956) 0x4ca685 IMUL %R10,%RCX |
(3956) 0x4ca689 ADD %RSI,%RCX |
(3956) 0x4ca68c MOV (%R13,%RCX,8),%RCX |
(3956) 0x4ca691 IMUL %R10,%RDX |
(3956) 0x4ca695 ADD %RAX,%RDX |
(3956) 0x4ca698 ADD %RCX,(%R13,%RDX,8) |
(3956) 0x4ca69d MOV (%R12),%R10 |
(3956) 0x4ca6a1 LEA (%R10,%R10,2),%RAX |
(3956) 0x4ca6a5 LEA (,%R10,4),%RDI |
(3956) 0x4ca6ad MOV %RDI,%R11 |
(3956) 0x4ca6b0 IMUL %R9,%R11 |
(3956) 0x4ca6b4 LEA -0x1(%R11,%RAX,1),%RAX |
(3956) 0x4ca6b9 MOV %RAX,%RCX |
(3956) 0x4ca6bc OR %R15,%RCX |
(3956) 0x4ca6bf SHR $0x20,%RCX |
(3956) 0x4ca6c3 JE 4ca6e0 |
(3956) 0x4ca6c5 CQTO |
(3956) 0x4ca6c7 IDIV %R15 |
(3956) 0x4ca6ca MOV %RDX,%RCX |
(3956) 0x4ca6cd MOV %RAX,%RSI |
(3956) 0x4ca6d0 JMP 4ca6e9 |
0x4ca6d2 NOPW %CS:(%RAX,%RAX,1) |
(3956) 0x4ca6e0 XOR %EDX,%EDX |
(3956) 0x4ca6e2 DIV %R15D |
(3956) 0x4ca6e5 MOV %EDX,%ECX |
(3956) 0x4ca6e7 MOV %EAX,%ESI |
(3956) 0x4ca6e9 LEA -0x1(%RDI,%R11,1),%RAX |
(3956) 0x4ca6ee MOV %RAX,%RDX |
(3956) 0x4ca6f1 OR %R15,%RDX |
(3956) 0x4ca6f4 SHR $0x20,%RDX |
(3956) 0x4ca6f8 JE 4ca710 |
(3956) 0x4ca6fa CQTO |
(3956) 0x4ca6fc IDIV %R15 |
(3956) 0x4ca6ff JMP 4ca715 |
0x4ca701 NOPW %CS:(%RAX,%RAX,1) |
(3956) 0x4ca710 XOR %EDX,%EDX |
(3956) 0x4ca712 DIV %R15D |
(3956) 0x4ca715 IMUL %R10,%RCX |
(3956) 0x4ca719 ADD %RSI,%RCX |
(3956) 0x4ca71c MOV (%R13,%RCX,8),%RCX |
(3956) 0x4ca721 IMUL %R10,%RDX |
(3956) 0x4ca725 ADD %RAX,%RDX |
(3956) 0x4ca728 ADD %RCX,(%R13,%RDX,8) |
(3956) 0x4ca72d MOV (%R12),%R10 |
(3956) 0x4ca731 LEA (,%R10,4),%R11 |
(3956) 0x4ca739 IMUL %R9,%R11 |
(3956) 0x4ca73d LEA -0x1(%R11,%R10,4),%RAX |
(3956) 0x4ca742 MOV %RAX,%RCX |
(3956) 0x4ca745 OR %R15,%RCX |
(3956) 0x4ca748 SHR $0x20,%RCX |
(3956) 0x4ca74c JE 4ca760 |
(3956) 0x4ca74e CQTO |
(3956) 0x4ca750 IDIV %R15 |
(3956) 0x4ca753 MOV %RDX,%RCX |
(3956) 0x4ca756 MOV %RAX,%RSI |
(3956) 0x4ca759 JMP 4ca769 |
0x4ca75b NOPL (%RAX,%RAX,1) |
(3956) 0x4ca760 XOR %EDX,%EDX |
(3956) 0x4ca762 DIV %R15D |
(3956) 0x4ca765 MOV %EDX,%ECX |
(3956) 0x4ca767 MOV %EAX,%ESI |
(3956) 0x4ca769 LEA (%R10,%R10,4),%RAX |
(3956) 0x4ca76d LEA -0x1(%R11,%RAX,1),%RAX |
(3956) 0x4ca772 MOV %RAX,%RDX |
(3956) 0x4ca775 OR %R15,%RDX |
(3956) 0x4ca778 SHR $0x20,%RDX |
(3956) 0x4ca77c JNE 4ca570 |
(3956) 0x4ca782 XOR %EDX,%EDX |
(3956) 0x4ca784 DIV %R15D |
(3956) 0x4ca787 JMP 4ca575 |
0x4ca78c LEA -0x1(%R10),%RAX |
(3949) 0x4ca790 MOV -0x8(%RBX,%R10,8),%RSI |
(3949) 0x4ca795 CMP %RSI,%RCX |
(3949) 0x4ca798 JLE 4ca7cb |
(3949) 0x4ca79a MOV -0x8(%R9,%RCX,8),%RSI |
(3949) 0x4ca79f DEC %RCX |
(3949) 0x4ca7a2 MOV (%R12),%RDI |
(3949) 0x4ca7a6 IMUL %R14,%RDI |
(3949) 0x4ca7aa ADD %RSI,%RDI |
(3949) 0x4ca7ad LEA (%R13,%RDI,8),%RDI |
(3949) 0x4ca7b2 DECQ (%RDI) |
(3949) 0x4ca7b5 MOV (%R12),%RDI |
(3949) 0x4ca7b9 IMUL %R14,%RDI |
(3949) 0x4ca7bd ADD %RSI,%RDI |
(3949) 0x4ca7c0 MOV (%R13,%RDI,8),%RSI |
(3949) 0x4ca7c5 MOV %RAX,(%R15,%RSI,8) |
(3949) 0x4ca7c9 JMP 4ca790 |
0x4ca7cb MOV %RSI,%RCX |
0x4ca7ce CMP %RDX,%R10 |
0x4ca7d1 JNE 4ca7e9 |
0x4ca7d3 JMP 4ca899 |
0x4ca7d8 NOPL (%RAX,%RAX,1) |
(3946) 0x4ca7e0 CMP %R8,%RAX |
(3946) 0x4ca7e3 JLE 4ca899 |
(3946) 0x4ca7e9 MOV -0x8(%RBX,%RAX,8),%RDX |
(3946) 0x4ca7ee CMP %RDX,%RCX |
(3946) 0x4ca7f1 JLE 4ca839 |
(3946) 0x4ca7f3 LEA -0x1(%RAX),%RSI |
(3946) 0x4ca7f7 NOPW (%RAX,%RAX,1) |
(3948) 0x4ca800 MOV -0x8(%R9,%RCX,8),%RDX |
(3948) 0x4ca805 DEC %RCX |
(3948) 0x4ca808 MOV (%R12),%RDI |
(3948) 0x4ca80c IMUL %R14,%RDI |
(3948) 0x4ca810 ADD %RDX,%RDI |
(3948) 0x4ca813 LEA (%R13,%RDI,8),%RDI |
(3948) 0x4ca818 DECQ (%RDI) |
(3948) 0x4ca81b MOV (%R12),%RDI |
(3948) 0x4ca81f IMUL %R14,%RDI |
(3948) 0x4ca823 ADD %RDX,%RDI |
(3948) 0x4ca826 MOV (%R13,%RDI,8),%RDX |
(3948) 0x4ca82b MOV %RSI,(%R15,%RDX,8) |
(3948) 0x4ca82f MOV -0x8(%RBX,%RAX,8),%RDX |
(3948) 0x4ca834 CMP %RDX,%RCX |
(3948) 0x4ca837 JG 4ca800 |
(3946) 0x4ca839 MOV -0x10(%RBX,%RAX,8),%RCX |
(3946) 0x4ca83e ADD $-0x2,%RAX |
(3946) 0x4ca842 CMP %RCX,%RDX |
(3946) 0x4ca845 JLE 4ca7e0 |
(3946) 0x4ca847 NOPW (%RAX,%RAX,1) |
(3947) 0x4ca850 MOV -0x8(%R9,%RDX,8),%RCX |
(3947) 0x4ca855 DEC %RDX |
(3947) 0x4ca858 MOV (%R12),%RSI |
(3947) 0x4ca85c IMUL %R14,%RSI |
(3947) 0x4ca860 ADD %RCX,%RSI |
(3947) 0x4ca863 LEA (%R13,%RSI,8),%RSI |
(3947) 0x4ca868 DECQ (%RSI) |
(3947) 0x4ca86b MOV (%R12),%RSI |
(3947) 0x4ca86f IMUL %R14,%RSI |
(3947) 0x4ca873 ADD %RCX,%RSI |
(3947) 0x4ca876 MOV (%R13,%RSI,8),%RCX |
(3947) 0x4ca87b MOV %RAX,(%R15,%RCX,8) |
(3947) 0x4ca87f MOV (%RBX,%RAX,8),%RCX |
(3947) 0x4ca883 CMP %RCX,%RDX |
(3947) 0x4ca886 JG 4ca850 |
(3946) 0x4ca888 JMP 4ca7e0 |
0x4ca88d MOV %RDI,%RDX |
0x4ca890 MOV -0x38(%RBP),%RSI |
0x4ca894 CMP %R8,%RSI |
0x4ca897 JNE 4ca8b5 |
0x4ca899 ADD $0x38,%RSP |
0x4ca89d POP %RBX |
0x4ca89e POP %R12 |
0x4ca8a0 POP %R13 |
0x4ca8a2 POP %R14 |
0x4ca8a4 POP %R15 |
0x4ca8a6 POP %RBP |
0x4ca8a7 RET |
0x4ca8a8 NOPL (%RAX,%RAX,1) |
(3950) 0x4ca8b0 CMP %R9,%RCX |
(3950) 0x4ca8b3 JLE 4ca899 |
(3950) 0x4ca8b5 MOV -0x8(%RBX,%RCX,8),%RSI |
(3950) 0x4ca8ba CMP %RSI,%RDX |
(3950) 0x4ca8bd JLE 4ca915 |
(3950) 0x4ca8bf LEA -0x1(%RCX),%RDI |
(3950) 0x4ca8c3 NOPW %CS:(%RAX,%RAX,1) |
(3952) 0x4ca8d0 MOV -0x8(%R10,%RDX,8),%RSI |
(3952) 0x4ca8d5 MOV (%R12),%R8 |
(3952) 0x4ca8d9 IMUL %R14,%R8 |
(3952) 0x4ca8dd ADD %RSI,%R8 |
(3952) 0x4ca8e0 LEA (%R13,%R8,8),%R8 |
(3952) 0x4ca8e5 DECQ (%R8) |
(3952) 0x4ca8e8 MOV (%R12),%R8 |
(3952) 0x4ca8ec IMUL %R14,%R8 |
(3952) 0x4ca8f0 ADD %RSI,%R8 |
(3952) 0x4ca8f3 VMOVSD -0x8(%R11,%RDX,8),%XMM0 |
(3952) 0x4ca8fa DEC %RDX |
(3952) 0x4ca8fd MOV (%R13,%R8,8),%RSI |
(3952) 0x4ca902 VMOVSD %XMM0,(%RAX,%RSI,8) |
(3952) 0x4ca907 MOV %RDI,(%R15,%RSI,8) |
(3952) 0x4ca90b MOV -0x8(%RBX,%RCX,8),%RSI |
(3952) 0x4ca910 CMP %RSI,%RDX |
(3952) 0x4ca913 JG 4ca8d0 |
(3950) 0x4ca915 MOV -0x10(%RBX,%RCX,8),%RDX |
(3950) 0x4ca91a ADD $-0x2,%RCX |
(3950) 0x4ca91e CMP %RDX,%RSI |
(3950) 0x4ca921 JLE 4ca8b0 |
(3950) 0x4ca923 NOPW %CS:(%RAX,%RAX,1) |
(3951) 0x4ca930 MOV -0x8(%R10,%RSI,8),%RDX |
(3951) 0x4ca935 MOV (%R12),%RDI |
(3951) 0x4ca939 IMUL %R14,%RDI |
(3951) 0x4ca93d ADD %RDX,%RDI |
(3951) 0x4ca940 LEA (%R13,%RDI,8),%RDI |
(3951) 0x4ca945 DECQ (%RDI) |
(3951) 0x4ca948 MOV (%R12),%RDI |
(3951) 0x4ca94c IMUL %R14,%RDI |
(3951) 0x4ca950 ADD %RDX,%RDI |
(3951) 0x4ca953 VMOVSD -0x8(%R11,%RSI,8),%XMM0 |
(3951) 0x4ca95a DEC %RSI |
(3951) 0x4ca95d MOV (%R13,%RDI,8),%RDX |
(3951) 0x4ca962 VMOVSD %XMM0,(%RAX,%RDX,8) |
(3951) 0x4ca967 MOV %RCX,(%R15,%RDX,8) |
(3951) 0x4ca96b MOV (%RBX,%RCX,8),%RDX |
(3951) 0x4ca96f CMP %RDX,%RSI |
(3951) 0x4ca972 JG 4ca930 |
(3950) 0x4ca974 JMP 4ca8b0 |
0x4ca979 NOPL (%RAX) |
Path / |
Source file and lines | csr_matop.c:380-560 |
Module | exec |
nb instructions | 251 |
nb uops | 275 |
loop length | 1046 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 13 |
micro-operation queue | 46.00 cycles |
front end | 46.00 cycles |
 | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 18.10 | 18.00 | 19.00 | 19.00 | 15.50 | 18.00 | 17.90 | 15.50 | 15.50 | 15.50 | 18.00 | 19.00 |
cycles | 18.10 | 21.80 | 19.00 | 19.00 | 15.50 | 18.00 | 17.90 | 15.50 | 15.50 | 15.50 | 18.00 | 19.00 |
Cycles executing div or sqrt instructions | 16.00 |
FE+BE cycles | 42.88-42.92 |
Stall cycles | 0.00 |
Front-end | 46.00 |
Dispatch | 21.80 |
DIV/SQRT | 16.00 |
Overall L1 | 46.00 |
Vectorization ratios |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 0% |
Vector efficiency ratios |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 10% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x38,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R8,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 4d7300 <hypre_NumActiveThreads> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4d7310 <hypre_GetThreadNum> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4cbd60 <hypre_CSRMatrixGetLoadBalancedPartitionBegin> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4cbde0 <hypre_CSRMatrixGetLoadBalancedPartitionEnd> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R12,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4c9f2f <hypre_CSRMatrixTranspose.extracted+0x8f> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x250d00(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4f4525,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4f653b,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d58d0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4f64b4,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1d7,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d8210 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x38(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x40(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4c9f3d <hypre_CSRMatrixTranspose.extracted+0x9d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RAX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4c9f75 <hypre_CSRMatrixTranspose.extracted+0xd5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x250cbc(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4f4525,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4f654a,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d58d0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4f64b4,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1d8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d8210 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x38(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RCX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4c9f87 <hypre_CSRMatrixTranspose.extracted+0xe7> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4c9fb5 <hypre_CSRMatrixTranspose.extracted+0x115> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x250c72(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4f4525,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4f656d,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d58d0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4f64b4,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1d9,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d8210 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%R12),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%R13,%RAX,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4e0430 <__intel_avx_rep_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x38(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX,%RAX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP (%RBX,%RSI,8),%RAX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JGE 4ca00d <hypre_CSRMatrixTranspose.extracted+0x16d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x719ab0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 40fed0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%R12),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA 0x1(%R14),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x1(%RCX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R9,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R11,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 4ca16b <hypre_CSRMatrixTranspose.extracted+0x2cb> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R11,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x719ad0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 40fed0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x719af0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 410040 <__kmpc_masked@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
CMP $0x1,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4ca2c3 <hypre_CSRMatrixTranspose.extracted+0x423> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP $0x1,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x30(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4ca2b6 <hypre_CSRMatrixTranspose.extracted+0x416> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%R15),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP $0x4,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 4ca55a <hypre_CSRMatrixTranspose.extracted+0x6ba> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RAX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x30(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JAE 4ca2b6 <hypre_CSRMatrixTranspose.extracted+0x416> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INC %R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 4ca0d6 <hypre_CSRMatrixTranspose.extracted+0x236> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV (%R9),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x719b10,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 40fe60 <__kmpc_end_masked@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x719b30,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 40fed0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV -0x58(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4ca452 <hypre_CSRMatrixTranspose.extracted+0x5b2> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %RDI,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA -0x1(%RCX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %R15,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE 4ca302 <hypre_CSRMatrixTranspose.extracted+0x462> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %R15 | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
JMP 4ca307 <hypre_CSRMatrixTranspose.extracted+0x467> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %R15D | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV %RDI,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R8,%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
DEC %RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RSI,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4ca452 <hypre_CSRMatrixTranspose.extracted+0x5b2> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
IMUL %RDI,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RAX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV (%R13,%RDX,8),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4ca35c <hypre_CSRMatrixTranspose.extracted+0x4bc> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x30(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x719b50,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 40fed0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
CMPQ $0,-0x60(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 4ca4ad <hypre_CSRMatrixTranspose.extracted+0x60d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x40(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R9,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x10(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x50(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4ca899 <hypre_CSRMatrixTranspose.extracted+0x9f9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x28(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX,%RSI,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %ESI,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R9D,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA 0x1(%R9),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST $0x1,%CL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 4ca4e0 <hypre_CSRMatrixTranspose.extracted+0x640> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RSI,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %R8,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4ca8b5 <hypre_CSRMatrixTranspose.extracted+0xa15> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4ca899 <hypre_CSRMatrixTranspose.extracted+0x9f9> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x40(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R8,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x10(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4ca899 <hypre_CSRMatrixTranspose.extracted+0x9f9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%RBX,%R10,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R10D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R8D,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA 0x1(%R8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST $0x1,%AL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 4ca78c <hypre_CSRMatrixTranspose.extracted+0x8ec> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R10,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 4ca7ce <hypre_CSRMatrixTranspose.extracted+0x92e> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
LEA -0x1(%RSI),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x8(%RBX,%RSI,8),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDI,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4ca88d <hypre_CSRMatrixTranspose.extracted+0x9ed> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R8,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x38(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x30(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R8,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4ca8b5 <hypre_CSRMatrixTranspose.extracted+0xa15> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4ca899 <hypre_CSRMatrixTranspose.extracted+0x9f9> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x48(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SHR $0x2,%R8 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4ca599 <hypre_CSRMatrixTranspose.extracted+0x6f9> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x1(%R10),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RDX,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4ca7e9 <hypre_CSRMatrixTranspose.extracted+0x949> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4ca899 <hypre_CSRMatrixTranspose.extracted+0x9f9> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x38(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R8,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4ca8b5 <hypre_CSRMatrixTranspose.extracted+0xa15> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x38,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | csr_matop.c:380-560 |
Module | exec |
nb instructions | 251 |
nb uops | 275 |
loop length | 1046 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 13 |
micro-operation queue | 46.00 cycles |
front end | 46.00 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 18.10 | 18.00 | 19.00 | 19.00 | 15.50 | 18.00 | 17.90 | 15.50 | 15.50 | 15.50 | 18.00 | 19.00 |
cycles | 18.10 | 21.80 | 19.00 | 19.00 | 15.50 | 18.00 | 17.90 | 15.50 | 15.50 | 15.50 | 18.00 | 19.00 |
Cycles executing div or sqrt instructions | 16.00 |
FE+BE cycles | 42.88-42.92 |
Stall cycles | 0.00 |
Front-end | 46.00 |
Dispatch | 21.80 |
DIV/SQRT | 16.00 |
Overall L1 | 46.00 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 0% |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 10% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x38,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R8,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 4d7300 <hypre_NumActiveThreads> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4d7310 <hypre_GetThreadNum> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4cbd60 <hypre_CSRMatrixGetLoadBalancedPartitionBegin> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4cbde0 <hypre_CSRMatrixGetLoadBalancedPartitionEnd> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R12,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4c9f2f <hypre_CSRMatrixTranspose.extracted+0x8f> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x250d00(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4f4525,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4f653b,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d58d0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4f64b4,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1d7,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d8210 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x38(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x40(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4c9f3d <hypre_CSRMatrixTranspose.extracted+0x9d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RAX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4c9f75 <hypre_CSRMatrixTranspose.extracted+0xd5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x250cbc(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4f4525,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4f654a,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d58d0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4f64b4,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1d8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d8210 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x38(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RCX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4c9f87 <hypre_CSRMatrixTranspose.extracted+0xe7> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4c9fb5 <hypre_CSRMatrixTranspose.extracted+0x115> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x250c72(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4f4525,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4f656d,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d58d0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4f64b4,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1d9,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d8210 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%R12),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%R13,%RAX,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4e0430 <__intel_avx_rep_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x38(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX,%RAX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP (%RBX,%RSI,8),%RAX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JGE 4ca00d <hypre_CSRMatrixTranspose.extracted+0x16d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x719ab0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 40fed0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%R12),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA 0x1(%R14),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x1(%RCX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R9,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R11,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 4ca16b <hypre_CSRMatrixTranspose.extracted+0x2cb> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R11,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x719ad0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 40fed0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x719af0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 410040 <__kmpc_masked@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
CMP $0x1,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4ca2c3 <hypre_CSRMatrixTranspose.extracted+0x423> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP $0x1,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x30(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4ca2b6 <hypre_CSRMatrixTranspose.extracted+0x416> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%R15),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP $0x4,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 4ca55a <hypre_CSRMatrixTranspose.extracted+0x6ba> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RAX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x30(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JAE 4ca2b6 <hypre_CSRMatrixTranspose.extracted+0x416> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INC %R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 4ca0d6 <hypre_CSRMatrixTranspose.extracted+0x236> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV (%R9),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x719b10,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 40fe60 <__kmpc_end_masked@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x719b30,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 40fed0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV -0x58(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4ca452 <hypre_CSRMatrixTranspose.extracted+0x5b2> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %RDI,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA -0x1(%RCX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %R15,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE 4ca302 <hypre_CSRMatrixTranspose.extracted+0x462> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %R15 | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
JMP 4ca307 <hypre_CSRMatrixTranspose.extracted+0x467> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %R15D | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV %RDI,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R8,%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
DEC %RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RSI,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4ca452 <hypre_CSRMatrixTranspose.extracted+0x5b2> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
IMUL %RDI,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RAX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV (%R13,%RDX,8),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4ca35c <hypre_CSRMatrixTranspose.extracted+0x4bc> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x30(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x719b50,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 40fed0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
CMPQ $0,-0x60(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 4ca4ad <hypre_CSRMatrixTranspose.extracted+0x60d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x40(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R9,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x10(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x50(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4ca899 <hypre_CSRMatrixTranspose.extracted+0x9f9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x28(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX,%RSI,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %ESI,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R9D,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA 0x1(%R9),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST $0x1,%CL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 4ca4e0 <hypre_CSRMatrixTranspose.extracted+0x640> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RSI,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %R8,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4ca8b5 <hypre_CSRMatrixTranspose.extracted+0xa15> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4ca899 <hypre_CSRMatrixTranspose.extracted+0x9f9> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x40(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R8,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x10(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4ca899 <hypre_CSRMatrixTranspose.extracted+0x9f9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%RBX,%R10,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R10D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R8D,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA 0x1(%R8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST $0x1,%AL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 4ca78c <hypre_CSRMatrixTranspose.extracted+0x8ec> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R10,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 4ca7ce <hypre_CSRMatrixTranspose.extracted+0x92e> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
LEA -0x1(%RSI),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x8(%RBX,%RSI,8),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDI,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4ca88d <hypre_CSRMatrixTranspose.extracted+0x9ed> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R8,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x38(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x30(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R8,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4ca8b5 <hypre_CSRMatrixTranspose.extracted+0xa15> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4ca899 <hypre_CSRMatrixTranspose.extracted+0x9f9> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x48(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SHR $0x2,%R8 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4ca599 <hypre_CSRMatrixTranspose.extracted+0x6f9> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x1(%R10),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RDX,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4ca7e9 <hypre_CSRMatrixTranspose.extracted+0x949> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4ca899 <hypre_CSRMatrixTranspose.extracted+0x9f9> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x38(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R8,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4ca8b5 <hypre_CSRMatrixTranspose.extracted+0xa15> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x38,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_CSRMatrixTranspose.extracted– | 0.18 | 0.03 |
▼Loop 3950 - csr_matop.c:540-548 - exec– | 0.04 | 0.01 |
○Loop 3951 - csr_matop.c:541-548 - exec | 0.04 | 0.01 |
○Loop 3952 - csr_matop.c:541-548 - exec | 0.04 | 0.01 |
○Loop 3957 - csr_matop.c:380-500 - exec | 0.02 | 0.01 |
○Loop 3958 - csr_matop.c:483-485 - exec | 0.01 | 0.01 |
○Loop 3954 - csr_matop.c:380-527 - exec | 0.01 | 0.01 |
○Loop 3949 - csr_matop.c:554-560 - exec | 0 | 0 |
○Loop 3956 - csr_matop.c:380-513 - exec | 0 | 0 |
○Loop 3953 - csr_matop.c:541-548 - exec | 0 | 0 |
▼Loop 3946 - csr_matop.c:553-560 - exec– | 0 | 0 |
○Loop 3948 - csr_matop.c:554-560 - exec | 0 | 0 |
○Loop 3947 - csr_matop.c:554-560 - exec | 0 | 0 |
○Loop 3955 - csr_matop.c:380-513 - exec | 0 | 0 |