Function: hypre_CSRMatrixTranspose.extracted | Module: libseq_mv.so | Source: csr_matop.c:380-560 [...] | Coverage: 0.2% |
---|
Function: hypre_CSRMatrixTranspose.extracted | Module: libseq_mv.so | Source: csr_matop.c:380-560 [...] | Coverage: 0.2% |
---|
/home/eoseret/qaas_runs_CPU_9468/171-147-2675/intel/AMG/build/AMG/AMG/seq_mv/csr_matrix.c: 645 - 674 |
-------------------------------------------------------------------------------- |
645: HYPRE_Int num_nonzerosA = hypre_CSRMatrixNumNonzeros(A); |
646: HYPRE_Int num_rowsA = hypre_CSRMatrixNumRows(A); |
647: HYPRE_Int *A_i = hypre_CSRMatrixI(A); |
648: |
649: HYPRE_Int num_threads = hypre_NumActiveThreads(); |
650: |
651: HYPRE_Int nonzeros_per_thread = (num_nonzerosA + num_threads - 1)/num_threads; |
652: |
653: if (idx <= 0) |
654: { |
655: return 0; |
656: } |
657: else if (idx >= num_threads) |
[...] |
663: return (HYPRE_Int)(hypre_LowerBound(A_i, A_i + num_rowsA, nonzeros_per_thread*idx) - A_i); |
[...] |
669: return hypre_CSRMatrixGetLoadBalancedPartitionBoundary(A, hypre_GetThreadNum()); |
670: } |
671: |
672: HYPRE_Int hypre_CSRMatrixGetLoadBalancedPartitionEnd(hypre_CSRMatrix *A) |
673: { |
674: return hypre_CSRMatrixGetLoadBalancedPartitionBoundary(A, hypre_GetThreadNum() + 1); |
/home/eoseret/qaas_runs_CPU_9468/171-147-2675/intel/AMG/build/AMG/AMG/seq_mv/csr_matop.c: 380 - 560 |
-------------------------------------------------------------------------------- |
380: return idx%dim1*dim2 + idx/dim1; |
[...] |
463: #pragma omp parallel |
464: #endif |
465: { |
466: HYPRE_Int num_threads = hypre_NumActiveThreads(); |
467: HYPRE_Int my_thread_num = hypre_GetThreadNum(); |
468: |
469: HYPRE_Int iBegin = hypre_CSRMatrixGetLoadBalancedPartitionBegin(A); |
470: HYPRE_Int iEnd = hypre_CSRMatrixGetLoadBalancedPartitionEnd(A); |
471: hypre_assert(iBegin <= iEnd); |
472: hypre_assert(iBegin >= 0 && iBegin <= num_rowsA); |
473: hypre_assert(iEnd >= 0 && iEnd <= num_rowsA); |
474: |
475: HYPRE_Int i, j; |
476: memset(bucket + my_thread_num*num_colsA, 0, sizeof(HYPRE_Int)*num_colsA); |
[...] |
483: for (j = A_i[iBegin]; j < A_i[iEnd]; ++j) { |
484: HYPRE_Int idx = A_j[j]; |
485: bucket[my_thread_num*num_colsA + idx]++; |
[...] |
496: for (i = my_thread_num*num_colsA + 1; i < (my_thread_num + 1)*num_colsA; ++i) { |
497: HYPRE_Int transpose_i = transpose_idx(i, num_threads, num_colsA); |
498: HYPRE_Int transpose_i_minus_1 = transpose_idx(i - 1, num_threads, num_colsA); |
499: |
500: bucket[transpose_i] += bucket[transpose_i_minus_1]; |
501: } |
502: |
503: #ifdef HYPRE_USING_OPENMP |
504: #pragma omp barrier |
505: #pragma omp master |
506: #endif |
507: { |
508: for (i = 1; i < num_threads; ++i) { |
509: HYPRE_Int j0 = num_colsA*i - 1, j1 = num_colsA*(i + 1) - 1; |
510: HYPRE_Int transpose_j0 = transpose_idx(j0, num_threads, num_colsA); |
511: HYPRE_Int transpose_j1 = transpose_idx(j1, num_threads, num_colsA); |
512: |
513: bucket[transpose_j1] += bucket[transpose_j0]; |
[...] |
520: if (my_thread_num > 0) { |
521: HYPRE_Int transpose_i0 = transpose_idx(num_colsA*my_thread_num - 1, num_threads, num_colsA); |
522: HYPRE_Int offset = bucket[transpose_i0]; |
523: |
524: for (i = my_thread_num*num_colsA; i < (my_thread_num + 1)*num_colsA - 1; ++i) { |
525: HYPRE_Int transpose_i = transpose_idx(i, num_threads, num_colsA); |
526: |
527: bucket[transpose_i] += offset; |
[...] |
539: if (data) { |
540: for (i = iEnd - 1; i >= iBegin; --i) { |
541: for (j = A_i[i + 1] - 1; j >= A_i[i]; --j) { |
542: HYPRE_Int idx = A_j[j]; |
543: --bucket[my_thread_num*num_colsA + idx]; |
544: |
545: HYPRE_Int offset = bucket[my_thread_num*num_colsA + idx]; |
546: |
547: AT_data[offset] = A_data[j]; |
548: AT_j[offset] = i; |
549: } |
550: } |
551: } |
552: else { |
553: for (i = iEnd - 1; i >= iBegin; --i) { |
554: for (j = A_i[i + 1] - 1; j >= A_i[i]; --j) { |
555: HYPRE_Int idx = A_j[j]; |
556: --bucket[my_thread_num*num_colsA + idx]; |
557: |
558: HYPRE_Int offset = bucket[my_thread_num*num_colsA + idx]; |
559: |
560: AT_j[offset] = i; |
0x44f0 PUSH %RBP |
0x44f1 MOV %RSP,%RBP |
0x44f4 PUSH %R15 |
0x44f6 PUSH %R14 |
0x44f8 PUSH %R13 |
0x44fa PUSH %R12 |
0x44fc PUSH %RBX |
0x44fd SUB $0x48,%RSP |
0x4501 MOV %R9,%RBX |
0x4504 MOV %R8,-0x58(%RBP) |
0x4508 MOV %RCX,-0x68(%RBP) |
0x450c MOV %RDX,%R13 |
0x450f MOV %RDI,-0x40(%RBP) |
0x4513 CALL 3170 <hypre_NumActiveThreads@plt> |
0x4518 MOV %RAX,%R15 |
0x451b CALL 3080 <hypre_GetThreadNum@plt> |
0x4520 MOV %RAX,%R14 |
0x4523 CALL 3080 <hypre_GetThreadNum@plt> |
0x4528 MOV %RAX,-0x30(%RBP) |
0x452c MOV 0x20(%R13),%R12 |
0x4530 MOV (%R13),%RAX |
0x4534 MOV %RAX,-0x48(%RBP) |
0x4538 MOV 0x10(%R13),%RAX |
0x453c MOV %RAX,-0x38(%RBP) |
0x4540 CALL 3170 <hypre_NumActiveThreads@plt> |
0x4545 MOV %RAX,%RCX |
0x4548 LEA -0x1(%R12,%RAX,1),%RAX |
0x454d MOV %RAX,%RDX |
0x4550 OR %RCX,%RDX |
0x4553 SHR $0x20,%RDX |
0x4557 JE 4560 |
0x4559 CQTO |
0x455b IDIV %RCX |
0x455e JMP 4564 |
0x4560 XOR %EDX,%EDX |
0x4562 DIV %ECX |
0x4564 MOV -0x38(%RBP),%RDX |
0x4568 MOV -0x30(%RBP),%RDI |
0x456c TEST %RDI,%RDI |
0x456f JLE 459a |
0x4571 CMP %RDI,%RCX |
0x4574 JLE 45a2 |
0x4576 MOV -0x48(%RBP),%R12 |
0x457a LEA (%R12,%RDX,8),%RSI |
0x457e IMUL %RDI,%RAX |
0x4582 MOV %R12,%RDI |
0x4585 MOV %RAX,%RDX |
0x4588 CALL 3140 <hypre_LowerBound@plt> |
0x458d SUB %R12,%RAX |
0x4590 SAR $0x3,%RAX |
0x4594 MOV %RAX,-0x38(%RBP) |
0x4598 JMP 45a2 |
0x459a MOVQ $0,-0x38(%RBP) |
0x45a2 CALL 3080 <hypre_GetThreadNum@plt> |
0x45a7 MOV %RAX,-0x30(%RBP) |
0x45ab MOV 0x20(%R13),%R12 |
0x45af MOV (%R13),%RAX |
0x45b3 MOV %RAX,-0x48(%RBP) |
0x45b7 MOV 0x10(%R13),%R13 |
0x45bb CALL 3170 <hypre_NumActiveThreads@plt> |
0x45c0 MOV %RAX,%RCX |
0x45c3 LEA -0x1(%R12,%RAX,1),%RAX |
0x45c8 MOV %RAX,%RDX |
0x45cb OR %RCX,%RDX |
0x45ce SHR $0x20,%RDX |
0x45d2 JE 45db |
0x45d4 CQTO |
0x45d6 IDIV %RCX |
0x45d9 JMP 45df |
0x45db XOR %EDX,%EDX |
0x45dd DIV %ECX |
0x45df MOV -0x38(%RBP),%RDX |
0x45e3 MOV %R13,%RSI |
0x45e6 MOV -0x30(%RBP),%RDI |
0x45ea TEST %RDI,%RDI |
0x45ed JS 461e |
0x45ef INC %RDI |
0x45f2 CMP %RDI,%RCX |
0x45f5 JLE 4620 |
0x45f7 MOV -0x48(%RBP),%R12 |
0x45fb LEA (%R12,%RSI,8),%RSI |
0x45ff IMUL %RDI,%RAX |
0x4603 MOV %R12,%RDI |
0x4606 MOV %RAX,%RDX |
0x4609 CALL 3140 <hypre_LowerBound@plt> |
0x460e MOV -0x38(%RBP),%RDX |
0x4612 MOV %RAX,%RSI |
0x4615 SUB %R12,%RSI |
0x4618 SAR $0x3,%RSI |
0x461c JMP 4620 |
0x461e XOR %ESI,%ESI |
0x4620 CMP %RDX,%RSI |
0x4623 MOV %RSI,-0x30(%RBP) |
0x4627 JGE 4668 |
0x4629 MOV 0xc9b0(%RIP),%RAX |
0x4630 MOV (%RAX),%RDI |
0x4633 LEA 0x7d33(%RIP),%RSI |
0x463a LEA 0x7cd4(%RIP),%RDX |
0x4641 XOR %EAX,%EAX |
0x4643 CALL 31e0 <hypre_fprintf@plt> |
0x4648 LEA 0x7a11(%RIP),%RDI |
0x464f MOV $0x1d7,%ESI |
0x4654 MOV $0x1,%EDX |
0x4659 XOR %ECX,%ECX |
0x465b CALL 3220 <hypre_error_handler@plt> |
0x4660 MOV -0x30(%RBP),%RSI |
0x4664 MOV -0x38(%RBP),%RDX |
0x4668 MOV 0x18(%RBP),%RAX |
0x466c TEST %RDX,%RDX |
0x466f JS 4676 |
0x4671 CMP %RAX,%RDX |
0x4674 JLE 46b7 |
0x4676 MOV %RAX,%R12 |
0x4679 MOV 0xc960(%RIP),%RAX |
0x4680 MOV (%RAX),%RDI |
0x4683 LEA 0x7ce3(%RIP),%RSI |
0x468a LEA 0x7a52(%RIP),%RDX |
0x4691 XOR %EAX,%EAX |
0x4693 CALL 31e0 <hypre_fprintf@plt> |
0x4698 LEA 0x79c1(%RIP),%RDI |
0x469f MOV $0x1d8,%ESI |
0x46a4 MOV $0x1,%EDX |
0x46a9 XOR %ECX,%ECX |
0x46ab CALL 3220 <hypre_error_handler@plt> |
0x46b0 MOV %R12,%RAX |
0x46b3 MOV -0x30(%RBP),%RSI |
0x46b7 MOV 0x38(%RBP),%R13 |
0x46bb MOV 0x20(%RBP),%R12 |
0x46bf TEST %RSI,%RSI |
0x46c2 JS 46c9 |
0x46c4 CMP %RAX,%RSI |
0x46c7 JLE 4700 |
0x46c9 MOV 0xc910(%RIP),%RAX |
0x46d0 MOV (%RAX),%RDI |
0x46d3 LEA 0x7c93(%RIP),%RSI |
0x46da LEA 0x7a25(%RIP),%RDX |
0x46e1 XOR %EAX,%EAX |
0x46e3 CALL 31e0 <hypre_fprintf@plt> |
0x46e8 LEA 0x7971(%RIP),%RDI |
0x46ef MOV $0x1d9,%ESI |
0x46f4 MOV $0x1,%EDX |
0x46f9 XOR %ECX,%ECX |
0x46fb CALL 3220 <hypre_error_handler@plt> |
0x4700 MOV (%R12),%RDX |
0x4704 MOV %RDX,%RAX |
0x4707 IMUL %R14,%RAX |
0x470b LEA (%R13,%RAX,8),%RDI |
0x4710 SAL $0x3,%RDX |
0x4714 XOR %ESI,%ESI |
0x4716 CALL 30b0 <__intel_avx_rep_memset@plt> |
0x471b MOV -0x30(%RBP),%RSI |
0x471f MOV 0x10(%RBP),%RDX |
0x4723 MOV -0x38(%RBP),%RAX |
0x4727 MOV (%RBX,%RAX,8),%RAX |
0x472b CMP (%RBX,%RSI,8),%RAX |
0x472f JGE 475d |
0x4731 NOPW %CS:(%RAX,%RAX,1) |
(48) 0x4740 MOV (%R12),%RCX |
(48) 0x4744 IMUL %R14,%RCX |
(48) 0x4748 ADD (%RDX,%RAX,8),%RCX |
(48) 0x474c LEA (%R13,%RCX,8),%RCX |
(48) 0x4751 INCQ (%RCX) |
(48) 0x4754 INC %RAX |
(48) 0x4757 CMP (%RBX,%RSI,8),%RAX |
(48) 0x475b JL 4740 |
0x475d MOV -0x40(%RBP),%RAX |
0x4761 MOV (%RAX),%ESI |
0x4763 LEA 0xc9f6(%RIP),%RDI |
0x476a CALL 31d0 <__kmpc_barrier@plt> |
0x476f MOV (%R12),%R9 |
0x4773 MOV %R9,%RCX |
0x4776 IMUL %R14,%RCX |
0x477a LEA 0x1(%R14),%R11 |
0x477e LEA 0x1(%RCX),%RAX |
0x4782 MOV %R9,%RDX |
0x4785 IMUL %R11,%RDX |
0x4789 CMP %RDX,%RAX |
0x478c JL 48cb |
0x4792 MOV %R11,-0x48(%RBP) |
0x4796 MOV %R15,-0x60(%RBP) |
0x479a MOV -0x40(%RBP),%R15 |
0x479e MOV (%R15),%ESI |
0x47a1 LEA 0xc9d8(%RIP),%RDI |
0x47a8 CALL 31d0 <__kmpc_barrier@plt> |
0x47ad MOV (%R15),%ESI |
0x47b0 MOV -0x60(%RBP),%R15 |
0x47b4 LEA 0xc9e5(%RIP),%RDI |
0x47bb XOR %EDX,%EDX |
0x47bd CALL 30c0 <__kmpc_masked@plt> |
0x47c2 CMP $0x1,%EAX |
0x47c5 JNE 4a25 |
0x47cb CMP $0x1,%R15 |
0x47cf MOV -0x40(%RBP),%R9 |
0x47d3 JLE 4a16 |
0x47d9 LEA -0x1(%R15),%RAX |
0x47dd MOV %RAX,-0x50(%RBP) |
0x47e1 CMP $0x4,%RAX |
0x47e5 JAE 4cba |
0x47eb MOV -0x50(%RBP),%RAX |
0x47ef MOV %RAX,%R8 |
0x47f2 AND $-0x4,%R8 |
0x47f6 CMP %RAX,%R8 |
0x47f9 MOV -0x40(%RBP),%R9 |
0x47fd JAE 4a16 |
0x4803 INC %R8 |
0x4806 JMP 4836 |
0x4808 NOPL (%RAX,%RAX,1) |
(45) 0x4810 CQTO |
(45) 0x4812 IDIV %R15 |
(45) 0x4815 IMUL %RDI,%RCX |
(45) 0x4819 ADD %RSI,%RCX |
(45) 0x481c MOV (%R13,%RCX,8),%RCX |
(45) 0x4821 IMUL %RDI,%RDX |
(45) 0x4825 ADD %RAX,%RDX |
(45) 0x4828 ADD %RCX,(%R13,%RDX,8) |
(45) 0x482d CMP %R8,%R15 |
(45) 0x4830 JE 4a16 |
(45) 0x4836 MOV (%R12),%RDI |
(45) 0x483a MOV %RDI,%RAX |
(45) 0x483d IMUL %R8,%RAX |
(45) 0x4841 DEC %RAX |
(45) 0x4844 MOV %RAX,%RCX |
(45) 0x4847 OR %R15,%RCX |
(45) 0x484a SHR $0x20,%RCX |
(45) 0x484e JE 4860 |
(45) 0x4850 CQTO |
(45) 0x4852 IDIV %R15 |
(45) 0x4855 MOV %RDX,%RCX |
(45) 0x4858 MOV %RAX,%RSI |
(45) 0x485b JMP 4869 |
0x485d NOPL (%RAX) |
(45) 0x4860 XOR %EDX,%EDX |
(45) 0x4862 DIV %R15D |
(45) 0x4865 MOV %EDX,%ECX |
(45) 0x4867 MOV %EAX,%ESI |
(45) 0x4869 INC %R8 |
(45) 0x486c MOV %RDI,%RAX |
(45) 0x486f IMUL %R8,%RAX |
(45) 0x4873 DEC %RAX |
(45) 0x4876 MOV %RAX,%RDX |
(45) 0x4879 OR %R15,%RDX |
(45) 0x487c SHR $0x20,%RDX |
(45) 0x4880 JNE 4810 |
(45) 0x4882 XOR %EDX,%EDX |
(45) 0x4884 DIV %R15D |
(45) 0x4887 JMP 4815 |
0x4889 NOPL (%RAX) |
(47) 0x4890 MOV %R8,%RAX |
(47) 0x4893 CQTO |
(47) 0x4895 IDIV %R15 |
(47) 0x4898 IMUL %R9,%RDI |
(47) 0x489c ADD %RDI,%RSI |
(47) 0x489f MOV (%R13,%RSI,8),%RSI |
(47) 0x48a4 IMUL %R9,%RDX |
(47) 0x48a8 ADD %RAX,%RDX |
(47) 0x48ab ADD %RSI,(%R13,%RDX,8) |
(47) 0x48b0 MOV (%R12),%R9 |
(47) 0x48b4 MOV %R11,%RAX |
(47) 0x48b7 IMUL %R9,%RAX |
(47) 0x48bb ADD $0x5,%RCX |
(47) 0x48bf CMP %RAX,%RCX |
(47) 0x48c2 MOV %R8,%RCX |
(47) 0x48c5 JGE 4792 |
(47) 0x48cb LEA 0x1(%RCX),%RAX |
(47) 0x48cf MOV %RAX,%RDX |
(47) 0x48d2 OR %R15,%RDX |
(47) 0x48d5 SHR $0x20,%RDX |
(47) 0x48d9 JE 48f0 |
(47) 0x48db CQTO |
(47) 0x48dd IDIV %R15 |
(47) 0x48e0 MOV %RDX,%RDI |
(47) 0x48e3 MOV %RAX,%RSI |
(47) 0x48e6 JMP 48f9 |
0x48e8 NOPL (%RAX,%RAX,1) |
(47) 0x48f0 XOR %EDX,%EDX |
(47) 0x48f2 DIV %R15D |
(47) 0x48f5 MOV %EDX,%EDI |
(47) 0x48f7 MOV %EAX,%ESI |
(47) 0x48f9 MOV %RCX,%RAX |
(47) 0x48fc OR %R15,%RAX |
(47) 0x48ff SHR $0x20,%RAX |
(47) 0x4903 JE 4910 |
(47) 0x4905 MOV %RCX,%RAX |
(47) 0x4908 CQTO |
(47) 0x490a IDIV %R15 |
(47) 0x490d JMP 4917 |
0x490f NOP |
(47) 0x4910 MOV %ECX,%EAX |
(47) 0x4912 XOR %EDX,%EDX |
(47) 0x4914 DIV %R15D |
(47) 0x4917 IMUL %R9,%RDX |
(47) 0x491b ADD %RAX,%RDX |
(47) 0x491e MOV (%R13,%RDX,8),%RAX |
(47) 0x4923 IMUL %RDI,%R9 |
(47) 0x4927 ADD %RSI,%R9 |
(47) 0x492a ADD %RAX,(%R13,%R9,8) |
(47) 0x492f MOV (%R12),%R10 |
(47) 0x4933 LEA 0x2(%RCX),%RAX |
(47) 0x4937 MOV %R11,%RDX |
(47) 0x493a IMUL %R10,%RDX |
(47) 0x493e CMP %RDX,%RAX |
(47) 0x4941 JGE 4792 |
(47) 0x4947 MOV %RAX,%RDX |
(47) 0x494a OR %R15,%RDX |
(47) 0x494d SHR $0x20,%RDX |
(47) 0x4951 JE 4960 |
(47) 0x4953 CQTO |
(47) 0x4955 IDIV %R15 |
(47) 0x4958 MOV %RDX,%R9 |
(47) 0x495b MOV %RAX,%R8 |
(47) 0x495e JMP 496b |
(47) 0x4960 XOR %EDX,%EDX |
(47) 0x4962 DIV %R15D |
(47) 0x4965 MOV %EDX,%R9D |
(47) 0x4968 MOV %EAX,%R8D |
(47) 0x496b IMUL %R10,%RDI |
(47) 0x496f ADD %RDI,%RSI |
(47) 0x4972 MOV (%R13,%RSI,8),%RAX |
(47) 0x4977 IMUL %R9,%R10 |
(47) 0x497b ADD %R8,%R10 |
(47) 0x497e ADD %RAX,(%R13,%R10,8) |
(47) 0x4983 MOV (%R12),%R10 |
(47) 0x4987 LEA 0x3(%RCX),%RAX |
(47) 0x498b MOV %R11,%RDX |
(47) 0x498e IMUL %R10,%RDX |
(47) 0x4992 CMP %RDX,%RAX |
(47) 0x4995 JGE 4792 |
(47) 0x499b MOV %RAX,%RDX |
(47) 0x499e OR %R15,%RDX |
(47) 0x49a1 SHR $0x20,%RDX |
(47) 0x49a5 JE 49c0 |
(47) 0x49a7 CQTO |
(47) 0x49a9 IDIV %R15 |
(47) 0x49ac MOV %RDX,%RDI |
(47) 0x49af MOV %RAX,%RSI |
(47) 0x49b2 JMP 49c9 |
0x49b4 NOPW %CS:(%RAX,%RAX,1) |
(47) 0x49c0 XOR %EDX,%EDX |
(47) 0x49c2 DIV %R15D |
(47) 0x49c5 MOV %EDX,%EDI |
(47) 0x49c7 MOV %EAX,%ESI |
(47) 0x49c9 IMUL %R10,%R9 |
(47) 0x49cd ADD %R9,%R8 |
(47) 0x49d0 MOV (%R13,%R8,8),%RAX |
(47) 0x49d5 IMUL %RDI,%R10 |
(47) 0x49d9 ADD %RSI,%R10 |
(47) 0x49dc ADD %RAX,(%R13,%R10,8) |
(47) 0x49e1 MOV (%R12),%R9 |
(47) 0x49e5 LEA 0x4(%RCX),%R8 |
(47) 0x49e9 MOV %R11,%RAX |
(47) 0x49ec IMUL %R9,%RAX |
(47) 0x49f0 CMP %RAX,%R8 |
(47) 0x49f3 JGE 4792 |
(47) 0x49f9 MOV %R8,%RAX |
(47) 0x49fc OR %R15,%RAX |
(47) 0x49ff SHR $0x20,%RAX |
(47) 0x4a03 JNE 4890 |
(47) 0x4a09 MOV %R8D,%EAX |
(47) 0x4a0c XOR %EDX,%EDX |
(47) 0x4a0e DIV %R15D |
(47) 0x4a11 JMP 4898 |
0x4a16 MOV (%R9),%ESI |
0x4a19 LEA 0xc7a0(%RIP),%RDI |
0x4a20 CALL 30d0 <__kmpc_end_masked@plt> |
0x4a25 MOV -0x40(%RBP),%RAX |
0x4a29 MOV (%RAX),%ESI |
0x4a2b LEA 0xc7ae(%RIP),%RDI |
0x4a32 CALL 31d0 <__kmpc_barrier@plt> |
0x4a37 TEST %R14,%R14 |
0x4a3a MOV -0x48(%RBP),%R8 |
0x4a3e JLE 4bb2 |
0x4a44 MOV (%R12),%RDI |
0x4a48 MOV %R14,%RCX |
0x4a4b IMUL %RDI,%RCX |
0x4a4f LEA -0x1(%RCX),%RAX |
0x4a53 MOV %RAX,%RDX |
0x4a56 OR %R15,%RDX |
0x4a59 SHR $0x20,%RDX |
0x4a5d JE 4a66 |
0x4a5f CQTO |
0x4a61 IDIV %R15 |
0x4a64 JMP 4a6b |
0x4a66 XOR %EDX,%EDX |
0x4a68 DIV %R15D |
0x4a6b MOV %RDI,%RSI |
0x4a6e IMUL %R8,%RSI |
0x4a72 DEC %RSI |
0x4a75 CMP %RSI,%RCX |
0x4a78 JGE 4bb2 |
0x4a7e IMUL %RDI,%RDX |
0x4a82 ADD %RAX,%RDX |
0x4a85 MOV (%R13,%RDX,8),%RSI |
0x4a8a JMP 4abc |
0x4a8c NOPL (%RAX) |
(44) 0x4a90 CQTO |
(44) 0x4a92 IDIV %R15 |
(44) 0x4a95 IMUL %RDX,%RDI |
(44) 0x4a99 ADD %RAX,%RDI |
(44) 0x4a9c ADD %RSI,(%R13,%RDI,8) |
(44) 0x4aa1 MOV (%R12),%RDI |
(44) 0x4aa5 MOV %R8,%RAX |
(44) 0x4aa8 IMUL %RDI,%RAX |
(44) 0x4aac DEC %RAX |
(44) 0x4aaf ADD $0x4,%RCX |
(44) 0x4ab3 CMP %RAX,%RCX |
(44) 0x4ab6 JGE 4bb2 |
(44) 0x4abc MOV %RCX,%RAX |
(44) 0x4abf OR %R15,%RAX |
(44) 0x4ac2 SHR $0x20,%RAX |
(44) 0x4ac6 JE 4ae0 |
(44) 0x4ac8 MOV %RCX,%RAX |
(44) 0x4acb CQTO |
(44) 0x4acd IDIV %R15 |
(44) 0x4ad0 JMP 4ae7 |
0x4ad2 NOPW %CS:(%RAX,%RAX,1) |
(44) 0x4ae0 MOV %ECX,%EAX |
(44) 0x4ae2 XOR %EDX,%EDX |
(44) 0x4ae4 DIV %R15D |
(44) 0x4ae7 IMUL %RDX,%RDI |
(44) 0x4aeb ADD %RAX,%RDI |
(44) 0x4aee ADD %RSI,(%R13,%RDI,8) |
(44) 0x4af3 MOV (%R12),%RDI |
(44) 0x4af7 LEA 0x1(%RCX),%RAX |
(44) 0x4afb MOV %R8,%RDX |
(44) 0x4afe IMUL %RDI,%RDX |
(44) 0x4b02 DEC %RDX |
(44) 0x4b05 CMP %RDX,%RAX |
(44) 0x4b08 JGE 4bb2 |
(44) 0x4b0e MOV %RAX,%RDX |
(44) 0x4b11 OR %R15,%RDX |
(44) 0x4b14 SHR $0x20,%RDX |
(44) 0x4b18 JE 4b30 |
(44) 0x4b1a CQTO |
(44) 0x4b1c IDIV %R15 |
(44) 0x4b1f JMP 4b35 |
0x4b21 NOPW %CS:(%RAX,%RAX,1) |
(44) 0x4b30 XOR %EDX,%EDX |
(44) 0x4b32 DIV %R15D |
(44) 0x4b35 IMUL %RDX,%RDI |
(44) 0x4b39 ADD %RAX,%RDI |
(44) 0x4b3c ADD %RSI,(%R13,%RDI,8) |
(44) 0x4b41 MOV (%R12),%RDI |
(44) 0x4b45 LEA 0x2(%RCX),%RAX |
(44) 0x4b49 MOV %R8,%RDX |
(44) 0x4b4c IMUL %RDI,%RDX |
(44) 0x4b50 DEC %RDX |
(44) 0x4b53 CMP %RDX,%RAX |
(44) 0x4b56 JGE 4bb2 |
(44) 0x4b58 MOV %RAX,%RDX |
(44) 0x4b5b OR %R15,%RDX |
(44) 0x4b5e SHR $0x20,%RDX |
(44) 0x4b62 JE 4b70 |
(44) 0x4b64 CQTO |
(44) 0x4b66 IDIV %R15 |
(44) 0x4b69 JMP 4b75 |
0x4b6b NOPL (%RAX,%RAX,1) |
(44) 0x4b70 XOR %EDX,%EDX |
(44) 0x4b72 DIV %R15D |
(44) 0x4b75 IMUL %RDX,%RDI |
(44) 0x4b79 ADD %RAX,%RDI |
(44) 0x4b7c ADD %RSI,(%R13,%RDI,8) |
(44) 0x4b81 MOV (%R12),%RDI |
(44) 0x4b85 LEA 0x3(%RCX),%RAX |
(44) 0x4b89 MOV %R8,%RDX |
(44) 0x4b8c IMUL %RDI,%RDX |
(44) 0x4b90 DEC %RDX |
(44) 0x4b93 CMP %RDX,%RAX |
(44) 0x4b96 JGE 4bb2 |
(44) 0x4b98 MOV %RAX,%RDX |
(44) 0x4b9b OR %R15,%RDX |
(44) 0x4b9e SHR $0x20,%RDX |
(44) 0x4ba2 JNE 4a90 |
(44) 0x4ba8 XOR %EDX,%EDX |
(44) 0x4baa DIV %R15D |
(44) 0x4bad JMP 4a95 |
0x4bb2 MOV 0x30(%RBP),%R15 |
0x4bb6 MOV -0x40(%RBP),%RAX |
0x4bba MOV (%RAX),%ESI |
0x4bbc LEA 0xc63d(%RIP),%RDI |
0x4bc3 CALL 31d0 <__kmpc_barrier@plt> |
0x4bc8 CMPQ $0,-0x68(%RBP) |
0x4bcd JE 4c0f |
0x4bcf MOV -0x38(%RBP),%R9 |
0x4bd3 MOV -0x30(%RBP),%RSI |
0x4bd7 CMP %R9,%RSI |
0x4bda MOV -0x58(%RBP),%R10 |
0x4bde MOV 0x10(%RBP),%R11 |
0x4be2 JLE 4ff9 |
0x4be8 MOV 0x28(%RBP),%RAX |
0x4bec MOV (%RBX,%RSI,8),%RDX |
0x4bf0 MOV %ESI,%ECX |
0x4bf2 SUB %R9D,%ECX |
0x4bf5 LEA 0x1(%R9),%R8 |
0x4bf9 TEST $0x1,%CL |
0x4bfc JNE 4c42 |
0x4bfe MOV %RSI,%RCX |
0x4c01 CMP %R8,%RSI |
0x4c04 JNE 5015 |
0x4c0a JMP 4ff9 |
0x4c0f MOV -0x38(%RBP),%R8 |
0x4c13 MOV -0x30(%RBP),%R10 |
0x4c17 CMP %R8,%R10 |
0x4c1a MOV 0x10(%RBP),%R9 |
0x4c1e JLE 4ff9 |
0x4c24 MOV (%RBX,%R10,8),%RCX |
0x4c28 MOV %R10D,%EAX |
0x4c2b SUB %R8D,%EAX |
0x4c2e LEA 0x1(%R8),%RDX |
0x4c32 TEST $0x1,%AL |
0x4c34 JNE 4eec |
0x4c3a MOV %R10,%RAX |
0x4c3d JMP 4f2e |
0x4c42 LEA -0x1(%RSI),%RCX |
0x4c46 MOV -0x8(%RBX,%RSI,8),%RDI |
0x4c4b CMP %RDI,%RDX |
0x4c4e JLE 4fed |
0x4c54 MOV %R8,-0x40(%RBP) |
0x4c58 MOV -0x30(%RBP),%RSI |
0x4c5c NOPL (%RAX) |
(43) 0x4c60 MOV -0x8(%R11,%RDX,8),%RDI |
(43) 0x4c65 MOV (%R12),%R8 |
(43) 0x4c69 IMUL %R14,%R8 |
(43) 0x4c6d ADD %RDI,%R8 |
(43) 0x4c70 LEA (%R13,%R8,8),%R8 |
(43) 0x4c75 DECQ (%R8) |
(43) 0x4c78 MOV (%R12),%R8 |
(43) 0x4c7c IMUL %R14,%R8 |
(43) 0x4c80 ADD %RDI,%R8 |
(43) 0x4c83 VMOVSD -0x8(%R10,%RDX,8),%XMM0 |
(43) 0x4c8a DEC %RDX |
(43) 0x4c8d MOV (%R13,%R8,8),%RDI |
(43) 0x4c92 VMOVSD %XMM0,(%RAX,%RDI,8) |
(43) 0x4c97 MOV %RCX,(%R15,%RDI,8) |
(43) 0x4c9b MOV -0x8(%RBX,%RSI,8),%RDI |
(43) 0x4ca0 CMP %RDI,%RDX |
(43) 0x4ca3 JG 4c60 |
0x4ca5 MOV %RDI,%RDX |
0x4ca8 MOV -0x40(%RBP),%R8 |
0x4cac CMP %R8,%RSI |
0x4caf JNE 5015 |
0x4cb5 JMP 4ff9 |
0x4cba MOV -0x50(%RBP),%R8 |
0x4cbe SHR $0x2,%R8 |
0x4cc2 XOR %R9D,%R9D |
0x4cc5 JMP 4cf9 |
0x4cc7 NOPW (%RAX,%RAX,1) |
(46) 0x4cd0 CQTO |
(46) 0x4cd2 IDIV %R15 |
(46) 0x4cd5 IMUL %R10,%RCX |
(46) 0x4cd9 ADD %RSI,%RCX |
(46) 0x4cdc MOV (%R13,%RCX,8),%RCX |
(46) 0x4ce1 IMUL %R10,%RDX |
(46) 0x4ce5 ADD %RAX,%RDX |
(46) 0x4ce8 ADD %RCX,(%R13,%RDX,8) |
(46) 0x4ced INC %R9 |
(46) 0x4cf0 CMP %R9,%R8 |
(46) 0x4cf3 JE 47eb |
(46) 0x4cf9 MOV (%R12),%R10 |
(46) 0x4cfd MOV %R10,%R11 |
(46) 0x4d00 IMUL %R9,%R11 |
(46) 0x4d04 LEA -0x1(%R10,%R11,4),%RAX |
(46) 0x4d09 MOV %RAX,%RCX |
(46) 0x4d0c OR %R15,%RCX |
(46) 0x4d0f SHR $0x20,%RCX |
(46) 0x4d13 JE 4d30 |
(46) 0x4d15 CQTO |
(46) 0x4d17 IDIV %R15 |
(46) 0x4d1a MOV %RDX,%RCX |
(46) 0x4d1d MOV %RAX,%RSI |
(46) 0x4d20 JMP 4d39 |
0x4d22 NOPW %CS:(%RAX,%RAX,1) |
(46) 0x4d30 XOR %EDX,%EDX |
(46) 0x4d32 DIV %R15D |
(46) 0x4d35 MOV %EDX,%ECX |
(46) 0x4d37 MOV %EAX,%ESI |
(46) 0x4d39 SAL $0x2,%R11 |
(46) 0x4d3d LEA -0x1(%R11,%R10,2),%RAX |
(46) 0x4d42 MOV %RAX,%RDX |
(46) 0x4d45 OR %R15,%RDX |
(46) 0x4d48 SHR $0x20,%RDX |
(46) 0x4d4c JE 4d60 |
(46) 0x4d4e CQTO |
(46) 0x4d50 IDIV %R15 |
(46) 0x4d53 JMP 4d65 |
0x4d55 NOPW %CS:(%RAX,%RAX,1) |
(46) 0x4d60 XOR %EDX,%EDX |
(46) 0x4d62 DIV %R15D |
(46) 0x4d65 IMUL %R10,%RCX |
(46) 0x4d69 ADD %RSI,%RCX |
(46) 0x4d6c MOV (%R13,%RCX,8),%RCX |
(46) 0x4d71 IMUL %R10,%RDX |
(46) 0x4d75 ADD %RAX,%RDX |
(46) 0x4d78 ADD %RCX,(%R13,%RDX,8) |
(46) 0x4d7d MOV (%R12),%R10 |
(46) 0x4d81 MOV %R10,%R11 |
(46) 0x4d84 IMUL %R9,%R11 |
(46) 0x4d88 SAL $0x2,%R11 |
(46) 0x4d8c LEA -0x1(%R11,%R10,2),%RAX |
(46) 0x4d91 MOV %RAX,%RCX |
(46) 0x4d94 OR %R15,%RCX |
(46) 0x4d97 SHR $0x20,%RCX |
(46) 0x4d9b JE 4db0 |
(46) 0x4d9d CQTO |
(46) 0x4d9f IDIV %R15 |
(46) 0x4da2 MOV %RDX,%RCX |
(46) 0x4da5 MOV %RAX,%RSI |
(46) 0x4da8 JMP 4db9 |
0x4daa NOPW (%RAX,%RAX,1) |
(46) 0x4db0 XOR %EDX,%EDX |
(46) 0x4db2 DIV %R15D |
(46) 0x4db5 MOV %EDX,%ECX |
(46) 0x4db7 MOV %EAX,%ESI |
(46) 0x4db9 LEA (%R10,%R10,2),%RAX |
(46) 0x4dbd LEA -0x1(%R11,%RAX,1),%RAX |
(46) 0x4dc2 MOV %RAX,%RDX |
(46) 0x4dc5 OR %R15,%RDX |
(46) 0x4dc8 SHR $0x20,%RDX |
(46) 0x4dcc JE 4de0 |
(46) 0x4dce CQTO |
(46) 0x4dd0 IDIV %R15 |
(46) 0x4dd3 JMP 4de5 |
0x4dd5 NOPW %CS:(%RAX,%RAX,1) |
(46) 0x4de0 XOR %EDX,%EDX |
(46) 0x4de2 DIV %R15D |
(46) 0x4de5 IMUL %R10,%RCX |
(46) 0x4de9 ADD %RSI,%RCX |
(46) 0x4dec MOV (%R13,%RCX,8),%RCX |
(46) 0x4df1 IMUL %R10,%RDX |
(46) 0x4df5 ADD %RAX,%RDX |
(46) 0x4df8 ADD %RCX,(%R13,%RDX,8) |
(46) 0x4dfd MOV (%R12),%R10 |
(46) 0x4e01 LEA (%R10,%R10,2),%RAX |
(46) 0x4e05 LEA (,%R10,4),%RDI |
(46) 0x4e0d MOV %RDI,%R11 |
(46) 0x4e10 IMUL %R9,%R11 |
(46) 0x4e14 LEA -0x1(%R11,%RAX,1),%RAX |
(46) 0x4e19 MOV %RAX,%RCX |
(46) 0x4e1c OR %R15,%RCX |
(46) 0x4e1f SHR $0x20,%RCX |
(46) 0x4e23 JE 4e40 |
(46) 0x4e25 CQTO |
(46) 0x4e27 IDIV %R15 |
(46) 0x4e2a MOV %RDX,%RCX |
(46) 0x4e2d MOV %RAX,%RSI |
(46) 0x4e30 JMP 4e49 |
0x4e32 NOPW %CS:(%RAX,%RAX,1) |
(46) 0x4e40 XOR %EDX,%EDX |
(46) 0x4e42 DIV %R15D |
(46) 0x4e45 MOV %EDX,%ECX |
(46) 0x4e47 MOV %EAX,%ESI |
(46) 0x4e49 LEA -0x1(%RDI,%R11,1),%RAX |
(46) 0x4e4e MOV %RAX,%RDX |
(46) 0x4e51 OR %R15,%RDX |
(46) 0x4e54 SHR $0x20,%RDX |
(46) 0x4e58 JE 4e70 |
(46) 0x4e5a CQTO |
(46) 0x4e5c IDIV %R15 |
(46) 0x4e5f JMP 4e75 |
0x4e61 NOPW %CS:(%RAX,%RAX,1) |
(46) 0x4e70 XOR %EDX,%EDX |
(46) 0x4e72 DIV %R15D |
(46) 0x4e75 IMUL %R10,%RCX |
(46) 0x4e79 ADD %RSI,%RCX |
(46) 0x4e7c MOV (%R13,%RCX,8),%RCX |
(46) 0x4e81 IMUL %R10,%RDX |
(46) 0x4e85 ADD %RAX,%RDX |
(46) 0x4e88 ADD %RCX,(%R13,%RDX,8) |
(46) 0x4e8d MOV (%R12),%R10 |
(46) 0x4e91 LEA (,%R10,4),%R11 |
(46) 0x4e99 IMUL %R9,%R11 |
(46) 0x4e9d LEA -0x1(%R11,%R10,4),%RAX |
(46) 0x4ea2 MOV %RAX,%RCX |
(46) 0x4ea5 OR %R15,%RCX |
(46) 0x4ea8 SHR $0x20,%RCX |
(46) 0x4eac JE 4ec0 |
(46) 0x4eae CQTO |
(46) 0x4eb0 IDIV %R15 |
(46) 0x4eb3 MOV %RDX,%RCX |
(46) 0x4eb6 MOV %RAX,%RSI |
(46) 0x4eb9 JMP 4ec9 |
0x4ebb NOPL (%RAX,%RAX,1) |
(46) 0x4ec0 XOR %EDX,%EDX |
(46) 0x4ec2 DIV %R15D |
(46) 0x4ec5 MOV %EDX,%ECX |
(46) 0x4ec7 MOV %EAX,%ESI |
(46) 0x4ec9 LEA (%R10,%R10,4),%RAX |
(46) 0x4ecd LEA -0x1(%R11,%RAX,1),%RAX |
(46) 0x4ed2 MOV %RAX,%RDX |
(46) 0x4ed5 OR %R15,%RDX |
(46) 0x4ed8 SHR $0x20,%RDX |
(46) 0x4edc JNE 4cd0 |
(46) 0x4ee2 XOR %EDX,%EDX |
(46) 0x4ee4 DIV %R15D |
(46) 0x4ee7 JMP 4cd5 |
0x4eec LEA -0x1(%R10),%RAX |
(39) 0x4ef0 MOV -0x8(%RBX,%R10,8),%RSI |
(39) 0x4ef5 CMP %RSI,%RCX |
(39) 0x4ef8 JLE 4f2b |
(39) 0x4efa MOV -0x8(%R9,%RCX,8),%RSI |
(39) 0x4eff DEC %RCX |
(39) 0x4f02 MOV (%R12),%RDI |
(39) 0x4f06 IMUL %R14,%RDI |
(39) 0x4f0a ADD %RSI,%RDI |
(39) 0x4f0d LEA (%R13,%RDI,8),%RDI |
(39) 0x4f12 DECQ (%RDI) |
(39) 0x4f15 MOV (%R12),%RDI |
(39) 0x4f19 IMUL %R14,%RDI |
(39) 0x4f1d ADD %RSI,%RDI |
(39) 0x4f20 MOV (%R13,%RDI,8),%RSI |
(39) 0x4f25 MOV %RAX,(%R15,%RSI,8) |
(39) 0x4f29 JMP 4ef0 |
0x4f2b MOV %RSI,%RCX |
0x4f2e CMP %RDX,%R10 |
0x4f31 JNE 4f49 |
0x4f33 JMP 4ff9 |
0x4f38 NOPL (%RAX,%RAX,1) |
(36) 0x4f40 CMP %R8,%RAX |
(36) 0x4f43 JLE 4ff9 |
(36) 0x4f49 MOV -0x8(%RBX,%RAX,8),%RDX |
(36) 0x4f4e CMP %RDX,%RCX |
(36) 0x4f51 JLE 4f99 |
(36) 0x4f53 LEA -0x1(%RAX),%RSI |
(36) 0x4f57 NOPW (%RAX,%RAX,1) |
(38) 0x4f60 MOV -0x8(%R9,%RCX,8),%RDX |
(38) 0x4f65 DEC %RCX |
(38) 0x4f68 MOV (%R12),%RDI |
(38) 0x4f6c IMUL %R14,%RDI |
(38) 0x4f70 ADD %RDX,%RDI |
(38) 0x4f73 LEA (%R13,%RDI,8),%RDI |
(38) 0x4f78 DECQ (%RDI) |
(38) 0x4f7b MOV (%R12),%RDI |
(38) 0x4f7f IMUL %R14,%RDI |
(38) 0x4f83 ADD %RDX,%RDI |
(38) 0x4f86 MOV (%R13,%RDI,8),%RDX |
(38) 0x4f8b MOV %RSI,(%R15,%RDX,8) |
(38) 0x4f8f MOV -0x8(%RBX,%RAX,8),%RDX |
(38) 0x4f94 CMP %RDX,%RCX |
(38) 0x4f97 JG 4f60 |
(36) 0x4f99 MOV -0x10(%RBX,%RAX,8),%RCX |
(36) 0x4f9e ADD $-0x2,%RAX |
(36) 0x4fa2 CMP %RCX,%RDX |
(36) 0x4fa5 JLE 4f40 |
(36) 0x4fa7 NOPW (%RAX,%RAX,1) |
(37) 0x4fb0 MOV -0x8(%R9,%RDX,8),%RCX |
(37) 0x4fb5 DEC %RDX |
(37) 0x4fb8 MOV (%R12),%RSI |
(37) 0x4fbc IMUL %R14,%RSI |
(37) 0x4fc0 ADD %RCX,%RSI |
(37) 0x4fc3 LEA (%R13,%RSI,8),%RSI |
(37) 0x4fc8 DECQ (%RSI) |
(37) 0x4fcb MOV (%R12),%RSI |
(37) 0x4fcf IMUL %R14,%RSI |
(37) 0x4fd3 ADD %RCX,%RSI |
(37) 0x4fd6 MOV (%R13,%RSI,8),%RCX |
(37) 0x4fdb MOV %RAX,(%R15,%RCX,8) |
(37) 0x4fdf MOV (%RBX,%RAX,8),%RCX |
(37) 0x4fe3 CMP %RCX,%RDX |
(37) 0x4fe6 JG 4fb0 |
(36) 0x4fe8 JMP 4f40 |
0x4fed MOV %RDI,%RDX |
0x4ff0 MOV -0x30(%RBP),%RSI |
0x4ff4 CMP %R8,%RSI |
0x4ff7 JNE 5015 |
0x4ff9 ADD $0x48,%RSP |
0x4ffd POP %RBX |
0x4ffe POP %R12 |
0x5000 POP %R13 |
0x5002 POP %R14 |
0x5004 POP %R15 |
0x5006 POP %RBP |
0x5007 RET |
0x5008 NOPL (%RAX,%RAX,1) |
(40) 0x5010 CMP %R9,%RCX |
(40) 0x5013 JLE 4ff9 |
(40) 0x5015 MOV -0x8(%RBX,%RCX,8),%RSI |
(40) 0x501a CMP %RSI,%RDX |
(40) 0x501d JLE 5075 |
(40) 0x501f LEA -0x1(%RCX),%RDI |
(40) 0x5023 NOPW %CS:(%RAX,%RAX,1) |
(42) 0x5030 MOV -0x8(%R11,%RDX,8),%RSI |
(42) 0x5035 MOV (%R12),%R8 |
(42) 0x5039 IMUL %R14,%R8 |
(42) 0x503d ADD %RSI,%R8 |
(42) 0x5040 LEA (%R13,%R8,8),%R8 |
(42) 0x5045 DECQ (%R8) |
(42) 0x5048 MOV (%R12),%R8 |
(42) 0x504c IMUL %R14,%R8 |
(42) 0x5050 ADD %RSI,%R8 |
(42) 0x5053 VMOVSD -0x8(%R10,%RDX,8),%XMM0 |
(42) 0x505a DEC %RDX |
(42) 0x505d MOV (%R13,%R8,8),%RSI |
(42) 0x5062 VMOVSD %XMM0,(%RAX,%RSI,8) |
(42) 0x5067 MOV %RDI,(%R15,%RSI,8) |
(42) 0x506b MOV -0x8(%RBX,%RCX,8),%RSI |
(42) 0x5070 CMP %RSI,%RDX |
(42) 0x5073 JG 5030 |
(40) 0x5075 MOV -0x10(%RBX,%RCX,8),%RDX |
(40) 0x507a ADD $-0x2,%RCX |
(40) 0x507e CMP %RDX,%RSI |
(40) 0x5081 JLE 5010 |
(40) 0x5083 NOPW %CS:(%RAX,%RAX,1) |
(41) 0x5090 MOV -0x8(%R11,%RSI,8),%RDX |
(41) 0x5095 MOV (%R12),%RDI |
(41) 0x5099 IMUL %R14,%RDI |
(41) 0x509d ADD %RDX,%RDI |
(41) 0x50a0 LEA (%R13,%RDI,8),%RDI |
(41) 0x50a5 DECQ (%RDI) |
(41) 0x50a8 MOV (%R12),%RDI |
(41) 0x50ac IMUL %R14,%RDI |
(41) 0x50b0 ADD %RDX,%RDI |
(41) 0x50b3 VMOVSD -0x8(%R10,%RSI,8),%XMM0 |
(41) 0x50ba DEC %RSI |
(41) 0x50bd MOV (%R13,%RDI,8),%RDX |
(41) 0x50c2 VMOVSD %XMM0,(%RAX,%RDX,8) |
(41) 0x50c7 MOV %RCX,(%R15,%RDX,8) |
(41) 0x50cb MOV (%RBX,%RCX,8),%RDX |
(41) 0x50cf CMP %RDX,%RSI |
(41) 0x50d2 JG 5090 |
(40) 0x50d4 JMP 5010 |
0x50d9 NOPL (%RAX) |
Path / |
Source file and lines | csr_matop.c:380-560 |
Module | libseq_mv.so |
nb instructions | 321 |
nb uops | 363 |
loop length | 1318 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 14 |
micro-operation queue | 60.67 cycles |
front end | 60.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 20.70 | 28.00 | 24.33 | 24.33 | 21.00 | 20.80 | 20.70 | 21.00 | 21.00 | 21.00 | 20.80 | 24.33 |
cycles | 20.70 | 36.40 | 24.33 | 24.33 | 21.00 | 20.80 | 20.70 | 21.00 | 21.00 | 21.00 | 20.80 | 24.33 |
Cycles executing div or sqrt instructions | 48.00 |
FE+BE cycles | 55.91-55.97 |
Stall cycles | 0.00 |
Front-end | 60.67 |
Dispatch | 36.40 |
DIV/SQRT | 48.00 |
Overall L1 | 60.67 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 0% |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x48,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R8,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 3170 <hypre_NumActiveThreads@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 3080 <hypre_GetThreadNum@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 3080 <hypre_GetThreadNum@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%R13),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R13),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R13),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 3170 <hypre_NumActiveThreads@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x1(%R12,%RAX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %RCX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE 4560 <hypre_CSRMatrixTranspose.extracted+0x70> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %RCX | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
JMP 4564 <hypre_CSRMatrixTranspose.extracted+0x74> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %ECX | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV -0x38(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RDI,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 459a <hypre_CSRMatrixTranspose.extracted+0xaa> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RDI,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 45a2 <hypre_CSRMatrixTranspose.extracted+0xb2> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x48(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R12,%RDX,8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
IMUL %RDI,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 3140 <hypre_LowerBound@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
SUB %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SAR $0x3,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RAX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 45a2 <hypre_CSRMatrixTranspose.extracted+0xb2> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOVQ $0,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 3080 <hypre_GetThreadNum@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%R13),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R13),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R13),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 3170 <hypre_NumActiveThreads@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x1(%R12,%RAX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %RCX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE 45db <hypre_CSRMatrixTranspose.extracted+0xeb> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %RCX | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
JMP 45df <hypre_CSRMatrixTranspose.extracted+0xef> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %ECX | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV -0x38(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x30(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RDI,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 461e <hypre_CSRMatrixTranspose.extracted+0x12e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INC %RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RDI,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4620 <hypre_CSRMatrixTranspose.extracted+0x130> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x48(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R12,%RSI,8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
IMUL %RDI,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 3140 <hypre_LowerBound@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x38(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R12,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SAR $0x3,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JMP 4620 <hypre_CSRMatrixTranspose.extracted+0x130> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4668 <hypre_CSRMatrixTranspose.extracted+0x178> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xc9b0(%RIP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x7d33(%RIP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x7cd4(%RIP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 31e0 <hypre_fprintf@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x7a11(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x1d7,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 3220 <hypre_error_handler@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x30(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4676 <hypre_CSRMatrixTranspose.extracted+0x186> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RAX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 46b7 <hypre_CSRMatrixTranspose.extracted+0x1c7> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0xc960(%RIP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x7ce3(%RIP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x7a52(%RIP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 31e0 <hypre_fprintf@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x79c1(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x1d8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 3220 <hypre_error_handler@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x30(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RSI,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 46c9 <hypre_CSRMatrixTranspose.extracted+0x1d9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4700 <hypre_CSRMatrixTranspose.extracted+0x210> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xc910(%RIP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x7c93(%RIP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x7a25(%RIP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 31e0 <hypre_fprintf@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x7971(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x1d9,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 3220 <hypre_error_handler@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%R12),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%R13,%RAX,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 30b0 <__intel_avx_rep_memset@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x30(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX,%RAX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP (%RBX,%RSI,8),%RAX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JGE 475d <hypre_CSRMatrixTranspose.extracted+0x26d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0xc9f6(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 31d0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%R12),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA 0x1(%R14),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x1(%RCX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R9,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R11,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 48cb <hypre_CSRMatrixTranspose.extracted+0x3db> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R11,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x40(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R15),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0xc9d8(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 31d0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%R15),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x60(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0xc9e5(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 30c0 <__kmpc_masked@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
CMP $0x1,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4a25 <hypre_CSRMatrixTranspose.extracted+0x535> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP $0x1,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x40(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4a16 <hypre_CSRMatrixTranspose.extracted+0x526> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%R15),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP $0x4,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 4cba <hypre_CSRMatrixTranspose.extracted+0x7ca> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RAX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x40(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JAE 4a16 <hypre_CSRMatrixTranspose.extracted+0x526> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INC %R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 4836 <hypre_CSRMatrixTranspose.extracted+0x346> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV (%R9),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0xc7a0(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 30d0 <__kmpc_end_masked@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0xc7ae(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 31d0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV -0x48(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4bb2 <hypre_CSRMatrixTranspose.extracted+0x6c2> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %RDI,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA -0x1(%RCX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %R15,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE 4a66 <hypre_CSRMatrixTranspose.extracted+0x576> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %R15 | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
JMP 4a6b <hypre_CSRMatrixTranspose.extracted+0x57b> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %R15D | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV %RDI,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R8,%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
DEC %RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RSI,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4bb2 <hypre_CSRMatrixTranspose.extracted+0x6c2> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
IMUL %RDI,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RAX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV (%R13,%RDX,8),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4abc <hypre_CSRMatrixTranspose.extracted+0x5cc> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x30(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0xc63d(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 31d0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
CMPQ $0,-0x68(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 4c0f <hypre_CSRMatrixTranspose.extracted+0x71f> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x38(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R9,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x58(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4ff9 <hypre_CSRMatrixTranspose.extracted+0xb09> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x28(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX,%RSI,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %ESI,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R9D,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA 0x1(%R9),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST $0x1,%CL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 4c42 <hypre_CSRMatrixTranspose.extracted+0x752> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RSI,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %R8,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 5015 <hypre_CSRMatrixTranspose.extracted+0xb25> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4ff9 <hypre_CSRMatrixTranspose.extracted+0xb09> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x38(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R8,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x10(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4ff9 <hypre_CSRMatrixTranspose.extracted+0xb09> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%RBX,%R10,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R10D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R8D,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA 0x1(%R8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST $0x1,%AL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 4eec <hypre_CSRMatrixTranspose.extracted+0x9fc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R10,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 4f2e <hypre_CSRMatrixTranspose.extracted+0xa3e> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
LEA -0x1(%RSI),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x8(%RBX,%RSI,8),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDI,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4fed <hypre_CSRMatrixTranspose.extracted+0xafd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R8,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x30(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x40(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R8,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 5015 <hypre_CSRMatrixTranspose.extracted+0xb25> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4ff9 <hypre_CSRMatrixTranspose.extracted+0xb09> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x50(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SHR $0x2,%R8 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4cf9 <hypre_CSRMatrixTranspose.extracted+0x809> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x1(%R10),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RDX,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4f49 <hypre_CSRMatrixTranspose.extracted+0xa59> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4ff9 <hypre_CSRMatrixTranspose.extracted+0xb09> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x30(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R8,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 5015 <hypre_CSRMatrixTranspose.extracted+0xb25> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x48,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | csr_matop.c:380-560 |
Module | libseq_mv.so |
nb instructions | 321 |
nb uops | 363 |
loop length | 1318 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 14 |
micro-operation queue | 60.67 cycles |
front end | 60.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 20.70 | 28.00 | 24.33 | 24.33 | 21.00 | 20.80 | 20.70 | 21.00 | 21.00 | 21.00 | 20.80 | 24.33 |
cycles | 20.70 | 36.40 | 24.33 | 24.33 | 21.00 | 20.80 | 20.70 | 21.00 | 21.00 | 21.00 | 20.80 | 24.33 |
Cycles executing div or sqrt instructions | 48.00 |
FE+BE cycles | 55.91-55.97 |
Stall cycles | 0.00 |
Front-end | 60.67 |
Dispatch | 36.40 |
DIV/SQRT | 48.00 |
Overall L1 | 60.67 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 0% |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x48,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R8,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 3170 <hypre_NumActiveThreads@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 3080 <hypre_GetThreadNum@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 3080 <hypre_GetThreadNum@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%R13),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R13),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R13),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 3170 <hypre_NumActiveThreads@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x1(%R12,%RAX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %RCX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE 4560 <hypre_CSRMatrixTranspose.extracted+0x70> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %RCX | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
JMP 4564 <hypre_CSRMatrixTranspose.extracted+0x74> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %ECX | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV -0x38(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RDI,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 459a <hypre_CSRMatrixTranspose.extracted+0xaa> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RDI,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 45a2 <hypre_CSRMatrixTranspose.extracted+0xb2> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x48(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R12,%RDX,8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
IMUL %RDI,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 3140 <hypre_LowerBound@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
SUB %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SAR $0x3,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RAX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 45a2 <hypre_CSRMatrixTranspose.extracted+0xb2> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOVQ $0,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 3080 <hypre_GetThreadNum@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%R13),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R13),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R13),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 3170 <hypre_NumActiveThreads@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x1(%R12,%RAX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %RCX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE 45db <hypre_CSRMatrixTranspose.extracted+0xeb> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %RCX | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
JMP 45df <hypre_CSRMatrixTranspose.extracted+0xef> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %ECX | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV -0x38(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x30(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RDI,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 461e <hypre_CSRMatrixTranspose.extracted+0x12e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INC %RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RDI,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4620 <hypre_CSRMatrixTranspose.extracted+0x130> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x48(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R12,%RSI,8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
IMUL %RDI,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 3140 <hypre_LowerBound@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x38(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R12,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SAR $0x3,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JMP 4620 <hypre_CSRMatrixTranspose.extracted+0x130> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4668 <hypre_CSRMatrixTranspose.extracted+0x178> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xc9b0(%RIP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x7d33(%RIP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x7cd4(%RIP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 31e0 <hypre_fprintf@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x7a11(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x1d7,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 3220 <hypre_error_handler@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x30(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4676 <hypre_CSRMatrixTranspose.extracted+0x186> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RAX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 46b7 <hypre_CSRMatrixTranspose.extracted+0x1c7> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0xc960(%RIP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x7ce3(%RIP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x7a52(%RIP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 31e0 <hypre_fprintf@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x79c1(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x1d8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 3220 <hypre_error_handler@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x30(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RSI,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 46c9 <hypre_CSRMatrixTranspose.extracted+0x1d9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4700 <hypre_CSRMatrixTranspose.extracted+0x210> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xc910(%RIP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x7c93(%RIP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x7a25(%RIP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 31e0 <hypre_fprintf@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x7971(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x1d9,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 3220 <hypre_error_handler@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%R12),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%R13,%RAX,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 30b0 <__intel_avx_rep_memset@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x30(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX,%RAX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP (%RBX,%RSI,8),%RAX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JGE 475d <hypre_CSRMatrixTranspose.extracted+0x26d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0xc9f6(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 31d0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%R12),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA 0x1(%R14),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x1(%RCX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R9,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R11,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 48cb <hypre_CSRMatrixTranspose.extracted+0x3db> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R11,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x40(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R15),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0xc9d8(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 31d0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%R15),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x60(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0xc9e5(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 30c0 <__kmpc_masked@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
CMP $0x1,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4a25 <hypre_CSRMatrixTranspose.extracted+0x535> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP $0x1,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x40(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4a16 <hypre_CSRMatrixTranspose.extracted+0x526> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%R15),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP $0x4,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 4cba <hypre_CSRMatrixTranspose.extracted+0x7ca> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RAX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x40(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JAE 4a16 <hypre_CSRMatrixTranspose.extracted+0x526> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INC %R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 4836 <hypre_CSRMatrixTranspose.extracted+0x346> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV (%R9),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0xc7a0(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 30d0 <__kmpc_end_masked@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0xc7ae(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 31d0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV -0x48(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4bb2 <hypre_CSRMatrixTranspose.extracted+0x6c2> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %RDI,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA -0x1(%RCX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %R15,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE 4a66 <hypre_CSRMatrixTranspose.extracted+0x576> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %R15 | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
JMP 4a6b <hypre_CSRMatrixTranspose.extracted+0x57b> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %R15D | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV %RDI,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R8,%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
DEC %RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RSI,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4bb2 <hypre_CSRMatrixTranspose.extracted+0x6c2> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
IMUL %RDI,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RAX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV (%R13,%RDX,8),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4abc <hypre_CSRMatrixTranspose.extracted+0x5cc> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x30(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0xc63d(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 31d0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
CMPQ $0,-0x68(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 4c0f <hypre_CSRMatrixTranspose.extracted+0x71f> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x38(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R9,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x58(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4ff9 <hypre_CSRMatrixTranspose.extracted+0xb09> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x28(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX,%RSI,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %ESI,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R9D,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA 0x1(%R9),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST $0x1,%CL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 4c42 <hypre_CSRMatrixTranspose.extracted+0x752> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RSI,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %R8,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 5015 <hypre_CSRMatrixTranspose.extracted+0xb25> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4ff9 <hypre_CSRMatrixTranspose.extracted+0xb09> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x38(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R8,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x10(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JLE 4ff9 <hypre_CSRMatrixTranspose.extracted+0xb09> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%RBX,%R10,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R10D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R8D,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA 0x1(%R8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
TEST $0x1,%AL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 4eec <hypre_CSRMatrixTranspose.extracted+0x9fc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R10,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 4f2e <hypre_CSRMatrixTranspose.extracted+0xa3e> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
LEA -0x1(%RSI),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x8(%RBX,%RSI,8),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDI,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4fed <hypre_CSRMatrixTranspose.extracted+0xafd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R8,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x30(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x40(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R8,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 5015 <hypre_CSRMatrixTranspose.extracted+0xb25> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4ff9 <hypre_CSRMatrixTranspose.extracted+0xb09> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x50(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SHR $0x2,%R8 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4cf9 <hypre_CSRMatrixTranspose.extracted+0x809> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x1(%R10),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RDX,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4f49 <hypre_CSRMatrixTranspose.extracted+0xa59> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4ff9 <hypre_CSRMatrixTranspose.extracted+0xb09> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x30(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R8,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 5015 <hypre_CSRMatrixTranspose.extracted+0xb25> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x48,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_CSRMatrixTranspose.extracted– | 0.2 | 0.04 |
▼Loop 40 - csr_matop.c:540-548 - libseq_mv.so– | 0.03 | 0.01 |
○Loop 42 - csr_matop.c:541-548 - libseq_mv.so | 0.07 | 0.01 |
○Loop 41 - csr_matop.c:541-548 - libseq_mv.so | 0.07 | 0.01 |
○Loop 48 - csr_matop.c:483-485 - libseq_mv.so | 0.02 | 0.01 |
○Loop 47 - csr_matop.c:380-500 - libseq_mv.so | 0.01 | 0.01 |
▼Loop 36 - csr_matop.c:553-560 - libseq_mv.so– | 0.01 | 0.01 |
○Loop 38 - csr_matop.c:554-560 - libseq_mv.so | 0 | 0 |
○Loop 37 - csr_matop.c:554-560 - libseq_mv.so | 0 | 0.01 |
○Loop 44 - csr_matop.c:380-527 - libseq_mv.so | 0.01 | 0.01 |
○Loop 46 - csr_matop.c:380-513 - libseq_mv.so | 0 | 0 |
○Loop 45 - csr_matop.c:380-513 - libseq_mv.so | 0 | 0 |
○Loop 43 - csr_matop.c:541-548 - libseq_mv.so | 0 | 0 |
○Loop 39 - csr_matop.c:554-560 - libseq_mv.so | 0 | 0 |