Loop Id: 4035 | Module: exec | Source: IJMatrix_parcsr.c:3262-3484 [...] | Coverage: 0.05% |
---|
Loop Id: 4035 | Module: exec | Source: IJMatrix_parcsr.c:3262-3484 [...] | Coverage: 0.05% |
---|
0x4d3a61 SAL $0x3,%RDX |
0x4d3a65 MOV %R12,-0x88(%RBP) |
0x4d3a6c MOV %R13,%RSI |
0x4d3a6f MOV %RDX,%R12 |
0x4d3a72 CALL 4efd90 <_intel_fast_memcpy> |
0x4d3a77 MOV %R14,%RDI |
0x4d3a7a MOV -0x88(%RBP),%RSI |
0x4d3a81 MOV %R12,%RDX |
0x4d3a84 CALL 4efd90 <_intel_fast_memcpy> |
0x4d3a89 MOV %R13,%RDI |
0x4d3a8c VZEROUPPER |
0x4d3a8f CALL 4e6e50 <hypre_Free> |
0x4d3a94 MOV -0x88(%RBP),%RDI |
0x4d3a9b CALL 4e6e50 <hypre_Free> |
0x4d3aa0 XOR %EAX,%EAX |
0x4d3aa2 MOV %RAX,-0x88(%RBP) |
0x4d3aa9 MOV -0x60(%RBP),%RDX |
0x4d3aad MOV -0x48(%RBP),%RSI |
0x4d3ab1 MOV -0x68(%RBP),%R9 |
0x4d3ab5 MOV -0x50(%RBP),%R8 |
0x4d3ab9 MOV 0x20(%RBP),%RAX |
0x4d3abd INC %R9 |
0x4d3ac0 CMP %R8,%R9 |
0x4d3ac3 JGE 4d4533 |
0x4d3ac9 MOV (%RDX,%R9,8),%R13 |
0x4d3acd MOV (%RSI,%R9,8),%R14 |
0x4d3ad1 MOV %R13,-0x58(%RBP) |
0x4d3ad5 SUB (%RAX),%R13 |
0x4d3ad8 JL 4d3b90 |
0x4d3ade MOV -0x58(%RBP),%RCX |
0x4d3ae2 CMP 0x8(%RAX),%RCX |
0x4d3ae6 JGE 4d3b90 |
0x4d3aec CMPQ $0,0x58(%RBP) |
0x4d3af1 MOV %R13,-0x38(%RBP) |
0x4d3af5 JE 4d3d48 |
0x4d3afb MOV 0x38(%RBP),%RAX |
0x4d3aff MOV (%RAX,%R13,8),%R12 |
0x4d3b03 MOV 0x40(%RBP),%RAX |
0x4d3b07 MOV (%RAX,%R13,8),%RAX |
0x4d3b0b MOV %RAX,-0x70(%RBP) |
0x4d3b0f MOV 0x50(%RBP),%RAX |
0x4d3b13 MOV (%RAX,%R13,8),%RCX |
0x4d3b17 MOV 0x48(%RBP),%RAX |
0x4d3b1b MOV (%RAX,%R13,8),%R13 |
0x4d3b1f MOV %RCX,-0x80(%RBP) |
0x4d3b23 MOV %RCX,%RAX |
0x4d3b26 SUB %R13,%RAX |
0x4d3b29 MOV %R14,%RDI |
0x4d3b2c SUB %RAX,%RDI |
0x4d3b2f MOV %R9,-0x68(%RBP) |
0x4d3b33 JLE 4d40f2 |
0x4d3b39 MOV $0x8,%ESI |
0x4d3b3e MOV %RDI,-0x58(%RBP) |
0x4d3b42 VZEROUPPER |
0x4d3b45 CALL 4e6d80 <hypre_CAlloc> |
0x4d3b4a MOV %RAX,-0x78(%RBP) |
0x4d3b4e MOV $0x8,%ESI |
0x4d3b53 MOV -0x58(%RBP),%RDI |
0x4d3b57 CALL 4e6d80 <hypre_CAlloc> |
0x4d3b5c MOV %RAX,-0x88(%RBP) |
0x4d3b63 MOV -0x30(%RBP),%RDI |
0x4d3b67 TEST %R14,%R14 |
0x4d3b6a JG 4d4105 |
0x4d3b70 MOV 0x48(%RBP),%RAX |
0x4d3b74 MOV -0x38(%RBP),%RCX |
0x4d3b78 MOV %R13,(%RAX,%RCX,8) |
0x4d3b7c JMP 4d43f6 |
0x4d3b90 ADD %R14,-0x30(%RBP) |
0x4d3b94 CMPB $0,-0x39(%RBP) |
0x4d3b98 JNE 4d3abd |
0x4d3b9e TEST %R14,%R14 |
0x4d3ba1 JLE 4d3abd |
0x4d3ba7 MOV %R9,-0x68(%RBP) |
0x4d3bab DEC %R14 |
0x4d3bae XOR %ECX,%ECX |
0x4d3bb0 XOR %EAX,%EAX |
0x4d3bb2 JMP 4d3bd4 |
(4036) 0x4d3bc0 LEA 0x1(%RAX),%RDX |
(4036) 0x4d3bc4 CMP -0xb8(%RBP),%RAX |
(4036) 0x4d3bcb MOV %RDX,%RAX |
(4036) 0x4d3bce JE 4d3aa9 |
(4036) 0x4d3bd4 MOV %RCX,%R9 |
(4036) 0x4d3bd7 MOV %RAX,%RSI |
(4036) 0x4d3bda SAL $0x4,%RSI |
(4036) 0x4d3bde MOV 0xa0(%RBP),%RDI |
(4036) 0x4d3be5 MOV 0x8(%RDI,%RSI,1),%RDX |
(4036) 0x4d3bea ADD %RDX,%RCX |
(4036) 0x4d3bed MOV -0x58(%RBP),%R8 |
(4036) 0x4d3bf1 CMP %R8,(%RDI,%RSI,1) |
(4036) 0x4d3bf5 JNE 4d3bc0 |
(4036) 0x4d3bf7 TEST %RDX,%RDX |
(4036) 0x4d3bfa JLE 4d3bc0 |
(4036) 0x4d3bfc MOV 0xa8(%RBP),%RSI |
(4036) 0x4d3c03 LEA -0x8(%RSI,%RCX,8),%RDI |
(4036) 0x4d3c08 LEA (%RSI,%R9,8),%RSI |
(4036) 0x4d3c0c CMP %R15,%RDI |
(4036) 0x4d3c0f JB 4d3c60 |
(4036) 0x4d3c11 CMP %RSI,%R15 |
(4036) 0x4d3c14 JB 4d3c60 |
(4036) 0x4d3c16 XOR %EDI,%EDI |
(4036) 0x4d3c18 JMP 4d3c2c |
(4040) 0x4d3c20 LEA 0x1(%RDI),%R8 |
(4040) 0x4d3c24 CMP %R14,%RDI |
(4040) 0x4d3c27 MOV %R8,%RDI |
(4040) 0x4d3c2a JE 4d3bc0 |
(4040) 0x4d3c2c MOV (%RBX,%RDI,8),%R8 |
(4040) 0x4d3c30 XOR %R9D,%R9D |
(4040) 0x4d3c33 JMP 4d3c48 |
(4041) 0x4d3c40 INC %R9 |
(4041) 0x4d3c43 CMP %R9,%RDX |
(4041) 0x4d3c46 JE 4d3c20 |
(4041) 0x4d3c48 CMP %R8,(%RSI,%R9,8) |
(4041) 0x4d3c4c JNE 4d3c40 |
(4041) 0x4d3c4e MOVQ $-0x1,(%RSI,%R9,8) |
(4041) 0x4d3c56 INCQ (%R15) |
(4041) 0x4d3c59 JMP 4d3c40 |
(4036) 0x4d3c60 MOV %RDX,%RDI |
(4036) 0x4d3c63 SHR $0x2,%RDI |
(4036) 0x4d3c67 MOV %RDX,%R8 |
(4036) 0x4d3c6a AND $-0x4,%R8 |
(4036) 0x4d3c6e MOV -0xb0(%RBP),%R10 |
(4036) 0x4d3c75 LEA (%R10,%R9,8),%R13 |
(4036) 0x4d3c79 XOR %R10D,%R10D |
(4036) 0x4d3c7c JMP 4d3c90 |
(4037) 0x4d3c80 LEA 0x1(%R10),%R9 |
(4037) 0x4d3c84 CMP %R14,%R10 |
(4037) 0x4d3c87 MOV %R9,%R10 |
(4037) 0x4d3c8a JE 4d3bc0 |
(4037) 0x4d3c90 MOV (%RBX,%R10,8),%R11 |
(4037) 0x4d3c94 CMP $0x4,%RDX |
(4037) 0x4d3c98 JAE 4d3cd0 |
(4037) 0x4d3c9a CMP %RDX,%R8 |
(4037) 0x4d3c9d JAE 4d3c80 |
(4037) 0x4d3c9f MOV %R8,%R9 |
(4037) 0x4d3ca2 JMP 4d3cb8 |
(4038) 0x4d3cb0 INC %R9 |
(4038) 0x4d3cb3 CMP %R9,%RDX |
(4038) 0x4d3cb6 JE 4d3c80 |
(4038) 0x4d3cb8 CMP %R11,(%RSI,%R9,8) |
(4038) 0x4d3cbc JNE 4d3cb0 |
(4038) 0x4d3cbe MOVQ $-0x1,(%RSI,%R9,8) |
(4038) 0x4d3cc6 INCQ (%R15) |
(4038) 0x4d3cc9 JMP 4d3cb0 |
(4037) 0x4d3cd0 MOV %RDI,%R12 |
(4037) 0x4d3cd3 MOV %R13,%R9 |
(4037) 0x4d3cd6 JMP 4d3ce9 |
(4039) 0x4d3ce0 ADD $0x20,%R9 |
(4039) 0x4d3ce4 DEC %R12 |
(4039) 0x4d3ce7 JE 4d3c9a |
(4039) 0x4d3ce9 CMP %R11,-0x18(%R9) |
(4039) 0x4d3ced JNE 4d3d20 |
(4039) 0x4d3cef MOVQ $-0x1,-0x18(%R9) |
(4039) 0x4d3cf7 INCQ (%R15) |
(4039) 0x4d3cfa CMP %R11,-0x10(%R9) |
(4039) 0x4d3cfe JE 4d3d26 |
(4039) 0x4d3d00 CMP %R11,-0x8(%R9) |
(4039) 0x4d3d04 JNE 4d3d37 |
(4039) 0x4d3d06 MOVQ $-0x1,-0x8(%R9) |
(4039) 0x4d3d0e INCQ (%R15) |
(4039) 0x4d3d11 CMP %R11,(%R9) |
(4039) 0x4d3d14 JNE 4d3ce0 |
(4039) 0x4d3d16 JMP 4d3d3c |
(4039) 0x4d3d20 CMP %R11,-0x10(%R9) |
(4039) 0x4d3d24 JNE 4d3d00 |
(4039) 0x4d3d26 MOVQ $-0x1,-0x10(%R9) |
(4039) 0x4d3d2e INCQ (%R15) |
(4039) 0x4d3d31 CMP %R11,-0x8(%R9) |
(4039) 0x4d3d35 JE 4d3d06 |
(4039) 0x4d3d37 CMP %R11,(%R9) |
(4039) 0x4d3d3a JNE 4d3ce0 |
(4039) 0x4d3d3c MOVQ $-0x1,(%R9) |
(4039) 0x4d3d43 INCQ (%R15) |
(4039) 0x4d3d46 JMP 4d3ce0 |
0x4d3d48 MOV 0x18(%RBP),%RCX |
0x4d3d4c MOV 0x38(%RCX),%RAX |
0x4d3d50 MOV 0x40(%RCX),%RCX |
0x4d3d54 MOV (%RCX,%R13,8),%R11 |
0x4d3d58 MOV (%RAX,%R13,8),%R10 |
0x4d3d5c TEST %R14,%R14 |
0x4d3d5f JLE 4d4408 |
0x4d3d65 MOV %R9,-0x68(%RBP) |
0x4d3d69 MOV 0x60(%RBP),%RAX |
0x4d3d6d MOV 0x8(%RAX,%R13,8),%RAX |
0x4d3d72 MOV %RAX,-0x78(%RBP) |
0x4d3d76 MOV 0x78(%RBP),%RAX |
0x4d3d7a MOV 0x8(%RAX,%R13,8),%RAX |
0x4d3d7f MOV %RAX,-0x98(%RBP) |
0x4d3d86 MOV -0x30(%RBP),%RDI |
0x4d3d8a LEA (%RDI,%R14,1),%RAX |
0x4d3d8e MOV %RAX,-0xa0(%RBP) |
0x4d3d95 XOR %R8D,%R8D |
0x4d3d98 MOV %R11,-0x80(%RBP) |
0x4d3d9c MOV %R10,-0x90(%RBP) |
0x4d3da3 MOV %R10,-0x70(%RBP) |
0x4d3da7 MOV %R11,%RCX |
0x4d3daa JMP 4d3dc6 |
(4042) 0x4d3db0 MOV -0x38(%RBP),%R13 |
(4042) 0x4d3db4 MOV %RCX,%R11 |
(4042) 0x4d3db7 INC %RDI |
(4042) 0x4d3dba INC %R8 |
(4042) 0x4d3dbd CMP %R14,%R8 |
(4042) 0x4d3dc0 JE 4d4410 |
(4042) 0x4d3dc6 MOV (%RBX,%RDI,8),%R9 |
(4042) 0x4d3dca CMP 0x28(%RBP),%R9 |
(4042) 0x4d3dce JL 4d3f20 |
(4042) 0x4d3dd4 CMP 0x30(%RBP),%R9 |
(4042) 0x4d3dd8 JG 4d3f20 |
(4042) 0x4d3dde MOV 0x60(%RBP),%RAX |
(4042) 0x4d3de2 MOV (%RAX,%R13,8),%R10 |
(4042) 0x4d3de6 MOV -0x90(%RBP),%R11 |
(4042) 0x4d3ded SUB %R10,%R11 |
(4042) 0x4d3df0 JLE 4d3ee0 |
(4042) 0x4d3df6 MOV 0x68(%RBP),%RAX |
(4042) 0x4d3dfa LEA (%RAX,%R10,8),%EAX |
(4042) 0x4d3dfe AND $0x7f,%EAX |
(4042) 0x4d3e01 MOV $0x80,%EDX |
(4042) 0x4d3e06 SUB %EAX,%EDX |
(4042) 0x4d3e08 SHR $0x3,%EDX |
(4042) 0x4d3e0b CMP %RDX,%R11 |
(4042) 0x4d3e0e MOV %RDX,%RSI |
(4042) 0x4d3e11 CMOVB %R11,%RSI |
(4042) 0x4d3e15 TEST %RSI,%RSI |
(4042) 0x4d3e18 JE 4d3e37 |
(4042) 0x4d3e1a MOV %R10,%R12 |
(4042) 0x4d3e1d MOV %RSI,%RAX |
(4048) 0x4d3e20 MOV 0x68(%RBP),%R13 |
(4048) 0x4d3e24 CMP %R9,(%R13,%R12,8) |
(4048) 0x4d3e29 JE 4d4087 |
(4048) 0x4d3e2f INC %R12 |
(4048) 0x4d3e32 DEC %RAX |
(4048) 0x4d3e35 JNE 4d3e20 |
(4042) 0x4d3e37 CMP %RDX,%R11 |
(4042) 0x4d3e3a JBE 4d3ee0 |
(4042) 0x4d3e40 MOV %RDI,-0x30(%RBP) |
(4042) 0x4d3e44 SUB %RSI,%R11 |
(4042) 0x4d3e47 MOV %R11,%R13 |
(4042) 0x4d3e4a AND $-0x10,%R13 |
(4042) 0x4d3e4e JE 4d3eaa |
(4042) 0x4d3e50 LEA -0x1(%R13),%RDI |
(4042) 0x4d3e54 LEA (%R10,%RSI,1),%R12 |
(4042) 0x4d3e58 VPBROADCASTQ %R9,%YMM0 |
(4042) 0x4d3e5e MOV 0x68(%RBP),%RAX |
(4042) 0x4d3e62 LEA (%RAX,%R12,8),%RAX |
(4042) 0x4d3e66 XOR %EDX,%EDX |
(4042) 0x4d3e68 NOPL (%RAX,%RAX,1) |
(4047) 0x4d3e70 VPCMPEQQ 0x20(%RAX,%RDX,8),%YMM0,%K0 |
(4047) 0x4d3e78 VPCMPEQQ (%RAX,%RDX,8),%YMM0,%K1 |
(4047) 0x4d3e7f VPCMPEQQ 0x60(%RAX,%RDX,8),%YMM0,%K2 |
(4047) 0x4d3e87 VPCMPEQQ 0x40(%RAX,%RDX,8),%YMM0,%K3 |
(4047) 0x4d3e8f KORB %K0,%K1,%K4 |
(4047) 0x4d3e93 KORB %K2,%K3,%K5 |
(4047) 0x4d3e97 KORTESTB %K5,%K4 |
(4047) 0x4d3e9b JNE 4d405d |
(4047) 0x4d3ea1 ADD $0x10,%RDX |
(4047) 0x4d3ea5 CMP %RDI,%RDX |
(4047) 0x4d3ea8 JBE 4d3e70 |
(4042) 0x4d3eaa CMP %R11,%R13 |
(4042) 0x4d3ead MOV -0x30(%RBP),%RDI |
(4042) 0x4d3eb1 JAE 4d3ee0 |
(4042) 0x4d3eb3 ADD %RSI,%R10 |
(4042) 0x4d3eb6 ADD %R13,%R10 |
(4042) 0x4d3eb9 MOV %R10,%R12 |
(4042) 0x4d3ebc NOPL (%RAX) |
(4046) 0x4d3ec0 MOV 0x68(%RBP),%RAX |
(4046) 0x4d3ec4 CMP %R9,(%RAX,%R12,8) |
(4046) 0x4d3ec8 JE 4d4087 |
(4046) 0x4d3ece INC %R12 |
(4046) 0x4d3ed1 CMP %R12,-0x90(%RBP) |
(4046) 0x4d3ed8 JNE 4d3ec0 |
(4042) 0x4d3eda NOPW (%RAX,%RAX,1) |
(4042) 0x4d3ee0 MOV -0x70(%RBP),%RDX |
(4042) 0x4d3ee4 CMP -0x78(%RBP),%RDX |
(4042) 0x4d3ee8 JGE 4d4452 |
(4042) 0x4d3eee MOV 0x68(%RBP),%RAX |
(4042) 0x4d3ef2 MOV %R9,(%RAX,%RDX,8) |
(4042) 0x4d3ef6 MOV 0x10(%RBP),%RAX |
(4042) 0x4d3efa VMOVQ (%RAX,%RDI,8),%XMM0 |
(4042) 0x4d3eff MOV 0x70(%RBP),%RAX |
(4042) 0x4d3f03 VMOVQ %XMM0,(%RAX,%RDX,8) |
(4042) 0x4d3f08 INC %RDX |
(4042) 0x4d3f0b MOV %RDX,-0x70(%RBP) |
(4042) 0x4d3f0f JMP 4d3db0 |
(4042) 0x4d3f20 MOV 0x78(%RBP),%RAX |
(4042) 0x4d3f24 MOV (%RAX,%R13,8),%R10 |
(4042) 0x4d3f28 SUB %R10,%R11 |
(4042) 0x4d3f2b JLE 4d4020 |
(4042) 0x4d3f31 MOV 0x80(%RBP),%RAX |
(4042) 0x4d3f38 LEA (%RAX,%R10,8),%EAX |
(4042) 0x4d3f3c AND $0x7f,%EAX |
(4042) 0x4d3f3f MOV $0x80,%EDX |
(4042) 0x4d3f44 SUB %EAX,%EDX |
(4042) 0x4d3f46 SHR $0x3,%EDX |
(4042) 0x4d3f49 CMP %RDX,%R11 |
(4042) 0x4d3f4c MOV %RDX,%RSI |
(4042) 0x4d3f4f CMOVB %R11,%RSI |
(4042) 0x4d3f53 TEST %RSI,%RSI |
(4042) 0x4d3f56 JE 4d3f7a |
(4042) 0x4d3f58 MOV %R10,%R12 |
(4042) 0x4d3f5b MOV %RSI,%RAX |
(4042) 0x4d3f5e XCHG %AX,%AX |
(4045) 0x4d3f60 MOV 0x80(%RBP),%R13 |
(4045) 0x4d3f67 CMP %R9,(%R13,%R12,8) |
(4045) 0x4d3f6c JE 4d40d0 |
(4045) 0x4d3f72 INC %R12 |
(4045) 0x4d3f75 DEC %RAX |
(4045) 0x4d3f78 JNE 4d3f60 |
(4042) 0x4d3f7a CMP %RDX,%R11 |
(4042) 0x4d3f7d JBE 4d4020 |
(4042) 0x4d3f83 MOV %RDI,-0x30(%RBP) |
(4042) 0x4d3f87 SUB %RSI,%R11 |
(4042) 0x4d3f8a MOV %R11,%R13 |
(4042) 0x4d3f8d AND $-0x10,%R13 |
(4042) 0x4d3f91 JE 4d3fea |
(4042) 0x4d3f93 LEA -0x1(%R13),%RDI |
(4042) 0x4d3f97 LEA (%R10,%RSI,1),%R12 |
(4042) 0x4d3f9b VPBROADCASTQ %R9,%YMM0 |
(4042) 0x4d3fa1 MOV 0x80(%RBP),%RAX |
(4042) 0x4d3fa8 LEA (%RAX,%R12,8),%RAX |
(4042) 0x4d3fac XOR %EDX,%EDX |
(4042) 0x4d3fae XCHG %AX,%AX |
(4044) 0x4d3fb0 VPCMPEQQ 0x20(%RAX,%RDX,8),%YMM0,%K0 |
(4044) 0x4d3fb8 VPCMPEQQ (%RAX,%RDX,8),%YMM0,%K1 |
(4044) 0x4d3fbf VPCMPEQQ 0x60(%RAX,%RDX,8),%YMM0,%K2 |
(4044) 0x4d3fc7 VPCMPEQQ 0x40(%RAX,%RDX,8),%YMM0,%K3 |
(4044) 0x4d3fcf KORB %K0,%K1,%K4 |
(4044) 0x4d3fd3 KORB %K2,%K3,%K5 |
(4044) 0x4d3fd7 KORTESTB %K5,%K4 |
(4044) 0x4d3fdb JNE 4d40a6 |
(4044) 0x4d3fe1 ADD $0x10,%RDX |
(4044) 0x4d3fe5 CMP %RDI,%RDX |
(4044) 0x4d3fe8 JBE 4d3fb0 |
(4042) 0x4d3fea CMP %R11,%R13 |
(4042) 0x4d3fed MOV -0x30(%RBP),%RDI |
(4042) 0x4d3ff1 JAE 4d4020 |
(4042) 0x4d3ff3 ADD %RSI,%R10 |
(4042) 0x4d3ff6 ADD %R13,%R10 |
(4042) 0x4d3ff9 MOV %R10,%R12 |
(4042) 0x4d3ffc NOPL (%RAX) |
(4043) 0x4d4000 MOV 0x80(%RBP),%RAX |
(4043) 0x4d4007 CMP %R9,(%RAX,%R12,8) |
(4043) 0x4d400b JE 4d40d0 |
(4043) 0x4d4011 INC %R12 |
(4043) 0x4d4014 CMP %R12,%RCX |
(4043) 0x4d4017 JNE 4d4000 |
(4042) 0x4d4019 NOPL (%RAX) |
(4042) 0x4d4020 MOV -0x80(%RBP),%RDX |
(4042) 0x4d4024 CMP -0x98(%RBP),%RDX |
(4042) 0x4d402b JGE 4d448f |
(4042) 0x4d4031 MOV 0x80(%RBP),%RAX |
(4042) 0x4d4038 MOV %R9,(%RAX,%RDX,8) |
(4042) 0x4d403c MOV 0x10(%RBP),%RAX |
(4042) 0x4d4040 VMOVQ (%RAX,%RDI,8),%XMM0 |
(4042) 0x4d4045 MOV 0x88(%RBP),%RAX |
(4042) 0x4d404c VMOVQ %XMM0,(%RAX,%RDX,8) |
(4042) 0x4d4051 INC %RDX |
(4042) 0x4d4054 MOV %RDX,-0x80(%RBP) |
(4042) 0x4d4058 JMP 4d3db0 |
(4042) 0x4d405d KSHIFTLB $0x4,%K0,%K0 |
(4042) 0x4d4063 KORB %K0,%K1,%K0 |
(4042) 0x4d4067 KSHIFTLB $0x4,%K2,%K1 |
(4042) 0x4d406d KORB %K1,%K3,%K1 |
(4042) 0x4d4071 KUNPCKBW %K0,%K1,%K0 |
(4042) 0x4d4075 KMOVD %K0,%EAX |
(4042) 0x4d4079 TZCNT %EAX,%EAX |
(4042) 0x4d407d ADD %RDX,%R12 |
(4042) 0x4d4080 ADD %RAX,%R12 |
(4042) 0x4d4083 MOV -0x30(%RBP),%RDI |
(4042) 0x4d4087 MOV -0x38(%RBP),%R13 |
(4042) 0x4d408b MOV %RCX,%R11 |
(4042) 0x4d408e MOV 0x10(%RBP),%RAX |
(4042) 0x4d4092 VMOVQ (%RAX,%RDI,8),%XMM0 |
(4042) 0x4d4097 MOV 0x70(%RBP),%RAX |
(4042) 0x4d409b VMOVQ %XMM0,(%RAX,%R12,8) |
(4042) 0x4d40a1 JMP 4d3db7 |
(4042) 0x4d40a6 KSHIFTLB $0x4,%K0,%K0 |
(4042) 0x4d40ac KORB %K0,%K1,%K0 |
(4042) 0x4d40b0 KSHIFTLB $0x4,%K2,%K1 |
(4042) 0x4d40b6 KORB %K1,%K3,%K1 |
(4042) 0x4d40ba KUNPCKBW %K0,%K1,%K0 |
(4042) 0x4d40be KMOVD %K0,%EAX |
(4042) 0x4d40c2 TZCNT %EAX,%EAX |
(4042) 0x4d40c6 ADD %RDX,%R12 |
(4042) 0x4d40c9 ADD %RAX,%R12 |
(4042) 0x4d40cc MOV -0x30(%RBP),%RDI |
(4042) 0x4d40d0 MOV -0x38(%RBP),%R13 |
(4042) 0x4d40d4 MOV %RCX,%R11 |
(4042) 0x4d40d7 MOV 0x10(%RBP),%RAX |
(4042) 0x4d40db VMOVQ (%RAX,%RDI,8),%XMM0 |
(4042) 0x4d40e0 MOV 0x88(%RBP),%RAX |
(4042) 0x4d40e7 VMOVQ %XMM0,(%RAX,%R12,8) |
(4042) 0x4d40ed JMP 4d3db7 |
0x4d40f2 XOR %EAX,%EAX |
0x4d40f4 MOV %RAX,-0x78(%RBP) |
0x4d40f8 MOV -0x30(%RBP),%RDI |
0x4d40fc TEST %R14,%R14 |
0x4d40ff JLE 4d3b70 |
0x4d4105 LEA -0x1(%R14),%RAX |
0x4d4109 MOV %R12D,%EDX |
0x4d410c AND $0x7f,%EDX |
0x4d410f MOV $0x80,%ECX |
0x4d4114 SUB %EDX,%ECX |
0x4d4116 SHR $0x3,%ECX |
0x4d4119 CMP %RCX,%R13 |
0x4d411c MOV %RCX,%RDX |
0x4d411f CMOVB %R13,%RDX |
0x4d4123 MOV %R13,%RSI |
0x4d4126 SUB %RDX,%RSI |
0x4d4129 MOV %RSI,-0xa0(%RBP) |
0x4d4130 AND $-0x10,%RSI |
0x4d4134 LEA -0x1(%RSI),%R8 |
0x4d4138 LEA (%R12,%RDX,8),%R9 |
0x4d413c MOV %RSI,-0x98(%RBP) |
0x4d4143 ADD %RDX,%RSI |
0x4d4146 MOV %RSI,-0xa8(%RBP) |
0x4d414d XOR %ESI,%ESI |
0x4d414f MOV %RSI,-0x90(%RBP) |
0x4d4156 MOV %R13,-0x58(%RBP) |
0x4d415a XOR %R11D,%R11D |
0x4d415d JMP 4d419a |
(4052) 0x4d4160 MOV -0x78(%RBP),%RDI |
(4052) 0x4d4164 MOV -0x90(%RBP),%R10 |
(4052) 0x4d416b MOV %RSI,(%RDI,%R10,8) |
(4052) 0x4d416f MOV -0x88(%RBP),%RSI |
(4052) 0x4d4176 VMOVQ %XMM0,(%RSI,%R10,8) |
(4052) 0x4d417c INC %R10 |
(4052) 0x4d417f MOV %R10,-0x90(%RBP) |
(4052) 0x4d4186 MOV -0x30(%RBP),%RDI |
(4052) 0x4d418a LEA 0x1(%R11),%RSI |
(4052) 0x4d418e CMP %RAX,%R11 |
(4052) 0x4d4191 MOV %RSI,%R11 |
(4052) 0x4d4194 JE 4d42c3 |
(4052) 0x4d419a LEA (%RDI,%R11,1),%R10 |
(4052) 0x4d419e TEST %R13,%R13 |
(4052) 0x4d41a1 JLE 4d4250 |
(4052) 0x4d41a7 MOV (%RBX,%R10,8),%RDI |
(4052) 0x4d41ab TEST %RDX,%RDX |
(4052) 0x4d41ae JE 4d41d2 |
(4052) 0x4d41b0 XOR %ESI,%ESI |
(4052) 0x4d41b2 NOPW %CS:(%RAX,%RAX,1) |
(4055) 0x4d41c0 CMP %RDI,(%R12,%RSI,8) |
(4055) 0x4d41c4 JE 4d42ab |
(4055) 0x4d41ca INC %RSI |
(4055) 0x4d41cd CMP %RSI,%RDX |
(4055) 0x4d41d0 JNE 4d41c0 |
(4052) 0x4d41d2 CMP %RCX,%R13 |
(4052) 0x4d41d5 JBE 4d4250 |
(4052) 0x4d41d7 CMPQ $0,-0x98(%RBP) |
(4052) 0x4d41df JE 4d4226 |
(4052) 0x4d41e1 VPBROADCASTQ %RDI,%YMM0 |
(4052) 0x4d41e7 XOR %ESI,%ESI |
(4052) 0x4d41e9 NOPL (%RAX) |
(4054) 0x4d41f0 VPCMPEQQ 0x20(%R9,%RSI,8),%YMM0,%K0 |
(4054) 0x4d41f8 VPCMPEQQ (%R9,%RSI,8),%YMM0,%K1 |
(4054) 0x4d41ff VPCMPEQQ 0x60(%R9,%RSI,8),%YMM0,%K2 |
(4054) 0x4d4207 VPCMPEQQ 0x40(%R9,%RSI,8),%YMM0,%K3 |
(4054) 0x4d420f KORB %K0,%K1,%K4 |
(4054) 0x4d4213 KORB %K2,%K3,%K5 |
(4054) 0x4d4217 KORTESTB %K5,%K4 |
(4054) 0x4d421b JNE 4d4285 |
(4054) 0x4d421d ADD $0x10,%RSI |
(4054) 0x4d4221 CMP %R8,%RSI |
(4054) 0x4d4224 JBE 4d41f0 |
(4052) 0x4d4226 MOV -0x98(%RBP),%RSI |
(4052) 0x4d422d CMP -0xa0(%RBP),%RSI |
(4052) 0x4d4234 JAE 4d4250 |
(4052) 0x4d4236 MOV -0xa8(%RBP),%RSI |
(4052) 0x4d423d NOPL (%RAX) |
(4053) 0x4d4240 CMP %RDI,(%R12,%RSI,8) |
(4053) 0x4d4244 JE 4d42ab |
(4053) 0x4d4246 INC %RSI |
(4053) 0x4d4249 CMP %RSI,%R13 |
(4053) 0x4d424c JNE 4d4240 |
(4052) 0x4d424e XCHG %AX,%AX |
(4052) 0x4d4250 MOV (%RBX,%R10,8),%RSI |
(4052) 0x4d4254 MOV 0x10(%RBP),%RDI |
(4052) 0x4d4258 VMOVQ (%RDI,%R10,8),%XMM0 |
(4052) 0x4d425e MOV -0x58(%RBP),%RDI |
(4052) 0x4d4262 CMP -0x80(%RBP),%RDI |
(4052) 0x4d4266 JGE 4d4160 |
(4052) 0x4d426c MOV %RSI,(%R12,%RDI,8) |
(4052) 0x4d4270 MOV -0x70(%RBP),%RSI |
(4052) 0x4d4274 VMOVQ %XMM0,(%RSI,%RDI,8) |
(4052) 0x4d4279 INC %RDI |
(4052) 0x4d427c MOV %RDI,-0x58(%RBP) |
(4052) 0x4d4280 JMP 4d4186 |
(4052) 0x4d4285 KSHIFTLB $0x4,%K0,%K0 |
(4052) 0x4d428b KORB %K0,%K1,%K0 |
(4052) 0x4d428f KSHIFTLB $0x4,%K2,%K1 |
(4052) 0x4d4295 KORB %K1,%K3,%K1 |
(4052) 0x4d4299 KUNPCKBW %K0,%K1,%K0 |
(4052) 0x4d429d KMOVD %K0,%EDI |
(4052) 0x4d42a1 TZCNT %EDI,%EDI |
(4052) 0x4d42a5 ADD %RDX,%RSI |
(4052) 0x4d42a8 ADD %RDI,%RSI |
(4052) 0x4d42ab MOV 0x10(%RBP),%RDI |
(4052) 0x4d42af VMOVQ (%RDI,%R10,8),%XMM0 |
(4052) 0x4d42b5 MOV -0x70(%RBP),%RDI |
(4052) 0x4d42b9 VMOVQ %XMM0,(%RDI,%RSI,8) |
(4052) 0x4d42be JMP 4d4186 |
0x4d42c3 ADD %R14,%RDI |
0x4d42c6 MOV -0x90(%RBP),%RCX |
0x4d42cd MOV -0x58(%RBP),%RAX |
0x4d42d1 LEA (%RAX,%RCX,1),%R12 |
0x4d42d5 MOV 0x48(%RBP),%RAX |
0x4d42d9 MOV -0x38(%RBP),%R13 |
0x4d42dd MOV %R12,(%RAX,%R13,8) |
0x4d42e1 TEST %RCX,%RCX |
0x4d42e4 MOV %RDI,-0x30(%RBP) |
0x4d42e8 JE 4d43f6 |
0x4d42ee MOV 0x38(%RBP),%RAX |
0x4d42f2 MOV (%RAX,%R13,8),%RDI |
0x4d42f6 LEA (,%R12,8),%R14 |
0x4d42fe MOV %R14,%RSI |
0x4d4301 VZEROUPPER |
0x4d4304 CALL 4e6de0 <hypre_ReAlloc> |
0x4d4309 MOV 0x38(%RBP),%RCX |
0x4d430d MOV %RAX,(%RCX,%R13,8) |
0x4d4311 MOV 0x40(%RBP),%R13 |
0x4d4315 MOV -0x38(%RBP),%RAX |
0x4d4319 MOV (%R13,%RAX,8),%RDI |
0x4d431e MOV %R14,%RSI |
0x4d4321 CALL 4e6de0 <hypre_ReAlloc> |
0x4d4326 MOV -0x90(%RBP),%RDX |
0x4d432d MOV -0x38(%RBP),%RCX |
0x4d4331 MOV %RAX,(%R13,%RCX,8) |
0x4d4336 MOV -0x38(%RBP),%RSI |
0x4d433a MOV 0x50(%RBP),%RCX |
0x4d433e MOV %R12,(%RCX,%RSI,8) |
0x4d4342 TEST %RDX,%RDX |
0x4d4345 JLE 4d43f6 |
0x4d434b MOV 0x38(%RBP),%RCX |
0x4d434f MOV (%RCX,%RSI,8),%RCX |
0x4d4353 MOV -0x78(%RBP),%R13 |
0x4d4357 LEA -0x8(%R13,%RDX,8),%RSI |
0x4d435c MOV -0x58(%RBP),%R10 |
0x4d4360 LEA (%RCX,%R10,8),%RDI |
0x4d4364 CMP %RDI,%RSI |
0x4d4367 SETAE %R9B |
0x4d436b LEA -0x1(%RDX,%R10,1),%RSI |
0x4d4370 LEA (%RCX,%RSI,8),%RCX |
0x4d4374 CMP %R13,%RCX |
0x4d4377 SETAE %R8B |
0x4d437b MOV -0x88(%RBP),%R12 |
0x4d4382 LEA -0x8(%R12,%RDX,8),%RCX |
0x4d4387 LEA (%RAX,%R10,8),%R14 |
0x4d438b CMP %R14,%RCX |
0x4d438e SETB %CL |
0x4d4391 LEA (%RAX,%RSI,8),%RAX |
0x4d4395 CMP %R12,%RAX |
0x4d4398 SETB %AL |
0x4d439b TEST %R8B,%R9B |
0x4d439e JNE 4d4420 |
0x4d43a4 OR %AL,%CL |
0x4d43a6 JE 4d4420 |
0x4d43a8 CMP $0xd,%RDX |
0x4d43ac JAE 4d3a61 |
0x4d43b2 MOV %RDX,%RAX |
0x4d43b5 AND $-0x4,%RAX |
0x4d43b9 JE 4d4506 |
0x4d43bf LEA -0x1(%RAX),%RCX |
0x4d43c3 XOR %ESI,%ESI |
0x4d43c5 NOPW %CS:(%RAX,%RAX,1) |
(4051) 0x4d43d0 VMOVUPS (%R13,%RSI,8),%YMM0 |
(4051) 0x4d43d7 VMOVUPS %YMM0,(%RDI,%RSI,8) |
(4051) 0x4d43dc VMOVDQU (%R12,%RSI,8),%YMM0 |
(4051) 0x4d43e2 VMOVDQU %YMM0,(%R14,%RSI,8) |
(4051) 0x4d43e8 ADD $0x4,%RSI |
(4051) 0x4d43ec CMP %RCX,%RSI |
(4051) 0x4d43ef JLE 4d43d0 |
0x4d43f1 JMP 4d4510 |
0x4d43f6 MOV -0x78(%RBP),%R13 |
0x4d43fa TEST %R13,%R13 |
0x4d43fd JNE 4d3a89 |
0x4d4403 JMP 4d3aa9 |
0x4d4408 MOV %R11,%RDI |
0x4d440b JMP 4d44ed |
0x4d4410 MOV -0xa0(%RBP),%RAX |
0x4d4417 MOV %RAX,-0x30(%RBP) |
0x4d441b JMP 4d44d5 |
0x4d4420 XOR %EAX,%EAX |
0x4d4422 NOPW %CS:(%RAX,%RAX,1) |
(4049) 0x4d4430 MOV (%R13,%RAX,8),%RCX |
(4049) 0x4d4435 MOV %RCX,(%RDI,%RAX,8) |
(4049) 0x4d4439 VMOVQ (%R12,%RAX,8),%XMM0 |
(4049) 0x4d443f VMOVQ %XMM0,(%R14,%RAX,8) |
(4049) 0x4d4445 INC %RAX |
(4049) 0x4d4448 CMP %RAX,%RDX |
(4049) 0x4d444b JNE 4d4430 |
0x4d444d JMP 4d3a89 |
0x4d4452 MOV %RDI,-0x30(%RBP) |
0x4d4456 MOV $0x511023,%EDI |
0x4d445b MOV $0xd70,%ESI |
0x4d4460 MOV $0x1,%EDX |
0x4d4465 XOR %ECX,%ECX |
0x4d4467 VZEROUPPER |
0x4d446a CALL 4e9720 <hypre_error_handler> |
0x4d446f MOV 0xd0(%RBP),%RAX |
0x4d4476 LOCK INCQ (%RAX) |
0x4d447a MOV $0x5111a5,%EDI |
0x4d447f CMPQ $0,0xc0(%RBP) |
0x4d4487 MOV -0x38(%RBP),%R13 |
0x4d448b JNE 4d44ca |
0x4d448d JMP 4d44d5 |
0x4d448f MOV %RDI,-0x30(%RBP) |
0x4d4493 MOV $0x511023,%EDI |
0x4d4498 MOV $0xd4e,%ESI |
0x4d449d MOV $0x1,%EDX |
0x4d44a2 XOR %ECX,%ECX |
0x4d44a4 VZEROUPPER |
0x4d44a7 CALL 4e9720 <hypre_error_handler> |
0x4d44ac MOV 0xd0(%RBP),%RAX |
0x4d44b3 LOCK INCQ (%RAX) |
0x4d44b7 MOV $0x51117f,%EDI |
0x4d44bc CMPQ $0,0xc0(%RBP) |
0x4d44c4 MOV -0x38(%RBP),%R13 |
0x4d44c8 JE 4d44d5 |
0x4d44ca MOV -0x58(%RBP),%RSI |
0x4d44ce XOR %EAX,%EAX |
0x4d44d0 CALL 4e6f30 <hypre_printf> |
0x4d44d5 MOV -0x60(%RBP),%RDX |
0x4d44d9 MOV -0x48(%RBP),%RSI |
0x4d44dd MOV -0x68(%RBP),%R9 |
0x4d44e1 MOV -0x50(%RBP),%R8 |
0x4d44e5 MOV -0x80(%RBP),%RDI |
0x4d44e9 MOV -0x70(%RBP),%R10 |
0x4d44ed MOV 0x18(%RBP),%RCX |
0x4d44f1 MOV 0x38(%RCX),%RAX |
0x4d44f5 MOV %R10,(%RAX,%R13,8) |
0x4d44f9 MOV 0x40(%RCX),%RAX |
0x4d44fd MOV %RDI,(%RAX,%R13,8) |
0x4d4501 JMP 4d3ab9 |
0x4d4506 XOR %EAX,%EAX |
0x4d4508 JMP 4d4519 |
(4050) 0x4d4510 CMP %RAX,%RDX |
(4050) 0x4d4513 JE 4d3a89 |
(4050) 0x4d4519 MOV (%R13,%RAX,8),%RCX |
(4050) 0x4d451e MOV %RCX,(%RDI,%RAX,8) |
(4050) 0x4d4522 VMOVQ (%R12,%RAX,8),%XMM0 |
(4050) 0x4d4528 VMOVQ %XMM0,(%R14,%RAX,8) |
(4050) 0x4d452e INC %RAX |
(4050) 0x4d4531 JMP 4d4510 |
/scratch_na/users/xoserete/qaas_runs/171-172-8218/intel/AMG/build/AMG/AMG/IJ_mv/IJMatrix_parcsr.c: 3262 - 3484 |
-------------------------------------------------------------------------------- |
3262: if (my_thread_num < rest) |
[...] |
3291: for (ii=ns; ii < ne; ii++) |
3292: { |
3293: row = rows[ii]; |
3294: n = ncols[ii]; |
3295: /* processor owns the row */ |
3296: if (row >= row_partitioning[pstart] && row < row_partitioning[pstart+1]) |
3297: { |
3298: row_local = row - row_partitioning[pstart]; |
3299: /* compute local row number */ |
3300: if (need_aux) |
3301: { |
3302: local_j = aux_j[row_local]; |
3303: local_data = aux_data[row_local]; |
3304: space = row_space[row_local]; |
3305: old_size = row_length[row_local]; |
3306: size = space - old_size; |
3307: if (size < n) |
3308: { |
3309: size = n - size; |
3310: tmp_j = hypre_CTAlloc(HYPRE_Int,size); |
3311: tmp_data = hypre_CTAlloc(HYPRE_Complex,size); |
3312: } |
3313: tmp_indx = 0; |
3314: not_found = 1; |
3315: size = old_size; |
3316: for (i=0; i < n; i++) |
3317: { |
3318: for (j=0; j < old_size; j++) |
3319: { |
3320: if (local_j[j] == cols[indx]) |
3321: { |
3322: local_data[j] = values[indx]; |
[...] |
3329: if (size < space) |
3330: { |
3331: local_j[size] = cols[indx]; |
3332: local_data[size++] = values[indx]; |
3333: } |
3334: else |
3335: { |
3336: tmp_j[tmp_indx] = cols[indx]; |
3337: tmp_data[tmp_indx++] = values[indx]; |
[...] |
3344: row_length[row_local] = size+tmp_indx; |
3345: |
3346: if (tmp_indx) |
3347: { |
3348: aux_j[row_local] = hypre_TReAlloc(aux_j[row_local],HYPRE_Int, |
3349: size+tmp_indx); |
3350: aux_data[row_local] = hypre_TReAlloc(aux_data[row_local], |
3351: HYPRE_Complex,size+tmp_indx); |
3352: row_space[row_local] = size+tmp_indx; |
3353: local_j = aux_j[row_local]; |
[...] |
3359: for (i=0; i < tmp_indx; i++) |
3360: { |
3361: local_j[cnt] = tmp_j[i]; |
3362: local_data[cnt++] = tmp_data[i]; |
3363: } |
3364: |
3365: if (tmp_j) |
3366: { |
3367: hypre_TFree(tmp_j); |
3368: hypre_TFree(tmp_data); |
[...] |
3376: offd_indx = hypre_AuxParCSRMatrixIndxOffd(aux_matrix)[row_local]; |
3377: diag_indx = hypre_AuxParCSRMatrixIndxDiag(aux_matrix)[row_local]; |
3378: cnt_diag = diag_indx; |
3379: cnt_offd = offd_indx; |
3380: diag_space = diag_i[row_local+1]; |
3381: offd_space = offd_i[row_local+1]; |
3382: not_found = 1; |
3383: for (i=0; i < n; i++) |
3384: { |
3385: if (cols[indx] < col_0 || cols[indx] > col_n) |
3386: /* insert into offd */ |
3387: { |
3388: for (j=offd_i[row_local]; j < offd_indx; j++) |
3389: { |
3390: if (offd_j[j] == cols[indx]) |
3391: { |
3392: offd_data[j] = values[indx]; |
[...] |
3399: if (cnt_offd < offd_space) |
3400: { |
3401: offd_j[cnt_offd] = cols[indx]; |
3402: offd_data[cnt_offd++] = values[indx]; |
3403: } |
3404: else |
3405: { |
3406: hypre_error(HYPRE_ERROR_GENERIC); |
3407: #ifdef HYPRE_USING_OPENMP |
3408: #pragma omp atomic |
3409: #endif |
3410: error_flag++; |
[...] |
3422: for (j=diag_i[row_local]; j < diag_indx; j++) |
3423: { |
3424: if (diag_j[j] == cols[indx]) |
3425: { |
3426: diag_data[j] = values[indx]; |
[...] |
3433: if (cnt_diag < diag_space) |
3434: { |
3435: diag_j[cnt_diag] = cols[indx]; |
3436: diag_data[cnt_diag++] = values[indx]; |
3437: } |
3438: else |
3439: { |
3440: hypre_error(HYPRE_ERROR_GENERIC); |
3441: #ifdef HYPRE_USING_OPENMP |
3442: #pragma omp atomic |
3443: #endif |
3444: error_flag++; |
3445: if (print_level) |
[...] |
3454: indx++; |
3455: } |
3456: |
3457: hypre_AuxParCSRMatrixIndxDiag(aux_matrix)[row_local] = cnt_diag; |
3458: hypre_AuxParCSRMatrixIndxOffd(aux_matrix)[row_local] = cnt_offd; |
[...] |
3466: indx += n; |
3467: if (aux_matrix) |
3468: { |
3469: col_indx = 0; |
3470: for (i=0; i < off_proc_i_indx; i=i+2) |
3471: { |
3472: row_len = off_proc_i[i+1]; |
3473: if (off_proc_i[i] == row) |
3474: { |
3475: for (j=0; j < n; j++) |
3476: { |
3477: cnt1 = col_indx; |
3478: for (k=0; k < row_len; k++) |
3479: { |
3480: if (off_proc_j[cnt1] == cols[j]) |
3481: { |
3482: off_proc_j[cnt1++] = -1; |
3483: /*cancel_indx++;*/ |
3484: offproc_cnt[my_thread_num]++; |
Path / |
Metric | Value |
---|---|
CQA speedup if no scalar integer | 1.00 |
CQA speedup if FP arith vectorized | 1.00 |
CQA speedup if fully vectorized | 18.22 |
CQA speedup if no inter-iteration dependency | NA |
CQA speedup if next bottleneck killed | 1.75 |
Bottlenecks | micro-operation queue, |
Function | hypre_IJMatrixSetValuesOMPParCSR.extracted.28 |
Source | IJMatrix_parcsr.c:3262-3262,IJMatrix_parcsr.c:3291-3296,IJMatrix_parcsr.c:3300-3307,IJMatrix_parcsr.c:3310-3311,IJMatrix_parcsr.c:3316-3318,IJMatrix_parcsr.c:3344-3353,IJMatrix_parcsr.c:3359-3362,IJMatrix_parcsr.c:3365-3368,IJMatrix_parcsr.c:3376-3377,IJMatrix_parcsr.c:3380-3383,IJMatrix_parcsr.c:3392-3392,IJMatrix_parcsr.c:3406-3406,IJMatrix_parcsr.c:3410-3410,IJMatrix_parcsr.c:3440-3440,IJMatrix_parcsr.c:3444-3445,IJMatrix_parcsr.c:3457-3458,IJMatrix_parcsr.c:3466-3467,IJMatrix_parcsr.c:3473-3475,IJMatrix_parcsr.c:3484-3484 |
Source loop unroll info | NA |
Source loop unroll confidence level | NA |
Unroll/vectorization loop type | NA |
Unroll factor | NA |
CQA cycles | 44.83 |
CQA cycles if no scalar integer | 44.83 |
CQA cycles if FP arith vectorized | 44.83 |
CQA cycles if fully vectorized | 2.46 |
Front-end cycles | 44.83 |
DIV/SQRT cycles | 0.00 |
P0 cycles | 14.80 |
P1 cycles | 14.80 |
P2 cycles | 25.67 |
P3 cycles | 25.67 |
P4 cycles | 24.50 |
P5 cycles | 14.80 |
P6 cycles | 14.80 |
P7 cycles | 24.50 |
P8 cycles | 24.50 |
P9 cycles | 24.50 |
P10 cycles | 14.80 |
P11 cycles | 25.67 |
Inter-iter dependencies cycles | NA |
FE+BE cycles (UFS) | 42.51 |
Stall cycles (UFS) | 0.00 |
Nb insns | 248.00 |
Nb uops | 269.00 |
Nb loads | 77.00 |
Nb stores | 38.00 |
Nb stack references | 27.00 |
FLOP/cycle | 0.00 |
Nb FLOP add-sub | 0.00 |
Nb FLOP mul | 0.00 |
Nb FLOP fma | 0.00 |
Nb FLOP div | 0.00 |
Nb FLOP rcp | 0.00 |
Nb FLOP sqrt | 0.00 |
Nb FLOP rsqrt | 0.00 |
Bytes/cycle | 20.36 |
Bytes prefetched | 0.00 |
Bytes loaded | 609.00 |
Bytes stored | 304.00 |
Stride 0 | NA |
Stride 1 | NA |
Stride n | NA |
Stride unknown | NA |
Stride indirect | NA |
Vectorization ratio all | 7.58 |
Vectorization ratio load | 0.00 |
Vectorization ratio store | 0.00 |
Vectorization ratio mul | NA |
Vectorization ratio add_sub | NA |
Vectorization ratio fma | NA |
Vectorization ratio div_sqrt | NA |
Vectorization ratio other | 20.00 |
Vector-efficiency ratio all | 13.09 |
Vector-efficiency ratio load | 11.41 |
Vector-efficiency ratio store | 12.50 |
Vector-efficiency ratio mul | NA |
Vector-efficiency ratio add_sub | NA |
Vector-efficiency ratio fma | NA |
Vector-efficiency ratio div_sqrt | NA |
Vector-efficiency ratio other | 14.06 |
Metric | Value |
---|---|
CQA speedup if no scalar integer | 1.00 |
CQA speedup if FP arith vectorized | 1.00 |
CQA speedup if fully vectorized | 18.22 |
CQA speedup if no inter-iteration dependency | NA |
CQA speedup if next bottleneck killed | 1.75 |
Bottlenecks | micro-operation queue, |
Function | hypre_IJMatrixSetValuesOMPParCSR.extracted.28 |
Source | IJMatrix_parcsr.c:3262-3262,IJMatrix_parcsr.c:3291-3296,IJMatrix_parcsr.c:3300-3307,IJMatrix_parcsr.c:3310-3311,IJMatrix_parcsr.c:3316-3318,IJMatrix_parcsr.c:3344-3353,IJMatrix_parcsr.c:3359-3362,IJMatrix_parcsr.c:3365-3368,IJMatrix_parcsr.c:3376-3377,IJMatrix_parcsr.c:3380-3383,IJMatrix_parcsr.c:3392-3392,IJMatrix_parcsr.c:3406-3406,IJMatrix_parcsr.c:3410-3410,IJMatrix_parcsr.c:3440-3440,IJMatrix_parcsr.c:3444-3445,IJMatrix_parcsr.c:3457-3458,IJMatrix_parcsr.c:3466-3467,IJMatrix_parcsr.c:3473-3475,IJMatrix_parcsr.c:3484-3484 |
Source loop unroll info | NA |
Source loop unroll confidence level | NA |
Unroll/vectorization loop type | NA |
Unroll factor | NA |
CQA cycles | 44.83 |
CQA cycles if no scalar integer | 44.83 |
CQA cycles if FP arith vectorized | 44.83 |
CQA cycles if fully vectorized | 2.46 |
Front-end cycles | 44.83 |
DIV/SQRT cycles | 0.00 |
P0 cycles | 14.80 |
P1 cycles | 14.80 |
P2 cycles | 25.67 |
P3 cycles | 25.67 |
P4 cycles | 24.50 |
P5 cycles | 14.80 |
P6 cycles | 14.80 |
P7 cycles | 24.50 |
P8 cycles | 24.50 |
P9 cycles | 24.50 |
P10 cycles | 14.80 |
P11 cycles | 25.67 |
Inter-iter dependencies cycles | NA |
FE+BE cycles (UFS) | 42.51 |
Stall cycles (UFS) | 0.00 |
Nb insns | 248.00 |
Nb uops | 269.00 |
Nb loads | 77.00 |
Nb stores | 38.00 |
Nb stack references | 27.00 |
FLOP/cycle | 0.00 |
Nb FLOP add-sub | 0.00 |
Nb FLOP mul | 0.00 |
Nb FLOP fma | 0.00 |
Nb FLOP div | 0.00 |
Nb FLOP rcp | 0.00 |
Nb FLOP sqrt | 0.00 |
Nb FLOP rsqrt | 0.00 |
Bytes/cycle | 20.36 |
Bytes prefetched | 0.00 |
Bytes loaded | 609.00 |
Bytes stored | 304.00 |
Stride 0 | NA |
Stride 1 | NA |
Stride n | NA |
Stride unknown | NA |
Stride indirect | NA |
Vectorization ratio all | 7.58 |
Vectorization ratio load | 0.00 |
Vectorization ratio store | 0.00 |
Vectorization ratio mul | NA |
Vectorization ratio add_sub | NA |
Vectorization ratio fma | NA |
Vectorization ratio div_sqrt | NA |
Vectorization ratio other | 20.00 |
Vector-efficiency ratio all | 13.09 |
Vector-efficiency ratio load | 11.41 |
Vector-efficiency ratio store | 12.50 |
Vector-efficiency ratio mul | NA |
Vector-efficiency ratio add_sub | NA |
Vector-efficiency ratio fma | NA |
Vector-efficiency ratio div_sqrt | NA |
Vector-efficiency ratio other | 14.06 |
Path / |
Function | hypre_IJMatrixSetValuesOMPParCSR.extracted.28 |
Source file and lines | IJMatrix_parcsr.c:3262-3484 |
Module | exec |
nb instructions | 248 |
nb uops | 269 |
loop length | 1054 |
used x86 registers | 13 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 27 |
micro-operation queue | 44.83 cycles |
front end | 44.83 cycles |
Metric | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 14.80 | 14.80 | 25.67 | 25.67 | 24.50 | 14.80 | 14.80 | 24.50 | 24.50 | 24.50 | 14.80 | 25.67 |
cycles | 14.80 | 14.80 | 25.67 | 25.67 | 24.50 | 14.80 | 14.80 | 24.50 | 24.50 | 24.50 | 14.80 | 25.67 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 42.51 |
Stall cycles | 0.00 |
Front-end | 44.83 |
Dispatch | 25.67 |
Overall L1 | 44.83 |
Vectorization ratio |
all | 7% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 20% |
Vector-efficiency ratio |
all | 13% |
load | 11% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R12,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4efd90 <_intel_fast_memcpy> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x88(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4efd90 <_intel_fast_memcpy> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4e6e50 <hypre_Free> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x88(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 4e6e50 <hypre_Free> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x60(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x48(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x68(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x50(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
INC %R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %R8,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4d4533 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xd53> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%RDX,%R9,8),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI,%R9,8),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB (%RAX),%R13 | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JL 4d3b90 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x3b0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x58(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP 0x8(%RAX),%RCX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JGE 4d3b90 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x3b0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMPQ $0,0x58(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV %R13,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 4d3d48 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x568> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX,%R13,8),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX,%R13,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX,%R13,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX,%R13,8),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R13,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RAX,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JLE 4d40f2 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x912> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDI,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4e6d80 <hypre_CAlloc> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x58(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 4e6d80 <hypre_CAlloc> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x30(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JG 4d4105 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x925> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,(%RAX,%RCX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4d43f6 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xc16> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
ADD %R14,-0x30(%RBP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
CMPB $0,-0x39(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JNE 4d3abd <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x2dd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4d3abd <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x2dd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R9,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
DEC %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4d3bd4 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x3f4> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV 0x18(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RCX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x40(%RCX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX,%R13,8),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX,%R13,8),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4d4408 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xc28> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R9,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x60(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX,%R13,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x78(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX,%R13,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x30(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RDI,%R14,1),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R11,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 4d3dc6 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x5e6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x30(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4d3b70 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x390> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%R14),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R12D,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $0x7f,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV $0x80,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SUB %EDX,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SHR $0x3,%ECX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
CMP %RCX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMOVB %R13,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R13,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RSI,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
AND $-0x10,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
LEA -0x1(%RSI),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R12,%RDX,8),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RSI,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %R11D,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4d419a <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x9ba> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD %R14,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x90(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RAX,%RCX,1),%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,(%RAX,%R13,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %RCX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV %RDI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 4d43f6 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xc16> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX,%R13,8),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (,%R12,8),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4e6de0 <hypre_ReAlloc> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x38(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX,%R13,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R13,%RAX,8),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4e6de0 <hypre_ReAlloc> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x90(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%R13,%RCX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x38(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x50(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,(%RCX,%RSI,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4d43f6 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xc16> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x38(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX,%RSI,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x78(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x8(%R13,%RDX,8),%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV -0x58(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RCX,%R10,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDI,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETAE %R9B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LEA -0x1(%RDX,%R10,1),%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%RCX,%RSI,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R13,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETAE %R8B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV -0x88(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x8(%R12,%RDX,8),%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%RAX,%R10,8),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R14,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %CL | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LEA (%RAX,%RSI,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %AL | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %R8B,%R9B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 4d4420 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xc40> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
OR %AL,%CL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4d4420 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xc40> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP $0xd,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 4d3a61 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x281> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RDX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4d4506 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xd26> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RAX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4d4510 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xd30> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x78(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R13,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 4d3a89 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x2a9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4d3aa9 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x2c9> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R11,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 4d44ed <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xd0d> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4d44d5 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xcf5> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4d3a89 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x2a9> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %RDI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x511023,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xd70,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4e9720 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0xd0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LOCK INCQ (%RAX) | 3 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
MOV $0x5111a5,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMPQ $0,0xc0(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 4d44ca <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xcea> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4d44d5 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xcf5> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %RDI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x511023,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xd4e,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4e9720 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0xd0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LOCK INCQ (%RAX) | 3 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
MOV $0x51117f,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMPQ $0,0xc0(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JE 4d44d5 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xcf5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x58(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4e6f30 <hypre_printf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x60(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x48(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x68(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x50(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x80(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x70(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RCX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R10,(%RAX,%R13,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RCX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDI,(%RAX,%R13,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4d3ab9 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x2d9> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4d4519 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xd39> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
Function | hypre_IJMatrixSetValuesOMPParCSR.extracted.28 |
Source file and lines | IJMatrix_parcsr.c:3262-3484 |
Module | exec |
nb instructions | 248 |
nb uops | 269 |
loop length | 1054 |
used x86 registers | 13 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 27 |
micro-operation queue | 44.83 cycles |
front end | 44.83 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 14.80 | 14.80 | 25.67 | 25.67 | 24.50 | 14.80 | 14.80 | 24.50 | 24.50 | 24.50 | 14.80 | 25.67 |
cycles | 14.80 | 14.80 | 25.67 | 25.67 | 24.50 | 14.80 | 14.80 | 24.50 | 24.50 | 24.50 | 14.80 | 25.67 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 42.51 |
Stall cycles | 0.00 |
Front-end | 44.83 |
Dispatch | 25.67 |
Overall L1 | 44.83 |
all | 7% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 20% |
all | 13% |
load | 11% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R12,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4efd90 <_intel_fast_memcpy> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x88(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4efd90 <_intel_fast_memcpy> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4e6e50 <hypre_Free> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x88(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 4e6e50 <hypre_Free> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x60(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x48(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x68(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x50(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
INC %R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %R8,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4d4533 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xd53> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%RDX,%R9,8),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI,%R9,8),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB (%RAX),%R13 | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JL 4d3b90 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x3b0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x58(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP 0x8(%RAX),%RCX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JGE 4d3b90 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x3b0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMPQ $0,0x58(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV %R13,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 4d3d48 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x568> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX,%R13,8),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX,%R13,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x50(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX,%R13,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX,%R13,8),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R13,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R14,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RAX,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JLE 4d40f2 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x912> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDI,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4e6d80 <hypre_CAlloc> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x58(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 4e6d80 <hypre_CAlloc> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x30(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JG 4d4105 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x925> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,(%RAX,%RCX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4d43f6 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xc16> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
ADD %R14,-0x30(%RBP) | 2 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
CMPB $0,-0x39(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JNE 4d3abd <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x2dd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4d3abd <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x2dd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R9,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
DEC %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4d3bd4 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x3f4> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV 0x18(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RCX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x40(%RCX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX,%R13,8),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX,%R13,8),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4d4408 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xc28> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R9,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x60(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX,%R13,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x78(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX,%R13,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x30(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RDI,%R14,1),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R11,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 4d3dc6 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x5e6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x30(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4d3b70 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x390> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%R14),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R12D,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $0x7f,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV $0x80,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SUB %EDX,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SHR $0x3,%ECX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
CMP %RCX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMOVB %R13,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R13,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RSI,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
AND $-0x10,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
LEA -0x1(%RSI),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R12,%RDX,8),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RSI,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %R11D,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4d419a <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x9ba> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD %R14,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x90(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RAX,%RCX,1),%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,(%RAX,%R13,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %RCX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV %RDI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 4d43f6 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xc16> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX,%R13,8),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (,%R12,8),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4e6de0 <hypre_ReAlloc> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x38(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%RCX,%R13,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R13,%RAX,8),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4e6de0 <hypre_ReAlloc> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x90(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,(%R13,%RCX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x38(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x50(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,(%RCX,%RSI,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4d43f6 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xc16> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x38(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX,%RSI,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x78(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x8(%R13,%RDX,8),%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV -0x58(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RCX,%R10,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDI,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETAE %R9B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LEA -0x1(%RDX,%R10,1),%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%RCX,%RSI,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R13,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETAE %R8B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV -0x88(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x8(%R12,%RDX,8),%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%RAX,%R10,8),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R14,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %CL | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LEA (%RAX,%RSI,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SETB %AL | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %R8B,%R9B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 4d4420 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xc40> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
OR %AL,%CL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4d4420 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xc40> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP $0xd,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 4d3a61 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x281> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RDX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4d4506 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xd26> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RAX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4d4510 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xd30> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x78(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R13,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 4d3a89 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x2a9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4d3aa9 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x2c9> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R11,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 4d44ed <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xd0d> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0xa0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4d44d5 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xcf5> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4d3a89 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x2a9> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %RDI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x511023,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xd70,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4e9720 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0xd0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LOCK INCQ (%RAX) | 3 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
MOV $0x5111a5,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMPQ $0,0xc0(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 4d44ca <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xcea> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4d44d5 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xcf5> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %RDI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x511023,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xd4e,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4e9720 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0xd0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LOCK INCQ (%RAX) | 3 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
MOV $0x51117f,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMPQ $0,0xc0(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JE 4d44d5 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xcf5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x58(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4e6f30 <hypre_printf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x60(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x48(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x68(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x50(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x80(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x70(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RCX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R10,(%RAX,%R13,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RCX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDI,(%RAX,%R13,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4d3ab9 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x2d9> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4d4519 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xd39> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |