Loop Id: 1254 | Module: exec | Source: par_lr_interp.c:1221-1675 [...] | Coverage: 0.08% |
---|
Loop Id: 1254 | Module: exec | Source: par_lr_interp.c:1221-1675 [...] | Coverage: 0.08% |
---|
0x4529c0 MOV -0xa0(%RBP),%RCX |
0x4529c7 MOV (%RCX),%RCX |
0x4529ca VMOVSD (%RCX,%RAX,8),%XMM5 |
0x4529cf MOV -0x58(%RBP),%RDX |
0x4529d3 VADDSD (%RDX,%R9,8),%XMM5,%XMM5 |
0x4529d9 VMOVSD %XMM5,(%RCX,%RAX,8) |
0x4529de INC %R9 |
0x4529e1 CMP -0x80(%RBP),%R9 |
0x4529e5 JE 4531e8 |
0x4529eb MOV (%RBX,%R9,8),%R10 |
0x4529ef MOV (%R13,%R10,8),%RAX |
0x4529f4 CMP %RDI,%RAX |
0x4529f7 JGE 4529c0 |
0x4529f9 CMP %R8,%RAX |
0x4529fc JNE 452af0 |
0x452a02 MOV -0x180(%RBP),%RCX |
0x452a09 MOV (%RCX,%R10,8),%R11 |
0x452a0d VPXOR %XMM5,%XMM5,%XMM5 |
0x452a11 XOR %EAX,%EAX |
0x452a13 MOV -0x58(%RBP),%RDX |
0x452a17 VUCOMISD (%RDX,%R11,8),%XMM5 |
0x452a1d MOV %R10,-0xf0(%RBP) |
0x452a24 MOV 0x8(%RCX,%R10,8),%RCX |
0x452a29 SETBE %AL |
0x452a2c LEA -0x1(%RAX,%RAX,1),%RAX |
0x452a31 MOV %RAX,-0xb8(%RBP) |
0x452a38 LEA 0x1(%R11),%R10 |
0x452a3c CMP %RCX,%R10 |
0x452a3f MOV %R11,-0x78(%RBP) |
0x452a43 JGE 452b30 |
0x452a49 VCVTSI2SDQ -0xb8(%RBP),%XMM10,%XMM6 |
0x452a52 NOT %R11 |
0x452a55 ADD %RCX,%R11 |
0x452a58 MOV %R11,-0xb0(%RBP) |
0x452a5f CMP $0x4,%R11 |
0x452a63 JAE 452bf1 |
0x452a69 MOV -0xb0(%RBP),%RDX |
0x452a70 MOV %RDX,%RAX |
0x452a73 AND $-0x4,%RAX |
0x452a77 CMP %RDX,%RAX |
0x452a7a JAE 452b30 |
0x452a80 MOV -0x78(%RBP),%RDX |
0x452a84 LEA 0x1(%RDX,%RAX,1),%RAX |
0x452a89 JMP 452a9c |
(1260) 0x452a90 INC %RAX |
(1260) 0x452a93 CMP %RAX,%RCX |
(1260) 0x452a96 JE 452b30 |
(1260) 0x452a9c MOV (%RBX,%RAX,8),%RDX |
(1260) 0x452aa0 XOR %R11D,%R11D |
(1260) 0x452aa3 CMP %RDI,(%R13,%RDX,8) |
(1260) 0x452aa8 SETGE %R11B |
(1260) 0x452aac XOR %R15D,%R15D |
(1260) 0x452aaf CMP %R14,%RDX |
(1260) 0x452ab2 SETE %R15B |
(1260) 0x452ab6 CMP %R11B,%R15B |
(1260) 0x452ab9 CMOVA %R15D,%R11D |
(1260) 0x452abd CMP $0x1,%R11B |
(1260) 0x452ac1 JNE 452a90 |
(1260) 0x452ac3 MOV -0x58(%RBP),%RDX |
(1260) 0x452ac7 VMOVSD (%RDX,%RAX,8),%XMM7 |
(1260) 0x452acc VMULSD %XMM6,%XMM7,%XMM8 |
(1260) 0x452ad0 VADDSD %XMM5,%XMM7,%XMM7 |
(1260) 0x452ad4 VCMPSD $0x1,%XMM0,%XMM8,%K1 |
(1260) 0x452adb VMOVSD %XMM7,%XMM5,%XMM5{%K1} |
(1260) 0x452ae1 JMP 452a90 |
0x452af0 MOV -0xe8(%RBP),%RAX |
0x452af7 CMPQ $-0x3,(%RAX,%R10,8) |
0x452afc JE 4529de |
0x452b02 CMPQ $0x1,-0x178(%RBP) |
0x452b0a JE 452b21 |
0x452b0c MOV -0x170(%RBP),%RCX |
0x452b13 MOV (%RCX,%R14,8),%RAX |
0x452b17 CMP (%RCX,%R10,8),%RAX |
0x452b1b JNE 4529de |
0x452b21 MOV -0x58(%RBP),%RAX |
0x452b25 VADDSD (%RAX,%R9,8),%XMM4,%XMM4 |
0x452b2b JMP 4529de |
0x452b30 MOV -0xc8(%RBP),%RAX |
0x452b37 MOV (%RAX),%RAX |
0x452b3a MOV %RAX,-0xb0(%RBP) |
0x452b41 CMP $0x2,%RAX |
0x452b45 JL 452e50 |
0x452b4b MOV -0x168(%RBP),%RDX |
0x452b52 MOV -0xf0(%RBP),%R11 |
0x452b59 MOV (%RDX,%R11,8),%RAX |
0x452b5d MOV 0x8(%RDX,%R11,8),%R12 |
0x452b62 MOV %R12,%R15 |
0x452b65 SUB %RAX,%R15 |
0x452b68 JLE 452e50 |
0x452b6e VCVTSI2SDQ -0xb8(%RBP),%XMM10,%XMM6 |
0x452b77 CMP $0x4,%R15 |
0x452b7b MOV %R15,-0x138(%RBP) |
0x452b82 JAE 452d40 |
0x452b88 MOV -0x138(%RBP),%R11 |
0x452b8f MOV %R11,%RDX |
0x452b92 AND $-0x4,%RDX |
0x452b96 CMP %R11,%RDX |
0x452b99 JAE 452e3c |
0x452b9f ADD %RDX,%RAX |
0x452ba2 MOV -0xc0(%RBP),%R14 |
0x452ba9 JMP 452bbc |
(1258) 0x452bb0 INC %RAX |
(1258) 0x452bb3 CMP %RAX,%R12 |
(1258) 0x452bb6 JE 452e50 |
(1258) 0x452bbc MOV -0xa8(%RBP),%RDX |
(1258) 0x452bc3 MOV (%RDX,%RAX,8),%RDX |
(1258) 0x452bc7 MOV -0x48(%RBP),%R11 |
(1258) 0x452bcb CMP %RSI,(%R11,%RDX,8) |
(1258) 0x452bcf JL 452bb0 |
(1258) 0x452bd1 MOV -0x70(%RBP),%RDX |
(1258) 0x452bd5 VMOVSD (%RDX,%RAX,8),%XMM7 |
(1258) 0x452bda VMULSD %XMM6,%XMM7,%XMM8 |
(1258) 0x452bde VADDSD %XMM5,%XMM7,%XMM7 |
(1258) 0x452be2 VCMPSD $0x1,%XMM0,%XMM8,%K1 |
(1258) 0x452be9 VMOVSD %XMM7,%XMM5,%XMM5{%K1} |
(1258) 0x452bef JMP 452bb0 |
0x452bf1 MOV -0xb0(%RBP),%R12 |
0x452bf8 SHR $0x2,%R12 |
0x452bfc MOV -0x78(%RBP),%RAX |
0x452c00 LEA 0x20(,%RAX,8),%RAX |
0x452c08 VXORPD %XMM7,%XMM7,%XMM7 |
0x452c0c JMP 452c1d |
(1261) 0x452c10 ADD $0x20,%RAX |
(1261) 0x452c14 DEC %R12 |
(1261) 0x452c17 JE 452a69 |
(1261) 0x452c1d MOV -0x18(%RBX,%RAX,1),%RDX |
(1261) 0x452c22 XOR %R11D,%R11D |
(1261) 0x452c25 CMP %RDI,(%R13,%RDX,8) |
(1261) 0x452c2a SETGE %R11B |
(1261) 0x452c2e XOR %R15D,%R15D |
(1261) 0x452c31 CMP %R14,%RDX |
(1261) 0x452c34 SETE %R15B |
(1261) 0x452c38 CMP %R11B,%R15B |
(1261) 0x452c3b CMOVA %R15D,%R11D |
(1261) 0x452c3f CMP $0x1,%R11B |
(1261) 0x452c43 JNE 452c64 |
(1261) 0x452c45 MOV -0x58(%RBP),%RDX |
(1261) 0x452c49 VMOVSD -0x18(%RDX,%RAX,1),%XMM8 |
(1261) 0x452c4f VMULSD %XMM6,%XMM8,%XMM9 |
(1261) 0x452c53 VADDSD %XMM5,%XMM8,%XMM8 |
(1261) 0x452c57 VCMPSD $0x1,%XMM7,%XMM9,%K1 |
(1261) 0x452c5e VMOVSD %XMM8,%XMM5,%XMM5{%K1} |
(1261) 0x452c64 MOV -0x10(%RBX,%RAX,1),%RDX |
(1261) 0x452c69 XOR %R11D,%R11D |
(1261) 0x452c6c CMP %RDI,(%R13,%RDX,8) |
(1261) 0x452c71 SETGE %R11B |
(1261) 0x452c75 XOR %R15D,%R15D |
(1261) 0x452c78 CMP %R14,%RDX |
(1261) 0x452c7b SETE %R15B |
(1261) 0x452c7f CMP %R11B,%R15B |
(1261) 0x452c82 CMOVA %R15D,%R11D |
(1261) 0x452c86 CMP $0x1,%R11B |
(1261) 0x452c8a JNE 452cab |
(1261) 0x452c8c MOV -0x58(%RBP),%RDX |
(1261) 0x452c90 VMOVSD -0x10(%RDX,%RAX,1),%XMM8 |
(1261) 0x452c96 VMULSD %XMM6,%XMM8,%XMM9 |
(1261) 0x452c9a VADDSD %XMM5,%XMM8,%XMM8 |
(1261) 0x452c9e VCMPSD $0x1,%XMM7,%XMM9,%K1 |
(1261) 0x452ca5 VMOVSD %XMM8,%XMM5,%XMM5{%K1} |
(1261) 0x452cab MOV -0x8(%RBX,%RAX,1),%RDX |
(1261) 0x452cb0 XOR %R11D,%R11D |
(1261) 0x452cb3 CMP %RDI,(%R13,%RDX,8) |
(1261) 0x452cb8 SETGE %R11B |
(1261) 0x452cbc XOR %R15D,%R15D |
(1261) 0x452cbf CMP %R14,%RDX |
(1261) 0x452cc2 SETE %R15B |
(1261) 0x452cc6 CMP %R11B,%R15B |
(1261) 0x452cc9 CMOVA %R15D,%R11D |
(1261) 0x452ccd CMP $0x1,%R11B |
(1261) 0x452cd1 JNE 452cf2 |
(1261) 0x452cd3 MOV -0x58(%RBP),%RDX |
(1261) 0x452cd7 VMOVSD -0x8(%RDX,%RAX,1),%XMM8 |
(1261) 0x452cdd VMULSD %XMM6,%XMM8,%XMM9 |
(1261) 0x452ce1 VADDSD %XMM5,%XMM8,%XMM8 |
(1261) 0x452ce5 VCMPSD $0x1,%XMM7,%XMM9,%K1 |
(1261) 0x452cec VMOVSD %XMM8,%XMM5,%XMM5{%K1} |
(1261) 0x452cf2 MOV (%RBX,%RAX,1),%RDX |
(1261) 0x452cf6 XOR %R11D,%R11D |
(1261) 0x452cf9 CMP %RDI,(%R13,%RDX,8) |
(1261) 0x452cfe SETGE %R11B |
(1261) 0x452d02 XOR %R15D,%R15D |
(1261) 0x452d05 CMP %R14,%RDX |
(1261) 0x452d08 SETE %R15B |
(1261) 0x452d0c CMP %R11B,%R15B |
(1261) 0x452d0f CMOVA %R15D,%R11D |
(1261) 0x452d13 CMP $0x1,%R11B |
(1261) 0x452d17 JNE 452c10 |
(1261) 0x452d1d MOV -0x58(%RBP),%RDX |
(1261) 0x452d21 VMOVSD (%RDX,%RAX,1),%XMM8 |
(1261) 0x452d26 VMULSD %XMM6,%XMM8,%XMM9 |
(1261) 0x452d2a VADDSD %XMM5,%XMM8,%XMM8 |
(1261) 0x452d2e VCMPSD $0x1,%XMM7,%XMM9,%K1 |
(1261) 0x452d35 VMOVSD %XMM8,%XMM5,%XMM5{%K1} |
(1261) 0x452d3b JMP 452c10 |
0x452d40 SHR $0x2,%R15 |
0x452d44 LEA 0x18(,%RAX,8),%RDX |
0x452d4c JMP 452d5d |
(1259) 0x452d50 ADD $0x20,%RDX |
(1259) 0x452d54 DEC %R15 |
(1259) 0x452d57 JE 452b88 |
(1259) 0x452d5d MOV -0xa8(%RBP),%R11 |
(1259) 0x452d64 MOV -0x18(%R11,%RDX,1),%R11 |
(1259) 0x452d69 MOV -0x48(%RBP),%R14 |
(1259) 0x452d6d CMP %RSI,(%R14,%R11,8) |
(1259) 0x452d71 JL 452d93 |
(1259) 0x452d73 MOV -0x70(%RBP),%R11 |
(1259) 0x452d77 VMOVSD -0x18(%R11,%RDX,1),%XMM7 |
(1259) 0x452d7e VMULSD %XMM6,%XMM7,%XMM8 |
(1259) 0x452d82 VADDSD %XMM5,%XMM7,%XMM7 |
(1259) 0x452d86 VCMPSD $0x1,%XMM0,%XMM8,%K1 |
(1259) 0x452d8d VMOVSD %XMM7,%XMM5,%XMM5{%K1} |
(1259) 0x452d93 MOV -0xa8(%RBP),%R11 |
(1259) 0x452d9a MOV -0x10(%R11,%RDX,1),%R11 |
(1259) 0x452d9f MOV -0x48(%RBP),%R14 |
(1259) 0x452da3 CMP %RSI,(%R14,%R11,8) |
(1259) 0x452da7 JL 452dc9 |
(1259) 0x452da9 MOV -0x70(%RBP),%R11 |
(1259) 0x452dad VMOVSD -0x10(%R11,%RDX,1),%XMM7 |
(1259) 0x452db4 VMULSD %XMM6,%XMM7,%XMM8 |
(1259) 0x452db8 VADDSD %XMM5,%XMM7,%XMM7 |
(1259) 0x452dbc VCMPSD $0x1,%XMM0,%XMM8,%K1 |
(1259) 0x452dc3 VMOVSD %XMM7,%XMM5,%XMM5{%K1} |
(1259) 0x452dc9 MOV -0xa8(%RBP),%R11 |
(1259) 0x452dd0 MOV -0x8(%R11,%RDX,1),%R11 |
(1259) 0x452dd5 MOV -0x48(%RBP),%R14 |
(1259) 0x452dd9 CMP %RSI,(%R14,%R11,8) |
(1259) 0x452ddd JL 452dff |
(1259) 0x452ddf MOV -0x70(%RBP),%R11 |
(1259) 0x452de3 VMOVSD -0x8(%R11,%RDX,1),%XMM7 |
(1259) 0x452dea VMULSD %XMM6,%XMM7,%XMM8 |
(1259) 0x452dee VADDSD %XMM5,%XMM7,%XMM7 |
(1259) 0x452df2 VCMPSD $0x1,%XMM0,%XMM8,%K1 |
(1259) 0x452df9 VMOVSD %XMM7,%XMM5,%XMM5{%K1} |
(1259) 0x452dff MOV -0xa8(%RBP),%R11 |
(1259) 0x452e06 MOV (%R11,%RDX,1),%R11 |
(1259) 0x452e0a MOV -0x48(%RBP),%R14 |
(1259) 0x452e0e CMP %RSI,(%R14,%R11,8) |
(1259) 0x452e12 JL 452d50 |
(1259) 0x452e18 MOV -0x70(%RBP),%R11 |
(1259) 0x452e1c VMOVSD (%R11,%RDX,1),%XMM7 |
(1259) 0x452e22 VMULSD %XMM6,%XMM7,%XMM8 |
(1259) 0x452e26 VADDSD %XMM5,%XMM7,%XMM7 |
(1259) 0x452e2a VCMPSD $0x1,%XMM0,%XMM8,%K1 |
(1259) 0x452e31 VMOVSD %XMM7,%XMM5,%XMM5{%K1} |
(1259) 0x452e37 JMP 452d50 |
0x452e3c MOV -0xc0(%RBP),%R14 |
0x452e43 NOPW %CS:(%RAX,%RAX,1) |
0x452e50 VUCOMISD %XMM0,%XMM5 |
0x452e54 MOV -0x58(%RBP),%RAX |
0x452e58 VMOVSD (%RAX,%R9,8),%XMM6 |
0x452e5e JE 452ef5 |
0x452e64 VDIVSD %XMM5,%XMM6,%XMM5 |
0x452e68 CMP %RCX,%R10 |
0x452e6b MOV -0x48(%RBP),%R12 |
0x452e6f JGE 452f13 |
0x452e75 VCVTSI2SDQ -0xb8(%RBP),%XMM10,%XMM6 |
0x452e7e MOV -0x78(%RBP),%RDX |
0x452e82 MOV %EDX,%EAX |
0x452e84 NOT %EAX |
0x452e86 ADD %ECX,%EAX |
0x452e88 TEST $0x1,%AL |
0x452e8a JE 452f0a |
0x452e8c MOV 0x8(%RBX,%RDX,8),%RAX |
0x452e91 MOV (%R13,%RAX,8),%RDX |
0x452e96 CMP %RDI,%RDX |
0x452e99 JL 452eca |
0x452e9b MOV -0x58(%RBP),%R10 |
0x452e9f MOV -0x78(%RBP),%R11 |
0x452ea3 VMOVSD 0x8(%R10,%R11,8),%XMM7 |
0x452eaa VMULSD %XMM6,%XMM7,%XMM8 |
0x452eae VUCOMISD %XMM0,%XMM8 |
0x452eb2 JAE 452eca |
0x452eb4 MOV -0xa0(%RBP),%R10 |
0x452ebb MOV (%R10),%R10 |
0x452ebe VFMADD213SD (%R10,%RDX,8),%XMM5,%XMM7 |
0x452ec4 VMOVSD %XMM7,(%R10,%RDX,8) |
0x452eca CMP %R14,%RAX |
0x452ecd JNE 452f02 |
0x452ecf MOV -0x58(%RBP),%RAX |
0x452ed3 MOV -0x78(%RBP),%RDX |
0x452ed7 VMOVSD 0x8(%RAX,%RDX,8),%XMM7 |
0x452edd VMULSD %XMM6,%XMM7,%XMM8 |
0x452ee1 VFMADD213SD %XMM4,%XMM5,%XMM7 |
0x452ee6 VCMPSD $0x1,%XMM0,%XMM8,%K1 |
0x452eed VMOVSD %XMM7,%XMM4,%XMM4{%K1} |
0x452ef3 JMP 452f06 |
0x452ef5 VADDSD %XMM4,%XMM6,%XMM4 |
0x452ef9 MOV -0x48(%RBP),%R12 |
0x452efd JMP 4529de |
0x452f02 MOV -0x78(%RBP),%RDX |
0x452f06 LEA 0x2(%RDX),%R10 |
0x452f0a LEA -0x2(%RCX),%RAX |
0x452f0e CMP %RDX,%RAX |
0x452f11 JNE 452f79 |
0x452f13 CMPQ $0x2,-0xb0(%RBP) |
0x452f1b JL 4529de |
0x452f21 MOV -0x168(%RBP),%RCX |
0x452f28 MOV -0xf0(%RBP),%RDX |
0x452f2f MOV (%RCX,%RDX,8),%RAX |
0x452f33 MOV 0x8(%RCX,%RDX,8),%RCX |
0x452f38 MOV %RCX,%R10 |
0x452f3b SUB %RAX,%R10 |
0x452f3e JLE 4529de |
0x452f44 VCVTSI2SDQ -0xb8(%RBP),%XMM10,%XMM6 |
0x452f4d CMP $0x4,%R10 |
0x452f51 JAE 45308c |
0x452f57 MOV %R10,%RDX |
0x452f5a AND $-0x4,%RDX |
0x452f5e CMP %R10,%RDX |
0x452f61 JAE 4529de |
0x452f67 ADD %RDX,%RAX |
0x452f6a JMP 45304c |
(1257) 0x452f70 ADD $0x2,%R10 |
(1257) 0x452f74 CMP %R10,%RCX |
(1257) 0x452f77 JE 452f13 |
(1257) 0x452f79 MOV (%RBX,%R10,8),%RAX |
(1257) 0x452f7d MOV (%R13,%RAX,8),%RDX |
(1257) 0x452f82 CMP %RDI,%RDX |
(1257) 0x452f85 JL 452fb1 |
(1257) 0x452f87 MOV -0x58(%RBP),%R11 |
(1257) 0x452f8b VMOVSD (%R11,%R10,8),%XMM7 |
(1257) 0x452f91 VMULSD %XMM6,%XMM7,%XMM8 |
(1257) 0x452f95 VUCOMISD %XMM0,%XMM8 |
(1257) 0x452f99 JAE 452fb1 |
(1257) 0x452f9b MOV -0xa0(%RBP),%R11 |
(1257) 0x452fa2 MOV (%R11),%R15 |
(1257) 0x452fa5 VFMADD213SD (%R15,%RDX,8),%XMM5,%XMM7 |
(1257) 0x452fab VMOVSD %XMM7,(%R15,%RDX,8) |
(1257) 0x452fb1 CMP %R14,%RAX |
(1257) 0x452fb4 JNE 452fd6 |
(1257) 0x452fb6 MOV -0x58(%RBP),%RAX |
(1257) 0x452fba VMOVSD (%RAX,%R10,8),%XMM7 |
(1257) 0x452fc0 VMULSD %XMM6,%XMM7,%XMM8 |
(1257) 0x452fc4 VFMADD213SD %XMM4,%XMM5,%XMM7 |
(1257) 0x452fc9 VCMPSD $0x1,%XMM0,%XMM8,%K1 |
(1257) 0x452fd0 VMOVSD %XMM7,%XMM4,%XMM4{%K1} |
(1257) 0x452fd6 MOV 0x8(%RBX,%R10,8),%RAX |
(1257) 0x452fdb MOV (%R13,%RAX,8),%RDX |
(1257) 0x452fe0 CMP %RDI,%RDX |
(1257) 0x452fe3 JL 453010 |
(1257) 0x452fe5 MOV -0x58(%RBP),%R11 |
(1257) 0x452fe9 VMOVSD 0x8(%R11,%R10,8),%XMM7 |
(1257) 0x452ff0 VMULSD %XMM6,%XMM7,%XMM8 |
(1257) 0x452ff4 VUCOMISD %XMM0,%XMM8 |
(1257) 0x452ff8 JAE 453010 |
(1257) 0x452ffa MOV -0xa0(%RBP),%R11 |
(1257) 0x453001 MOV (%R11),%R15 |
(1257) 0x453004 VFMADD213SD (%R15,%RDX,8),%XMM5,%XMM7 |
(1257) 0x45300a VMOVSD %XMM7,(%R15,%RDX,8) |
(1257) 0x453010 CMP %R14,%RAX |
(1257) 0x453013 JNE 452f70 |
(1257) 0x453019 MOV -0x58(%RBP),%RAX |
(1257) 0x45301d VMOVSD 0x8(%RAX,%R10,8),%XMM7 |
(1257) 0x453024 VMULSD %XMM6,%XMM7,%XMM8 |
(1257) 0x453028 VFMADD213SD %XMM4,%XMM5,%XMM7 |
(1257) 0x45302d VCMPSD $0x1,%XMM0,%XMM8,%K1 |
(1257) 0x453034 VMOVSD %XMM7,%XMM4,%XMM4{%K1} |
(1257) 0x45303a JMP 452f70 |
(1255) 0x453040 INC %RAX |
(1255) 0x453043 CMP %RAX,%RCX |
(1255) 0x453046 JE 4529de |
(1255) 0x45304c MOV -0xa8(%RBP),%RDX |
(1255) 0x453053 MOV (%RDX,%RAX,8),%RDX |
(1255) 0x453057 MOV (%R12,%RDX,8),%RDX |
(1255) 0x45305b CMP %RSI,%RDX |
(1255) 0x45305e JL 453040 |
(1255) 0x453060 MOV -0x70(%RBP),%R10 |
(1255) 0x453064 VMOVSD (%R10,%RAX,8),%XMM7 |
(1255) 0x45306a VMULSD %XMM6,%XMM7,%XMM8 |
(1255) 0x45306e VUCOMISD %XMM0,%XMM8 |
(1255) 0x453072 JAE 453040 |
(1255) 0x453074 MOV -0x88(%RBP),%R10 |
(1255) 0x45307b MOV (%R10),%R10 |
(1255) 0x45307e VFMADD213SD (%R10,%RDX,8),%XMM5,%XMM7 |
(1255) 0x453084 VMOVSD %XMM7,(%R10,%RDX,8) |
(1255) 0x45308a JMP 453040 |
0x45308c MOV %R10,%RDX |
0x45308f SHR $0x2,%RDX |
0x453093 LEA 0x18(,%RAX,8),%R11 |
0x45309b JMP 4530ad |
(1256) 0x4530a0 ADD $0x20,%R11 |
(1256) 0x4530a4 DEC %RDX |
(1256) 0x4530a7 JE 452f57 |
(1256) 0x4530ad MOV -0xa8(%RBP),%R15 |
(1256) 0x4530b4 MOV -0x18(%R15,%R11,1),%R15 |
(1256) 0x4530b9 MOV (%R12,%R15,8),%R15 |
(1256) 0x4530bd CMP %RSI,%R15 |
(1256) 0x4530c0 JL 4530f9 |
(1256) 0x4530c2 MOV -0x70(%RBP),%RBX |
(1256) 0x4530c6 VMOVSD -0x18(%RBX,%R11,1),%XMM7 |
(1256) 0x4530cd MOV -0x118(%RBP),%RBX |
(1256) 0x4530d4 VMULSD %XMM6,%XMM7,%XMM8 |
(1256) 0x4530d8 VUCOMISD %XMM0,%XMM8 |
(1256) 0x4530dc JAE 4530f9 |
(1256) 0x4530de MOV -0x88(%RBP),%R12 |
(1256) 0x4530e5 MOV (%R12),%R12 |
(1256) 0x4530e9 VFMADD213SD (%R12,%R15,8),%XMM5,%XMM7 |
(1256) 0x4530ef VMOVSD %XMM7,(%R12,%R15,8) |
(1256) 0x4530f5 MOV -0x48(%RBP),%R12 |
(1256) 0x4530f9 MOV -0xa8(%RBP),%R15 |
(1256) 0x453100 MOV -0x10(%R15,%R11,1),%R15 |
(1256) 0x453105 MOV (%R12,%R15,8),%R15 |
(1256) 0x453109 CMP %RSI,%R15 |
(1256) 0x45310c JL 453145 |
(1256) 0x45310e MOV -0x70(%RBP),%RBX |
(1256) 0x453112 VMOVSD -0x10(%RBX,%R11,1),%XMM7 |
(1256) 0x453119 MOV -0x118(%RBP),%RBX |
(1256) 0x453120 VMULSD %XMM6,%XMM7,%XMM8 |
(1256) 0x453124 VUCOMISD %XMM0,%XMM8 |
(1256) 0x453128 JAE 453145 |
(1256) 0x45312a MOV -0x88(%RBP),%R12 |
(1256) 0x453131 MOV (%R12),%R12 |
(1256) 0x453135 VFMADD213SD (%R12,%R15,8),%XMM5,%XMM7 |
(1256) 0x45313b VMOVSD %XMM7,(%R12,%R15,8) |
(1256) 0x453141 MOV -0x48(%RBP),%R12 |
(1256) 0x453145 MOV -0xa8(%RBP),%R15 |
(1256) 0x45314c MOV -0x8(%R15,%R11,1),%R15 |
(1256) 0x453151 MOV (%R12,%R15,8),%R15 |
(1256) 0x453155 CMP %RSI,%R15 |
(1256) 0x453158 JL 453191 |
(1256) 0x45315a MOV -0x70(%RBP),%RBX |
(1256) 0x45315e VMOVSD -0x8(%RBX,%R11,1),%XMM7 |
(1256) 0x453165 MOV -0x118(%RBP),%RBX |
(1256) 0x45316c VMULSD %XMM6,%XMM7,%XMM8 |
(1256) 0x453170 VUCOMISD %XMM0,%XMM8 |
(1256) 0x453174 JAE 453191 |
(1256) 0x453176 MOV -0x88(%RBP),%R12 |
(1256) 0x45317d MOV (%R12),%R12 |
(1256) 0x453181 VFMADD213SD (%R12,%R15,8),%XMM5,%XMM7 |
(1256) 0x453187 VMOVSD %XMM7,(%R12,%R15,8) |
(1256) 0x45318d MOV -0x48(%RBP),%R12 |
(1256) 0x453191 MOV -0xa8(%RBP),%R15 |
(1256) 0x453198 MOV (%R15,%R11,1),%R15 |
(1256) 0x45319c MOV (%R12,%R15,8),%R15 |
(1256) 0x4531a0 CMP %RSI,%R15 |
(1256) 0x4531a3 JL 4530a0 |
(1256) 0x4531a9 MOV -0x70(%RBP),%RBX |
(1256) 0x4531ad VMOVSD (%RBX,%R11,1),%XMM7 |
(1256) 0x4531b3 MOV -0x118(%RBP),%RBX |
(1256) 0x4531ba VMULSD %XMM6,%XMM7,%XMM8 |
(1256) 0x4531be VUCOMISD %XMM0,%XMM8 |
(1256) 0x4531c2 JAE 4530a0 |
(1256) 0x4531c8 MOV -0x88(%RBP),%R12 |
(1256) 0x4531cf MOV (%R12),%R12 |
(1256) 0x4531d3 VFMADD213SD (%R12,%R15,8),%XMM5,%XMM7 |
(1256) 0x4531d9 VMOVSD %XMM7,(%R12,%R15,8) |
(1256) 0x4531df MOV -0x48(%RBP),%R12 |
(1256) 0x4531e3 JMP 4530a0 |
/scratch_na/users/xoserete/qaas_runs/171-172-8217/intel/AMG/build/AMG/AMG/parcsr_ls/par_lr_interp.c: 1221 - 1675 |
-------------------------------------------------------------------------------- |
1221: if (n_fine) |
[...] |
1609: for (jj = A_diag_i[i]+1; jj < A_diag_i[i+1]; jj++) |
1610: { /* i1 is a c-point and strongly influences i, accumulate |
1611: * a_(i,i1) into interpolation weight */ |
1612: i1 = A_diag_j[jj]; |
1613: if (P_marker[i1] >= jj_begin_row) |
1614: { |
1615: P_diag_data[P_marker[i1]] += A_diag_data[jj]; |
1616: } |
1617: else if(P_marker[i1] == strong_f_marker) |
1618: { |
1619: sum = zero; |
1620: sgn = 1; |
1621: if(A_diag_data[A_diag_i[i1]] < 0) sgn = -1; |
1622: /* Loop over row of A for point i1 and calculate the sum |
1623: * of the connections to c-points that strongly influence i. */ |
1624: for(jj1 = A_diag_i[i1]+1; jj1 < A_diag_i[i1+1]; jj1++) |
1625: { |
1626: i2 = A_diag_j[jj1]; |
1627: if((P_marker[i2] >= jj_begin_row || i2 == i) && (sgn*A_diag_data[jj1]) < 0) |
1628: sum += A_diag_data[jj1]; |
1629: } |
1630: if(num_procs > 1) |
1631: { |
1632: for(jj1 = A_offd_i[i1]; jj1< A_offd_i[i1+1]; jj1++) |
1633: { |
1634: i2 = A_offd_j[jj1]; |
1635: if(P_marker_offd[i2] >= jj_begin_row_offd && |
1636: (sgn*A_offd_data[jj1]) < 0) |
1637: sum += A_offd_data[jj1]; |
1638: } |
1639: } |
1640: if(sum != 0) |
1641: { |
1642: distribute = A_diag_data[jj]/sum; |
1643: /* Loop over row of A for point i1 and do the distribution */ |
1644: for(jj1 = A_diag_i[i1]+1; jj1 < A_diag_i[i1+1]; jj1++) |
1645: { |
1646: i2 = A_diag_j[jj1]; |
1647: if(P_marker[i2] >= jj_begin_row && (sgn*A_diag_data[jj1]) < 0) |
1648: P_diag_data[P_marker[i2]] += |
1649: distribute*A_diag_data[jj1]; |
1650: if(i2 == i && (sgn*A_diag_data[jj1]) < 0) |
1651: diagonal += distribute*A_diag_data[jj1]; |
1652: } |
1653: if(num_procs > 1) |
1654: { |
1655: for(jj1 = A_offd_i[i1]; jj1 < A_offd_i[i1+1]; jj1++) |
1656: { |
1657: i2 = A_offd_j[jj1]; |
1658: if(P_marker_offd[i2] >= jj_begin_row_offd && |
1659: (sgn*A_offd_data[jj1]) < 0) |
1660: P_offd_data[P_marker_offd[i2]] += |
[...] |
1667: diagonal += A_diag_data[jj]; |
1668: } |
1669: } |
1670: /* neighbor i1 weakly influences i, accumulate a_(i,i1) into |
1671: * diagonal */ |
1672: else if (CF_marker[i1] != -3) |
1673: { |
1674: if(num_functions == 1 || dof_func[i] == dof_func[i1]) |
1675: diagonal += A_diag_data[jj]; |
Path / |
Metric | Value |
---|---|
CQA speedup if no scalar integer | 1.84 |
CQA speedup if FP arith vectorized | 2.60 |
CQA speedup if fully vectorized | 8.00 |
CQA speedup if no inter-iteration dependency | NA |
CQA speedup if next bottleneck killed | 1.38 |
Bottlenecks | micro-operation queue |
Function | hypre_BoomerAMGBuildExtPIInterp.extracted |
Source | par_lr_interp.c:1221-1221,par_lr_interp.c:1609-1609,par_lr_interp.c:1612-1617,par_lr_interp.c:1621-1621,par_lr_interp.c:1624-1624,par_lr_interp.c:1627-1627,par_lr_interp.c:1630-1632,par_lr_interp.c:1635-1636,par_lr_interp.c:1640-1650,par_lr_interp.c:1653-1655,par_lr_interp.c:1659-1659,par_lr_interp.c:1667-1667,par_lr_interp.c:1672-1675 |
Source loop unroll info | NA |
Source loop unroll confidence level | NA |
Unroll/vectorization loop type | NA |
Unroll factor | NA |
CQA cycles | 27.67 |
CQA cycles if no scalar integer | 15.00 |
CQA cycles if FP arith vectorized | 10.65 |
CQA cycles if fully vectorized | 3.46 |
Front-end cycles | 27.67 |
DIV/SQRT cycles | 4.00 |
P0 cycles | 16.50 |
P1 cycles | 15.20 |
P2 cycles | 20.00 |
P3 cycles | 20.00 |
P4 cycles | 4.00 |
P5 cycles | 15.40 |
P6 cycles | 16.50 |
P7 cycles | 4.00 |
P8 cycles | 4.00 |
P9 cycles | 4.00 |
P10 cycles | 15.40 |
P11 cycles | 20.00 |
Inter-iter dependencies cycles | NA |
FE+BE cycles (UFS) | 27.96 - 27.98 |
Stall cycles (UFS) | 0.00 |
Nb insns | 160.00 |
Nb uops | 162.00 |
Nb loads | 60.00 |
Nb stores | 8.00 |
Nb stack references | 16.00 |
FLOP/cycle | 0.36 |
Nb FLOP add-sub | 3.00 |
Nb FLOP mul | 2.00 |
Nb FLOP fma | 2.00 |
Nb FLOP div | 1.00 |
Nb FLOP rcp | 0.00 |
Nb FLOP sqrt | 0.00 |
Nb FLOP rsqrt | 0.00 |
Bytes/cycle | 19.66 |
Bytes prefetched | 0.00 |
Bytes loaded | 480.00 |
Bytes stored | 64.00 |
Stride 0 | NA |
Stride 1 | NA |
Stride n | NA |
Stride unknown | NA |
Stride indirect | NA |
Vectorization ratio all | 3.45 |
Vectorization ratio load | 0.00 |
Vectorization ratio store | 0.00 |
Vectorization ratio mul | 0.00 |
Vectorization ratio add_sub | 0.00 |
Vectorization ratio fma | 0.00 |
Vectorization ratio div_sqrt | 0.00 |
Vectorization ratio other | 6.06 |
Vector-efficiency ratio all | 12.93 |
Vector-efficiency ratio load | 12.50 |
Vector-efficiency ratio store | 12.50 |
Vector-efficiency ratio mul | 12.50 |
Vector-efficiency ratio add_sub | 12.50 |
Vector-efficiency ratio fma | 12.50 |
Vector-efficiency ratio div_sqrt | 12.50 |
Vector-efficiency ratio other | 13.26 |
Metric | Value |
---|---|
CQA speedup if no scalar integer | 1.84 |
CQA speedup if FP arith vectorized | 2.60 |
CQA speedup if fully vectorized | 8.00 |
CQA speedup if no inter-iteration dependency | NA |
CQA speedup if next bottleneck killed | 1.38 |
Bottlenecks | micro-operation queue |
Function | hypre_BoomerAMGBuildExtPIInterp.extracted |
Source | par_lr_interp.c:1221-1221,par_lr_interp.c:1609-1609,par_lr_interp.c:1612-1617,par_lr_interp.c:1621-1621,par_lr_interp.c:1624-1624,par_lr_interp.c:1627-1627,par_lr_interp.c:1630-1632,par_lr_interp.c:1635-1636,par_lr_interp.c:1640-1650,par_lr_interp.c:1653-1655,par_lr_interp.c:1659-1659,par_lr_interp.c:1667-1667,par_lr_interp.c:1672-1675 |
Source loop unroll info | NA |
Source loop unroll confidence level | NA |
Unroll/vectorization loop type | NA |
Unroll factor | NA |
CQA cycles | 27.67 |
CQA cycles if no scalar integer | 15.00 |
CQA cycles if FP arith vectorized | 10.65 |
CQA cycles if fully vectorized | 3.46 |
Front-end cycles | 27.67 |
DIV/SQRT cycles | 4.00 |
P0 cycles | 16.50 |
P1 cycles | 15.20 |
P2 cycles | 20.00 |
P3 cycles | 20.00 |
P4 cycles | 4.00 |
P5 cycles | 15.40 |
P6 cycles | 16.50 |
P7 cycles | 4.00 |
P8 cycles | 4.00 |
P9 cycles | 4.00 |
P10 cycles | 15.40 |
P11 cycles | 20.00 |
Inter-iter dependencies cycles | NA |
FE+BE cycles (UFS) | 27.96 - 27.98 |
Stall cycles (UFS) | 0.00 |
Nb insns | 160.00 |
Nb uops | 162.00 |
Nb loads | 60.00 |
Nb stores | 8.00 |
Nb stack references | 16.00 |
FLOP/cycle | 0.36 |
Nb FLOP add-sub | 3.00 |
Nb FLOP mul | 2.00 |
Nb FLOP fma | 2.00 |
Nb FLOP div | 1.00 |
Nb FLOP rcp | 0.00 |
Nb FLOP sqrt | 0.00 |
Nb FLOP rsqrt | 0.00 |
Bytes/cycle | 19.66 |
Bytes prefetched | 0.00 |
Bytes loaded | 480.00 |
Bytes stored | 64.00 |
Stride 0 | NA |
Stride 1 | NA |
Stride n | NA |
Stride unknown | NA |
Stride indirect | NA |
Vectorization ratio all | 3.45 |
Vectorization ratio load | 0.00 |
Vectorization ratio store | 0.00 |
Vectorization ratio mul | 0.00 |
Vectorization ratio add_sub | 0.00 |
Vectorization ratio fma | 0.00 |
Vectorization ratio div_sqrt | 0.00 |
Vectorization ratio other | 6.06 |
Vector-efficiency ratio all | 12.93 |
Vector-efficiency ratio load | 12.50 |
Vector-efficiency ratio store | 12.50 |
Vector-efficiency ratio mul | 12.50 |
Vector-efficiency ratio add_sub | 12.50 |
Vector-efficiency ratio fma | 12.50 |
Vector-efficiency ratio div_sqrt | 12.50 |
Vector-efficiency ratio other | 13.26 |
Path / |
Function | hypre_BoomerAMGBuildExtPIInterp.extracted |
Source file and lines | par_lr_interp.c:1221-1675 |
Module | exec |
nb instructions | 160 |
nb uops | 162 |
loop length | 757 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 7 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 16 |
ADD-SUB / MUL ratio | 1.50 |
micro-operation queue | 27.67 cycles |
front end | 27.67 cycles |
 | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 16.50 | 15.20 | 20.00 | 20.00 | 4.00 | 15.40 | 16.50 | 4.00 | 4.00 | 4.00 | 15.40 | 20.00 |
cycles | 16.50 | 15.20 | 20.00 | 20.00 | 4.00 | 15.40 | 16.50 | 4.00 | 4.00 | 4.00 | 15.40 | 20.00 |
Cycles executing div or sqrt instructions | 4.00 |
FE+BE cycles | 27.96-27.98 |
Stall cycles | 0.00 |
Front-end | 27.67 |
Dispatch | 20.00 |
DIV/SQRT | 4.00 |
Overall L1 | 27.67 |
all | 2% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 3% |
all | 5% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | 0% |
div/sqrt | 0% |
other | 16% |
all | 3% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | 0% |
div/sqrt | 0% |
other | 6% |
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 13% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | 12% |
div/sqrt | 12% |
other | 14% |
all | 12% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | 12% |
div/sqrt | 12% |
other | 13% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
MOV -0xa0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD (%RCX,%RAX,8),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x58(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RDX,%R9,8),%XMM5,%XMM5 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM5,(%RCX,%RAX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
INC %R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP -0x80(%RBP),%R9 | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 4531e8 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1bf8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%RBX,%R9,8),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R13,%R10,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDI,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4529c0 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x13d0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R8,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 452af0 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1500> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x180(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX,%R10,8),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPXOR %XMM5,%XMM5,%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x58(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VUCOMISD (%RDX,%R11,8),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R10,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x8(%RCX,%R10,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SETBE %AL | 2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 1-2 | 1 |
LEA -0x1(%RAX,%RAX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x1(%R11),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RCX,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R11,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 452b30 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1540> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VCVTSI2SDQ -0xb8(%RBP),%XMM10,%XMM6 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 0.50 |
NOT %R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RCX,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R11,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP $0x4,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 452bf1 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1601> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xb0(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 452b30 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1540> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x78(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%RDX,%RAX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JMP 452a9c <hypre_BoomerAMGBuildExtPIInterp.extracted+0x14ac> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV -0xe8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMPQ $-0x3,(%RAX,%R10,8) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 4529de <hypre_BoomerAMGBuildExtPIInterp.extracted+0x13ee> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMPQ $0x1,-0x178(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 452b21 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1531> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x170(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX,%R14,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP (%RCX,%R10,8),%RAX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JNE 4529de <hypre_BoomerAMGBuildExtPIInterp.extracted+0x13ee> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RAX,%R9,8),%XMM4,%XMM4 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
JMP 4529de <hypre_BoomerAMGBuildExtPIInterp.extracted+0x13ee> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0xc8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP $0x2,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 452e50 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1860> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x168(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xf0(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDX,%R11,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RDX,%R11,8),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 452e50 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1860> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VCVTSI2SDQ -0xb8(%RBP),%XMM10,%XMM6 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 0.50 |
CMP $0x4,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R15,-0x138(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JAE 452d40 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1750> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x138(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R11,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %R11,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 452e3c <hypre_BoomerAMGBuildExtPIInterp.extracted+0x184c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0xc0(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 452bbc <hypre_BoomerAMGBuildExtPIInterp.extracted+0x15cc> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV -0xb0(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SHR $0x2,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV -0x78(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x20(,%RAX,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM7,%XMM7,%XMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 452c1d <hypre_BoomerAMGBuildExtPIInterp.extracted+0x162d> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
SHR $0x2,%R15 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
LEA 0x18(,%RAX,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 452d5d <hypre_BoomerAMGBuildExtPIInterp.extracted+0x176d> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV -0xc0(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD %XMM0,%XMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV -0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD (%RAX,%R9,8),%XMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JE 452ef5 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1905> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VDIVSD %XMM5,%XMM6,%XMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 13-15 | 4 |
CMP %RCX,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x48(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JGE 452f13 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1923> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VCVTSI2SDQ -0xb8(%RBP),%XMM10,%XMM6 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 0.50 |
MOV -0x78(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %EDX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %ECX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
TEST $0x1,%AL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 452f0a <hypre_BoomerAMGBuildExtPIInterp.extracted+0x191a> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x8(%RBX,%RDX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R13,%RAX,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDI,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 452eca <hypre_BoomerAMGBuildExtPIInterp.extracted+0x18da> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x58(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x78(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x8(%R10,%R11,8),%XMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD %XMM6,%XMM7,%XMM8 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VUCOMISD %XMM0,%XMM8 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JAE 452eca <hypre_BoomerAMGBuildExtPIInterp.extracted+0x18da> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xa0(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VFMADD213SD (%R10,%RDX,8),%XMM5,%XMM7 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VMOVSD %XMM7,(%R10,%RDX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %R14,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 452f02 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1912> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x78(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x8(%RAX,%RDX,8),%XMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD %XMM6,%XMM7,%XMM8 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD213SD %XMM4,%XMM5,%XMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VCMPSD $0x1,%XMM0,%XMM8,%K1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVSD %XMM7,%XMM4,%XMM4{%K1} | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
JMP 452f06 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1916> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
VADDSD %XMM4,%XMM6,%XMM4 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOV -0x48(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4529de <hypre_BoomerAMGBuildExtPIInterp.extracted+0x13ee> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x78(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x2(%RDX),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x2(%RCX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 452f79 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1989> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMPQ $0x2,-0xb0(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JL 4529de <hypre_BoomerAMGBuildExtPIInterp.extracted+0x13ee> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x168(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xf0(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX,%RDX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RCX,%RDX,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RAX,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4529de <hypre_BoomerAMGBuildExtPIInterp.extracted+0x13ee> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VCVTSI2SDQ -0xb8(%RBP),%XMM10,%XMM6 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 0.50 |
CMP $0x4,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 45308c <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1a9c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R10,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %R10,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 4529de <hypre_BoomerAMGBuildExtPIInterp.extracted+0x13ee> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JMP 45304c <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1a5c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R10,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x2,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
LEA 0x18(,%RAX,8),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4530ad <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1abd> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
Function | hypre_BoomerAMGBuildExtPIInterp.extracted |
Source file and lines | par_lr_interp.c:1221-1675 |
Module | exec |
nb instructions | 160 |
nb uops | 162 |
loop length | 757 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 7 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 16 |
ADD-SUB / MUL ratio | 1.50 |
micro-operation queue | 27.67 cycles |
front end | 27.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 16.50 | 15.20 | 20.00 | 20.00 | 4.00 | 15.40 | 16.50 | 4.00 | 4.00 | 4.00 | 15.40 | 20.00 |
cycles | 16.50 | 15.20 | 20.00 | 20.00 | 4.00 | 15.40 | 16.50 | 4.00 | 4.00 | 4.00 | 15.40 | 20.00 |
Cycles executing div or sqrt instructions | 4.00 |
FE+BE cycles | 27.96-27.98 |
Stall cycles | 0.00 |
Front-end | 27.67 |
Dispatch | 20.00 |
DIV/SQRT | 4.00 |
Overall L1 | 27.67 |
all | 2% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 3% |
all | 5% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | 0% |
div/sqrt | 0% |
other | 16% |
all | 3% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | 0% |
div/sqrt | 0% |
other | 6% |
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 13% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | 12% |
div/sqrt | 12% |
other | 14% |
all | 12% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | 12% |
div/sqrt | 12% |
other | 13% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
MOV -0xa0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD (%RCX,%RAX,8),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x58(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RDX,%R9,8),%XMM5,%XMM5 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM5,(%RCX,%RAX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
INC %R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP -0x80(%RBP),%R9 | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 4531e8 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1bf8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%RBX,%R9,8),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R13,%R10,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDI,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4529c0 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x13d0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R8,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 452af0 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1500> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x180(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX,%R10,8),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPXOR %XMM5,%XMM5,%XMM5 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x58(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VUCOMISD (%RDX,%R11,8),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R10,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x8(%RCX,%R10,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SETBE %AL | 2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 1-2 | 1 |
LEA -0x1(%RAX,%RAX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x1(%R11),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RCX,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R11,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 452b30 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1540> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VCVTSI2SDQ -0xb8(%RBP),%XMM10,%XMM6 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 0.50 |
NOT %R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RCX,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R11,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP $0x4,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 452bf1 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1601> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xb0(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 452b30 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1540> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x78(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%RDX,%RAX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JMP 452a9c <hypre_BoomerAMGBuildExtPIInterp.extracted+0x14ac> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV -0xe8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMPQ $-0x3,(%RAX,%R10,8) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 4529de <hypre_BoomerAMGBuildExtPIInterp.extracted+0x13ee> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMPQ $0x1,-0x178(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 452b21 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1531> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x170(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX,%R14,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP (%RCX,%R10,8),%RAX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JNE 4529de <hypre_BoomerAMGBuildExtPIInterp.extracted+0x13ee> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RAX,%R9,8),%XMM4,%XMM4 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
JMP 4529de <hypre_BoomerAMGBuildExtPIInterp.extracted+0x13ee> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0xc8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP $0x2,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 452e50 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1860> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x168(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xf0(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDX,%R11,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RDX,%R11,8),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 452e50 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1860> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VCVTSI2SDQ -0xb8(%RBP),%XMM10,%XMM6 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 0.50 |
CMP $0x4,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R15,-0x138(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JAE 452d40 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1750> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x138(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R11,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %R11,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 452e3c <hypre_BoomerAMGBuildExtPIInterp.extracted+0x184c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0xc0(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 452bbc <hypre_BoomerAMGBuildExtPIInterp.extracted+0x15cc> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV -0xb0(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SHR $0x2,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV -0x78(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x20(,%RAX,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM7,%XMM7,%XMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 452c1d <hypre_BoomerAMGBuildExtPIInterp.extracted+0x162d> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
SHR $0x2,%R15 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
LEA 0x18(,%RAX,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 452d5d <hypre_BoomerAMGBuildExtPIInterp.extracted+0x176d> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV -0xc0(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD %XMM0,%XMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV -0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD (%RAX,%R9,8),%XMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JE 452ef5 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1905> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VDIVSD %XMM5,%XMM6,%XMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 13-15 | 4 |
CMP %RCX,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x48(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JGE 452f13 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1923> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VCVTSI2SDQ -0xb8(%RBP),%XMM10,%XMM6 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 0.50 |
MOV -0x78(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %EDX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %ECX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
TEST $0x1,%AL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 452f0a <hypre_BoomerAMGBuildExtPIInterp.extracted+0x191a> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x8(%RBX,%RDX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R13,%RAX,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDI,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 452eca <hypre_BoomerAMGBuildExtPIInterp.extracted+0x18da> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x58(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x78(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x8(%R10,%R11,8),%XMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD %XMM6,%XMM7,%XMM8 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VUCOMISD %XMM0,%XMM8 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JAE 452eca <hypre_BoomerAMGBuildExtPIInterp.extracted+0x18da> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xa0(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VFMADD213SD (%R10,%RDX,8),%XMM5,%XMM7 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VMOVSD %XMM7,(%R10,%RDX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %R14,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 452f02 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1912> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x58(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x78(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x8(%RAX,%RDX,8),%XMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD %XMM6,%XMM7,%XMM8 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD213SD %XMM4,%XMM5,%XMM7 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VCMPSD $0x1,%XMM0,%XMM8,%K1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVSD %XMM7,%XMM4,%XMM4{%K1} | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
JMP 452f06 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1916> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
VADDSD %XMM4,%XMM6,%XMM4 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOV -0x48(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4529de <hypre_BoomerAMGBuildExtPIInterp.extracted+0x13ee> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x78(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x2(%RDX),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x2(%RCX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 452f79 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1989> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMPQ $0x2,-0xb0(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JL 4529de <hypre_BoomerAMGBuildExtPIInterp.extracted+0x13ee> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x168(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xf0(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX,%RDX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RCX,%RDX,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RAX,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4529de <hypre_BoomerAMGBuildExtPIInterp.extracted+0x13ee> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VCVTSI2SDQ -0xb8(%RBP),%XMM10,%XMM6 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 0.50 |
CMP $0x4,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 45308c <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1a9c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R10,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %R10,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 4529de <hypre_BoomerAMGBuildExtPIInterp.extracted+0x13ee> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JMP 45304c <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1a5c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R10,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x2,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
LEA 0x18(,%RAX,8),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4530ad <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1abd> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |