Loop Id: 1314 | Module: exec | Source: par_lr_interp.c:1221-1675 [...] | Coverage: 0.05% |
---|
Loop Id: 1314 | Module: exec | Source: par_lr_interp.c:1221-1675 [...] | Coverage: 0.05% |
---|
0x4549b0 MOV -0x158(%RBP),%RAX |
0x4549b7 MOV (%RAX,%R11,8),%R15 |
0x4549bb MOV (%RBX,%R15,8),%RAX |
0x4549bf CMP %R9,%RAX |
0x4549c2 JGE 454e60 |
0x4549c8 CMP -0x58(%RBP),%RAX |
0x4549cc JNE 454e90 |
0x4549d2 MOV -0x1a0(%RBP),%RCX |
0x4549d9 MOV (%RCX,%R15,8),%RSI |
0x4549dd VXORPD %XMM9,%XMM9,%XMM9 |
0x4549e2 XOR %EAX,%EAX |
0x4549e4 MOV -0xc8(%RBP),%RDX |
0x4549eb VUCOMISD (%RDX,%RSI,8),%XMM9 |
0x4549f0 MOV 0x8(%RCX,%R15,8),%R12 |
0x4549f5 SETBE %AL |
0x4549f8 LEA -0x1(%RAX,%RAX,1),%RAX |
0x4549fd MOV %RAX,-0xb0(%RBP) |
0x454a04 MOV %RSI,-0x68(%RBP) |
0x454a08 LEA 0x1(%RSI),%RAX |
0x454a0c CMP %R12,%RAX |
0x454a0f JGE 454ae0 |
0x454a15 VCVTSI2SDQ -0xb0(%RBP),%XMM16,%XMM10 |
0x454a1c MOV -0x68(%RBP),%R13 |
0x454a20 MOV %R13,%RSI |
0x454a23 NOT %RSI |
0x454a26 ADD %R12,%RSI |
0x454a29 MOV %RSI,%RDX |
0x454a2c AND $-0x4,%RDX |
0x454a30 JE 454ee8 |
0x454a36 LEA -0x1(%RDX),%RDI |
0x454a3a VBROADCASTSD %XMM10,%YMM9 |
0x454a3f MOV -0x80(%RBP),%RCX |
0x454a43 LEA (%RCX,%R13,8),%RCX |
0x454a47 MOV -0xc0(%RBP),%R8 |
0x454a4e LEA (%R8,%R13,8),%R13 |
0x454a52 VXORPD %XMM12,%XMM12,%XMM12 |
0x454a57 VXORPD %XMM11,%XMM11,%XMM11 |
0x454a5c XOR %R14D,%R14D |
0x454a5f NOP |
(1321) 0x454a60 VMOVDQU (%R13,%R14,8),%YMM13 |
(1321) 0x454a67 VPXOR %XMM14,%XMM14,%XMM14 |
(1321) 0x454a6c KXNORW %K0,%K0,%K1 |
(1321) 0x454a70 VPGATHERQQ (%RBX,%YMM13,8),%YMM14{%K1} |
(1321) 0x454a77 VPCMPNLTQ %YMM6,%YMM14,%K0 |
(1321) 0x454a7e VPCMPEQQ %YMM7,%YMM13,%K1 |
(1321) 0x454a84 VPCMPGTQ %YMM14,%YMM6,%K1{%K1} |
(1321) 0x454a8a KORW %K1,%K0,%K1 |
(1321) 0x454a8e VMOVUPD (%RCX,%R14,8),%YMM13{%K1}{z} |
(1321) 0x454a95 VMULPD %YMM9,%YMM13,%YMM14 |
(1321) 0x454a9a VCMPPD $0x1,%YMM12,%YMM14,%K1{%K1} |
(1321) 0x454aa1 VADDPD %YMM13,%YMM11,%YMM11{%K1} |
(1321) 0x454aa7 ADD $0x4,%R14 |
(1321) 0x454aab CMP %RDI,%R14 |
(1321) 0x454aae JBE 454a60 |
0x454ab0 VEXTRACTF128 $0x1,%YMM11,%XMM9 |
0x454ab6 VADDPD %XMM9,%XMM11,%XMM9 |
0x454abb VSHUFPD $0x1,%XMM9,%XMM9,%XMM11 |
0x454ac1 VADDSD %XMM11,%XMM9,%XMM9 |
0x454ac6 CMP %RDX,%RSI |
0x454ac9 MOV -0x110(%RBP),%R14 |
0x454ad0 MOV -0xd0(%RBP),%R8 |
0x454ad7 JNE 454eea |
0x454add NOPL (%RAX) |
0x454ae0 MOV -0xe0(%RBP),%RCX |
0x454ae7 MOV (%RCX),%R13 |
0x454aea CMP $0x2,%R13 |
0x454aee JL 454bf0 |
0x454af4 MOV -0x170(%RBP),%RCX |
0x454afb MOV (%RCX,%R15,8),%RSI |
0x454aff MOV 0x8(%RCX,%R15,8),%RDX |
0x454b04 MOV %RDX,%RDI |
0x454b07 SUB %RSI,%RDI |
0x454b0a JLE 454bf0 |
0x454b10 MOV %RSI,-0x108(%RBP) |
0x454b17 VCVTSI2SDQ -0xb0(%RBP),%XMM16,%XMM10 |
0x454b1e MOV %RDI,%RSI |
0x454b21 AND $-0x4,%RSI |
0x454b25 JE 454f5f |
0x454b2b MOV %R13,-0x168(%RBP) |
0x454b32 LEA -0x1(%RSI),%RCX |
0x454b36 VBROADCASTSD %XMM10,%YMM11 |
0x454b3b MOV -0x88(%RBP),%R8 |
0x454b42 MOV -0x108(%RBP),%R10 |
0x454b49 LEA (%R8,%R10,8),%R13 |
0x454b4d MOV -0xf0(%RBP),%R8 |
0x454b54 MOV %R14,%R10 |
0x454b57 MOV -0x108(%RBP),%R14 |
0x454b5e LEA (%R8,%R14,8),%R14 |
0x454b62 VXORPD %XMM13,%XMM13,%XMM13 |
0x454b67 VXORPD %XMM12,%XMM12,%XMM12 |
0x454b6c XOR %R8D,%R8D |
0x454b6f NOP |
(1319) 0x454b70 VMOVDQU (%R14,%R8,8),%YMM14 |
(1319) 0x454b76 KXNORW %K0,%K0,%K1 |
(1319) 0x454b7a VPXOR %XMM15,%XMM15,%XMM15 |
(1319) 0x454b7f VPGATHERQQ (%R10,%YMM14,8),%YMM15{%K1} |
(1319) 0x454b86 VPCMPNLTQ %YMM8,%YMM15,%K1 |
(1319) 0x454b8d VMOVUPD (%R13,%R8,8),%YMM14{%K1}{z} |
(1319) 0x454b95 VMULPD %YMM11,%YMM14,%YMM15 |
(1319) 0x454b9a VCMPPD $0x1,%YMM13,%YMM15,%K1{%K1} |
(1319) 0x454ba1 VADDPD %YMM14,%YMM12,%YMM12{%K1} |
(1319) 0x454ba7 ADD $0x4,%R8 |
(1319) 0x454bab CMP %RCX,%R8 |
(1319) 0x454bae JBE 454b70 |
0x454bb0 VEXTRACTF128 $0x1,%YMM12,%XMM11 |
0x454bb6 VADDPD %XMM11,%XMM12,%XMM11 |
0x454bbb VSHUFPD $0x1,%XMM11,%XMM11,%XMM12 |
0x454bc1 VADDSD %XMM12,%XMM11,%XMM11 |
0x454bc6 VADDSD %XMM11,%XMM9,%XMM9 |
0x454bcb CMP %RSI,%RDI |
0x454bce MOV %R10,%R14 |
0x454bd1 MOV -0x50(%RBP),%R10 |
0x454bd5 MOV -0xd0(%RBP),%R8 |
0x454bdc MOV -0x168(%RBP),%R13 |
0x454be3 JNE 454f61 |
0x454be9 NOPL (%RAX) |
0x454bf0 VUCOMISD %XMM0,%XMM9 |
0x454bf4 MOV -0xc8(%RBP),%RCX |
0x454bfb VMOVSD (%RCX,%R11,8),%XMM10 |
0x454c01 JE 454ec8 |
0x454c07 VDIVSD %XMM9,%XMM10,%XMM9 |
0x454c0c CMP %R12,%RAX |
0x454c0f JGE 454cbd |
0x454c15 VCVTSI2SDQ -0xb0(%RBP),%XMM16,%XMM10 |
0x454c1c MOV -0x68(%RBP),%RDX |
0x454c20 MOV %EDX,%ECX |
0x454c22 NOT %ECX |
0x454c24 ADD %R12D,%ECX |
0x454c27 TEST $0x1,%CL |
0x454c2a JE 454cb3 |
0x454c30 MOV -0x158(%RBP),%RAX |
0x454c37 MOV 0x8(%RAX,%RDX,8),%RAX |
0x454c3c MOV (%RBX,%RAX,8),%RCX |
0x454c40 CMP %R9,%RCX |
0x454c43 JL 454c7e |
0x454c45 MOV -0xc8(%RBP),%RDX |
0x454c4c MOV -0x68(%RBP),%RSI |
0x454c50 VMOVSD 0x8(%RDX,%RSI,8),%XMM11 |
0x454c56 MOV -0x68(%RBP),%RDX |
0x454c5a VMULSD %XMM10,%XMM11,%XMM12 |
0x454c5f VUCOMISD %XMM0,%XMM12 |
0x454c63 JAE 454c7e |
0x454c65 MOV -0x90(%RBP),%RDX |
0x454c6c MOV (%RDX),%RDX |
0x454c6f VFMADD213SD (%RDX,%RCX,8),%XMM9,%XMM11 |
0x454c75 VMOVSD %XMM11,(%RDX,%RCX,8) |
0x454c7a MOV -0x68(%RBP),%RDX |
0x454c7e CMP %R10,%RAX |
0x454c81 JNE 454caf |
0x454c83 MOV -0xc8(%RBP),%RAX |
0x454c8a VMOVSD 0x8(%RAX,%RDX,8),%XMM11 |
0x454c90 VMULSD %XMM10,%XMM11,%XMM12 |
0x454c95 VMULSD %XMM9,%XMM11,%XMM11 |
0x454c9a VCMPSD $0x1,%XMM0,%XMM12,%K1 |
0x454ca1 VMOVAPD %XMM1,%XMM12 |
0x454ca5 VMOVSD %XMM11,%XMM12,%XMM12{%K1} |
0x454cab VADDSD %XMM5,%XMM12,%XMM5 |
0x454caf LEA 0x2(%RDX),%RAX |
0x454cb3 LEA -0x2(%R12),%RCX |
0x454cb8 CMP %RDX,%RCX |
0x454cbb JNE 454d29 |
0x454cbd CMP $0x2,%R13 |
0x454cc1 JL 454ecc |
0x454cc7 MOV -0x170(%RBP),%RCX |
0x454cce MOV (%RCX,%R15,8),%RAX |
0x454cd2 MOV 0x8(%RCX,%R15,8),%RCX |
0x454cd7 MOV %RCX,%RSI |
0x454cda SUB %RAX,%RSI |
0x454cdd JLE 454ecc |
0x454ce3 VCVTSI2SDQ -0xb0(%RBP),%XMM16,%XMM10 |
0x454cea CMP $0x4,%RSI |
0x454cee MOV -0xa8(%RBP),%R12 |
0x454cf5 JAE 454fba |
0x454cfb MOV %RSI,%RDX |
0x454cfe AND $-0x4,%RDX |
0x454d02 CMP %RSI,%RDX |
0x454d05 JAE 4550f0 |
0x454d0b ADD %RDX,%RAX |
0x454d0e MOV -0x70(%RBP),%R15 |
0x454d12 MOV -0xd0(%RBP),%R8 |
0x454d19 JMP 454e1c |
(1317) 0x454d20 ADD $0x2,%RAX |
(1317) 0x454d24 CMP %RAX,%R12 |
(1317) 0x454d27 JE 454cbd |
(1317) 0x454d29 MOV -0xc0(%RBP),%RCX |
(1317) 0x454d30 MOV -0x8(%RCX,%RAX,8),%RCX |
(1317) 0x454d35 MOV (%RBX,%RCX,8),%RDX |
(1317) 0x454d39 CMP %R9,%RDX |
(1317) 0x454d3c JL 454d68 |
(1317) 0x454d3e MOV -0x80(%RBP),%RSI |
(1317) 0x454d42 VMOVSD -0x8(%RSI,%RAX,8),%XMM11 |
(1317) 0x454d48 VMULSD %XMM10,%XMM11,%XMM12 |
(1317) 0x454d4d VUCOMISD %XMM0,%XMM12 |
(1317) 0x454d51 JAE 454d68 |
(1317) 0x454d53 MOV -0x90(%RBP),%RSI |
(1317) 0x454d5a MOV (%RSI),%RSI |
(1317) 0x454d5d VFMADD213SD (%RSI,%RDX,8),%XMM9,%XMM11 |
(1317) 0x454d63 VMOVSD %XMM11,(%RSI,%RDX,8) |
(1317) 0x454d68 CMP %R10,%RCX |
(1317) 0x454d6b JNE 454d96 |
(1317) 0x454d6d MOV -0x80(%RBP),%RCX |
(1317) 0x454d71 VMOVSD -0x8(%RCX,%RAX,8),%XMM11 |
(1317) 0x454d77 VMULSD %XMM10,%XMM11,%XMM12 |
(1317) 0x454d7c VMULSD %XMM9,%XMM11,%XMM11 |
(1317) 0x454d81 VCMPSD $0x1,%XMM0,%XMM12,%K1 |
(1317) 0x454d88 VMOVAPD %XMM1,%XMM12 |
(1317) 0x454d8c VMOVSD %XMM11,%XMM12,%XMM12{%K1} |
(1317) 0x454d92 VADDSD %XMM5,%XMM12,%XMM5 |
(1317) 0x454d96 MOV -0xc0(%RBP),%RCX |
(1317) 0x454d9d MOV (%RCX,%RAX,8),%RCX |
(1317) 0x454da1 MOV (%RBX,%RCX,8),%RDX |
(1317) 0x454da5 CMP %R9,%RDX |
(1317) 0x454da8 JL 454dd3 |
(1317) 0x454daa MOV -0x80(%RBP),%RSI |
(1317) 0x454dae VMOVSD (%RSI,%RAX,8),%XMM11 |
(1317) 0x454db3 VMULSD %XMM10,%XMM11,%XMM12 |
(1317) 0x454db8 VUCOMISD %XMM0,%XMM12 |
(1317) 0x454dbc JAE 454dd3 |
(1317) 0x454dbe MOV -0x90(%RBP),%RSI |
(1317) 0x454dc5 MOV (%RSI),%RSI |
(1317) 0x454dc8 VFMADD213SD (%RSI,%RDX,8),%XMM9,%XMM11 |
(1317) 0x454dce VMOVSD %XMM11,(%RSI,%RDX,8) |
(1317) 0x454dd3 CMP %R10,%RCX |
(1317) 0x454dd6 JNE 454d20 |
(1317) 0x454ddc MOV -0x80(%RBP),%RCX |
(1317) 0x454de0 VMOVSD (%RCX,%RAX,8),%XMM11 |
(1317) 0x454de5 VMULSD %XMM10,%XMM11,%XMM12 |
(1317) 0x454dea VMULSD %XMM9,%XMM11,%XMM11 |
(1317) 0x454def VCMPSD $0x1,%XMM0,%XMM12,%K1 |
(1317) 0x454df6 VMOVAPD %XMM1,%XMM12 |
(1317) 0x454dfa VMOVSD %XMM11,%XMM12,%XMM12{%K1} |
(1317) 0x454e00 VADDSD %XMM5,%XMM12,%XMM5 |
(1317) 0x454e04 JMP 454d20 |
(1315) 0x454e10 INC %RAX |
(1315) 0x454e13 CMP %RAX,%RCX |
(1315) 0x454e16 JE 454ed7 |
(1315) 0x454e1c MOV -0xf0(%RBP),%RDX |
(1315) 0x454e23 MOV (%RDX,%RAX,8),%RDX |
(1315) 0x454e27 MOV (%R14,%RDX,8),%RDX |
(1315) 0x454e2b CMP -0x30(%RBP),%RDX |
(1315) 0x454e2f JL 454e10 |
(1315) 0x454e31 MOV -0x88(%RBP),%RSI |
(1315) 0x454e38 VMOVSD (%RSI,%RAX,8),%XMM11 |
(1315) 0x454e3d VMULSD %XMM10,%XMM11,%XMM12 |
(1315) 0x454e42 VUCOMISD %XMM0,%XMM12 |
(1315) 0x454e46 JAE 454e10 |
(1315) 0x454e48 MOV -0x60(%RBP),%RSI |
(1315) 0x454e4c MOV (%RSI),%RSI |
(1315) 0x454e4f VFMADD213SD (%RSI,%RDX,8),%XMM9,%XMM11 |
(1315) 0x454e55 VMOVSD %XMM11,(%RSI,%RDX,8) |
(1315) 0x454e5a JMP 454e10 |
0x454e60 MOV -0x90(%RBP),%RCX |
0x454e67 MOV (%RCX),%RCX |
0x454e6a VMOVSD (%RCX,%RAX,8),%XMM9 |
0x454e6f MOV -0xc8(%RBP),%RDX |
0x454e76 VADDSD (%RDX,%R11,8),%XMM9,%XMM9 |
0x454e7c VMOVSD %XMM9,(%RCX,%RAX,8) |
0x454e81 JMP 454ed3 |
0x454e90 MOV -0x100(%RBP),%RAX |
0x454e97 CMPQ $-0x3,(%RAX,%R15,8) |
0x454e9c JE 454ed3 |
0x454e9e CMPQ $0x1,-0x198(%RBP) |
0x454ea6 JE 454eb9 |
0x454ea8 MOV -0x190(%RBP),%RCX |
0x454eaf MOV (%RCX,%R10,8),%RAX |
0x454eb3 CMP (%RCX,%R15,8),%RAX |
0x454eb7 JNE 454ed3 |
0x454eb9 MOV -0xc8(%RBP),%RAX |
0x454ec0 VADDSD (%RAX,%R11,8),%XMM5,%XMM5 |
0x454ec6 JMP 454ed3 |
0x454ec8 VADDSD %XMM5,%XMM10,%XMM5 |
0x454ecc MOV -0xa8(%RBP),%R12 |
0x454ed3 MOV -0x70(%RBP),%R15 |
0x454ed7 INC %R11 |
0x454eda CMP %R8,%R11 |
0x454edd JNE 4549b0 |
0x454ee8 XOR %EDX,%EDX |
0x454eea MOV -0x68(%RBP),%RCX |
0x454eee LEA 0x1(%RDX,%RCX,1),%RDX |
0x454ef3 JMP 454f0c |
(1320) 0x454f00 INC %RDX |
(1320) 0x454f03 CMP %RDX,%R12 |
(1320) 0x454f06 JE 454ae0 |
(1320) 0x454f0c MOV -0x158(%RBP),%RCX |
(1320) 0x454f13 MOV (%RCX,%RDX,8),%RCX |
(1320) 0x454f17 XOR %ESI,%ESI |
(1320) 0x454f19 CMP %R9,(%RBX,%RCX,8) |
(1320) 0x454f1d SETGE %SIL |
(1320) 0x454f21 XOR %EDI,%EDI |
(1320) 0x454f23 CMP %R10,%RCX |
(1320) 0x454f26 SETE %DIL |
(1320) 0x454f2a CMP %SIL,%DIL |
(1320) 0x454f2d CMOVA %EDI,%ESI |
(1320) 0x454f30 CMP $0x1,%SIL |
(1320) 0x454f34 JNE 454f00 |
(1320) 0x454f36 MOV -0xc8(%RBP),%RCX |
(1320) 0x454f3d VMOVSD (%RCX,%RDX,8),%XMM11 |
(1320) 0x454f42 VMULSD %XMM10,%XMM11,%XMM12 |
(1320) 0x454f47 VCMPSD $0x1,%XMM0,%XMM12,%K1 |
(1320) 0x454f4e VMOVAPD %XMM1,%XMM12 |
(1320) 0x454f52 VMOVSD %XMM11,%XMM12,%XMM12{%K1} |
(1320) 0x454f58 VADDSD %XMM9,%XMM12,%XMM9 |
(1320) 0x454f5d JMP 454f00 |
0x454f5f XOR %ESI,%ESI |
0x454f61 ADD -0x108(%RBP),%RSI |
0x454f68 JMP 454f7c |
(1318) 0x454f70 INC %RSI |
(1318) 0x454f73 CMP %RSI,%RDX |
(1318) 0x454f76 JE 454bf0 |
(1318) 0x454f7c MOV -0xf0(%RBP),%RCX |
(1318) 0x454f83 MOV (%RCX,%RSI,8),%RCX |
(1318) 0x454f87 MOV -0x30(%RBP),%RDI |
(1318) 0x454f8b CMP %RDI,(%R14,%RCX,8) |
(1318) 0x454f8f JL 454f70 |
(1318) 0x454f91 MOV -0x88(%RBP),%RCX |
(1318) 0x454f98 VMOVSD (%RCX,%RSI,8),%XMM11 |
(1318) 0x454f9d VMULSD %XMM10,%XMM11,%XMM12 |
(1318) 0x454fa2 VCMPSD $0x1,%XMM0,%XMM12,%K1 |
(1318) 0x454fa9 VMOVAPD %XMM1,%XMM12 |
(1318) 0x454fad VMOVSD %XMM11,%XMM12,%XMM12{%K1} |
(1318) 0x454fb3 VADDSD %XMM9,%XMM12,%XMM9 |
(1318) 0x454fb8 JMP 454f70 |
0x454fba MOV %RSI,%RDX |
0x454fbd SHR $0x2,%RDX |
0x454fc1 LEA 0x18(,%RAX,8),%R15 |
0x454fc9 JMP 454fdd |
(1316) 0x454fd0 ADD $0x20,%R15 |
(1316) 0x454fd4 DEC %RDX |
(1316) 0x454fd7 JE 454cfb |
(1316) 0x454fdd MOV -0xf0(%RBP),%RDI |
(1316) 0x454fe4 MOV -0x18(%RDI,%R15,1),%RDI |
(1316) 0x454fe9 MOV (%R14,%RDI,8),%RDI |
(1316) 0x454fed CMP -0x30(%RBP),%RDI |
(1316) 0x454ff1 JL 45501f |
(1316) 0x454ff3 MOV -0x88(%RBP),%R8 |
(1316) 0x454ffa VMOVSD -0x18(%R8,%R15,1),%XMM11 |
(1316) 0x455001 VMULSD %XMM10,%XMM11,%XMM12 |
(1316) 0x455006 VUCOMISD %XMM0,%XMM12 |
(1316) 0x45500a JAE 45501f |
(1316) 0x45500c MOV -0x60(%RBP),%R8 |
(1316) 0x455010 MOV (%R8),%R8 |
(1316) 0x455013 VFMADD213SD (%R8,%RDI,8),%XMM9,%XMM11 |
(1316) 0x455019 VMOVSD %XMM11,(%R8,%RDI,8) |
(1316) 0x45501f MOV -0xf0(%RBP),%RDI |
(1316) 0x455026 MOV -0x10(%RDI,%R15,1),%RDI |
(1316) 0x45502b MOV (%R14,%RDI,8),%RDI |
(1316) 0x45502f CMP -0x30(%RBP),%RDI |
(1316) 0x455033 JL 455061 |
(1316) 0x455035 MOV -0x88(%RBP),%R8 |
(1316) 0x45503c VMOVSD -0x10(%R8,%R15,1),%XMM11 |
(1316) 0x455043 VMULSD %XMM10,%XMM11,%XMM12 |
(1316) 0x455048 VUCOMISD %XMM0,%XMM12 |
(1316) 0x45504c JAE 455061 |
(1316) 0x45504e MOV -0x60(%RBP),%R8 |
(1316) 0x455052 MOV (%R8),%R8 |
(1316) 0x455055 VFMADD213SD (%R8,%RDI,8),%XMM9,%XMM11 |
(1316) 0x45505b VMOVSD %XMM11,(%R8,%RDI,8) |
(1316) 0x455061 MOV -0xf0(%RBP),%RDI |
(1316) 0x455068 MOV -0x8(%RDI,%R15,1),%RDI |
(1316) 0x45506d MOV (%R14,%RDI,8),%RDI |
(1316) 0x455071 CMP -0x30(%RBP),%RDI |
(1316) 0x455075 JL 4550a3 |
(1316) 0x455077 MOV -0x88(%RBP),%R8 |
(1316) 0x45507e VMOVSD -0x8(%R8,%R15,1),%XMM11 |
(1316) 0x455085 VMULSD %XMM10,%XMM11,%XMM12 |
(1316) 0x45508a VUCOMISD %XMM0,%XMM12 |
(1316) 0x45508e JAE 4550a3 |
(1316) 0x455090 MOV -0x60(%RBP),%R8 |
(1316) 0x455094 MOV (%R8),%R8 |
(1316) 0x455097 VFMADD213SD (%R8,%RDI,8),%XMM9,%XMM11 |
(1316) 0x45509d VMOVSD %XMM11,(%R8,%RDI,8) |
(1316) 0x4550a3 MOV -0xf0(%RBP),%RDI |
(1316) 0x4550aa MOV (%RDI,%R15,1),%RDI |
(1316) 0x4550ae MOV (%R14,%RDI,8),%RDI |
(1316) 0x4550b2 CMP -0x30(%RBP),%RDI |
(1316) 0x4550b6 JL 454fd0 |
(1316) 0x4550bc MOV -0x88(%RBP),%R8 |
(1316) 0x4550c3 VMOVSD (%R8,%R15,1),%XMM11 |
(1316) 0x4550c9 VMULSD %XMM10,%XMM11,%XMM12 |
(1316) 0x4550ce VUCOMISD %XMM0,%XMM12 |
(1316) 0x4550d2 JAE 454fd0 |
(1316) 0x4550d8 MOV -0x60(%RBP),%R8 |
(1316) 0x4550dc MOV (%R8),%R8 |
(1316) 0x4550df VFMADD213SD (%R8,%RDI,8),%XMM9,%XMM11 |
(1316) 0x4550e5 VMOVSD %XMM11,(%R8,%RDI,8) |
(1316) 0x4550eb JMP 454fd0 |
0x4550f0 MOV -0x70(%RBP),%R15 |
0x4550f4 MOV -0xd0(%RBP),%R8 |
0x4550fb INC %R11 |
0x4550fe CMP %R8,%R11 |
0x455101 JNE 4549b0 |
/home/eoseret/qaas_runs_CPU_9468/171-147-2675/intel/AMG/build/AMG/AMG/parcsr_ls/par_lr_interp.c: 1221 - 1675 |
-------------------------------------------------------------------------------- |
1221: if (n_fine) |
[...] |
1609: for (jj = A_diag_i[i]+1; jj < A_diag_i[i+1]; jj++) |
1610: { /* i1 is a c-point and strongly influences i, accumulate |
1611: * a_(i,i1) into interpolation weight */ |
1612: i1 = A_diag_j[jj]; |
1613: if (P_marker[i1] >= jj_begin_row) |
1614: { |
1615: P_diag_data[P_marker[i1]] += A_diag_data[jj]; |
1616: } |
1617: else if(P_marker[i1] == strong_f_marker) |
1618: { |
1619: sum = zero; |
1620: sgn = 1; |
1621: if(A_diag_data[A_diag_i[i1]] < 0) sgn = -1; |
1622: /* Loop over row of A for point i1 and calculate the sum |
1623: * of the connections to c-points that strongly influence i. */ |
1624: for(jj1 = A_diag_i[i1]+1; jj1 < A_diag_i[i1+1]; jj1++) |
1625: { |
1626: i2 = A_diag_j[jj1]; |
1627: if((P_marker[i2] >= jj_begin_row || i2 == i) && (sgn*A_diag_data[jj1]) < 0) |
1628: sum += A_diag_data[jj1]; |
1629: } |
1630: if(num_procs > 1) |
1631: { |
1632: for(jj1 = A_offd_i[i1]; jj1< A_offd_i[i1+1]; jj1++) |
1633: { |
1634: i2 = A_offd_j[jj1]; |
1635: if(P_marker_offd[i2] >= jj_begin_row_offd && |
1636: (sgn*A_offd_data[jj1]) < 0) |
1637: sum += A_offd_data[jj1]; |
1638: } |
1639: } |
1640: if(sum != 0) |
1641: { |
1642: distribute = A_diag_data[jj]/sum; |
1643: /* Loop over row of A for point i1 and do the distribution */ |
1644: for(jj1 = A_diag_i[i1]+1; jj1 < A_diag_i[i1+1]; jj1++) |
1645: { |
1646: i2 = A_diag_j[jj1]; |
1647: if(P_marker[i2] >= jj_begin_row && (sgn*A_diag_data[jj1]) < 0) |
1648: P_diag_data[P_marker[i2]] += |
1649: distribute*A_diag_data[jj1]; |
1650: if(i2 == i && (sgn*A_diag_data[jj1]) < 0) |
1651: diagonal += distribute*A_diag_data[jj1]; |
1652: } |
1653: if(num_procs > 1) |
1654: { |
1655: for(jj1 = A_offd_i[i1]; jj1 < A_offd_i[i1+1]; jj1++) |
1656: { |
1657: i2 = A_offd_j[jj1]; |
1658: if(P_marker_offd[i2] >= jj_begin_row_offd && |
1659: (sgn*A_offd_data[jj1]) < 0) |
1660: P_offd_data[P_marker_offd[i2]] += |
[...] |
1667: diagonal += A_diag_data[jj]; |
1668: } |
1669: } |
1670: /* neighbor i1 weakly influences i, accumulate a_(i,i1) into |
1671: * diagonal */ |
1672: else if (CF_marker[i1] != -3) |
1673: { |
1674: if(num_functions == 1 || dof_func[i] == dof_func[i1]) |
1675: diagonal += A_diag_data[jj]; |
Path / |
Metric | Value |
---|---|
CQA speedup if no scalar integer | 2.15 |
CQA speedup if FP arith vectorized | 3.11 |
CQA speedup if fully vectorized | 7.76 |
CQA speedup if no inter-iteration dependency | NA |
CQA speedup if next bottleneck killed | 1.41 |
Bottlenecks | micro-operation queue |
Function | hypre_BoomerAMGBuildExtPIInterp.extracted |
Source | par_lr_interp.c:1221-1221,par_lr_interp.c:1609-1609,par_lr_interp.c:1612-1617,par_lr_interp.c:1621-1621,par_lr_interp.c:1624-1624,par_lr_interp.c:1627-1627,par_lr_interp.c:1630-1632,par_lr_interp.c:1635-1636,par_lr_interp.c:1640-1650,par_lr_interp.c:1653-1655,par_lr_interp.c:1659-1660,par_lr_interp.c:1667-1667,par_lr_interp.c:1672-1675 |
Source loop unroll info | NA |
Source loop unroll confidence level | NA |
Unroll/vectorization loop type | NA |
Unroll factor | NA |
CQA cycles | 33.33 |
CQA cycles if no scalar integer | 15.50 |
CQA cycles if FP arith vectorized | 10.72 |
CQA cycles if fully vectorized | 4.29 |
Front-end cycles | 33.33 |
DIV/SQRT cycles | 4.00 |
P0 cycles | 17.60 |
P1 cycles | 17.63 |
P2 cycles | 23.67 |
P3 cycles | 23.67 |
P4 cycles | 3.00 |
P5 cycles | 17.67 |
P6 cycles | 17.50 |
P7 cycles | 3.00 |
P8 cycles | 3.00 |
P9 cycles | 3.00 |
P10 cycles | 17.60 |
P11 cycles | 23.67 |
Inter-iter dependencies cycles | NA |
FE+BE cycles (UFS) | 34.57 - 36.43 |
Stall cycles (UFS) | 0.42 - 2.28 |
Nb insns | 195.00 |
Nb uops | 196.00 |
Nb loads | 71.00 |
Nb stores | 6.00 |
Nb stack references | 23.00 |
FLOP/cycle | 0.51 |
Nb FLOP add-sub | 11.00 |
Nb FLOP mul | 3.00 |
Nb FLOP fma | 1.00 |
Nb FLOP div | 1.00 |
Nb FLOP rcp | 0.00 |
Nb FLOP sqrt | 0.00 |
Nb FLOP rsqrt | 0.00 |
Bytes/cycle | 18.48 |
Bytes prefetched | 0.00 |
Bytes loaded | 568.00 |
Bytes stored | 48.00 |
Stride 0 | NA |
Stride 1 | NA |
Stride n | NA |
Stride unknown | NA |
Stride indirect | NA |
Vectorization ratio all | 18.75 |
Vectorization ratio load | 0.00 |
Vectorization ratio store | 0.00 |
Vectorization ratio mul | 0.00 |
Vectorization ratio add_sub | 20.00 |
Vectorization ratio fma | 0.00 |
Vectorization ratio div_sqrt | 0.00 |
Vectorization ratio other | 25.64 |
Vector-efficiency ratio all | 14.84 |
Vector-efficiency ratio load | 12.50 |
Vector-efficiency ratio store | 12.50 |
Vector-efficiency ratio mul | 12.50 |
Vector-efficiency ratio add_sub | 15.00 |
Vector-efficiency ratio fma | 12.50 |
Vector-efficiency ratio div_sqrt | 12.50 |
Vector-efficiency ratio other | 15.71 |
Metric | Value |
---|---|
CQA speedup if no scalar integer | 2.15 |
CQA speedup if FP arith vectorized | 3.11 |
CQA speedup if fully vectorized | 7.76 |
CQA speedup if no inter-iteration dependency | NA |
CQA speedup if next bottleneck killed | 1.41 |
Bottlenecks | micro-operation queue |
Function | hypre_BoomerAMGBuildExtPIInterp.extracted |
Source | par_lr_interp.c:1221-1221,par_lr_interp.c:1609-1609,par_lr_interp.c:1612-1617,par_lr_interp.c:1621-1621,par_lr_interp.c:1624-1624,par_lr_interp.c:1627-1627,par_lr_interp.c:1630-1632,par_lr_interp.c:1635-1636,par_lr_interp.c:1640-1650,par_lr_interp.c:1653-1655,par_lr_interp.c:1659-1660,par_lr_interp.c:1667-1667,par_lr_interp.c:1672-1675 |
Source loop unroll info | NA |
Source loop unroll confidence level | NA |
Unroll/vectorization loop type | NA |
Unroll factor | NA |
CQA cycles | 33.33 |
CQA cycles if no scalar integer | 15.50 |
CQA cycles if FP arith vectorized | 10.72 |
CQA cycles if fully vectorized | 4.29 |
Front-end cycles | 33.33 |
DIV/SQRT cycles | 4.00 |
P0 cycles | 17.60 |
P1 cycles | 17.63 |
P2 cycles | 23.67 |
P3 cycles | 23.67 |
P4 cycles | 3.00 |
P5 cycles | 17.67 |
P6 cycles | 17.50 |
P7 cycles | 3.00 |
P8 cycles | 3.00 |
P9 cycles | 3.00 |
P10 cycles | 17.60 |
P11 cycles | 23.67 |
Inter-iter dependencies cycles | NA |
FE+BE cycles (UFS) | 34.57 - 36.43 |
Stall cycles (UFS) | 0.42 - 2.28 |
Nb insns | 195.00 |
Nb uops | 196.00 |
Nb loads | 71.00 |
Nb stores | 6.00 |
Nb stack references | 23.00 |
FLOP/cycle | 0.51 |
Nb FLOP add-sub | 11.00 |
Nb FLOP mul | 3.00 |
Nb FLOP fma | 1.00 |
Nb FLOP div | 1.00 |
Nb FLOP rcp | 0.00 |
Nb FLOP sqrt | 0.00 |
Nb FLOP rsqrt | 0.00 |
Bytes/cycle | 18.48 |
Bytes prefetched | 0.00 |
Bytes loaded | 568.00 |
Bytes stored | 48.00 |
Stride 0 | NA |
Stride 1 | NA |
Stride n | NA |
Stride unknown | NA |
Stride indirect | NA |
Vectorization ratio all | 18.75 |
Vectorization ratio load | 0.00 |
Vectorization ratio store | 0.00 |
Vectorization ratio mul | 0.00 |
Vectorization ratio add_sub | 20.00 |
Vectorization ratio fma | 0.00 |
Vectorization ratio div_sqrt | 0.00 |
Vectorization ratio other | 25.64 |
Vector-efficiency ratio all | 14.84 |
Vector-efficiency ratio load | 12.50 |
Vector-efficiency ratio store | 12.50 |
Vector-efficiency ratio mul | 12.50 |
Vector-efficiency ratio add_sub | 15.00 |
Vector-efficiency ratio fma | 12.50 |
Vector-efficiency ratio div_sqrt | 12.50 |
Vector-efficiency ratio other | 15.71 |
Path / |
Function | hypre_BoomerAMGBuildExtPIInterp.extracted |
Source file and lines | par_lr_interp.c:1221-1675 |
Module | exec |
nb instructions | 195 |
nb uops | 196 |
loop length | 916 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 9 |
used ymm registers | 3 |
used zmm registers | 0 |
nb stack references | 23 |
ADD-SUB / MUL ratio | 3.00 |
micro-operation queue | 33.33 cycles |
front end | 33.33 cycles |
| | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 17.60 | 17.63 | 23.67 | 23.67 | 3.00 | 17.67 | 17.50 | 3.00 | 3.00 | 3.00 | 17.60 | 23.67 |
cycles | 17.60 | 17.63 | 23.67 | 23.67 | 3.00 | 17.67 | 17.50 | 3.00 | 3.00 | 3.00 | 17.60 | 23.67 |
Cycles executing div or sqrt instructions | 4.00 |
FE+BE cycles | 34.57-36.43 |
Stall cycles | 0.42-2.28 |
ROB full (events) | 0.91-3.28 |
Front-end | 33.33 |
Dispatch | 23.67 |
DIV/SQRT | 4.00 |
Overall L1 | 33.33 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 0% |
all | 32% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 22% |
fma | 0% |
div/sqrt | 0% |
other | 58% |
all | 18% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 20% |
fma | 0% |
div/sqrt | 0% |
other | 25% |
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 16% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | 15% |
fma | 12% |
div/sqrt | 12% |
other | 19% |
all | 14% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | 15% |
fma | 12% |
div/sqrt | 12% |
other | 15% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
MOV -0x158(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX,%R11,8),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX,%R15,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R9,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 454e60 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1a70> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP -0x58(%RBP),%RAX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JNE 454e90 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1aa0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x1a0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX,%R15,8),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VXORPD %XMM9,%XMM9,%XMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0xc8(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VUCOMISD (%RDX,%RSI,8),%XMM9 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x8(%RCX,%R15,8),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SETBE %AL | 2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 1-2 | 1 |
LEA -0x1(%RAX,%RAX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x1(%RSI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 454ae0 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x16f0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VCVTSI2SDQ -0xb0(%RBP),%XMM16,%XMM10 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 0.50 |
MOV -0x68(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %R12,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RSI,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 454ee8 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1af8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RDX),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VBROADCASTSD %XMM10,%YMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV -0x80(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RCX,%R13,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0xc0(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R8,%R13,8),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM12,%XMM12,%XMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM11,%XMM11,%XMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R14D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VEXTRACTF128 $0x1,%YMM11,%XMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VADDPD %XMM9,%XMM11,%XMM9 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VSHUFPD $0x1,%XMM9,%XMM9,%XMM11 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VADDSD %XMM11,%XMM9,%XMM9 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
CMP %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x110(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xd0(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 454eea <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1afa> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0xe0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x2,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 454bf0 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1800> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x170(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX,%R15,8),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RCX,%R15,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RSI,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 454bf0 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1800> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RSI,-0x108(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VCVTSI2SDQ -0xb0(%RBP),%XMM16,%XMM10 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 0.50 |
MOV %RDI,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 454f5f <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1b6f> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R13,-0x168(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA -0x1(%RSI),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VBROADCASTSD %XMM10,%YMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV -0x88(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x108(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R8,%R10,8),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0xf0(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x108(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R8,%R14,8),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM13,%XMM13,%XMM13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM12,%XMM12,%XMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VEXTRACTF128 $0x1,%YMM12,%XMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VADDPD %XMM11,%XMM12,%XMM11 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VSHUFPD $0x1,%XMM11,%XMM11,%XMM12 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VADDSD %XMM12,%XMM11,%XMM11 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VADDSD %XMM11,%XMM9,%XMM9 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
CMP %RSI,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R10,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x50(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xd0(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x168(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 454f61 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1b71> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD %XMM0,%XMM9 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV -0xc8(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD (%RCX,%R11,8),%XMM10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JE 454ec8 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1ad8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VDIVSD %XMM9,%XMM10,%XMM9 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 13-15 | 4 |
CMP %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 454cbd <hypre_BoomerAMGBuildExtPIInterp.extracted+0x18cd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VCVTSI2SDQ -0xb0(%RBP),%XMM16,%XMM10 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 0.50 |
MOV -0x68(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %EDX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %R12D,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
TEST $0x1,%CL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 454cb3 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x18c3> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x158(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX,%RDX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX,%RAX,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R9,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 454c7e <hypre_BoomerAMGBuildExtPIInterp.extracted+0x188e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xc8(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x68(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x8(%RDX,%RSI,8),%XMM11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x68(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD %XMM10,%XMM11,%XMM12 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VUCOMISD %XMM0,%XMM12 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JAE 454c7e <hypre_BoomerAMGBuildExtPIInterp.extracted+0x188e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x90(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VFMADD213SD (%RDX,%RCX,8),%XMM9,%XMM11 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VMOVSD %XMM11,(%RDX,%RCX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x68(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R10,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 454caf <hypre_BoomerAMGBuildExtPIInterp.extracted+0x18bf> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xc8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x8(%RAX,%RDX,8),%XMM11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD %XMM10,%XMM11,%XMM12 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULSD %XMM9,%XMM11,%XMM11 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VCMPSD $0x1,%XMM0,%XMM12,%K1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVAPD %XMM1,%XMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.17 |
VMOVSD %XMM11,%XMM12,%XMM12{%K1} | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VADDSD %XMM5,%XMM12,%XMM5 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
LEA 0x2(%RDX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x2(%R12),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 454d29 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1939> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP $0x2,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 454ecc <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1adc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x170(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX,%R15,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RCX,%R15,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 454ecc <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1adc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VCVTSI2SDQ -0xb0(%RBP),%XMM16,%XMM10 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 0.50 |
CMP $0x4,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0xa8(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JAE 454fba <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1bca> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RSI,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RSI,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 4550f0 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1d00> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x70(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xd0(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 454e1c <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1a2c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x90(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD (%RCX,%RAX,8),%XMM9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xc8(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RDX,%R11,8),%XMM9,%XMM9 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM9,(%RCX,%RAX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 454ed3 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1ae3> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV -0x100(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMPQ $-0x3,(%RAX,%R15,8) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 454ed3 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1ae3> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMPQ $0x1,-0x198(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 454eb9 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1ac9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x190(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX,%R10,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP (%RCX,%R15,8),%RAX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JNE 454ed3 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1ae3> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xc8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RAX,%R11,8),%XMM5,%XMM5 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
JMP 454ed3 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1ae3> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
VADDSD %XMM5,%XMM10,%XMM5 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOV -0xa8(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x70(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
INC %R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %R8,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4549b0 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x15c0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x68(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%RDX,%RCX,1),%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JMP 454f0c <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1b1c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD -0x108(%RBP),%RSI | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JMP 454f7c <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1b8c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %RSI,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x2,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
LEA 0x18(,%RAX,8),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 454fdd <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1bed> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV -0x70(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xd0(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
INC %R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %R8,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4549b0 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x15c0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
Function | hypre_BoomerAMGBuildExtPIInterp.extracted |
Source file and lines | par_lr_interp.c:1221-1675 |
Module | exec |
nb instructions | 195 |
nb uops | 196 |
loop length | 916 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 9 |
used ymm registers | 3 |
used zmm registers | 0 |
nb stack references | 23 |
ADD-SUB / MUL ratio | 3.00 |
micro-operation queue | 33.33 cycles |
front end | 33.33 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 17.60 | 17.63 | 23.67 | 23.67 | 3.00 | 17.67 | 17.50 | 3.00 | 3.00 | 3.00 | 17.60 | 23.67 |
cycles | 17.60 | 17.63 | 23.67 | 23.67 | 3.00 | 17.67 | 17.50 | 3.00 | 3.00 | 3.00 | 17.60 | 23.67 |
Cycles executing div or sqrt instructions | 4.00 |
FE+BE cycles | 34.57-36.43 |
Stall cycles | 0.42-2.28 |
ROB full (events) | 0.91-3.28 |
Front-end | 33.33 |
Dispatch | 23.67 |
DIV/SQRT | 4.00 |
Overall L1 | 33.33 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 0% |
all | 32% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 22% |
fma | 0% |
div/sqrt | 0% |
other | 58% |
all | 18% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 20% |
fma | 0% |
div/sqrt | 0% |
other | 25% |
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 16% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | 15% |
fma | 12% |
div/sqrt | 12% |
other | 19% |
all | 14% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | 15% |
fma | 12% |
div/sqrt | 12% |
other | 15% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
MOV -0x158(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX,%R11,8),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX,%R15,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R9,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 454e60 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1a70> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP -0x58(%RBP),%RAX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JNE 454e90 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1aa0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x1a0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX,%R15,8),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VXORPD %XMM9,%XMM9,%XMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0xc8(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VUCOMISD (%RDX,%RSI,8),%XMM9 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x8(%RCX,%R15,8),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SETBE %AL | 2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 1-2 | 1 |
LEA -0x1(%RAX,%RAX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x1(%RSI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 454ae0 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x16f0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VCVTSI2SDQ -0xb0(%RBP),%XMM16,%XMM10 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 0.50 |
MOV -0x68(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %R12,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RSI,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 454ee8 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1af8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RDX),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VBROADCASTSD %XMM10,%YMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV -0x80(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RCX,%R13,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0xc0(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R8,%R13,8),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM12,%XMM12,%XMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM11,%XMM11,%XMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R14D,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VEXTRACTF128 $0x1,%YMM11,%XMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VADDPD %XMM9,%XMM11,%XMM9 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VSHUFPD $0x1,%XMM9,%XMM9,%XMM11 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VADDSD %XMM11,%XMM9,%XMM9 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
CMP %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x110(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xd0(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 454eea <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1afa> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0xe0(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP $0x2,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 454bf0 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1800> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x170(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX,%R15,8),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RCX,%R15,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RSI,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 454bf0 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1800> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RSI,-0x108(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VCVTSI2SDQ -0xb0(%RBP),%XMM16,%XMM10 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 0.50 |
MOV %RDI,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 454f5f <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1b6f> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R13,-0x168(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA -0x1(%RSI),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VBROADCASTSD %XMM10,%YMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV -0x88(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x108(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R8,%R10,8),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0xf0(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x108(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R8,%R14,8),%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM13,%XMM13,%XMM13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM12,%XMM12,%XMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VEXTRACTF128 $0x1,%YMM12,%XMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VADDPD %XMM11,%XMM12,%XMM11 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VSHUFPD $0x1,%XMM11,%XMM11,%XMM12 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VADDSD %XMM12,%XMM11,%XMM11 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VADDSD %XMM11,%XMM9,%XMM9 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
CMP %RSI,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R10,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x50(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xd0(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x168(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 454f61 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1b71> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD %XMM0,%XMM9 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV -0xc8(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD (%RCX,%R11,8),%XMM10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JE 454ec8 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1ad8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VDIVSD %XMM9,%XMM10,%XMM9 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 13-15 | 4 |
CMP %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 454cbd <hypre_BoomerAMGBuildExtPIInterp.extracted+0x18cd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VCVTSI2SDQ -0xb0(%RBP),%XMM16,%XMM10 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 0.50 |
MOV -0x68(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %EDX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %R12D,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
TEST $0x1,%CL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 454cb3 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x18c3> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x158(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RAX,%RDX,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX,%RAX,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R9,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 454c7e <hypre_BoomerAMGBuildExtPIInterp.extracted+0x188e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xc8(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x68(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x8(%RDX,%RSI,8),%XMM11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x68(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD %XMM10,%XMM11,%XMM12 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VUCOMISD %XMM0,%XMM12 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JAE 454c7e <hypre_BoomerAMGBuildExtPIInterp.extracted+0x188e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x90(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VFMADD213SD (%RDX,%RCX,8),%XMM9,%XMM11 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VMOVSD %XMM11,(%RDX,%RCX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x68(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R10,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 454caf <hypre_BoomerAMGBuildExtPIInterp.extracted+0x18bf> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xc8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x8(%RAX,%RDX,8),%XMM11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD %XMM10,%XMM11,%XMM12 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMULSD %XMM9,%XMM11,%XMM11 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VCMPSD $0x1,%XMM0,%XMM12,%K1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVAPD %XMM1,%XMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0-1 | 0.17 |
VMOVSD %XMM11,%XMM12,%XMM12{%K1} | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VADDSD %XMM5,%XMM12,%XMM5 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
LEA 0x2(%RDX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x2(%R12),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 454d29 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1939> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP $0x2,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 454ecc <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1adc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x170(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX,%R15,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RCX,%R15,8),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 454ecc <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1adc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VCVTSI2SDQ -0xb0(%RBP),%XMM16,%XMM10 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 0.50 |
CMP $0x4,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0xa8(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JAE 454fba <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1bca> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RSI,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RSI,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 4550f0 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1d00> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x70(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xd0(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 454e1c <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1a2c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV -0x90(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD (%RCX,%RAX,8),%XMM9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xc8(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RDX,%R11,8),%XMM9,%XMM9 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM9,(%RCX,%RAX,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 454ed3 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1ae3> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV -0x100(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMPQ $-0x3,(%RAX,%R15,8) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 454ed3 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1ae3> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMPQ $0x1,-0x198(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JE 454eb9 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1ac9> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x190(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX,%R10,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP (%RCX,%R15,8),%RAX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JNE 454ed3 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1ae3> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0xc8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RAX,%R11,8),%XMM5,%XMM5 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
JMP 454ed3 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1ae3> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
VADDSD %XMM5,%XMM10,%XMM5 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOV -0xa8(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x70(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
INC %R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %R8,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4549b0 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x15c0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x68(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%RDX,%RCX,1),%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JMP 454f0c <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1b1c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD -0x108(%RBP),%RSI | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JMP 454f7c <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1b8c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %RSI,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x2,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
LEA 0x18(,%RAX,8),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 454fdd <hypre_BoomerAMGBuildExtPIInterp.extracted+0x1bed> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV -0x70(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xd0(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
INC %R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %R8,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JNE 4549b0 <hypre_BoomerAMGBuildExtPIInterp.extracted+0x15c0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |