Loop Id: 653 | Module: libqmcwfs.so | Source: OneBodyJastrowRef.h:134-155 [...] | Coverage: 0.01% |
---|
Loop Id: 653 | Module: libqmcwfs.so | Source: OneBodyJastrowRef.h:134-155 [...] | Coverage: 0.01% |
---|
0x683f8 MOV -0x1a8(%RBP),%RDI |
0x683ff MOV 0xf0(%R12),%RBX |
0x68407 MOV 0xa8(%R12),%ESI |
0x6840f MOVSXD 0x2a0(%RDI),%RDX |
0x68416 VMOVSD (%RBX,%RDX,8),%XMM7 |
0x6841b VMOVSD %XMM7,-0x70(%RBP) |
0x68420 CALL 8140 <_ZNK11qmcplusplus11ParticleSet14getDistTableABEi@plt> |
0x68425 LEA (%R13,%R13,4),%RDI |
0x6842a VMOVSD -0x70(%RBP),%XMM10 |
0x6842f MOV 0x48(%RAX),%R8 |
0x68433 LEA (%R8,%RDI,8),%R9 |
0x68437 MOV 0x18(%R9),%R10 |
0x6843b MOVSXD 0x98(%R12),%R9 |
0x68443 TEST %R9D,%R9D |
0x68446 JLE 69088 |
0x6844c MOV $0x2,%R15D |
0x68452 MOV $0x1,%EDX |
0x68457 MOVQ $0,-0x160(%RBP) |
0x68462 MOV 0x1c8(%R12),%R11 |
0x6846a KXNORB %K1,%K1,%K1 |
0x6846e MOV %R13,-0x1b0(%RBP) |
0x68475 VPBROADCASTD %EDX,%YMM11 |
0x6847b VPBROADCASTD %R15D,%YMM12 |
0x68481 SAL $0x2,%R9 |
0x68485 MOV %R14,-0x1b8(%RBP) |
0x6848c XOR %EDI,%EDI |
0x6848e VMOVQ %XMM10,%RBX |
0x68493 VMOVDQA %YMM11,-0xf0(%RBP) |
0x6849b VMOVDQA %YMM12,-0x110(%RBP) |
0x684a3 NOPL (%RAX,%RAX,1) |
(655) 0x684a8 MOV (%R11,%RDI,2),%RDX |
(655) 0x684ac TEST %RDX,%RDX |
(655) 0x684af JE 6901a |
(655) 0x684b5 MOV 0xa0(%R12),%RSI |
(655) 0x684bd MOV 0x268(%RSI),%RCX |
(655) 0x684c4 MOV 0x18(%RCX),%R8 |
(655) 0x684c8 MOVSXD (%R8,%RDI,1),%RAX |
(655) 0x684cc MOV 0x4(%R8,%RDI,1),%R15D |
(655) 0x684d1 MOV 0x148(%R12),%R8 |
(655) 0x684d9 MOV %RAX,%R14 |
(655) 0x684dc CMP %EAX,%R15D |
(655) 0x684df JLE 6901a |
(655) 0x684e5 MOV %R15D,%R13D |
(655) 0x684e8 VMOVSD 0x8(%RDX),%XMM13 |
(655) 0x684ed LEA (%R10,%RAX,8),%RSI |
(655) 0x684f1 XOR %ECX,%ECX |
(655) 0x684f3 SUB %EAX,%R13D |
(655) 0x684f6 AND $0x7,%R13D |
(655) 0x684fa JE 6861c |
(655) 0x68500 CMP $0x1,%R13D |
(655) 0x68504 JE 685f3 |
(655) 0x6850a CMP $0x2,%R13D |
(655) 0x6850e JE 685d3 |
(655) 0x68514 CMP $0x3,%R13D |
(655) 0x68518 JE 685b3 |
(655) 0x6851e CMP $0x4,%R13D |
(655) 0x68522 JE 68593 |
(655) 0x68524 CMP $0x5,%R13D |
(655) 0x68528 JE 68573 |
(655) 0x6852a CMP $0x6,%R13D |
(655) 0x6852e JE 68552 |
(655) 0x68530 VMOVSD (%RSI),%XMM14 |
(655) 0x68534 VCOMISD %XMM14,%XMM13 |
(655) 0x68539 JBE 6854a |
(655) 0x6853b CMP $-0x1,%EAX |
(655) 0x6853e JE 6854a |
(655) 0x68540 VMOVSD %XMM14,(%R8) |
(655) 0x68545 MOV $0x1,%ECX |
(655) 0x6854a ADD $0x8,%RSI |
(655) 0x6854e LEA 0x1(%R14),%EAX |
(655) 0x68552 VMOVSD (%RSI),%XMM15 |
(655) 0x68556 VCOMISD %XMM15,%XMM13 |
(655) 0x6855b JBE 6856d |
(655) 0x6855d CMP $-0x1,%EAX |
(655) 0x68560 JE 6856d |
(655) 0x68562 MOVSXD %ECX,%R14 |
(655) 0x68565 INC %ECX |
(655) 0x68567 VMOVSD %XMM15,(%R8,%R14,8) |
(655) 0x6856d ADD $0x8,%RSI |
(655) 0x68571 INC %EAX |
(655) 0x68573 VMOVSD (%RSI),%XMM4 |
(655) 0x68577 VCOMISD %XMM4,%XMM13 |
(655) 0x6857b JBE 6858d |
(655) 0x6857d CMP $-0x1,%EAX |
(655) 0x68580 JE 6858d |
(655) 0x68582 MOVSXD %ECX,%R13 |
(655) 0x68585 INC %ECX |
(655) 0x68587 VMOVSD %XMM4,(%R8,%R13,8) |
(655) 0x6858d ADD $0x8,%RSI |
(655) 0x68591 INC %EAX |
(655) 0x68593 VMOVSD (%RSI),%XMM7 |
(655) 0x68597 VCOMISD %XMM7,%XMM13 |
(655) 0x6859b JBE 685ad |
(655) 0x6859d CMP $-0x1,%EAX |
(655) 0x685a0 JE 685ad |
(655) 0x685a2 MOVSXD %ECX,%R14 |
(655) 0x685a5 INC %ECX |
(655) 0x685a7 VMOVSD %XMM7,(%R8,%R14,8) |
(655) 0x685ad ADD $0x8,%RSI |
(655) 0x685b1 INC %EAX |
(655) 0x685b3 VMOVSD (%RSI),%XMM2 |
(655) 0x685b7 VCOMISD %XMM2,%XMM13 |
(655) 0x685bb JBE 685cd |
(655) 0x685bd CMP $-0x1,%EAX |
(655) 0x685c0 JE 685cd |
(655) 0x685c2 MOVSXD %ECX,%R13 |
(655) 0x685c5 INC %ECX |
(655) 0x685c7 VMOVSD %XMM2,(%R8,%R13,8) |
(655) 0x685cd ADD $0x8,%RSI |
(655) 0x685d1 INC %EAX |
(655) 0x685d3 VMOVSD (%RSI),%XMM3 |
(655) 0x685d7 VCOMISD %XMM3,%XMM13 |
(655) 0x685db JBE 685ed |
(655) 0x685dd CMP $-0x1,%EAX |
(655) 0x685e0 JE 685ed |
(655) 0x685e2 MOVSXD %ECX,%R14 |
(655) 0x685e5 INC %ECX |
(655) 0x685e7 VMOVSD %XMM3,(%R8,%R14,8) |
(655) 0x685ed ADD $0x8,%RSI |
(655) 0x685f1 INC %EAX |
(655) 0x685f3 VMOVSD (%RSI),%XMM5 |
(655) 0x685f7 VCOMISD %XMM5,%XMM13 |
(655) 0x685fb JBE 6860d |
(655) 0x685fd CMP $-0x1,%EAX |
(655) 0x68600 JE 6860d |
(655) 0x68602 MOVSXD %ECX,%R13 |
(655) 0x68605 INC %ECX |
(655) 0x68607 VMOVSD %XMM5,(%R8,%R13,8) |
(655) 0x6860d INC %EAX |
(655) 0x6860f ADD $0x8,%RSI |
(655) 0x68613 CMP %EAX,%R15D |
(655) 0x68616 JE 68732 |
(656) 0x6861c VMOVSD (%RSI),%XMM0 |
(656) 0x68620 VCOMISD %XMM0,%XMM13 |
(656) 0x68624 JBE 68636 |
(656) 0x68626 CMP $-0x1,%EAX |
(656) 0x68629 JE 68636 |
(656) 0x6862b MOVSXD %ECX,%R14 |
(656) 0x6862e INC %ECX |
(656) 0x68630 VMOVSD %XMM0,(%R8,%R14,8) |
(656) 0x68636 VMOVSD 0x8(%RSI),%XMM1 |
(656) 0x6863b INC %EAX |
(656) 0x6863d LEA 0x8(%RSI),%R13 |
(656) 0x68641 VCOMISD %XMM1,%XMM13 |
(656) 0x68645 JBE 68657 |
(656) 0x68647 CMP $-0x1,%EAX |
(656) 0x6864a JE 68657 |
(656) 0x6864c MOVSXD %ECX,%RSI |
(656) 0x6864f INC %ECX |
(656) 0x68651 VMOVSD %XMM1,(%R8,%RSI,8) |
(656) 0x68657 VMOVSD 0x8(%R13),%XMM8 |
(656) 0x6865d LEA 0x1(%RAX),%R14D |
(656) 0x68661 VCOMISD %XMM8,%XMM13 |
(656) 0x68666 JBE 68679 |
(656) 0x68668 CMP $-0x1,%R14D |
(656) 0x6866c JE 68679 |
(656) 0x6866e MOVSXD %ECX,%RSI |
(656) 0x68671 INC %ECX |
(656) 0x68673 VMOVSD %XMM8,(%R8,%RSI,8) |
(656) 0x68679 VMOVSD 0x10(%R13),%XMM9 |
(656) 0x6867f LEA 0x2(%RAX),%R14D |
(656) 0x68683 VCOMISD %XMM9,%XMM13 |
(656) 0x68688 JBE 6869b |
(656) 0x6868a CMP $-0x1,%R14D |
(656) 0x6868e JE 6869b |
(656) 0x68690 MOVSXD %ECX,%RSI |
(656) 0x68693 INC %ECX |
(656) 0x68695 VMOVSD %XMM9,(%R8,%RSI,8) |
(656) 0x6869b VMOVSD 0x18(%R13),%XMM6 |
(656) 0x686a1 LEA 0x3(%RAX),%R14D |
(656) 0x686a5 VCOMISD %XMM6,%XMM13 |
(656) 0x686a9 JBE 686bc |
(656) 0x686ab CMP $-0x1,%R14D |
(656) 0x686af JE 686bc |
(656) 0x686b1 MOVSXD %ECX,%RSI |
(656) 0x686b4 INC %ECX |
(656) 0x686b6 VMOVSD %XMM6,(%R8,%RSI,8) |
(656) 0x686bc VMOVSD 0x20(%R13),%XMM10 |
(656) 0x686c2 LEA 0x4(%RAX),%R14D |
(656) 0x686c6 VCOMISD %XMM10,%XMM13 |
(656) 0x686cb JBE 686de |
(656) 0x686cd CMP $-0x1,%R14D |
(656) 0x686d1 JE 686de |
(656) 0x686d3 MOVSXD %ECX,%RSI |
(656) 0x686d6 INC %ECX |
(656) 0x686d8 VMOVSD %XMM10,(%R8,%RSI,8) |
(656) 0x686de VMOVSD 0x28(%R13),%XMM11 |
(656) 0x686e4 LEA 0x5(%RAX),%R14D |
(656) 0x686e8 VCOMISD %XMM11,%XMM13 |
(656) 0x686ed JBE 68700 |
(656) 0x686ef CMP $-0x1,%R14D |
(656) 0x686f3 JE 68700 |
(656) 0x686f5 MOVSXD %ECX,%RSI |
(656) 0x686f8 INC %ECX |
(656) 0x686fa VMOVSD %XMM11,(%R8,%RSI,8) |
(656) 0x68700 VMOVSD 0x30(%R13),%XMM12 |
(656) 0x68706 LEA 0x6(%RAX),%R14D |
(656) 0x6870a VCOMISD %XMM12,%XMM13 |
(656) 0x6870f JBE 68722 |
(656) 0x68711 CMP $-0x1,%R14D |
(656) 0x68715 JE 68722 |
(656) 0x68717 MOVSXD %ECX,%RSI |
(656) 0x6871a INC %ECX |
(656) 0x6871c VMOVSD %XMM12,(%R8,%RSI,8) |
(656) 0x68722 ADD $0x7,%EAX |
(656) 0x68725 LEA 0x38(%R13),%RSI |
(656) 0x68729 CMP %EAX,%R15D |
(656) 0x6872c JNE 6861c |
(655) 0x68732 TEST %ECX,%ECX |
(655) 0x68734 JLE 6901a |
(655) 0x6873a VMOVSD 0x38(%RDX),%XMM2 |
(655) 0x6873f VMOVSD 0x48(%RDX),%XMM3 |
(655) 0x68744 VMOVSD 0x50(%RDX),%XMM6 |
(655) 0x68749 VMOVSD 0x58(%RDX),%XMM0 |
(655) 0x6874e VMOVSD 0x60(%RDX),%XMM14 |
(655) 0x68753 VMOVSD 0x68(%RDX),%XMM15 |
(655) 0x68758 VMOVSD %XMM2,-0x48(%RBP) |
(655) 0x6875d VMOVSD 0x70(%RDX),%XMM9 |
(655) 0x68762 VMOVSD 0x78(%RDX),%XMM8 |
(655) 0x68767 VMOVSD %XMM3,-0x50(%RBP) |
(655) 0x6876c VMOVSD 0x80(%RDX),%XMM13 |
(655) 0x68774 VMOVSD 0x88(%RDX),%XMM12 |
(655) 0x6877c VMOVSD %XMM6,-0x118(%RBP) |
(655) 0x68784 VMOVSD 0x90(%RDX),%XMM29 |
(655) 0x6878b VMOVSD 0x238(%RDX),%XMM4 |
(655) 0x68793 VMOVSD %XMM0,-0x120(%RBP) |
(655) 0x6879b MOV 0x218(%RDX),%RAX |
(655) 0x687a2 VMOVSD 0x18(%RDX),%XMM1 |
(655) 0x687a7 VMOVSD %XMM14,-0x128(%RBP) |
(655) 0x687af VMOVSD 0x20(%RDX),%XMM10 |
(655) 0x687b4 VMOVSD 0x28(%RDX),%XMM5 |
(655) 0x687b9 VMOVSD %XMM15,-0x130(%RBP) |
(655) 0x687c1 VMOVSD 0x30(%RDX),%XMM11 |
(655) 0x687c6 VMOVSD 0x40(%RDX),%XMM7 |
(655) 0x687cb LEA -0x1(%RCX),%EDX |
(655) 0x687ce VMOVSD %XMM9,-0x138(%RBP) |
(655) 0x687d6 VMOVSD %XMM8,-0x140(%RBP) |
(655) 0x687de VMOVSD %XMM13,-0x148(%RBP) |
(655) 0x687e6 VMOVSD %XMM12,-0x150(%RBP) |
(655) 0x687ee VMOVSD %XMM29,-0x158(%RBP) |
(655) 0x687f5 CMP $0x6,%EDX |
(655) 0x687f8 JBE 6944f |
(655) 0x687fe MOV %ECX,%R14D |
(655) 0x68801 VBROADCASTSD %XMM2,%YMM23 |
(655) 0x68807 VBROADCASTSD %XMM3,%YMM21 |
(655) 0x6880d MOV %R8,%R15 |
(655) 0x68810 SHR $0x3,%R14D |
(655) 0x68814 VBROADCASTSD %XMM6,%YMM2 |
(655) 0x68819 VBROADCASTSD %XMM0,%YMM3 |
(655) 0x6881e VMOVSD %XMM4,-0x168(%RBP) |
(655) 0x68826 VBROADCASTSD %XMM14,%YMM6 |
(655) 0x6882b VBROADCASTSD %XMM15,%YMM30 |
(655) 0x68831 VBROADCASTSD %XMM29,%YMM0 |
(655) 0x68837 SAL $0x6,%R14 |
(655) 0x6883b VXORPD %XMM15,%XMM15,%XMM15 |
(655) 0x68840 VBROADCASTSD %XMM4,%YMM28 |
(655) 0x68846 VBROADCASTSD %XMM1,%YMM27 |
(655) 0x6884c VMOVAPD %YMM2,-0x70(%RBP) |
(655) 0x68851 VBROADCASTSD %XMM10,%YMM26 |
(655) 0x68857 VBROADCASTSD %XMM5,%YMM25 |
(655) 0x6885d VBROADCASTSD %XMM11,%YMM24 |
(655) 0x68863 VMOVAPD %YMM3,-0x90(%RBP) |
(655) 0x6886b VBROADCASTSD %XMM7,%YMM22 |
(655) 0x68871 VMOVAPD %YMM6,-0xb0(%RBP) |
(655) 0x68879 VBROADCASTSD %XMM9,%YMM20 |
(655) 0x6887f VBROADCASTSD %XMM8,%YMM19 |
(655) 0x68885 VBROADCASTSD %XMM13,%YMM18 |
(655) 0x6888b VBROADCASTSD %XMM12,%YMM17 |
(655) 0x68891 VMOVAPD %YMM0,-0xd0(%RBP) |
(655) 0x68899 ADD %R8,%R14 |
(655) 0x6889c VMOVAPD %YMM15,%YMM14 |
(655) 0x688a1 VMOVSD %XMM1,-0x170(%RBP) |
(655) 0x688a9 VMOVSD %XMM10,-0x178(%RBP) |
(655) 0x688b1 VMOVSD %XMM5,-0x180(%RBP) |
(655) 0x688b9 VMOVSD %XMM11,-0x188(%RBP) |
(655) 0x688c1 VMOVSD %XMM7,-0x190(%RBP) |
(655) 0x688c9 NOPL (%RAX) |
(657) 0x688d0 VMULPD (%R15),%YMM28,%YMM10 |
(657) 0x688d6 VMOVAPD %YMM25,%YMM6 |
(657) 0x688dc KMOVB %K1,%K2 |
(657) 0x688e0 KMOVB %K1,%K3 |
(657) 0x688e4 KMOVB %K1,%K4 |
(657) 0x688e8 KMOVB %K1,%K5 |
(657) 0x688ec VMULPD 0x20(%R15),%YMM28,%YMM11 |
(657) 0x688f3 KMOVB %K1,%K6 |
(657) 0x688f7 KMOVB %K1,%K7 |
(657) 0x688fb ADD $0x40,%R15 |
(657) 0x688ff VRNDSCALEPD $0xb,%YMM10,%YMM7 |
(657) 0x68906 VCVTTPD2DQ %YMM10,%XMM5 |
(657) 0x6890b VGATHERDPD (%RAX,%XMM5,8),%YMM16{%K2} |
(657) 0x68912 KMOVB %K1,%K2 |
(657) 0x68916 VRNDSCALEPD $0xb,%YMM11,%YMM1 |
(657) 0x6891d VCVTTPD2DQ %YMM11,%XMM4 |
(657) 0x68922 VINSERTI128 $0x1,%XMM4,%YMM5,%YMM0 |
(657) 0x68928 VMOVAPD %YMM25,%YMM5 |
(657) 0x6892e VPERM2I128 $0x11,%YMM0,%YMM0,%YMM8 |
(657) 0x68934 VGATHERDPD (%RAX,%XMM8,8),%YMM13{%K3} |
(657) 0x6893b KMOVB %K1,%K3 |
(657) 0x6893f VSUBPD %YMM7,%YMM10,%YMM2 |
(657) 0x68943 VSUBPD %YMM1,%YMM11,%YMM3 |
(657) 0x68947 VMULPD %YMM2,%YMM2,%YMM1 |
(657) 0x6894b VFMADD132PD %YMM2,%YMM24,%YMM6 |
(657) 0x68951 VMULPD %YMM3,%YMM3,%YMM4 |
(657) 0x68955 VFMADD132PD %YMM3,%YMM24,%YMM5 |
(657) 0x6895b VMULPD %YMM2,%YMM1,%YMM10 |
(657) 0x6895f VMULPD %YMM1,%YMM26,%YMM12 |
(657) 0x68965 VMULPD %YMM3,%YMM4,%YMM9 |
(657) 0x68969 VMULPD %YMM4,%YMM26,%YMM11 |
(657) 0x6896f VFMADD231PD %YMM10,%YMM27,%YMM12 |
(657) 0x68975 VFMADD231PD %YMM9,%YMM27,%YMM11 |
(657) 0x6897b VADDPD %YMM6,%YMM12,%YMM8 |
(657) 0x6897f VPADDD -0xf0(%RBP),%YMM0,%YMM12 |
(657) 0x68987 VADDPD %YMM5,%YMM11,%YMM7 |
(657) 0x6898b VGATHERDPD (%RAX,%XMM12,8),%YMM29{%K4} |
(657) 0x68992 VPERM2I128 $0x11,%YMM12,%YMM12,%YMM5 |
(657) 0x68998 VMOVAPD -0x70(%RBP),%YMM11 |
(657) 0x6899d VMULPD %YMM22,%YMM4,%YMM12 |
(657) 0x689a3 VGATHERDPD (%RAX,%XMM5,8),%YMM6{%K5} |
(657) 0x689aa VMULPD %YMM22,%YMM1,%YMM5 |
(657) 0x689b0 VMOVAPD %YMM11,%YMM31 |
(657) 0x689b6 VFMADD231PD %YMM21,%YMM3,%YMM11 |
(657) 0x689bc VFMADD231PD %YMM21,%YMM2,%YMM31 |
(657) 0x689c2 VFMADD231PD %YMM9,%YMM23,%YMM12 |
(657) 0x689c8 VFMADD231PD %YMM10,%YMM23,%YMM5 |
(657) 0x689ce VADDPD %YMM12,%YMM11,%YMM12 |
(657) 0x689d3 VADDPD %YMM31,%YMM5,%YMM5 |
(657) 0x689d9 VMULPD %YMM12,%YMM6,%YMM6 |
(657) 0x689de VMOVAPD -0x90(%RBP),%YMM12 |
(657) 0x689e6 VMULPD %YMM29,%YMM5,%YMM5 |
(657) 0x689ec VFMADD231PD %YMM7,%YMM13,%YMM6 |
(657) 0x689f1 VPADDD -0x110(%RBP),%YMM0,%YMM13 |
(657) 0x689f9 VPADDD 0x1f81f(%RIP),%YMM0,%YMM0 |
(657) 0x68a01 VFMADD231PD %YMM8,%YMM16,%YMM5 |
(657) 0x68a07 VPERM2I128 $0x11,%YMM13,%YMM13,%YMM11 |
(657) 0x68a0d VGATHERDPD (%RAX,%XMM13,8),%YMM8{%K6} |
(657) 0x68a14 VMOVAPD -0xb0(%RBP),%YMM13 |
(657) 0x68a1c VGATHERDPD (%RAX,%XMM11,8),%YMM7{%K7} |
(657) 0x68a23 VMOVAPD %YMM3,%YMM11 |
(657) 0x68a27 VMULPD %YMM13,%YMM1,%YMM16 |
(657) 0x68a2d VFMADD132PD %YMM30,%YMM20,%YMM11 |
(657) 0x68a33 VMULPD %YMM18,%YMM1,%YMM1 |
(657) 0x68a39 VMULPD %YMM13,%YMM4,%YMM13 |
(657) 0x68a3e VMULPD %YMM18,%YMM4,%YMM4 |
(657) 0x68a44 VFMADD231PD %YMM12,%YMM10,%YMM16 |
(657) 0x68a4a VFMADD231PD %YMM19,%YMM10,%YMM1 |
(657) 0x68a50 VMOVAPD -0xd0(%RBP),%YMM10 |
(657) 0x68a58 VFMADD231PD %YMM12,%YMM9,%YMM13 |
(657) 0x68a5d VMOVAPD %YMM2,%YMM12 |
(657) 0x68a61 VFMADD231PD %YMM19,%YMM9,%YMM4 |
(657) 0x68a67 VFMADD132PD %YMM17,%YMM10,%YMM2 |
(657) 0x68a6d VFMADD132PD %YMM17,%YMM10,%YMM3 |
(657) 0x68a73 VFMADD132PD %YMM30,%YMM20,%YMM12 |
(657) 0x68a79 VADDPD %YMM13,%YMM11,%YMM11 |
(657) 0x68a7e VGATHERDPD (%RAX,%XMM0,8),%YMM13{%K2} |
(657) 0x68a85 VPERM2I128 $0x11,%YMM0,%YMM0,%YMM0 |
(657) 0x68a8b VADDPD %YMM2,%YMM1,%YMM2 |
(657) 0x68a8f VGATHERDPD (%RAX,%XMM0,8),%YMM31{%K3} |
(657) 0x68a96 VADDPD %YMM3,%YMM4,%YMM3 |
(657) 0x68a9a VADDPD %YMM16,%YMM12,%YMM12 |
(657) 0x68aa0 VMULPD %YMM13,%YMM2,%YMM9 |
(657) 0x68aa5 VMULPD %YMM3,%YMM31,%YMM16 |
(657) 0x68aab VFMADD132PD %YMM12,%YMM9,%YMM8 |
(657) 0x68ab0 VFMADD132PD %YMM11,%YMM16,%YMM7 |
(657) 0x68ab6 VADDPD %YMM5,%YMM8,%YMM5 |
(657) 0x68aba VADDPD %YMM6,%YMM7,%YMM6 |
(657) 0x68abe VADDPD %YMM5,%YMM14,%YMM14 |
(657) 0x68ac2 VADDPD %YMM6,%YMM15,%YMM15 |
(657) 0x68ac6 CMP %R15,%R14 |
(657) 0x68ac9 JNE 688d0 |
(655) 0x68acf VADDPD %YMM15,%YMM14,%YMM8 |
(655) 0x68ad4 MOV %ECX,%ESI |
(655) 0x68ad6 VMOVSD -0x168(%RBP),%XMM4 |
(655) 0x68ade VMOVSD -0x170(%RBP),%XMM1 |
(655) 0x68ae6 AND $-0x8,%ESI |
(655) 0x68ae9 VMOVSD -0x178(%RBP),%XMM10 |
(655) 0x68af1 VMOVSD -0x180(%RBP),%XMM5 |
(655) 0x68af9 VMOVSD -0x188(%RBP),%XMM11 |
(655) 0x68b01 VMOVSD -0x190(%RBP),%XMM7 |
(655) 0x68b09 MOV %ESI,%R13D |
(655) 0x68b0c VEXTRACTF64X2 $0x1,%YMM8,%XMM12 |
(655) 0x68b13 VADDPD %XMM8,%XMM12,%XMM13 |
(655) 0x68b18 VUNPCKHPD %XMM13,%XMM13,%XMM0 |
(655) 0x68b1d VADDPD %XMM13,%XMM0,%XMM6 |
(655) 0x68b22 VMOVSD %XMM6,%XMM6,%XMM29 |
(655) 0x68b28 CMP %ECX,%ESI |
(655) 0x68b2a JE 6900b |
(655) 0x68b30 MOV %ECX,%EDX |
(655) 0x68b32 SUB %R13D,%EDX |
(655) 0x68b35 LEA -0x1(%RDX),%R15D |
(655) 0x68b39 CMP $0x2,%R15D |
(655) 0x68b3d JBE 68dae |
(655) 0x68b43 VMOVDDUP %XMM4,%XMM2 |
(655) 0x68b47 LEA (%R8,%R13,8),%R13 |
(655) 0x68b4b VMOVDDUP -0x130(%RBP),%XMM9 |
(655) 0x68b53 VMOVAPD %XMM9,-0x70(%RBP) |
(655) 0x68b58 VMOVDDUP %XMM10,%XMM3 |
(655) 0x68b5d KMOVB %K1,%K5 |
(655) 0x68b61 VMULPD 0x10(%R13),%XMM2,%XMM0 |
(655) 0x68b67 VMOVDDUP %XMM1,%XMM31 |
(655) 0x68b6d VMOVDDUP %XMM11,%XMM28 |
(655) 0x68b73 KMOVB %K1,%K4 |
(655) 0x68b77 VMOVDDUP -0x48(%RBP),%XMM27 |
(655) 0x68b7e VMOVDDUP -0x118(%RBP),%XMM26 |
(655) 0x68b85 VMULPD (%R13),%XMM2,%XMM8 |
(655) 0x68b8b VMOVDDUP %XMM5,%XMM16 |
(655) 0x68b91 VMOVDDUP %XMM7,%XMM12 |
(655) 0x68b95 VMOVDDUP -0x50(%RBP),%XMM15 |
(655) 0x68b9a KMOVB %K1,%K7 |
(655) 0x68b9e KMOVB %K1,%K6 |
(655) 0x68ba2 VMOVDDUP -0x128(%RBP),%XMM14 |
(655) 0x68baa KMOVB %K1,%K3 |
(655) 0x68bae KMOVB %K1,%K2 |
(655) 0x68bb2 VMOVDDUP -0x120(%RBP),%XMM25 |
(655) 0x68bb9 VMOVDDUP -0x138(%RBP),%XMM24 |
(655) 0x68bc0 VMOVDDUP -0x148(%RBP),%XMM22 |
(655) 0x68bc7 VMOVDDUP -0x140(%RBP),%XMM20 |
(655) 0x68bce VMOVDDUP -0x150(%RBP),%XMM19 |
(655) 0x68bd5 VMOVDDUP -0x158(%RBP),%XMM18 |
(655) 0x68bdc MOV %EDX,%R14D |
(655) 0x68bdf AND $-0x4,%R14D |
(655) 0x68be3 VRNDSCALEPD $0xb,%XMM0,%XMM6 |
(655) 0x68bea ADD %R14D,%ESI |
(655) 0x68bed AND $0x3,%EDX |
(655) 0x68bf0 VRNDSCALEPD $0xb,%XMM8,%XMM2 |
(655) 0x68bf7 VINSERTF128 $0x1,%XMM0,%YMM8,%YMM13 |
(655) 0x68bfd VCVTTPD2DQ %YMM13,%XMM9 |
(655) 0x68c02 VPSHUFD $-0x12,%XMM9,%XMM17 |
(655) 0x68c09 VGATHERDPD (%RAX,%XMM9,8),%XMM30{%K4} |
(655) 0x68c10 KMOVB %K1,%K4 |
(655) 0x68c14 VSUBPD %XMM6,%XMM0,%XMM0 |
(655) 0x68c18 VSUBPD %XMM2,%XMM8,%XMM8 |
(655) 0x68c1c VGATHERDPD (%RAX,%XMM17,8),%XMM2{%K5} |
(655) 0x68c23 KMOVB %K1,%K5 |
(655) 0x68c27 VMULPD %XMM0,%XMM0,%XMM6 |
(655) 0x68c2b VMULPD %XMM8,%XMM8,%XMM13 |
(655) 0x68c30 VMULPD %XMM6,%XMM0,%XMM21 |
(655) 0x68c36 VMULPD %XMM13,%XMM8,%XMM23 |
(655) 0x68c3c VMULPD %XMM3,%XMM13,%XMM17 |
(655) 0x68c42 VMULPD %XMM3,%XMM6,%XMM3 |
(655) 0x68c46 VFMADD231PD %XMM31,%XMM23,%XMM17 |
(655) 0x68c4c VFMADD231PD %XMM31,%XMM21,%XMM3 |
(655) 0x68c52 VMOVAPD %XMM8,%XMM31 |
(655) 0x68c58 VFMADD132PD %XMM16,%XMM28,%XMM31 |
(655) 0x68c5e VFMADD132PD %XMM0,%XMM28,%XMM16 |
(655) 0x68c64 VADDPD %XMM16,%XMM3,%XMM3 |
(655) 0x68c6a VADDPD %XMM31,%XMM17,%XMM28 |
(655) 0x68c70 VMULPD %XMM2,%XMM3,%XMM2 |
(655) 0x68c74 VFMADD231PD %XMM28,%XMM30,%XMM2 |
(655) 0x68c7a VPADDD -0x1a0(%RBP),%XMM9,%XMM30 |
(655) 0x68c81 VMULPD %XMM12,%XMM13,%XMM28 |
(655) 0x68c87 VMULPD %XMM12,%XMM6,%XMM12 |
(655) 0x68c8c VPSHUFD $-0x12,%XMM30,%XMM31 |
(655) 0x68c93 VGATHERDPD (%RAX,%XMM30,8),%XMM16{%K6} |
(655) 0x68c9a VGATHERDPD (%RAX,%XMM31,8),%XMM17{%K7} |
(655) 0x68ca1 VFMADD231PD %XMM27,%XMM23,%XMM28 |
(655) 0x68ca7 VFMADD231PD %XMM27,%XMM21,%XMM12 |
(655) 0x68cad VMOVAPD %XMM8,%XMM27 |
(655) 0x68cb3 VFMADD132PD %XMM15,%XMM26,%XMM27 |
(655) 0x68cb9 VFMADD132PD %XMM0,%XMM26,%XMM15 |
(655) 0x68cbf VADDPD %XMM15,%XMM12,%XMM15 |
(655) 0x68cc4 VADDPD %XMM27,%XMM28,%XMM26 |
(655) 0x68cca VMULPD %XMM17,%XMM15,%XMM3 |
(655) 0x68cd0 VFMADD132PD %XMM26,%XMM3,%XMM16 |
(655) 0x68cd6 VADDPD %XMM2,%XMM16,%XMM30 |
(655) 0x68cdc VPADDD 0x1f51c(%RIP),%XMM9,%XMM2 |
(655) 0x68ce4 VPADDD 0x1f534(%RIP),%XMM9,%XMM9 |
(655) 0x68cec VPSHUFD $-0x12,%XMM2,%XMM15 |
(655) 0x68cf1 VGATHERDPD (%RAX,%XMM2,8),%XMM3{%K2} |
(655) 0x68cf8 VMOVAPD -0x70(%RBP),%XMM2 |
(655) 0x68cfd VGATHERDPD (%RAX,%XMM15,8),%XMM12{%K3} |
(655) 0x68d04 VMULPD %XMM14,%XMM13,%XMM15 |
(655) 0x68d09 VMULPD %XMM14,%XMM6,%XMM14 |
(655) 0x68d0e VMULPD %XMM22,%XMM6,%XMM6 |
(655) 0x68d14 VMULPD %XMM22,%XMM13,%XMM13 |
(655) 0x68d1a VFMADD231PD %XMM25,%XMM23,%XMM15 |
(655) 0x68d20 VFMADD231PD %XMM25,%XMM21,%XMM14 |
(655) 0x68d26 VMOVAPD %XMM8,%XMM25 |
(655) 0x68d2c VFMADD132PD %XMM2,%XMM24,%XMM25 |
(655) 0x68d32 VFMADD132PD %XMM0,%XMM24,%XMM2 |
(655) 0x68d38 VFMADD231PD %XMM20,%XMM21,%XMM6 |
(655) 0x68d3e VFMADD132PD %XMM19,%XMM18,%XMM0 |
(655) 0x68d44 VFMADD231PD %XMM20,%XMM23,%XMM13 |
(655) 0x68d4a VFMADD132PD %XMM19,%XMM18,%XMM8 |
(655) 0x68d50 VADDPD %XMM15,%XMM25,%XMM24 |
(655) 0x68d56 VADDPD %XMM14,%XMM2,%XMM15 |
(655) 0x68d5b VPSHUFD $-0x12,%XMM9,%XMM2 |
(655) 0x68d61 VADDPD %XMM0,%XMM6,%XMM0 |
(655) 0x68d65 VADDPD %XMM8,%XMM13,%XMM8 |
(655) 0x68d6a VMULPD %XMM12,%XMM15,%XMM12 |
(655) 0x68d6f VGATHERDPD (%RAX,%XMM2,8),%XMM15{%K5} |
(655) 0x68d76 VFMADD231PD %XMM24,%XMM3,%XMM12 |
(655) 0x68d7c VGATHERDPD (%RAX,%XMM9,8),%XMM3{%K4} |
(655) 0x68d83 VADDPD %XMM30,%XMM12,%XMM14 |
(655) 0x68d89 VMULPD %XMM15,%XMM0,%XMM12 |
(655) 0x68d8e VFMADD132PD %XMM8,%XMM12,%XMM3 |
(655) 0x68d93 VADDPD %XMM14,%XMM3,%XMM14 |
(655) 0x68d98 VUNPCKHPD %XMM14,%XMM14,%XMM9 |
(655) 0x68d9d VADDPD %XMM14,%XMM9,%XMM3 |
(655) 0x68da2 VADDSD %XMM3,%XMM29,%XMM29 |
(655) 0x68da8 JE 6900b |
(655) 0x68dae MOVSXD %ESI,%RDX |
(655) 0x68db1 VMOVSD -0x50(%RBP),%XMM14 |
(655) 0x68db6 VMOVSD -0x118(%RBP),%XMM16 |
(655) 0x68dbd VMULSD (%R8,%RDX,8),%XMM4,%XMM15 |
(655) 0x68dc3 VMOVSD -0x128(%RBP),%XMM18 |
(655) 0x68dca LEA (,%RDX,8),%R15 |
(655) 0x68dd2 LEA 0x1(%RSI),%EDX |
(655) 0x68dd5 VMOVSD -0x120(%RBP),%XMM19 |
(655) 0x68ddc VMOVSD -0x138(%RBP),%XMM20 |
(655) 0x68de3 VMOVSD -0x148(%RBP),%XMM21 |
(655) 0x68dea VMOVSD -0x140(%RBP),%XMM22 |
(655) 0x68df1 VMOVSD -0x158(%RBP),%XMM23 |
(655) 0x68df8 VRNDSCALESD $0xb,%XMM15,%XMM15,%XMM2 |
(655) 0x68dff VCVTTSD2SI %XMM15,%R13D |
(655) 0x68e04 VSUBSD %XMM2,%XMM15,%XMM0 |
(655) 0x68e08 VMOVSD %XMM14,%XMM14,%XMM15 |
(655) 0x68e0d VMULSD %XMM0,%XMM0,%XMM9 |
(655) 0x68e11 VFMADD132SD %XMM0,%XMM16,%XMM15 |
(655) 0x68e17 VMOVSD %XMM0,%XMM0,%XMM8 |
(655) 0x68e1b VFMADD132SD %XMM5,%XMM11,%XMM8 |
(655) 0x68e20 MOVSXD %R13D,%R14 |
(655) 0x68e23 VMULSD %XMM9,%XMM0,%XMM6 |
(655) 0x68e28 VMULSD %XMM10,%XMM9,%XMM13 |
(655) 0x68e2d VMULSD %XMM7,%XMM9,%XMM3 |
(655) 0x68e31 VFMADD231SD %XMM6,%XMM1,%XMM13 |
(655) 0x68e36 VADDSD %XMM8,%XMM13,%XMM12 |
(655) 0x68e3b VMOVSD -0x48(%RBP),%XMM13 |
(655) 0x68e40 VFMADD231SD %XMM13,%XMM6,%XMM3 |
(655) 0x68e45 VFMADD231SD (%RAX,%R14,8),%XMM12,%XMM29 |
(655) 0x68e4c VMULSD %XMM18,%XMM9,%XMM12 |
(655) 0x68e52 VMULSD %XMM21,%XMM9,%XMM9 |
(655) 0x68e58 VADDSD %XMM15,%XMM3,%XMM2 |
(655) 0x68e5d VMOVSD -0x130(%RBP),%XMM15 |
(655) 0x68e65 VMOVSD %XMM15,%XMM15,%XMM8 |
(655) 0x68e6a VFMADD231SD %XMM19,%XMM6,%XMM12 |
(655) 0x68e70 VFMADD132SD %XMM0,%XMM20,%XMM8 |
(655) 0x68e76 VFMADD132SD %XMM22,%XMM9,%XMM6 |
(655) 0x68e7c VADDSD %XMM12,%XMM8,%XMM3 |
(655) 0x68e81 VMULSD 0x10(%RAX,%R14,8),%XMM3,%XMM12 |
(655) 0x68e88 VFMADD132SD 0x8(%RAX,%R14,8),%XMM12,%XMM2 |
(655) 0x68e8f VMOVSD -0x150(%RBP),%XMM12 |
(655) 0x68e97 VFMADD132SD %XMM12,%XMM23,%XMM0 |
(655) 0x68e9d VADDSD %XMM2,%XMM29,%XMM8 |
(655) 0x68ea3 VADDSD %XMM6,%XMM0,%XMM0 |
(655) 0x68ea7 VFMADD132SD 0x18(%RAX,%R14,8),%XMM8,%XMM0 |
(655) 0x68eae VMOVSD %XMM0,%XMM0,%XMM29 |
(655) 0x68eb4 CMP %ECX,%EDX |
(655) 0x68eb6 JGE 6900b |
(655) 0x68ebc VMULSD 0x8(%R8,%R15,1),%XMM4,%XMM6 |
(655) 0x68ec3 VMOVSD %XMM5,%XMM5,%XMM9 |
(655) 0x68ec7 ADD $0x2,%ESI |
(655) 0x68eca VRNDSCALESD $0xb,%XMM6,%XMM6,%XMM2 |
(655) 0x68ed1 VCVTTSD2SI %XMM6,%R13D |
(655) 0x68ed5 VSUBSD %XMM2,%XMM6,%XMM0 |
(655) 0x68ed9 VMULSD %XMM0,%XMM0,%XMM2 |
(655) 0x68edd VFMADD132SD %XMM0,%XMM11,%XMM9 |
(655) 0x68ee2 MOVSXD %R13D,%R14 |
(655) 0x68ee5 VMULSD %XMM0,%XMM2,%XMM3 |
(655) 0x68ee9 VMULSD %XMM2,%XMM10,%XMM8 |
(655) 0x68eed VFMADD231SD %XMM3,%XMM1,%XMM8 |
(655) 0x68ef2 VADDSD %XMM8,%XMM9,%XMM6 |
(655) 0x68ef7 VMULSD %XMM2,%XMM7,%XMM9 |
(655) 0x68efb VMOVSD %XMM14,%XMM14,%XMM8 |
(655) 0x68f00 VFMADD132SD %XMM0,%XMM16,%XMM8 |
(655) 0x68f06 VFMADD231SD %XMM13,%XMM3,%XMM9 |
(655) 0x68f0b VADDSD %XMM9,%XMM8,%XMM9 |
(655) 0x68f10 VMULSD 0x8(%RAX,%R14,8),%XMM9,%XMM8 |
(655) 0x68f17 VMULSD %XMM18,%XMM2,%XMM9 |
(655) 0x68f1d VMULSD %XMM21,%XMM2,%XMM2 |
(655) 0x68f23 VFMADD132SD (%RAX,%R14,8),%XMM8,%XMM6 |
(655) 0x68f29 VMOVSD %XMM15,%XMM15,%XMM8 |
(655) 0x68f2e VFMADD231SD %XMM19,%XMM3,%XMM9 |
(655) 0x68f34 VFMADD132SD %XMM0,%XMM20,%XMM8 |
(655) 0x68f3a VFMADD132SD %XMM22,%XMM2,%XMM3 |
(655) 0x68f40 VFMADD132SD %XMM12,%XMM23,%XMM0 |
(655) 0x68f46 VADDSD %XMM9,%XMM8,%XMM8 |
(655) 0x68f4b VMOVSD %XMM12,%XMM12,%XMM9 |
(655) 0x68f50 VADDSD %XMM3,%XMM0,%XMM0 |
(655) 0x68f54 VMULSD 0x18(%RAX,%R14,8),%XMM0,%XMM3 |
(655) 0x68f5b VFMADD231SD 0x10(%RAX,%R14,8),%XMM8,%XMM3 |
(655) 0x68f62 VADDSD %XMM3,%XMM6,%XMM6 |
(655) 0x68f66 VADDSD %XMM6,%XMM29,%XMM29 |
(655) 0x68f6c CMP %ECX,%ESI |
(655) 0x68f6e JGE 6900b |
(655) 0x68f74 VMULSD 0x10(%R8,%R15,1),%XMM4,%XMM4 |
(655) 0x68f7b VRNDSCALESD $0xb,%XMM4,%XMM4,%XMM8 |
(655) 0x68f82 VCVTTSD2SI %XMM4,%R8D |
(655) 0x68f86 VSUBSD %XMM8,%XMM4,%XMM2 |
(655) 0x68f8b VMULSD %XMM2,%XMM2,%XMM3 |
(655) 0x68f8f VFMADD132SD %XMM2,%XMM11,%XMM5 |
(655) 0x68f94 VFMADD132SD %XMM2,%XMM16,%XMM14 |
(655) 0x68f9a VFMADD132SD %XMM2,%XMM23,%XMM9 |
(655) 0x68fa0 MOVSXD %R8D,%RCX |
(655) 0x68fa3 VFMADD132SD %XMM2,%XMM20,%XMM15 |
(655) 0x68fa9 VMULSD %XMM3,%XMM2,%XMM6 |
(655) 0x68fad VMULSD %XMM3,%XMM10,%XMM10 |
(655) 0x68fb1 VMULSD %XMM3,%XMM7,%XMM7 |
(655) 0x68fb5 VMULSD %XMM18,%XMM3,%XMM4 |
(655) 0x68fbb VMULSD %XMM21,%XMM3,%XMM8 |
(655) 0x68fc1 VFMADD132SD %XMM6,%XMM10,%XMM1 |
(655) 0x68fc6 VFMADD132SD %XMM6,%XMM7,%XMM13 |
(655) 0x68fcb VFMADD231SD %XMM19,%XMM6,%XMM4 |
(655) 0x68fd1 VFMADD132SD %XMM22,%XMM8,%XMM6 |
(655) 0x68fd7 VADDSD %XMM1,%XMM5,%XMM11 |
(655) 0x68fdb VADDSD %XMM14,%XMM13,%XMM1 |
(655) 0x68fe0 VADDSD %XMM4,%XMM15,%XMM0 |
(655) 0x68fe4 VADDSD %XMM6,%XMM9,%XMM12 |
(655) 0x68fe8 VMULSD 0x8(%RAX,%RCX,8),%XMM1,%XMM5 |
(655) 0x68fee VMULSD 0x18(%RAX,%RCX,8),%XMM12,%XMM2 |
(655) 0x68ff4 VFMADD132SD (%RAX,%RCX,8),%XMM5,%XMM11 |
(655) 0x68ffa VFMADD132SD 0x10(%RAX,%RCX,8),%XMM2,%XMM0 |
(655) 0x69001 VADDSD %XMM0,%XMM11,%XMM3 |
(655) 0x69005 VADDSD %XMM3,%XMM29,%XMM29 |
(655) 0x6900b VADDSD -0x160(%RBP),%XMM29,%XMM6 |
(655) 0x69012 VMOVSD %XMM6,-0x160(%RBP) |
(655) 0x6901a ADD $0x4,%RDI |
(655) 0x6901e CMP %RDI,%R9 |
(655) 0x69021 JNE 684a8 |
0x69027 VMOVQ %RBX,%XMM10 |
0x6902c MOV -0x1b0(%RBP),%R13 |
0x69033 MOV -0x1b8(%RBP),%R14 |
0x6903a VSUBSD -0x160(%RBP),%XMM10,%XMM10 |
0x69042 VZEROUPPER |
0x69045 VMOVSD %XMM10,%XMM10,%XMM0 |
0x69049 CALL 8070 <exp@plt> |
0x6904e MOV (%R14),%R10 |
0x69051 MOV 0x8(%R14),%RBX |
0x69055 SUB %R10,%RBX |
0x69058 VMOVSD %XMM0,(%R10,%R13,8) |
0x6905e INC %R13 |
0x69061 SAR $0x3,%RBX |
0x69065 CMP %RBX,%R13 |
0x69068 JB 683f8 |
0x69088 MOV 0x90(%R12),%R11D |
0x69090 TEST %R11D,%R11D |
0x69093 JLE 69045 |
0x69095 MOV 0xa0(%R12),%R15 |
0x6909d MOVSXD %R11D,%RSI |
0x690a0 LEA -0x38(%RBP),%RCX |
0x690a4 MOV 0x1c8(%R12),%RBX |
0x690ac MOV %RCX,-0x70(%RBP) |
0x690b0 MOV %R10,%RDX |
0x690b3 VXORPD %XMM6,%XMM6,%XMM6 |
0x690b7 MOV 0x18(%R15),%RAX |
0x690bb LEA (%RAX,%RSI,4),%R15 |
0x690bf AND $0x1,%ESI |
0x690c2 JE 691f6 |
0x690c8 MOVSXD (%RAX),%RDX |
0x690cb MOV (%RBX,%RDX,8),%R8 |
0x690cf TEST %R8,%R8 |
0x690d2 JE 691e5 |
0x690d8 VMOVSD (%R10),%XMM0 |
0x690dd VCOMISD 0x8(%R8),%XMM0 |
0x690e3 JAE 691e5 |
0x690e9 VMULSD 0x238(%R8),%XMM0,%XMM0 |
0x690f2 MOV %RCX,%RDI |
0x690f5 MOV %RAX,-0xf0(%RBP) |
0x690fc MOV %R10,-0xb0(%RBP) |
0x69103 VMOVSD %XMM10,-0xd0(%RBP) |
0x6910b MOV %R8,-0x90(%RBP) |
0x69112 CALL 8250 <modf@plt> |
0x69117 MOV -0x90(%RBP),%R10 |
0x6911e VCVTTSD2SI -0x38(%RBP),%EDI |
0x69123 VMULSD %XMM0,%XMM0,%XMM2 |
0x69127 VMOVSD 0x28(%R10),%XMM1 |
0x6912d VMOVSD 0x48(%R10),%XMM9 |
0x69133 VMOVSD 0x68(%R10),%XMM13 |
0x69139 VMOVSD 0x90(%R10),%XMM4 |
0x69142 VFMADD213SD 0x30(%R10),%XMM0,%XMM1 |
0x69148 VFMADD213SD 0x50(%R10),%XMM0,%XMM9 |
0x6914e MOVSXD %EDI,%R9 |
0x69151 VFMADD213SD 0x70(%R10),%XMM0,%XMM13 |
0x69157 MOV 0x218(%R10),%RAX |
0x6915e VMULSD %XMM0,%XMM2,%XMM3 |
0x69162 VFMADD132SD 0x88(%R10),%XMM4,%XMM0 |
0x6916b VMULSD 0x20(%R10),%XMM2,%XMM5 |
0x69171 VMULSD 0x40(%R10),%XMM2,%XMM8 |
0x69177 VMULSD 0x60(%R10),%XMM2,%XMM12 |
0x6917d VMULSD 0x80(%R10),%XMM2,%XMM15 |
0x69186 VFMADD231SD 0x18(%R10),%XMM3,%XMM5 |
0x6918c VFMADD231SD 0x38(%R10),%XMM3,%XMM8 |
0x69192 VFMADD231SD 0x58(%R10),%XMM3,%XMM12 |
0x69198 VFMADD132SD 0x78(%R10),%XMM15,%XMM3 |
0x6919e MOV -0xb0(%RBP),%R10 |
0x691a5 VADDSD %XMM1,%XMM5,%XMM6 |
0x691a9 VADDSD %XMM9,%XMM8,%XMM10 |
0x691ae VADDSD %XMM13,%XMM12,%XMM14 |
0x691b3 VADDSD %XMM3,%XMM0,%XMM7 |
0x691b7 VMULSD 0x8(%RAX,%R9,8),%XMM10,%XMM11 |
0x691be VMOVSD -0xd0(%RBP),%XMM10 |
0x691c6 VMULSD 0x18(%RAX,%R9,8),%XMM7,%XMM0 |
0x691cd VFMADD132SD (%RAX,%R9,8),%XMM11,%XMM6 |
0x691d3 VFMADD231SD 0x10(%RAX,%R9,8),%XMM14,%XMM0 |
0x691da MOV -0xf0(%RBP),%RAX |
0x691e1 VADDSD %XMM0,%XMM6,%XMM6 |
0x691e5 ADD $0x4,%RAX |
0x691e9 LEA 0x8(%R10),%RDX |
0x691ed CMP %RAX,%R15 |
0x691f0 JE 69446 |
0x691f6 MOV %R13,-0xf0(%RBP) |
0x691fd MOV %RDX,%R13 |
0x69200 MOV %R12,-0x110(%RBP) |
0x69207 MOV %RBX,%R12 |
0x6920a MOV %R14,-0x48(%RBP) |
0x6920e MOV %RAX,%R14 |
0x69211 VMOVSD %XMM10,-0xd0(%RBP) |
(654) 0x69219 MOVSXD (%R14),%R11 |
(654) 0x6921c MOV (%R12,%R11,8),%RBX |
(654) 0x69220 TEST %RBX,%RBX |
(654) 0x69223 JE 69308 |
(654) 0x69229 VMOVSD (%R13),%XMM2 |
(654) 0x6922f VCOMISD 0x8(%RBX),%XMM2 |
(654) 0x69234 JAE 69308 |
(654) 0x6923a VMULSD 0x238(%RBX),%XMM2,%XMM0 |
(654) 0x69242 MOV -0x70(%RBP),%RDI |
(654) 0x69246 VMOVSD %XMM6,-0x90(%RBP) |
(654) 0x6924e CALL 8250 <modf@plt> |
(654) 0x69253 VMOVSD 0x28(%RBX),%XMM6 |
(654) 0x69258 VMOVSD 0x48(%RBX),%XMM10 |
(654) 0x6925d VMULSD %XMM0,%XMM0,%XMM3 |
(654) 0x69261 VMOVSD 0x68(%RBX),%XMM14 |
(654) 0x69266 VMOVSD 0x90(%RBX),%XMM7 |
(654) 0x6926e VFMADD213SD 0x30(%RBX),%XMM0,%XMM6 |
(654) 0x69274 VFMADD213SD 0x50(%RBX),%XMM0,%XMM10 |
(654) 0x6927a VFMADD213SD 0x70(%RBX),%XMM0,%XMM14 |
(654) 0x69280 VCVTTSD2SI -0x38(%RBP),%ECX |
(654) 0x69285 MOV 0x218(%RBX),%RSI |
(654) 0x6928c VMULSD %XMM0,%XMM3,%XMM5 |
(654) 0x69290 VFMADD132SD 0x88(%RBX),%XMM7,%XMM0 |
(654) 0x69299 VMULSD 0x20(%RBX),%XMM3,%XMM1 |
(654) 0x6929e MOVSXD %ECX,%R8 |
(654) 0x692a1 VMULSD 0x40(%RBX),%XMM3,%XMM9 |
(654) 0x692a6 VMULSD 0x60(%RBX),%XMM3,%XMM13 |
(654) 0x692ab VMULSD 0x80(%RBX),%XMM3,%XMM4 |
(654) 0x692b3 VFMADD231SD 0x18(%RBX),%XMM5,%XMM1 |
(654) 0x692b9 VFMADD231SD 0x38(%RBX),%XMM5,%XMM9 |
(654) 0x692bf VFMADD231SD 0x58(%RBX),%XMM5,%XMM13 |
(654) 0x692c5 VFMADD132SD 0x78(%RBX),%XMM4,%XMM5 |
(654) 0x692cb VADDSD %XMM6,%XMM1,%XMM8 |
(654) 0x692cf VADDSD %XMM10,%XMM9,%XMM11 |
(654) 0x692d4 VADDSD %XMM14,%XMM13,%XMM15 |
(654) 0x692d9 VADDSD %XMM5,%XMM0,%XMM0 |
(654) 0x692dd VMOVSD -0x90(%RBP),%XMM5 |
(654) 0x692e5 VMULSD 0x8(%RSI,%R8,8),%XMM11,%XMM12 |
(654) 0x692ec VMULSD 0x18(%RSI,%R8,8),%XMM0,%XMM2 |
(654) 0x692f3 VFMADD132SD (%RSI,%R8,8),%XMM12,%XMM8 |
(654) 0x692f9 VFMADD231SD 0x10(%RSI,%R8,8),%XMM15,%XMM2 |
(654) 0x69300 VADDSD %XMM2,%XMM8,%XMM3 |
(654) 0x69304 VADDSD %XMM3,%XMM5,%XMM6 |
(654) 0x69308 LEA 0x4(%R14),%RAX |
(654) 0x6930c MOVSXD 0x4(%R14),%R14 |
(654) 0x69310 LEA 0x8(%R13),%RBX |
(654) 0x69314 MOV (%R12,%R14,8),%R14 |
(654) 0x69318 TEST %R14,%R14 |
(654) 0x6931b JE 6941b |
(654) 0x69321 VMOVSD 0x8(%R13),%XMM1 |
(654) 0x69327 VCOMISD 0x8(%R14),%XMM1 |
(654) 0x6932d JAE 6941b |
(654) 0x69333 VMULSD 0x238(%R14),%XMM1,%XMM0 |
(654) 0x6933c MOV -0x70(%RBP),%RDI |
(654) 0x69340 MOV %RAX,-0x90(%RBP) |
(654) 0x69347 VMOVSD %XMM6,-0xb0(%RBP) |
(654) 0x6934f CALL 8250 <modf@plt> |
(654) 0x69354 VMOVSD 0x28(%R14),%XMM10 |
(654) 0x6935a VMOVSD 0x48(%R14),%XMM13 |
(654) 0x69360 VMULSD %XMM0,%XMM0,%XMM8 |
(654) 0x69364 VMOVSD 0x68(%R14),%XMM7 |
(654) 0x6936a VMOVSD 0x90(%R14),%XMM5 |
(654) 0x69373 VFMADD213SD 0x30(%R14),%XMM0,%XMM10 |
(654) 0x69379 VFMADD213SD 0x50(%R14),%XMM0,%XMM13 |
(654) 0x6937f VFMADD213SD 0x70(%R14),%XMM0,%XMM7 |
(654) 0x69385 VCVTTSD2SI -0x38(%RBP),%EDI |
(654) 0x6938a MOV 0x218(%R14),%R13 |
(654) 0x69391 MOV -0x90(%RBP),%RAX |
(654) 0x69398 VMULSD %XMM0,%XMM8,%XMM9 |
(654) 0x6939c VFMADD132SD 0x88(%R14),%XMM5,%XMM0 |
(654) 0x693a5 VMULSD 0x20(%R14),%XMM8,%XMM6 |
(654) 0x693ab MOVSXD %EDI,%R9 |
(654) 0x693ae VMULSD 0x40(%R14),%XMM8,%XMM12 |
(654) 0x693b4 VMULSD 0x60(%R14),%XMM8,%XMM4 |
(654) 0x693ba VMULSD 0x80(%R14),%XMM8,%XMM3 |
(654) 0x693c3 VFMADD231SD 0x18(%R14),%XMM9,%XMM6 |
(654) 0x693c9 VFMADD231SD 0x38(%R14),%XMM9,%XMM12 |
(654) 0x693cf VFMADD231SD 0x58(%R14),%XMM9,%XMM4 |
(654) 0x693d5 VFMADD132SD 0x78(%R14),%XMM3,%XMM9 |
(654) 0x693db VADDSD %XMM10,%XMM6,%XMM11 |
(654) 0x693e0 VADDSD %XMM13,%XMM12,%XMM14 |
(654) 0x693e5 VADDSD %XMM7,%XMM4,%XMM2 |
(654) 0x693e9 VADDSD %XMM9,%XMM0,%XMM0 |
(654) 0x693ee VMOVSD -0xb0(%RBP),%XMM9 |
(654) 0x693f6 VMULSD 0x8(%R13,%R9,8),%XMM14,%XMM15 |
(654) 0x693fd VMULSD 0x18(%R13,%R9,8),%XMM0,%XMM1 |
(654) 0x69404 VFMADD132SD (%R13,%R9,8),%XMM15,%XMM11 |
(654) 0x6940b VFMADD231SD 0x10(%R13,%R9,8),%XMM2,%XMM1 |
(654) 0x69412 VADDSD %XMM1,%XMM11,%XMM8 |
(654) 0x69416 VADDSD %XMM8,%XMM9,%XMM6 |
(654) 0x6941b LEA 0x4(%RAX),%R14 |
(654) 0x6941f LEA 0x8(%RBX),%R13 |
(654) 0x69423 CMP %R14,%R15 |
(654) 0x69426 JNE 69219 |
0x6942c VMOVSD -0xd0(%RBP),%XMM10 |
0x69434 MOV -0xf0(%RBP),%R13 |
0x6943b MOV -0x110(%RBP),%R12 |
0x69442 MOV -0x48(%RBP),%R14 |
0x69446 VSUBSD %XMM6,%XMM10,%XMM10 |
0x6944a JMP 69045 |
(655) 0x6944f XOR %R13D,%R13D |
(655) 0x69452 VXORPD %XMM29,%XMM29,%XMM29 |
(655) 0x69458 XOR %ESI,%ESI |
(655) 0x6945a JMP 68b30 |
/home/eoseret/qaas_runs_CPU_9468/171-143-7755/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/Jastrow/OneBodyJastrowRef.h: 134 - 155 |
-------------------------------------------------------------------------------- |
134: for (int k = 0; k < ratios.size(); ++k) |
135: ratios[k] = std::exp(Vat[VP.refPtcl] - computeU(VP.getDistTableAB(myTableID).getDistRow(k).data())); |
136: } |
137: |
138: inline valT computeU(const valT* dist) |
139: { |
140: valT curVat(0); |
141: if (NumGroups > 0) |
142: { |
143: for (int jg = 0; jg < NumGroups; ++jg) |
144: { |
145: if (F[jg] != nullptr) |
146: curVat += F[jg]->evaluateV(-1, Ions.first(jg), Ions.last(jg), dist, DistCompressed.data()); |
147: } |
148: } |
149: else |
150: { |
151: for (int c = 0; c < Nions; ++c) |
152: { |
153: int gid = Ions.GroupID[c]; |
154: if (F[gid] != nullptr) |
155: curVat += F[gid]->evaluate(dist[c]); |
/cluster/comp/gcc/13.2.0/include/c++/13.2.0/bits/shared_ptr_base.h: 1666 - 1666 |
-------------------------------------------------------------------------------- |
1666: { return _M_ptr; } |
/cluster/comp/gcc/13.2.0/include/c++/13.2.0/bits/stl_vector.h: 990 - 1145 |
-------------------------------------------------------------------------------- |
990: { return size_type(this->_M_impl._M_finish - this->_M_impl._M_start); } |
[...] |
1123: operator[](size_type __n) _GLIBCXX_NOEXCEPT |
1124: { |
1125: __glibcxx_requires_subscript(__n); |
1126: return *(this->_M_impl._M_start + __n); |
[...] |
1142: operator[](size_type __n) const _GLIBCXX_NOEXCEPT |
1143: { |
1144: __glibcxx_requires_subscript(__n); |
1145: return *(this->_M_impl._M_start + __n); |
/home/eoseret/qaas_runs_CPU_9468/171-143-7755/intel/miniqmc/build/miniqmc/src/Particle/ParticleSet.h: 313 - 316 |
-------------------------------------------------------------------------------- |
313: inline int first(int igroup) const { return (*group_offsets_)[igroup]; } |
314: |
315: ///return the last index of a group i |
316: inline int last(int igroup) const { return (*group_offsets_)[igroup + 1]; } |
/home/eoseret/qaas_runs_CPU_9468/171-143-7755/intel/miniqmc/build/miniqmc/src/QMCWaveFunctions/Jastrow/BsplineFunctor.h: 164 - 260 |
-------------------------------------------------------------------------------- |
164: inline real_type evaluate(real_type r) |
165: { |
166: if (r >= cutoff_radius) |
167: return 0.0; |
168: r *= DeltaRInv; |
169: real_type ipart, t; |
170: t = std::modf(r, &ipart); |
171: int i = (int)ipart; |
172: real_type tp[4]; |
173: tp[0] = t * t * t; |
[...] |
179: (SplineCoefs[i+0]*(A[ 0]*tp[0] + A[ 1]*tp[1] + A[ 2]*tp[2] + A[ 3]*tp[3])+ |
180: SplineCoefs[i+1]*(A[ 4]*tp[0] + A[ 5]*tp[1] + A[ 6]*tp[2] + A[ 7]*tp[3])+ |
181: SplineCoefs[i+2]*(A[ 8]*tp[0] + A[ 9]*tp[1] + A[10]*tp[2] + A[11]*tp[3])+ |
182: SplineCoefs[i+3]*(A[12]*tp[0] + A[13]*tp[1] + A[14]*tp[2] + A[15]*tp[3])); |
[...] |
231: ASSUME_ALIGNED(distArrayCompressed); |
232: int iCount = 0; |
233: const int iLimit = iEnd - iStart; |
234: |
235: #pragma vector always |
236: for (int jat = 0; jat < iLimit; jat++) |
237: { |
238: real_type r = distArray[jat]; |
239: // pick the distances smaller than the cutoff and avoid the reference atom |
240: if (r < cutoff_radius && iStart + jat != iat) |
241: distArrayCompressed[iCount++] = distArray[jat]; |
242: } |
243: |
244: real_type d = 0.0; |
245: //#pragma omp simd reduction(+:d) |
246: for (int jat = 0; jat < iCount; jat++) |
247: { |
248: real_type r = distArrayCompressed[jat]; |
249: r *= DeltaRInv; |
250: int i = (int)r; |
251: real_type t = r - real_type(i); |
252: real_type tp0 = t * t * t; |
253: real_type tp1 = t * t; |
254: real_type tp2 = t; |
255: |
256: real_type d1 = SplineCoefs[i + 0] * (A[0] * tp0 + A[1] * tp1 + A[2] * tp2 + A[3]); |
257: real_type d2 = SplineCoefs[i + 1] * (A[4] * tp0 + A[5] * tp1 + A[6] * tp2 + A[7]); |
258: real_type d3 = SplineCoefs[i + 2] * (A[8] * tp0 + A[9] * tp1 + A[10] * tp2 + A[11]); |
259: real_type d4 = SplineCoefs[i + 3] * (A[12] * tp0 + A[13] * tp1 + A[14] * tp2 + A[15]); |
260: d += (d1 + d2 + d3 + d4); |
/home/eoseret/qaas_runs_CPU_9468/171-143-7755/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/OhmmsVector.h: 223 - 249 |
-------------------------------------------------------------------------------- |
223: return X[i]; |
[...] |
229: return X[i]; |
[...] |
249: inline const_pointer data() const { return X; } |
Path / |
Metric | Value |
---|---|
CQA speedup if no scalar integer | 1.72 |
CQA speedup if FP arith vectorized | 1.98 |
CQA speedup if fully vectorized | 10.23 |
CQA speedup if no inter-iteration dependency | NA |
CQA speedup if next bottleneck killed | 1.24 |
Bottlenecks | micro-operation queue, |
Function | _ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE |
Source | OneBodyJastrowRef.h:134-135,OneBodyJastrowRef.h:140-141,OneBodyJastrowRef.h:151-151,OneBodyJastrowRef.h:154-155,stl_vector.h:990-990,stl_vector.h:1123-1123,stl_vector.h:1126-1126,BsplineFunctor.h:164-173,BsplineFunctor.h:179-182,BsplineFunctor.h:256-258,OhmmsVector.h:229-229,OhmmsVector.h:249-249 |
Source loop unroll info | NA |
Source loop unroll confidence level | NA |
Unroll/vectorization loop type | NA |
Unroll factor | NA |
CQA cycles | 22.33 |
CQA cycles if no scalar integer | 13.00 |
CQA cycles if FP arith vectorized | 11.29 |
CQA cycles if fully vectorized | 2.18 |
Front-end cycles | 22.33 |
DIV/SQRT cycles | 13.50 |
P0 cycles | 13.50 |
P1 cycles | 18.00 |
P2 cycles | 18.00 |
P3 cycles | 9.50 |
P4 cycles | 10.00 |
P5 cycles | 9.00 |
P6 cycles | 9.50 |
P7 cycles | 9.50 |
P8 cycles | 9.50 |
P9 cycles | 9.00 |
P10 cycles | 18.00 |
P11 cycles | 0.00 |
Inter-iter dependencies cycles | NA |
FE+BE cycles (UFS) | 26.90 - 26.91 |
Stall cycles (UFS) | 4.80 - 4.82 |
Nb insns | 124.00 |
Nb uops | 130.00 |
Nb loads | 54.00 |
Nb stores | 16.00 |
Nb stack references | 12.00 |
FLOP/cycle | 1.61 |
Nb FLOP add-sub | 7.00 |
Nb FLOP mul | 9.00 |
Nb FLOP fma | 10.00 |
Nb FLOP div | 0.00 |
Nb FLOP rcp | 0.00 |
Nb FLOP sqrt | 0.00 |
Nb FLOP rsqrt | 0.00 |
Bytes/cycle | 26.33 |
Bytes prefetched | 0.00 |
Bytes loaded | 412.00 |
Bytes stored | 176.00 |
Stride 0 | NA |
Stride 1 | NA |
Stride n | NA |
Stride unknown | NA |
Stride indirect | NA |
Vectorization ratio all | 6.06 |
Vectorization ratio load | 0.00 |
Vectorization ratio store | 12.50 |
Vectorization ratio mul | 0.00 |
Vectorization ratio add_sub | 0.00 |
Vectorization ratio fma | 0.00 |
Vectorization ratio div_sqrt | NA |
Vectorization ratio other | 15.38 |
Vector-efficiency ratio all | 13.45 |
Vector-efficiency ratio load | 12.30 |
Vector-efficiency ratio store | 16.80 |
Vector-efficiency ratio mul | 12.50 |
Vector-efficiency ratio add_sub | 12.50 |
Vector-efficiency ratio fma | 12.50 |
Vector-efficiency ratio div_sqrt | NA |
Vector-efficiency ratio other | 12.50 |
Metric | Value |
---|---|
CQA speedup if no scalar integer | 1.72 |
CQA speedup if FP arith vectorized | 1.98 |
CQA speedup if fully vectorized | 10.23 |
CQA speedup if no inter-iteration dependency | NA |
CQA speedup if next bottleneck killed | 1.24 |
Bottlenecks | micro-operation queue, |
Function | _ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE |
Source | OneBodyJastrowRef.h:134-135,OneBodyJastrowRef.h:140-141,OneBodyJastrowRef.h:151-151,OneBodyJastrowRef.h:154-155,stl_vector.h:990-990,stl_vector.h:1123-1123,stl_vector.h:1126-1126,BsplineFunctor.h:164-173,BsplineFunctor.h:179-182,BsplineFunctor.h:256-258,OhmmsVector.h:229-229,OhmmsVector.h:249-249 |
Source loop unroll info | NA |
Source loop unroll confidence level | NA |
Unroll/vectorization loop type | NA |
Unroll factor | NA |
CQA cycles | 22.33 |
CQA cycles if no scalar integer | 13.00 |
CQA cycles if FP arith vectorized | 11.29 |
CQA cycles if fully vectorized | 2.18 |
Front-end cycles | 22.33 |
DIV/SQRT cycles | 13.50 |
P0 cycles | 13.50 |
P1 cycles | 18.00 |
P2 cycles | 18.00 |
P3 cycles | 9.50 |
P4 cycles | 10.00 |
P5 cycles | 9.00 |
P6 cycles | 9.50 |
P7 cycles | 9.50 |
P8 cycles | 9.50 |
P9 cycles | 9.00 |
P10 cycles | 18.00 |
P11 cycles | 0.00 |
Inter-iter dependencies cycles | NA |
FE+BE cycles (UFS) | 26.90 - 26.91 |
Stall cycles (UFS) | 4.80 - 4.82 |
Nb insns | 124.00 |
Nb uops | 130.00 |
Nb loads | 54.00 |
Nb stores | 16.00 |
Nb stack references | 12.00 |
FLOP/cycle | 1.61 |
Nb FLOP add-sub | 7.00 |
Nb FLOP mul | 9.00 |
Nb FLOP fma | 10.00 |
Nb FLOP div | 0.00 |
Nb FLOP rcp | 0.00 |
Nb FLOP sqrt | 0.00 |
Nb FLOP rsqrt | 0.00 |
Bytes/cycle | 26.33 |
Bytes prefetched | 0.00 |
Bytes loaded | 412.00 |
Bytes stored | 176.00 |
Stride 0 | NA |
Stride 1 | NA |
Stride n | NA |
Stride unknown | NA |
Stride indirect | NA |
Vectorization ratio all | 6.06 |
Vectorization ratio load | 0.00 |
Vectorization ratio store | 12.50 |
Vectorization ratio mul | 0.00 |
Vectorization ratio add_sub | 0.00 |
Vectorization ratio fma | 0.00 |
Vectorization ratio div_sqrt | NA |
Vectorization ratio other | 15.38 |
Vector-efficiency ratio all | 13.45 |
Vector-efficiency ratio load | 12.30 |
Vector-efficiency ratio store | 16.80 |
Vector-efficiency ratio mul | 12.50 |
Vector-efficiency ratio add_sub | 12.50 |
Vector-efficiency ratio fma | 12.50 |
Vector-efficiency ratio div_sqrt | NA |
Vector-efficiency ratio other | 12.50 |
Path / |
Function | _ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE |
Source file and lines | OneBodyJastrowRef.h:134-155 |
Module | libqmcwfs.so |
nb instructions | 124 |
nb uops | 130 |
loop length | 683 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 16 |
used ymm registers | 2 |
used zmm registers | 0 |
nb stack references | 12 |
ADD-SUB / MUL ratio | 0.78 |
micro-operation queue | 22.33 cycles |
front end | 22.33 cycles |
| P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 13.50 | 13.50 | 18.00 | 18.00 | 9.50 | 10.00 | 9.00 | 9.50 | 9.50 | 9.50 | 9.00 | 18.00 |
cycles | 13.50 | 13.50 | 18.00 | 18.00 | 9.50 | 10.00 | 9.00 | 9.50 | 9.50 | 9.50 | 9.00 | 18.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 26.90-26.91 |
Stall cycles | 4.80-4.82 |
LM full (events) | 7.33-7.26 |
Front-end | 22.33 |
Dispatch | 18.00 |
Overall L1 | 22.33 |
all | 13% |
load | 0% |
store | 16% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 2% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | 0% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 25% |
all | 6% |
load | 0% |
store | 12% |
mul | 0% |
add-sub | 0% |
fma | 0% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
all | 14% |
load | 9% |
store | 18% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 12% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | 12% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
all | 13% |
load | 12% |
store | 16% |
mul | 12% |
add-sub | 12% |
fma | 12% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
MOV -0x1a8(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xf0(%R12),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%R12),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVSXD 0x2a0(%RDI),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD (%RBX,%RDX,8),%XMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD %XMM7,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 8140 <_ZNK11qmcplusplus11ParticleSet14getDistTableABEi@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA (%R13,%R13,4),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD -0x70(%RBP),%XMM10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RAX),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R8,%RDI,8),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x18(%R9),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVSXD 0x98(%R12),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R9D,%R9D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 69088 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0xce8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x2,%R15D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOVQ $0,-0x160(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x1c8(%R12),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KXNORB %K1,%K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV %R13,-0x1b0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTD %EDX,%YMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTD %R15D,%YMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
SAL $0x2,%R9 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R14,-0x1b8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVQ %XMM10,%RBX | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VMOVDQA %YMM11,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVDQA %YMM12,-0x110(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVQ %RBX,%XMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV -0x1b0(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x1b8(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VSUBSD -0x160(%RBP),%XMM10,%XMM10 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
VMOVSD %XMM10,%XMM10,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
CALL 8070 <exp@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%R14),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%R14),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %R10,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VMOVSD %XMM0,(%R10,%R13,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
INC %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SAR $0x3,%RBX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
CMP %RBX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 683f8 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0x58> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x90(%R12),%R11D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R11D,%R11D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 69045 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0xca5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xa0(%R12),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVSXD %R11D,%RSI | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
LEA -0x38(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x1c8(%R12),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VXORPD %XMM6,%XMM6,%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x18(%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RAX,%RSI,4),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
AND $0x1,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 691f6 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0xe56> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVSXD (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX,%RDX,8),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R8,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 691e5 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0xe45> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD (%R10),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VCOMISD 0x8(%R8),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JAE 691e5 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0xe45> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMULSD 0x238(%R8),%XMM0,%XMM0 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
MOV %RCX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD %XMM10,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 8250 <modf@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x90(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VCVTTSD2SI -0x38(%RBP),%EDI | 2 | 1.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 1 |
VMULSD %XMM0,%XMM0,%XMM2 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD 0x28(%R10),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x48(%R10),%XMM9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x68(%R10),%XMM13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x90(%R10),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VFMADD213SD 0x30(%R10),%XMM0,%XMM1 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VFMADD213SD 0x50(%R10),%XMM0,%XMM9 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
MOVSXD %EDI,%R9 | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
VFMADD213SD 0x70(%R10),%XMM0,%XMM13 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
MOV 0x218(%R10),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD %XMM0,%XMM2,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD132SD 0x88(%R10),%XMM4,%XMM0 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VMULSD 0x20(%R10),%XMM2,%XMM5 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VMULSD 0x40(%R10),%XMM2,%XMM8 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VMULSD 0x60(%R10),%XMM2,%XMM12 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VMULSD 0x80(%R10),%XMM2,%XMM15 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VFMADD231SD 0x18(%R10),%XMM3,%XMM5 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VFMADD231SD 0x38(%R10),%XMM3,%XMM8 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VFMADD231SD 0x58(%R10),%XMM3,%XMM12 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VFMADD132SD 0x78(%R10),%XMM15,%XMM3 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
MOV -0xb0(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD %XMM1,%XMM5,%XMM6 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VADDSD %XMM9,%XMM8,%XMM10 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VADDSD %XMM13,%XMM12,%XMM14 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VADDSD %XMM3,%XMM0,%XMM7 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMULSD 0x8(%RAX,%R9,8),%XMM10,%XMM11 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VMOVSD -0xd0(%RBP),%XMM10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD 0x18(%RAX,%R9,8),%XMM7,%XMM0 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VFMADD132SD (%RAX,%R9,8),%XMM11,%XMM6 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VFMADD231SD 0x10(%RAX,%R9,8),%XMM14,%XMM0 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
MOV -0xf0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD %XMM0,%XMM6,%XMM6 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
ADD $0x4,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0x8(%R10),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JE 69446 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0x10a6> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R13,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R12,-0x110(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R14,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VMOVSD %XMM10,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD -0xd0(%RBP),%XMM10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xf0(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x110(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x48(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VSUBSD %XMM6,%XMM10,%XMM10 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
JMP 69045 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0xca5> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
Function | _ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE |
Source file and lines | OneBodyJastrowRef.h:134-155 |
Module | libqmcwfs.so |
nb instructions | 124 |
nb uops | 130 |
loop length | 683 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 16 |
used ymm registers | 2 |
used zmm registers | 0 |
nb stack references | 12 |
ADD-SUB / MUL ratio | 0.78 |
micro-operation queue | 22.33 cycles |
front end | 22.33 cycles |
| P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 13.50 | 13.50 | 18.00 | 18.00 | 9.50 | 10.00 | 9.00 | 9.50 | 9.50 | 9.50 | 9.00 | 18.00 |
cycles | 13.50 | 13.50 | 18.00 | 18.00 | 9.50 | 10.00 | 9.00 | 9.50 | 9.50 | 9.50 | 9.00 | 18.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 26.90-26.91 |
Stall cycles | 4.80-4.82 |
LM full (events) | 7.33-7.26 |
Front-end | 22.33 |
Dispatch | 18.00 |
Overall L1 | 22.33 |
all | 13% |
load | 0% |
store | 16% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 2% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | 0% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 25% |
all | 6% |
load | 0% |
store | 12% |
mul | 0% |
add-sub | 0% |
fma | 0% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
all | 14% |
load | 9% |
store | 18% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 12% |
load | 12% |
store | 12% |
mul | 12% |
add-sub | 12% |
fma | 12% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
all | 13% |
load | 12% |
store | 16% |
mul | 12% |
add-sub | 12% |
fma | 12% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
MOV -0x1a8(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xf0(%R12),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%R12),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVSXD 0x2a0(%RDI),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD (%RBX,%RDX,8),%XMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD %XMM7,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 8140 <_ZNK11qmcplusplus11ParticleSet14getDistTableABEi@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA (%R13,%R13,4),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVSD -0x70(%RBP),%XMM10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RAX),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R8,%RDI,8),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x18(%R9),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVSXD 0x98(%R12),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R9D,%R9D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 69088 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0xce8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x2,%R15D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOVQ $0,-0x160(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x1c8(%R12),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KXNORB %K1,%K1,%K1 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV %R13,-0x1b0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTD %EDX,%YMM11 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTD %R15D,%YMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
SAL $0x2,%R9 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R14,-0x1b8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVQ %XMM10,%RBX | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VMOVDQA %YMM11,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVDQA %YMM12,-0x110(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVQ %RBX,%XMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV -0x1b0(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x1b8(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VSUBSD -0x160(%RBP),%XMM10,%XMM10 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
VMOVSD %XMM10,%XMM10,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
CALL 8070 <exp@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV (%R14),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%R14),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %R10,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VMOVSD %XMM0,(%R10,%R13,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
INC %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SAR $0x3,%RBX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
CMP %RBX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 683f8 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0x58> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x90(%R12),%R11D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R11D,%R11D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 69045 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0xca5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xa0(%R12),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVSXD %R11D,%RSI | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
LEA -0x38(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x1c8(%R12),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VXORPD %XMM6,%XMM6,%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x18(%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RAX,%RSI,4),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
AND $0x1,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 691f6 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0xe56> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVSXD (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX,%RDX,8),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R8,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 691e5 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0xe45> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD (%R10),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VCOMISD 0x8(%R8),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JAE 691e5 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0xe45> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMULSD 0x238(%R8),%XMM0,%XMM0 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
MOV %RCX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD %XMM10,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 8250 <modf@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x90(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VCVTTSD2SI -0x38(%RBP),%EDI | 2 | 1.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 7 | 1 |
VMULSD %XMM0,%XMM0,%XMM2 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VMOVSD 0x28(%R10),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x48(%R10),%XMM9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x68(%R10),%XMM13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x90(%R10),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VFMADD213SD 0x30(%R10),%XMM0,%XMM1 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VFMADD213SD 0x50(%R10),%XMM0,%XMM9 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
MOVSXD %EDI,%R9 | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
VFMADD213SD 0x70(%R10),%XMM0,%XMM13 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
MOV 0x218(%R10),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD %XMM0,%XMM2,%XMM3 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VFMADD132SD 0x88(%R10),%XMM4,%XMM0 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VMULSD 0x20(%R10),%XMM2,%XMM5 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VMULSD 0x40(%R10),%XMM2,%XMM8 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VMULSD 0x60(%R10),%XMM2,%XMM12 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VMULSD 0x80(%R10),%XMM2,%XMM15 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VFMADD231SD 0x18(%R10),%XMM3,%XMM5 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VFMADD231SD 0x38(%R10),%XMM3,%XMM8 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VFMADD231SD 0x58(%R10),%XMM3,%XMM12 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VFMADD132SD 0x78(%R10),%XMM15,%XMM3 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
MOV -0xb0(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD %XMM1,%XMM5,%XMM6 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VADDSD %XMM9,%XMM8,%XMM10 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VADDSD %XMM13,%XMM12,%XMM14 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VADDSD %XMM3,%XMM0,%XMM7 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
VMULSD 0x8(%RAX,%R9,8),%XMM10,%XMM11 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VMOVSD -0xd0(%RBP),%XMM10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD 0x18(%RAX,%R9,8),%XMM7,%XMM0 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VFMADD132SD (%RAX,%R9,8),%XMM11,%XMM6 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
VFMADD231SD 0x10(%RAX,%R9,8),%XMM14,%XMM0 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
MOV -0xf0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD %XMM0,%XMM6,%XMM6 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
ADD $0x4,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0x8(%R10),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JE 69446 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0x10a6> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R13,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R12,-0x110(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R14,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VMOVSD %XMM10,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD -0xd0(%RBP),%XMM10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xf0(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x110(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x48(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VSUBSD %XMM6,%XMM10,%XMM10 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
JMP 69045 <_ZN16miniqmcreference17OneBodyJastrowRefIN11qmcplusplus14BsplineFunctorIdEEE14evaluateRatiosERNS1_18VirtualParticleSetERSt6vectorIdSaIdEE+0xca5> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |