Function: accelerate_kernel_.DIR.OMP.PARALLEL.2 | Module: exec | Source: accelerate_kernel.f90:57-79 | Coverage: 5.15% |
---|
Function: accelerate_kernel_.DIR.OMP.PARALLEL.2 | Module: exec | Source: accelerate_kernel.f90:57-79 | Coverage: 5.15% |
---|
/beegfs/hackathon/users/eoseret/qaas_runs/170-861-0321/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/accelerate_kernel.f90: 57 - 79 |
-------------------------------------------------------------------------------- |
57: !$OMP PARALLEL |
58: |
59: !$OMP DO PRIVATE(j,k,stepbymass_s) |
60: DO k=y_min,y_max+1 |
61: !$OMP SIMD |
62: DO j=x_min,x_max+1 |
63: stepbymass_s=halfdt/((density0(j-1,k-1)*volume(j-1,k-1) & |
64: +density0(j ,k-1)*volume(j ,k-1) & |
65: +density0(j ,k )*volume(j ,k ) & |
66: +density0(j-1,k )*volume(j-1,k )) & |
67: *0.25_8) |
68: |
69: xvel1(j,k)=xvel0(j,k)-stepbymass_s*(xarea(j ,k )*(pressure(j ,k )-pressure(j-1,k )) & |
70: +xarea(j ,k-1)*(pressure(j ,k-1)-pressure(j-1,k-1))) |
71: yvel1(j,k)=yvel0(j,k)-stepbymass_s*(yarea(j ,k )*(pressure(j ,k )-pressure(j ,k-1)) & |
72: +yarea(j-1,k )*(pressure(j-1,k )-pressure(j-1,k-1))) |
73: xvel1(j,k)=xvel1(j,k)-stepbymass_s*(xarea(j ,k )*(viscosity(j ,k )-viscosity(j-1,k )) & |
74: +xarea(j ,k-1)*(viscosity(j ,k-1)-viscosity(j-1,k-1))) |
75: yvel1(j,k)=yvel1(j,k)-stepbymass_s*(yarea(j ,k )*(viscosity(j ,k )-viscosity(j ,k-1)) & |
76: +yarea(j-1,k )*(viscosity(j-1,k )-viscosity(j-1,k-1))) |
77: ENDDO |
78: ENDDO |
79: !$OMP END DO |
0x424590 PUSH %RBP |
0x424591 MOV %RSP,%RBP |
0x424594 PUSH %R15 |
0x424596 PUSH %R14 |
0x424598 PUSH %R13 |
0x42459a PUSH %R12 |
0x42459c PUSH %RBX |
0x42459d AND $-0x20,%RSP |
0x4245a1 SUB $0x480,%RSP |
0x4245a8 MOV %R9,0xa8(%RSP) |
0x4245b0 MOV %RCX,%RSI |
0x4245b3 MOV 0xc0(%RBP),%RAX |
0x4245ba MOV %RAX,0x1e0(%RSP) |
0x4245c2 MOV 0xb8(%RBP),%RAX |
0x4245c9 MOV %RAX,0x1d8(%RSP) |
0x4245d1 MOV 0xb0(%RBP),%RAX |
0x4245d8 MOV %RAX,0x1d0(%RSP) |
0x4245e0 MOV 0xa8(%RBP),%RAX |
0x4245e7 MOV %RAX,0x1c8(%RSP) |
0x4245ef MOV 0xa0(%RBP),%RAX |
0x4245f6 MOV %RAX,0x1c0(%RSP) |
0x4245fe MOV 0x98(%RBP),%RAX |
0x424605 MOV %RAX,0x1b8(%RSP) |
0x42460d MOV 0x60(%RBP),%EBX |
0x424610 MOV 0x58(%RBP),%EAX |
0x424613 SUB %EBX,%EAX |
0x424615 INC %EAX |
0x424617 MOV 0x90(%RBP),%RCX |
0x42461e MOV %RCX,0x1b0(%RSP) |
0x424626 MOV 0x88(%RBP),%RCX |
0x42462d MOV %RCX,0x1a8(%RSP) |
0x424635 MOV 0x80(%RBP),%RCX |
0x42463c MOV %RCX,0x1a0(%RSP) |
0x424644 MOV 0x78(%RBP),%RCX |
0x424648 MOV %RCX,0x198(%RSP) |
0x424650 MOV 0x70(%RBP),%R13 |
0x424654 MOV 0x68(%RBP),%R9 |
0x424658 MOV 0x50(%RBP),%RCX |
0x42465c MOV %RCX,0xa0(%RSP) |
0x424664 MOV 0x48(%RBP),%RCX |
0x424668 MOV %RCX,0x98(%RSP) |
0x424670 MOV 0x40(%RBP),%RCX |
0x424674 MOV %RCX,0x90(%RSP) |
0x42467c MOV 0x38(%RBP),%RCX |
0x424680 MOV %RCX,0x88(%RSP) |
0x424688 MOV 0x30(%RBP),%RCX |
0x42468c MOV %RCX,0x80(%RSP) |
0x424694 MOV 0x28(%RBP),%RCX |
0x424698 MOV %RCX,0x78(%RSP) |
0x42469d MOV 0x20(%RBP),%RCX |
0x4246a1 MOV %RCX,0x70(%RSP) |
0x4246a6 MOV 0x18(%RBP),%RCX |
0x4246aa MOV %RCX,0x68(%RSP) |
0x4246af MOV 0x10(%RBP),%RCX |
0x4246b3 MOV %RCX,0x60(%RSP) |
0x4246b8 MOVL $0,0x5c(%RSP) |
0x4246c0 JS 42474f |
0x4246c6 MOV %R9,0x8(%RSP) |
0x4246cb MOV %RDX,%R14 |
0x4246ce MOV %R8,%R15 |
0x4246d1 MOV %RSI,0x20(%RSP) |
0x4246d6 MOV %RDI,0x110(%RSP) |
0x4246de MOV (%RDI),%ESI |
0x4246e0 MOVL $0,0x34(%RSP) |
0x4246e8 MOV %EAX,0x30(%RSP) |
0x4246ec MOVL $0x1,0x58(%RSP) |
0x4246f4 SUB $0x8,%RSP |
0x4246f8 LEA 0x60(%RSP),%RAX |
0x4246fd LEA 0x64(%RSP),%RCX |
0x424702 LEA 0x3c(%RSP),%R8 |
0x424707 LEA 0x38(%RSP),%R9 |
0x42470c MOV $0x53b290,%EDI |
0x424711 MOV %ESI,0x54(%RSP) |
0x424715 MOV $0x22,%EDX |
0x42471a PUSH $0x1 |
0x42471c PUSH $0x1 |
0x42471e PUSH %RAX |
0x42471f CALL 404670 <__kmpc_for_static_init_4@plt> |
0x424724 ADD $0x20,%RSP |
0x424728 MOV 0x34(%RSP),%EAX |
0x42472c MOV 0x30(%RSP),%R12D |
0x424731 SUB %EAX,%R12D |
0x424734 JAE 424769 |
0x424736 MOV $0x53b2b0,%EDI |
0x42473b MOV 0x4c(%RSP),%ESI |
0x42473f VZEROUPPER |
0x424742 CALL 404230 <__kmpc_for_static_fini@plt> |
0x424747 MOV 0x110(%RSP),%RDI |
0x42474f MOV (%RDI),%ESI |
0x424751 MOV $0x53b2d0,%EDI |
0x424756 LEA -0x28(%RBP),%RSP |
0x42475a POP %RBX |
0x42475b POP %R12 |
0x42475d POP %R13 |
0x42475f POP %R14 |
0x424761 POP %R15 |
0x424763 POP %RBP |
0x424764 JMP 404740 |
0x424769 MOV %RAX,%R8 |
0x42476c VMOVQ %R14,%XMM0 |
0x424771 MOV %R15,%R9 |
0x424774 SAL $0x20,%R9 |
0x424778 MOV $-0x200000000,%RAX |
0x424782 LEA (%R9,%RAX,1),%RCX |
0x424786 MOV %RCX,%R10 |
0x424789 SAR $0x20,%R10 |
0x42478d MOV 0x20(%RSP),%RDX |
0x424792 SAL $0x20,%RDX |
0x424796 ADD %RDX,%RAX |
0x424799 MOV %RDX,%R14 |
0x42479c MOV %RAX,%R11 |
0x42479f SAR $0x20,%R11 |
0x4247a3 ADD %EBX,%R8D |
0x4247a6 MOVSXD (%R13),%RBX |
0x4247aa MOV 0x8(%RSP),%RDX |
0x4247af MOV (%RDX),%EDX |
0x4247b1 SUB %EBX,%EDX |
0x4247b3 LEA 0x1(%RDX),%ESI |
0x4247b6 MOV %ESI,0x54(%RSP) |
0x4247ba ADD $0x2,%EDX |
0x4247bd CMP $0x2,%EDX |
0x4247c0 MOV $0x1,%R15D |
0x4247c6 CMOVGE %EDX,%R15D |
0x4247ca MOV %R15D,%EDX |
0x4247cd AND $0x7ffffffc,%EDX |
0x4247d3 MOV %RDX,0x20(%RSP) |
0x4247d8 TEST %RCX,%RCX |
0x4247db MOV $-0x1,%RDX |
0x4247e2 CMOVNS %RCX,%RDX |
0x4247e6 TEST %RDX,%RDX |
0x4247e9 MOV $0x1,%ESI |
0x4247ee CMOVG %RSI,%RDX |
0x4247f2 MOV $0x200000000,%R13 |
0x4247fc MOV %R13,%RDI |
0x4247ff SUB %R9,%RDI |
0x424802 CMP %RDI,%RCX |
0x424805 CMOVG %RCX,%RDI |
0x424809 MOV %R11,0xb8(%RSP) |
0x424811 NOT %R11 |
0x424814 MOV %R11,0xb0(%RSP) |
0x42481c VPBROADCASTQ %XMM0,%YMM0 |
0x424821 MOV %R15,0x170(%RSP) |
0x424829 VPBROADCASTQ %R15,%YMM1 |
0x42482f VMOVDQA %YMM1,0x220(%RSP) |
0x424838 SHR $0x20,%RDI |
0x42483c IMUL %RDX,%RDI |
0x424840 MOV %RBX,0x180(%RSP) |
0x424848 LEA (,%RBX,8),%R11 |
0x424850 SAL $0x3,%RDI |
0x424854 SUB %RDI,%R11 |
0x424857 MOV $-0x1,%RCX |
0x42485e TEST %RAX,%RAX |
0x424861 CMOVNS %RAX,%RCX |
0x424865 TEST %RCX,%RCX |
0x424868 CMOVG %RSI,%RCX |
0x42486c MOV %R10,0x188(%RSP) |
0x424874 NOT %R10 |
0x424877 MOV %R10,0x178(%RSP) |
0x42487f SUB %R14,%R13 |
0x424882 MOV 0x90(%RSP),%RDX |
0x42488a ADD %R11,%RDX |
0x42488d MOV %RDX,0x158(%RSP) |
0x424895 CMP %R13,%RAX |
0x424898 CMOVG %RAX,%R13 |
0x42489c MOV 0x88(%RSP),%RAX |
0x4248a4 ADD %R11,%RAX |
0x4248a7 MOV %RAX,0x150(%RSP) |
0x4248af SHR $0x20,%R13 |
0x4248b3 IMUL %RCX,%R13 |
0x4248b7 NEG %R13 |
0x4248ba MOV %R13,0x168(%RSP) |
0x4248c2 MOV 0x80(%RSP),%RAX |
0x4248ca ADD %R11,%RAX |
0x4248cd MOV %RAX,0x148(%RSP) |
0x4248d5 MOV 0x98(%RSP),%RAX |
0x4248dd LEA (%RAX,%R11,1),%RAX |
0x4248e1 MOV %RAX,0x140(%RSP) |
0x4248e9 MOV 0x78(%RSP),%RAX |
0x4248ee LEA (%RAX,%R11,1),%RAX |
0x4248f2 MOV %RAX,0x138(%RSP) |
0x4248fa MOV 0xa8(%RSP),%RAX |
0x424902 LEA (%RAX,%R11,1),%RAX |
0x424906 MOV %RAX,0x130(%RSP) |
0x42490e MOV 0x68(%RSP),%RAX |
0x424913 ADD %R11,%RAX |
0x424916 MOV %RAX,0x128(%RSP) |
0x42491e MOV 0x60(%RSP),%RAX |
0x424923 ADD %R11,%RAX |
0x424926 MOV %RAX,0x120(%RSP) |
0x42492e MOV 0x70(%RSP),%RAX |
0x424933 ADD %R11,%RAX |
0x424936 MOV %RAX,0x118(%RSP) |
0x42493e ADD 0xa0(%RSP),%R11 |
0x424946 MOV %R11,0x160(%RSP) |
0x42494e VBROADCASTSD 0xd4261(%RIP),%YMM3 |
0x424957 XOR %R13D,%R13D |
0x42495a MOV %R8,0x190(%RSP) |
0x424962 MOV %R8D,%R15D |
0x424965 MOV %R12D,0x2c(%RSP) |
0x42496a JMP 424e13 |
0x42496f NOP |
(119) 0x424970 MOVSXD %ESI,%RSI |
(119) 0x424973 MOV 0xb0(%RSP),%RDI |
(119) 0x42497b ADD %RSI,%RDI |
(119) 0x42497e MOV %RCX,%R9 |
(119) 0x424981 IMUL %RDI,%R9 |
(119) 0x424985 MOV %R9,0xd0(%RSP) |
(119) 0x42498d MOV %RDX,%R13 |
(119) 0x424990 MOV %R8,%RDX |
(119) 0x424993 MOV %R8,%R9 |
(119) 0x424996 IMUL %RDI,%R9 |
(119) 0x42499a MOV %R9,0xd8(%RSP) |
(119) 0x4249a2 MOV %R13,%R14 |
(119) 0x4249a5 IMUL %RDI,%R13 |
(119) 0x4249a9 MOV %R10,%R9 |
(119) 0x4249ac IMUL %RDI,%R10 |
(119) 0x4249b0 MOV %R11,%R8 |
(119) 0x4249b3 MOV %R11,%R12 |
(119) 0x4249b6 IMUL %RDI,%R8 |
(119) 0x4249ba SUB 0xb8(%RSP),%RSI |
(119) 0x4249c2 IMUL %RSI,%RCX |
(119) 0x4249c6 IMUL %RSI,%RDX |
(119) 0x4249ca IMUL %RSI,%R14 |
(119) 0x4249ce MOV %R14,0xe0(%RSP) |
(119) 0x4249d6 IMUL %RSI,%R9 |
(119) 0x4249da MOV %R9,0xe8(%RSP) |
(119) 0x4249e2 MOV %RBX,%RAX |
(119) 0x4249e5 IMUL %RSI,%RAX |
(119) 0x4249e9 IMUL %RSI,%R12 |
(119) 0x4249ed MOV %R12,0xf8(%RSP) |
(119) 0x4249f5 MOV 0x2c(%RSP),%R12D |
(119) 0x4249fa MOV 0x18(%RSP),%R9 |
(119) 0x4249ff IMUL %RSI,%R9 |
(119) 0x424a03 MOV 0x10(%RSP),%RDI |
(119) 0x424a08 IMUL %RSI,%RDI |
(119) 0x424a0c MOV 0x38(%RSP),%RBX |
(119) 0x424a11 IMUL %RSI,%RBX |
(119) 0x424a15 MOV 0x8(%RSP),%R11 |
(119) 0x424a1a IMUL %RSI,%R11 |
(119) 0x424a1e MOV %R9,0xf0(%RSP) |
(119) 0x424a26 MOV %R8,0x100(%RSP) |
(119) 0x424a2e MOV %RAX,%R9 |
(119) 0x424a31 MOV %R13,%R14 |
(119) 0x424a34 MOV 0x108(%RSP),%R13 |
(119) 0x424a3c MOV %RDX,0xc8(%RSP) |
(119) 0x424a44 MOV %RCX,0xc0(%RSP) |
(119) 0x424a4c XOR %EAX,%EAX |
(119) 0x424a4e VPBROADCASTQ %RAX,%YMM1 |
(119) 0x424a54 VMOVDQA 0x220(%RSP),%YMM2 |
(119) 0x424a5d VPSUBQ %YMM1,%YMM2,%YMM1 |
(119) 0x424a61 VPCMPNLEUQ 0xd36d4(%RIP),%YMM1,%K1 |
(119) 0x424a6c MOV 0x90(%RSP),%RDX |
(119) 0x424a74 MOV 0xd0(%RSP),%RSI |
(119) 0x424a7c ADD %RDX,%RSI |
(119) 0x424a7f ADD 0x180(%RSP),%RAX |
(119) 0x424a87 MOV 0x178(%RSP),%RCX |
(119) 0x424a8f ADD %RAX,%RCX |
(119) 0x424a92 VMOVUPD (%RSI,%RCX,8),%YMM26{%K1}{z} |
(119) 0x424a99 SUB 0x188(%RSP),%RAX |
(119) 0x424aa1 VMOVUPD (%RSI,%RAX,8),%YMM27{%K1}{z} |
(119) 0x424aa8 MOV 0x88(%RSP),%RSI |
(119) 0x424ab0 MOV 0xd8(%RSP),%R8 |
(119) 0x424ab8 ADD %RSI,%R8 |
(119) 0x424abb VMOVUPD (%R8,%RCX,8),%YMM28{%K1}{z} |
(119) 0x424ac2 VMOVUPD (%R8,%RAX,8),%YMM29{%K1}{z} |
(119) 0x424ac9 MOV 0xc0(%RSP),%R8 |
(119) 0x424ad1 ADD %RDX,%R8 |
(119) 0x424ad4 VMOVUPD (%R8,%RAX,8),%YMM30{%K1}{z} |
(119) 0x424adb VMOVUPD (%R8,%RCX,8),%YMM31{%K1}{z} |
(119) 0x424ae2 MOV 0xc8(%RSP),%RDX |
(119) 0x424aea ADD %RSI,%RDX |
(119) 0x424aed VMOVUPD (%RDX,%RAX,8),%YMM2{%K1}{z} |
(119) 0x424af4 VMOVUPD (%RDX,%RCX,8),%YMM1{%K1}{z} |
(119) 0x424afb MOV 0xa0(%RSP),%RDX |
(119) 0x424b03 MOV 0xe0(%RSP),%RSI |
(119) 0x424b0b ADD %RDX,%RSI |
(119) 0x424b0e VMOVUPD (%RSI,%RAX,8),%YMM4{%K1}{z} |
(119) 0x424b15 MOV 0x80(%RSP),%RSI |
(119) 0x424b1d MOV 0xe8(%RSP),%R8 |
(119) 0x424b25 ADD %RSI,%R8 |
(119) 0x424b28 VMOVUPD (%R8,%RAX,8),%YMM5{%K1}{z} |
(119) 0x424b2f VMOVUPD (%R8,%RCX,8),%YMM18{%K1}{z} |
(119) 0x424b36 ADD %RDX,%R14 |
(119) 0x424b39 VMOVUPD (%R14,%RAX,8),%YMM19{%K1}{z} |
(119) 0x424b40 ADD %RSI,%R10 |
(119) 0x424b43 VMOVUPD (%R10,%RAX,8),%YMM20{%K1}{z} |
(119) 0x424b4a VMOVUPD (%R10,%RCX,8),%YMM21{%K1}{z} |
(119) 0x424b51 ADD 0x98(%RSP),%R9 |
(119) 0x424b59 VMOVUPD (%R9,%RAX,8),%YMM22{%K1}{z} |
(119) 0x424b60 VMOVUPD (%R9,%RCX,8),%YMM23{%K1}{z} |
(119) 0x424b67 MOV 0x78(%RSP),%RDX |
(119) 0x424b6c MOV 0xf8(%RSP),%RSI |
(119) 0x424b74 ADD %RDX,%RSI |
(119) 0x424b77 VMOVUPD (%RSI,%RAX,8),%YMM24{%K1}{z} |
(119) 0x424b7e VMOVUPD (%RSI,%RCX,8),%YMM25{%K1}{z} |
(119) 0x424b85 MOV 0x100(%RSP),%RSI |
(119) 0x424b8d ADD %RDX,%RSI |
(119) 0x424b90 VMOVUPD (%RSI,%RCX,8),%YMM6{%K1}{z} |
(119) 0x424b97 VMOVUPD (%RSI,%RAX,8),%YMM7{%K1}{z} |
(119) 0x424b9e MOV 0xf0(%RSP),%RCX |
(119) 0x424ba6 ADD 0x70(%RSP),%RCX |
(119) 0x424bab VMOVUPD (%RCX,%RAX,8),%YMM8{%K1}{z} |
(119) 0x424bb2 VMOVAPD 0x260(%RSP),%YMM12 |
(119) 0x424bbb VMOVAPD %YMM26,%YMM12{%K1} |
(119) 0x424bc1 VMOVAPD 0x2a0(%RSP),%YMM11 |
(119) 0x424bca VMOVAPD %YMM28,%YMM11{%K1} |
(119) 0x424bd0 VMOVAPD 0x2e0(%RSP),%YMM10 |
(119) 0x424bd9 VMOVAPD %YMM27,%YMM10{%K1} |
(119) 0x424bdf VMOVAPD 0x320(%RSP),%YMM9 |
(119) 0x424be8 VMOVAPD %YMM29,%YMM9{%K1} |
(119) 0x424bee VMOVAPD 0x340(%RSP),%YMM29 |
(119) 0x424bf6 VMOVAPD %YMM30,%YMM29{%K1} |
(119) 0x424bfc VMOVAPD 0x360(%RSP),%YMM28 |
(119) 0x424c04 VMOVAPD %YMM2,%YMM28{%K1} |
(119) 0x424c0a VMOVAPD 0x380(%RSP),%YMM27 |
(119) 0x424c12 VMOVAPD %YMM31,%YMM27{%K1} |
(119) 0x424c18 VMOVAPD 0x3a0(%RSP),%YMM26 |
(119) 0x424c20 VMOVAPD %YMM1,%YMM26{%K1} |
(119) 0x424c26 VMOVAPD %YMM4,%YMM17{%K1} |
(119) 0x424c2c VMOVAPD %YMM5,%YMM16{%K1} |
(119) 0x424c32 VMOVAPD %YMM18,%YMM15{%K1} |
(119) 0x424c38 VMOVAPD %YMM19,%YMM14{%K1} |
(119) 0x424c3e VMOVAPD %YMM20,%YMM13{%K1} |
(119) 0x424c44 VSUBPD %YMM16,%YMM15,%YMM1 |
(119) 0x424c4a VMULPD %YMM17,%YMM1,%YMM1 |
(119) 0x424c50 VMOVAPD 0x240(%RSP),%YMM5 |
(119) 0x424c59 VMOVAPD %YMM21,%YMM5{%K1} |
(119) 0x424c5f VSUBPD %YMM13,%YMM5,%YMM2 |
(119) 0x424c64 VFMADD213PD %YMM1,%YMM14,%YMM2 |
(119) 0x424c69 VMOVAPD 0x300(%RSP),%YMM20 |
(119) 0x424c71 VMOVAPD %YMM24,%YMM20{%K1} |
(119) 0x424c77 VMOVAPD 0x3c0(%RSP),%YMM19 |
(119) 0x424c7f VMOVAPD %YMM25,%YMM19{%K1} |
(119) 0x424c85 VMOVAPD 0x3e0(%RSP),%YMM18 |
(119) 0x424c8d VMOVAPD %YMM7,%YMM18{%K1} |
(119) 0x424c93 VMOVAPD 0x400(%RSP),%YMM7 |
(119) 0x424c9c VMOVAPD %YMM6,%YMM7{%K1} |
(119) 0x424ca2 VSUBPD %YMM20,%YMM19,%YMM1 |
(119) 0x424ca8 VFMADD213PD %YMM2,%YMM17,%YMM1 |
(119) 0x424cae VSUBPD %YMM18,%YMM7,%YMM2 |
(119) 0x424cb4 VFMADD231PD %YMM2,%YMM14,%YMM1 |
(119) 0x424cb9 VMOVAPD %YMM11,0x2a0(%RSP) |
(119) 0x424cc2 VMOVAPD %YMM12,0x260(%RSP) |
(119) 0x424ccb VMULPD %YMM11,%YMM12,%YMM2 |
(119) 0x424cd0 VMOVAPD %YMM9,0x320(%RSP) |
(119) 0x424cd9 VMOVAPD %YMM10,0x2e0(%RSP) |
(119) 0x424ce2 VFMADD231PD %YMM9,%YMM10,%YMM2 |
(119) 0x424ce7 VMOVAPD %YMM28,0x360(%RSP) |
(119) 0x424cef VMOVAPD %YMM29,0x340(%RSP) |
(119) 0x424cf7 VFMADD231PD %YMM28,%YMM29,%YMM2 |
(119) 0x424cfd VMOVAPD %YMM26,0x3a0(%RSP) |
(119) 0x424d05 VMOVAPD %YMM27,0x380(%RSP) |
(119) 0x424d0d VFMADD231PD %YMM26,%YMM27,%YMM2 |
(119) 0x424d13 VMULPD %YMM3,%YMM2,%YMM2 |
(119) 0x424d17 VDIVPD %YMM2,%YMM0,%YMM2 |
(119) 0x424d1b VMOVAPD 0x420(%RSP),%YMM4 |
(119) 0x424d24 VMOVAPD %YMM8,%YMM4{%K1} |
(119) 0x424d2a VMOVAPD %YMM4,0x420(%RSP) |
(119) 0x424d33 VFMADD213PD %YMM4,%YMM2,%YMM1 |
(119) 0x424d38 ADD 0x60(%RSP),%RDI |
(119) 0x424d3d VMOVUPD %YMM1,(%RDI,%RAX,8){%K1} |
(119) 0x424d44 ADD 0x68(%RSP),%RBX |
(119) 0x424d49 VMOVUPD (%RBX,%RAX,8),%YMM1{%K1}{z} |
(119) 0x424d50 VMOVAPD 0x280(%RSP),%YMM9 |
(119) 0x424d59 VMOVAPD %YMM22,%YMM9{%K1} |
(119) 0x424d5f VSUBPD %YMM16,%YMM13,%YMM4 |
(119) 0x424d65 VMULPD %YMM4,%YMM9,%YMM4 |
(119) 0x424d69 VMOVAPD 0x2c0(%RSP),%YMM8 |
(119) 0x424d72 VMOVAPD %YMM23,%YMM8{%K1} |
(119) 0x424d78 VMOVAPD %YMM5,0x240(%RSP) |
(119) 0x424d81 VSUBPD %YMM15,%YMM5,%YMM5 |
(119) 0x424d86 VFMADD213PD %YMM4,%YMM8,%YMM5 |
(119) 0x424d8b VMOVAPD %YMM18,0x3e0(%RSP) |
(119) 0x424d93 VMOVAPD %YMM20,0x300(%RSP) |
(119) 0x424d9b VSUBPD %YMM20,%YMM18,%YMM4 |
(119) 0x424da1 VMOVAPD %YMM7,0x400(%RSP) |
(119) 0x424daa VMOVAPD %YMM19,0x3c0(%RSP) |
(119) 0x424db2 VSUBPD %YMM19,%YMM7,%YMM6 |
(119) 0x424db8 VMOVAPD %YMM9,0x280(%RSP) |
(119) 0x424dc1 VFMADD213PD %YMM5,%YMM9,%YMM4 |
(119) 0x424dc6 VMOVAPD %YMM8,0x2c0(%RSP) |
(119) 0x424dcf VFMADD231PD %YMM6,%YMM8,%YMM4 |
(119) 0x424dd4 VMOVAPD 0x440(%RSP),%YMM5 |
(119) 0x424ddd VMOVAPD %YMM1,%YMM5{%K1} |
(119) 0x424de3 VMOVAPD %YMM5,0x440(%RSP) |
(119) 0x424dec VFMADD213PD %YMM5,%YMM2,%YMM4 |
(119) 0x424df1 ADD 0xa8(%RSP),%R11 |
(119) 0x424df9 VMOVUPD %YMM4,(%R11,%RAX,8){%K1} |
(119) 0x424e00 LEA 0x1(%R13),%EAX |
(119) 0x424e04 INC %R15D |
(119) 0x424e07 CMP %R12D,%R13D |
(119) 0x424e0a MOV %EAX,%R13D |
(119) 0x424e0d JE 424736 |
(119) 0x424e13 CMPL $0,0x54(%RSP) |
(119) 0x424e18 JS 424e00 |
(119) 0x424e1a MOV 0x190(%RSP),%RAX |
(119) 0x424e22 LEA (%RAX,%R13,1),%ESI |
(119) 0x424e26 MOV 0x198(%RSP),%RAX |
(119) 0x424e2e MOV (%RAX),%R8 |
(119) 0x424e31 MOV 0x1a0(%RSP),%RAX |
(119) 0x424e39 MOV (%RAX),%RCX |
(119) 0x424e3c MOV 0x1a8(%RSP),%RAX |
(119) 0x424e44 MOV (%RAX),%RAX |
(119) 0x424e47 MOV %RAX,0x18(%RSP) |
(119) 0x424e4c MOV 0x1b0(%RSP),%RAX |
(119) 0x424e54 MOV (%RAX),%RDX |
(119) 0x424e57 MOV 0x1b8(%RSP),%RAX |
(119) 0x424e5f MOV (%RAX),%R10 |
(119) 0x424e62 MOV 0x1c0(%RSP),%RAX |
(119) 0x424e6a MOV (%RAX),%RAX |
(119) 0x424e6d MOV %RAX,0x10(%RSP) |
(119) 0x424e72 MOV 0x1c8(%RSP),%RAX |
(119) 0x424e7a MOV (%RAX),%RAX |
(119) 0x424e7d MOV %RAX,0x38(%RSP) |
(119) 0x424e82 MOV 0x1d0(%RSP),%RAX |
(119) 0x424e8a MOV (%RAX),%RBX |
(119) 0x424e8d MOV 0x1d8(%RSP),%RAX |
(119) 0x424e95 MOV (%RAX),%RAX |
(119) 0x424e98 MOV %RAX,0x8(%RSP) |
(119) 0x424e9d MOV 0x1e0(%RSP),%RAX |
(119) 0x424ea5 MOV (%RAX),%R11 |
(119) 0x424ea8 CMPQ $0,0x20(%RSP) |
(119) 0x424eae MOV %R13,0x108(%RSP) |
(119) 0x424eb6 JE 424970 |
(119) 0x424ebc MOV %R15D,0x50(%RSP) |
(119) 0x424ec1 MOVSXD %R15D,%R15 |
(119) 0x424ec4 MOV 0xb0(%RSP),%RDI |
(119) 0x424ecc LEA (%RDI,%R15,1),%RAX |
(119) 0x424ed0 ADD 0x168(%RSP),%R15 |
(119) 0x424ed8 MOVSXD %ESI,%RSI |
(119) 0x424edb ADD %RSI,%RDI |
(119) 0x424ede MOV %RCX,%R12 |
(119) 0x424ee1 MOV %RCX,%R9 |
(119) 0x424ee4 IMUL %RDI,%R9 |
(119) 0x424ee8 MOV %R9,0xd0(%RSP) |
(119) 0x424ef0 MOV %R8,%R9 |
(119) 0x424ef3 IMUL %RDI,%R9 |
(119) 0x424ef7 MOV %R9,0xd8(%RSP) |
(119) 0x424eff SUB 0xb8(%RSP),%RSI |
(119) 0x424f07 MOV %RCX,%R9 |
(119) 0x424f0a IMUL %RSI,%R9 |
(119) 0x424f0e MOV %R9,0xc0(%RSP) |
(119) 0x424f16 MOV %R8,%R9 |
(119) 0x424f19 IMUL %RSI,%R9 |
(119) 0x424f1d MOV %R9,0xc8(%RSP) |
(119) 0x424f25 MOV %RDX,0x40(%RSP) |
(119) 0x424f2a MOV %RDX,%R9 |
(119) 0x424f2d IMUL %RSI,%R9 |
(119) 0x424f31 MOV %R9,0xe0(%RSP) |
(119) 0x424f39 MOV %R10,%R9 |
(119) 0x424f3c IMUL %RSI,%R9 |
(119) 0x424f40 MOV %R9,0xe8(%RSP) |
(119) 0x424f48 MOV %RDX,%R9 |
(119) 0x424f4b IMUL %RDI,%R9 |
(119) 0x424f4f MOV %R9,0x1f0(%RSP) |
(119) 0x424f57 MOV %R10,%R9 |
(119) 0x424f5a IMUL %RDI,%R9 |
(119) 0x424f5e MOV %R9,0x1f8(%RSP) |
(119) 0x424f66 MOV %RBX,%R9 |
(119) 0x424f69 MOV %RBX,%RDX |
(119) 0x424f6c IMUL %RSI,%R9 |
(119) 0x424f70 MOV %R9,0x200(%RSP) |
(119) 0x424f78 MOV %R11,%R9 |
(119) 0x424f7b IMUL %RSI,%R9 |
(119) 0x424f7f MOV %R9,0xf8(%RSP) |
(119) 0x424f87 IMUL %R11,%RDI |
(119) 0x424f8b MOV %RDI,0x100(%RSP) |
(119) 0x424f93 MOV 0x18(%RSP),%RDI |
(119) 0x424f98 IMUL %RSI,%RDI |
(119) 0x424f9c MOV %RDI,0xf0(%RSP) |
(119) 0x424fa4 MOV 0x10(%RSP),%RDI |
(119) 0x424fa9 IMUL %RSI,%RDI |
(119) 0x424fad MOV %RDI,0x208(%RSP) |
(119) 0x424fb5 MOV 0x38(%RSP),%RBX |
(119) 0x424fba MOV %RBX,%RDI |
(119) 0x424fbd IMUL %RSI,%RDI |
(119) 0x424fc1 MOV %RDI,0x210(%RSP) |
(119) 0x424fc9 MOV 0x8(%RSP),%R13 |
(119) 0x424fce IMUL %R13,%RSI |
(119) 0x424fd2 MOV %RSI,0x218(%RSP) |
(119) 0x424fda MOV %RCX,%RDI |
(119) 0x424fdd IMUL %RAX,%RDI |
(119) 0x424fe1 MOV %R8,%R14 |
(119) 0x424fe4 IMUL %RAX,%R14 |
(119) 0x424fe8 MOV %R15,%RCX |
(119) 0x424feb IMUL %R15,%R12 |
(119) 0x424fef IMUL %R15,%R8 |
(119) 0x424ff3 MOV %R10,%R15 |
(119) 0x424ff6 IMUL %RCX,%R15 |
(119) 0x424ffa IMUL %RAX,%R10 |
(119) 0x424ffe IMUL %RCX,%RDX |
(119) 0x425002 MOV %RDX,0x1e8(%RSP) |
(119) 0x42500a MOV %R11,%R9 |
(119) 0x42500d IMUL %RCX,%R9 |
(119) 0x425011 IMUL %RAX,%R11 |
(119) 0x425015 IMUL %RCX,%R13 |
(119) 0x425019 IMUL %RCX,%RBX |
(119) 0x42501d MOV 0x10(%RSP),%RSI |
(119) 0x425022 IMUL %RCX,%RSI |
(119) 0x425026 MOV %RSI,0x10(%RSP) |
(119) 0x42502b MOV 0x18(%RSP),%RSI |
(119) 0x425030 IMUL %RCX,%RSI |
(119) 0x425034 MOV %RSI,0x18(%RSP) |
(119) 0x425039 MOV 0x40(%RSP),%RSI |
(119) 0x42503e IMUL %RSI,%RAX |
(119) 0x425042 IMUL %RSI,%RCX |
(119) 0x425046 MOV 0x158(%RSP),%RDX |
(119) 0x42504e ADD %RDX,%RDI |
(119) 0x425051 MOV 0x150(%RSP),%RSI |
(119) 0x425059 ADD %RSI,%R14 |
(119) 0x42505c ADD %RDX,%R12 |
(119) 0x42505f MOV %R12,0x8(%RSP) |
(119) 0x425064 ADD %RSI,%R8 |
(119) 0x425067 MOV %R8,0x38(%RSP) |
(119) 0x42506c MOV 0x148(%RSP),%RSI |
(119) 0x425074 ADD %RSI,%R15 |
(119) 0x425077 ADD %RSI,%R10 |
(119) 0x42507a MOV %R10,0x40(%RSP) |
(119) 0x42507f MOV 0x1e8(%RSP),%RDX |
(119) 0x425087 ADD 0x140(%RSP),%RDX |
(119) 0x42508f MOV 0x138(%RSP),%RSI |
(119) 0x425097 ADD %RSI,%R9 |
(119) 0x42509a ADD %RSI,%R11 |
(119) 0x42509d MOV %R11,%R10 |
(119) 0x4250a0 ADD 0x130(%RSP),%R13 |
(119) 0x4250a8 MOV %R13,%R12 |
(119) 0x4250ab ADD 0x128(%RSP),%RBX |
(119) 0x4250b3 MOV %RBX,%R13 |
(119) 0x4250b6 MOV 0x10(%RSP),%R11 |
(119) 0x4250bb ADD 0x120(%RSP),%R11 |
(119) 0x4250c3 MOV 0x18(%RSP),%RBX |
(119) 0x4250c8 ADD 0x118(%RSP),%RBX |
(119) 0x4250d0 MOV 0x160(%RSP),%RSI |
(119) 0x4250d8 ADD %RSI,%RAX |
(119) 0x4250db ADD %RSI,%RCX |
(119) 0x4250de XOR %ESI,%ESI |
(120) 0x4250e0 VMOVUPD -0x8(%RDI,%RSI,8),%YMM1 |
(120) 0x4250e6 VMOVUPD (%RDI,%RSI,8),%YMM2 |
(120) 0x4250eb VMULPD -0x8(%R14,%RSI,8),%YMM1,%YMM1 |
(120) 0x4250f2 VFMADD231PD (%R14,%RSI,8),%YMM2,%YMM1 |
(120) 0x4250f8 MOV 0x8(%RSP),%R8 |
(120) 0x4250fd VMOVUPD -0x8(%R8,%RSI,8),%YMM2 |
(120) 0x425104 VMOVUPD (%R8,%RSI,8),%YMM4 |
(120) 0x42510a MOV 0x38(%RSP),%R8 |
(120) 0x42510f VFMADD132PD (%R8,%RSI,8),%YMM1,%YMM4 |
(120) 0x425115 VFMADD231PD -0x8(%R8,%RSI,8),%YMM2,%YMM4 |
(120) 0x42511c VMULPD %YMM3,%YMM4,%YMM1 |
(120) 0x425120 VDIVPD %YMM1,%YMM0,%YMM1 |
(120) 0x425124 VMOVUPD (%RCX,%RSI,8),%YMM2 |
(120) 0x425129 VMOVUPD -0x8(%R15,%RSI,8),%YMM4 |
(120) 0x425130 VMOVUPD (%R15,%RSI,8),%YMM5 |
(120) 0x425136 VSUBPD %YMM5,%YMM4,%YMM6 |
(120) 0x42513a VMULPD %YMM2,%YMM6,%YMM6 |
(120) 0x42513e VMOVUPD (%RAX,%RSI,8),%YMM7 |
(120) 0x425143 MOV 0x40(%RSP),%R8 |
(120) 0x425148 VMOVUPD -0x8(%R8,%RSI,8),%YMM8 |
(120) 0x42514f VMOVUPD (%R8,%RSI,8),%YMM18 |
(120) 0x425156 VSUBPD %YMM18,%YMM8,%YMM19 |
(120) 0x42515c VFMADD213PD %YMM6,%YMM7,%YMM19 |
(120) 0x425162 MOV %RDX,%R8 |
(120) 0x425165 VMOVUPD -0x8(%RDX,%RSI,8),%YMM6 |
(120) 0x42516b VMOVUPD (%RDX,%RSI,8),%YMM20 |
(120) 0x425172 VSUBPD %YMM5,%YMM18,%YMM5 |
(120) 0x425178 VMULPD %YMM5,%YMM20,%YMM5 |
(120) 0x42517e VSUBPD %YMM4,%YMM8,%YMM4 |
(120) 0x425182 VFMADD213PD %YMM5,%YMM6,%YMM4 |
(120) 0x425187 VMOVUPD -0x8(%R9,%RSI,8),%YMM5 |
(120) 0x42518e VMOVUPD (%R9,%RSI,8),%YMM8 |
(120) 0x425194 MOV %R10,%R8 |
(120) 0x425197 VMOVUPD -0x8(%R10,%RSI,8),%YMM18 |
(120) 0x4251a2 VMOVUPD (%R10,%RSI,8),%YMM21 |
(120) 0x4251a9 VSUBPD %YMM8,%YMM5,%YMM22 |
(120) 0x4251af VSUBPD %YMM21,%YMM18,%YMM23 |
(120) 0x4251b5 VFMADD213PD %YMM19,%YMM2,%YMM22 |
(120) 0x4251bb VFMADD231PD %YMM23,%YMM7,%YMM22 |
(120) 0x4251c1 VFMADD213PD (%RBX,%RSI,8),%YMM1,%YMM22 |
(120) 0x4251c8 VMOVUPD %YMM22,(%R11,%RSI,8) |
(120) 0x4251cf VSUBPD %YMM8,%YMM21,%YMM2 |
(120) 0x4251d5 VSUBPD %YMM5,%YMM18,%YMM5 |
(120) 0x4251db VFMADD213PD %YMM4,%YMM20,%YMM2 |
(120) 0x4251e1 VFMADD231PD %YMM5,%YMM6,%YMM2 |
(120) 0x4251e6 VFMADD213PD (%R13,%RSI,8),%YMM1,%YMM2 |
(120) 0x4251ed VMOVUPD %YMM2,(%R12,%RSI,8) |
(120) 0x4251f3 ADD $0x4,%RSI |
(120) 0x4251f7 CMP 0x20(%RSP),%RSI |
(120) 0x4251fc JB 4250e0 |
(119) 0x425202 MOV 0x20(%RSP),%RCX |
(119) 0x425207 MOV %RCX,%RAX |
(119) 0x42520a CMP 0x170(%RSP),%RCX |
(119) 0x425212 MOV 0x2c(%RSP),%R12D |
(119) 0x425217 MOV 0x50(%RSP),%R15D |
(119) 0x42521c MOV 0x108(%RSP),%R13 |
(119) 0x425224 MOV 0x218(%RSP),%R11 |
(119) 0x42522c MOV 0x210(%RSP),%RBX |
(119) 0x425234 MOV 0x208(%RSP),%RDI |
(119) 0x42523c MOV 0x200(%RSP),%R9 |
(119) 0x425244 MOV 0x1f8(%RSP),%R10 |
(119) 0x42524c MOV 0x1f0(%RSP),%R14 |
(119) 0x425254 JNE 424a4e |
(119) 0x42525a JMP 424e00 |
0x42525f NOP |
Path / |
Source file and lines | accelerate_kernel.f90:57-79 |
Module | exec |
nb instructions | 202 |
nb uops | 203 |
loop length | 993 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 1 |
used ymm registers | 3 |
used zmm registers | 0 |
nb stack references | 76 |
micro-operation queue | 33.83 cycles |
front end | 33.83 cycles |
| ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 18.50 | 18.50 | 18.25 | 18.25 | 3.50 | 32.00 | 32.00 | 32.00 | 0.00 | 1.00 | 1.00 | 0.00 | 0.50 | 0.50 |
cycles | 18.50 | 18.50 | 18.25 | 18.25 | 3.50 | 32.00 | 32.00 | 32.00 | 0.00 | 1.00 | 1.00 | 0.00 | 0.50 | 0.50 |
Cycles executing div or sqrt instructions | NA |
Front-end | 33.83 |
Dispatch | 32.00 |
Overall L1 | 33.83 |
all | 2% |
load | 0% |
store | 2% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 3% |
all | 0% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 2% |
load | 0% |
store | 2% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 3% |
all | 11% |
load | 11% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 6% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 12% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 11% |
load | 11% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 6% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 11% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
AND $-0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB $0x480,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R9,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RCX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xc0(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,0x1e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0xb8(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,0x1d8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0xb0(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,0x1d0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0xa8(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,0x1c8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0xa0(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,0x1c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x98(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,0x1b8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x60(%RBP),%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x58(%RBP),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %EBX,%EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
INC %EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV 0x90(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,0x1b0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x88(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,0x1a8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x80(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,0x1a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x78(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,0x198(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x70(%RBP),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x68(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x50(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x48(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x40(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x38(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x30(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x28(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x20(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x18(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVL $0,0x5c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
JS 42474f <accelerate_kernel_module_mp_accelerate_kernel_.DIR.OMP.PARALLEL.2+0x1bf> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %R9,0x8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R8,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDI,0x110(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVL $0,0x34(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %EAX,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVL $0x1,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x60(%RSP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x64(%RSP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x3c(%RSP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x38(%RSP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x53b290,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %ESI,0x54(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CALL 404670 <__kmpc_for_static_init_4@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV 0x34(%RSP),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x30(%RSP),%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %EAX,%R12D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JAE 424769 <accelerate_kernel_module_mp_accelerate_kernel_.DIR.OMP.PARALLEL.2+0x1d9> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV $0x53b2b0,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV 0x4c(%RSP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 404230 <__kmpc_for_static_fini@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x110(%RSP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV $0x53b2d0,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x28(%RBP),%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
JMP 404740 <__kmpc_barrier@plt> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
MOV %RAX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVQ %R14,%XMM0 | 1 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
MOV %R15,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAL $0x20,%R9 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV $-0x200000000,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
LEA (%R9,%RAX,1),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RCX,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAR $0x20,%R10 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RSP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SAL $0x20,%RDX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD %RDX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAR $0x20,%R11 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD %EBX,%R8D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVSXD (%R13),%RBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV 0x8(%RSP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RDX),%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %EBX,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x1(%RDX),%ESI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %ESI,0x54(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
ADD $0x2,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP $0x2,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x1,%R15D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVGE %EDX,%R15D | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R15D,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
AND $0x7ffffffc,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDX,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
TEST %RCX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $-0x1,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVNS %RCX,%RDX | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %RDX,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x1,%ESI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVG %RSI,%RDX | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV $0x200000000,%R13 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SUB %R9,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP %RDI,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVG %RCX,%RDI | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R11,0xb8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
NOT %R11 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R11,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VPBROADCASTQ %XMM0,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R15,0x170(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VPBROADCASTQ %R15,%YMM1 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
VMOVDQA %YMM1,0x220(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
SHR $0x20,%RDI | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IMUL %RDX,%RDI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RBX,0x180(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
LEA (,%RBX,8),%R11 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SAL $0x3,%RDI | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB %RDI,%R11 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $-0x1,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
TEST %RAX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVNS %RAX,%RCX | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %RCX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVG %RSI,%RCX | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R10,0x188(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
NOT %R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R10,0x178(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB %R14,%R13 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV 0x90(%RSP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD %R11,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDX,0x158(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CMP %R13,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVG %RAX,%R13 | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV 0x88(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD %R11,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,0x150(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SHR $0x20,%R13 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IMUL %RCX,%R13 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
NEG %R13 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R13,0x168(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x80(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD %R11,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,0x148(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x98(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
LEA (%RAX,%R11,1),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,0x140(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x78(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
LEA (%RAX,%R11,1),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,0x138(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0xa8(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
LEA (%RAX,%R11,1),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,0x130(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x68(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD %R11,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,0x128(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x60(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD %R11,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,0x120(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x70(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD %R11,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,0x118(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
ADD 0xa0(%RSP),%R11 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV %R11,0x160(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD 0xd4261(%RIP),%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
XOR %R13D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R8,0x190(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R8D,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R12D,0x2c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
JMP 424e13 <accelerate_kernel_module_mp_accelerate_kernel_.DIR.OMP.PARALLEL.2+0x883> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
Source file and lines | accelerate_kernel.f90:57-79 |
Module | exec |
nb instructions | 202 |
nb uops | 203 |
loop length | 993 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 1 |
used ymm registers | 3 |
used zmm registers | 0 |
nb stack references | 76 |
micro-operation queue | 33.83 cycles |
front end | 33.83 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 18.50 | 18.50 | 18.25 | 18.25 | 3.50 | 32.00 | 32.00 | 32.00 | 0.00 | 1.00 | 1.00 | 0.00 | 0.50 | 0.50 |
cycles | 18.50 | 18.50 | 18.25 | 18.25 | 3.50 | 32.00 | 32.00 | 32.00 | 0.00 | 1.00 | 1.00 | 0.00 | 0.50 | 0.50 |
Cycles executing div or sqrt instructions | NA |
Front-end | 33.83 |
Dispatch | 32.00 |
Overall L1 | 33.83 |
all | 2% |
load | 0% |
store | 2% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 3% |
all | 0% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 2% |
load | 0% |
store | 2% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 3% |
all | 11% |
load | 11% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 6% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 12% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 11% |
load | 11% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 6% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 11% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
AND $-0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB $0x480,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R9,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RCX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xc0(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,0x1e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0xb8(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,0x1d8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0xb0(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,0x1d0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0xa8(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,0x1c8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0xa0(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,0x1c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x98(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RAX,0x1b8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x60(%RBP),%EBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x58(%RBP),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %EBX,%EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
INC %EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV 0x90(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,0x1b0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x88(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,0x1a8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x80(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,0x1a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x78(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,0x198(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x70(%RBP),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x68(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x50(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x48(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x40(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x38(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x30(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x28(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x20(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x18(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x10(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVL $0,0x5c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
JS 42474f <accelerate_kernel_module_mp_accelerate_kernel_.DIR.OMP.PARALLEL.2+0x1bf> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %R9,0x8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R8,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDI,0x110(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVL $0,0x34(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %EAX,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVL $0x1,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x60(%RSP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x64(%RSP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x3c(%RSP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x38(%RSP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x53b290,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %ESI,0x54(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CALL 404670 <__kmpc_for_static_init_4@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV 0x34(%RSP),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x30(%RSP),%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %EAX,%R12D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JAE 424769 <accelerate_kernel_module_mp_accelerate_kernel_.DIR.OMP.PARALLEL.2+0x1d9> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV $0x53b2b0,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV 0x4c(%RSP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
VZEROUPPER | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 404230 <__kmpc_for_static_fini@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x110(%RSP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV $0x53b2d0,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x28(%RBP),%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
JMP 404740 <__kmpc_barrier@plt> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
MOV %RAX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVQ %R14,%XMM0 | 1 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
MOV %R15,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAL $0x20,%R9 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV $-0x200000000,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
LEA (%R9,%RAX,1),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RCX,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAR $0x20,%R10 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RSP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SAL $0x20,%RDX | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD %RDX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAR $0x20,%R11 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD %EBX,%R8D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVSXD (%R13),%RBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV 0x8(%RSP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RDX),%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %EBX,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA 0x1(%RDX),%ESI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %ESI,0x54(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
ADD $0x2,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP $0x2,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x1,%R15D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVGE %EDX,%R15D | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R15D,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
AND $0x7ffffffc,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDX,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
TEST %RCX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $-0x1,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVNS %RCX,%RDX | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %RDX,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x1,%ESI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVG %RSI,%RDX | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV $0x200000000,%R13 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV %R13,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SUB %R9,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP %RDI,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVG %RCX,%RDI | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R11,0xb8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
NOT %R11 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R11,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VPBROADCASTQ %XMM0,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R15,0x170(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VPBROADCASTQ %R15,%YMM1 | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 1 |
VMOVDQA %YMM1,0x220(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 4 | 1 |
SHR $0x20,%RDI | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IMUL %RDX,%RDI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RBX,0x180(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
LEA (,%RBX,8),%R11 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SAL $0x3,%RDI | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB %RDI,%R11 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $-0x1,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
TEST %RAX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVNS %RAX,%RCX | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %RCX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVG %RSI,%RCX | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R10,0x188(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
NOT %R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R10,0x178(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB %R14,%R13 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV 0x90(%RSP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD %R11,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDX,0x158(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CMP %R13,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVG %RAX,%R13 | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV 0x88(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD %R11,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,0x150(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SHR $0x20,%R13 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IMUL %RCX,%R13 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
NEG %R13 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R13,0x168(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x80(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD %R11,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,0x148(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x98(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
LEA (%RAX,%R11,1),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,0x140(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x78(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
LEA (%RAX,%R11,1),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,0x138(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0xa8(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
LEA (%RAX,%R11,1),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,0x130(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x68(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD %R11,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,0x128(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x60(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD %R11,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,0x120(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x70(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD %R11,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,0x118(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
ADD 0xa0(%RSP),%R11 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV %R11,0x160(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
VBROADCASTSD 0xd4261(%RIP),%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
XOR %R13D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R8,0x190(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R8D,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R12D,0x2c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
JMP 424e13 <accelerate_kernel_module_mp_accelerate_kernel_.DIR.OMP.PARALLEL.2+0x883> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼accelerate_kernel_.DIR.OMP.PARALLEL.2– | 5.15 | 2.67 |
▼Loop 119 - accelerate_kernel.f90:60-76 - exec– | 0.04 | 0.02 |
○Loop 120 - accelerate_kernel.f90:62-76 - exec | 5.11 | 2.64 |