Function: viscosity_kernel_.DIR.OMP.PARALLEL.2 | Module: exec | Source: viscosity_kernel.f90:50-94 | Coverage: 2.17% |
---|
Function: viscosity_kernel_.DIR.OMP.PARALLEL.2 | Module: exec | Source: viscosity_kernel.f90:50-94 | Coverage: 2.17% |
---|
/scratch_na/users/xoserete/qaas_runs/171-215-0463/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/viscosity_kernel.f90: 50 - 94 |
-------------------------------------------------------------------------------- |
50: !$OMP PARALLEL |
51: |
52: !$OMP DO PRIVATE(ugrad,vgrad,div,strain2,pgradx,pgrady,pgradx2,pgrady2,limiter,pgrad,xgrad,ygrad,grad,grad2,dirx,diry) |
53: DO k=y_min,y_max |
54: !$OMP SIMD |
55: DO j=x_min,x_max |
56: ugrad=(xvel0(j+1,k )+xvel0(j+1,k+1))-(xvel0(j ,k )+xvel0(j ,k+1)) |
57: |
58: vgrad=(yvel0(j ,k+1)+yvel0(j+1,k+1))-(yvel0(j ,k )+yvel0(j+1,k )) |
59: |
60: div = (celldx(j)*(ugrad)+ celldy(k)*(vgrad)) |
61: |
62: strain2 = 0.5_8*(xvel0(j, k+1) + xvel0(j+1,k+1)-xvel0(j ,k )-xvel0(j+1,k ))/celldy(k) & |
63: + 0.5_8*(yvel0(j+1,k ) + yvel0(j+1,k+1)-yvel0(j ,k )-yvel0(j ,k+1))/celldx(j) |
64: |
65: pgradx=(pressure(j+1,k)-pressure(j-1,k))/(celldx(j)+celldx(j+1)) |
66: pgrady=(pressure(j,k+1)-pressure(j,k-1))/(celldy(k)+celldy(k+1)) |
67: |
68: pgradx2 = pgradx*pgradx |
69: pgrady2 = pgrady*pgrady |
70: |
71: limiter = ((0.5_8*(ugrad)/celldx(j))*pgradx2+(0.5_8*(vgrad)/celldy(k))*pgrady2+strain2*pgradx*pgrady) & |
72: /MAX(pgradx2+pgrady2,1.0e-16_8) |
73: |
74: IF ((limiter.GT.0.0).OR.(div.GE.0.0))THEN |
75: viscosity(j,k) = 0.0 |
76: ELSE |
77: dirx=1.0_8 |
78: IF(pgradx.LT.0.0) dirx=-1.0_8 |
79: pgradx = dirx*MAX(1.0e-16_8,ABS(pgradx)) |
80: diry=1.0_8 |
81: IF(pgradx.LT.0.0) diry=-1.0_8 |
82: pgrady = diry*MAX(1.0e-16_8,ABS(pgrady)) |
83: pgrad = SQRT(pgradx**2+pgrady**2) |
84: xgrad = ABS(celldx(j)*pgrad/pgradx) |
85: ygrad = ABS(celldy(k)*pgrad/pgrady) |
86: grad = MIN(xgrad,ygrad) |
87: grad2 = grad*grad |
88: |
89: viscosity(j,k)=2.0_8*density0(j,k)*grad2*limiter*limiter |
90: ENDIF |
91: |
92: ENDDO |
93: ENDDO |
94: !$OMP END DO |
0x46b120 PUSH %RBP |
0x46b121 MOV %RSP,%RBP |
0x46b124 PUSH %R15 |
0x46b126 PUSH %R14 |
0x46b128 PUSH %R13 |
0x46b12a PUSH %R12 |
0x46b12c PUSH %RBX |
0x46b12d AND $-0x20,%RSP |
0x46b131 SUB $0x300,%RSP |
0x46b138 MOV %R9,0x30(%RSP) |
0x46b13d MOV %R8,0x28(%RSP) |
0x46b142 MOV 0x40(%RBP),%EBX |
0x46b145 MOV 0x38(%RBP),%EAX |
0x46b148 SUB %EBX,%EAX |
0x46b14a MOVL $0,0x24(%RSP) |
0x46b152 JS 46b1cf |
0x46b154 MOV %RCX,%R12 |
0x46b157 MOV %RDX,%R13 |
0x46b15a MOV %RDI,0x48(%RSP) |
0x46b15f MOV (%RDI),%ESI |
0x46b161 MOVL $0,0x10(%RSP) |
0x46b169 MOV %EAX,0xc(%RSP) |
0x46b16d MOVL $0x1,0x20(%RSP) |
0x46b175 SUB $0x8,%RSP |
0x46b179 LEA 0x28(%RSP),%RAX |
0x46b17e LEA 0x2c(%RSP),%RCX |
0x46b183 LEA 0x18(%RSP),%R8 |
0x46b188 LEA 0x14(%RSP),%R9 |
0x46b18d MOV $0x73d630,%EDI |
0x46b192 MOV %ESI,0x1c(%RSP) |
0x46b196 MOV $0x22,%EDX |
0x46b19b PUSH $0x1 |
0x46b19d PUSH $0x1 |
0x46b19f PUSH %RAX |
0x46b1a0 CALL 404520 <__kmpc_for_static_init_4@plt> |
0x46b1a5 ADD $0x20,%RSP |
0x46b1a9 MOV 0x10(%RSP),%EAX |
0x46b1ad MOV 0xc(%RSP),%ECX |
0x46b1b1 SUB %EAX,%ECX |
0x46b1b3 MOV %ECX,0x18(%RSP) |
0x46b1b7 JAE 46b1ea |
0x46b1b9 MOV $0x73d650,%EDI |
0x46b1be MOV 0x14(%RSP),%ESI |
0x46b1c2 VZEROUPPER |
0x46b1c5 CALL 404110 <__kmpc_for_static_fini@plt> |
0x46b1ca MOV 0x48(%RSP),%RDI |
0x46b1cf MOV (%RDI),%ESI |
0x46b1d1 MOV $0x73d670,%EDI |
0x46b1d6 CALL 4045e0 <__kmpc_barrier@plt> |
0x46b1db LEA -0x28(%RBP),%RSP |
0x46b1df POP %RBX |
0x46b1e0 POP %R12 |
0x46b1e2 POP %R13 |
0x46b1e4 POP %R14 |
0x46b1e6 POP %R15 |
0x46b1e8 POP %RBP |
0x46b1e9 RET |
0x46b1ea MOV %RAX,%RDI |
0x46b1ed MOV 0x50(%RBP),%RDX |
0x46b1f1 MOV 0x48(%RBP),%RSI |
0x46b1f5 SAL $0x20,%R12 |
0x46b1f9 MOV $-0x200000000,%RAX |
0x46b203 LEA (%R12,%RAX,1),%RCX |
0x46b207 MOV %RCX,%R8 |
0x46b20a SAR $0x20,%R8 |
0x46b20e SAL $0x20,%R13 |
0x46b212 ADD %R13,%RAX |
0x46b215 MOV %RAX,%R9 |
0x46b218 SAR $0x20,%R9 |
0x46b21c MOVSXD (%RDX),%R10 |
0x46b21f MOV (%RSI),%EDX |
0x46b221 SUB %R10D,%EDX |
0x46b224 ADD %EBX,%EDI |
0x46b226 MOV %RDX,0x130(%RSP) |
0x46b22e INC %EDX |
0x46b230 CMP $0x2,%EDX |
0x46b233 MOV $0x1,%ESI |
0x46b238 CMOVGE %EDX,%ESI |
0x46b23b MOV %RSI,0x38(%RSP) |
0x46b240 AND $0x7ffffffc,%ESI |
0x46b246 MOV %RSI,0xd8(%RSP) |
0x46b24e TEST %RCX,%RCX |
0x46b251 MOV $-0x1,%RSI |
0x46b258 CMOVNS %RCX,%RSI |
0x46b25c TEST %RSI,%RSI |
0x46b25f MOV $0x1,%R11D |
0x46b265 CMOVG %R11,%RSI |
0x46b269 MOV $0x200000000,%RBX |
0x46b273 MOV %RBX,%RDX |
0x46b276 SUB %R12,%RDX |
0x46b279 CMP %RDX,%RCX |
0x46b27c CMOVG %RCX,%RDX |
0x46b280 LEA (,%R10,8),%RCX |
0x46b288 SHR $0x20,%RDX |
0x46b28c IMUL %RSI,%RDX |
0x46b290 MOV $-0x1,%RSI |
0x46b297 SAL $0x3,%RDX |
0x46b29b SUB %RDX,%RCX |
0x46b29e TEST %RAX,%RAX |
0x46b2a1 CMOVNS %RAX,%RSI |
0x46b2a5 TEST %RSI,%RSI |
0x46b2a8 CMOVG %R11,%RSI |
0x46b2ac SUB %R13,%RBX |
0x46b2af MOV 0x30(%RBP),%R14 |
0x46b2b3 CMP %RBX,%RAX |
0x46b2b6 CMOVG %RAX,%RBX |
0x46b2ba MOV %R8,%RAX |
0x46b2bd NOT %RAX |
0x46b2c0 MOV %RAX,0xa8(%RSP) |
0x46b2c8 SHR $0x20,%RBX |
0x46b2cc IMUL %RSI,%RBX |
0x46b2d0 NEG %RBX |
0x46b2d3 MOV %RBX,0xc8(%RSP) |
0x46b2db MOV $0x8,%ESI |
0x46b2e0 SUB %RDX,%RSI |
0x46b2e3 MOV %R9,%RAX |
0x46b2e6 NOT %RAX |
0x46b2e9 MOV %RAX,0xc0(%RSP) |
0x46b2f1 MOV %R9,0xe0(%RSP) |
0x46b2f9 SUB %R9,%R11 |
0x46b2fc MOV %R11,0xd0(%RSP) |
0x46b304 MOV 0x20(%RBP),%RAX |
0x46b308 MOV 0x18(%RBP),%R9 |
0x46b30c MOV 0x10(%RBP),%RDX |
0x46b310 LEA 0x8(%R9,%RCX,1),%R11 |
0x46b315 MOV %R11,0x78(%RSP) |
0x46b31a ADD %RCX,%RDX |
0x46b31d MOV %RDX,0x70(%RSP) |
0x46b322 LEA (%RAX,%RCX,1),%RAX |
0x46b326 MOV %RAX,0x68(%RSP) |
0x46b32b LEA (%R9,%RCX,1),%RAX |
0x46b32f MOV %RAX,0x60(%RSP) |
0x46b334 LEA 0x8(%R14,%RCX,1),%RAX |
0x46b339 MOV %RAX,0x158(%RSP) |
0x46b341 MOV 0x28(%RSP),%RDX |
0x46b346 LEA 0x8(%RDX,%RCX,1),%RAX |
0x46b34b MOV %RAX,0x58(%RSP) |
0x46b350 MOV 0x30(%RSP),%RAX |
0x46b355 LEA 0x8(%RAX,%RCX,1),%RCX |
0x46b35a MOV %RCX,0x50(%RSP) |
0x46b35f MOV %R10,0xb0(%RSP) |
0x46b367 MOV %R8,0xb8(%RSP) |
0x46b36f SUB %R8,%R10 |
0x46b372 MOV %R10,0x98(%RSP) |
0x46b37a LEA (%R14,%RSI,1),%RCX |
0x46b37e MOV %RCX,0x90(%RSP) |
0x46b386 LEA (%R9,%RSI,1),%RCX |
0x46b38a MOV %RCX,0x88(%RSP) |
0x46b392 LEA (%RDX,%RSI,1),%RCX |
0x46b396 MOV %RCX,0x80(%RSP) |
0x46b39e ADD %RAX,%RSI |
0x46b3a1 MOV %RSI,0xa0(%RSP) |
0x46b3a9 VMOVSD 0x89d0d(%RIP),%XMM21 |
0x46b3b3 VMOVSD 0x8a9e3(%RIP),%XMM22 |
0x46b3bd VMOVSD 0xa7651(%RIP),%XMM23 |
0x46b3c7 VMOVSD 0xa764f(%RIP),%XMM25 |
0x46b3d1 VBROADCASTSD 0x89ce6(%RIP),%YMM14 |
0x46b3da VXORPD %XMM18,%XMM18,%XMM18 |
0x46b3e0 XOR %R9D,%R9D |
0x46b3e3 MOV %RDI,0xe8(%RSP) |
0x46b3eb MOV %EDI,%ESI |
0x46b3ed JMP 46b40e |
0x46b3ef NOP |
(1026) 0x46b3f0 MOV 0x150(%RSP),%RCX |
(1026) 0x46b3f8 LEA 0x1(%RCX),%EAX |
(1026) 0x46b3fb MOV 0x1c(%RSP),%ESI |
(1026) 0x46b3ff INC %ESI |
(1026) 0x46b401 CMP 0x18(%RSP),%ECX |
(1026) 0x46b405 MOV %EAX,%R9D |
(1026) 0x46b408 JE 46b1b9 |
(1026) 0x46b40e CMPL $0,0x130(%RSP) |
(1026) 0x46b416 MOV %ESI,0x1c(%RSP) |
(1026) 0x46b41a MOV %R9,0x150(%RSP) |
(1026) 0x46b422 JS 46b3f0 |
(1026) 0x46b424 MOVSXD %ESI,%R8 |
(1026) 0x46b427 MOV 0xc8(%RSP),%RAX |
(1026) 0x46b42f LEA (%RAX,%R8,1),%RBX |
(1026) 0x46b433 MOV 0xc0(%RSP),%RAX |
(1026) 0x46b43b LEA (%RAX,%R8,1),%R13 |
(1026) 0x46b43f ADD 0xd0(%RSP),%R8 |
(1026) 0x46b447 MOV 0xe8(%RSP),%RCX |
(1026) 0x46b44f LEA (%RCX,%R9,1),%EAX |
(1026) 0x46b453 MOVSXD %EAX,%R10 |
(1026) 0x46b456 MOV 0xe0(%RSP),%RDX |
(1026) 0x46b45e SUB %RDX,%R10 |
(1026) 0x46b461 LEA (%RCX,%R9,1),%EAX |
(1026) 0x46b465 INC %EAX |
(1026) 0x46b467 CLTQ |
(1026) 0x46b469 SUB %RDX,%RAX |
(1026) 0x46b46c MOV 0x58(%RBP),%RCX |
(1026) 0x46b470 MOV (%RCX),%R15 |
(1026) 0x46b473 MOV 0x28(%RBP),%RDX |
(1026) 0x46b477 VMOVSD (%RDX,%R10,8),%XMM20 |
(1026) 0x46b47e MOV 0x60(%RBP),%RCX |
(1026) 0x46b482 MOV (%RCX),%R14 |
(1026) 0x46b485 MOV 0x68(%RBP),%RCX |
(1026) 0x46b489 MOV (%RCX),%R11 |
(1026) 0x46b48c VADDSD (%RDX,%RAX,8),%XMM20,%XMM1 |
(1026) 0x46b493 MOV 0x70(%RBP),%RAX |
(1026) 0x46b497 MOV (%RAX),%R12 |
(1026) 0x46b49a MOV 0xd8(%RSP),%RDI |
(1026) 0x46b4a2 TEST %RDI,%RDI |
(1026) 0x46b4a5 VMOVAPD %XMM20,0x170(%RSP) |
(1026) 0x46b4ad MOV %R8,0x148(%RSP) |
(1026) 0x46b4b5 MOV %R12,0x140(%RSP) |
(1026) 0x46b4bd MOV %R14,0x138(%RSP) |
(1026) 0x46b4c5 JE 46bc20 |
(1026) 0x46b4cb VMOVAPD %XMM8,0x1f0(%RSP) |
(1026) 0x46b4d4 VBROADCASTSD %XMM8,%YMM4 |
(1026) 0x46b4d9 VMOVAPD %XMM26,0x1e0(%RSP) |
(1026) 0x46b4e1 VBROADCASTSD %XMM26,%YMM17 |
(1026) 0x46b4e7 VMOVAPD %XMM27,0x1d0(%RSP) |
(1026) 0x46b4ef VBROADCASTSD %XMM27,%YMM16 |
(1026) 0x46b4f5 VMOVAPD %XMM28,0x1c0(%RSP) |
(1026) 0x46b4fd VBROADCASTSD %XMM28,%YMM15 |
(1026) 0x46b503 VMOVAPD %XMM31,0x1b0(%RSP) |
(1026) 0x46b50b VBROADCASTSD %XMM31,%YMM19 |
(1026) 0x46b511 VMOVAPD %XMM29,0x160(%RSP) |
(1026) 0x46b519 VBROADCASTSD %XMM29,%YMM0 |
(1026) 0x46b51f VMOVAPD %XMM30,0x1a0(%RSP) |
(1026) 0x46b527 VBROADCASTSD %XMM30,%YMM27 |
(1026) 0x46b52d MOV %R15,%RAX |
(1026) 0x46b530 IMUL %R10,%RAX |
(1026) 0x46b534 MOV %RAX,0x100(%RSP) |
(1026) 0x46b53c LEA 0x1(%R10),%RCX |
(1026) 0x46b540 MOV %R15,%RAX |
(1026) 0x46b543 IMUL %RCX,%RAX |
(1026) 0x46b547 MOV %RAX,0x108(%RSP) |
(1026) 0x46b54f IMUL %R14,%RCX |
(1026) 0x46b553 MOV %RCX,0xf8(%RSP) |
(1026) 0x46b55b MOV %R14,%RAX |
(1026) 0x46b55e IMUL %R10,%RAX |
(1026) 0x46b562 MOV %RAX,0xf0(%RSP) |
(1026) 0x46b56a VBROADCASTSD %XMM20,%YMM24 |
(1026) 0x46b570 VDIVSD %XMM20,%XMM21,%XMM2 |
(1026) 0x46b576 VBROADCASTSD %XMM2,%YMM26 |
(1026) 0x46b57c IMUL %R11,%R10 |
(1026) 0x46b580 MOV %R10,0x40(%RSP) |
(1026) 0x46b585 VMOVSD %XMM1,0x118(%RSP) |
(1026) 0x46b58e VDIVSD %XMM1,%XMM21,%XMM2 |
(1026) 0x46b594 VBROADCASTSD %XMM2,%YMM1 |
(1026) 0x46b599 VMOVAPD %YMM1,0x180(%RSP) |
(1026) 0x46b5a2 MOV %R11,%RAX |
(1026) 0x46b5a5 IMUL %RBX,%RAX |
(1026) 0x46b5a9 ADD 0x78(%RSP),%RAX |
(1026) 0x46b5ae IMUL %RBX,%R12 |
(1026) 0x46b5b2 ADD 0x70(%RSP),%R12 |
(1026) 0x46b5b7 MOV %R11,%RDX |
(1026) 0x46b5ba MOV %R13,0x128(%RSP) |
(1026) 0x46b5c2 IMUL %R13,%R11 |
(1026) 0x46b5c6 MOV 0x60(%RSP),%RCX |
(1026) 0x46b5cb ADD %RCX,%R11 |
(1026) 0x46b5ce MOV %R15,%R10 |
(1026) 0x46b5d1 MOV %RDX,0x110(%RSP) |
(1026) 0x46b5d9 MOV %RDX,%R15 |
(1026) 0x46b5dc IMUL %R8,%R15 |
(1026) 0x46b5e0 ADD %RCX,%R15 |
(1026) 0x46b5e3 MOV %R14,%RSI |
(1026) 0x46b5e6 IMUL %RBX,%RSI |
(1026) 0x46b5ea MOV 0x58(%RSP),%RCX |
(1026) 0x46b5ef ADD %RCX,%RSI |
(1026) 0x46b5f2 MOV %R14,%RDX |
(1026) 0x46b5f5 IMUL %R8,%RDX |
(1026) 0x46b5f9 ADD %RCX,%RDX |
(1026) 0x46b5fc MOV %R10,%R14 |
(1026) 0x46b5ff IMUL %R8,%R14 |
(1026) 0x46b603 MOV 0x50(%RSP),%RCX |
(1026) 0x46b608 ADD %RCX,%R14 |
(1026) 0x46b60b MOV %R10,0x120(%RSP) |
(1026) 0x46b613 MOV %RBX,%R8 |
(1026) 0x46b616 IMUL %RBX,%R10 |
(1026) 0x46b61a ADD %RCX,%R10 |
(1026) 0x46b61d VPCMPEQD %YMM7,%YMM7,%YMM7 |
(1026) 0x46b621 XOR %R13D,%R13D |
(1026) 0x46b624 VPCMPEQD %YMM12,%YMM12,%YMM12 |
(1026) 0x46b629 VPCMPEQD %YMM11,%YMM11,%YMM11 |
(1026) 0x46b62e VPCMPEQD %YMM3,%YMM3,%YMM3 |
(1026) 0x46b632 VPCMPEQD %YMM6,%YMM6,%YMM6 |
(1026) 0x46b636 VPCMPEQD %YMM9,%YMM9,%YMM9 |
(1026) 0x46b63b VPCMPEQD %YMM5,%YMM5,%YMM5 |
(1026) 0x46b63f MOV 0x68(%RSP),%R9 |
(1026) 0x46b644 VMOVAPD %YMM14,%YMM18 |
(1026) 0x46b64a VBROADCASTSD 0xa73c5(%RIP),%YMM8 |
(1026) 0x46b653 VXORPD %XMM28,%XMM28,%XMM28 |
(1026) 0x46b659 JMP 46b7c9 |
0x46b65e XCHG %AX,%AX |
(1028) 0x46b660 VCMPPD $0x1,%YMM13,%YMM22,%K3 |
(1028) 0x46b667 VBROADCASTSD 0xa73b0(%RIP),%YMM8 |
(1028) 0x46b670 VBLENDMPD %YMM8,%YMM18,%YMM31{%K3} |
(1028) 0x46b676 VBROADCASTSD 0x898c8(%RIP),%YMM29 |
(1028) 0x46b680 VANDPD %YMM29,%YMM22,%YMM1 |
(1028) 0x46b686 VMAXPD %YMM1,%YMM14,%YMM1 |
(1028) 0x46b68a VMULPD %YMM31,%YMM1,%YMM1 |
(1028) 0x46b690 VCMPPD $0x1,%YMM13,%YMM1,%K3 |
(1028) 0x46b697 VBLENDMPD %YMM8,%YMM18,%YMM25{%K3} |
(1028) 0x46b69d VANDPD %YMM29,%YMM21,%YMM13 |
(1028) 0x46b6a3 VMAXPD %YMM13,%YMM14,%YMM13 |
(1028) 0x46b6a8 VMULPD %YMM25,%YMM13,%YMM13 |
(1028) 0x46b6ae VMULPD %YMM1,%YMM1,%YMM20 |
(1028) 0x46b6b4 VFMADD231PD %YMM13,%YMM13,%YMM20 |
(1028) 0x46b6ba VXORPD %XMM28,%XMM28,%XMM28 |
(1028) 0x46b6c0 VSQRTPD %YMM20,%YMM23 |
(1028) 0x46b6c6 VMULPD %YMM2,%YMM23,%YMM2 |
(1028) 0x46b6cc VDIVPD %YMM1,%YMM2,%YMM1 |
(1028) 0x46b6d0 VANDPD %YMM29,%YMM1,%YMM22 |
(1028) 0x46b6d6 VMULPD %YMM24,%YMM23,%YMM1 |
(1028) 0x46b6dc VDIVPD %YMM13,%YMM1,%YMM1 |
(1028) 0x46b6e1 VANDPD %YMM29,%YMM1,%YMM21 |
(1028) 0x46b6e7 VCMPPD $0x2,%YMM21,%YMM22,%K3 |
(1028) 0x46b6ee VBLENDMPD %YMM22,%YMM21,%YMM30{%K3} |
(1028) 0x46b6f4 VMULPD %YMM30,%YMM30,%YMM29 |
(1028) 0x46b6fa VMULPD %YMM10,%YMM10,%YMM1 |
(1028) 0x46b6ff IMUL %R8,%RCX |
(1028) 0x46b703 ADD %R9,%RCX |
(1028) 0x46b706 VMOVUPD (%RCX,%R13,8),%YMM2{%K2}{z} |
(1028) 0x46b70d VADDPD %YMM29,%YMM29,%YMM10 |
(1028) 0x46b713 VMULPD %YMM2,%YMM1,%YMM1 |
(1028) 0x46b717 VMULPD %YMM1,%YMM10,%YMM1 |
(1028) 0x46b71b VPBROADCASTQ %R13,%YMM2 |
(1028) 0x46b721 VPADDQ 0x89637(%RIP),%YMM2,%YMM2 |
(1028) 0x46b729 VPBLENDMQ %YMM5,%YMM2,%YMM5{%K1} |
(1028) 0x46b72f VMOVAPD %YMM4,%YMM31{%K1} |
(1028) 0x46b735 VPBLENDMQ %YMM9,%YMM2,%YMM9{%K1} |
(1028) 0x46b73b VMOVAPD %YMM17,%YMM25{%K1} |
(1028) 0x46b741 VPBLENDMQ %YMM6,%YMM2,%YMM6{%K1} |
(1028) 0x46b747 VMOVAPD %YMM16,%YMM23{%K1} |
(1028) 0x46b74d VPBLENDMQ %YMM3,%YMM2,%YMM3{%K1} |
(1028) 0x46b753 VMOVAPD %YMM15,%YMM22{%K1} |
(1028) 0x46b759 VPBLENDMQ %YMM11,%YMM2,%YMM11{%K1} |
(1028) 0x46b75f VMOVAPD %YMM19,%YMM21{%K1} |
(1028) 0x46b765 VPBLENDMQ %YMM12,%YMM2,%YMM12{%K1} |
(1028) 0x46b76b VMOVAPD %YMM0,%YMM30{%K1} |
(1028) 0x46b771 VMOVDQA64 %YMM7,%YMM2{%K1} |
(1028) 0x46b777 VMOVAPD %YMM27,%YMM29{%K1} |
(1028) 0x46b77d VMOVAPD %YMM28,%YMM1{%K1} |
(1028) 0x46b783 VMOVUPD %YMM1,(%R12,%R13,8) |
(1028) 0x46b789 ADD $0x4,%R13 |
(1028) 0x46b78d VMOVDQA %YMM2,%YMM7 |
(1028) 0x46b791 VMOVAPD %YMM29,%YMM27 |
(1028) 0x46b797 VMOVAPD %YMM30,%YMM0 |
(1028) 0x46b79d VMOVAPD %YMM21,%YMM19 |
(1028) 0x46b7a3 VMOVAPD %YMM22,%YMM15 |
(1028) 0x46b7a9 VMOVAPD %YMM23,%YMM16 |
(1028) 0x46b7af VMOVAPD %YMM25,%YMM17 |
(1028) 0x46b7b5 VMOVAPD %YMM31,%YMM4 |
(1028) 0x46b7bb CMP %RDI,%R13 |
(1028) 0x46b7be VMOVAPD %YMM14,%YMM8 |
(1028) 0x46b7c3 JAE 46b960 |
(1028) 0x46b7c9 VMOVUPD -0x8(%R10,%R13,8),%YMM10 |
(1028) 0x46b7d0 VMOVUPD (%R10,%R13,8),%YMM21 |
(1028) 0x46b7d7 VMOVUPD -0x8(%R14,%R13,8),%YMM22 |
(1028) 0x46b7e2 VMOVUPD (%R14,%R13,8),%YMM23 |
(1028) 0x46b7e9 VADDPD %YMM21,%YMM23,%YMM2 |
(1028) 0x46b7ef VADDPD %YMM22,%YMM10,%YMM25 |
(1028) 0x46b7f5 VMOVUPD -0x8(%RDX,%R13,8),%YMM29 |
(1028) 0x46b800 VMOVUPD (%RDX,%R13,8),%YMM30 |
(1028) 0x46b807 VSUBPD %YMM25,%YMM2,%YMM25 |
(1028) 0x46b80d VMOVUPD -0x8(%RSI,%R13,8),%YMM31 |
(1028) 0x46b818 VMOVUPD (%RSI,%R13,8),%YMM20 |
(1028) 0x46b81f VADDPD %YMM29,%YMM30,%YMM2 |
(1028) 0x46b825 VADDPD %YMM20,%YMM31,%YMM1 |
(1028) 0x46b82b VSUBPD %YMM1,%YMM2,%YMM1 |
(1028) 0x46b82f MOV 0x158(%RSP),%RCX |
(1028) 0x46b837 VMOVUPD -0x8(%RCX,%R13,8),%YMM2 |
(1028) 0x46b83e VMULPD %YMM25,%YMM2,%YMM13 |
(1028) 0x46b844 VFMADD231PD %YMM1,%YMM24,%YMM13 |
(1028) 0x46b84a VADDPD %YMM10,%YMM21,%YMM10 |
(1028) 0x46b850 VSUBPD %YMM10,%YMM23,%YMM10 |
(1028) 0x46b856 VADDPD %YMM22,%YMM10,%YMM10 |
(1028) 0x46b85c VBROADCASTSD 0x8a53b(%RIP),%YMM14 |
(1028) 0x46b865 VMULPD %YMM14,%YMM10,%YMM10 |
(1028) 0x46b86a VADDPD %YMM31,%YMM29,%YMM21 |
(1028) 0x46b870 VSUBPD %YMM21,%YMM30,%YMM21 |
(1028) 0x46b876 VADDPD %YMM20,%YMM21,%YMM20 |
(1028) 0x46b87c VMULPD %YMM14,%YMM20,%YMM20 |
(1028) 0x46b882 VDIVPD %YMM2,%YMM18,%YMM23 |
(1028) 0x46b888 VMULPD %YMM23,%YMM20,%YMM20 |
(1028) 0x46b88e VMOVUPD (%RAX,%R13,8),%YMM21 |
(1028) 0x46b895 VFMADD231PD %YMM10,%YMM26,%YMM20 |
(1028) 0x46b89b VSUBPD -0x10(%RAX,%R13,8),%YMM21,%YMM10 |
(1028) 0x46b8a6 VADDPD (%RCX,%R13,8),%YMM2,%YMM21 |
(1028) 0x46b8ad VDIVPD %YMM21,%YMM10,%YMM22 |
(1028) 0x46b8b3 VMOVUPD (%R15,%R13,8),%YMM10 |
(1028) 0x46b8b9 VSUBPD (%R11,%R13,8),%YMM10,%YMM10 |
(1028) 0x46b8bf VMULPD 0x180(%RSP),%YMM10,%YMM21 |
(1028) 0x46b8c7 VMULPD %YMM22,%YMM22,%YMM10 |
(1028) 0x46b8cd VMULPD %YMM21,%YMM21,%YMM29 |
(1028) 0x46b8d3 VMULPD %YMM14,%YMM25,%YMM25 |
(1028) 0x46b8d9 VMULPD %YMM23,%YMM25,%YMM23 |
(1028) 0x46b8df VMULPD %YMM10,%YMM23,%YMM23 |
(1028) 0x46b8e5 VMULPD %YMM1,%YMM14,%YMM1 |
(1028) 0x46b8e9 VMULPD %YMM29,%YMM1,%YMM1 |
(1028) 0x46b8ef VMULPD %YMM20,%YMM22,%YMM20 |
(1028) 0x46b8f5 VFMADD213PD %YMM23,%YMM21,%YMM20 |
(1028) 0x46b8fb VFMADD231PD %YMM1,%YMM26,%YMM20 |
(1028) 0x46b901 VADDPD %YMM10,%YMM29,%YMM1 |
(1028) 0x46b907 VMAXPD %YMM8,%YMM1,%YMM1 |
(1028) 0x46b90c VDIVPD %YMM1,%YMM20,%YMM10 |
(1028) 0x46b912 VCMPPD $0x1,%YMM10,%YMM28,%K1 |
(1028) 0x46b919 VCMPPD $0x2,%YMM13,%YMM28,%K0 |
(1028) 0x46b920 VCMPPD $0x6,%YMM13,%YMM28,%K1{%K1} |
(1028) 0x46b927 KORW %K1,%K0,%K1 |
(1028) 0x46b92b KNOTW %K1,%K2 |
(1028) 0x46b92f KMOVD %K2,%EBX |
(1028) 0x46b933 TEST $0xf,%BL |
(1028) 0x46b936 VMOVAPD %YMM8,%YMM14 |
(1028) 0x46b93b VXORPD %XMM13,%XMM13,%XMM13 |
(1028) 0x46b940 JE 46b660 |
(1028) 0x46b946 MOV 0x78(%RBP),%RCX |
(1028) 0x46b94a MOV (%RCX),%RCX |
(1028) 0x46b94d JMP 46b660 |
0x46b952 NOPW %CS:(%RAX,%RAX,1) |
(1026) 0x46b960 VMOVAPD %YMM18,%YMM14 |
(1026) 0x46b966 VPCMPEQD %YMM4,%YMM4,%YMM4 |
(1026) 0x46b96a VPTEST %YMM4,%YMM5 |
(1026) 0x46b96f VMOVAPD 0x1f0(%RSP),%XMM8 |
(1026) 0x46b978 JB 46b9b8 |
(1026) 0x46b97a VEXTRACTI128 $0x1,%YMM5,%XMM0 |
(1026) 0x46b980 VPMAXSQ %XMM0,%XMM5,%XMM0 |
(1026) 0x46b986 VPSHUFD $-0x12,%XMM0,%XMM1 |
(1026) 0x46b98b VPMAXSQ %XMM1,%XMM0,%XMM0 |
(1026) 0x46b991 VPBROADCASTQ %XMM0,%YMM0 |
(1026) 0x46b996 VPCMPEQQ %YMM0,%YMM5,%K0 |
(1026) 0x46b99c KMOVD %K0,%EAX |
(1026) 0x46b9a0 TZCNT %EAX,%EAX |
(1026) 0x46b9a4 VMOVAPD %YMM31,0x2c0(%RSP) |
(1026) 0x46b9ac AND $0x3,%EAX |
(1026) 0x46b9af VMOVSD 0x2c0(%RSP,%RAX,8),%XMM8 |
(1026) 0x46b9b8 VPTEST %YMM4,%YMM9 |
(1026) 0x46b9bd VXORPD %XMM18,%XMM18,%XMM18 |
(1026) 0x46b9c3 VMOVAPD 0x1e0(%RSP),%XMM26 |
(1026) 0x46b9cb VMOVAPD 0x1d0(%RSP),%XMM27 |
(1026) 0x46b9d3 VMOVAPD 0x1c0(%RSP),%XMM28 |
(1026) 0x46b9db MOV 0x128(%RSP),%R13 |
(1026) 0x46b9e3 MOV 0x120(%RSP),%R15 |
(1026) 0x46b9eb MOV 0x110(%RSP),%R11 |
(1026) 0x46b9f3 MOV 0x108(%RSP),%RSI |
(1026) 0x46b9fb MOV 0xf8(%RSP),%R9 |
(1026) 0x46ba03 MOV 0xf0(%RSP),%RBX |
(1026) 0x46ba0b JB 46ba4a |
(1026) 0x46ba0d VEXTRACTI128 $0x1,%YMM9,%XMM0 |
(1026) 0x46ba13 VPMAXSQ %XMM0,%XMM9,%XMM0 |
(1026) 0x46ba19 VPSHUFD $-0x12,%XMM0,%XMM1 |
(1026) 0x46ba1e VPMAXSQ %XMM1,%XMM0,%XMM0 |
(1026) 0x46ba24 VPBROADCASTQ %XMM0,%YMM0 |
(1026) 0x46ba29 VPCMPEQQ %YMM0,%YMM9,%K0 |
(1026) 0x46ba2f KMOVD %K0,%EAX |
(1026) 0x46ba33 TZCNT %EAX,%EAX |
(1026) 0x46ba37 VMOVAPD %YMM25,0x2a0(%RSP) |
(1026) 0x46ba3f AND $0x3,%EAX |
(1026) 0x46ba42 VMOVSD 0x2a0(%RSP,%RAX,8),%XMM26 |
(1026) 0x46ba4a VPTEST %YMM4,%YMM6 |
(1026) 0x46ba4f VMOVAPD 0x1b0(%RSP),%XMM31 |
(1026) 0x46ba57 JB 46ba96 |
(1026) 0x46ba59 VEXTRACTI128 $0x1,%YMM6,%XMM0 |
(1026) 0x46ba5f VPMAXSQ %XMM0,%XMM6,%XMM0 |
(1026) 0x46ba65 VPSHUFD $-0x12,%XMM0,%XMM1 |
(1026) 0x46ba6a VPMAXSQ %XMM1,%XMM0,%XMM0 |
(1026) 0x46ba70 VPBROADCASTQ %XMM0,%YMM0 |
(1026) 0x46ba75 VPCMPEQQ %YMM0,%YMM6,%K0 |
(1026) 0x46ba7b KMOVD %K0,%EAX |
(1026) 0x46ba7f TZCNT %EAX,%EAX |
(1026) 0x46ba83 VMOVAPD %YMM23,0x280(%RSP) |
(1026) 0x46ba8b AND $0x3,%EAX |
(1026) 0x46ba8e VMOVSD 0x280(%RSP,%RAX,8),%XMM27 |
(1026) 0x46ba96 VPTEST %YMM4,%YMM3 |
(1026) 0x46ba9b VMOVSD 0xa6f7b(%RIP),%XMM25 |
(1026) 0x46baa5 VMOVAPD 0x170(%RSP),%XMM20 |
(1026) 0x46baad JB 46baec |
(1026) 0x46baaf VEXTRACTI128 $0x1,%YMM3,%XMM0 |
(1026) 0x46bab5 VPMAXSQ %XMM0,%XMM3,%XMM0 |
(1026) 0x46babb VPSHUFD $-0x12,%XMM0,%XMM1 |
(1026) 0x46bac0 VPMAXSQ %XMM1,%XMM0,%XMM0 |
(1026) 0x46bac6 VPBROADCASTQ %XMM0,%YMM0 |
(1026) 0x46bacb VPCMPEQQ %YMM0,%YMM3,%K0 |
(1026) 0x46bad1 KMOVD %K0,%EAX |
(1026) 0x46bad5 TZCNT %EAX,%EAX |
(1026) 0x46bad9 VMOVAPD %YMM22,0x260(%RSP) |
(1026) 0x46bae1 AND $0x3,%EAX |
(1026) 0x46bae4 VMOVSD 0x260(%RSP,%RAX,8),%XMM28 |
(1026) 0x46baec VPTEST %YMM4,%YMM11 |
(1026) 0x46baf1 VMOVSD 0xa6f1d(%RIP),%XMM23 |
(1026) 0x46bafb JB 46bb3a |
(1026) 0x46bafd VEXTRACTI128 $0x1,%YMM11,%XMM0 |
(1026) 0x46bb03 VPMAXSQ %XMM0,%XMM11,%XMM0 |
(1026) 0x46bb09 VPSHUFD $-0x12,%XMM0,%XMM1 |
(1026) 0x46bb0e VPMAXSQ %XMM1,%XMM0,%XMM0 |
(1026) 0x46bb14 VPBROADCASTQ %XMM0,%YMM0 |
(1026) 0x46bb19 VPCMPEQQ %YMM0,%YMM11,%K0 |
(1026) 0x46bb1f KMOVD %K0,%EAX |
(1026) 0x46bb23 TZCNT %EAX,%EAX |
(1026) 0x46bb27 VMOVAPD %YMM21,0x240(%RSP) |
(1026) 0x46bb2f AND $0x3,%EAX |
(1026) 0x46bb32 VMOVSD 0x240(%RSP,%RAX,8),%XMM31 |
(1026) 0x46bb3a VPTEST %YMM4,%YMM12 |
(1026) 0x46bb3f VMOVSD 0x8a257(%RIP),%XMM22 |
(1026) 0x46bb49 JB 46bb92 |
(1026) 0x46bb4b VEXTRACTI128 $0x1,%YMM12,%XMM0 |
(1026) 0x46bb51 VPMAXSQ %XMM0,%XMM12,%XMM0 |
(1026) 0x46bb57 VPSHUFD $-0x12,%XMM0,%XMM1 |
(1026) 0x46bb5c VPMAXSQ %XMM1,%XMM0,%XMM0 |
(1026) 0x46bb62 VPBROADCASTQ %XMM0,%YMM0 |
(1026) 0x46bb67 VPCMPEQQ %YMM0,%YMM12,%K0 |
(1026) 0x46bb6d KMOVD %K0,%EAX |
(1026) 0x46bb71 TZCNT %EAX,%EAX |
(1026) 0x46bb75 VMOVAPD %YMM30,0x220(%RSP) |
(1026) 0x46bb7d AND $0x3,%EAX |
(1026) 0x46bb80 VMOVSD 0x220(%RSP,%RAX,8),%XMM0 |
(1026) 0x46bb89 VMOVAPD %XMM0,0x160(%RSP) |
(1026) 0x46bb92 VPTEST %YMM4,%YMM2 |
(1026) 0x46bb97 VMOVSD 0x8951f(%RIP),%XMM21 |
(1026) 0x46bba1 VMOVAPD 0x1a0(%RSP),%XMM30 |
(1026) 0x46bba9 JB 46bbe8 |
(1026) 0x46bbab VEXTRACTI128 $0x1,%YMM2,%XMM0 |
(1026) 0x46bbb1 VPMAXSQ %XMM0,%XMM2,%XMM0 |
(1026) 0x46bbb7 VPSHUFD $-0x12,%XMM0,%XMM1 |
(1026) 0x46bbbc VPMAXSQ %XMM1,%XMM0,%XMM0 |
(1026) 0x46bbc2 VPBROADCASTQ %XMM0,%YMM0 |
(1026) 0x46bbc7 VPCMPEQQ %YMM0,%YMM2,%K0 |
(1026) 0x46bbcd KMOVD %K0,%EAX |
(1026) 0x46bbd1 TZCNT %EAX,%EAX |
(1026) 0x46bbd5 VMOVAPD %YMM29,0x200(%RSP) |
(1026) 0x46bbdd AND $0x3,%EAX |
(1026) 0x46bbe0 VMOVSD 0x200(%RSP,%RAX,8),%XMM30 |
(1026) 0x46bbe8 MOV %RDI,%RDX |
(1026) 0x46bbeb CMP 0x38(%RSP),%RDI |
(1026) 0x46bbf0 VMOVAPD 0x160(%RSP),%XMM29 |
(1026) 0x46bbf8 VMOVSD 0x118(%RSP),%XMM1 |
(1026) 0x46bc01 MOV 0x100(%RSP),%RDI |
(1026) 0x46bc09 JE 46b3f0 |
(1026) 0x46bc0f JMP 46bc4b |
0x46bc11 NOPW %CS:(%RAX,%RAX,1) |
(1026) 0x46bc20 MOV %RBX,%R8 |
(1026) 0x46bc23 MOV %R14,%RBX |
(1026) 0x46bc26 IMUL %R10,%RBX |
(1026) 0x46bc2a LEA 0x1(%R10),%RSI |
(1026) 0x46bc2e MOV %R14,%R9 |
(1026) 0x46bc31 IMUL %RSI,%R9 |
(1026) 0x46bc35 MOV %R15,%RDI |
(1026) 0x46bc38 IMUL %R10,%RDI |
(1026) 0x46bc3c IMUL %R15,%RSI |
(1026) 0x46bc40 IMUL %R11,%R10 |
(1026) 0x46bc44 MOV %R10,0x40(%RSP) |
(1026) 0x46bc49 XOR %EDX,%EDX |
(1026) 0x46bc4b MOV 0x28(%RSP),%RAX |
(1026) 0x46bc50 ADD %RAX,%RBX |
(1026) 0x46bc53 MOV 0xb0(%RSP),%RCX |
(1026) 0x46bc5b LEA (%RCX,%RDX,1),%R10 |
(1026) 0x46bc5f MOV %R10,%R14 |
(1026) 0x46bc62 SUB 0xb8(%RSP),%R14 |
(1026) 0x46bc6a VMOVSD (%RBX,%R14,8),%XMM3 |
(1026) 0x46bc70 ADD %RAX,%R9 |
(1026) 0x46bc73 VMOVSD (%R9,%R14,8),%XMM11 |
(1026) 0x46bc79 MOV 0x30(%RSP),%RAX |
(1026) 0x46bc7e ADD %RAX,%RDI |
(1026) 0x46bc81 VMOVSD (%RDI,%R14,8),%XMM12 |
(1026) 0x46bc87 MOV 0xa8(%RSP),%RCX |
(1026) 0x46bc8f ADD %R10,%RCX |
(1026) 0x46bc92 ADD %RAX,%RSI |
(1026) 0x46bc95 VMOVSD (%RSI,%R14,8),%XMM24 |
(1026) 0x46bc9c IMUL %R11,%R13 |
(1026) 0x46bca0 MOV %R11,%R9 |
(1026) 0x46bca3 MOV %R8,%R12 |
(1026) 0x46bca6 IMUL %R8,%R11 |
(1026) 0x46bcaa LEA (%R11,%R10,8),%RAX |
(1026) 0x46bcae MOV 0x18(%RBP),%RSI |
(1026) 0x46bcb2 MOV 0x40(%RSP),%R8 |
(1026) 0x46bcb7 ADD %RSI,%R8 |
(1026) 0x46bcba VMOVSD (%R8,%RCX,8),%XMM4 |
(1026) 0x46bcc0 MOV 0x138(%RSP),%RSI |
(1026) 0x46bcc8 MOV %RSI,%RCX |
(1026) 0x46bccb IMUL %R12,%RCX |
(1026) 0x46bccf LEA (%RCX,%R10,8),%R11 |
(1026) 0x46bcd3 MOV 0x148(%RSP),%RCX |
(1026) 0x46bcdb IMUL %RCX,%RSI |
(1026) 0x46bcdf LEA (%RSI,%R10,8),%RSI |
(1026) 0x46bce3 IMUL %RCX,%R9 |
(1026) 0x46bce7 IMUL %R15,%RCX |
(1026) 0x46bceb LEA (%RCX,%R10,8),%RBX |
(1026) 0x46bcef IMUL %R12,%R15 |
(1026) 0x46bcf3 LEA (%R15,%R10,8),%RCX |
(1026) 0x46bcf7 MOV 0x90(%RSP),%RDI |
(1026) 0x46bcff LEA (%RDI,%R10,8),%R15 |
(1026) 0x46bd03 VMOVQ (%R8,%R14,8),%XMM9 |
(1026) 0x46bd09 MOV 0x30(%RBP),%RDI |
(1026) 0x46bd0d VMOVSD (%RDI,%R14,8),%XMM0 |
(1026) 0x46bd13 VDIVSD %XMM20,%XMM21,%XMM6 |
(1026) 0x46bd19 VDIVSD %XMM1,%XMM21,%XMM2 |
(1026) 0x46bd1f MOV 0x38(%RSP),%R8 |
(1026) 0x46bd24 SUB %RDX,%R8 |
(1026) 0x46bd27 MOV %R12,0x180(%RSP) |
(1026) 0x46bd2f MOV 0x140(%RSP),%RDI |
(1026) 0x46bd37 IMUL %R12,%RDI |
(1026) 0x46bd3b ADD 0x98(%RSP),%RDX |
(1026) 0x46bd43 LEA (%RDI,%RDX,8),%R12 |
(1026) 0x46bd47 ADD 0x10(%RBP),%R12 |
(1026) 0x46bd4b MOV 0x20(%RBP),%RDI |
(1026) 0x46bd4f LEA (%RDI,%RDX,8),%R14 |
(1026) 0x46bd53 LEA (%R13,%RDX,8),%R13 |
(1026) 0x46bd58 MOV 0x18(%RBP),%RDI |
(1026) 0x46bd5c ADD %RDI,%R13 |
(1026) 0x46bd5f LEA (%R9,%RDX,8),%RDX |
(1026) 0x46bd63 ADD %RDI,%RDX |
(1026) 0x46bd66 ADD 0x88(%RSP),%RAX |
(1026) 0x46bd6e MOV 0x80(%RSP),%RDI |
(1026) 0x46bd76 ADD %RDI,%R11 |
(1026) 0x46bd79 ADD %RDI,%RSI |
(1026) 0x46bd7c MOV 0xa0(%RSP),%RDI |
(1026) 0x46bd84 ADD %RDI,%RBX |
(1026) 0x46bd87 ADD %RDI,%RCX |
(1026) 0x46bd8a XOR %R10D,%R10D |
(1026) 0x46bd8d JMP 46bdaf |
0x46bd8f NOP |
(1027) 0x46bd90 VMOVSD %XMM17,(%R12,%R10,8) |
(1027) 0x46bd97 INC %R10 |
(1027) 0x46bd9a VMOVDQA %XMM9,%XMM4 |
(1027) 0x46bd9e VMOVAPD %XMM5,%XMM9 |
(1027) 0x46bda2 VMOVAPD %XMM7,%XMM0 |
(1027) 0x46bda6 CMP %R10,%R8 |
(1027) 0x46bda9 JE 46b3f0 |
(1027) 0x46bdaf VMOVAPD %XMM24,%XMM1 |
(1027) 0x46bdb5 VMOVAPD %XMM12,%XMM5 |
(1027) 0x46bdb9 VMOVSD (%RCX,%R10,8),%XMM12 |
(1027) 0x46bdbf VMOVSD (%RBX,%R10,8),%XMM24 |
(1027) 0x46bdc6 VMOVAPD %XMM11,%XMM7 |
(1027) 0x46bdca VMOVAPD %XMM3,%XMM10 |
(1027) 0x46bdce VADDSD %XMM12,%XMM24,%XMM3 |
(1027) 0x46bdd4 VADDSD %XMM1,%XMM5,%XMM11 |
(1027) 0x46bdd8 VSUBSD %XMM11,%XMM3,%XMM13 |
(1027) 0x46bddd VMOVSD (%RSI,%R10,8),%XMM11 |
(1027) 0x46bde3 VMOVSD (%R11,%R10,8),%XMM3 |
(1027) 0x46bde9 VADDSD %XMM7,%XMM11,%XMM15 |
(1027) 0x46bded VADDSD %XMM3,%XMM10,%XMM16 |
(1027) 0x46bdf3 VSUBSD %XMM16,%XMM15,%XMM17 |
(1027) 0x46bdf9 VMULSD %XMM13,%XMM0,%XMM19 |
(1027) 0x46bdff VFMADD231SD %XMM17,%XMM20,%XMM19 |
(1027) 0x46be05 VADDSD %XMM5,%XMM12,%XMM5 |
(1027) 0x46be09 VSUBSD %XMM5,%XMM24,%XMM5 |
(1027) 0x46be0f VADDSD %XMM1,%XMM5,%XMM1 |
(1027) 0x46be13 VMULSD %XMM22,%XMM1,%XMM1 |
(1027) 0x46be19 VADDSD %XMM7,%XMM10,%XMM5 |
(1027) 0x46be1d VSUBSD %XMM5,%XMM11,%XMM5 |
(1027) 0x46be21 VADDSD %XMM3,%XMM5,%XMM5 |
(1027) 0x46be25 VMULSD %XMM22,%XMM5,%XMM5 |
(1027) 0x46be2b VDIVSD %XMM0,%XMM21,%XMM10 |
(1027) 0x46be31 VMULSD %XMM10,%XMM5,%XMM20 |
(1027) 0x46be37 VFMADD231SD %XMM1,%XMM6,%XMM20 |
(1027) 0x46be3d VMOVSD (%RAX,%R10,8),%XMM5 |
(1027) 0x46be43 VSUBSD %XMM4,%XMM5,%XMM1 |
(1027) 0x46be47 VMOVSD (%R15,%R10,8),%XMM7 |
(1027) 0x46be4d VADDSD %XMM0,%XMM7,%XMM4 |
(1027) 0x46be51 VDIVSD %XMM4,%XMM1,%XMM16 |
(1027) 0x46be57 VMOVSD (%RDX,%R10,8),%XMM1 |
(1027) 0x46be5d VSUBSD (%R13,%R10,8),%XMM1,%XMM1 |
(1027) 0x46be64 VMULSD %XMM2,%XMM1,%XMM15 |
(1027) 0x46be68 VMULSD %XMM16,%XMM16,%XMM1 |
(1027) 0x46be6e VMULSD %XMM15,%XMM15,%XMM4 |
(1027) 0x46be73 VMULSD %XMM22,%XMM13,%XMM13 |
(1027) 0x46be79 VMULSD %XMM10,%XMM13,%XMM10 |
(1027) 0x46be7e VMULSD %XMM1,%XMM10,%XMM10 |
(1027) 0x46be82 VMULSD %XMM22,%XMM17,%XMM13 |
(1027) 0x46be88 VMULSD %XMM4,%XMM13,%XMM13 |
(1027) 0x46be8c VMULSD %XMM20,%XMM16,%XMM17 |
(1027) 0x46be92 VMOVAPD 0x170(%RSP),%XMM20 |
(1027) 0x46be9a VFMADD213SD %XMM10,%XMM15,%XMM17 |
(1027) 0x46bea0 VFMADD231SD %XMM13,%XMM6,%XMM17 |
(1027) 0x46bea6 VADDSD %XMM1,%XMM4,%XMM1 |
(1027) 0x46beaa VMAXSD %XMM23,%XMM1,%XMM1 |
(1027) 0x46beb0 VDIVSD %XMM1,%XMM17,%XMM4 |
(1027) 0x46beb6 VXORPD %XMM17,%XMM17,%XMM17 |
(1027) 0x46bebc XOR %EDI,%EDI |
(1027) 0x46bebe VUCOMISD %XMM17,%XMM4 |
(1027) 0x46bec4 SETBE %DIL |
(1027) 0x46bec8 XOR %R9D,%R9D |
(1027) 0x46becb VUCOMISD %XMM17,%XMM19 |
(1027) 0x46bed1 SETB %R9B |
(1027) 0x46bed5 CMP %R9B,%DIL |
(1027) 0x46bed8 CMOVB %EDI,%R9D |
(1027) 0x46bedc CMP $0x1,%R9B |
(1027) 0x46bee0 JNE 46bd90 |
(1027) 0x46bee6 VCMPSD $0x1,%XMM18,%XMM16,%K1 |
(1027) 0x46beed VMOVAPD %XMM21,%XMM8 |
(1027) 0x46bef3 VMOVSD %XMM25,%XMM8,%XMM8{%K1} |
(1027) 0x46bef9 VMOVDDUP 0x89047(%RIP),%XMM1 |
(1027) 0x46bf01 VANDPD %XMM1,%XMM16,%XMM10 |
(1027) 0x46bf07 VMAXSD %XMM10,%XMM23,%XMM10 |
(1027) 0x46bf0d VMULSD %XMM8,%XMM10,%XMM10 |
(1027) 0x46bf12 VCMPSD $0x1,%XMM18,%XMM10,%K1 |
(1027) 0x46bf19 VMOVAPD %XMM21,%XMM26 |
(1027) 0x46bf1f VMOVSD %XMM25,%XMM26,%XMM26{%K1} |
(1027) 0x46bf25 VANDPD %XMM1,%XMM15,%XMM13 |
(1027) 0x46bf29 VMAXSD %XMM13,%XMM23,%XMM13 |
(1027) 0x46bf2f VMULSD %XMM26,%XMM13,%XMM13 |
(1027) 0x46bf35 VMULSD %XMM10,%XMM10,%XMM15 |
(1027) 0x46bf3a VFMADD231SD %XMM13,%XMM13,%XMM15 |
(1027) 0x46bf3f VSQRTSD %XMM15,%XMM15,%XMM27 |
(1027) 0x46bf45 VMULSD %XMM0,%XMM27,%XMM0 |
(1027) 0x46bf4b VDIVSD %XMM10,%XMM0,%XMM0 |
(1027) 0x46bf50 VANDPD %XMM1,%XMM0,%XMM28 |
(1027) 0x46bf56 VMULSD %XMM20,%XMM27,%XMM0 |
(1027) 0x46bf5c VDIVSD %XMM13,%XMM0,%XMM0 |
(1027) 0x46bf61 VANDPD %XMM1,%XMM0,%XMM31 |
(1027) 0x46bf67 VCMPSD $0x2,%XMM31,%XMM28,%K1 |
(1027) 0x46bf6e VMOVAPD %XMM31,%XMM29 |
(1027) 0x46bf74 VMOVSD %XMM28,%XMM29,%XMM29{%K1} |
(1027) 0x46bf7a VMULSD %XMM29,%XMM29,%XMM30 |
(1027) 0x46bf80 VMULSD %XMM4,%XMM4,%XMM0 |
(1027) 0x46bf84 VADDSD %XMM30,%XMM30,%XMM1 |
(1027) 0x46bf8a VMULSD %XMM1,%XMM0,%XMM0 |
(1027) 0x46bf8e MOV 0x78(%RBP),%RDI |
(1027) 0x46bf92 MOV (%RDI),%RDI |
(1027) 0x46bf95 IMUL 0x180(%RSP),%RDI |
(1027) 0x46bf9e ADD %R14,%RDI |
(1027) 0x46bfa1 VMULSD (%RDI,%R10,8),%XMM0,%XMM17 |
(1027) 0x46bfa8 JMP 46bd90 |
0x46bfad NOPL (%RAX) |
Path / |
Source file and lines | viscosity_kernel.f90:50-94 |
Module | exec |
nb instructions | 168 |
nb uops | 172 |
loop length | 755 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 5 |
used ymm registers | 1 |
used zmm registers | 0 |
nb stack references | 43 |
micro-operation queue | 28.67 cycles |
front end | 28.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 12.30 | 12.20 | 10.00 | 10.00 | 22.00 | 12.20 | 12.10 | 22.00 | 22.00 | 22.00 | 12.20 | 10.00 |
cycles | 12.30 | 13.60 | 10.00 | 10.00 | 22.00 | 12.20 | 12.10 | 22.00 | 22.00 | 22.00 | 12.20 | 10.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 28.14-28.20 |
Stall cycles | 0.00 |
Front-end | 28.67 |
Dispatch | 22.00 |
Overall L1 | 28.67 |
all | 1% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 5% |
all | 16% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 50% |
all | 3% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 10% |
all | 11% |
load | 6% |
store | 11% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 14% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 18% |
all | 11% |
load | 11% |
store | 11% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 13% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x300,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RBP),%EBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RBP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %EBX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOVL $0,0x24(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JS 46b1cf <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0xaf> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVL $0,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %EAX,0xc(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVL $0x1,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0x28(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x2c(%RSP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x18(%RSP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x14(%RSP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x73d630,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,0x1c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x22,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
CALL 404520 <__kmpc_for_static_init_4@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x20,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x10(%RSP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xc(%RSP),%ECX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %EAX,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ECX,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JAE 46b1ea <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0xca> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x73d650,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x14(%RSP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 404110 <__kmpc_for_static_fini@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x48(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x73d670,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4045e0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x50(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SAL $0x20,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV $-0x200000000,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
LEA (%R12,%RAX,1),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RCX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SAR $0x20,%R8 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
SAL $0x20,%R13 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
ADD %R13,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SAR $0x20,%R9 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOVSXD (%RDX),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%EDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %R10D,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %EBX,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDX,0x130(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
INC %EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMP $0x2,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVGE %EDX,%ESI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSI,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
AND $0x7ffffffc,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %RSI,0xd8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %RCX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV $-0x1,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVNS %RCX,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %RSI,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV $0x1,%R11D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %R11,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV $0x200000000,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
MOV %RBX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R12,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMP %RDX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %RCX,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LEA (,%R10,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SHR $0x20,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
IMUL %RSI,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV $-0x1,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
SUB %RDX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
CMOVNS %RAX,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %RSI,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
CMOVG %R11,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB %R13,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x30(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RBX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %RAX,%RBX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R8,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SHR $0x20,%RBX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
IMUL %RSI,%RBX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
NEG %RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,0xc8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SUB %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %R9,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R11,0xd0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x8(%R9,%RCX,1),%R11 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R11,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RCX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDX,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%RAX,%RCX,1),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R9,%RCX,1),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x8(%R14,%RCX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,0x158(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x8(%RDX,%RCX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x8(%RAX,%RCX,1),%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RCX,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,0xb8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %R8,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R10,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R14,%RSI,1),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RCX,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R9,%RSI,1),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RCX,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%RDX,%RSI,1),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RCX,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RSI,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD 0x89d0d(%RIP),%XMM21 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x8a9e3(%RIP),%XMM22 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0xa7651(%RIP),%XMM23 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0xa764f(%RIP),%XMM25 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD 0x89ce6(%RIP),%YMM14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VXORPD %XMM18,%XMM18,%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,0xe8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %EDI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 46b40e <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0x2ee> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | viscosity_kernel.f90:50-94 |
Module | exec |
nb instructions | 168 |
nb uops | 172 |
loop length | 755 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 5 |
used ymm registers | 1 |
used zmm registers | 0 |
nb stack references | 43 |
micro-operation queue | 28.67 cycles |
front end | 28.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 12.30 | 12.20 | 10.00 | 10.00 | 22.00 | 12.20 | 12.10 | 22.00 | 22.00 | 22.00 | 12.20 | 10.00 |
cycles | 12.30 | 13.60 | 10.00 | 10.00 | 22.00 | 12.20 | 12.10 | 22.00 | 22.00 | 22.00 | 12.20 | 10.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 28.14-28.20 |
Stall cycles | 0.00 |
Front-end | 28.67 |
Dispatch | 22.00 |
Overall L1 | 28.67 |
all | 1% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 5% |
all | 16% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 50% |
all | 3% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 10% |
all | 11% |
load | 6% |
store | 11% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 14% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 18% |
all | 11% |
load | 11% |
store | 11% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 13% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x300,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RBP),%EBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RBP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %EBX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOVL $0,0x24(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JS 46b1cf <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0xaf> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVL $0,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %EAX,0xc(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVL $0x1,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0x28(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x2c(%RSP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x18(%RSP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x14(%RSP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x73d630,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,0x1c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x22,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
CALL 404520 <__kmpc_for_static_init_4@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x20,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x10(%RSP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xc(%RSP),%ECX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %EAX,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ECX,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JAE 46b1ea <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0xca> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x73d650,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x14(%RSP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 404110 <__kmpc_for_static_fini@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x48(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x73d670,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4045e0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x50(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SAL $0x20,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV $-0x200000000,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
LEA (%R12,%RAX,1),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RCX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SAR $0x20,%R8 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
SAL $0x20,%R13 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
ADD %R13,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SAR $0x20,%R9 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOVSXD (%RDX),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%EDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %R10D,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %EBX,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDX,0x130(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
INC %EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMP $0x2,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVGE %EDX,%ESI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSI,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
AND $0x7ffffffc,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %RSI,0xd8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %RCX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV $-0x1,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVNS %RCX,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %RSI,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV $0x1,%R11D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %R11,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV $0x200000000,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
MOV %RBX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R12,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMP %RDX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %RCX,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LEA (,%R10,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SHR $0x20,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
IMUL %RSI,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV $-0x1,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
SUB %RDX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
CMOVNS %RAX,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %RSI,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
CMOVG %R11,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB %R13,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x30(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RBX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %RAX,%RBX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R8,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SHR $0x20,%RBX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
IMUL %RSI,%RBX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
NEG %RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,0xc8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SUB %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %R9,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R11,0xd0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x8(%R9,%RCX,1),%R11 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R11,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RCX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDX,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%RAX,%RCX,1),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R9,%RCX,1),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x8(%R14,%RCX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,0x158(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x8(%RDX,%RCX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x8(%RAX,%RCX,1),%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RCX,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,0xb8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %R8,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R10,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R14,%RSI,1),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RCX,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R9,%RSI,1),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RCX,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%RDX,%RSI,1),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RCX,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RSI,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD 0x89d0d(%RIP),%XMM21 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x8a9e3(%RIP),%XMM22 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0xa7651(%RIP),%XMM23 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0xa764f(%RIP),%XMM25 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD 0x89ce6(%RIP),%YMM14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VXORPD %XMM18,%XMM18,%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,0xe8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %EDI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 46b40e <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0x2ee> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼viscosity_kernel_.DIR.OMP.PARALLEL.2– | 2.17 | 1.67 |
▼Loop 1026 - viscosity_kernel.f90:53-89 - exec– | 0 | 0.01 |
○Loop 1028 - viscosity_kernel.f90:53-89 - exec | 2.17 | 1.66 |
○Loop 1027 - viscosity_kernel.f90:55-89 - exec | 0 | 0 |