Function: viscosity_kernel_.DIR.OMP.PARALLEL.2 | Module: exec | Source: viscosity_kernel.f90:50-94 | Coverage: 2.26% |
---|
Function: viscosity_kernel_.DIR.OMP.PARALLEL.2 | Module: exec | Source: viscosity_kernel.f90:50-94 | Coverage: 2.26% |
---|
/home/eoseret/qaas_runs_CPU_9468/171-137-7698/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/viscosity_kernel.f90: 50 - 94 |
-------------------------------------------------------------------------------- |
50: !$OMP PARALLEL |
51: ! Sets viscosity(j,k) for each (j,k) in x_min:x_max, y_min:y_max: zero when limiter > 0 or div >= 0, otherwise 2*density0*grad2*limiter**2. |
52: !$OMP DO PRIVATE(ugrad,vgrad,div,strain2,pgradx,pgrady,pgradx2,pgrady2,limiter,pgrad,xgrad,ygrad,grad,grad2,dirx,diry) |
53: DO k=y_min,y_max |
54: !$OMP SIMD |
55: DO j=x_min,x_max |
56: ugrad=(xvel0(j+1,k )+xvel0(j+1,k+1))-(xvel0(j ,k )+xvel0(j ,k+1)) |
57: ! ugrad (above): xvel0 summed on the j+1 side minus the j side. vgrad (below): yvel0 summed on the k+1 side minus the k side. |
58: vgrad=(yvel0(j ,k+1)+yvel0(j+1,k+1))-(yvel0(j ,k )+yvel0(j+1,k )) |
59: ! div: ugrad scaled by celldx(j) plus vgrad scaled by celldy(k); only its sign is used, in the IF test further down. |
60: div = (celldx(j)*(ugrad)+ celldy(k)*(vgrad)) |
61: ! strain2: half the k-direction difference of xvel0 over celldy(k) plus half the j-direction difference of yvel0 over celldx(j). |
62: strain2 = 0.5_8*(xvel0(j, k+1) + xvel0(j+1,k+1)-xvel0(j ,k )-xvel0(j+1,k ))/celldy(k) & |
63: + 0.5_8*(yvel0(j+1,k ) + yvel0(j+1,k+1)-yvel0(j ,k )-yvel0(j ,k+1))/celldx(j) |
64: ! Pressure differences read j-1/j+1 and k-1/k+1, so pressure (and celldx/celldy at j+1, k+1) are accessed one element beyond the loop bounds. |
65: pgradx=(pressure(j+1,k)-pressure(j-1,k))/(celldx(j)+celldx(j+1)) |
66: pgrady=(pressure(j,k+1)-pressure(j,k-1))/(celldy(k)+celldy(k+1)) |
67: ! Squares are computed once and reused in both the numerator and the denominator of limiter. |
68: pgradx2 = pgradx*pgradx |
69: pgrady2 = pgrady*pgrady |
70: ! limiter: numerator combines ugrad, vgrad and strain2 with the pressure-gradient products; denominator is floored at 1.0e-16 so it is never zero. |
71: limiter = ((0.5_8*(ugrad)/celldx(j))*pgradx2+(0.5_8*(vgrad)/celldy(k))*pgrady2+strain2*pgradx*pgrady) & |
72: /MAX(pgradx2+pgrady2,1.0e-16_8) |
73: ! Viscosity is non-zero only when limiter <= 0 and div < 0; every other cell is written as 0. |
74: IF ((limiter.GT.0.0).OR.(div.GE.0.0))THEN |
75: viscosity(j,k) = 0.0 |
76: ELSE |
77: dirx=1.0_8 |
78: IF(pgradx.LT.0.0) dirx=-1.0_8 |
79: pgradx = dirx*MAX(1.0e-16_8,ABS(pgradx)) ! keep the sign, clamp the magnitude to at least 1.0e-16 (pgradx is a divisor below) |
80: diry=1.0_8 |
81: IF(pgradx.LT.0.0) diry=-1.0_8 ! NOTE(review): tests pgradx, not pgrady -- looks like a copy-paste slip; the result is unaffected because pgrady is only squared or passed through ABS() below |
82: pgrady = diry*MAX(1.0e-16_8,ABS(pgrady)) ! magnitude clamped to at least 1.0e-16 (pgrady is a divisor below) |
83: pgrad = SQRT(pgradx**2+pgrady**2) |
84: xgrad = ABS(celldx(j)*pgrad/pgradx) |
85: ygrad = ABS(celldy(k)*pgrad/pgrady) |
86: grad = MIN(xgrad,ygrad) |
87: grad2 = grad*grad |
88: ! Final value uses the smaller of xgrad and ygrad, squared, together with limiter squared. |
89: viscosity(j,k)=2.0_8*density0(j,k)*grad2*limiter*limiter |
90: ENDIF |
91: |
92: ENDDO |
93: ENDDO |
94: !$OMP END DO |
0x47cc00 PUSH %RBP |
0x47cc01 MOV %RSP,%RBP |
0x47cc04 PUSH %R15 |
0x47cc06 PUSH %R14 |
0x47cc08 PUSH %R13 |
0x47cc0a PUSH %R12 |
0x47cc0c PUSH %RBX |
0x47cc0d AND $-0x40,%RSP |
0x47cc11 SUB $0x2c0,%RSP |
0x47cc18 MOV %R9,0x40(%RSP) |
0x47cc1d MOV %R8,0x38(%RSP) |
0x47cc22 MOV 0x40(%RBP),%ESI |
0x47cc25 MOV 0x38(%RBP),%EAX |
0x47cc28 SUB %ESI,%EAX |
0x47cc2a MOVL $0,0x34(%RSP) |
0x47cc32 JS 47ccb0 |
0x47cc34 MOV %RCX,%R14 |
0x47cc37 MOV %RDX,%RBX |
0x47cc3a MOV %RDI,0x58(%RSP) |
0x47cc3f MOV (%RDI),%ESI |
0x47cc41 MOVL $0,0x1c(%RSP) |
0x47cc49 MOV %EAX,0x18(%RSP) |
0x47cc4d MOVL $0x1,0x30(%RSP) |
0x47cc55 SUB $0x8,%RSP |
0x47cc59 LEA 0x38(%RSP),%RAX |
0x47cc5e LEA 0x3c(%RSP),%RCX |
0x47cc63 LEA 0x24(%RSP),%R8 |
0x47cc68 LEA 0x20(%RSP),%R9 |
0x47cc6d MOV $0x553310,%EDI |
0x47cc72 MOV %ESI,0x30(%RSP) |
0x47cc76 MOV $0x22,%EDX |
0x47cc7b PUSH $0x1 |
0x47cc7d PUSH $0x1 |
0x47cc7f PUSH %RAX |
0x47cc80 CALL 404670 <__kmpc_for_static_init_4@plt> |
0x47cc85 ADD $0x20,%RSP |
0x47cc89 MOV 0x1c(%RSP),%EAX |
0x47cc8d MOV 0x18(%RSP),%EDI |
0x47cc91 MOV %RAX,0x50(%RSP) |
0x47cc96 SUB %EAX,%EDI |
0x47cc98 JAE 47cd00 |
0x47cc9a MOV $0x553330,%EDI |
0x47cc9f MOV 0x28(%RSP),%ESI |
0x47cca3 VZEROUPPER |
0x47cca6 CALL 404230 <__kmpc_for_static_fini@plt> |
0x47ccab MOV 0x58(%RSP),%RDI |
0x47ccb0 MOV (%RDI),%ESI |
0x47ccb2 MOV $0x553350,%EDI |
0x47ccb7 CALL 404740 <__kmpc_barrier@plt> |
0x47ccbc LEA -0x28(%RBP),%RSP |
0x47ccc0 POP %RBX |
0x47ccc1 POP %R12 |
0x47ccc3 POP %R13 |
0x47ccc5 POP %R14 |
0x47ccc7 POP %R15 |
0x47ccc9 POP %RBP |
0x47ccca RET |
0x47cccb NOPW %CS:(%RAX,%RAX,1) |
0x47ccda NOPW %CS:(%RAX,%RAX,1) |
0x47cce9 NOPW %CS:(%RAX,%RAX,1) |
0x47ccf8 NOPL (%RAX,%RAX,1) |
0x47cd00 MOV 0x30(%RBP),%R8 |
0x47cd04 MOV 0x20(%RBP),%R9 |
0x47cd08 MOV 0x18(%RBP),%R10 |
0x47cd0c SAL $0x20,%R14 |
0x47cd10 MOV $-0x200000000,%RAX |
0x47cd1a LEA (%R14,%RAX,1),%RDX |
0x47cd1e MOV %RDX,%RCX |
0x47cd21 SAR $0x20,%RCX |
0x47cd25 MOV %RCX,0x60(%RSP) |
0x47cd2a SAL $0x20,%RBX |
0x47cd2e ADD %RBX,%RAX |
0x47cd31 MOV %RAX,%R11 |
0x47cd34 SAR $0x20,%R11 |
0x47cd38 TEST %RDX,%RDX |
0x47cd3b MOV $-0x1,%RSI |
0x47cd42 CMOVNS %RDX,%RSI |
0x47cd46 TEST %RSI,%RSI |
0x47cd49 MOV $0x1,%R15D |
0x47cd4f CMOVG %R15,%RSI |
0x47cd53 MOV $0x200000000,%R12 |
0x47cd5d MOV %R12,%RCX |
0x47cd60 SUB %R14,%RCX |
0x47cd63 MOV 0x10(%RBP),%R14 |
0x47cd67 CMP %RCX,%RDX |
0x47cd6a CMOVG %RDX,%RCX |
0x47cd6e MOV $-0x1,%RDX |
0x47cd75 SHR $0x20,%RCX |
0x47cd79 IMUL %RSI,%RCX |
0x47cd7d SAL $0x3,%RCX |
0x47cd81 MOV $0x8,%ESI |
0x47cd86 SUB %RCX,%RSI |
0x47cd89 TEST %RAX,%RAX |
0x47cd8c CMOVNS %RAX,%RDX |
0x47cd90 TEST %RDX,%RDX |
0x47cd93 CMOVG %R15,%RDX |
0x47cd97 SUB %RBX,%R12 |
0x47cd9a CMP %R12,%RAX |
0x47cd9d CMOVG %RAX,%R12 |
0x47cda1 SHR $0x20,%R12 |
0x47cda5 IMUL %RDX,%R12 |
0x47cda9 NEG %R12 |
0x47cdac MOV %R12,0xa0(%RSP) |
0x47cdb4 SUB %RCX,%R14 |
0x47cdb7 MOV %R14,0x90(%RSP) |
0x47cdbf SUB %RCX,%R9 |
0x47cdc2 MOV %R9,0x88(%RSP) |
0x47cdca MOV %R10,%RAX |
0x47cdcd SUB %RCX,%RAX |
0x47cdd0 MOV %RAX,0x80(%RSP) |
0x47cdd8 MOV %R11,%RAX |
0x47cddb NOT %RAX |
0x47cdde MOV %RAX,0x48(%RSP) |
0x47cde3 MOV %R11,0xd8(%RSP) |
0x47cdeb SUB %R11,%R15 |
0x47cdee MOV %R15,0xa8(%RSP) |
0x47cdf6 LEA (%R10,%RSI,1),%RAX |
0x47cdfa MOV %RAX,0x78(%RSP) |
0x47cdff LEA (%R8,%RSI,1),%RAX |
0x47ce03 MOV %RAX,0x70(%RSP) |
0x47ce08 MOV 0x38(%RSP),%RAX |
0x47ce0d ADD %RSI,%RAX |
0x47ce10 MOV %RAX,0x68(%RSP) |
0x47ce15 ADD 0x40(%RSP),%RSI |
0x47ce1a MOV %RSI,0x98(%RSP) |
0x47ce22 VBROADCASTSD 0x8e844(%RIP),%ZMM2 |
0x47ce2c VBROADCASTSD 0xc3cf2(%RIP),%ZMM3 |
0x47ce36 VBROADCASTSD 0x8e8c8(%RIP),%ZMM4 |
0x47ce40 VBROADCASTSD 0x8e7f6(%RIP),%ZMM5 |
0x47ce4a VBROADCASTSD 0x8e864(%RIP),%ZMM6 |
0x47ce54 MOV 0x50(%RBP),%RDX |
0x47ce58 MOV 0x48(%RBP),%R8 |
0x47ce5c MOV 0x40(%RBP),%EAX |
0x47ce5f MOV 0x50(%RSP),%RCX |
0x47ce64 LEA (%RCX,%RAX,1),%EBX |
0x47ce67 XOR %R9D,%R9D |
0x47ce6a MOV %EDI,0x14(%RSP) |
0x47ce6e JMP 47cea2 |
0x47ce70 NOPW %CS:(%RAX,%RAX,1) |
0x47ce7f NOP |
(918) 0x47ce80 MOV 0x50(%RBP),%RDX |
(918) 0x47ce84 MOV 0x48(%RBP),%R8 |
(918) 0x47ce88 NOPL (%RAX,%RAX,1) |
(918) 0x47ce90 LEA 0x1(%R9),%EAX |
(918) 0x47ce94 INC %EBX |
(918) 0x47ce96 CMP %EDI,%R9D |
(918) 0x47ce99 MOV %EAX,%R9D |
(918) 0x47ce9c JE 47cc9a |
(918) 0x47cea2 MOVSXD (%RDX),%R12 |
(918) 0x47cea5 MOV (%R8),%R11D |
(918) 0x47cea8 CMP %R12D,%R11D |
(918) 0x47ceab JS 47ce90 |
(918) 0x47cead MOV 0x40(%RBP),%EAX |
(918) 0x47ceb0 MOV 0x50(%RSP),%RCX |
(918) 0x47ceb5 ADD %ECX,%EAX |
(918) 0x47ceb7 LEA (%RAX,%R9,1),%ECX |
(918) 0x47cebb MOV 0x58(%RBP),%RDX |
(918) 0x47cebf MOV (%RDX),%RDX |
(918) 0x47cec2 MOV %RDX,0x20(%RSP) |
(918) 0x47cec7 MOV 0x60(%RBP),%RDX |
(918) 0x47cecb MOV (%RDX),%R14 |
(918) 0x47cece MOVSXD %ECX,%R13 |
(918) 0x47ced1 MOV %R13,%R15 |
(918) 0x47ced4 MOV 0xd8(%RSP),%RCX |
(918) 0x47cedc SUB %RCX,%R15 |
(918) 0x47cedf MOV 0x28(%RBP),%RSI |
(918) 0x47cee3 VMOVSD (%RSI,%R15,8),%XMM22 |
(918) 0x47ceea MOV 0x68(%RBP),%RDX |
(918) 0x47ceee MOV (%RDX),%R8 |
(918) 0x47cef1 LEA 0x1(%R9,%RAX,1),%EAX |
(918) 0x47cef6 CLTQ |
(918) 0x47cef8 SUB %RCX,%RAX |
(918) 0x47cefb VADDSD (%RSI,%RAX,8),%XMM22,%XMM1 |
(918) 0x47cf02 MOV 0x70(%RBP),%RAX |
(918) 0x47cf06 MOV (%RAX),%R10 |
(918) 0x47cf09 VMOVSD 0xc3c17(%RIP),%XMM0 |
(918) 0x47cf11 VDIVSD %XMM22,%XMM0,%XMM24 |
(918) 0x47cf17 VDIVSD %XMM1,%XMM0,%XMM23 |
(918) 0x47cf1d SUB %R12D,%R11D |
(918) 0x47cf20 INC %R11D |
(918) 0x47cf23 CMP $0x2,%R11D |
(918) 0x47cf27 MOV $0x1,%EAX |
(918) 0x47cf2c CMOVL %EAX,%R11D |
(918) 0x47cf30 MOV %R11,%RAX |
(918) 0x47cf33 AND $0x7ffffff8,%R11 |
(918) 0x47cf3a MOV %R12,0xf0(%RSP) |
(918) 0x47cf42 JE 47d340 |
(918) 0x47cf48 MOV %RAX,0xe0(%RSP) |
(918) 0x47cf50 MOV %R13,0xc0(%RSP) |
(918) 0x47cf58 MOV %R15,0xd0(%RSP) |
(918) 0x47cf60 MOV %R9,0xe8(%RSP) |
(918) 0x47cf68 MOV %EBX,0x2c(%RSP) |
(918) 0x47cf6c MOVSXD %EBX,%RDX |
(918) 0x47cf6f MOV 0xa0(%RSP),%RAX |
(918) 0x47cf77 LEA (%RAX,%RDX,1),%RCX |
(918) 0x47cf7b MOV 0x48(%RSP),%RAX |
(918) 0x47cf80 ADD %RDX,%RAX |
(918) 0x47cf83 ADD 0xa8(%RSP),%RDX |
(918) 0x47cf8b MOV %R8,%RDI |
(918) 0x47cf8e IMUL %RCX,%RDI |
(918) 0x47cf92 LEA (%RDI,%R12,8),%R9 |
(918) 0x47cf96 ADD 0x78(%RSP),%R9 |
(918) 0x47cf9b MOV %R10,0xc8(%RSP) |
(918) 0x47cfa3 MOV %R10,%RDI |
(918) 0x47cfa6 IMUL %RCX,%RDI |
(918) 0x47cfaa MOV %R8,%R10 |
(918) 0x47cfad LEA (%RDI,%R12,8),%R8 |
(918) 0x47cfb1 ADD 0x90(%RSP),%R8 |
(918) 0x47cfb9 MOV 0x88(%RSP),%RSI |
(918) 0x47cfc1 LEA (%RSI,%R12,8),%RSI |
(918) 0x47cfc5 MOV %RSI,0xf8(%RSP) |
(918) 0x47cfcd IMUL %R10,%RAX |
(918) 0x47cfd1 LEA (%RAX,%R12,8),%RAX |
(918) 0x47cfd5 MOV 0x80(%RSP),%RSI |
(918) 0x47cfdd ADD %RSI,%RAX |
(918) 0x47cfe0 MOV %R10,0xb8(%RSP) |
(918) 0x47cfe8 MOV %R10,%RDI |
(918) 0x47cfeb IMUL %RDX,%RDI |
(918) 0x47cfef LEA (%RDI,%R12,8),%RBX |
(918) 0x47cff3 ADD %RSI,%RBX |
(918) 0x47cff6 MOV 0x70(%RSP),%RSI |
(918) 0x47cffb LEA (%RSI,%R12,8),%R15 |
(918) 0x47cfff MOV %R14,%RDI |
(918) 0x47d002 IMUL %RCX,%RDI |
(918) 0x47d006 LEA (%RDI,%R12,8),%R13 |
(918) 0x47d00a MOV 0x68(%RSP),%RSI |
(918) 0x47d00f ADD %RSI,%R13 |
(918) 0x47d012 MOV %R14,0xb0(%RSP) |
(918) 0x47d01a IMUL %RDX,%R14 |
(918) 0x47d01e LEA (%R14,%R12,8),%R10 |
(918) 0x47d022 ADD %RSI,%R10 |
(918) 0x47d025 MOV 0x20(%RSP),%RDI |
(918) 0x47d02a IMUL %RDI,%RDX |
(918) 0x47d02e LEA (%RDX,%R12,8),%R14 |
(918) 0x47d032 MOV 0x98(%RSP),%RSI |
(918) 0x47d03a ADD %RSI,%R14 |
(918) 0x47d03d MOV %RDI,%RDX |
(918) 0x47d040 IMUL %RCX,%RDX |
(918) 0x47d044 LEA (%RDX,%R12,8),%RDX |
(918) 0x47d048 ADD %RSI,%RDX |
(918) 0x47d04b VBROADCASTSD %XMM22,%ZMM25 |
(918) 0x47d051 VBROADCASTSD %XMM24,%ZMM26 |
(918) 0x47d057 VBROADCASTSD %XMM23,%ZMM27 |
(918) 0x47d05d XOR %EDI,%EDI |
(918) 0x47d05f JMP 47d09a |
0x47d061 NOPW %CS:(%RAX,%RAX,1) |
0x47d070 NOPW %CS:(%RAX,%RAX,1) |
0x47d07f NOP |
(919) 0x47d080 VMOVAPD %ZMM1,%ZMM0{%K1}{z} |
(919) 0x47d086 VMOVUPD %ZMM0,(%R8,%RDI,8) |
(919) 0x47d08d ADD $0x8,%RDI |
(919) 0x47d091 CMP %R11,%RDI |
(919) 0x47d094 JAE 47d2c0 |
(919) 0x47d09a VMOVUPD -0x8(%RDX,%RDI,8),%ZMM1 |
(919) 0x47d0a5 VMOVUPD (%RDX,%RDI,8),%ZMM29 |
(919) 0x47d0ac VMOVUPD -0x8(%R14,%RDI,8),%ZMM30 |
(919) 0x47d0b7 VMOVUPD (%R14,%RDI,8),%ZMM31 |
(919) 0x47d0be VADDPD %ZMM29,%ZMM31,%ZMM28 |
(919) 0x47d0c4 VADDPD %ZMM30,%ZMM1,%ZMM21 |
(919) 0x47d0ca VSUBPD %ZMM21,%ZMM28,%ZMM21 |
(919) 0x47d0d0 VMOVUPD -0x8(%R10,%RDI,8),%ZMM0 |
(919) 0x47d0db VMOVUPD (%R10,%RDI,8),%ZMM16 |
(919) 0x47d0e2 VMOVUPD -0x8(%R13,%RDI,8),%ZMM17 |
(919) 0x47d0ed VMOVUPD (%R13,%RDI,8),%ZMM18 |
(919) 0x47d0f5 VADDPD %ZMM0,%ZMM16,%ZMM28 |
(919) 0x47d0fb VADDPD %ZMM18,%ZMM17,%ZMM19 |
(919) 0x47d101 VSUBPD %ZMM19,%ZMM28,%ZMM19 |
(919) 0x47d107 VMOVUPD -0x8(%R15,%RDI,8),%ZMM28 |
(919) 0x47d112 VMULPD %ZMM21,%ZMM28,%ZMM20 |
(919) 0x47d118 VFMADD231PD %ZMM19,%ZMM25,%ZMM20 |
(919) 0x47d11e VADDPD %ZMM1,%ZMM29,%ZMM1 |
(919) 0x47d124 VSUBPD %ZMM1,%ZMM31,%ZMM1 |
(919) 0x47d12a VADDPD %ZMM30,%ZMM1,%ZMM1 |
(919) 0x47d130 VMULPD %ZMM2,%ZMM1,%ZMM1 |
(919) 0x47d136 VADDPD %ZMM17,%ZMM0,%ZMM0 |
(919) 0x47d13c VSUBPD %ZMM0,%ZMM16,%ZMM0 |
(919) 0x47d142 VADDPD %ZMM18,%ZMM0,%ZMM0 |
(919) 0x47d148 VMULPD %ZMM2,%ZMM0,%ZMM0 |
(919) 0x47d14e VDIVPD %ZMM28,%ZMM3,%ZMM16 |
(919) 0x47d154 VMULPD %ZMM16,%ZMM0,%ZMM0 |
(919) 0x47d15a VMOVUPD (%R9,%RDI,8),%ZMM17 |
(919) 0x47d161 VSUBPD -0x10(%R9,%RDI,8),%ZMM17,%ZMM17 |
(919) 0x47d16c VADDPD (%R15,%RDI,8),%ZMM28,%ZMM18 |
(919) 0x47d173 VDIVPD %ZMM18,%ZMM17,%ZMM31 |
(919) 0x47d179 VMOVUPD (%RBX,%RDI,8),%ZMM17 |
(919) 0x47d180 VSUBPD (%RAX,%RDI,8),%ZMM17,%ZMM17 |
(919) 0x47d187 VFMADD231PD %ZMM1,%ZMM26,%ZMM0 |
(919) 0x47d18d VMULPD %ZMM27,%ZMM17,%ZMM30 |
(919) 0x47d193 VMULPD %ZMM31,%ZMM31,%ZMM1 |
(919) 0x47d199 VMULPD %ZMM30,%ZMM30,%ZMM17 |
(919) 0x47d19f VMULPD %ZMM2,%ZMM21,%ZMM18 |
(919) 0x47d1a5 VMULPD %ZMM16,%ZMM18,%ZMM16 |
(919) 0x47d1ab VMULPD %ZMM1,%ZMM16,%ZMM16 |
(919) 0x47d1b1 VMULPD %ZMM2,%ZMM19,%ZMM18 |
(919) 0x47d1b7 VMULPD %ZMM17,%ZMM18,%ZMM18 |
(919) 0x47d1bd VMULPD %ZMM0,%ZMM31,%ZMM0 |
(919) 0x47d1c3 VFMADD213PD %ZMM16,%ZMM30,%ZMM0 |
(919) 0x47d1c9 VFMADD231PD %ZMM18,%ZMM26,%ZMM0 |
(919) 0x47d1cf VADDPD %ZMM1,%ZMM17,%ZMM1 |
(919) 0x47d1d5 VMAXPD %ZMM4,%ZMM1,%ZMM1 |
(919) 0x47d1db VDIVPD %ZMM1,%ZMM0,%ZMM29 |
(919) 0x47d1e1 VXORPD %XMM1,%XMM1,%XMM1 |
(919) 0x47d1e5 VCMPPD $0x1,%ZMM29,%ZMM1,%K1 |
(919) 0x47d1ec VCMPPD $0x2,%ZMM20,%ZMM1,%K0 |
(919) 0x47d1f3 VCMPPD $0x6,%ZMM20,%ZMM1,%K1{%K1} |
(919) 0x47d1fa KORB %K1,%K0,%K0 |
(919) 0x47d1fe KNOTB %K0,%K1 |
(919) 0x47d202 KORTESTB %K1,%K1 |
(919) 0x47d206 JE 47d080 |
(919) 0x47d20c VFPCLASSPD $0x50,%ZMM31,%K2 |
(919) 0x47d213 VANDPD %ZMM5,%ZMM31,%ZMM0 |
(919) 0x47d219 VMAXPD %ZMM0,%ZMM4,%ZMM0 |
(919) 0x47d21f VXORPD %ZMM6,%ZMM0,%ZMM0{%K2} |
(919) 0x47d225 VFPCLASSPD $0x50,%ZMM0,%K2 |
(919) 0x47d22c VANDPD %ZMM5,%ZMM30,%ZMM1 |
(919) 0x47d232 VMAXPD %ZMM1,%ZMM4,%ZMM1 |
(919) 0x47d238 VXORPD %ZMM6,%ZMM1,%ZMM1{%K2} |
(919) 0x47d23e VMULPD %ZMM0,%ZMM0,%ZMM16 |
(919) 0x47d244 VFMADD231PD %ZMM1,%ZMM1,%ZMM16 |
(919) 0x47d24a VSQRTPD %ZMM16,%ZMM16 |
(919) 0x47d250 VMULPD %ZMM28,%ZMM16,%ZMM17 |
(919) 0x47d256 VDIVPD %ZMM0,%ZMM17,%ZMM0 |
(919) 0x47d25c VANDPD %ZMM5,%ZMM0,%ZMM0 |
(919) 0x47d262 VMULPD %ZMM25,%ZMM16,%ZMM16 |
(919) 0x47d268 VDIVPD %ZMM1,%ZMM16,%ZMM1 |
(919) 0x47d26e VANDPD %ZMM5,%ZMM1,%ZMM1 |
(919) 0x47d274 VCMPPD $0x2,%ZMM1,%ZMM0,%K2 |
(919) 0x47d27b VMOVAPD %ZMM0,%ZMM1{%K2} |
(919) 0x47d281 VMULPD %ZMM1,%ZMM1,%ZMM0 |
(919) 0x47d287 VMULPD %ZMM29,%ZMM29,%ZMM1 |
(919) 0x47d28d VADDPD %ZMM0,%ZMM0,%ZMM0 |
(919) 0x47d293 MOV 0x78(%RBP),%RSI |
(919) 0x47d297 MOV (%RSI),%RSI |
(919) 0x47d29a IMUL %RCX,%RSI |
(919) 0x47d29e ADD 0xf8(%RSP),%RSI |
(919) 0x47d2a6 VMOVUPD (%RSI,%RDI,8),%ZMM16{%K1}{z} |
(919) 0x47d2ad VMULPD %ZMM16,%ZMM1,%ZMM1 |
(919) 0x47d2b3 VMULPD %ZMM0,%ZMM1,%ZMM1 |
(919) 0x47d2b9 JMP 47d080 |
0x47d2be XCHG %AX,%AX |
(918) 0x47d2c0 MOV 0xe0(%RSP),%RAX |
(918) 0x47d2c8 CMP %RAX,%R11 |
(918) 0x47d2cb MOV 0x14(%RSP),%EDI |
(918) 0x47d2cf MOV 0x50(%RBP),%RDX |
(918) 0x47d2d3 MOV 0x48(%RBP),%R8 |
(918) 0x47d2d7 MOV 0x2c(%RSP),%EBX |
(918) 0x47d2db MOV 0xe8(%RSP),%R9 |
(918) 0x47d2e3 JE 47ce90 |
(918) 0x47d2e9 VPBROADCASTQ %RAX,%ZMM1 |
(918) 0x47d2ef MOV 0xd0(%RSP),%R15 |
(918) 0x47d2f7 MOV 0xc8(%RSP),%R10 |
(918) 0x47d2ff MOV 0xc0(%RSP),%R13 |
(918) 0x47d307 MOV 0xb8(%RSP),%R8 |
(918) 0x47d30f MOV 0xb0(%RSP),%R14 |
(918) 0x47d317 JMP 47d349 |
0x47d319 NOPW %CS:(%RAX,%RAX,1) |
0x47d328 NOPW %CS:(%RAX,%RAX,1) |
0x47d337 NOPW (%RAX,%RAX,1) |
(918) 0x47d340 VPBROADCASTQ %RAX,%ZMM1 |
(918) 0x47d346 XOR %R11D,%R11D |
(918) 0x47d349 MOV 0x20(%RSP),%RDX |
(918) 0x47d34e VPBROADCASTQ %R11,%ZMM25 |
(918) 0x47d354 VPSUBQ %ZMM25,%ZMM1,%ZMM1 |
(918) 0x47d35a VPCMPNLEUQ 0x8df9b(%RIP),%ZMM1,%K1 |
(918) 0x47d365 KORTESTB %K1,%K1 |
(918) 0x47d369 JE 47ce80 |
(918) 0x47d36f MOV %RDX,%RAX |
(918) 0x47d372 IMUL %R15,%RAX |
(918) 0x47d376 MOV 0x40(%RSP),%RCX |
(918) 0x47d37b ADD %RCX,%RAX |
(918) 0x47d37e ADD 0xf0(%RSP),%R11 |
(918) 0x47d386 MOV %R11,%RSI |
(918) 0x47d389 MOV %R8,%RDI |
(918) 0x47d38c MOV 0x60(%RSP),%R8 |
(918) 0x47d391 SUB %R8,%RSI |
(918) 0x47d394 VMOVUPD 0x8(%RAX,%RSI,8),%ZMM25{%K1}{z} |
(918) 0x47d39f VMOVUPD (%RAX,%RSI,8),%ZMM26{%K1}{z} |
(918) 0x47d3a6 LEA 0x1(%R15),%RAX |
(918) 0x47d3aa IMUL %RAX,%RDX |
(918) 0x47d3ae ADD %RCX,%RDX |
(918) 0x47d3b1 VMOVUPD 0x8(%RDX,%RSI,8),%ZMM27{%K1}{z} |
(918) 0x47d3bc VMOVUPD (%RDX,%RSI,8),%ZMM28{%K1}{z} |
(918) 0x47d3c3 MOV %R14,%RCX |
(918) 0x47d3c6 IMUL %RAX,%RCX |
(918) 0x47d3ca MOV 0x38(%RSP),%RDX |
(918) 0x47d3cf ADD %RDX,%RCX |
(918) 0x47d3d2 VMOVUPD (%RCX,%RSI,8),%ZMM29{%K1}{z} |
(918) 0x47d3d9 VMOVUPD 0x8(%RCX,%RSI,8),%ZMM30{%K1}{z} |
(918) 0x47d3e4 IMUL %R15,%R14 |
(918) 0x47d3e8 ADD %RDX,%R14 |
(918) 0x47d3eb VMOVUPD (%R14,%RSI,8),%ZMM31{%K1}{z} |
(918) 0x47d3f2 VMOVUPD 0x8(%R14,%RSI,8),%ZMM0{%K1}{z} |
(918) 0x47d3fd MOV %R8,%RCX |
(918) 0x47d400 NOT %RCX |
(918) 0x47d403 ADD %R11,%RCX |
(918) 0x47d406 MOV %RDI,%RDX |
(918) 0x47d409 IMUL %R15,%RDX |
(918) 0x47d40d MOV 0x18(%RBP),%R8 |
(918) 0x47d411 ADD %R8,%RDX |
(918) 0x47d414 VMOVUPD (%RDX,%RCX,8),%ZMM1{%K1}{z} |
(918) 0x47d41b VMOVUPD 0x8(%RDX,%RSI,8),%ZMM16{%K1}{z} |
(918) 0x47d426 IMUL %RDI,%RAX |
(918) 0x47d42a ADD %R8,%RAX |
(918) 0x47d42d VMOVUPD (%RAX,%RSI,8),%ZMM17{%K1}{z} |
(918) 0x47d434 ADD 0x48(%RSP),%R13 |
(918) 0x47d439 IMUL %RDI,%R13 |
(918) 0x47d43d ADD %R8,%R13 |
(918) 0x47d440 VMOVUPD (%R13,%RSI,8),%ZMM18{%K1}{z} |
(918) 0x47d448 VMOVAPD %ZMM25,%ZMM7{%K1} |
(918) 0x47d44e VMOVAPD %ZMM27,%ZMM8{%K1} |
(918) 0x47d454 VMOVAPD %ZMM26,%ZMM9{%K1} |
(918) 0x47d45a VMOVAPD %ZMM28,%ZMM10{%K1} |
(918) 0x47d460 VADDPD %ZMM7,%ZMM8,%ZMM19 |
(918) 0x47d466 VADDPD %ZMM10,%ZMM9,%ZMM20 |
(918) 0x47d46c VSUBPD %ZMM20,%ZMM19,%ZMM19 |
(918) 0x47d472 VMOVAPD %ZMM29,%ZMM11{%K1} |
(918) 0x47d478 VMOVAPD %ZMM30,%ZMM12{%K1} |
(918) 0x47d47e VMOVAPD %ZMM31,%ZMM13{%K1} |
(918) 0x47d484 VMOVAPD %ZMM0,%ZMM14{%K1} |
(918) 0x47d48a VADDPD %ZMM11,%ZMM12,%ZMM0 |
(918) 0x47d490 VADDPD %ZMM14,%ZMM13,%ZMM20 |
(918) 0x47d496 VSUBPD %ZMM20,%ZMM0,%ZMM0 |
(918) 0x47d49c MOV 0x30(%RBP),%RAX |
(918) 0x47d4a0 VMOVUPD (%RAX,%RSI,8),%ZMM20{%K1}{z} |
(918) 0x47d4a7 VMOVAPD %ZMM20,%ZMM15{%K1} |
(918) 0x47d4ad VADDPD %ZMM9,%ZMM7,%ZMM20 |
(918) 0x47d4b3 VSUBPD %ZMM20,%ZMM8,%ZMM20 |
(918) 0x47d4b9 VADDPD %ZMM10,%ZMM20,%ZMM20 |
(918) 0x47d4bf VMULPD %ZMM2,%ZMM20,%ZMM20 |
(918) 0x47d4c5 VBROADCASTSD %XMM24,%ZMM21 |
(918) 0x47d4cb VADDPD %ZMM13,%ZMM11,%ZMM24 |
(918) 0x47d4d1 VSUBPD %ZMM24,%ZMM12,%ZMM24 |
(918) 0x47d4d7 VADDPD %ZMM14,%ZMM24,%ZMM24 |
(918) 0x47d4dd VMULPD %ZMM2,%ZMM24,%ZMM24 |
(918) 0x47d4e3 VDIVPD %ZMM15,%ZMM3,%ZMM26 |
(918) 0x47d4e9 VMULPD %ZMM26,%ZMM24,%ZMM27 |
(918) 0x47d4ef VFMADD231PD %ZMM20,%ZMM21,%ZMM27 |
(918) 0x47d4f5 VMOVAPD 0x240(%RSP),%ZMM20 |
(918) 0x47d4fd VMOVAPD %ZMM16,%ZMM20{%K1} |
(918) 0x47d503 VMOVAPD 0x200(%RSP),%ZMM16 |
(918) 0x47d50b VMOVAPD %ZMM1,%ZMM16{%K1} |
(918) 0x47d511 VMOVUPD 0x8(%RAX,%RSI,8),%ZMM1{%K1}{z} |
(918) 0x47d51c VMOVAPD %ZMM20,0x240(%RSP) |
(918) 0x47d524 VMOVAPD %ZMM16,0x200(%RSP) |
(918) 0x47d52c VSUBPD %ZMM16,%ZMM20,%ZMM16 |
(918) 0x47d532 VMOVAPD 0x1c0(%RSP),%ZMM20 |
(918) 0x47d53a VMOVAPD %ZMM1,%ZMM20{%K1} |
(918) 0x47d540 VMOVAPD %ZMM20,0x1c0(%RSP) |
(918) 0x47d548 VADDPD %ZMM15,%ZMM20,%ZMM1 |
(918) 0x47d54e VDIVPD %ZMM1,%ZMM16,%ZMM24 |
(918) 0x47d554 VMULPD %ZMM19,%ZMM15,%ZMM16 |
(918) 0x47d55a VBROADCASTSD %XMM22,%ZMM22 |
(918) 0x47d560 VFMADD231PD %ZMM0,%ZMM22,%ZMM16 |
(918) 0x47d566 VMOVAPD 0x180(%RSP),%ZMM1 |
(918) 0x47d56e VMOVAPD %ZMM17,%ZMM1{%K1} |
(918) 0x47d574 VMOVAPD 0x140(%RSP),%ZMM17 |
(918) 0x47d57c VMOVAPD %ZMM18,%ZMM17{%K1} |
(918) 0x47d582 VMOVAPD %ZMM1,0x180(%RSP) |
(918) 0x47d58a VMOVAPD %ZMM17,0x140(%RSP) |
(918) 0x47d592 VSUBPD %ZMM17,%ZMM1,%ZMM1 |
(918) 0x47d598 VBROADCASTSD %XMM23,%ZMM17 |
(918) 0x47d59e VMULPD %ZMM17,%ZMM1,%ZMM25 |
(918) 0x47d5a4 VMULPD %ZMM24,%ZMM24,%ZMM1 |
(918) 0x47d5aa VMULPD %ZMM25,%ZMM25,%ZMM17 |
(918) 0x47d5b0 VMULPD %ZMM2,%ZMM19,%ZMM18 |
(918) 0x47d5b6 VMULPD %ZMM26,%ZMM18,%ZMM18 |
(918) 0x47d5bc VMULPD %ZMM1,%ZMM18,%ZMM18 |
(918) 0x47d5c2 VMULPD %ZMM2,%ZMM0,%ZMM0 |
(918) 0x47d5c8 VMULPD %ZMM17,%ZMM0,%ZMM0 |
(918) 0x47d5ce VMULPD %ZMM27,%ZMM24,%ZMM19 |
(918) 0x47d5d4 VFMADD213PD %ZMM18,%ZMM25,%ZMM19 |
(918) 0x47d5da VFMADD231PD %ZMM0,%ZMM21,%ZMM19 |
(918) 0x47d5e0 VADDPD %ZMM1,%ZMM17,%ZMM0 |
(918) 0x47d5e6 VMAXPD %ZMM4,%ZMM0,%ZMM0 |
(918) 0x47d5ec VDIVPD %ZMM0,%ZMM19,%ZMM23 |
(918) 0x47d5f2 VXORPD %XMM1,%XMM1,%XMM1 |
(918) 0x47d5f6 VCMPPD $0x1,%ZMM23,%ZMM1,%K2 |
(918) 0x47d5fd VCMPPD $0x2,%ZMM16,%ZMM1,%K0 |
(918) 0x47d604 VCMPPD $0x6,%ZMM16,%ZMM1,%K2{%K2} |
(918) 0x47d60b KORB %K2,%K0,%K0 |
(918) 0x47d60f KANDNB %K1,%K0,%K2 |
(918) 0x47d613 KORTESTB %K2,%K2 |
(918) 0x47d617 JE 47d6dc |
(918) 0x47d61d VFPCLASSPD $0x50,%ZMM24,%K3 |
(918) 0x47d624 VANDPD %ZMM5,%ZMM24,%ZMM0 |
(918) 0x47d62a VMAXPD %ZMM0,%ZMM4,%ZMM0 |
(918) 0x47d630 VXORPD %ZMM6,%ZMM0,%ZMM0{%K3} |
(918) 0x47d636 VFPCLASSPD $0x50,%ZMM0,%K3 |
(918) 0x47d63d VANDPD %ZMM5,%ZMM25,%ZMM1 |
(918) 0x47d643 VMAXPD %ZMM1,%ZMM4,%ZMM1 |
(918) 0x47d649 VXORPD %ZMM6,%ZMM1,%ZMM1{%K3} |
(918) 0x47d64f VMULPD %ZMM0,%ZMM0,%ZMM16 |
(918) 0x47d655 VFMADD231PD %ZMM1,%ZMM1,%ZMM16 |
(918) 0x47d65b VSQRTPD %ZMM16,%ZMM16 |
(918) 0x47d661 VMULPD %ZMM15,%ZMM16,%ZMM17 |
(918) 0x47d667 VDIVPD %ZMM0,%ZMM17,%ZMM0 |
(918) 0x47d66d VANDPD %ZMM5,%ZMM0,%ZMM0 |
(918) 0x47d673 VMULPD %ZMM22,%ZMM16,%ZMM16 |
(918) 0x47d679 VDIVPD %ZMM1,%ZMM16,%ZMM1 |
(918) 0x47d67f VANDPD %ZMM5,%ZMM1,%ZMM1 |
(918) 0x47d685 VCMPPD $0x2,%ZMM1,%ZMM0,%K3 |
(918) 0x47d68c VMOVAPD %ZMM0,%ZMM1{%K3} |
(918) 0x47d692 VMULPD %ZMM1,%ZMM1,%ZMM0 |
(918) 0x47d698 VMULPD %ZMM23,%ZMM23,%ZMM1 |
(918) 0x47d69e VADDPD %ZMM0,%ZMM0,%ZMM0 |
(918) 0x47d6a4 MOV 0x78(%RBP),%RAX |
(918) 0x47d6a8 MOV (%RAX),%RAX |
(918) 0x47d6ab IMUL %R15,%RAX |
(918) 0x47d6af ADD 0x20(%RBP),%RAX |
(918) 0x47d6b3 VMOVUPD (%RAX,%RSI,8),%ZMM16{%K2}{z} |
(918) 0x47d6ba VMOVAPD 0x100(%RSP),%ZMM17 |
(918) 0x47d6c2 VMOVAPD %ZMM16,%ZMM17{%K2} |
(918) 0x47d6c8 VMOVAPD %ZMM17,0x100(%RSP) |
(918) 0x47d6d0 VMULPD %ZMM17,%ZMM1,%ZMM1 |
(918) 0x47d6d6 VMULPD %ZMM0,%ZMM1,%ZMM1 |
(918) 0x47d6dc MOV 0x14(%RSP),%EDI |
(918) 0x47d6e0 MOV 0x50(%RBP),%RDX |
(918) 0x47d6e4 MOV 0x48(%RBP),%R8 |
(918) 0x47d6e8 VMOVAPD %ZMM1,%ZMM0{%K2}{z} |
(918) 0x47d6ee IMUL %R15,%R10 |
(918) 0x47d6f2 ADD 0x10(%RBP),%R10 |
(918) 0x47d6f6 VMOVUPD %ZMM0,(%R10,%RSI,8){%K1} |
(918) 0x47d6fd JMP 47ce90 |
0x47d702 NOPW %CS:(%RAX,%RAX,1) |
0x47d70c NOPL (%RAX) |
Path / |
Source file and lines | viscosity_kernel.f90:50-94 |
Module | exec |
nb instructions | 149 |
nb uops | 153 |
loop length | 726 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 5 |
nb stack references | 34 |
micro-operation queue | 25.50 cycles |
front end | 25.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 10.20 | 10.20 | 10.00 | 10.00 | 17.00 | 10.20 | 10.20 | 17.00 | 17.00 | 17.00 | 10.20 | 10.00 |
cycles | 10.20 | 10.20 | 10.00 | 10.00 | 17.00 | 10.20 | 10.20 | 17.00 | 17.00 | 17.00 | 10.20 | 10.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 24.95-24.98 |
Stall cycles | 0.00 |
Front-end | 25.50 |
Dispatch | 17.00 |
Overall L1 | 25.50 |
all | 2% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 4% |
all | 0% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 1% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 3% |
all | 11% |
load | 12% |
store | 10% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 12% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 11% |
load | 12% |
store | 10% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x40,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x2c0,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RBP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RBP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %ESI,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOVL $0,0x34(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JS 47ccb0 <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0xb0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RCX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVL $0,0x1c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %EAX,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVL $0x1,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0x38(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x3c(%RSP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x24(%RSP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x20(%RSP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x553310,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x22,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
CALL 404670 <__kmpc_for_static_init_4@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x20,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x1c(%RSP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RSP),%EDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %EAX,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 47cd00 <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0x100> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x553330,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x28(%RSP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 404230 <__kmpc_for_static_fini@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x58(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x553350,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 404740 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x30(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SAL $0x20,%R14 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV $-0x200000000,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
LEA (%R14,%RAX,1),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SAR $0x20,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RCX,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SAL $0x20,%RBX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
ADD %RBX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SAR $0x20,%R11 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV $-0x1,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVNS %RDX,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %RSI,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV $0x1,%R15D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %R15,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV $0x200000000,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
MOV %R12,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R14,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x10(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RCX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %RDX,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV $-0x1,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SHR $0x20,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
IMUL %RSI,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
SAL $0x3,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SUB %RCX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
CMOVNS %RAX,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
CMOVG %R15,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB %RBX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMP %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %RAX,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SHR $0x20,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
IMUL %RDX,%R12 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
NEG %R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R12,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %RCX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R14,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %RCX,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RCX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,0xd8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %R11,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R15,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R10,%RSI,1),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R8,%RSI,1),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x38(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RSI,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD 0x40(%RSP),%RSI | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV %RSI,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VBROADCASTSD 0x8e844(%RIP),%ZMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0xc3cf2(%RIP),%ZMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0x8e8c8(%RIP),%ZMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0x8e7f6(%RIP),%ZMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0x8e864(%RIP),%ZMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
MOV 0x50(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x40(%RBP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x50(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RCX,%RAX,1),%EBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %EDI,0x14(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 47cea2 <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0x2a2> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | viscosity_kernel.f90:50-94 |
Module | exec |
nb instructions | 149 |
nb uops | 153 |
loop length | 726 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 5 |
nb stack references | 34 |
micro-operation queue | 25.50 cycles |
front end | 25.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 10.20 | 10.20 | 10.00 | 10.00 | 17.00 | 10.20 | 10.20 | 17.00 | 17.00 | 17.00 | 10.20 | 10.00 |
cycles | 10.20 | 10.20 | 10.00 | 10.00 | 17.00 | 10.20 | 10.20 | 17.00 | 17.00 | 17.00 | 10.20 | 10.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 24.95-24.98 |
Stall cycles | 0.00 |
Front-end | 25.50 |
Dispatch | 17.00 |
Overall L1 | 25.50 |
all | 2% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 4% |
all | 0% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 1% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 3% |
all | 11% |
load | 12% |
store | 10% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 12% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 11% |
load | 12% |
store | 10% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x40,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x2c0,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RBP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RBP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %ESI,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOVL $0,0x34(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JS 47ccb0 <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0xb0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RCX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVL $0,0x1c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %EAX,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVL $0x1,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0x38(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x3c(%RSP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x24(%RSP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x20(%RSP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x553310,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x22,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
CALL 404670 <__kmpc_for_static_init_4@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x20,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x1c(%RSP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RSP),%EDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %EAX,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 47cd00 <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0x100> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x553330,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x28(%RSP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 404230 <__kmpc_for_static_fini@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x58(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x553350,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 404740 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x30(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SAL $0x20,%R14 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV $-0x200000000,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
LEA (%R14,%RAX,1),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SAR $0x20,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RCX,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SAL $0x20,%RBX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
ADD %RBX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SAR $0x20,%R11 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV $-0x1,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVNS %RDX,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %RSI,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV $0x1,%R15D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %R15,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV $0x200000000,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
MOV %R12,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R14,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x10(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RCX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %RDX,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV $-0x1,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SHR $0x20,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
IMUL %RSI,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
SAL $0x3,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SUB %RCX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
CMOVNS %RAX,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
CMOVG %R15,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB %RBX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMP %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %RAX,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SHR $0x20,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
IMUL %RDX,%R12 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
NEG %R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R12,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %RCX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R14,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %RCX,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RCX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,0xd8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %R11,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R15,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R10,%RSI,1),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R8,%RSI,1),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x38(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RSI,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD 0x40(%RSP),%RSI | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV %RSI,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VBROADCASTSD 0x8e844(%RIP),%ZMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0xc3cf2(%RIP),%ZMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0x8e8c8(%RIP),%ZMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0x8e7f6(%RIP),%ZMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0x8e864(%RIP),%ZMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
MOV 0x50(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x40(%RBP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x50(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RCX,%RAX,1),%EBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %EDI,0x14(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 47cea2 <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0x2a2> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼viscosity_kernel_.DIR.OMP.PARALLEL.2– | 2.26 | 0.71 |
▼Loop 918 - viscosity_kernel.f90:53-89 - exec– | 0 | 0 |
○Loop 919 - viscosity_kernel.f90:53-89 - exec | 2.25 | 0.71 |