Function: viscosity_kernel_.DIR.OMP.PARALLEL.2 | Module: exec | Source: viscosity_kernel.f90:50-94 | Coverage: 2.23% |
---|
Function: viscosity_kernel_.DIR.OMP.PARALLEL.2 | Module: exec | Source: viscosity_kernel.f90:50-94 | Coverage: 2.23% |
---|
/scratch_na/users/xoserete/qaas_runs/171-214-9740/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/viscosity_kernel.f90: 50 - 94 |
-------------------------------------------------------------------------------- |
50: !$OMP PARALLEL |
51: |
52: !$OMP DO PRIVATE(ugrad,vgrad,div,strain2,pgradx,pgrady,pgradx2,pgrady2,limiter,pgrad,xgrad,ygrad,grad,grad2,dirx,diry) |
53: DO k=y_min,y_max |
54: !$OMP SIMD |
55: DO j=x_min,x_max |
56: ugrad=(xvel0(j+1,k )+xvel0(j+1,k+1))-(xvel0(j ,k )+xvel0(j ,k+1)) |
57: |
58: vgrad=(yvel0(j ,k+1)+yvel0(j+1,k+1))-(yvel0(j ,k )+yvel0(j+1,k )) |
59: |
60: div = (celldx(j)*(ugrad)+ celldy(k)*(vgrad)) |
61: |
62: strain2 = 0.5_8*(xvel0(j, k+1) + xvel0(j+1,k+1)-xvel0(j ,k )-xvel0(j+1,k ))/celldy(k) & |
63: + 0.5_8*(yvel0(j+1,k ) + yvel0(j+1,k+1)-yvel0(j ,k )-yvel0(j ,k+1))/celldx(j) |
64: |
65: pgradx=(pressure(j+1,k)-pressure(j-1,k))/(celldx(j)+celldx(j+1)) |
66: pgrady=(pressure(j,k+1)-pressure(j,k-1))/(celldy(k)+celldy(k+1)) |
67: |
68: pgradx2 = pgradx*pgradx |
69: pgrady2 = pgrady*pgrady |
70: |
71: limiter = ((0.5_8*(ugrad)/celldx(j))*pgradx2+(0.5_8*(vgrad)/celldy(k))*pgrady2+strain2*pgradx*pgrady) & |
72: /MAX(pgradx2+pgrady2,1.0e-16_8) |
73: |
74: IF ((limiter.GT.0.0).OR.(div.GE.0.0))THEN |
75: viscosity(j,k) = 0.0 |
76: ELSE |
77: dirx=1.0_8 |
78: IF(pgradx.LT.0.0) dirx=-1.0_8 |
79: pgradx = dirx*MAX(1.0e-16_8,ABS(pgradx)) |
80: diry=1.0_8 |
81: IF(pgradx.LT.0.0) diry=-1.0_8 |
82: pgrady = diry*MAX(1.0e-16_8,ABS(pgrady)) |
83: pgrad = SQRT(pgradx**2+pgrady**2) |
84: xgrad = ABS(celldx(j)*pgrad/pgradx) |
85: ygrad = ABS(celldy(k)*pgrad/pgrady) |
86: grad = MIN(xgrad,ygrad) |
87: grad2 = grad*grad |
88: |
89: viscosity(j,k)=2.0_8*density0(j,k)*grad2*limiter*limiter |
90: ENDIF |
91: |
92: ENDDO |
93: ENDDO |
94: !$OMP END DO |
0x47ca80 PUSH %RBP |
0x47ca81 MOV %RSP,%RBP |
0x47ca84 PUSH %R15 |
0x47ca86 PUSH %R14 |
0x47ca88 PUSH %R13 |
0x47ca8a PUSH %R12 |
0x47ca8c PUSH %RBX |
0x47ca8d AND $-0x40,%RSP |
0x47ca91 SUB $0x2c0,%RSP |
0x47ca98 MOV %R9,0x40(%RSP) |
0x47ca9d MOV %R8,0x38(%RSP) |
0x47caa2 MOV 0x40(%RBP),%ESI |
0x47caa5 MOV 0x38(%RBP),%EAX |
0x47caa8 SUB %ESI,%EAX |
0x47caaa MOVL $0,0x34(%RSP) |
0x47cab2 JS 47cb30 |
0x47cab4 MOV %RCX,%R14 |
0x47cab7 MOV %RDX,%RBX |
0x47caba MOV %RDI,0x58(%RSP) |
0x47cabf MOV (%RDI),%ESI |
0x47cac1 MOVL $0,0x1c(%RSP) |
0x47cac9 MOV %EAX,0x18(%RSP) |
0x47cacd MOVL $0x1,0x30(%RSP) |
0x47cad5 SUB $0x8,%RSP |
0x47cad9 LEA 0x38(%RSP),%RAX |
0x47cade LEA 0x3c(%RSP),%RCX |
0x47cae3 LEA 0x24(%RSP),%R8 |
0x47cae8 LEA 0x20(%RSP),%R9 |
0x47caed MOV $0x753310,%EDI |
0x47caf2 MOV %ESI,0x30(%RSP) |
0x47caf6 MOV $0x22,%EDX |
0x47cafb PUSH $0x1 |
0x47cafd PUSH $0x1 |
0x47caff PUSH %RAX |
0x47cb00 CALL 4044c0 <__kmpc_for_static_init_4@plt> |
0x47cb05 ADD $0x20,%RSP |
0x47cb09 MOV 0x1c(%RSP),%EAX |
0x47cb0d MOV 0x18(%RSP),%EDI |
0x47cb11 MOV %RAX,0x50(%RSP) |
0x47cb16 SUB %EAX,%EDI |
0x47cb18 JAE 47cb80 |
0x47cb1a MOV $0x753330,%EDI |
0x47cb1f MOV 0x28(%RSP),%ESI |
0x47cb23 VZEROUPPER |
0x47cb26 CALL 4040b0 <__kmpc_for_static_fini@plt> |
0x47cb2b MOV 0x58(%RSP),%RDI |
0x47cb30 MOV (%RDI),%ESI |
0x47cb32 MOV $0x753350,%EDI |
0x47cb37 CALL 404580 <__kmpc_barrier@plt> |
0x47cb3c LEA -0x28(%RBP),%RSP |
0x47cb40 POP %RBX |
0x47cb41 POP %R12 |
0x47cb43 POP %R13 |
0x47cb45 POP %R14 |
0x47cb47 POP %R15 |
0x47cb49 POP %RBP |
0x47cb4a RET |
0x47cb4b NOPW %CS:(%RAX,%RAX,1) |
0x47cb5a NOPW %CS:(%RAX,%RAX,1) |
0x47cb69 NOPW %CS:(%RAX,%RAX,1) |
0x47cb78 NOPL (%RAX,%RAX,1) |
0x47cb80 MOV 0x30(%RBP),%R8 |
0x47cb84 MOV 0x20(%RBP),%R9 |
0x47cb88 MOV 0x18(%RBP),%R10 |
0x47cb8c SAL $0x20,%R14 |
0x47cb90 MOV $-0x200000000,%RAX |
0x47cb9a LEA (%R14,%RAX,1),%RDX |
0x47cb9e MOV %RDX,%RCX |
0x47cba1 SAR $0x20,%RCX |
0x47cba5 MOV %RCX,0x60(%RSP) |
0x47cbaa SAL $0x20,%RBX |
0x47cbae ADD %RBX,%RAX |
0x47cbb1 MOV %RAX,%R11 |
0x47cbb4 SAR $0x20,%R11 |
0x47cbb8 TEST %RDX,%RDX |
0x47cbbb MOV $-0x1,%RSI |
0x47cbc2 CMOVNS %RDX,%RSI |
0x47cbc6 TEST %RSI,%RSI |
0x47cbc9 MOV $0x1,%R15D |
0x47cbcf CMOVG %R15,%RSI |
0x47cbd3 MOV $0x200000000,%R12 |
0x47cbdd MOV %R12,%RCX |
0x47cbe0 SUB %R14,%RCX |
0x47cbe3 MOV 0x10(%RBP),%R14 |
0x47cbe7 CMP %RCX,%RDX |
0x47cbea CMOVG %RDX,%RCX |
0x47cbee MOV $-0x1,%RDX |
0x47cbf5 SHR $0x20,%RCX |
0x47cbf9 IMUL %RSI,%RCX |
0x47cbfd SAL $0x3,%RCX |
0x47cc01 MOV $0x8,%ESI |
0x47cc06 SUB %RCX,%RSI |
0x47cc09 TEST %RAX,%RAX |
0x47cc0c CMOVNS %RAX,%RDX |
0x47cc10 TEST %RDX,%RDX |
0x47cc13 CMOVG %R15,%RDX |
0x47cc17 SUB %RBX,%R12 |
0x47cc1a CMP %R12,%RAX |
0x47cc1d CMOVG %RAX,%R12 |
0x47cc21 SHR $0x20,%R12 |
0x47cc25 IMUL %RDX,%R12 |
0x47cc29 NEG %R12 |
0x47cc2c MOV %R12,0xa0(%RSP) |
0x47cc34 SUB %RCX,%R14 |
0x47cc37 MOV %R14,0x90(%RSP) |
0x47cc3f SUB %RCX,%R9 |
0x47cc42 MOV %R9,0x88(%RSP) |
0x47cc4a MOV %R10,%RAX |
0x47cc4d SUB %RCX,%RAX |
0x47cc50 MOV %RAX,0x80(%RSP) |
0x47cc58 MOV %R11,%RAX |
0x47cc5b NOT %RAX |
0x47cc5e MOV %RAX,0x48(%RSP) |
0x47cc63 MOV %R11,0xd8(%RSP) |
0x47cc6b SUB %R11,%R15 |
0x47cc6e MOV %R15,0xa8(%RSP) |
0x47cc76 LEA (%R10,%RSI,1),%RAX |
0x47cc7a MOV %RAX,0x78(%RSP) |
0x47cc7f LEA (%R8,%RSI,1),%RAX |
0x47cc83 MOV %RAX,0x70(%RSP) |
0x47cc88 MOV 0x38(%RSP),%RAX |
0x47cc8d ADD %RSI,%RAX |
0x47cc90 MOV %RAX,0x68(%RSP) |
0x47cc95 ADD 0x40(%RSP),%RSI |
0x47cc9a MOV %RSI,0x98(%RSP) |
0x47cca2 VBROADCASTSD 0x8e004(%RIP),%ZMM2 |
0x47ccac VBROADCASTSD 0xc49f2(%RIP),%ZMM3 |
0x47ccb6 VBROADCASTSD 0x8e088(%RIP),%ZMM4 |
0x47ccc0 VBROADCASTSD 0x8dfb6(%RIP),%ZMM5 |
0x47ccca VBROADCASTSD 0x8e024(%RIP),%ZMM6 |
0x47ccd4 MOV 0x50(%RBP),%RDX |
0x47ccd8 MOV 0x48(%RBP),%R8 |
0x47ccdc MOV 0x40(%RBP),%EAX |
0x47ccdf MOV 0x50(%RSP),%RCX |
0x47cce4 LEA (%RCX,%RAX,1),%EBX |
0x47cce7 XOR %R9D,%R9D |
0x47ccea MOV %EDI,0x14(%RSP) |
0x47ccee JMP 47cd22 |
0x47ccf0 NOPW %CS:(%RAX,%RAX,1) |
0x47ccff NOP |
(918) 0x47cd00 MOV 0x50(%RBP),%RDX |
(918) 0x47cd04 MOV 0x48(%RBP),%R8 |
(918) 0x47cd08 NOPL (%RAX,%RAX,1) |
(918) 0x47cd10 LEA 0x1(%R9),%EAX |
(918) 0x47cd14 INC %EBX |
(918) 0x47cd16 CMP %EDI,%R9D |
(918) 0x47cd19 MOV %EAX,%R9D |
(918) 0x47cd1c JE 47cb1a |
(918) 0x47cd22 MOVSXD (%RDX),%R12 |
(918) 0x47cd25 MOV (%R8),%R11D |
(918) 0x47cd28 CMP %R12D,%R11D |
(918) 0x47cd2b JS 47cd10 |
(918) 0x47cd2d MOV 0x40(%RBP),%EAX |
(918) 0x47cd30 MOV 0x50(%RSP),%RCX |
(918) 0x47cd35 ADD %ECX,%EAX |
(918) 0x47cd37 LEA (%RAX,%R9,1),%ECX |
(918) 0x47cd3b MOV 0x58(%RBP),%RDX |
(918) 0x47cd3f MOV (%RDX),%RDX |
(918) 0x47cd42 MOV %RDX,0x20(%RSP) |
(918) 0x47cd47 MOV 0x60(%RBP),%RDX |
(918) 0x47cd4b MOV (%RDX),%R14 |
(918) 0x47cd4e MOVSXD %ECX,%R13 |
(918) 0x47cd51 MOV %R13,%R15 |
(918) 0x47cd54 MOV 0xd8(%RSP),%RCX |
(918) 0x47cd5c SUB %RCX,%R15 |
(918) 0x47cd5f MOV 0x28(%RBP),%RSI |
(918) 0x47cd63 VMOVSD (%RSI,%R15,8),%XMM22 |
(918) 0x47cd6a MOV 0x68(%RBP),%RDX |
(918) 0x47cd6e MOV (%RDX),%R8 |
(918) 0x47cd71 LEA 0x1(%R9,%RAX,1),%EAX |
(918) 0x47cd76 CLTQ |
(918) 0x47cd78 SUB %RCX,%RAX |
(918) 0x47cd7b VADDSD (%RSI,%RAX,8),%XMM22,%XMM1 |
(918) 0x47cd82 MOV 0x70(%RBP),%RAX |
(918) 0x47cd86 MOV (%RAX),%R10 |
(918) 0x47cd89 VMOVSD 0xc4917(%RIP),%XMM0 |
(918) 0x47cd91 VDIVSD %XMM22,%XMM0,%XMM24 |
(918) 0x47cd97 VDIVSD %XMM1,%XMM0,%XMM23 |
(918) 0x47cd9d SUB %R12D,%R11D |
(918) 0x47cda0 INC %R11D |
(918) 0x47cda3 CMP $0x2,%R11D |
(918) 0x47cda7 MOV $0x1,%EAX |
(918) 0x47cdac CMOVL %EAX,%R11D |
(918) 0x47cdb0 MOV %R11,%RAX |
(918) 0x47cdb3 AND $0x7ffffff8,%R11 |
(918) 0x47cdba MOV %R12,0xf0(%RSP) |
(918) 0x47cdc2 JE 47d1c0 |
(918) 0x47cdc8 MOV %RAX,0xe0(%RSP) |
(918) 0x47cdd0 MOV %R13,0xc0(%RSP) |
(918) 0x47cdd8 MOV %R15,0xd0(%RSP) |
(918) 0x47cde0 MOV %R9,0xe8(%RSP) |
(918) 0x47cde8 MOV %EBX,0x2c(%RSP) |
(918) 0x47cdec MOVSXD %EBX,%RDX |
(918) 0x47cdef MOV 0xa0(%RSP),%RAX |
(918) 0x47cdf7 LEA (%RAX,%RDX,1),%RCX |
(918) 0x47cdfb MOV 0x48(%RSP),%RAX |
(918) 0x47ce00 ADD %RDX,%RAX |
(918) 0x47ce03 ADD 0xa8(%RSP),%RDX |
(918) 0x47ce0b MOV %R8,%RDI |
(918) 0x47ce0e IMUL %RCX,%RDI |
(918) 0x47ce12 LEA (%RDI,%R12,8),%R9 |
(918) 0x47ce16 ADD 0x78(%RSP),%R9 |
(918) 0x47ce1b MOV %R10,0xc8(%RSP) |
(918) 0x47ce23 MOV %R10,%RDI |
(918) 0x47ce26 IMUL %RCX,%RDI |
(918) 0x47ce2a MOV %R8,%R10 |
(918) 0x47ce2d LEA (%RDI,%R12,8),%R8 |
(918) 0x47ce31 ADD 0x90(%RSP),%R8 |
(918) 0x47ce39 MOV 0x88(%RSP),%RSI |
(918) 0x47ce41 LEA (%RSI,%R12,8),%RSI |
(918) 0x47ce45 MOV %RSI,0xf8(%RSP) |
(918) 0x47ce4d IMUL %R10,%RAX |
(918) 0x47ce51 LEA (%RAX,%R12,8),%RAX |
(918) 0x47ce55 MOV 0x80(%RSP),%RSI |
(918) 0x47ce5d ADD %RSI,%RAX |
(918) 0x47ce60 MOV %R10,0xb8(%RSP) |
(918) 0x47ce68 MOV %R10,%RDI |
(918) 0x47ce6b IMUL %RDX,%RDI |
(918) 0x47ce6f LEA (%RDI,%R12,8),%RBX |
(918) 0x47ce73 ADD %RSI,%RBX |
(918) 0x47ce76 MOV 0x70(%RSP),%RSI |
(918) 0x47ce7b LEA (%RSI,%R12,8),%R15 |
(918) 0x47ce7f MOV %R14,%RDI |
(918) 0x47ce82 IMUL %RCX,%RDI |
(918) 0x47ce86 LEA (%RDI,%R12,8),%R13 |
(918) 0x47ce8a MOV 0x68(%RSP),%RSI |
(918) 0x47ce8f ADD %RSI,%R13 |
(918) 0x47ce92 MOV %R14,0xb0(%RSP) |
(918) 0x47ce9a IMUL %RDX,%R14 |
(918) 0x47ce9e LEA (%R14,%R12,8),%R10 |
(918) 0x47cea2 ADD %RSI,%R10 |
(918) 0x47cea5 MOV 0x20(%RSP),%RDI |
(918) 0x47ceaa IMUL %RDI,%RDX |
(918) 0x47ceae LEA (%RDX,%R12,8),%R14 |
(918) 0x47ceb2 MOV 0x98(%RSP),%RSI |
(918) 0x47ceba ADD %RSI,%R14 |
(918) 0x47cebd MOV %RDI,%RDX |
(918) 0x47cec0 IMUL %RCX,%RDX |
(918) 0x47cec4 LEA (%RDX,%R12,8),%RDX |
(918) 0x47cec8 ADD %RSI,%RDX |
(918) 0x47cecb VBROADCASTSD %XMM22,%ZMM25 |
(918) 0x47ced1 VBROADCASTSD %XMM24,%ZMM26 |
(918) 0x47ced7 VBROADCASTSD %XMM23,%ZMM27 |
(918) 0x47cedd XOR %EDI,%EDI |
(918) 0x47cedf JMP 47cf1a |
0x47cee1 NOPW %CS:(%RAX,%RAX,1) |
0x47cef0 NOPW %CS:(%RAX,%RAX,1) |
0x47ceff NOP |
(919) 0x47cf00 VMOVAPD %ZMM1,%ZMM0{%K1}{z} |
(919) 0x47cf06 VMOVUPD %ZMM0,(%R8,%RDI,8) |
(919) 0x47cf0d ADD $0x8,%RDI |
(919) 0x47cf11 CMP %R11,%RDI |
(919) 0x47cf14 JAE 47d140 |
(919) 0x47cf1a VMOVUPD -0x8(%RDX,%RDI,8),%ZMM1 |
(919) 0x47cf25 VMOVUPD (%RDX,%RDI,8),%ZMM29 |
(919) 0x47cf2c VMOVUPD -0x8(%R14,%RDI,8),%ZMM30 |
(919) 0x47cf37 VMOVUPD (%R14,%RDI,8),%ZMM31 |
(919) 0x47cf3e VADDPD %ZMM29,%ZMM31,%ZMM28 |
(919) 0x47cf44 VADDPD %ZMM30,%ZMM1,%ZMM21 |
(919) 0x47cf4a VSUBPD %ZMM21,%ZMM28,%ZMM21 |
(919) 0x47cf50 VMOVUPD -0x8(%R10,%RDI,8),%ZMM0 |
(919) 0x47cf5b VMOVUPD (%R10,%RDI,8),%ZMM16 |
(919) 0x47cf62 VMOVUPD -0x8(%R13,%RDI,8),%ZMM17 |
(919) 0x47cf6d VMOVUPD (%R13,%RDI,8),%ZMM18 |
(919) 0x47cf75 VADDPD %ZMM0,%ZMM16,%ZMM28 |
(919) 0x47cf7b VADDPD %ZMM18,%ZMM17,%ZMM19 |
(919) 0x47cf81 VSUBPD %ZMM19,%ZMM28,%ZMM19 |
(919) 0x47cf87 VMOVUPD -0x8(%R15,%RDI,8),%ZMM28 |
(919) 0x47cf92 VMULPD %ZMM21,%ZMM28,%ZMM20 |
(919) 0x47cf98 VFMADD231PD %ZMM19,%ZMM25,%ZMM20 |
(919) 0x47cf9e VADDPD %ZMM1,%ZMM29,%ZMM1 |
(919) 0x47cfa4 VSUBPD %ZMM1,%ZMM31,%ZMM1 |
(919) 0x47cfaa VADDPD %ZMM30,%ZMM1,%ZMM1 |
(919) 0x47cfb0 VMULPD %ZMM2,%ZMM1,%ZMM1 |
(919) 0x47cfb6 VADDPD %ZMM17,%ZMM0,%ZMM0 |
(919) 0x47cfbc VSUBPD %ZMM0,%ZMM16,%ZMM0 |
(919) 0x47cfc2 VADDPD %ZMM18,%ZMM0,%ZMM0 |
(919) 0x47cfc8 VMULPD %ZMM2,%ZMM0,%ZMM0 |
(919) 0x47cfce VDIVPD %ZMM28,%ZMM3,%ZMM16 |
(919) 0x47cfd4 VMULPD %ZMM16,%ZMM0,%ZMM0 |
(919) 0x47cfda VMOVUPD (%R9,%RDI,8),%ZMM17 |
(919) 0x47cfe1 VSUBPD -0x10(%R9,%RDI,8),%ZMM17,%ZMM17 |
(919) 0x47cfec VADDPD (%R15,%RDI,8),%ZMM28,%ZMM18 |
(919) 0x47cff3 VDIVPD %ZMM18,%ZMM17,%ZMM31 |
(919) 0x47cff9 VMOVUPD (%RBX,%RDI,8),%ZMM17 |
(919) 0x47d000 VSUBPD (%RAX,%RDI,8),%ZMM17,%ZMM17 |
(919) 0x47d007 VFMADD231PD %ZMM1,%ZMM26,%ZMM0 |
(919) 0x47d00d VMULPD %ZMM27,%ZMM17,%ZMM30 |
(919) 0x47d013 VMULPD %ZMM31,%ZMM31,%ZMM1 |
(919) 0x47d019 VMULPD %ZMM30,%ZMM30,%ZMM17 |
(919) 0x47d01f VMULPD %ZMM2,%ZMM21,%ZMM18 |
(919) 0x47d025 VMULPD %ZMM16,%ZMM18,%ZMM16 |
(919) 0x47d02b VMULPD %ZMM1,%ZMM16,%ZMM16 |
(919) 0x47d031 VMULPD %ZMM2,%ZMM19,%ZMM18 |
(919) 0x47d037 VMULPD %ZMM17,%ZMM18,%ZMM18 |
(919) 0x47d03d VMULPD %ZMM0,%ZMM31,%ZMM0 |
(919) 0x47d043 VFMADD213PD %ZMM16,%ZMM30,%ZMM0 |
(919) 0x47d049 VFMADD231PD %ZMM18,%ZMM26,%ZMM0 |
(919) 0x47d04f VADDPD %ZMM1,%ZMM17,%ZMM1 |
(919) 0x47d055 VMAXPD %ZMM4,%ZMM1,%ZMM1 |
(919) 0x47d05b VDIVPD %ZMM1,%ZMM0,%ZMM29 |
(919) 0x47d061 VXORPD %XMM1,%XMM1,%XMM1 |
(919) 0x47d065 VCMPPD $0x1,%ZMM29,%ZMM1,%K1 |
(919) 0x47d06c VCMPPD $0x2,%ZMM20,%ZMM1,%K0 |
(919) 0x47d073 VCMPPD $0x6,%ZMM20,%ZMM1,%K1{%K1} |
(919) 0x47d07a KORB %K1,%K0,%K0 |
(919) 0x47d07e KNOTB %K0,%K1 |
(919) 0x47d082 KORTESTB %K1,%K1 |
(919) 0x47d086 JE 47cf00 |
(919) 0x47d08c VFPCLASSPD $0x50,%ZMM31,%K2 |
(919) 0x47d093 VANDPD %ZMM5,%ZMM31,%ZMM0 |
(919) 0x47d099 VMAXPD %ZMM0,%ZMM4,%ZMM0 |
(919) 0x47d09f VXORPD %ZMM6,%ZMM0,%ZMM0{%K2} |
(919) 0x47d0a5 VFPCLASSPD $0x50,%ZMM0,%K2 |
(919) 0x47d0ac VANDPD %ZMM5,%ZMM30,%ZMM1 |
(919) 0x47d0b2 VMAXPD %ZMM1,%ZMM4,%ZMM1 |
(919) 0x47d0b8 VXORPD %ZMM6,%ZMM1,%ZMM1{%K2} |
(919) 0x47d0be VMULPD %ZMM0,%ZMM0,%ZMM16 |
(919) 0x47d0c4 VFMADD231PD %ZMM1,%ZMM1,%ZMM16 |
(919) 0x47d0ca VSQRTPD %ZMM16,%ZMM16 |
(919) 0x47d0d0 VMULPD %ZMM28,%ZMM16,%ZMM17 |
(919) 0x47d0d6 VDIVPD %ZMM0,%ZMM17,%ZMM0 |
(919) 0x47d0dc VANDPD %ZMM5,%ZMM0,%ZMM0 |
(919) 0x47d0e2 VMULPD %ZMM25,%ZMM16,%ZMM16 |
(919) 0x47d0e8 VDIVPD %ZMM1,%ZMM16,%ZMM1 |
(919) 0x47d0ee VANDPD %ZMM5,%ZMM1,%ZMM1 |
(919) 0x47d0f4 VCMPPD $0x2,%ZMM1,%ZMM0,%K2 |
(919) 0x47d0fb VMOVAPD %ZMM0,%ZMM1{%K2} |
(919) 0x47d101 VMULPD %ZMM1,%ZMM1,%ZMM0 |
(919) 0x47d107 VMULPD %ZMM29,%ZMM29,%ZMM1 |
(919) 0x47d10d VADDPD %ZMM0,%ZMM0,%ZMM0 |
(919) 0x47d113 MOV 0x78(%RBP),%RSI |
(919) 0x47d117 MOV (%RSI),%RSI |
(919) 0x47d11a IMUL %RCX,%RSI |
(919) 0x47d11e ADD 0xf8(%RSP),%RSI |
(919) 0x47d126 VMOVUPD (%RSI,%RDI,8),%ZMM16{%K1}{z} |
(919) 0x47d12d VMULPD %ZMM16,%ZMM1,%ZMM1 |
(919) 0x47d133 VMULPD %ZMM0,%ZMM1,%ZMM1 |
(919) 0x47d139 JMP 47cf00 |
0x47d13e XCHG %AX,%AX |
(918) 0x47d140 MOV 0xe0(%RSP),%RAX |
(918) 0x47d148 CMP %RAX,%R11 |
(918) 0x47d14b MOV 0x14(%RSP),%EDI |
(918) 0x47d14f MOV 0x50(%RBP),%RDX |
(918) 0x47d153 MOV 0x48(%RBP),%R8 |
(918) 0x47d157 MOV 0x2c(%RSP),%EBX |
(918) 0x47d15b MOV 0xe8(%RSP),%R9 |
(918) 0x47d163 JE 47cd10 |
(918) 0x47d169 VPBROADCASTQ %RAX,%ZMM1 |
(918) 0x47d16f MOV 0xd0(%RSP),%R15 |
(918) 0x47d177 MOV 0xc8(%RSP),%R10 |
(918) 0x47d17f MOV 0xc0(%RSP),%R13 |
(918) 0x47d187 MOV 0xb8(%RSP),%R8 |
(918) 0x47d18f MOV 0xb0(%RSP),%R14 |
(918) 0x47d197 JMP 47d1c9 |
0x47d199 NOPW %CS:(%RAX,%RAX,1) |
0x47d1a8 NOPW %CS:(%RAX,%RAX,1) |
0x47d1b7 NOPW (%RAX,%RAX,1) |
(918) 0x47d1c0 VPBROADCASTQ %RAX,%ZMM1 |
(918) 0x47d1c6 XOR %R11D,%R11D |
(918) 0x47d1c9 MOV 0x20(%RSP),%RDX |
(918) 0x47d1ce VPBROADCASTQ %R11,%ZMM25 |
(918) 0x47d1d4 VPSUBQ %ZMM25,%ZMM1,%ZMM1 |
(918) 0x47d1da VPCMPNLEUQ 0x8d75b(%RIP),%ZMM1,%K1 |
(918) 0x47d1e5 KORTESTB %K1,%K1 |
(918) 0x47d1e9 JE 47cd00 |
(918) 0x47d1ef MOV %RDX,%RAX |
(918) 0x47d1f2 IMUL %R15,%RAX |
(918) 0x47d1f6 MOV 0x40(%RSP),%RCX |
(918) 0x47d1fb ADD %RCX,%RAX |
(918) 0x47d1fe ADD 0xf0(%RSP),%R11 |
(918) 0x47d206 MOV %R11,%RSI |
(918) 0x47d209 MOV %R8,%RDI |
(918) 0x47d20c MOV 0x60(%RSP),%R8 |
(918) 0x47d211 SUB %R8,%RSI |
(918) 0x47d214 VMOVUPD 0x8(%RAX,%RSI,8),%ZMM25{%K1}{z} |
(918) 0x47d21f VMOVUPD (%RAX,%RSI,8),%ZMM26{%K1}{z} |
(918) 0x47d226 LEA 0x1(%R15),%RAX |
(918) 0x47d22a IMUL %RAX,%RDX |
(918) 0x47d22e ADD %RCX,%RDX |
(918) 0x47d231 VMOVUPD 0x8(%RDX,%RSI,8),%ZMM27{%K1}{z} |
(918) 0x47d23c VMOVUPD (%RDX,%RSI,8),%ZMM28{%K1}{z} |
(918) 0x47d243 MOV %R14,%RCX |
(918) 0x47d246 IMUL %RAX,%RCX |
(918) 0x47d24a MOV 0x38(%RSP),%RDX |
(918) 0x47d24f ADD %RDX,%RCX |
(918) 0x47d252 VMOVUPD (%RCX,%RSI,8),%ZMM29{%K1}{z} |
(918) 0x47d259 VMOVUPD 0x8(%RCX,%RSI,8),%ZMM30{%K1}{z} |
(918) 0x47d264 IMUL %R15,%R14 |
(918) 0x47d268 ADD %RDX,%R14 |
(918) 0x47d26b VMOVUPD (%R14,%RSI,8),%ZMM31{%K1}{z} |
(918) 0x47d272 VMOVUPD 0x8(%R14,%RSI,8),%ZMM0{%K1}{z} |
(918) 0x47d27d MOV %R8,%RCX |
(918) 0x47d280 NOT %RCX |
(918) 0x47d283 ADD %R11,%RCX |
(918) 0x47d286 MOV %RDI,%RDX |
(918) 0x47d289 IMUL %R15,%RDX |
(918) 0x47d28d MOV 0x18(%RBP),%R8 |
(918) 0x47d291 ADD %R8,%RDX |
(918) 0x47d294 VMOVUPD (%RDX,%RCX,8),%ZMM1{%K1}{z} |
(918) 0x47d29b VMOVUPD 0x8(%RDX,%RSI,8),%ZMM16{%K1}{z} |
(918) 0x47d2a6 IMUL %RDI,%RAX |
(918) 0x47d2aa ADD %R8,%RAX |
(918) 0x47d2ad VMOVUPD (%RAX,%RSI,8),%ZMM17{%K1}{z} |
(918) 0x47d2b4 ADD 0x48(%RSP),%R13 |
(918) 0x47d2b9 IMUL %RDI,%R13 |
(918) 0x47d2bd ADD %R8,%R13 |
(918) 0x47d2c0 VMOVUPD (%R13,%RSI,8),%ZMM18{%K1}{z} |
(918) 0x47d2c8 VMOVAPD %ZMM25,%ZMM7{%K1} |
(918) 0x47d2ce VMOVAPD %ZMM27,%ZMM8{%K1} |
(918) 0x47d2d4 VMOVAPD %ZMM26,%ZMM9{%K1} |
(918) 0x47d2da VMOVAPD %ZMM28,%ZMM10{%K1} |
(918) 0x47d2e0 VADDPD %ZMM7,%ZMM8,%ZMM19 |
(918) 0x47d2e6 VADDPD %ZMM10,%ZMM9,%ZMM20 |
(918) 0x47d2ec VSUBPD %ZMM20,%ZMM19,%ZMM19 |
(918) 0x47d2f2 VMOVAPD %ZMM29,%ZMM11{%K1} |
(918) 0x47d2f8 VMOVAPD %ZMM30,%ZMM12{%K1} |
(918) 0x47d2fe VMOVAPD %ZMM31,%ZMM13{%K1} |
(918) 0x47d304 VMOVAPD %ZMM0,%ZMM14{%K1} |
(918) 0x47d30a VADDPD %ZMM11,%ZMM12,%ZMM0 |
(918) 0x47d310 VADDPD %ZMM14,%ZMM13,%ZMM20 |
(918) 0x47d316 VSUBPD %ZMM20,%ZMM0,%ZMM0 |
(918) 0x47d31c MOV 0x30(%RBP),%RAX |
(918) 0x47d320 VMOVUPD (%RAX,%RSI,8),%ZMM20{%K1}{z} |
(918) 0x47d327 VMOVAPD %ZMM20,%ZMM15{%K1} |
(918) 0x47d32d VADDPD %ZMM9,%ZMM7,%ZMM20 |
(918) 0x47d333 VSUBPD %ZMM20,%ZMM8,%ZMM20 |
(918) 0x47d339 VADDPD %ZMM10,%ZMM20,%ZMM20 |
(918) 0x47d33f VMULPD %ZMM2,%ZMM20,%ZMM20 |
(918) 0x47d345 VBROADCASTSD %XMM24,%ZMM21 |
(918) 0x47d34b VADDPD %ZMM13,%ZMM11,%ZMM24 |
(918) 0x47d351 VSUBPD %ZMM24,%ZMM12,%ZMM24 |
(918) 0x47d357 VADDPD %ZMM14,%ZMM24,%ZMM24 |
(918) 0x47d35d VMULPD %ZMM2,%ZMM24,%ZMM24 |
(918) 0x47d363 VDIVPD %ZMM15,%ZMM3,%ZMM26 |
(918) 0x47d369 VMULPD %ZMM26,%ZMM24,%ZMM27 |
(918) 0x47d36f VFMADD231PD %ZMM20,%ZMM21,%ZMM27 |
(918) 0x47d375 VMOVAPD 0x240(%RSP),%ZMM20 |
(918) 0x47d37d VMOVAPD %ZMM16,%ZMM20{%K1} |
(918) 0x47d383 VMOVAPD 0x200(%RSP),%ZMM16 |
(918) 0x47d38b VMOVAPD %ZMM1,%ZMM16{%K1} |
(918) 0x47d391 VMOVUPD 0x8(%RAX,%RSI,8),%ZMM1{%K1}{z} |
(918) 0x47d39c VMOVAPD %ZMM20,0x240(%RSP) |
(918) 0x47d3a4 VMOVAPD %ZMM16,0x200(%RSP) |
(918) 0x47d3ac VSUBPD %ZMM16,%ZMM20,%ZMM16 |
(918) 0x47d3b2 VMOVAPD 0x1c0(%RSP),%ZMM20 |
(918) 0x47d3ba VMOVAPD %ZMM1,%ZMM20{%K1} |
(918) 0x47d3c0 VMOVAPD %ZMM20,0x1c0(%RSP) |
(918) 0x47d3c8 VADDPD %ZMM15,%ZMM20,%ZMM1 |
(918) 0x47d3ce VDIVPD %ZMM1,%ZMM16,%ZMM24 |
(918) 0x47d3d4 VMULPD %ZMM19,%ZMM15,%ZMM16 |
(918) 0x47d3da VBROADCASTSD %XMM22,%ZMM22 |
(918) 0x47d3e0 VFMADD231PD %ZMM0,%ZMM22,%ZMM16 |
(918) 0x47d3e6 VMOVAPD 0x180(%RSP),%ZMM1 |
(918) 0x47d3ee VMOVAPD %ZMM17,%ZMM1{%K1} |
(918) 0x47d3f4 VMOVAPD 0x140(%RSP),%ZMM17 |
(918) 0x47d3fc VMOVAPD %ZMM18,%ZMM17{%K1} |
(918) 0x47d402 VMOVAPD %ZMM1,0x180(%RSP) |
(918) 0x47d40a VMOVAPD %ZMM17,0x140(%RSP) |
(918) 0x47d412 VSUBPD %ZMM17,%ZMM1,%ZMM1 |
(918) 0x47d418 VBROADCASTSD %XMM23,%ZMM17 |
(918) 0x47d41e VMULPD %ZMM17,%ZMM1,%ZMM25 |
(918) 0x47d424 VMULPD %ZMM24,%ZMM24,%ZMM1 |
(918) 0x47d42a VMULPD %ZMM25,%ZMM25,%ZMM17 |
(918) 0x47d430 VMULPD %ZMM2,%ZMM19,%ZMM18 |
(918) 0x47d436 VMULPD %ZMM26,%ZMM18,%ZMM18 |
(918) 0x47d43c VMULPD %ZMM1,%ZMM18,%ZMM18 |
(918) 0x47d442 VMULPD %ZMM2,%ZMM0,%ZMM0 |
(918) 0x47d448 VMULPD %ZMM17,%ZMM0,%ZMM0 |
(918) 0x47d44e VMULPD %ZMM27,%ZMM24,%ZMM19 |
(918) 0x47d454 VFMADD213PD %ZMM18,%ZMM25,%ZMM19 |
(918) 0x47d45a VFMADD231PD %ZMM0,%ZMM21,%ZMM19 |
(918) 0x47d460 VADDPD %ZMM1,%ZMM17,%ZMM0 |
(918) 0x47d466 VMAXPD %ZMM4,%ZMM0,%ZMM0 |
(918) 0x47d46c VDIVPD %ZMM0,%ZMM19,%ZMM23 |
(918) 0x47d472 VXORPD %XMM1,%XMM1,%XMM1 |
(918) 0x47d476 VCMPPD $0x1,%ZMM23,%ZMM1,%K2 |
(918) 0x47d47d VCMPPD $0x2,%ZMM16,%ZMM1,%K0 |
(918) 0x47d484 VCMPPD $0x6,%ZMM16,%ZMM1,%K2{%K2} |
(918) 0x47d48b KORB %K2,%K0,%K0 |
(918) 0x47d48f KANDNB %K1,%K0,%K2 |
(918) 0x47d493 KORTESTB %K2,%K2 |
(918) 0x47d497 JE 47d55c |
(918) 0x47d49d VFPCLASSPD $0x50,%ZMM24,%K3 |
(918) 0x47d4a4 VANDPD %ZMM5,%ZMM24,%ZMM0 |
(918) 0x47d4aa VMAXPD %ZMM0,%ZMM4,%ZMM0 |
(918) 0x47d4b0 VXORPD %ZMM6,%ZMM0,%ZMM0{%K3} |
(918) 0x47d4b6 VFPCLASSPD $0x50,%ZMM0,%K3 |
(918) 0x47d4bd VANDPD %ZMM5,%ZMM25,%ZMM1 |
(918) 0x47d4c3 VMAXPD %ZMM1,%ZMM4,%ZMM1 |
(918) 0x47d4c9 VXORPD %ZMM6,%ZMM1,%ZMM1{%K3} |
(918) 0x47d4cf VMULPD %ZMM0,%ZMM0,%ZMM16 |
(918) 0x47d4d5 VFMADD231PD %ZMM1,%ZMM1,%ZMM16 |
(918) 0x47d4db VSQRTPD %ZMM16,%ZMM16 |
(918) 0x47d4e1 VMULPD %ZMM15,%ZMM16,%ZMM17 |
(918) 0x47d4e7 VDIVPD %ZMM0,%ZMM17,%ZMM0 |
(918) 0x47d4ed VANDPD %ZMM5,%ZMM0,%ZMM0 |
(918) 0x47d4f3 VMULPD %ZMM22,%ZMM16,%ZMM16 |
(918) 0x47d4f9 VDIVPD %ZMM1,%ZMM16,%ZMM1 |
(918) 0x47d4ff VANDPD %ZMM5,%ZMM1,%ZMM1 |
(918) 0x47d505 VCMPPD $0x2,%ZMM1,%ZMM0,%K3 |
(918) 0x47d50c VMOVAPD %ZMM0,%ZMM1{%K3} |
(918) 0x47d512 VMULPD %ZMM1,%ZMM1,%ZMM0 |
(918) 0x47d518 VMULPD %ZMM23,%ZMM23,%ZMM1 |
(918) 0x47d51e VADDPD %ZMM0,%ZMM0,%ZMM0 |
(918) 0x47d524 MOV 0x78(%RBP),%RAX |
(918) 0x47d528 MOV (%RAX),%RAX |
(918) 0x47d52b IMUL %R15,%RAX |
(918) 0x47d52f ADD 0x20(%RBP),%RAX |
(918) 0x47d533 VMOVUPD (%RAX,%RSI,8),%ZMM16{%K2}{z} |
(918) 0x47d53a VMOVAPD 0x100(%RSP),%ZMM17 |
(918) 0x47d542 VMOVAPD %ZMM16,%ZMM17{%K2} |
(918) 0x47d548 VMOVAPD %ZMM17,0x100(%RSP) |
(918) 0x47d550 VMULPD %ZMM17,%ZMM1,%ZMM1 |
(918) 0x47d556 VMULPD %ZMM0,%ZMM1,%ZMM1 |
(918) 0x47d55c MOV 0x14(%RSP),%EDI |
(918) 0x47d560 MOV 0x50(%RBP),%RDX |
(918) 0x47d564 MOV 0x48(%RBP),%R8 |
(918) 0x47d568 VMOVAPD %ZMM1,%ZMM0{%K2}{z} |
(918) 0x47d56e IMUL %R15,%R10 |
(918) 0x47d572 ADD 0x10(%RBP),%R10 |
(918) 0x47d576 VMOVUPD %ZMM0,(%R10,%RSI,8){%K1} |
(918) 0x47d57d JMP 47cd10 |
0x47d582 NOPW %CS:(%RAX,%RAX,1) |
0x47d58c NOPL (%RAX) |
Path / |
Source file and lines | viscosity_kernel.f90:50-94 |
Module | exec |
nb instructions | 149 |
nb uops | 153 |
loop length | 726 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 5 |
nb stack references | 34 |
micro-operation queue | 25.50 cycles |
front end | 25.50 cycles |
Metric | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 10.20 | 10.20 | 10.00 | 10.00 | 17.00 | 10.20 | 10.20 | 17.00 | 17.00 | 17.00 | 10.20 | 10.00 |
cycles | 10.20 | 10.20 | 10.00 | 10.00 | 17.00 | 10.20 | 10.20 | 17.00 | 17.00 | 17.00 | 10.20 | 10.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 24.95-24.98 |
Stall cycles | 0.00 |
Front-end | 25.50 |
Dispatch | 17.00 |
Overall L1 | 25.50 |
all | 2% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 4% |
all | 0% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 1% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 3% |
all | 11% |
load | 12% |
store | 10% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 12% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 11% |
load | 12% |
store | 10% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x40,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x2c0,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RBP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RBP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %ESI,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOVL $0,0x34(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JS 47cb30 <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0xb0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RCX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVL $0,0x1c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %EAX,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVL $0x1,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0x38(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x3c(%RSP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x24(%RSP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x20(%RSP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x753310,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x22,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
CALL 4044c0 <__kmpc_for_static_init_4@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x20,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x1c(%RSP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RSP),%EDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %EAX,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 47cb80 <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0x100> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x753330,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x28(%RSP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4040b0 <__kmpc_for_static_fini@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x58(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x753350,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 404580 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x30(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SAL $0x20,%R14 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV $-0x200000000,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
LEA (%R14,%RAX,1),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SAR $0x20,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RCX,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SAL $0x20,%RBX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
ADD %RBX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SAR $0x20,%R11 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV $-0x1,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVNS %RDX,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %RSI,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV $0x1,%R15D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %R15,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV $0x200000000,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
MOV %R12,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R14,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x10(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RCX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %RDX,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV $-0x1,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SHR $0x20,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
IMUL %RSI,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
SAL $0x3,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SUB %RCX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
CMOVNS %RAX,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
CMOVG %R15,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB %RBX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMP %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %RAX,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SHR $0x20,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
IMUL %RDX,%R12 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
NEG %R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R12,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %RCX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R14,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %RCX,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RCX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,0xd8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %R11,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R15,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R10,%RSI,1),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R8,%RSI,1),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x38(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RSI,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD 0x40(%RSP),%RSI | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV %RSI,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VBROADCASTSD 0x8e004(%RIP),%ZMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0xc49f2(%RIP),%ZMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0x8e088(%RIP),%ZMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0x8dfb6(%RIP),%ZMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0x8e024(%RIP),%ZMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
MOV 0x50(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x40(%RBP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x50(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RCX,%RAX,1),%EBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %EDI,0x14(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 47cd22 <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0x2a2> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | viscosity_kernel.f90:50-94 |
Module | exec |
nb instructions | 149 |
nb uops | 153 |
loop length | 726 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 5 |
nb stack references | 34 |
micro-operation queue | 25.50 cycles |
front end | 25.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 10.20 | 10.20 | 10.00 | 10.00 | 17.00 | 10.20 | 10.20 | 17.00 | 17.00 | 17.00 | 10.20 | 10.00 |
cycles | 10.20 | 10.20 | 10.00 | 10.00 | 17.00 | 10.20 | 10.20 | 17.00 | 17.00 | 17.00 | 10.20 | 10.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 24.95-24.98 |
Stall cycles | 0.00 |
Front-end | 25.50 |
Dispatch | 17.00 |
Overall L1 | 25.50 |
all | 2% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 4% |
all | 0% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 1% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 3% |
all | 11% |
load | 12% |
store | 10% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 12% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 11% |
load | 12% |
store | 10% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x40,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x2c0,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RBP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RBP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %ESI,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOVL $0,0x34(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JS 47cb30 <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0xb0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RCX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVL $0,0x1c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %EAX,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVL $0x1,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0x38(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x3c(%RSP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x24(%RSP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x20(%RSP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x753310,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x22,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
CALL 4044c0 <__kmpc_for_static_init_4@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x20,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x1c(%RSP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RSP),%EDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %EAX,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 47cb80 <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0x100> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x753330,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x28(%RSP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4040b0 <__kmpc_for_static_fini@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x58(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x753350,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 404580 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x30(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SAL $0x20,%R14 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV $-0x200000000,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
LEA (%R14,%RAX,1),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SAR $0x20,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RCX,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SAL $0x20,%RBX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
ADD %RBX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SAR $0x20,%R11 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV $-0x1,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVNS %RDX,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %RSI,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV $0x1,%R15D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %R15,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV $0x200000000,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
MOV %R12,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R14,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x10(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RCX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %RDX,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV $-0x1,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SHR $0x20,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
IMUL %RSI,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
SAL $0x3,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SUB %RCX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
CMOVNS %RAX,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %RDX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
CMOVG %R15,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB %RBX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMP %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %RAX,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SHR $0x20,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
IMUL %RDX,%R12 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
NEG %R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R12,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %RCX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R14,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %RCX,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RCX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,0xd8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %R11,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R15,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R10,%RSI,1),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R8,%RSI,1),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x38(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RSI,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD 0x40(%RSP),%RSI | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV %RSI,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VBROADCASTSD 0x8e004(%RIP),%ZMM2 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0xc49f2(%RIP),%ZMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0x8e088(%RIP),%ZMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0x8dfb6(%RIP),%ZMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0x8e024(%RIP),%ZMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
MOV 0x50(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x40(%RBP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x50(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RCX,%RAX,1),%EBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %EDI,0x14(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 47cd22 <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0x2a2> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼viscosity_kernel_.DIR.OMP.PARALLEL.2– | 2.23 | 0.69 |
▼Loop 918 - viscosity_kernel.f90:53-89 - exec– | 0 | 0 |
○Loop 919 - viscosity_kernel.f90:53-89 - exec | 2.23 | 0.68 |