Function: calc_dt_kernel_.DIR.OMP.PARALLEL.2 | Module: exec | Source: calc_dt_kernel.f90:89-133 [...] | Coverage: 3.27% |
---|
Function: calc_dt_kernel_.DIR.OMP.PARALLEL.2 | Module: exec | Source: calc_dt_kernel.f90:89-133 [...] | Coverage: 3.27% |
---|
/beegfs/hackathon/users/eoseret/qaas_runs/170-861-0321/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/calc_dt_kernel.f90: 89 - 133 |
-------------------------------------------------------------------------------- |
89: !$OMP PARALLEL |
90: |
91: !$OMP DO PRIVATE(dsx,dsy,cc,dv1,dv2,div,dtct,dtut,dtvt,dtdivt) REDUCTION(MIN : dt_min_val) |
92: DO k=y_min,y_max |
93: !$OMP SIMD |
94: DO j=x_min,x_max |
95: |
96: dsx=celldx(j) |
97: dsy=celldy(k) |
98: |
99: cc=soundspeed(j,k)*soundspeed(j,k) |
100: cc=cc+2.0_8*viscosity_a(j,k)/density0(j,k) |
101: cc=MAX(SQRT(cc),g_small) |
102: |
103: dtct=dtc_safe*MIN(dsx,dsy)/cc |
104: |
105: div=0.0 |
106: |
107: dv1=(xvel0(j ,k)+xvel0(j ,k+1))*xarea(j ,k) |
108: dv2=(xvel0(j+1,k)+xvel0(j+1,k+1))*xarea(j+1,k) |
109: |
110: div=div+dv2-dv1 |
111: |
112: dtut=dtu_safe*2.0_8*volume(j,k)/MAX(ABS(dv1),ABS(dv2),g_small*volume(j,k)) |
113: |
114: dv1=(yvel0(j,k )+yvel0(j+1,k ))*yarea(j,k ) |
115: dv2=(yvel0(j,k+1)+yvel0(j+1,k+1))*yarea(j,k+1) |
116: |
117: div=div+dv2-dv1 |
118: |
119: dtvt=dtv_safe*2.0_8*volume(j,k)/MAX(ABS(dv1),ABS(dv2),g_small*volume(j,k)) |
120: |
121: div=div/(2.0_8*volume(j,k)) |
122: |
123: IF(div.LT.-g_small)THEN |
[...] |
129: dt_min_val=MIN(dt_min_val,dtct,dtut,dtvt,dtdivt) |
130: |
131: ENDDO |
132: ENDDO |
133: !$OMP END DO |
0x438ae0 PUSH %RBP |
0x438ae1 MOV %RSP,%RBP |
0x438ae4 PUSH %R15 |
0x438ae6 PUSH %R14 |
0x438ae8 PUSH %R13 |
0x438aea PUSH %R12 |
0x438aec PUSH %RBX |
0x438aed SUB $0x158,%RSP |
0x438af4 MOV %RCX,%R14 |
0x438af7 MOV 0x90(%RBP),%ECX |
0x438afd MOV 0x88(%RBP),%EAX |
0x438b03 SUB %ECX,%EAX |
0x438b05 MOVL $0,-0x54(%RBP) |
0x438b0c JS 438bf6 |
0x438b12 MOV %R9,%RBX |
0x438b15 MOV %RDX,%R13 |
0x438b18 MOV %R8,-0x88(%RBP) |
0x438b1f MOV %RDI,-0x60(%RBP) |
0x438b23 MOV (%RDI),%ESI |
0x438b25 MOVL $0,-0x30(%RBP) |
0x438b2c MOV %EAX,-0x2c(%RBP) |
0x438b2f MOVL $0x1,-0x50(%RBP) |
0x438b36 SUB $0x8,%RSP |
0x438b3a LEA -0x50(%RBP),%RAX |
0x438b3e LEA -0x54(%RBP),%RCX |
0x438b42 LEA -0x30(%RBP),%R8 |
0x438b46 LEA -0x2c(%RBP),%R9 |
0x438b4a MOV $0x5720c0,%EDI |
0x438b4f MOV %ESI,-0x44(%RBP) |
0x438b52 MOV $0x22,%EDX |
0x438b57 PUSH $0x1 |
0x438b59 PUSH $0x1 |
0x438b5b PUSH %RAX |
0x438b5c CALL 404670 <__kmpc_for_static_init_4@plt> |
0x438b61 ADD $0x20,%RSP |
0x438b65 MOV -0x30(%RBP),%R9D |
0x438b69 MOV -0x2c(%RBP),%EAX |
0x438b6c SUB %R9D,%EAX |
0x438b6f MOV %EAX,-0x48(%RBP) |
0x438b72 JAE 438c14 |
0x438b78 MOVSD 0xf48ef(%RIP),%XMM14 |
0x438b81 MOVSD %XMM14,-0x80(%RBP) |
0x438b87 MOV $0x5720e0,%EDI |
0x438b8c MOV -0x44(%RBP),%ESI |
0x438b8f CALL 404230 <__kmpc_for_static_fini@plt> |
0x438b94 MOV -0x60(%RBP),%RBX |
0x438b98 MOV (%RBX),%ESI |
0x438b9a SUB $0x8,%RSP |
0x438b9e LEA -0x80(%RBP),%R8 |
0x438ba2 MOV $0x572100,%EDI |
0x438ba7 MOV $0x4395b0,%R9D |
0x438bad MOV $0x1,%EDX |
0x438bb2 MOV $0x8,%ECX |
0x438bb7 PUSH $0x57933c |
0x438bbc CALL 404830 <__kmpc_reduce@plt> |
0x438bc1 MOV %RBX,%RDI |
0x438bc4 ADD $0x10,%RSP |
0x438bc8 CMP $0x1,%EAX |
0x438bcb MOV -0x88(%RBP),%RAX |
0x438bd2 JNE 438bf6 |
0x438bd4 MOVSD -0x80(%RBP),%XMM0 |
0x438bd9 MINSD (%RAX),%XMM0 |
0x438bdd MOVSD %XMM0,(%RAX) |
0x438be1 MOV (%RDI),%ESI |
0x438be3 MOV $0x572120,%EDI |
0x438be8 MOV $0x57933c,%EDX |
0x438bed CALL 4049c0 <__kmpc_end_reduce@plt> |
0x438bf2 MOV -0x60(%RBP),%RDI |
0x438bf6 MOV (%RDI),%ESI |
0x438bf8 MOV $0x572140,%EDI |
0x438bfd CALL 404740 <__kmpc_barrier@plt> |
0x438c02 ADD $0x158,%RSP |
0x438c09 POP %RBX |
0x438c0a POP %R12 |
0x438c0c POP %R13 |
0x438c0e POP %R14 |
0x438c10 POP %R15 |
0x438c12 POP %RBP |
0x438c13 RET |
0x438c14 MOV 0x30(%RBP),%R10 |
0x438c18 MOV 0x28(%RBP),%R11 |
0x438c1c SAL $0x20,%R14 |
0x438c20 MOV $-0x200000000,%RAX |
0x438c2a LEA (%R14,%RAX,1),%RCX |
0x438c2e SAL $0x20,%R13 |
0x438c32 ADD %R13,%RAX |
0x438c35 MOV %RAX,%R15 |
0x438c38 SAR $0x20,%R15 |
0x438c3c TEST %RCX,%RCX |
0x438c3f MOV $-0x1,%RDX |
0x438c46 MOV $-0x1,%RSI |
0x438c4d CMOVNS %RCX,%RSI |
0x438c51 TEST %RSI,%RSI |
0x438c54 MOV $0x1,%EDI |
0x438c59 CMOVG %RDI,%RSI |
0x438c5d MOV $0x200000000,%R12 |
0x438c67 MOV %R12,%R8 |
0x438c6a SUB %R14,%R8 |
0x438c6d CMP %R8,%RCX |
0x438c70 CMOVG %RCX,%R8 |
0x438c74 SHR $0x20,%R8 |
0x438c78 IMUL %RSI,%R8 |
0x438c7c LEA (,%R8,8),%RCX |
0x438c84 MOV $0x8,%ESI |
0x438c89 SUB %RCX,%RSI |
0x438c8c MOV $0x1,%R14D |
0x438c92 MOV %R15,-0x100(%RBP) |
0x438c99 SUB %R15,%R14 |
0x438c9c MOV %R14,-0xf0(%RBP) |
0x438ca3 TEST %RAX,%RAX |
0x438ca6 CMOVNS %RAX,%RDX |
0x438caa TEST %RDX,%RDX |
0x438cad CMOVG %RDI,%RDX |
0x438cb1 MOV 0x20(%RBP),%RDI |
0x438cb5 SUB %R13,%R12 |
0x438cb8 CMP %R12,%RAX |
0x438cbb CMOVG %RAX,%R12 |
0x438cbf SHR $0x20,%R12 |
0x438cc3 IMUL %RDX,%R12 |
0x438cc7 MOV 0x48(%RBP),%RAX |
0x438ccb SUB %RCX,%RAX |
0x438cce MOV %RAX,-0xc8(%RBP) |
0x438cd5 SUB %RCX,%R10 |
0x438cd8 MOV %R10,-0xc0(%RBP) |
0x438cdf SUB %RCX,%R11 |
0x438ce2 MOV %R11,-0xb8(%RBP) |
0x438ce9 SUB %RCX,%RDI |
0x438cec MOV %RDI,-0xb0(%RBP) |
0x438cf3 MOV 0x18(%RBP),%RAX |
0x438cf7 SUB %RCX,%RAX |
0x438cfa MOV %RAX,-0xa8(%RBP) |
0x438d01 MOV 0x40(%RBP),%RAX |
0x438d05 SUB %RCX,%RAX |
0x438d08 MOV %RAX,-0xa0(%RBP) |
0x438d0f LEA (%RBX,%RSI,1),%RAX |
0x438d13 MOV %RAX,-0x98(%RBP) |
0x438d1a SUB %RCX,%RBX |
0x438d1d MOV %RBX,-0xe8(%RBP) |
0x438d24 NEG %R12 |
0x438d27 MOV %R12,-0xf8(%RBP) |
0x438d2e MOV 0x50(%RBP),%RAX |
0x438d32 ADD %RSI,%RAX |
0x438d35 MOV %RAX,-0x90(%RBP) |
0x438d3c ADD 0x10(%RBP),%RSI |
0x438d40 MOV %RSI,-0xd0(%RBP) |
0x438d47 NEG %R8 |
0x438d4a MOV %R8,-0xe0(%RBP) |
0x438d51 MOVSD 0xf4716(%RIP),%XMM14 |
0x438d5a MOVSD 0xf46dd(%RIP),%XMM13 |
0x438d63 MOVAPD 0xf48b4(%RIP),%XMM10 |
0x438d6c MOVAPD 0x12a0ac(%RIP),%XMM7 |
0x438d74 MOV 0x90(%RBP),%EAX |
0x438d7a LEA (%R9,%RAX,1),%EDX |
0x438d7e XOR %EDI,%EDI |
0x438d80 MOV %R9,%R13 |
0x438d83 MOV %R9,-0xd8(%RBP) |
0x438d8a JMP 438dbb |
0x438d8c NOPL (%RAX) |
(316) 0x438d90 MOV -0x140(%RBP),%RCX |
(316) 0x438d97 LEA 0x1(%RCX),%EAX |
(316) 0x438d9a MOV -0x4c(%RBP),%EDX |
(316) 0x438d9d INC %EDX |
(316) 0x438d9f CMP -0x48(%RBP),%ECX |
(316) 0x438da2 MOV %EAX,%EDI |
(316) 0x438da4 MOVAPD 0xf4873(%RIP),%XMM10 |
(316) 0x438dad MOVAPD 0x12a06b(%RIP),%XMM7 |
(316) 0x438db5 JE 438b81 |
(316) 0x438dbb MOV 0xa0(%RBP),%RAX |
(316) 0x438dc2 MOVSXD (%RAX),%R9 |
(316) 0x438dc5 MOV 0x98(%RBP),%RAX |
(316) 0x438dcc MOV (%RAX),%R8D |
(316) 0x438dcf CMP %R9D,%R8D |
(316) 0x438dd2 MOV %EDX,-0x4c(%RBP) |
(316) 0x438dd5 MOV %RDI,-0x140(%RBP) |
(316) 0x438ddc JS 438d90 |
(316) 0x438dde MOVSXD %EDX,%R12 |
(316) 0x438de1 MOV -0xf0(%RBP),%RAX |
(316) 0x438de8 ADD %R12,%RAX |
(316) 0x438deb MOV %RAX,-0x38(%RBP) |
(316) 0x438def ADD -0xf8(%RBP),%R12 |
(316) 0x438df6 MOV 0x90(%RBP),%EAX |
(316) 0x438dfc ADD %R13D,%EAX |
(316) 0x438dff ADD %EDI,%EAX |
(316) 0x438e01 CLTQ |
(316) 0x438e03 SUB -0x100(%RBP),%RAX |
(316) 0x438e0a MOV 0x38(%RBP),%RCX |
(316) 0x438e0e MOVSD (%RCX,%RAX,8),%XMM9 |
(316) 0x438e14 MOV 0xa8(%RBP),%RAX |
(316) 0x438e1b MOV (%RAX),%RAX |
(316) 0x438e1e MOV %RAX,-0x78(%RBP) |
(316) 0x438e22 MOV 0xb0(%RBP),%RAX |
(316) 0x438e29 MOV (%RAX),%RAX |
(316) 0x438e2c MOV %RAX,-0x70(%RBP) |
(316) 0x438e30 MOV 0xb8(%RBP),%RAX |
(316) 0x438e37 MOV (%RAX),%RCX |
(316) 0x438e3a MOVSD 0x140f2e(%RIP),%XMM1 |
(316) 0x438e42 MOV 0xc0(%RBP),%RAX |
(316) 0x438e49 MOV (%RAX),%R14 |
(316) 0x438e4c MOV 0xc8(%RBP),%RAX |
(316) 0x438e53 MOV (%RAX),%R15 |
(316) 0x438e56 MOVSD 0x140f0a(%RIP),%XMM2 |
(316) 0x438e5e MOV 0xd0(%RBP),%RAX |
(316) 0x438e65 MOV (%RAX),%R10 |
(316) 0x438e68 MOV 0xd8(%RBP),%RAX |
(316) 0x438e6f MOV (%RAX),%RBX |
(316) 0x438e72 MOV 0xe0(%RBP),%RAX |
(316) 0x438e79 MOV (%RAX),%R11 |
(316) 0x438e7c MOVSD 0x140edc(%RIP),%XMM3 |
(316) 0x438e84 MOVAPD %XMM3,-0x170(%RBP) |
(316) 0x438e8c MOVSD 0x140ec3(%RIP),%XMM12 |
(316) 0x438e95 XORPD 0x129f92(%RIP),%XMM12 |
(316) 0x438e9e SUB %R9D,%R8D |
(316) 0x438ea1 INC %R8D |
(316) 0x438ea4 CMP $0x2,%R8D |
(316) 0x438ea8 MOV $0x1,%EAX |
(316) 0x438ead CMOVL %EAX,%R8D |
(316) 0x438eb1 MOV %R8,%RSI |
(316) 0x438eb4 AND $0x7ffffffe,%RSI |
(316) 0x438ebb MOV %R8,-0x40(%RBP) |
(316) 0x438ebf MOVAPD %XMM12,-0x180(%RBP) |
(316) 0x438ec8 JE 4392c0 |
(316) 0x438ece UNPCKLPD %XMM14,%XMM14 |
(316) 0x438ed3 MOV %RBX,%RAX |
(316) 0x438ed6 MOV -0x38(%RBP),%RDI |
(316) 0x438eda IMUL %RDI,%RAX |
(316) 0x438ede LEA (%RAX,%R9,8),%R8 |
(316) 0x438ee2 MOV %RCX,%RDX |
(316) 0x438ee5 MOV -0x98(%RBP),%RCX |
(316) 0x438eec ADD %RCX,%R8 |
(316) 0x438eef MOV %RBX,-0x108(%RBP) |
(316) 0x438ef6 MOV %RBX,%RAX |
(316) 0x438ef9 IMUL %R12,%RAX |
(316) 0x438efd MOV %R11,%RBX |
(316) 0x438f00 MOV %R9,%R11 |
(316) 0x438f03 MOV %R10,-0x68(%RBP) |
(316) 0x438f07 LEA (%RAX,%R9,8),%R10 |
(316) 0x438f0b ADD %RCX,%R10 |
(316) 0x438f0e MOV %R15,-0x120(%RBP) |
(316) 0x438f15 MOV %R15,%RAX |
(316) 0x438f18 IMUL %R12,%RAX |
(316) 0x438f1c LEA (%RAX,%R9,8),%R13 |
(316) 0x438f20 ADD -0x90(%RBP),%R13 |
(316) 0x438f27 MOV %R14,%RAX |
(316) 0x438f2a IMUL %R12,%RAX |
(316) 0x438f2e MOV %RDX,%R9 |
(316) 0x438f31 LEA (%RAX,%R11,8),%R15 |
(316) 0x438f35 MOV -0xd0(%RBP),%RCX |
(316) 0x438f3c ADD %RCX,%R15 |
(316) 0x438f3f MOV %R14,-0x128(%RBP) |
(316) 0x438f46 MOV %R14,%RAX |
(316) 0x438f49 IMUL %RDI,%RAX |
(316) 0x438f4d LEA (%RAX,%R11,8),%R14 |
(316) 0x438f51 ADD %RCX,%R14 |
(316) 0x438f54 MOV %RBX,%RAX |
(316) 0x438f57 IMUL %RDI,%RAX |
(316) 0x438f5b LEA (%RAX,%R11,8),%RDI |
(316) 0x438f5f MOV -0xc8(%RBP),%RDX |
(316) 0x438f66 ADD %RDX,%RDI |
(316) 0x438f69 MOV %RBX,-0x110(%RBP) |
(316) 0x438f70 IMUL %R12,%RBX |
(316) 0x438f74 LEA (%RBX,%R11,8),%RCX |
(316) 0x438f78 ADD %RDX,%RCX |
(316) 0x438f7b MOV -0x68(%RBP),%RAX |
(316) 0x438f7f IMUL %R12,%RAX |
(316) 0x438f83 LEA (%RAX,%R11,8),%RDX |
(316) 0x438f87 ADD -0xc0(%RBP),%RDX |
(316) 0x438f8e MOV %R9,-0x130(%RBP) |
(316) 0x438f95 IMUL %R12,%R9 |
(316) 0x438f99 LEA (%R9,%R11,8),%RAX |
(316) 0x438f9d ADD -0xb8(%RBP),%RAX |
(316) 0x438fa4 MOV -0x70(%RBP),%R9 |
(316) 0x438fa8 IMUL %R12,%R9 |
(316) 0x438fac MOV %R12,%RBX |
(316) 0x438faf LEA (%R9,%R11,8),%R12 |
(316) 0x438fb3 ADD -0xb0(%RBP),%R12 |
(316) 0x438fba MOV -0x78(%RBP),%R9 |
(316) 0x438fbe MOV %RBX,-0x138(%RBP) |
(316) 0x438fc5 IMUL %RBX,%R9 |
(316) 0x438fc9 LEA (%R9,%R11,8),%RBX |
(316) 0x438fcd ADD -0xa8(%RBP),%RBX |
(316) 0x438fd4 MOV -0xa0(%RBP),%R9 |
(316) 0x438fdb MOV %R11,-0x118(%RBP) |
(316) 0x438fe2 LEA (%R9,%R11,8),%R11 |
(316) 0x438fe6 MOVAPD %XMM14,%XMM15 |
(316) 0x438feb XOR %R9D,%R9D |
(316) 0x438fee MOVAPD %XMM1,-0x160(%RBP) |
(316) 0x438ff6 MOVAPD %XMM2,-0x150(%RBP) |
(316) 0x438ffe XCHG %AX,%AX |
(318) 0x439000 MOVUPD (%R12,%R9,8),%XMM0 |
(318) 0x439006 MOVUPD (%R11,%R9,8),%XMM1 |
(318) 0x43900c MOVUPD (%RAX,%R9,8),%XMM3 |
(318) 0x439012 MOVAPD %XMM9,%XMM4 |
(318) 0x439017 UNPCKLPD %XMM9,%XMM4 |
(318) 0x43901c ADDPD %XMM0,%XMM0 |
(318) 0x439020 MOVAPD -0x160(%RBP),%XMM14 |
(318) 0x439029 UNPCKLPD %XMM14,%XMM14 |
(318) 0x43902e MOVUPD -0x8(%R14,%R9,8),%XMM5 |
(318) 0x439035 MINPD %XMM4,%XMM1 |
(318) 0x439039 MOVUPD (%R14,%R9,8),%XMM4 |
(318) 0x43903f MOVUPD -0x8(%R15,%R9,8),%XMM11 |
(318) 0x439046 ADDPD %XMM5,%XMM11 |
(318) 0x43904b DIVPD %XMM3,%XMM0 |
(318) 0x43904f MOVUPD (%R15,%R9,8),%XMM5 |
(318) 0x439055 ADDPD %XMM4,%XMM5 |
(318) 0x439059 MOVUPD -0x8(%R13,%R9,8),%XMM4 |
(318) 0x439060 MULPD %XMM1,%XMM14 |
(318) 0x439065 MOVUPD (%R13,%R9,8),%XMM13 |
(318) 0x43906c MOVUPD (%RDX,%R9,8),%XMM3 |
(318) 0x439072 MOVAPD %XMM3,%XMM6 |
(318) 0x439076 MULPD %XMM11,%XMM4 |
(318) 0x43907b ADDPD %XMM3,%XMM6 |
(318) 0x43907f MOVAPD -0x150(%RBP),%XMM11 |
(318) 0x439088 UNPCKLPD %XMM11,%XMM11 |
(318) 0x43908d MULPD %XMM5,%XMM13 |
(318) 0x439092 MULPD %XMM6,%XMM11 |
(318) 0x439097 MOVAPD %XMM4,%XMM5 |
(318) 0x43909b MOVAPD %XMM13,%XMM8 |
(318) 0x4390a0 ANDPD %XMM7,%XMM5 |
(318) 0x4390a4 ANDPD %XMM7,%XMM8 |
(318) 0x4390a9 MULPD %XMM10,%XMM3 |
(318) 0x4390ae MOVAPD %XMM3,%XMM1 |
(318) 0x4390b2 CMPPD $0x2,%XMM8,%XMM1 |
(318) 0x4390b8 ANDPD %XMM1,%XMM8 |
(318) 0x4390bd ANDNPD %XMM3,%XMM1 |
(318) 0x4390c1 ORPD %XMM8,%XMM1 |
(318) 0x4390c6 MOVAPD %XMM1,%XMM8 |
(318) 0x4390cb CMPPD $0x2,%XMM5,%XMM8 |
(318) 0x4390d1 ANDPD %XMM8,%XMM5 |
(318) 0x4390d6 ANDNPD %XMM1,%XMM8 |
(318) 0x4390db ORPD %XMM5,%XMM8 |
(318) 0x4390e0 MOVUPD -0x8(%R10,%R9,8),%XMM1 |
(318) 0x4390e7 MOVUPD (%R10,%R9,8),%XMM2 |
(318) 0x4390ed ADDPD %XMM1,%XMM2 |
(318) 0x4390f1 DIVPD %XMM8,%XMM11 |
(318) 0x4390f6 MOVUPD (%RCX,%R9,8),%XMM5 |
(318) 0x4390fc MULPD %XMM2,%XMM5 |
(318) 0x439100 MOVUPD -0x8(%R8,%R9,8),%XMM1 |
(318) 0x439107 MOVUPD (%R8,%R9,8),%XMM2 |
(318) 0x43910d ADDPD %XMM1,%XMM2 |
(318) 0x439111 MOVUPD (%RDI,%R9,8),%XMM1 |
(318) 0x439117 MULPD %XMM2,%XMM1 |
(318) 0x43911b ADDPD %XMM5,%XMM4 |
(318) 0x43911f SUBPD %XMM4,%XMM13 |
(318) 0x439124 ADDPD %XMM1,%XMM13 |
(318) 0x439129 MOVAPD %XMM3,%XMM2 |
(318) 0x43912d ANDPD %XMM7,%XMM1 |
(318) 0x439131 CMPPD $0x2,%XMM1,%XMM2 |
(318) 0x439136 ANDPD %XMM2,%XMM1 |
(318) 0x43913a ANDNPD %XMM3,%XMM2 |
(318) 0x43913e ANDPD %XMM7,%XMM5 |
(318) 0x439142 ORPD %XMM1,%XMM2 |
(318) 0x439146 MOVAPD %XMM2,%XMM1 |
(318) 0x43914a CMPPD $0x2,%XMM5,%XMM1 |
(318) 0x43914f ANDPD %XMM1,%XMM5 |
(318) 0x439153 ANDNPD %XMM2,%XMM1 |
(318) 0x439157 MOVUPD (%RBX,%R9,8),%XMM2 |
(318) 0x43915d MULPD %XMM2,%XMM2 |
(318) 0x439161 ADDPD %XMM2,%XMM0 |
(318) 0x439165 ORPD %XMM5,%XMM1 |
(318) 0x439169 MOVAPD -0x170(%RBP),%XMM2 |
(318) 0x439171 UNPCKLPD %XMM2,%XMM2 |
(318) 0x439175 MULPD %XMM6,%XMM2 |
(318) 0x439179 DIVPD %XMM1,%XMM2 |
(318) 0x43917d SQRTPD %XMM0,%XMM0 |
(318) 0x439181 MAXPD %XMM10,%XMM0 |
(318) 0x439186 DIVPD %XMM0,%XMM14 |
(318) 0x43918b DIVPD %XMM6,%XMM13 |
(318) 0x439190 MOVAPD %XMM12,%XMM0 |
(318) 0x439195 UNPCKLPD %XMM12,%XMM0 |
(318) 0x43919a DIVPD %XMM13,%XMM0 |
(318) 0x43919f CMPPD $0x1,0xf4487(%RIP),%XMM13 |
(318) 0x4391a9 ANDPD %XMM13,%XMM0 |
(318) 0x4391ae ANDNPD 0xf4489(%RIP),%XMM13 |
(318) 0x4391b7 ORPD %XMM0,%XMM13 |
(318) 0x4391bc MOVAPD %XMM2,%XMM0 |
(318) 0x4391c0 CMPPD $0x2,%XMM13,%XMM0 |
(318) 0x4391c6 ANDPD %XMM0,%XMM2 |
(318) 0x4391ca ANDNPD %XMM13,%XMM0 |
(318) 0x4391cf ORPD %XMM2,%XMM0 |
(318) 0x4391d3 MOVAPD %XMM11,%XMM1 |
(318) 0x4391d8 CMPPD $0x2,%XMM0,%XMM1 |
(318) 0x4391dd ANDPD %XMM1,%XMM11 |
(318) 0x4391e2 ANDNPD %XMM0,%XMM1 |
(318) 0x4391e6 ORPD %XMM11,%XMM1 |
(318) 0x4391eb MOVAPD %XMM14,%XMM0 |
(318) 0x4391f0 CMPPD $0x2,%XMM1,%XMM0 |
(318) 0x4391f5 ANDPD %XMM0,%XMM14 |
(318) 0x4391fa ANDNPD %XMM1,%XMM0 |
(318) 0x4391fe ORPD %XMM14,%XMM0 |
(318) 0x439203 MOVAPD %XMM15,%XMM1 |
(318) 0x439208 CMPPD $0x2,%XMM0,%XMM15 |
(318) 0x43920e ANDPD %XMM15,%XMM1 |
(318) 0x439213 ANDNPD %XMM0,%XMM15 |
(318) 0x439218 ORPD %XMM1,%XMM15 |
(318) 0x43921d ADD $0x2,%R9 |
(318) 0x439221 CMP %RSI,%R9 |
(318) 0x439224 JB 439000 |
(316) 0x43922a MOVAPD %XMM15,%XMM0 |
(316) 0x43922f UNPCKHPD %XMM15,%XMM0 |
(316) 0x439234 MOVAPD %XMM15,%XMM14 |
(316) 0x439239 CMPSD $0x3,%XMM15,%XMM14 |
(316) 0x43923f MOVAPD %XMM14,%XMM1 |
(316) 0x439244 ANDPD %XMM0,%XMM1 |
(316) 0x439248 MINSD %XMM15,%XMM0 |
(316) 0x43924d ANDNPD %XMM0,%XMM14 |
(316) 0x439252 ORPD %XMM1,%XMM14 |
(316) 0x439257 CMP -0x40(%RBP),%RSI |
(316) 0x43925b MOV -0xd8(%RBP),%R13 |
(316) 0x439262 MOVSD 0xf41d5(%RIP),%XMM13 |
(316) 0x43926b MOVAPD -0x160(%RBP),%XMM7 |
(316) 0x439273 MOVAPD -0x150(%RBP),%XMM12 |
(316) 0x43927c MOV -0x138(%RBP),%R12 |
(316) 0x439283 MOV -0x38(%RBP),%RDX |
(316) 0x439287 MOV -0x130(%RBP),%RCX |
(316) 0x43928e MOV -0x128(%RBP),%R14 |
(316) 0x439295 MOV -0x120(%RBP),%R15 |
(316) 0x43929c MOV -0x68(%RBP),%R10 |
(316) 0x4392a0 MOV -0x118(%RBP),%R9 |
(316) 0x4392a7 MOV -0x110(%RBP),%R11 |
(316) 0x4392ae MOV -0x108(%RBP),%RBX |
(316) 0x4392b5 JE 438d90 |
(316) 0x4392bb JMP 4392cf |
0x4392bd NOPL (%RAX) |
(316) 0x4392c0 XOR %ESI,%ESI |
(316) 0x4392c2 MOVAPD %XMM1,%XMM7 |
(316) 0x4392c6 MOVAPD %XMM2,%XMM12 |
(316) 0x4392cb MOV -0x38(%RBP),%RDX |
(316) 0x4392cf SUB %RSI,-0x40(%RBP) |
(316) 0x4392d3 MOV %RBX,%RAX |
(316) 0x4392d6 IMUL %RDX,%RAX |
(316) 0x4392da LEA (%RAX,%RSI,8),%RAX |
(316) 0x4392de LEA (%RAX,%R9,8),%R8 |
(316) 0x4392e2 IMUL %R12,%RBX |
(316) 0x4392e6 LEA (%RBX,%RSI,8),%RAX |
(316) 0x4392ea LEA (%RAX,%R9,8),%RAX |
(316) 0x4392ee ADD -0xe0(%RBP),%RSI |
(316) 0x4392f5 ADD %R9,%RSI |
(316) 0x4392f8 MOV %RCX,%RBX |
(316) 0x4392fb MOV %R11,%RCX |
(316) 0x4392fe IMUL %RDX,%RCX |
(316) 0x439302 MOV %R14,%R9 |
(316) 0x439305 IMUL %RDX,%R14 |
(316) 0x439309 MOV -0xe8(%RBP),%RDX |
(316) 0x439310 ADD %RDX,%R8 |
(316) 0x439313 ADD %RDX,%RAX |
(316) 0x439316 LEA (%RCX,%RSI,8),%RCX |
(316) 0x43931a MOV 0x48(%RBP),%RDI |
(316) 0x43931e ADD %RDI,%RCX |
(316) 0x439321 IMUL %R12,%R11 |
(316) 0x439325 LEA (%R11,%RSI,8),%RDX |
(316) 0x439329 ADD %RDI,%RDX |
(316) 0x43932c IMUL %R12,%R10 |
(316) 0x439330 LEA (%R10,%RSI,8),%RDI |
(316) 0x439334 ADD 0x30(%RBP),%RDI |
(316) 0x439338 IMUL %R12,%R15 |
(316) 0x43933c LEA (%R15,%RSI,8),%R10 |
(316) 0x439340 ADD 0x50(%RBP),%R10 |
(316) 0x439344 IMUL %R12,%R9 |
(316) 0x439348 LEA (%R9,%RSI,8),%R11 |
(316) 0x43934c MOV 0x10(%RBP),%R9 |
(316) 0x439350 ADD %R9,%R11 |
(316) 0x439353 LEA (%R14,%RSI,8),%R14 |
(316) 0x439357 ADD %R9,%R14 |
(316) 0x43935a IMUL %R12,%RBX |
(316) 0x43935e LEA (%RBX,%RSI,8),%R15 |
(316) 0x439362 ADD 0x28(%RBP),%R15 |
(316) 0x439366 MOV -0x70(%RBP),%R9 |
(316) 0x43936a IMUL %R12,%R9 |
(316) 0x43936e LEA (%R9,%RSI,8),%RBX |
(316) 0x439372 ADD 0x20(%RBP),%RBX |
(316) 0x439376 MOV -0x78(%RBP),%R9 |
(316) 0x43937a IMUL %R12,%R9 |
(316) 0x43937e LEA (%R9,%RSI,8),%R12 |
(316) 0x439382 ADD 0x18(%RBP),%R12 |
(316) 0x439386 MOV 0x40(%RBP),%R9 |
(316) 0x43938a LEA (%R9,%RSI,8),%RSI |
(316) 0x43938e XOR %R9D,%R9D |
(316) 0x439391 MOVAPD %XMM14,%XMM15 |
(316) 0x439396 JMP 439506 |
0x43939b NOPL (%RAX,%RAX,1) |
(317) 0x4393a0 MOVSD (%RSI,%R9,8),%XMM2 |
(317) 0x4393a6 MOVSD (%R12,%R9,8),%XMM3 |
(317) 0x4393ac MULSD %XMM3,%XMM3 |
(317) 0x4393b0 MOVSD (%RBX,%R9,8),%XMM6 |
(317) 0x4393b6 ADDSD %XMM6,%XMM6 |
(317) 0x4393ba DIVSD (%R15,%R9,8),%XMM6 |
(317) 0x4393c0 ADDSD %XMM3,%XMM6 |
(317) 0x4393c4 SQRTSD %XMM6,%XMM6 |
(317) 0x4393c8 MAXSD %XMM13,%XMM6 |
(317) 0x4393cd MOVAPD %XMM2,%XMM3 |
(317) 0x4393d1 CMPSD $0x2,%XMM9,%XMM3 |
(317) 0x4393d7 ANDPD %XMM3,%XMM2 |
(317) 0x4393db ANDNPD %XMM9,%XMM3 |
(317) 0x4393e0 ORPD %XMM2,%XMM3 |
(317) 0x4393e4 MULSD %XMM7,%XMM3 |
(317) 0x4393e8 DIVSD %XMM6,%XMM3 |
(317) 0x4393ec MOVAPD 0x129a2b(%RIP),%XMM10 |
(317) 0x4393f5 ANDPD %XMM10,%XMM1 |
(317) 0x4393fa ANDPD %XMM10,%XMM5 |
(317) 0x4393ff MULSD %XMM13,%XMM8 |
(317) 0x439404 MOVAPD %XMM8,%XMM2 |
(317) 0x439409 CMPSD $0x2,%XMM5,%XMM2 |
(317) 0x43940e ANDPD %XMM2,%XMM5 |
(317) 0x439412 ANDNPD %XMM8,%XMM2 |
(317) 0x439417 ORPD %XMM5,%XMM2 |
(317) 0x43941b MOVAPD %XMM2,%XMM5 |
(317) 0x43941f CMPSD $0x2,%XMM1,%XMM5 |
(317) 0x439424 MOVAPD %XMM5,%XMM6 |
(317) 0x439428 ANDNPD %XMM2,%XMM6 |
(317) 0x43942c ANDPD %XMM1,%XMM5 |
(317) 0x439430 ORPD %XMM6,%XMM5 |
(317) 0x439434 MOVAPD %XMM14,%XMM1 |
(317) 0x439439 MULSD %XMM12,%XMM1 |
(317) 0x43943e DIVSD %XMM5,%XMM1 |
(317) 0x439442 ANDPD %XMM10,%XMM0 |
(317) 0x439447 ANDPD %XMM10,%XMM4 |
(317) 0x43944c MOVAPD %XMM8,%XMM2 |
(317) 0x439451 CMPSD $0x2,%XMM4,%XMM2 |
(317) 0x439456 ANDPD %XMM2,%XMM4 |
(317) 0x43945a ANDNPD %XMM8,%XMM2 |
(317) 0x43945f ORPD %XMM4,%XMM2 |
(317) 0x439463 MOVAPD %XMM2,%XMM4 |
(317) 0x439467 CMPSD $0x2,%XMM0,%XMM4 |
(317) 0x43946c MOVAPD %XMM4,%XMM5 |
(317) 0x439470 ANDNPD %XMM2,%XMM5 |
(317) 0x439474 ANDPD %XMM0,%XMM4 |
(317) 0x439478 ORPD %XMM5,%XMM4 |
(317) 0x43947c MULSD -0x170(%RBP),%XMM14 |
(317) 0x439485 DIVSD %XMM4,%XMM14 |
(317) 0x43948a MOVAPD %XMM14,%XMM0 |
(317) 0x43948f CMPSD $0x2,%XMM11,%XMM0 |
(317) 0x439495 ANDPD %XMM0,%XMM14 |
(317) 0x43949a ANDNPD %XMM11,%XMM0 |
(317) 0x43949f ORPD %XMM14,%XMM0 |
(317) 0x4394a4 MOVAPD %XMM1,%XMM2 |
(317) 0x4394a8 CMPSD $0x2,%XMM0,%XMM2 |
(317) 0x4394ad MOVAPD %XMM2,%XMM4 |
(317) 0x4394b1 ANDNPD %XMM0,%XMM4 |
(317) 0x4394b5 ANDPD %XMM1,%XMM2 |
(317) 0x4394b9 ORPD %XMM4,%XMM2 |
(317) 0x4394bd MOVAPD %XMM3,%XMM0 |
(317) 0x4394c1 CMPSD $0x2,%XMM2,%XMM0 |
(317) 0x4394c6 MOVAPD %XMM0,%XMM1 |
(317) 0x4394ca ANDNPD %XMM2,%XMM1 |
(317) 0x4394ce ANDPD %XMM3,%XMM0 |
(317) 0x4394d2 ORPD %XMM1,%XMM0 |
(317) 0x4394d6 MOVAPD %XMM15,%XMM14 |
(317) 0x4394db CMPSD $0x2,%XMM0,%XMM14 |
(317) 0x4394e1 MOVAPD %XMM14,%XMM1 |
(317) 0x4394e6 ANDNPD %XMM0,%XMM1 |
(317) 0x4394ea ANDPD %XMM15,%XMM14 |
(317) 0x4394ef ORPD %XMM1,%XMM14 |
(317) 0x4394f4 INC %R9 |
(317) 0x4394f7 MOVAPD %XMM14,%XMM15 |
(317) 0x4394fc CMP %R9,-0x40(%RBP) |
(317) 0x439500 JE 438d90 |
(317) 0x439506 MOVUPD (%R14,%R9,8),%XMM0 |
(317) 0x43950c MOVUPD (%R11,%R9,8),%XMM2 |
(317) 0x439512 ADDPD %XMM0,%XMM2 |
(317) 0x439516 MOVUPD (%R10,%R9,8),%XMM1 |
(317) 0x43951c MULPD %XMM2,%XMM1 |
(317) 0x439520 MOVSD (%RDI,%R9,8),%XMM8 |
(317) 0x439526 MOVAPD %XMM8,%XMM14 |
(317) 0x43952b ADDSD %XMM8,%XMM14 |
(317) 0x439530 MOVSD 0x8(%RAX,%R9,8),%XMM0 |
(317) 0x439537 ADDSD (%RAX,%R9,8),%XMM0 |
(317) 0x43953d MULSD (%RDX,%R9,8),%XMM0 |
(317) 0x439543 MOVAPD %XMM1,%XMM5 |
(317) 0x439547 MOVSD 0x8(%R8,%R9,8),%XMM4 |
(317) 0x43954e ADDSD (%R8,%R9,8),%XMM4 |
(317) 0x439554 UNPCKHPD %XMM1,%XMM5 |
(317) 0x439558 MULSD (%RCX,%R9,8),%XMM4 |
(317) 0x43955e MOVAPD %XMM1,%XMM2 |
(317) 0x439562 ADDSD %XMM0,%XMM2 |
(317) 0x439566 MOVAPD %XMM5,%XMM3 |
(317) 0x43956a SUBSD %XMM2,%XMM3 |
(317) 0x43956e ADDSD %XMM4,%XMM3 |
(317) 0x439572 DIVSD %XMM14,%XMM3 |
(317) 0x439577 MOVSD 0xf3f01(%RIP),%XMM2 |
(317) 0x43957f UCOMISD %XMM3,%XMM2 |
(317) 0x439583 MOVSD 0xf3eec(%RIP),%XMM11 |
(317) 0x43958c JBE 4393a0 |
(317) 0x439592 MOVAPD -0x180(%RBP),%XMM11 |
(317) 0x43959b DIVSD %XMM3,%XMM11 |
(317) 0x4395a0 JMP 4393a0 |
0x4395a5 NOPW %CS:(%RAX,%RAX,1) |
0x4395af NOP |
Path / |
Source file and lines | calc_dt_kernel.f90:89-133 |
Module | exec |
nb instructions | 162 |
nb uops | 162 |
loop length | 707 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 5 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 34 |
micro-operation queue | 27.00 cycles |
front end | 27.00 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 18.75 | 18.75 | 18.50 | 18.50 | 5.50 | 19.33 | 19.33 | 19.33 | 0.00 | 0.00 | 0.50 | 0.50 | 1.00 | 1.00 |
cycles | 18.75 | 18.75 | 18.50 | 18.50 | 5.50 | 19.33 | 19.33 | 19.33 | 0.00 | 0.00 | 0.50 | 0.50 | 1.00 | 1.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 27.00 |
Dispatch | 19.33 |
Overall L1 | 27.00 |
all | 0% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 0% |
all | 22% |
load | 28% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 2% |
load | 20% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 11% |
load | 10% |
store | 10% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 10% |
all | 15% |
load | 16% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 11% |
load | 14% |
store | 11% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 10% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB $0x158,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RCX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x90(%RBP),%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x88(%RBP),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %ECX,%EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVL $0,-0x54(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
JS 438bf6 <calc_dt_kernel_module_mp_calc_dt_kernel_.DIR.OMP.PARALLEL.2+0x116> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R8,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDI,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVL $0,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %EAX,-0x2c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVL $0x1,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x50(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x54(%RBP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x30(%RBP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x2c(%RBP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x5720c0,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %ESI,-0x44(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CALL 404670 <__kmpc_for_static_init_4@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0x30(%RBP),%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x2c(%RBP),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %R9D,%EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %EAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
JAE 438c14 <calc_dt_kernel_module_mp_calc_dt_kernel_.DIR.OMP.PARALLEL.2+0x134> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOVSD 0xf48ef(%RIP),%XMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSD %XMM14,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
MOV $0x5720e0,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0x44(%RBP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CALL 404230 <__kmpc_for_static_fini@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x60(%RBP),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RBX),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x80(%RBP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x572100,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x4395b0,%R9D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x1,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x8,%ECX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PUSH $0x57933c | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CALL 404830 <__kmpc_reduce@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD $0x10,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP $0x1,%EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0x88(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
JNE 438bf6 <calc_dt_kernel_module_mp_calc_dt_kernel_.DIR.OMP.PARALLEL.2+0x116> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOVSD -0x80(%RBP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MINSD (%RAX),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 2 | 0.50 |
MOVSD %XMM0,(%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV $0x572120,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x57933c,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CALL 4049c0 <__kmpc_end_reduce@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x60(%RBP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV $0x572140,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CALL 404740 <__kmpc_barrier@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x158,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RBP),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x28(%RBP),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SAL $0x20,%R14 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV $-0x200000000,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
LEA (%R14,%RAX,1),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SAL $0x20,%R13 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD %R13,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAR $0x20,%R15 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %RCX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $-0x1,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $-0x1,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVNS %RCX,%RSI | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %RSI,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x1,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVG %RDI,%RSI | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV $0x200000000,%R12 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV %R12,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SUB %R14,%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP %R8,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVG %RCX,%R8 | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SHR $0x20,%R8 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IMUL %RSI,%R8 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (,%R8,8),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x8,%ESI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB %RCX,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x1,%R14D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R15,-0x100(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB %R15,%R14 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R14,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
TEST %RAX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVNS %RAX,%RDX | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %RDX,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVG %RDI,%RDX | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RBP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %R13,%R12 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP %R12,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVG %RAX,%R12 | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SHR $0x20,%R12 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IMUL %RDX,%R12 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0x48(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %RCX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB %RCX,%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R10,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB %RCX,%R11 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R11,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB %RCX,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDI,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x18(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %RCX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x40(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %RCX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
LEA (%RBX,%RSI,1),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB %RCX,%RBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RBX,-0xe8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
NEG %R12 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R12,-0xf8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x50(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD %RSI,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
ADD 0x10(%RBP),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV %RSI,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
NEG %R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R8,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVSD 0xf4716(%RIP),%XMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSD 0xf46dd(%RIP),%XMM13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVAPD 0xf48b4(%RIP),%XMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOVAPD 0x12a0ac(%RIP),%XMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOV 0x90(%RBP),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
LEA (%R9,%RAX,1),%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R9,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R9,-0xd8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
JMP 438dbb <calc_dt_kernel_module_mp_calc_dt_kernel_.DIR.OMP.PARALLEL.2+0x2db> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
Source file and lines | calc_dt_kernel.f90:89-133 |
Module | exec |
nb instructions | 162 |
nb uops | 162 |
loop length | 707 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 5 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 34 |
micro-operation queue | 27.00 cycles |
front end | 27.00 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 18.75 | 18.75 | 18.50 | 18.50 | 5.50 | 19.33 | 19.33 | 19.33 | 0.00 | 0.00 | 0.50 | 0.50 | 1.00 | 1.00 |
cycles | 18.75 | 18.75 | 18.50 | 18.50 | 5.50 | 19.33 | 19.33 | 19.33 | 0.00 | 0.00 | 0.50 | 0.50 | 1.00 | 1.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 27.00 |
Dispatch | 19.33 |
Overall L1 | 27.00 |
all | 0% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 0% |
all | 22% |
load | 28% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 2% |
load | 20% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 11% |
load | 10% |
store | 10% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 10% |
all | 15% |
load | 16% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 11% |
load | 14% |
store | 11% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 10% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB $0x158,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RCX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x90(%RBP),%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x88(%RBP),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %ECX,%EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVL $0,-0x54(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
JS 438bf6 <calc_dt_kernel_module_mp_calc_dt_kernel_.DIR.OMP.PARALLEL.2+0x116> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R8,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RDI,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVL $0,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %EAX,-0x2c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVL $0x1,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x50(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x54(%RBP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x30(%RBP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x2c(%RBP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x5720c0,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %ESI,-0x44(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CALL 404670 <__kmpc_for_static_init_4@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0x30(%RBP),%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x2c(%RBP),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %R9D,%EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %EAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
JAE 438c14 <calc_dt_kernel_module_mp_calc_dt_kernel_.DIR.OMP.PARALLEL.2+0x134> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOVSD 0xf48ef(%RIP),%XMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSD %XMM14,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
MOV $0x5720e0,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0x44(%RBP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CALL 404230 <__kmpc_for_static_fini@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x60(%RBP),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RBX),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x80(%RBP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x572100,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x4395b0,%R9D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x1,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x8,%ECX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PUSH $0x57933c | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CALL 404830 <__kmpc_reduce@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD $0x10,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP $0x1,%EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0x88(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
JNE 438bf6 <calc_dt_kernel_module_mp_calc_dt_kernel_.DIR.OMP.PARALLEL.2+0x116> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOVSD -0x80(%RBP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MINSD (%RAX),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 2 | 0.50 |
MOVSD %XMM0,(%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 1 | 1 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV $0x572120,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x57933c,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CALL 4049c0 <__kmpc_end_reduce@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x60(%RBP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV $0x572140,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CALL 404740 <__kmpc_barrier@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x158,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RBP),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV 0x28(%RBP),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SAL $0x20,%R14 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV $-0x200000000,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
LEA (%R14,%RAX,1),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SAL $0x20,%R13 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD %R13,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAR $0x20,%R15 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %RCX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $-0x1,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $-0x1,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVNS %RCX,%RSI | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %RSI,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x1,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVG %RDI,%RSI | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV $0x200000000,%R12 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV %R12,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SUB %R14,%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP %R8,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVG %RCX,%R8 | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SHR $0x20,%R8 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IMUL %RSI,%R8 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (,%R8,8),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x8,%ESI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB %RCX,%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x1,%R14D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R15,-0x100(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB %R15,%R14 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R14,-0xf0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
TEST %RAX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVNS %RAX,%RDX | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %RDX,%RDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVG %RDI,%RDX | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RBP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %R13,%R12 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP %R12,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMOVG %RAX,%R12 | 1 | 0.50 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SHR $0x20,%R12 | 1 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IMUL %RDX,%R12 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0x48(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %RCX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,-0xc8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB %RCX,%R10 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R10,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB %RCX,%R11 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R11,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB %RCX,%RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDI,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x18(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %RCX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x40(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %RCX,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
LEA (%RBX,%RSI,1),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB %RCX,%RBX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RBX,-0xe8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
NEG %R12 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R12,-0xf8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x50(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD %RSI,%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RAX,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
ADD 0x10(%RBP),%RSI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV %RSI,-0xd0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
NEG %R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R8,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVSD 0xf4716(%RIP),%XMM14 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVSD 0xf46dd(%RIP),%XMM13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOVAPD 0xf48b4(%RIP),%XMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOVAPD 0x12a0ac(%RIP),%XMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOV 0x90(%RBP),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
LEA (%R9,%RAX,1),%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
MOV %R9,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R9,-0xd8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
JMP 438dbb <calc_dt_kernel_module_mp_calc_dt_kernel_.DIR.OMP.PARALLEL.2+0x2db> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPL (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOP | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼calc_dt_kernel_.DIR.OMP.PARALLEL.2– | 3.27 | 1.7 |
▼Loop 316 - calc_dt_kernel.f90:92-129 - exec– | 0.03 | 0.01 |
○Loop 318 - calc_dt_kernel.f90:94-129 - exec | 3.24 | 1.68 |
○Loop 317 - calc_dt_kernel.f90:94-129 - exec | 0 | 0 |