Function: field_summary_kernel_.DIR.OMP.PARALLEL.2 | Module: exec | Source: field_summary_kernel.f90:54-74 | Coverage: 0.29% |
---|
Function: field_summary_kernel_.DIR.OMP.PARALLEL.2 | Module: exec | Source: field_summary_kernel.f90:54-74 | Coverage: 0.29% |
---|
/scratch_na/users/xoserete/qaas_runs/171-214-9740/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/field_summary_kernel.f90: 54 - 74 |
-------------------------------------------------------------------------------- |
54: !$OMP PARALLEL |
55: !$OMP DO PRIVATE(vsqrd,cell_vol,cell_mass) REDUCTION(+ : vol,mass,press,ie,ke) |
56: DO k=y_min,y_max |
57: !$OMP SIMD |
58: DO j=x_min,x_max |
59: vsqrd=0.0 |
60: DO kv=k,k+1 |
61: DO jv=j,j+1 |
62: vsqrd=vsqrd+0.25*(xvel0(jv,kv)**2+yvel0(jv,kv)**2) |
63: ENDDO |
64: ENDDO |
65: cell_vol=volume(j,k) |
66: cell_mass=cell_vol*density0(j,k) |
67: vol=vol+cell_vol |
68: mass=mass+cell_mass |
69: ie=ie+cell_mass*energy0(j,k) |
70: ke=ke+cell_mass*0.5*vsqrd |
71: press=press+cell_vol*pressure(j,k) |
72: ENDDO |
73: ENDDO |
74: !$OMP END DO |
0x4408c0 PUSH %RBP |
0x4408c1 MOV %RSP,%RBP |
0x4408c4 PUSH %R15 |
0x4408c6 PUSH %R14 |
0x4408c8 PUSH %R13 |
0x4408ca PUSH %R12 |
0x4408cc PUSH %RBX |
0x4408cd SUB $0x98,%RSP |
0x4408d4 MOV %R9,-0x90(%RBP) |
0x4408db MOV %R8,-0x88(%RBP) |
0x4408e2 MOV 0x60(%RBP),%EBX |
0x4408e5 MOV 0x58(%RBP),%EAX |
0x4408e8 SUB %EBX,%EAX |
0x4408ea MOVL $0,-0x54(%RBP) |
0x4408f1 JS 44119f |
0x4408f7 MOV %RCX,%R14 |
0x4408fa MOV %RDX,%R13 |
0x4408fd MOV %RDI,-0x30(%RBP) |
0x440901 MOV (%RDI),%ESI |
0x440903 MOVL $0,-0x3c(%RBP) |
0x44090a MOV %EAX,-0x38(%RBP) |
0x44090d MOVL $0x1,-0x50(%RBP) |
0x440914 SUB $0x8,%RSP |
0x440918 LEA -0x50(%RBP),%RAX |
0x44091c LEA -0x54(%RBP),%RCX |
0x440920 LEA -0x3c(%RBP),%R8 |
0x440924 LEA -0x38(%RBP),%R9 |
0x440928 MOV $0x74d290,%EDI |
0x44092d MOV %ESI,-0x4c(%RBP) |
0x440930 MOV $0x22,%EDX |
0x440935 PUSH $0x1 |
0x440937 PUSH $0x1 |
0x440939 PUSH %RAX |
0x44093a CALL 4044c0 <__kmpc_for_static_init_4@plt> |
0x44093f ADD $0x20,%RSP |
0x440943 MOV -0x3c(%RBP),%ESI |
0x440946 MOV -0x38(%RBP),%R8D |
0x44094a VXORPD %XMM1,%XMM1,%XMM1 |
0x44094e VXORPD %XMM0,%XMM0,%XMM0 |
0x440952 VXORPD %XMM2,%XMM2,%XMM2 |
0x440956 VXORPD %XMM3,%XMM3,%XMM3 |
0x44095a VXORPD %XMM4,%XMM4,%XMM4 |
0x44095e SUB %ESI,%R8D |
0x440961 JAE 440a80 |
0x440967 MOV 0x20(%RBP),%R15 |
0x44096b MOV 0x18(%RBP),%R14 |
0x44096f MOV 0x10(%RBP),%R13 |
0x440973 VMOVSD %XMM4,-0x80(%RBP) |
0x440978 VMOVSD %XMM3,-0x78(%RBP) |
0x44097d VMOVSD %XMM2,-0x70(%RBP) |
0x440982 VMOVSD %XMM0,-0x68(%RBP) |
0x440987 VMOVSD %XMM1,-0x60(%RBP) |
0x44098c MOV $0x74d2b0,%EDI |
0x440991 MOV -0x4c(%RBP),%ESI |
0x440994 VZEROUPPER |
0x440997 CALL 4040b0 <__kmpc_for_static_fini@plt> |
0x44099c MOV -0x30(%RBP),%RAX |
0x4409a0 MOV (%RAX),%ESI |
0x4409a2 SUB $0x8,%RSP |
0x4409a6 LEA -0x80(%RBP),%R8 |
0x4409aa MOV $0x74d370,%EDI |
0x4409af MOV $0x4411c0,%R9D |
0x4409b5 MOV $0x5,%EDX |
0x4409ba MOV $0x28,%ECX |
0x4409bf PUSH $0x75433c |
0x4409c4 CALL 4046a0 <__kmpc_reduce@plt> |
0x4409c9 ADD $0x10,%RSP |
0x4409cd CMP $0x2,%EAX |
0x4409d0 JGE 441100 |
0x4409d6 CMP $0x1,%EAX |
0x4409d9 MOV -0x30(%RBP),%RDI |
0x4409dd JNE 44119f |
0x4409e3 VMOVSD -0x80(%RBP),%XMM0 |
0x4409e8 VADDSD (%R15),%XMM0,%XMM0 |
0x4409ed VMOVSD %XMM0,(%R15) |
0x4409f2 VMOVSD -0x78(%RBP),%XMM0 |
0x4409f7 VADDSD (%R14),%XMM0,%XMM0 |
0x4409fc VMOVSD %XMM0,(%R14) |
0x440a01 VMOVSD -0x70(%RBP),%XMM0 |
0x440a06 MOV -0x88(%RBP),%RAX |
0x440a0d VADDSD (%RAX),%XMM0,%XMM0 |
0x440a11 VMOVSD %XMM0,(%RAX) |
0x440a15 VMOVSD -0x68(%RBP),%XMM0 |
0x440a1a VADDSD (%R13),%XMM0,%XMM0 |
0x440a20 VMOVSD %XMM0,(%R13) |
0x440a26 VMOVSD -0x60(%RBP),%XMM0 |
0x440a2b MOV -0x90(%RBP),%RAX |
0x440a32 VADDSD (%RAX),%XMM0,%XMM0 |
0x440a36 VMOVSD %XMM0,(%RAX) |
0x440a3a MOV (%RDI),%ESI |
0x440a3c MOV $0x74d390,%EDI |
0x440a41 JMP 441191 |
0x440a46 NOPW %CS:(%RAX,%RAX,1) |
0x440a55 NOPW %CS:(%RAX,%RAX,1) |
0x440a64 NOPW %CS:(%RAX,%RAX,1) |
0x440a73 NOPW %CS:(%RAX,%RAX,1) |
0x440a80 MOV 0xa0(%RBP),%R9 |
0x440a87 ADD %EBX,%ESI |
0x440a89 ADD $-0x2,%R14D |
0x440a8d MOVSXD %R14D,%RAX |
0x440a90 MOV %RAX,-0x98(%RBP) |
0x440a97 ADD $-0x2,%R13D |
0x440a9b MOVSXD %R13D,%RAX |
0x440a9e MOV %RAX,-0xa8(%RBP) |
0x440aa5 VMOVDQA64 0xc92d1(%RIP),%ZMM5 |
0x440aaf VPBROADCASTQ 0xca26f(%RIP),%ZMM6 |
0x440ab9 VBROADCASTSD 0xca25d(%RIP),%ZMM7 |
0x440ac3 MOV 0x28(%RBP),%R10 |
0x440ac7 XOR %R13D,%R13D |
0x440aca MOV %RSI,-0xa0(%RBP) |
0x440ad1 MOV %R8D,-0x34(%RBP) |
0x440ad5 JMP 440c01 |
0x440ada NOPW %CS:(%RAX,%RAX,1) |
0x440ae9 NOPW %CS:(%RAX,%RAX,1) |
0x440af8 NOPL (%RAX,%RAX,1) |
(333) 0x440b00 VEXTRACTF64X4 $0x1,%ZMM13,%YMM9 |
(333) 0x440b07 VADDPD %ZMM9,%ZMM13,%ZMM9 |
(333) 0x440b0d VMOVAPD %XMM9,%XMM13 |
(333) 0x440b12 VEXTRACTF128 $0x1,%YMM9,%XMM9 |
(333) 0x440b18 VADDPD %XMM9,%XMM13,%XMM9 |
(333) 0x440b1d VSHUFPD $0x1,%XMM9,%XMM9,%XMM13 |
(333) 0x440b23 VADDSD %XMM13,%XMM9,%XMM9 |
(333) 0x440b28 VADDSD %XMM2,%XMM9,%XMM2 |
(333) 0x440b2c VEXTRACTF64X4 $0x1,%ZMM12,%YMM9 |
(333) 0x440b33 VADDPD %ZMM9,%ZMM12,%ZMM9 |
(333) 0x440b39 VMOVAPD %XMM9,%XMM12 |
(333) 0x440b3e VEXTRACTF128 $0x1,%YMM9,%XMM9 |
(333) 0x440b44 VADDPD %XMM9,%XMM12,%XMM9 |
(333) 0x440b49 VSHUFPD $0x1,%XMM9,%XMM9,%XMM12 |
(333) 0x440b4f VADDSD %XMM12,%XMM9,%XMM9 |
(333) 0x440b54 VADDSD %XMM1,%XMM9,%XMM1 |
(333) 0x440b58 VEXTRACTF64X4 $0x1,%ZMM11,%YMM9 |
(333) 0x440b5f VADDPD %ZMM9,%ZMM11,%ZMM9 |
(333) 0x440b65 VMOVAPD %XMM9,%XMM11 |
(333) 0x440b6a VEXTRACTF128 $0x1,%YMM9,%XMM9 |
(333) 0x440b70 VADDPD %XMM9,%XMM11,%XMM9 |
(333) 0x440b75 VSHUFPD $0x1,%XMM9,%XMM9,%XMM11 |
(333) 0x440b7b VADDSD %XMM11,%XMM9,%XMM9 |
(333) 0x440b80 VADDSD %XMM0,%XMM9,%XMM0 |
(333) 0x440b84 VEXTRACTF64X4 $0x1,%ZMM10,%YMM9 |
(333) 0x440b8b VADDPD %ZMM9,%ZMM10,%ZMM9 |
(333) 0x440b91 VMOVAPD %XMM9,%XMM10 |
(333) 0x440b96 VEXTRACTF128 $0x1,%YMM9,%XMM9 |
(333) 0x440b9c VADDPD %XMM9,%XMM10,%XMM9 |
(333) 0x440ba1 VSHUFPD $0x1,%XMM9,%XMM9,%XMM10 |
(333) 0x440ba7 VADDSD %XMM10,%XMM9,%XMM9 |
(333) 0x440bac VADDSD %XMM3,%XMM9,%XMM3 |
(333) 0x440bb0 VEXTRACTF64X4 $0x1,%ZMM8,%YMM9 |
(333) 0x440bb7 VADDPD %ZMM9,%ZMM8,%ZMM8 |
(333) 0x440bbd VMOVAPD %XMM8,%XMM9 |
(333) 0x440bc2 VEXTRACTF128 $0x1,%YMM8,%XMM8 |
(333) 0x440bc8 VADDPD %XMM8,%XMM9,%XMM8 |
(333) 0x440bcd VSHUFPD $0x1,%XMM8,%XMM8,%XMM9 |
(333) 0x440bd3 VADDSD %XMM9,%XMM8,%XMM8 |
(333) 0x440bd8 VADDSD %XMM4,%XMM8,%XMM4 |
(333) 0x440bdc MOV 0x28(%RBP),%R10 |
(333) 0x440be0 MOV -0xa0(%RBP),%RSI |
(333) 0x440be7 MOV -0x34(%RBP),%R8D |
(333) 0x440beb MOV -0xb8(%RBP),%RCX |
(333) 0x440bf2 LEA 0x1(%RCX),%EAX |
(333) 0x440bf5 CMP %R8D,%ECX |
(333) 0x440bf8 MOV %EAX,%R13D |
(333) 0x440bfb JE 440967 |
(333) 0x440c01 MOV 0x70(%RBP),%RAX |
(333) 0x440c05 MOV (%RAX),%EDX |
(333) 0x440c07 MOV 0x68(%RBP),%RAX |
(333) 0x440c0b MOV (%RAX),%EDI |
(333) 0x440c0d SUB %EDX,%EDI |
(333) 0x440c0f MOV %R13,-0xb8(%RBP) |
(333) 0x440c16 JS 440beb |
(333) 0x440c18 LEA (%RSI,%R13,1),%R8D |
(333) 0x440c1c MOV 0x78(%RBP),%RAX |
(333) 0x440c20 MOV (%RAX),%R14 |
(333) 0x440c23 MOV 0x80(%RBP),%RAX |
(333) 0x440c2a MOV (%RAX),%R11 |
(333) 0x440c2d MOV 0x88(%RBP),%RAX |
(333) 0x440c34 MOV (%RAX),%R15 |
(333) 0x440c37 MOV 0x90(%RBP),%RAX |
(333) 0x440c3e MOV (%RAX),%RAX |
(333) 0x440c41 MOV 0x98(%RBP),%RCX |
(333) 0x440c48 MOV (%RCX),%RCX |
(333) 0x440c4b VPBROADCASTD %EDX,%YMM8 |
(333) 0x440c51 MOV (%R9),%R12 |
(333) 0x440c54 INC %EDI |
(333) 0x440c56 CMP $0x2,%EDI |
(333) 0x440c59 MOV $0x1,%EDX |
(333) 0x440c5e CMOVL %EDX,%EDI |
(333) 0x440c61 MOVSXD %R8D,%RDX |
(333) 0x440c64 CMP $0x8,%EDI |
(333) 0x440c67 JAE 440c80 |
(333) 0x440c69 MOVQ $0,-0x48(%RBP) |
(333) 0x440c71 MOV 0x38(%RBP),%R13 |
(333) 0x440c75 JMP 440f0b |
0x440c7a NOPW (%RAX,%RAX,1) |
(333) 0x440c80 MOV %RDI,-0xb0(%RBP) |
(333) 0x440c87 AND $0x7ffffff8,%EDI |
(333) 0x440c8d MOV %RDI,-0x48(%RBP) |
(333) 0x440c91 VXORPD %XMM13,%XMM13,%XMM13 |
(333) 0x440c96 VPMOVSXDQ %XMM8,%XMM14 |
(333) 0x440c9b VXORPD %XMM12,%XMM12,%XMM12 |
(333) 0x440ca0 VXORPD %XMM11,%XMM11,%XMM11 |
(333) 0x440ca5 VXORPD %XMM10,%XMM10,%XMM10 |
(333) 0x440caa VXORPD %XMM9,%XMM9,%XMM9 |
(333) 0x440caf XOR %EBX,%EBX |
(333) 0x440cb1 VMOVDQA64 %ZMM5,%ZMM15 |
(333) 0x440cb7 MOV -0x98(%RBP),%RDI |
(333) 0x440cbe MOV 0x30(%RBP),%RSI |
(333) 0x440cc2 NOPW %CS:(%RAX,%RAX,1) |
(334) 0x440cd0 MOV %RDX,%R13 |
(334) 0x440cd3 SUB -0xa8(%RBP),%RDX |
(334) 0x440cda MOV %R14,%R9 |
(334) 0x440cdd IMUL %RDX,%R9 |
(334) 0x440ce1 ADD %RSI,%R9 |
(334) 0x440ce4 VMOVDQA64 %XMM15,%XMM16 |
(334) 0x440cea VPADDQ %XMM14,%XMM15,%XMM16 |
(334) 0x440cf0 VMOVQ %XMM16,%R8 |
(334) 0x440cf6 SUB %RDI,%R8 |
(334) 0x440cf9 VMOVUPD (%R9,%R8,8),%ZMM16 |
(334) 0x440d00 VMOVUPD 0x8(%R9,%R8,8),%ZMM17 |
(334) 0x440d0b MOV %R11,%R9 |
(334) 0x440d0e IMUL %RDX,%R9 |
(334) 0x440d12 ADD %R10,%R9 |
(334) 0x440d15 VMOVUPD (%R9,%R8,8),%ZMM18 |
(334) 0x440d1c VMOVUPD 0x8(%R9,%R8,8),%ZMM19 |
(334) 0x440d27 LEA 0x1(%RDX),%R9 |
(334) 0x440d2b MOV %R14,%R10 |
(334) 0x440d2e IMUL %R9,%R10 |
(334) 0x440d32 ADD %RSI,%R10 |
(334) 0x440d35 VMOVUPD (%R10,%R8,8),%ZMM20 |
(334) 0x440d3c VMOVUPD 0x8(%R10,%R8,8),%ZMM21 |
(334) 0x440d47 MOV %R15,%R10 |
(334) 0x440d4a IMUL %RDX,%R10 |
(334) 0x440d4e ADD 0x50(%RBP),%R10 |
(334) 0x440d52 VMOVUPD (%R10,%R8,8),%ZMM22 |
(334) 0x440d59 MOV %RAX,%R10 |
(334) 0x440d5c IMUL %RDX,%R10 |
(334) 0x440d60 ADD 0x48(%RBP),%R10 |
(334) 0x440d64 VMULPD (%R10,%R8,8),%ZMM22,%ZMM23 |
(334) 0x440d6b MOV 0x28(%RBP),%R10 |
(334) 0x440d6f IMUL %R11,%R9 |
(334) 0x440d73 ADD %R10,%R9 |
(334) 0x440d76 VMOVUPD (%R9,%R8,8),%ZMM24 |
(334) 0x440d7d VMOVUPD 0x8(%R9,%R8,8),%ZMM25 |
(334) 0x440d88 MOV %RCX,%R9 |
(334) 0x440d8b IMUL %RDX,%R9 |
(334) 0x440d8f ADD 0x40(%RBP),%R9 |
(334) 0x440d93 VFMADD231PD (%R9,%R8,8),%ZMM23,%ZMM11 |
(334) 0x440d9a IMUL %R12,%RDX |
(334) 0x440d9e ADD 0x38(%RBP),%RDX |
(334) 0x440da2 VFMADD231PD (%RDX,%R8,8),%ZMM22,%ZMM13 |
(334) 0x440da9 MOV %R13,%RDX |
(334) 0x440dac VMULPD %ZMM16,%ZMM16,%ZMM16 |
(334) 0x440db2 VFMADD213PD %ZMM16,%ZMM18,%ZMM18 |
(334) 0x440db8 VFMADD231PD %ZMM17,%ZMM17,%ZMM18 |
(334) 0x440dbe VFMADD231PD %ZMM19,%ZMM19,%ZMM18 |
(334) 0x440dc4 VFMADD213PD %ZMM18,%ZMM20,%ZMM20 |
(334) 0x440dca VFMADD213PD %ZMM20,%ZMM24,%ZMM24 |
(334) 0x440dd0 VFMADD231PD %ZMM21,%ZMM21,%ZMM24 |
(334) 0x440dd6 VFMADD231PD %ZMM25,%ZMM25,%ZMM24 |
(334) 0x440ddc VADDPD %ZMM22,%ZMM9,%ZMM9 |
(334) 0x440de2 VADDPD %ZMM23,%ZMM10,%ZMM10 |
(334) 0x440de8 VMULPD %ZMM24,%ZMM23,%ZMM16 |
(334) 0x440dee VFMADD231PD %ZMM7,%ZMM16,%ZMM12 |
(334) 0x440df4 VPADDQ %ZMM6,%ZMM15,%ZMM15 |
(334) 0x440dfa ADD $0x8,%RBX |
(334) 0x440dfe CMP -0x48(%RBP),%RBX |
(334) 0x440e02 JB 440cd0 |
(333) 0x440e08 VEXTRACTF64X4 $0x1,%ZMM13,%YMM14 |
(333) 0x440e0f VADDPD %ZMM14,%ZMM13,%ZMM13 |
(333) 0x440e15 VMOVAPD %XMM13,%XMM14 |
(333) 0x440e1a VEXTRACTF128 $0x1,%YMM13,%XMM13 |
(333) 0x440e20 VADDPD %XMM13,%XMM14,%XMM13 |
(333) 0x440e25 VSHUFPD $0x1,%XMM13,%XMM13,%XMM14 |
(333) 0x440e2b VADDSD %XMM14,%XMM13,%XMM13 |
(333) 0x440e30 VADDSD %XMM2,%XMM13,%XMM2 |
(333) 0x440e34 VEXTRACTF64X4 $0x1,%ZMM12,%YMM13 |
(333) 0x440e3b VADDPD %ZMM13,%ZMM12,%ZMM12 |
(333) 0x440e41 VMOVAPD %XMM12,%XMM13 |
(333) 0x440e46 VEXTRACTF128 $0x1,%YMM12,%XMM12 |
(333) 0x440e4c VADDPD %XMM12,%XMM13,%XMM12 |
(333) 0x440e51 VSHUFPD $0x1,%XMM12,%XMM12,%XMM13 |
(333) 0x440e57 VADDSD %XMM13,%XMM12,%XMM12 |
(333) 0x440e5c VADDSD %XMM1,%XMM12,%XMM1 |
(333) 0x440e60 VEXTRACTF64X4 $0x1,%ZMM11,%YMM12 |
(333) 0x440e67 VADDPD %ZMM12,%ZMM11,%ZMM11 |
(333) 0x440e6d VMOVAPD %XMM11,%XMM12 |
(333) 0x440e72 VEXTRACTF128 $0x1,%YMM11,%XMM11 |
(333) 0x440e78 VADDPD %XMM11,%XMM12,%XMM11 |
(333) 0x440e7d VSHUFPD $0x1,%XMM11,%XMM11,%XMM12 |
(333) 0x440e83 VADDSD %XMM12,%XMM11,%XMM11 |
(333) 0x440e88 VADDSD %XMM0,%XMM11,%XMM0 |
(333) 0x440e8c VEXTRACTF64X4 $0x1,%ZMM10,%YMM11 |
(333) 0x440e93 VADDPD %ZMM11,%ZMM10,%ZMM10 |
(333) 0x440e99 VMOVAPD %XMM10,%XMM11 |
(333) 0x440e9e VEXTRACTF128 $0x1,%YMM10,%XMM10 |
(333) 0x440ea4 VADDPD %XMM10,%XMM11,%XMM10 |
(333) 0x440ea9 VSHUFPD $0x1,%XMM10,%XMM10,%XMM11 |
(333) 0x440eaf VADDSD %XMM11,%XMM10,%XMM10 |
(333) 0x440eb4 VADDSD %XMM3,%XMM10,%XMM3 |
(333) 0x440eb8 VEXTRACTF64X4 $0x1,%ZMM9,%YMM10 |
(333) 0x440ebf VADDPD %ZMM10,%ZMM9,%ZMM9 |
(333) 0x440ec5 VMOVAPD %XMM9,%XMM10 |
(333) 0x440eca VEXTRACTF128 $0x1,%YMM9,%XMM9 |
(333) 0x440ed0 VADDPD %XMM9,%XMM10,%XMM9 |
(333) 0x440ed5 VSHUFPD $0x1,%XMM9,%XMM9,%XMM10 |
(333) 0x440edb VADDSD %XMM10,%XMM9,%XMM9 |
(333) 0x440ee0 VADDSD %XMM4,%XMM9,%XMM4 |
(333) 0x440ee4 MOV -0xb0(%RBP),%RDI |
(333) 0x440eeb CMP %RDI,-0x48(%RBP) |
(333) 0x440eef MOV -0xa0(%RBP),%RSI |
(333) 0x440ef6 MOV -0x34(%RBP),%R8D |
(333) 0x440efa MOV 0xa0(%RBP),%R9 |
(333) 0x440f01 MOV 0x38(%RBP),%R13 |
(333) 0x440f05 JE 440beb |
(333) 0x440f0b MOV -0x48(%RBP),%RSI |
(333) 0x440f0f VMOVQ %RSI,%XMM10 |
(333) 0x440f14 SUB %RSI,%RDI |
(333) 0x440f17 VPBROADCASTQ %RDI,%ZMM9 |
(333) 0x440f1d MOV %R10,%R8 |
(333) 0x440f20 MOV -0xa8(%RBP),%RSI |
(333) 0x440f27 SUB %RSI,%RDX |
(333) 0x440f2a MOV %R14,%RSI |
(333) 0x440f2d MOV %R11,%RDI |
(333) 0x440f30 LEA 0x1(%RDX),%RBX |
(333) 0x440f34 IMUL %RBX,%R14 |
(333) 0x440f38 IMUL %RBX,%R11 |
(333) 0x440f3c IMUL %RDX,%RSI |
(333) 0x440f40 IMUL %RDX,%RDI |
(333) 0x440f44 IMUL %RDX,%R15 |
(333) 0x440f48 IMUL %RDX,%RAX |
(333) 0x440f4c IMUL %RDX,%RCX |
(333) 0x440f50 IMUL %RDX,%R12 |
(333) 0x440f54 VXORPD %XMM13,%XMM13,%XMM13 |
(333) 0x440f59 MOV 0x30(%RBP),%RDX |
(333) 0x440f5d ADD %RDX,%RSI |
(333) 0x440f60 VMOVDQA %XMM10,%XMM14 |
(333) 0x440f65 VPMOVSXDQ %XMM8,%XMM15 |
(333) 0x440f6a ADD %R10,%RDI |
(333) 0x440f6d ADD %RDX,%R14 |
(333) 0x440f70 ADD %R10,%R11 |
(333) 0x440f73 ADD 0x50(%RBP),%R15 |
(333) 0x440f77 ADD 0x48(%RBP),%RAX |
(333) 0x440f7b ADD 0x40(%RBP),%RCX |
(333) 0x440f7f ADD %R13,%R12 |
(333) 0x440f82 VXORPD %XMM12,%XMM12,%XMM12 |
(333) 0x440f87 VXORPD %XMM11,%XMM11,%XMM11 |
(333) 0x440f8c VPXOR %XMM10,%XMM10,%XMM10 |
(333) 0x440f91 VPXOR %XMM8,%XMM8,%XMM8 |
(333) 0x440f96 VMOVDQA64 %ZMM5,%ZMM16 |
(333) 0x440f9c MOV -0x98(%RBP),%R13 |
(333) 0x440fa3 JMP 440ff5 |
0x440fa5 NOPW %CS:(%RAX,%RAX,1) |
0x440fb4 NOPW %CS:(%RAX,%RAX,1) |
(335) 0x440fc0 VMOVAPD %ZMM17,%ZMM8{%K1} |
(335) 0x440fc6 VMOVAPD %ZMM18,%ZMM10{%K1} |
(335) 0x440fcc VMOVAPD %ZMM19,%ZMM11{%K1} |
(335) 0x440fd2 VMOVAPD %ZMM20,%ZMM12{%K1} |
(335) 0x440fd8 VMOVAPD %ZMM21,%ZMM13{%K1} |
(335) 0x440fde VPADDQ %ZMM6,%ZMM16,%ZMM16 |
(335) 0x440fe4 VPCMPLTUQ %ZMM9,%ZMM16,%K0 |
(335) 0x440feb KORTESTB %K0,%K0 |
(335) 0x440fef JE 440b00 |
(335) 0x440ff5 VPCMPLTUQ %ZMM9,%ZMM16,%K1 |
(335) 0x440ffc KORTESTB %K1,%K1 |
(335) 0x441000 VXORPD %XMM17,%XMM17,%XMM17 |
(335) 0x441006 VXORPD %XMM18,%XMM18,%XMM18 |
(335) 0x44100c VXORPD %XMM19,%XMM19,%XMM19 |
(335) 0x441012 VXORPD %XMM20,%XMM20,%XMM20 |
(335) 0x441018 VXORPD %XMM21,%XMM21,%XMM21 |
(335) 0x44101e JE 440fc0 |
(335) 0x441020 VMOVDQA64 %XMM16,%XMM17 |
(335) 0x441026 VPADDQ %XMM14,%XMM16,%XMM17 |
(335) 0x44102c VPADDQ %XMM15,%XMM17,%XMM17 |
(335) 0x441032 VMOVQ %XMM17,%RDX |
(335) 0x441038 SUB %R13,%RDX |
(335) 0x44103b VMOVUPD (%RSI,%RDX,8),%ZMM17{%K1}{z} |
(335) 0x441042 VMULPD %ZMM17,%ZMM17,%ZMM17 |
(335) 0x441048 VMOVUPD (%RDI,%RDX,8),%ZMM18{%K1}{z} |
(335) 0x44104f VMOVUPD 0x8(%RSI,%RDX,8),%ZMM19{%K1}{z} |
(335) 0x44105a VMOVUPD 0x8(%RDI,%RDX,8),%ZMM20{%K1}{z} |
(335) 0x441065 VFMADD213PD %ZMM17,%ZMM18,%ZMM18 |
(335) 0x44106b VFMADD213PD %ZMM18,%ZMM19,%ZMM19 |
(335) 0x441071 VMOVUPD (%R14,%RDX,8),%ZMM17{%K1}{z} |
(335) 0x441078 VMOVUPD (%R11,%RDX,8),%ZMM18{%K1}{z} |
(335) 0x44107f VFMADD231PD %ZMM20,%ZMM20,%ZMM19 |
(335) 0x441085 VFMADD213PD %ZMM19,%ZMM17,%ZMM17 |
(335) 0x44108b VMOVUPD 0x8(%R14,%RDX,8),%ZMM20{%K1}{z} |
(335) 0x441096 VMOVUPD 0x8(%R11,%RDX,8),%ZMM19{%K1}{z} |
(335) 0x4410a1 VFMADD231PD %ZMM18,%ZMM18,%ZMM17 |
(335) 0x4410a7 VFMADD213PD %ZMM17,%ZMM20,%ZMM20 |
(335) 0x4410ad VMOVUPD (%R15,%RDX,8),%ZMM22{%K1}{z} |
(335) 0x4410b4 VMOVUPD (%RAX,%RDX,8),%ZMM17{%K1}{z} |
(335) 0x4410bb VFMADD231PD %ZMM19,%ZMM19,%ZMM20 |
(335) 0x4410c1 VMULPD %ZMM22,%ZMM17,%ZMM21 |
(335) 0x4410c7 VADDPD %ZMM22,%ZMM8,%ZMM17 |
(335) 0x4410cd VADDPD %ZMM21,%ZMM10,%ZMM18 |
(335) 0x4410d3 VMOVUPD (%RCX,%RDX,8),%ZMM19{%K1}{z} |
(335) 0x4410da VFMADD213PD %ZMM11,%ZMM21,%ZMM19 |
(335) 0x4410e0 VMULPD %ZMM20,%ZMM21,%ZMM20 |
(335) 0x4410e6 VFMADD132PD %ZMM7,%ZMM12,%ZMM20 |
(335) 0x4410ec VMOVUPD (%R12,%RDX,8),%ZMM21{%K1}{z} |
(335) 0x4410f3 VFMADD213PD %ZMM13,%ZMM22,%ZMM21 |
(335) 0x4410f9 JMP 440fc0 |
0x4410fe XCHG %AX,%AX |
0x441100 MOV -0x30(%RBP),%RDI |
0x441104 JNE 44119f |
0x44110a VMOVSD -0x80(%RBP),%XMM0 |
0x44110f MOV (%RDI),%ESI |
0x441111 MOV $0x74d2d0,%EDI |
0x441116 MOV %R15,%RDX |
0x441119 CALL 4041b0 <__kmpc_atomic_float8_add@plt> |
0x44111e VMOVSD -0x78(%RBP),%XMM0 |
0x441123 MOV -0x30(%RBP),%RAX |
0x441127 MOV (%RAX),%ESI |
0x441129 MOV $0x74d2f0,%EDI |
0x44112e MOV %R14,%RDX |
0x441131 CALL 4041b0 <__kmpc_atomic_float8_add@plt> |
0x441136 VMOVSD -0x70(%RBP),%XMM0 |
0x44113b MOV -0x30(%RBP),%RAX |
0x44113f MOV (%RAX),%ESI |
0x441141 MOV $0x74d310,%EDI |
0x441146 MOV -0x88(%RBP),%RDX |
0x44114d CALL 4041b0 <__kmpc_atomic_float8_add@plt> |
0x441152 VMOVSD -0x68(%RBP),%XMM0 |
0x441157 MOV -0x30(%RBP),%RAX |
0x44115b MOV (%RAX),%ESI |
0x44115d MOV $0x74d330,%EDI |
0x441162 MOV %R13,%RDX |
0x441165 CALL 4041b0 <__kmpc_atomic_float8_add@plt> |
0x44116a VMOVSD -0x60(%RBP),%XMM0 |
0x44116f MOV -0x30(%RBP),%RAX |
0x441173 MOV (%RAX),%ESI |
0x441175 MOV $0x74d350,%EDI |
0x44117a MOV -0x90(%RBP),%RDX |
0x441181 CALL 4041b0 <__kmpc_atomic_float8_add@plt> |
0x441186 MOV -0x30(%RBP),%RAX |
0x44118a MOV (%RAX),%ESI |
0x44118c MOV $0x74d3b0,%EDI |
0x441191 MOV $0x75433c,%EDX |
0x441196 CALL 404820 <__kmpc_end_reduce@plt> |
0x44119b MOV -0x30(%RBP),%RDI |
0x44119f MOV (%RDI),%ESI |
0x4411a1 MOV $0x74d3d0,%EDI |
0x4411a6 CALL 404580 <__kmpc_barrier@plt> |
0x4411ab ADD $0x98,%RSP |
0x4411b2 POP %RBX |
0x4411b3 POP %R12 |
0x4411b5 POP %R13 |
0x4411b7 POP %R14 |
0x4411b9 POP %R15 |
0x4411bb POP %RBP |
0x4411bc RET |
0x4411bd NOPL (%RAX) |
Path / |
Source file and lines | field_summary_kernel.f90:54-74 |
Module | exec |
nb instructions | 168 |
nb uops | 179 |
loop length | 803 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 5 |
used ymm registers | 0 |
used zmm registers | 3 |
nb stack references | 24 |
micro-operation queue | 29.83 cycles |
front end | 29.83 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 7.60 | 7.70 | 19.33 | 19.33 | 21.00 | 7.50 | 7.60 | 21.00 | 21.00 | 21.00 | 7.60 | 19.33 |
cycles | 7.60 | 7.70 | 19.33 | 19.33 | 21.00 | 7.50 | 7.60 | 21.00 | 21.00 | 21.00 | 7.60 | 19.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 28.17 |
Stall cycles | 0.00 |
Front-end | 29.83 |
Dispatch | 21.00 |
Overall L1 | 29.83 |
all | 4% |
load | 5% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 8% |
all | 16% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 83% |
all | 9% |
load | 2% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 33% |
all | 10% |
load | 12% |
store | 9% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 6% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 9% |
all | 14% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 22% |
all | 12% |
load | 12% |
store | 10% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 10% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x98,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x60(%RBP),%EBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x58(%RBP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %EBX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOVL $0,-0x54(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JS 44119f <field_summary_kernel_module_mp_field_summary_kernel_.DIR.OMP.PARALLEL.2+0x8df> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RCX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVL $0,-0x3c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %EAX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVL $0x1,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x50(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x54(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x3c(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x38(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x74d290,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,-0x4c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x22,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
CALL 4044c0 <__kmpc_for_static_init_4@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x20,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x3c(%RBP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%R8D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM2,%XMM2,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM3,%XMM3,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM4,%XMM4,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SUB %ESI,%R8D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 440a80 <field_summary_kernel_module_mp_field_summary_kernel_.DIR.OMP.PARALLEL.2+0x1c0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x20(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD %XMM4,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD %XMM3,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD %XMM2,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD %XMM0,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD %XMM1,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x74d2b0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x4c(%RBP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4040b0 <__kmpc_for_static_fini@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x80(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x74d370,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4411c0,%R9D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x5,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x28,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x75433c | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
CALL 4046a0 <__kmpc_reduce@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x10,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP $0x2,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 441100 <field_summary_kernel_module_mp_field_summary_kernel_.DIR.OMP.PARALLEL.2+0x840> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP $0x1,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x30(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 44119f <field_summary_kernel_module_mp_field_summary_kernel_.DIR.OMP.PARALLEL.2+0x8df> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD -0x80(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%R15),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM0,(%R15) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD -0x78(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%R14),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM0,(%R14) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD -0x70(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x88(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RAX),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM0,(%RAX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD -0x68(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%R13),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM0,(%R13) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD -0x60(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x90(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RAX),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM0,(%RAX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x74d390,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JMP 441191 <field_summary_kernel_module_mp_field_summary_kernel_.DIR.OMP.PARALLEL.2+0x8d1> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xa0(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %EBX,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD $-0x2,%R14D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOVSXD %R14D,%RAX | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
MOV %RAX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $-0x2,%R13D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOVSXD %R13D,%RAX | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
MOV %RAX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVDQA64 0xc92d1(%RIP),%ZMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.50 |
VPBROADCASTQ 0xca26f(%RIP),%ZMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0xca25d(%RIP),%ZMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
MOV 0x28(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
XOR %R13D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8D,-0x34(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 440c01 <field_summary_kernel_module_mp_field_summary_kernel_.DIR.OMP.PARALLEL.2+0x341> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x30(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 44119f <field_summary_kernel_module_mp_field_summary_kernel_.DIR.OMP.PARALLEL.2+0x8df> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD -0x80(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x74d2d0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R15,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4041b0 <__kmpc_atomic_float8_add@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD -0x78(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x74d2f0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R14,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4041b0 <__kmpc_atomic_float8_add@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD -0x70(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x74d310,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x88(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 4041b0 <__kmpc_atomic_float8_add@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD -0x68(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x74d330,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4041b0 <__kmpc_atomic_float8_add@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD -0x60(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x74d350,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x90(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 4041b0 <__kmpc_atomic_float8_add@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x74d3b0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x75433c,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 404820 <__kmpc_end_reduce@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x30(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x74d3d0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 404580 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x98,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | field_summary_kernel.f90:54-74 |
Module | exec |
nb instructions | 168 |
nb uops | 179 |
loop length | 803 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 5 |
used ymm registers | 0 |
used zmm registers | 3 |
nb stack references | 24 |
micro-operation queue | 29.83 cycles |
front end | 29.83 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 7.60 | 7.70 | 19.33 | 19.33 | 21.00 | 7.50 | 7.60 | 21.00 | 21.00 | 21.00 | 7.60 | 19.33 |
cycles | 7.60 | 7.70 | 19.33 | 19.33 | 21.00 | 7.50 | 7.60 | 21.00 | 21.00 | 21.00 | 7.60 | 19.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 28.17 |
Stall cycles | 0.00 |
Front-end | 29.83 |
Dispatch | 21.00 |
Overall L1 | 29.83 |
all | 4% |
load | 5% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 8% |
all | 16% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 83% |
all | 9% |
load | 2% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 33% |
all | 10% |
load | 12% |
store | 9% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 6% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 9% |
all | 14% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 22% |
all | 12% |
load | 12% |
store | 10% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 10% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x98,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x60(%RBP),%EBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x58(%RBP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %EBX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOVL $0,-0x54(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JS 44119f <field_summary_kernel_module_mp_field_summary_kernel_.DIR.OMP.PARALLEL.2+0x8df> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RCX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVL $0,-0x3c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %EAX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVL $0x1,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x50(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x54(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x3c(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x38(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x74d290,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,-0x4c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x22,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
CALL 4044c0 <__kmpc_for_static_init_4@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x20,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x3c(%RBP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%R8D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM2,%XMM2,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM3,%XMM3,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM4,%XMM4,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SUB %ESI,%R8D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 440a80 <field_summary_kernel_module_mp_field_summary_kernel_.DIR.OMP.PARALLEL.2+0x1c0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x20(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD %XMM4,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD %XMM3,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD %XMM2,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD %XMM0,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD %XMM1,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x74d2b0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x4c(%RBP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 4040b0 <__kmpc_for_static_fini@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x80(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x74d370,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4411c0,%R9D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x5,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x28,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x75433c | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
CALL 4046a0 <__kmpc_reduce@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x10,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP $0x2,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 441100 <field_summary_kernel_module_mp_field_summary_kernel_.DIR.OMP.PARALLEL.2+0x840> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP $0x1,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x30(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 44119f <field_summary_kernel_module_mp_field_summary_kernel_.DIR.OMP.PARALLEL.2+0x8df> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD -0x80(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%R15),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM0,(%R15) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD -0x78(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%R14),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM0,(%R14) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD -0x70(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x88(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RAX),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM0,(%RAX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD -0x68(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%R13),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM0,(%R13) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD -0x60(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x90(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RAX),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM0,(%RAX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x74d390,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JMP 441191 <field_summary_kernel_module_mp_field_summary_kernel_.DIR.OMP.PARALLEL.2+0x8d1> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xa0(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %EBX,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD $-0x2,%R14D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOVSXD %R14D,%RAX | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
MOV %RAX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $-0x2,%R13D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOVSXD %R13D,%RAX | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
MOV %RAX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVDQA64 0xc92d1(%RIP),%ZMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.50 |
VPBROADCASTQ 0xca26f(%RIP),%ZMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0xca25d(%RIP),%ZMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
MOV 0x28(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
XOR %R13D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8D,-0x34(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 440c01 <field_summary_kernel_module_mp_field_summary_kernel_.DIR.OMP.PARALLEL.2+0x341> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x30(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 44119f <field_summary_kernel_module_mp_field_summary_kernel_.DIR.OMP.PARALLEL.2+0x8df> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD -0x80(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x74d2d0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R15,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4041b0 <__kmpc_atomic_float8_add@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD -0x78(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x74d2f0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R14,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4041b0 <__kmpc_atomic_float8_add@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD -0x70(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x74d310,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x88(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 4041b0 <__kmpc_atomic_float8_add@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD -0x68(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x74d330,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4041b0 <__kmpc_atomic_float8_add@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD -0x60(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x74d350,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x90(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 4041b0 <__kmpc_atomic_float8_add@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x74d3b0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x75433c,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 404820 <__kmpc_end_reduce@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x30(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x74d3d0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 404580 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x98,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼field_summary_kernel_.DIR.OMP.PARALLEL.2– | 0.29 | 0.09 |
▼Loop 333 - field_summary_kernel.f90:56-71 - exec– | 0 | 0 |
○Loop 334 - field_summary_kernel.f90:58-71 - exec | 0.29 | 0.09 |
○Loop 335 - field_summary_kernel.f90:58-71 - exec | 0 | 0 |