Function: field_summary_kernel_.DIR.OMP.PARALLEL.2 | Module: exec | Source: field_summary_kernel.f90:54-74 | Coverage: 0.31% |
---|
Function: field_summary_kernel_.DIR.OMP.PARALLEL.2 | Module: exec | Source: field_summary_kernel.f90:54-74 | Coverage: 0.31% |
---|
/home/eoseret/qaas_runs_CPU_9468/171-137-7698/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/field_summary_kernel.f90: 54 - 74 |
-------------------------------------------------------------------------------- |
54: !$OMP PARALLEL |
55: !$OMP DO PRIVATE(vsqrd,cell_vol,cell_mass) REDUCTION(+ : vol,mass,press,ie,ke) |
56: DO k=y_min,y_max |
57: !$OMP SIMD |
58: DO j=x_min,x_max |
59: vsqrd=0.0 |
60: DO kv=k,k+1 |
61: DO jv=j,j+1 |
62: vsqrd=vsqrd+0.25*(xvel0(jv,kv)**2+yvel0(jv,kv)**2) |
63: ENDDO |
64: ENDDO |
65: cell_vol=volume(j,k) |
66: cell_mass=cell_vol*density0(j,k) |
67: vol=vol+cell_vol |
68: mass=mass+cell_mass |
69: ie=ie+cell_mass*energy0(j,k) |
70: ke=ke+cell_mass*0.5*vsqrd |
71: press=press+cell_vol*pressure(j,k) |
72: ENDDO |
73: ENDDO |
74: !$OMP END DO |
0x440a40 PUSH %RBP |
0x440a41 MOV %RSP,%RBP |
0x440a44 PUSH %R15 |
0x440a46 PUSH %R14 |
0x440a48 PUSH %R13 |
0x440a4a PUSH %R12 |
0x440a4c PUSH %RBX |
0x440a4d SUB $0x98,%RSP |
0x440a54 MOV %R9,-0x90(%RBP) |
0x440a5b MOV %R8,-0x88(%RBP) |
0x440a62 MOV 0x60(%RBP),%EBX |
0x440a65 MOV 0x58(%RBP),%EAX |
0x440a68 SUB %EBX,%EAX |
0x440a6a MOVL $0,-0x54(%RBP) |
0x440a71 JS 44131f |
0x440a77 MOV %RCX,%R14 |
0x440a7a MOV %RDX,%R13 |
0x440a7d MOV %RDI,-0x30(%RBP) |
0x440a81 MOV (%RDI),%ESI |
0x440a83 MOVL $0,-0x3c(%RBP) |
0x440a8a MOV %EAX,-0x38(%RBP) |
0x440a8d MOVL $0x1,-0x50(%RBP) |
0x440a94 SUB $0x8,%RSP |
0x440a98 LEA -0x50(%RBP),%RAX |
0x440a9c LEA -0x54(%RBP),%RCX |
0x440aa0 LEA -0x3c(%RBP),%R8 |
0x440aa4 LEA -0x38(%RBP),%R9 |
0x440aa8 MOV $0x54d290,%EDI |
0x440aad MOV %ESI,-0x4c(%RBP) |
0x440ab0 MOV $0x22,%EDX |
0x440ab5 PUSH $0x1 |
0x440ab7 PUSH $0x1 |
0x440ab9 PUSH %RAX |
0x440aba CALL 404670 <__kmpc_for_static_init_4@plt> |
0x440abf ADD $0x20,%RSP |
0x440ac3 MOV -0x3c(%RBP),%ESI |
0x440ac6 MOV -0x38(%RBP),%R8D |
0x440aca VXORPD %XMM1,%XMM1,%XMM1 |
0x440ace VXORPD %XMM0,%XMM0,%XMM0 |
0x440ad2 VXORPD %XMM2,%XMM2,%XMM2 |
0x440ad6 VXORPD %XMM3,%XMM3,%XMM3 |
0x440ada VXORPD %XMM4,%XMM4,%XMM4 |
0x440ade SUB %ESI,%R8D |
0x440ae1 JAE 440c00 |
0x440ae7 MOV 0x20(%RBP),%R15 |
0x440aeb MOV 0x18(%RBP),%R14 |
0x440aef MOV 0x10(%RBP),%R13 |
0x440af3 VMOVSD %XMM4,-0x80(%RBP) |
0x440af8 VMOVSD %XMM3,-0x78(%RBP) |
0x440afd VMOVSD %XMM2,-0x70(%RBP) |
0x440b02 VMOVSD %XMM0,-0x68(%RBP) |
0x440b07 VMOVSD %XMM1,-0x60(%RBP) |
0x440b0c MOV $0x54d2b0,%EDI |
0x440b11 MOV -0x4c(%RBP),%ESI |
0x440b14 VZEROUPPER |
0x440b17 CALL 404230 <__kmpc_for_static_fini@plt> |
0x440b1c MOV -0x30(%RBP),%RAX |
0x440b20 MOV (%RAX),%ESI |
0x440b22 SUB $0x8,%RSP |
0x440b26 LEA -0x80(%RBP),%R8 |
0x440b2a MOV $0x54d370,%EDI |
0x440b2f MOV $0x441340,%R9D |
0x440b35 MOV $0x5,%EDX |
0x440b3a MOV $0x28,%ECX |
0x440b3f PUSH $0x55433c |
0x440b44 CALL 404830 <__kmpc_reduce@plt> |
0x440b49 ADD $0x10,%RSP |
0x440b4d CMP $0x2,%EAX |
0x440b50 JGE 441280 |
0x440b56 CMP $0x1,%EAX |
0x440b59 MOV -0x30(%RBP),%RDI |
0x440b5d JNE 44131f |
0x440b63 VMOVSD -0x80(%RBP),%XMM0 |
0x440b68 VADDSD (%R15),%XMM0,%XMM0 |
0x440b6d VMOVSD %XMM0,(%R15) |
0x440b72 VMOVSD -0x78(%RBP),%XMM0 |
0x440b77 VADDSD (%R14),%XMM0,%XMM0 |
0x440b7c VMOVSD %XMM0,(%R14) |
0x440b81 VMOVSD -0x70(%RBP),%XMM0 |
0x440b86 MOV -0x88(%RBP),%RAX |
0x440b8d VADDSD (%RAX),%XMM0,%XMM0 |
0x440b91 VMOVSD %XMM0,(%RAX) |
0x440b95 VMOVSD -0x68(%RBP),%XMM0 |
0x440b9a VADDSD (%R13),%XMM0,%XMM0 |
0x440ba0 VMOVSD %XMM0,(%R13) |
0x440ba6 VMOVSD -0x60(%RBP),%XMM0 |
0x440bab MOV -0x90(%RBP),%RAX |
0x440bb2 VADDSD (%RAX),%XMM0,%XMM0 |
0x440bb6 VMOVSD %XMM0,(%RAX) |
0x440bba MOV (%RDI),%ESI |
0x440bbc MOV $0x54d390,%EDI |
0x440bc1 JMP 441311 |
0x440bc6 NOPW %CS:(%RAX,%RAX,1) |
0x440bd5 NOPW %CS:(%RAX,%RAX,1) |
0x440be4 NOPW %CS:(%RAX,%RAX,1) |
0x440bf3 NOPW %CS:(%RAX,%RAX,1) |
0x440c00 MOV 0xa0(%RBP),%R9 |
0x440c07 ADD %EBX,%ESI |
0x440c09 ADD $-0x2,%R14D |
0x440c0d MOVSXD %R14D,%RAX |
0x440c10 MOV %RAX,-0x98(%RBP) |
0x440c17 ADD $-0x2,%R13D |
0x440c1b MOVSXD %R13D,%RAX |
0x440c1e MOV %RAX,-0xa8(%RBP) |
0x440c25 VMOVDQA64 0xc9b11(%RIP),%ZMM5 |
0x440c2f VPBROADCASTQ 0xcaaaf(%RIP),%ZMM6 |
0x440c39 VBROADCASTSD 0xcaa9d(%RIP),%ZMM7 |
0x440c43 MOV 0x28(%RBP),%R10 |
0x440c47 XOR %R13D,%R13D |
0x440c4a MOV %RSI,-0xa0(%RBP) |
0x440c51 MOV %R8D,-0x34(%RBP) |
0x440c55 JMP 440d81 |
0x440c5a NOPW %CS:(%RAX,%RAX,1) |
0x440c69 NOPW %CS:(%RAX,%RAX,1) |
0x440c78 NOPL (%RAX,%RAX,1) |
(333) 0x440c80 VEXTRACTF64X4 $0x1,%ZMM13,%YMM9 |
(333) 0x440c87 VADDPD %ZMM9,%ZMM13,%ZMM9 |
(333) 0x440c8d VMOVAPD %XMM9,%XMM13 |
(333) 0x440c92 VEXTRACTF128 $0x1,%YMM9,%XMM9 |
(333) 0x440c98 VADDPD %XMM9,%XMM13,%XMM9 |
(333) 0x440c9d VSHUFPD $0x1,%XMM9,%XMM9,%XMM13 |
(333) 0x440ca3 VADDSD %XMM13,%XMM9,%XMM9 |
(333) 0x440ca8 VADDSD %XMM2,%XMM9,%XMM2 |
(333) 0x440cac VEXTRACTF64X4 $0x1,%ZMM12,%YMM9 |
(333) 0x440cb3 VADDPD %ZMM9,%ZMM12,%ZMM9 |
(333) 0x440cb9 VMOVAPD %XMM9,%XMM12 |
(333) 0x440cbe VEXTRACTF128 $0x1,%YMM9,%XMM9 |
(333) 0x440cc4 VADDPD %XMM9,%XMM12,%XMM9 |
(333) 0x440cc9 VSHUFPD $0x1,%XMM9,%XMM9,%XMM12 |
(333) 0x440ccf VADDSD %XMM12,%XMM9,%XMM9 |
(333) 0x440cd4 VADDSD %XMM1,%XMM9,%XMM1 |
(333) 0x440cd8 VEXTRACTF64X4 $0x1,%ZMM11,%YMM9 |
(333) 0x440cdf VADDPD %ZMM9,%ZMM11,%ZMM9 |
(333) 0x440ce5 VMOVAPD %XMM9,%XMM11 |
(333) 0x440cea VEXTRACTF128 $0x1,%YMM9,%XMM9 |
(333) 0x440cf0 VADDPD %XMM9,%XMM11,%XMM9 |
(333) 0x440cf5 VSHUFPD $0x1,%XMM9,%XMM9,%XMM11 |
(333) 0x440cfb VADDSD %XMM11,%XMM9,%XMM9 |
(333) 0x440d00 VADDSD %XMM0,%XMM9,%XMM0 |
(333) 0x440d04 VEXTRACTF64X4 $0x1,%ZMM10,%YMM9 |
(333) 0x440d0b VADDPD %ZMM9,%ZMM10,%ZMM9 |
(333) 0x440d11 VMOVAPD %XMM9,%XMM10 |
(333) 0x440d16 VEXTRACTF128 $0x1,%YMM9,%XMM9 |
(333) 0x440d1c VADDPD %XMM9,%XMM10,%XMM9 |
(333) 0x440d21 VSHUFPD $0x1,%XMM9,%XMM9,%XMM10 |
(333) 0x440d27 VADDSD %XMM10,%XMM9,%XMM9 |
(333) 0x440d2c VADDSD %XMM3,%XMM9,%XMM3 |
(333) 0x440d30 VEXTRACTF64X4 $0x1,%ZMM8,%YMM9 |
(333) 0x440d37 VADDPD %ZMM9,%ZMM8,%ZMM8 |
(333) 0x440d3d VMOVAPD %XMM8,%XMM9 |
(333) 0x440d42 VEXTRACTF128 $0x1,%YMM8,%XMM8 |
(333) 0x440d48 VADDPD %XMM8,%XMM9,%XMM8 |
(333) 0x440d4d VSHUFPD $0x1,%XMM8,%XMM8,%XMM9 |
(333) 0x440d53 VADDSD %XMM9,%XMM8,%XMM8 |
(333) 0x440d58 VADDSD %XMM4,%XMM8,%XMM4 |
(333) 0x440d5c MOV 0x28(%RBP),%R10 |
(333) 0x440d60 MOV -0xa0(%RBP),%RSI |
(333) 0x440d67 MOV -0x34(%RBP),%R8D |
(333) 0x440d6b MOV -0xb8(%RBP),%RCX |
(333) 0x440d72 LEA 0x1(%RCX),%EAX |
(333) 0x440d75 CMP %R8D,%ECX |
(333) 0x440d78 MOV %EAX,%R13D |
(333) 0x440d7b JE 440ae7 |
(333) 0x440d81 MOV 0x70(%RBP),%RAX |
(333) 0x440d85 MOV (%RAX),%EDX |
(333) 0x440d87 MOV 0x68(%RBP),%RAX |
(333) 0x440d8b MOV (%RAX),%EDI |
(333) 0x440d8d SUB %EDX,%EDI |
(333) 0x440d8f MOV %R13,-0xb8(%RBP) |
(333) 0x440d96 JS 440d6b |
(333) 0x440d98 LEA (%RSI,%R13,1),%R8D |
(333) 0x440d9c MOV 0x78(%RBP),%RAX |
(333) 0x440da0 MOV (%RAX),%R14 |
(333) 0x440da3 MOV 0x80(%RBP),%RAX |
(333) 0x440daa MOV (%RAX),%R11 |
(333) 0x440dad MOV 0x88(%RBP),%RAX |
(333) 0x440db4 MOV (%RAX),%R15 |
(333) 0x440db7 MOV 0x90(%RBP),%RAX |
(333) 0x440dbe MOV (%RAX),%RAX |
(333) 0x440dc1 MOV 0x98(%RBP),%RCX |
(333) 0x440dc8 MOV (%RCX),%RCX |
(333) 0x440dcb VPBROADCASTD %EDX,%YMM8 |
(333) 0x440dd1 MOV (%R9),%R12 |
(333) 0x440dd4 INC %EDI |
(333) 0x440dd6 CMP $0x2,%EDI |
(333) 0x440dd9 MOV $0x1,%EDX |
(333) 0x440dde CMOVL %EDX,%EDI |
(333) 0x440de1 MOVSXD %R8D,%RDX |
(333) 0x440de4 CMP $0x8,%EDI |
(333) 0x440de7 JAE 440e00 |
(333) 0x440de9 MOVQ $0,-0x48(%RBP) |
(333) 0x440df1 MOV 0x38(%RBP),%R13 |
(333) 0x440df5 JMP 44108b |
0x440dfa NOPW (%RAX,%RAX,1) |
(333) 0x440e00 MOV %RDI,-0xb0(%RBP) |
(333) 0x440e07 AND $0x7ffffff8,%EDI |
(333) 0x440e0d MOV %RDI,-0x48(%RBP) |
(333) 0x440e11 VXORPD %XMM13,%XMM13,%XMM13 |
(333) 0x440e16 VPMOVSXDQ %XMM8,%XMM14 |
(333) 0x440e1b VXORPD %XMM12,%XMM12,%XMM12 |
(333) 0x440e20 VXORPD %XMM11,%XMM11,%XMM11 |
(333) 0x440e25 VXORPD %XMM10,%XMM10,%XMM10 |
(333) 0x440e2a VXORPD %XMM9,%XMM9,%XMM9 |
(333) 0x440e2f XOR %EBX,%EBX |
(333) 0x440e31 VMOVDQA64 %ZMM5,%ZMM15 |
(333) 0x440e37 MOV -0x98(%RBP),%RDI |
(333) 0x440e3e MOV 0x30(%RBP),%RSI |
(333) 0x440e42 NOPW %CS:(%RAX,%RAX,1) |
(334) 0x440e50 MOV %RDX,%R13 |
(334) 0x440e53 SUB -0xa8(%RBP),%RDX |
(334) 0x440e5a MOV %R14,%R9 |
(334) 0x440e5d IMUL %RDX,%R9 |
(334) 0x440e61 ADD %RSI,%R9 |
(334) 0x440e64 VMOVDQA64 %XMM15,%XMM16 |
(334) 0x440e6a VPADDQ %XMM14,%XMM15,%XMM16 |
(334) 0x440e70 VMOVQ %XMM16,%R8 |
(334) 0x440e76 SUB %RDI,%R8 |
(334) 0x440e79 VMOVUPD (%R9,%R8,8),%ZMM16 |
(334) 0x440e80 VMOVUPD 0x8(%R9,%R8,8),%ZMM17 |
(334) 0x440e8b MOV %R11,%R9 |
(334) 0x440e8e IMUL %RDX,%R9 |
(334) 0x440e92 ADD %R10,%R9 |
(334) 0x440e95 VMOVUPD (%R9,%R8,8),%ZMM18 |
(334) 0x440e9c VMOVUPD 0x8(%R9,%R8,8),%ZMM19 |
(334) 0x440ea7 LEA 0x1(%RDX),%R9 |
(334) 0x440eab MOV %R14,%R10 |
(334) 0x440eae IMUL %R9,%R10 |
(334) 0x440eb2 ADD %RSI,%R10 |
(334) 0x440eb5 VMOVUPD (%R10,%R8,8),%ZMM20 |
(334) 0x440ebc VMOVUPD 0x8(%R10,%R8,8),%ZMM21 |
(334) 0x440ec7 MOV %R15,%R10 |
(334) 0x440eca IMUL %RDX,%R10 |
(334) 0x440ece ADD 0x50(%RBP),%R10 |
(334) 0x440ed2 VMOVUPD (%R10,%R8,8),%ZMM22 |
(334) 0x440ed9 MOV %RAX,%R10 |
(334) 0x440edc IMUL %RDX,%R10 |
(334) 0x440ee0 ADD 0x48(%RBP),%R10 |
(334) 0x440ee4 VMULPD (%R10,%R8,8),%ZMM22,%ZMM23 |
(334) 0x440eeb MOV 0x28(%RBP),%R10 |
(334) 0x440eef IMUL %R11,%R9 |
(334) 0x440ef3 ADD %R10,%R9 |
(334) 0x440ef6 VMOVUPD (%R9,%R8,8),%ZMM24 |
(334) 0x440efd VMOVUPD 0x8(%R9,%R8,8),%ZMM25 |
(334) 0x440f08 MOV %RCX,%R9 |
(334) 0x440f0b IMUL %RDX,%R9 |
(334) 0x440f0f ADD 0x40(%RBP),%R9 |
(334) 0x440f13 VFMADD231PD (%R9,%R8,8),%ZMM23,%ZMM11 |
(334) 0x440f1a IMUL %R12,%RDX |
(334) 0x440f1e ADD 0x38(%RBP),%RDX |
(334) 0x440f22 VFMADD231PD (%RDX,%R8,8),%ZMM22,%ZMM13 |
(334) 0x440f29 MOV %R13,%RDX |
(334) 0x440f2c VMULPD %ZMM16,%ZMM16,%ZMM16 |
(334) 0x440f32 VFMADD213PD %ZMM16,%ZMM18,%ZMM18 |
(334) 0x440f38 VFMADD231PD %ZMM17,%ZMM17,%ZMM18 |
(334) 0x440f3e VFMADD231PD %ZMM19,%ZMM19,%ZMM18 |
(334) 0x440f44 VFMADD213PD %ZMM18,%ZMM20,%ZMM20 |
(334) 0x440f4a VFMADD213PD %ZMM20,%ZMM24,%ZMM24 |
(334) 0x440f50 VFMADD231PD %ZMM21,%ZMM21,%ZMM24 |
(334) 0x440f56 VFMADD231PD %ZMM25,%ZMM25,%ZMM24 |
(334) 0x440f5c VADDPD %ZMM22,%ZMM9,%ZMM9 |
(334) 0x440f62 VADDPD %ZMM23,%ZMM10,%ZMM10 |
(334) 0x440f68 VMULPD %ZMM24,%ZMM23,%ZMM16 |
(334) 0x440f6e VFMADD231PD %ZMM7,%ZMM16,%ZMM12 |
(334) 0x440f74 VPADDQ %ZMM6,%ZMM15,%ZMM15 |
(334) 0x440f7a ADD $0x8,%RBX |
(334) 0x440f7e CMP -0x48(%RBP),%RBX |
(334) 0x440f82 JB 440e50 |
(333) 0x440f88 VEXTRACTF64X4 $0x1,%ZMM13,%YMM14 |
(333) 0x440f8f VADDPD %ZMM14,%ZMM13,%ZMM13 |
(333) 0x440f95 VMOVAPD %XMM13,%XMM14 |
(333) 0x440f9a VEXTRACTF128 $0x1,%YMM13,%XMM13 |
(333) 0x440fa0 VADDPD %XMM13,%XMM14,%XMM13 |
(333) 0x440fa5 VSHUFPD $0x1,%XMM13,%XMM13,%XMM14 |
(333) 0x440fab VADDSD %XMM14,%XMM13,%XMM13 |
(333) 0x440fb0 VADDSD %XMM2,%XMM13,%XMM2 |
(333) 0x440fb4 VEXTRACTF64X4 $0x1,%ZMM12,%YMM13 |
(333) 0x440fbb VADDPD %ZMM13,%ZMM12,%ZMM12 |
(333) 0x440fc1 VMOVAPD %XMM12,%XMM13 |
(333) 0x440fc6 VEXTRACTF128 $0x1,%YMM12,%XMM12 |
(333) 0x440fcc VADDPD %XMM12,%XMM13,%XMM12 |
(333) 0x440fd1 VSHUFPD $0x1,%XMM12,%XMM12,%XMM13 |
(333) 0x440fd7 VADDSD %XMM13,%XMM12,%XMM12 |
(333) 0x440fdc VADDSD %XMM1,%XMM12,%XMM1 |
(333) 0x440fe0 VEXTRACTF64X4 $0x1,%ZMM11,%YMM12 |
(333) 0x440fe7 VADDPD %ZMM12,%ZMM11,%ZMM11 |
(333) 0x440fed VMOVAPD %XMM11,%XMM12 |
(333) 0x440ff2 VEXTRACTF128 $0x1,%YMM11,%XMM11 |
(333) 0x440ff8 VADDPD %XMM11,%XMM12,%XMM11 |
(333) 0x440ffd VSHUFPD $0x1,%XMM11,%XMM11,%XMM12 |
(333) 0x441003 VADDSD %XMM12,%XMM11,%XMM11 |
(333) 0x441008 VADDSD %XMM0,%XMM11,%XMM0 |
(333) 0x44100c VEXTRACTF64X4 $0x1,%ZMM10,%YMM11 |
(333) 0x441013 VADDPD %ZMM11,%ZMM10,%ZMM10 |
(333) 0x441019 VMOVAPD %XMM10,%XMM11 |
(333) 0x44101e VEXTRACTF128 $0x1,%YMM10,%XMM10 |
(333) 0x441024 VADDPD %XMM10,%XMM11,%XMM10 |
(333) 0x441029 VSHUFPD $0x1,%XMM10,%XMM10,%XMM11 |
(333) 0x44102f VADDSD %XMM11,%XMM10,%XMM10 |
(333) 0x441034 VADDSD %XMM3,%XMM10,%XMM3 |
(333) 0x441038 VEXTRACTF64X4 $0x1,%ZMM9,%YMM10 |
(333) 0x44103f VADDPD %ZMM10,%ZMM9,%ZMM9 |
(333) 0x441045 VMOVAPD %XMM9,%XMM10 |
(333) 0x44104a VEXTRACTF128 $0x1,%YMM9,%XMM9 |
(333) 0x441050 VADDPD %XMM9,%XMM10,%XMM9 |
(333) 0x441055 VSHUFPD $0x1,%XMM9,%XMM9,%XMM10 |
(333) 0x44105b VADDSD %XMM10,%XMM9,%XMM9 |
(333) 0x441060 VADDSD %XMM4,%XMM9,%XMM4 |
(333) 0x441064 MOV -0xb0(%RBP),%RDI |
(333) 0x44106b CMP %RDI,-0x48(%RBP) |
(333) 0x44106f MOV -0xa0(%RBP),%RSI |
(333) 0x441076 MOV -0x34(%RBP),%R8D |
(333) 0x44107a MOV 0xa0(%RBP),%R9 |
(333) 0x441081 MOV 0x38(%RBP),%R13 |
(333) 0x441085 JE 440d6b |
(333) 0x44108b MOV -0x48(%RBP),%RSI |
(333) 0x44108f VMOVQ %RSI,%XMM10 |
(333) 0x441094 SUB %RSI,%RDI |
(333) 0x441097 VPBROADCASTQ %RDI,%ZMM9 |
(333) 0x44109d MOV %R10,%R8 |
(333) 0x4410a0 MOV -0xa8(%RBP),%RSI |
(333) 0x4410a7 SUB %RSI,%RDX |
(333) 0x4410aa MOV %R14,%RSI |
(333) 0x4410ad MOV %R11,%RDI |
(333) 0x4410b0 LEA 0x1(%RDX),%RBX |
(333) 0x4410b4 IMUL %RBX,%R14 |
(333) 0x4410b8 IMUL %RBX,%R11 |
(333) 0x4410bc IMUL %RDX,%RSI |
(333) 0x4410c0 IMUL %RDX,%RDI |
(333) 0x4410c4 IMUL %RDX,%R15 |
(333) 0x4410c8 IMUL %RDX,%RAX |
(333) 0x4410cc IMUL %RDX,%RCX |
(333) 0x4410d0 IMUL %RDX,%R12 |
(333) 0x4410d4 VXORPD %XMM13,%XMM13,%XMM13 |
(333) 0x4410d9 MOV 0x30(%RBP),%RDX |
(333) 0x4410dd ADD %RDX,%RSI |
(333) 0x4410e0 VMOVDQA %XMM10,%XMM14 |
(333) 0x4410e5 VPMOVSXDQ %XMM8,%XMM15 |
(333) 0x4410ea ADD %R10,%RDI |
(333) 0x4410ed ADD %RDX,%R14 |
(333) 0x4410f0 ADD %R10,%R11 |
(333) 0x4410f3 ADD 0x50(%RBP),%R15 |
(333) 0x4410f7 ADD 0x48(%RBP),%RAX |
(333) 0x4410fb ADD 0x40(%RBP),%RCX |
(333) 0x4410ff ADD %R13,%R12 |
(333) 0x441102 VXORPD %XMM12,%XMM12,%XMM12 |
(333) 0x441107 VXORPD %XMM11,%XMM11,%XMM11 |
(333) 0x44110c VPXOR %XMM10,%XMM10,%XMM10 |
(333) 0x441111 VPXOR %XMM8,%XMM8,%XMM8 |
(333) 0x441116 VMOVDQA64 %ZMM5,%ZMM16 |
(333) 0x44111c MOV -0x98(%RBP),%R13 |
(333) 0x441123 JMP 441175 |
0x441125 NOPW %CS:(%RAX,%RAX,1) |
0x441134 NOPW %CS:(%RAX,%RAX,1) |
(335) 0x441140 VMOVAPD %ZMM17,%ZMM8{%K1} |
(335) 0x441146 VMOVAPD %ZMM18,%ZMM10{%K1} |
(335) 0x44114c VMOVAPD %ZMM19,%ZMM11{%K1} |
(335) 0x441152 VMOVAPD %ZMM20,%ZMM12{%K1} |
(335) 0x441158 VMOVAPD %ZMM21,%ZMM13{%K1} |
(335) 0x44115e VPADDQ %ZMM6,%ZMM16,%ZMM16 |
(335) 0x441164 VPCMPLTUQ %ZMM9,%ZMM16,%K0 |
(335) 0x44116b KORTESTB %K0,%K0 |
(335) 0x44116f JE 440c80 |
(335) 0x441175 VPCMPLTUQ %ZMM9,%ZMM16,%K1 |
(335) 0x44117c KORTESTB %K1,%K1 |
(335) 0x441180 VXORPD %XMM17,%XMM17,%XMM17 |
(335) 0x441186 VXORPD %XMM18,%XMM18,%XMM18 |
(335) 0x44118c VXORPD %XMM19,%XMM19,%XMM19 |
(335) 0x441192 VXORPD %XMM20,%XMM20,%XMM20 |
(335) 0x441198 VXORPD %XMM21,%XMM21,%XMM21 |
(335) 0x44119e JE 441140 |
(335) 0x4411a0 VMOVDQA64 %XMM16,%XMM17 |
(335) 0x4411a6 VPADDQ %XMM14,%XMM16,%XMM17 |
(335) 0x4411ac VPADDQ %XMM15,%XMM17,%XMM17 |
(335) 0x4411b2 VMOVQ %XMM17,%RDX |
(335) 0x4411b8 SUB %R13,%RDX |
(335) 0x4411bb VMOVUPD (%RSI,%RDX,8),%ZMM17{%K1}{z} |
(335) 0x4411c2 VMULPD %ZMM17,%ZMM17,%ZMM17 |
(335) 0x4411c8 VMOVUPD (%RDI,%RDX,8),%ZMM18{%K1}{z} |
(335) 0x4411cf VMOVUPD 0x8(%RSI,%RDX,8),%ZMM19{%K1}{z} |
(335) 0x4411da VMOVUPD 0x8(%RDI,%RDX,8),%ZMM20{%K1}{z} |
(335) 0x4411e5 VFMADD213PD %ZMM17,%ZMM18,%ZMM18 |
(335) 0x4411eb VFMADD213PD %ZMM18,%ZMM19,%ZMM19 |
(335) 0x4411f1 VMOVUPD (%R14,%RDX,8),%ZMM17{%K1}{z} |
(335) 0x4411f8 VMOVUPD (%R11,%RDX,8),%ZMM18{%K1}{z} |
(335) 0x4411ff VFMADD231PD %ZMM20,%ZMM20,%ZMM19 |
(335) 0x441205 VFMADD213PD %ZMM19,%ZMM17,%ZMM17 |
(335) 0x44120b VMOVUPD 0x8(%R14,%RDX,8),%ZMM20{%K1}{z} |
(335) 0x441216 VMOVUPD 0x8(%R11,%RDX,8),%ZMM19{%K1}{z} |
(335) 0x441221 VFMADD231PD %ZMM18,%ZMM18,%ZMM17 |
(335) 0x441227 VFMADD213PD %ZMM17,%ZMM20,%ZMM20 |
(335) 0x44122d VMOVUPD (%R15,%RDX,8),%ZMM22{%K1}{z} |
(335) 0x441234 VMOVUPD (%RAX,%RDX,8),%ZMM17{%K1}{z} |
(335) 0x44123b VFMADD231PD %ZMM19,%ZMM19,%ZMM20 |
(335) 0x441241 VMULPD %ZMM22,%ZMM17,%ZMM21 |
(335) 0x441247 VADDPD %ZMM22,%ZMM8,%ZMM17 |
(335) 0x44124d VADDPD %ZMM21,%ZMM10,%ZMM18 |
(335) 0x441253 VMOVUPD (%RCX,%RDX,8),%ZMM19{%K1}{z} |
(335) 0x44125a VFMADD213PD %ZMM11,%ZMM21,%ZMM19 |
(335) 0x441260 VMULPD %ZMM20,%ZMM21,%ZMM20 |
(335) 0x441266 VFMADD132PD %ZMM7,%ZMM12,%ZMM20 |
(335) 0x44126c VMOVUPD (%R12,%RDX,8),%ZMM21{%K1}{z} |
(335) 0x441273 VFMADD213PD %ZMM13,%ZMM22,%ZMM21 |
(335) 0x441279 JMP 441140 |
0x44127e XCHG %AX,%AX |
0x441280 MOV -0x30(%RBP),%RDI |
0x441284 JNE 44131f |
0x44128a VMOVSD -0x80(%RBP),%XMM0 |
0x44128f MOV (%RDI),%ESI |
0x441291 MOV $0x54d2d0,%EDI |
0x441296 MOV %R15,%RDX |
0x441299 CALL 404330 <__kmpc_atomic_float8_add@plt> |
0x44129e VMOVSD -0x78(%RBP),%XMM0 |
0x4412a3 MOV -0x30(%RBP),%RAX |
0x4412a7 MOV (%RAX),%ESI |
0x4412a9 MOV $0x54d2f0,%EDI |
0x4412ae MOV %R14,%RDX |
0x4412b1 CALL 404330 <__kmpc_atomic_float8_add@plt> |
0x4412b6 VMOVSD -0x70(%RBP),%XMM0 |
0x4412bb MOV -0x30(%RBP),%RAX |
0x4412bf MOV (%RAX),%ESI |
0x4412c1 MOV $0x54d310,%EDI |
0x4412c6 MOV -0x88(%RBP),%RDX |
0x4412cd CALL 404330 <__kmpc_atomic_float8_add@plt> |
0x4412d2 VMOVSD -0x68(%RBP),%XMM0 |
0x4412d7 MOV -0x30(%RBP),%RAX |
0x4412db MOV (%RAX),%ESI |
0x4412dd MOV $0x54d330,%EDI |
0x4412e2 MOV %R13,%RDX |
0x4412e5 CALL 404330 <__kmpc_atomic_float8_add@plt> |
0x4412ea VMOVSD -0x60(%RBP),%XMM0 |
0x4412ef MOV -0x30(%RBP),%RAX |
0x4412f3 MOV (%RAX),%ESI |
0x4412f5 MOV $0x54d350,%EDI |
0x4412fa MOV -0x90(%RBP),%RDX |
0x441301 CALL 404330 <__kmpc_atomic_float8_add@plt> |
0x441306 MOV -0x30(%RBP),%RAX |
0x44130a MOV (%RAX),%ESI |
0x44130c MOV $0x54d3b0,%EDI |
0x441311 MOV $0x55433c,%EDX |
0x441316 CALL 4049b0 <__kmpc_end_reduce@plt> |
0x44131b MOV -0x30(%RBP),%RDI |
0x44131f MOV (%RDI),%ESI |
0x441321 MOV $0x54d3d0,%EDI |
0x441326 CALL 404740 <__kmpc_barrier@plt> |
0x44132b ADD $0x98,%RSP |
0x441332 POP %RBX |
0x441333 POP %R12 |
0x441335 POP %R13 |
0x441337 POP %R14 |
0x441339 POP %R15 |
0x44133b POP %RBP |
0x44133c RET |
0x44133d NOPL (%RAX) |
Path / |
Source file and lines | field_summary_kernel.f90:54-74 |
Module | exec |
nb instructions | 168 |
nb uops | 179 |
loop length | 803 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 5 |
used ymm registers | 0 |
used zmm registers | 3 |
nb stack references | 24 |
micro-operation queue | 29.83 cycles |
front end | 29.83 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 7.60 | 7.70 | 19.33 | 19.33 | 21.00 | 7.50 | 7.60 | 21.00 | 21.00 | 21.00 | 7.60 | 19.33 |
cycles | 7.60 | 7.70 | 19.33 | 19.33 | 21.00 | 7.50 | 7.60 | 21.00 | 21.00 | 21.00 | 7.60 | 19.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 28.17 |
Stall cycles | 0.00 |
Front-end | 29.83 |
Dispatch | 21.00 |
Overall L1 | 29.83 |
all | 4% |
load | 5% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 8% |
all | 16% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 83% |
all | 9% |
load | 2% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 33% |
all | 10% |
load | 12% |
store | 9% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 6% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 9% |
all | 14% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 22% |
all | 12% |
load | 12% |
store | 10% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 10% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x98,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x60(%RBP),%EBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x58(%RBP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %EBX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOVL $0,-0x54(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JS 44131f <field_summary_kernel_module_mp_field_summary_kernel_.DIR.OMP.PARALLEL.2+0x8df> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RCX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVL $0,-0x3c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %EAX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVL $0x1,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x50(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x54(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x3c(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x38(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x54d290,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,-0x4c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x22,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
CALL 404670 <__kmpc_for_static_init_4@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x20,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x3c(%RBP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%R8D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM2,%XMM2,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM3,%XMM3,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM4,%XMM4,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SUB %ESI,%R8D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 440c00 <field_summary_kernel_module_mp_field_summary_kernel_.DIR.OMP.PARALLEL.2+0x1c0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x20(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD %XMM4,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD %XMM3,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD %XMM2,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD %XMM0,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD %XMM1,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x54d2b0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x4c(%RBP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 404230 <__kmpc_for_static_fini@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x80(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x54d370,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x441340,%R9D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x5,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x28,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x55433c | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
CALL 404830 <__kmpc_reduce@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x10,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP $0x2,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 441280 <field_summary_kernel_module_mp_field_summary_kernel_.DIR.OMP.PARALLEL.2+0x840> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP $0x1,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x30(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 44131f <field_summary_kernel_module_mp_field_summary_kernel_.DIR.OMP.PARALLEL.2+0x8df> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD -0x80(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%R15),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM0,(%R15) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD -0x78(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%R14),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM0,(%R14) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD -0x70(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x88(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RAX),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM0,(%RAX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD -0x68(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%R13),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM0,(%R13) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD -0x60(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x90(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RAX),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM0,(%RAX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x54d390,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JMP 441311 <field_summary_kernel_module_mp_field_summary_kernel_.DIR.OMP.PARALLEL.2+0x8d1> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xa0(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %EBX,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD $-0x2,%R14D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOVSXD %R14D,%RAX | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
MOV %RAX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $-0x2,%R13D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOVSXD %R13D,%RAX | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
MOV %RAX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVDQA64 0xc9b11(%RIP),%ZMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.50 |
VPBROADCASTQ 0xcaaaf(%RIP),%ZMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0xcaa9d(%RIP),%ZMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
MOV 0x28(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
XOR %R13D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8D,-0x34(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 440d81 <field_summary_kernel_module_mp_field_summary_kernel_.DIR.OMP.PARALLEL.2+0x341> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x30(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 44131f <field_summary_kernel_module_mp_field_summary_kernel_.DIR.OMP.PARALLEL.2+0x8df> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD -0x80(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x54d2d0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R15,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 404330 <__kmpc_atomic_float8_add@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD -0x78(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x54d2f0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R14,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 404330 <__kmpc_atomic_float8_add@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD -0x70(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x54d310,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x88(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 404330 <__kmpc_atomic_float8_add@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD -0x68(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x54d330,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 404330 <__kmpc_atomic_float8_add@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD -0x60(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x54d350,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x90(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 404330 <__kmpc_atomic_float8_add@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x54d3b0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x55433c,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4049b0 <__kmpc_end_reduce@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x30(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x54d3d0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 404740 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x98,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | field_summary_kernel.f90:54-74 |
Module | exec |
nb instructions | 168 |
nb uops | 179 |
loop length | 803 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 5 |
used ymm registers | 0 |
used zmm registers | 3 |
nb stack references | 24 |
micro-operation queue | 29.83 cycles |
front end | 29.83 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 7.60 | 7.70 | 19.33 | 19.33 | 21.00 | 7.50 | 7.60 | 21.00 | 21.00 | 21.00 | 7.60 | 19.33 |
cycles | 7.60 | 7.70 | 19.33 | 19.33 | 21.00 | 7.50 | 7.60 | 21.00 | 21.00 | 21.00 | 7.60 | 19.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 28.17 |
Stall cycles | 0.00 |
Front-end | 29.83 |
Dispatch | 21.00 |
Overall L1 | 29.83 |
all | 4% |
load | 5% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 8% |
all | 16% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 83% |
all | 9% |
load | 2% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 33% |
all | 10% |
load | 12% |
store | 9% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 6% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 9% |
all | 14% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 22% |
all | 12% |
load | 12% |
store | 10% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 10% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x98,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x60(%RBP),%EBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x58(%RBP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %EBX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOVL $0,-0x54(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JS 44131f <field_summary_kernel_module_mp_field_summary_kernel_.DIR.OMP.PARALLEL.2+0x8df> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RCX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVL $0,-0x3c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %EAX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVL $0x1,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x50(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x54(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x3c(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x38(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x54d290,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,-0x4c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x22,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
CALL 404670 <__kmpc_for_static_init_4@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x20,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x3c(%RBP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x38(%RBP),%R8D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM2,%XMM2,%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM3,%XMM3,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VXORPD %XMM4,%XMM4,%XMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SUB %ESI,%R8D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 440c00 <field_summary_kernel_module_mp_field_summary_kernel_.DIR.OMP.PARALLEL.2+0x1c0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x20(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD %XMM4,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD %XMM3,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD %XMM2,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD %XMM0,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD %XMM1,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x54d2b0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x4c(%RBP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 404230 <__kmpc_for_static_fini@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x80(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x54d370,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x441340,%R9D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x5,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x28,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x55433c | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
CALL 404830 <__kmpc_reduce@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x10,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP $0x2,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 441280 <field_summary_kernel_module_mp_field_summary_kernel_.DIR.OMP.PARALLEL.2+0x840> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP $0x1,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x30(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 44131f <field_summary_kernel_module_mp_field_summary_kernel_.DIR.OMP.PARALLEL.2+0x8df> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD -0x80(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%R15),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM0,(%R15) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD -0x78(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%R14),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM0,(%R14) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD -0x70(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x88(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RAX),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM0,(%RAX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD -0x68(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%R13),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM0,(%R13) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD -0x60(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x90(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VADDSD (%RAX),%XMM0,%XMM0 | 1 | 0 | 0.50 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.50 |
VMOVSD %XMM0,(%RAX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x54d390,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JMP 441311 <field_summary_kernel_module_mp_field_summary_kernel_.DIR.OMP.PARALLEL.2+0x8d1> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xa0(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %EBX,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD $-0x2,%R14D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOVSXD %R14D,%RAX | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
MOV %RAX,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $-0x2,%R13D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOVSXD %R13D,%RAX | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
MOV %RAX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVDQA64 0xc9b11(%RIP),%ZMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.50 |
VPBROADCASTQ 0xcaaaf(%RIP),%ZMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VBROADCASTSD 0xcaa9d(%RIP),%ZMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
MOV 0x28(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
XOR %R13D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8D,-0x34(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 440d81 <field_summary_kernel_module_mp_field_summary_kernel_.DIR.OMP.PARALLEL.2+0x341> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x30(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 44131f <field_summary_kernel_module_mp_field_summary_kernel_.DIR.OMP.PARALLEL.2+0x8df> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VMOVSD -0x80(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x54d2d0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R15,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 404330 <__kmpc_atomic_float8_add@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD -0x78(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x54d2f0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R14,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 404330 <__kmpc_atomic_float8_add@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD -0x70(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x54d310,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x88(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 404330 <__kmpc_atomic_float8_add@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD -0x68(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x54d330,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R13,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 404330 <__kmpc_atomic_float8_add@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD -0x60(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x54d350,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x90(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 404330 <__kmpc_atomic_float8_add@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x54d3b0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x55433c,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4049b0 <__kmpc_end_reduce@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x30(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x54d3d0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 404740 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x98,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼field_summary_kernel_.DIR.OMP.PARALLEL.2– | 0.31 | 0.1 |
▼Loop 333 - field_summary_kernel.f90:56-71 - exec– | 0 | 0 |
○Loop 334 - field_summary_kernel.f90:58-71 - exec | 0.31 | 0.1 |
○Loop 335 - field_summary_kernel.f90:58-71 - exec | 0 | 0 |