Function: __ideal_gas_kernel_module_MOD_ideal_gas_kernel._omp_fn.0 | Module: exec | Source: ideal_gas_kernel.f90:45-55 | Coverage: 4.84% |
---|
Function: __ideal_gas_kernel_module_MOD_ideal_gas_kernel._omp_fn.0 | Module: exec | Source: ideal_gas_kernel.f90:45-55 | Coverage: 4.84% |
---|
/scratch_na/users/xoserete/qaas_runs/171-415-7919/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/ideal_gas_kernel.f90: 45 - 55 |
-------------------------------------------------------------------------------- |
45: !$OMP PARALLEL |
46: !$OMP DO PRIVATE(v,pressurebyenergy,pressurebyvolume,sound_speed_squared) |
47: DO k=y_min,y_max |
48: !$OMP SIMD |
49: DO j=x_min,x_max |
50: v=1.0_8/density(j,k) |
51: pressure(j,k)=(1.4_8-1.0_8)*density(j,k)*energy(j,k) |
52: pressurebyenergy=(1.4_8-1.0_8)*density(j,k) |
53: pressurebyvolume=-density(j,k)*pressure(j,k) |
54: sound_speed_squared=v*v*(pressure(j,k)*pressurebyenergy-pressurebyvolume) |
55: soundspeed(j,k)=SQRT(sound_speed_squared) |
0x435570 PUSH %RBP |
0x435571 MOV %RSP,%RBP |
0x435574 PUSH %R15 |
0x435576 PUSH %R14 |
0x435578 PUSH %R13 |
0x43557a PUSH %R12 |
0x43557c PUSH %RBX |
0x43557d AND $-0x40,%RSP |
0x435581 ADD $-0x80,%RSP |
0x435585 MOV 0x70(%RDI),%RDX |
0x435589 MOV 0x68(%RDI),%RCX |
0x43558d MOV %RDI,0x78(%RSP) |
0x435592 MOV 0x78(%RDI),%RAX |
0x435596 MOV 0x60(%RDI),%RBX |
0x43559a MOV 0x50(%RDI),%RSI |
0x43559e MOV 0x40(%RDI),%R8 |
0x4355a2 MOV %RDX,0x48(%RSP) |
0x4355a7 MOV 0x10(%RDI),%R9 |
0x4355ab MOV 0x58(%RDI),%R13 |
0x4355af MOV %RCX,0x60(%RSP) |
0x4355b4 MOV 0x48(%RDI),%R14 |
0x4355b8 MOV %RSI,0x38(%RSP) |
0x4355bd MOV (%R9),%R12D |
0x4355c0 MOV %R8,0x30(%RSP) |
0x4355c5 MOV %RAX,0x70(%RSP) |
0x4355ca MOV %RBX,0x40(%RSP) |
0x4355cf CALL 402080 <@plt_start@+0x60> |
0x4355d4 MOV %EAX,%R15D |
0x4355d7 CALL 402180 <@plt_start@+0x160> |
0x4355dc MOV 0x78(%RSP),%RCX |
0x4355e1 MOV %EAX,%EDI |
0x4355e3 MOV 0x18(%RCX),%R10 |
0x4355e7 MOV (%R10),%EAX |
0x4355ea INC %EAX |
0x4355ec SUB %R12D,%EAX |
0x4355ef CLTD |
0x4355f0 IDIV %R15D |
0x4355f3 CMP %EDX,%EDI |
0x4355f5 JL 435c13 |
0x4355fb IMUL %EAX,%EDI |
0x4355fe ADD %EDX,%EDI |
0x435600 ADD %EDI,%EAX |
0x435602 CMP %EAX,%EDI |
0x435604 JGE 435be5 |
0x43560a MOV 0x8(%RCX),%R8 |
0x43560e MOV 0x30(%RCX),%R9 |
0x435612 ADD %R12D,%EAX |
0x435615 ADD %R12D,%EDI |
0x435618 MOV (%RCX),%R11 |
0x43561b MOV 0x28(%RCX),%R10 |
0x43561f MOV %EAX,0x2c(%RSP) |
0x435623 MOV (%R8),%R15D |
0x435626 VMOVSD 0x5a8ba(%RIP),%XMM7 |
0x43562e MOV %R9,0x78(%RSP) |
0x435633 MOV 0x30(%RSP),%R9 |
0x435638 MOVSXD (%R11),%RSI |
0x43563b MOV %EDI,0x6c(%RSP) |
0x43563f LEA 0x1(%R15),%EAX |
0x435643 MOV 0x40(%RSP),%R11 |
0x435648 VMOVSD 0x5a880(%RIP),%XMM6 |
0x435650 MOV %R15D,0x68(%RSP) |
0x435655 MOV %EAX,0x24(%RSP) |
0x435659 MOVSXD %EDI,%RAX |
0x43565c ADD %RSI,%R14 |
0x43565f MOV 0x60(%RSP),%RDI |
0x435664 IMUL %RAX,%R9 |
0x435668 LEA (%R13,%RSI,1),%R8 |
0x43566d MOV 0x38(%RSP),%R13 |
0x435672 MOV %RSI,%RBX |
0x435675 IMUL %RAX,%R11 |
0x435679 ADD %RSI,%RDI |
0x43567c MOV %ESI,0x58(%RSP) |
0x435680 VMOVSD 0x5a850(%RIP),%XMM5 |
0x435688 IMUL %RAX,%R13 |
0x43568c MOV %RSI,0x10(%RSP) |
0x435691 MOV 0x70(%RSP),%RSI |
0x435696 VBROADCASTSD %XMM7,%YMM10 |
0x43569b ADD %R14,%R9 |
0x43569e MOV 0x48(%RSP),%R14 |
0x4356a3 MOV %R10,0x70(%RSP) |
0x4356a8 VBROADCASTSD %XMM6,%YMM9 |
0x4356ad ADD %RBX,%RSI |
0x4356b0 ADD %R11,%RDI |
0x4356b3 MOV 0x20(%RCX),%RDX |
0x4356b7 MOV 0x38(%RCX),%R12 |
0x4356bb IMUL %R14,%RAX |
0x4356bf VBROADCASTSD %XMM5,%YMM8 |
0x4356c4 VBROADCASTSD %XMM7,%ZMM4 |
0x4356ca ADD %R13,%R8 |
0x4356cd VBROADCASTSD %XMM6,%ZMM3 |
0x4356d3 VBROADCASTSD %XMM5,%ZMM2 |
0x4356d9 ADD %RAX,%RSI |
0x4356dc MOV %R15D,%EAX |
0x4356df SUB %EBX,%EAX |
0x4356e1 MOV %EAX,0x5c(%RSP) |
0x4356e5 INC %EAX |
0x4356e7 MOV %EAX,%R13D |
0x4356ea MOV %EAX,%R11D |
0x4356ed SHR $0x3,%R13D |
0x4356f1 AND $-0x8,%R11D |
0x4356f5 SAL $0x6,%R13 |
0x4356f9 CMP %R15D,%EBX |
0x4356fc LEA (%R11,%RBX,1),%R14D |
0x435700 MOV %R11D,0x20(%RSP) |
0x435705 CMOVLE 0x24(%RSP),%EBX |
0x43570a AND $0x7,%EAX |
0x43570d MOV %R13,0x60(%RSP) |
0x435712 XOR %R11D,%R11D |
0x435715 MOV %R14D,0x1c(%RSP) |
0x43571a MOV %EBX,0x18(%RSP) |
0x43571e MOV %EAX,0x28(%RSP) |
0x435722 MOV %RCX,0x8(%RSP) |
0x435727 NOPW (%RAX,%RAX,1) |
(239) 0x435730 MOV 0x68(%RSP),%ECX |
(239) 0x435734 CMP %ECX,0x58(%RSP) |
(239) 0x435738 JG 435bf8 |
(239) 0x43573e CMPL $0x6,0x5c(%RSP) |
(239) 0x435743 JBE 435c08 |
(239) 0x435749 MOV 0x70(%RSP),%R10 |
(239) 0x43574e MOV 0x60(%RSP),%R14 |
(239) 0x435753 LEA (%RDX,%R9,8),%R15 |
(239) 0x435757 LEA (%R12,%RSI,8),%RCX |
(239) 0x43575b MOV 0x78(%RSP),%R11 |
(239) 0x435760 XOR %EAX,%EAX |
(239) 0x435762 LEA (%R10,%R8,8),%R13 |
(239) 0x435766 LEA -0x40(%R14),%R10 |
(239) 0x43576a SHR $0x6,%R10 |
(239) 0x43576e LEA (%R11,%RDI,8),%RBX |
(239) 0x435772 INC %R10 |
(239) 0x435775 AND $0x3,%R10D |
(239) 0x435779 JE 43587a |
(239) 0x43577f CMP $0x1,%R10 |
(239) 0x435783 JE 435823 |
(239) 0x435789 CMP $0x2,%R10 |
(239) 0x43578d JE 4357d7 |
(239) 0x43578f VMOVUPD (%R15),%ZMM1 |
(239) 0x435795 MOV $0x40,%EAX |
(239) 0x43579a VMULPD (%R13),%ZMM1,%ZMM0 |
(239) 0x4357a1 VDIVPD %ZMM1,%ZMM4,%ZMM11 |
(239) 0x4357a7 VMULPD %ZMM11,%ZMM11,%ZMM14 |
(239) 0x4357ad VMULPD %ZMM3,%ZMM0,%ZMM12 |
(239) 0x4357b3 VMOVUPD %ZMM12,(%RBX) |
(239) 0x4357b9 VMULPD (%R15),%ZMM2,%ZMM13 |
(239) 0x4357bf VMULPD %ZMM14,%ZMM13,%ZMM15 |
(239) 0x4357c5 VMULPD %ZMM12,%ZMM15,%ZMM1 |
(239) 0x4357cb VSQRTPD %ZMM1,%ZMM11 |
(239) 0x4357d1 VMOVUPD %ZMM11,(%RCX) |
(239) 0x4357d7 VMOVUPD (%R15,%RAX,1),%ZMM0 |
(239) 0x4357de VMULPD (%R13,%RAX,1),%ZMM0,%ZMM13 |
(239) 0x4357e6 VDIVPD %ZMM0,%ZMM4,%ZMM12 |
(239) 0x4357ec VMULPD %ZMM12,%ZMM12,%ZMM1 |
(239) 0x4357f2 VMULPD %ZMM3,%ZMM13,%ZMM14 |
(239) 0x4357f8 VMOVUPD %ZMM14,(%RBX,%RAX,1) |
(239) 0x4357ff VMULPD (%R15,%RAX,1),%ZMM2,%ZMM15 |
(239) 0x435806 VMULPD %ZMM1,%ZMM15,%ZMM11 |
(239) 0x43580c VMULPD %ZMM14,%ZMM11,%ZMM0 |
(239) 0x435812 VSQRTPD %ZMM0,%ZMM12 |
(239) 0x435818 VMOVUPD %ZMM12,(%RCX,%RAX,1) |
(239) 0x43581f ADD $0x40,%RAX |
(239) 0x435823 VMOVUPD (%R15,%RAX,1),%ZMM13 |
(239) 0x43582a VMULPD (%R13,%RAX,1),%ZMM13,%ZMM15 |
(239) 0x435832 VDIVPD %ZMM13,%ZMM4,%ZMM14 |
(239) 0x435838 VMULPD %ZMM14,%ZMM14,%ZMM11 |
(239) 0x43583e VMULPD %ZMM3,%ZMM15,%ZMM1 |
(239) 0x435844 VMOVUPD %ZMM1,(%RBX,%RAX,1) |
(239) 0x43584b VMULPD (%R15,%RAX,1),%ZMM2,%ZMM0 |
(239) 0x435852 VMULPD %ZMM11,%ZMM0,%ZMM12 |
(239) 0x435858 VMULPD %ZMM1,%ZMM12,%ZMM13 |
(239) 0x43585e VSQRTPD %ZMM13,%ZMM14 |
(239) 0x435864 VMOVUPD %ZMM14,(%RCX,%RAX,1) |
(239) 0x43586b ADD $0x40,%RAX |
(239) 0x43586f CMP %RAX,0x60(%RSP) |
(239) 0x435874 JE 4359b7 |
(240) 0x43587a VMOVUPD (%R15,%RAX,1),%ZMM15 |
(240) 0x435881 VMULPD (%R13,%RAX,1),%ZMM15,%ZMM1 |
(240) 0x435889 VDIVPD %ZMM15,%ZMM4,%ZMM11 |
(240) 0x43588f VMULPD %ZMM11,%ZMM11,%ZMM13 |
(240) 0x435895 VMULPD %ZMM3,%ZMM1,%ZMM12 |
(240) 0x43589b VMOVUPD %ZMM12,(%RBX,%RAX,1) |
(240) 0x4358a2 VMULPD (%R15,%RAX,1),%ZMM2,%ZMM0 |
(240) 0x4358a9 VMULPD %ZMM13,%ZMM0,%ZMM14 |
(240) 0x4358af VMULPD %ZMM12,%ZMM14,%ZMM15 |
(240) 0x4358b5 VSQRTPD %ZMM15,%ZMM11 |
(240) 0x4358bb VMOVUPD %ZMM11,(%RCX,%RAX,1) |
(240) 0x4358c2 VMOVUPD 0x40(%R15,%RAX,1),%ZMM1 |
(240) 0x4358ca VMULPD 0x40(%R13,%RAX,1),%ZMM1,%ZMM0 |
(240) 0x4358d2 VDIVPD %ZMM1,%ZMM4,%ZMM12 |
(240) 0x4358d8 VMULPD %ZMM12,%ZMM12,%ZMM15 |
(240) 0x4358de VMULPD %ZMM3,%ZMM0,%ZMM13 |
(240) 0x4358e4 VMOVUPD %ZMM13,0x40(%RBX,%RAX,1) |
(240) 0x4358ec VMULPD 0x40(%R15,%RAX,1),%ZMM2,%ZMM14 |
(240) 0x4358f4 VMULPD %ZMM15,%ZMM14,%ZMM11 |
(240) 0x4358fa VMULPD %ZMM13,%ZMM11,%ZMM1 |
(240) 0x435900 VSQRTPD %ZMM1,%ZMM12 |
(240) 0x435906 VMOVUPD %ZMM12,0x40(%RCX,%RAX,1) |
(240) 0x43590e VMOVUPD 0x80(%R15,%RAX,1),%ZMM0 |
(240) 0x435916 VMULPD 0x80(%R13,%RAX,1),%ZMM0,%ZMM14 |
(240) 0x43591e VDIVPD %ZMM0,%ZMM4,%ZMM13 |
(240) 0x435924 VMULPD %ZMM13,%ZMM13,%ZMM11 |
(240) 0x43592a VMULPD %ZMM3,%ZMM14,%ZMM15 |
(240) 0x435930 VMOVUPD %ZMM15,0x80(%RBX,%RAX,1) |
(240) 0x435938 VMULPD 0x80(%R15,%RAX,1),%ZMM2,%ZMM1 |
(240) 0x435940 VMULPD %ZMM11,%ZMM1,%ZMM12 |
(240) 0x435946 VMULPD %ZMM15,%ZMM12,%ZMM0 |
(240) 0x43594c VSQRTPD %ZMM0,%ZMM13 |
(240) 0x435952 VMOVUPD %ZMM13,0x80(%RCX,%RAX,1) |
(240) 0x43595a VMOVUPD 0xc0(%R15,%RAX,1),%ZMM14 |
(240) 0x435962 VMULPD 0xc0(%R13,%RAX,1),%ZMM14,%ZMM1 |
(240) 0x43596a VDIVPD %ZMM14,%ZMM4,%ZMM15 |
(240) 0x435970 VMULPD %ZMM15,%ZMM15,%ZMM11 |
(240) 0x435976 VMULPD %ZMM3,%ZMM1,%ZMM12 |
(240) 0x43597c VMOVUPD %ZMM12,0xc0(%RBX,%RAX,1) |
(240) 0x435984 VMULPD 0xc0(%R15,%RAX,1),%ZMM2,%ZMM0 |
(240) 0x43598c VMULPD %ZMM11,%ZMM0,%ZMM13 |
(240) 0x435992 VMULPD %ZMM12,%ZMM13,%ZMM14 |
(240) 0x435998 VSQRTPD %ZMM14,%ZMM15 |
(240) 0x43599e VMOVUPD %ZMM15,0xc0(%RCX,%RAX,1) |
(240) 0x4359a6 ADD $0x100,%RAX |
(240) 0x4359ac CMP %RAX,0x60(%RSP) |
(240) 0x4359b1 JNE 43587a |
(239) 0x4359b7 MOV 0x28(%RSP),%R15D |
(239) 0x4359bc TEST %R15D,%R15D |
(239) 0x4359bf JE 435b87 |
(239) 0x4359c5 MOV 0x20(%RSP),%ECX |
(239) 0x4359c9 MOV 0x1c(%RSP),%EAX |
(239) 0x4359cd MOV 0x5c(%RSP),%R13D |
(239) 0x4359d2 SUB %ECX,%R13D |
(239) 0x4359d5 LEA 0x1(%R13),%R10D |
(239) 0x4359d9 CMP $0x2,%R13D |
(239) 0x4359dd JBE 435a46 |
(239) 0x4359df LEA (%R9,%RCX,1),%R11 |
(239) 0x4359e3 MOV 0x70(%RSP),%R14 |
(239) 0x4359e8 LEA (%R8,%RCX,1),%R15 |
(239) 0x4359ec MOV 0x78(%RSP),%R13 |
(239) 0x4359f1 LEA (%RDX,%R11,8),%R11 |
(239) 0x4359f5 LEA (%RCX,%RSI,1),%RBX |
(239) 0x4359f9 ADD %RDI,%RCX |
(239) 0x4359fc VMOVUPD (%R11),%YMM1 |
(239) 0x435a01 VDIVPD %YMM1,%YMM10,%YMM12 |
(239) 0x435a05 VMULPD (%R14,%R15,8),%YMM1,%YMM0 |
(239) 0x435a0b VMULPD %YMM9,%YMM0,%YMM13 |
(239) 0x435a10 VMOVUPD %YMM13,(%R13,%RCX,8) |
(239) 0x435a17 VMULPD (%R11),%YMM8,%YMM14 |
(239) 0x435a1c VMULPD %YMM12,%YMM12,%YMM11 |
(239) 0x435a21 VMULPD %YMM11,%YMM14,%YMM15 |
(239) 0x435a26 VMULPD %YMM13,%YMM15,%YMM1 |
(239) 0x435a2b VSQRTPD %YMM1,%YMM12 |
(239) 0x435a2f VMOVUPD %YMM12,(%R12,%RBX,8) |
(239) 0x435a35 TEST $0x3,%R10B |
(239) 0x435a39 JE 435b87 |
(239) 0x435a3f AND $-0x4,%R10D |
(239) 0x435a43 ADD %R10D,%EAX |
(239) 0x435a46 MOV 0x10(%RSP),%RCX |
(239) 0x435a4b MOV %R9,%R10 |
(239) 0x435a4e MOV %R8,%R13 |
(239) 0x435a51 MOV %RDI,%RBX |
(239) 0x435a54 MOV %RSI,%R11 |
(239) 0x435a57 SUB %RCX,%R11 |
(239) 0x435a5a SUB %RCX,%R10 |
(239) 0x435a5d SUB %RCX,%R13 |
(239) 0x435a60 SUB %RCX,%RBX |
(239) 0x435a63 MOVSXD %EAX,%RCX |
(239) 0x435a66 MOV %R11,0x50(%RSP) |
(239) 0x435a6b MOV 0x70(%RSP),%R11 |
(239) 0x435a70 LEA (%R10,%RCX,1),%R14 |
(239) 0x435a74 LEA (%RCX,%R13,1),%R15 |
(239) 0x435a78 VMOVSD (%RDX,%R14,8),%XMM0 |
(239) 0x435a7e VDIVSD %XMM0,%XMM7,%XMM13 |
(239) 0x435a82 VMULSD (%R11,%R15,8),%XMM0,%XMM14 |
(239) 0x435a88 MOV 0x78(%RSP),%R11 |
(239) 0x435a8d LEA (%RCX,%RBX,1),%R15 |
(239) 0x435a91 VMULSD %XMM6,%XMM14,%XMM11 |
(239) 0x435a95 VMOVSD %XMM11,(%R11,%R15,8) |
(239) 0x435a9b VMULSD (%RDX,%R14,8),%XMM5,%XMM15 |
(239) 0x435aa1 MOV 0x50(%RSP),%R14 |
(239) 0x435aa6 ADD %R14,%RCX |
(239) 0x435aa9 VMULSD %XMM11,%XMM15,%XMM1 |
(239) 0x435aae VMULSD %XMM13,%XMM13,%XMM12 |
(239) 0x435ab3 VMULSD %XMM12,%XMM1,%XMM0 |
(239) 0x435ab8 VSQRTSD %XMM0,%XMM0,%XMM0 |
(239) 0x435abc VMOVSD %XMM0,(%R12,%RCX,8) |
(239) 0x435ac2 LEA 0x1(%RAX),%ECX |
(239) 0x435ac5 CMP %ECX,0x68(%RSP) |
(239) 0x435ac9 JL 435b87 |
(239) 0x435acf MOVSXD %ECX,%RCX |
(239) 0x435ad2 MOV 0x70(%RSP),%R11 |
(239) 0x435ad7 ADD $0x2,%EAX |
(239) 0x435ada LEA (%R10,%RCX,1),%R14 |
(239) 0x435ade LEA (%R13,%RCX,1),%R15 |
(239) 0x435ae3 VMOVSD (%RDX,%R14,8),%XMM13 |
(239) 0x435ae9 VDIVSD %XMM13,%XMM7,%XMM14 |
(239) 0x435aee VMULSD (%R11,%R15,8),%XMM13,%XMM11 |
(239) 0x435af4 MOV 0x78(%RSP),%R11 |
(239) 0x435af9 LEA (%RBX,%RCX,1),%R15 |
(239) 0x435afd VMULSD %XMM6,%XMM11,%XMM15 |
(239) 0x435b01 VMOVSD %XMM15,(%R11,%R15,8) |
(239) 0x435b07 VMULSD (%RDX,%R14,8),%XMM5,%XMM1 |
(239) 0x435b0d MOV 0x50(%RSP),%R14 |
(239) 0x435b12 ADD %R14,%RCX |
(239) 0x435b15 VMULSD %XMM15,%XMM1,%XMM12 |
(239) 0x435b1a VMULSD %XMM14,%XMM14,%XMM0 |
(239) 0x435b1f VMULSD %XMM0,%XMM12,%XMM13 |
(239) 0x435b23 VSQRTSD %XMM13,%XMM13,%XMM13 |
(239) 0x435b28 VMOVSD %XMM13,(%R12,%RCX,8) |
(239) 0x435b2e CMP %EAX,0x68(%RSP) |
(239) 0x435b32 JL 435b87 |
(239) 0x435b34 CLTQ |
(239) 0x435b36 MOV 0x70(%RSP),%RCX |
(239) 0x435b3b ADD %RAX,%R10 |
(239) 0x435b3e ADD %RAX,%R13 |
(239) 0x435b41 ADD %RAX,%RBX |
(239) 0x435b44 ADD %RAX,%R14 |
(239) 0x435b47 VMOVSD (%RDX,%R10,8),%XMM14 |
(239) 0x435b4d VDIVSD %XMM14,%XMM7,%XMM11 |
(239) 0x435b52 VMULSD (%RCX,%R13,8),%XMM14,%XMM15 |
(239) 0x435b58 MOV 0x78(%RSP),%R13 |
(239) 0x435b5d VMULSD %XMM6,%XMM15,%XMM1 |
(239) 0x435b61 VMOVSD %XMM1,(%R13,%RBX,8) |
(239) 0x435b68 VMULSD (%RDX,%R10,8),%XMM5,%XMM12 |
(239) 0x435b6e VMULSD %XMM1,%XMM12,%XMM0 |
(239) 0x435b72 VMULSD %XMM11,%XMM11,%XMM13 |
(239) 0x435b77 VMULSD %XMM13,%XMM0,%XMM14 |
(239) 0x435b7c VSQRTSD %XMM14,%XMM14,%XMM14 |
(239) 0x435b81 VMOVSD %XMM14,(%R12,%R14,8) |
(239) 0x435b87 MOV 0x18(%RSP),%EAX |
(239) 0x435b8b MOV $0x1,%R11D |
(239) 0x435b91 MOV %EAX,0x50(%RSP) |
(239) 0x435b95 NOPL (%RAX) |
(239) 0x435b98 INCL 0x6c(%RSP) |
(239) 0x435b9c MOV 0x30(%RSP),%RBX |
(239) 0x435ba1 MOV 0x38(%RSP),%R14 |
(239) 0x435ba6 MOV 0x40(%RSP),%RCX |
(239) 0x435bab MOV 0x48(%RSP),%R13 |
(239) 0x435bb0 ADD %RBX,%R9 |
(239) 0x435bb3 ADD %R14,%R8 |
(239) 0x435bb6 ADD %RCX,%RDI |
(239) 0x435bb9 MOV 0x6c(%RSP),%R10D |
(239) 0x435bbe ADD %R13,%RSI |
(239) 0x435bc1 CMP %R10D,0x2c(%RSP) |
(239) 0x435bc6 JG 435730 |
0x435bcc MOV 0x8(%RSP),%RDX |
0x435bd1 TEST %R11B,%R11B |
0x435bd4 JE 435c1c |
0x435bd6 MOV 0x50(%RSP),%R12D |
0x435bdb MOV %R12D,0x80(%RDX) |
0x435be2 VZEROUPPER |
0x435be5 LEA -0x28(%RBP),%RSP |
0x435be9 POP %RBX |
0x435bea POP %R12 |
0x435bec POP %R13 |
0x435bee POP %R14 |
0x435bf0 POP %R15 |
0x435bf2 POP %RBP |
0x435bf3 RET |
0x435bf4 NOPL (%RAX) |
(239) 0x435bf8 MOV 0x18(%RSP),%EBX |
(239) 0x435bfc CMP %EBX,0x24(%RSP) |
(239) 0x435c00 JNE 435b98 |
(239) 0x435c02 JMP 435b87 |
0x435c04 NOPL (%RAX) |
(239) 0x435c08 MOV 0x58(%RSP),%EAX |
(239) 0x435c0c XOR %ECX,%ECX |
(239) 0x435c0e JMP 4359cd |
0x435c13 INC %EAX |
0x435c15 XOR %EDX,%EDX |
0x435c17 JMP 4355fb |
0x435c1c VZEROUPPER |
0x435c1f LEA -0x28(%RBP),%RSP |
0x435c23 POP %RBX |
0x435c24 POP %R12 |
0x435c26 POP %R13 |
0x435c28 POP %R14 |
0x435c2a POP %R15 |
0x435c2c POP %RBP |
0x435c2d RET |
0x435c2e XCHG %AX,%AX |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
○98.30 | gomp_thread_start | team.c:130 | libgomp.so.1.0.0 |
○1.70 | GOMP_parallel | libgomp.h:985 | libgomp.so.1.0.0 |
Path / |
Source file and lines | ideal_gas_kernel.f90:45-55 |
Module | exec |
nb instructions | 142 |
nb uops | 149 |
loop length | 525 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 3 |
used zmm registers | 3 |
nb stack references | 21 |
micro-operation queue | 24.83 cycles |
front end | 24.83 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 9.90 | 9.80 | 15.67 | 15.67 | 15.50 | 9.80 | 9.70 | 15.50 | 15.50 | 15.50 | 9.80 | 15.67 |
cycles | 9.90 | 13.33 | 15.67 | 15.67 | 15.50 | 9.80 | 9.70 | 15.50 | 15.50 | 15.50 | 9.80 | 15.67 |
Cycles executing div or sqrt instructions | 6.00 |
FE+BE cycles | 24.25-25.63 |
Stall cycles | 0.00-1.24 |
Front-end | 24.83 |
Dispatch | 15.67 |
DIV/SQRT | 6.00 |
Overall L1 | 24.83 |
all | 5% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 28% |
all | 0% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 4% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 16% |
all | 10% |
load | 10% |
store | 9% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 12% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 10% |
load | 10% |
store | 9% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 6% |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x40,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
ADD $-0x80,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x70(%RDI),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x68(%RDI),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDI,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x78(%RDI),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x60(%RDI),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x50(%RDI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x40(%RDI),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RDI),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x58(%RDI),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x48(%RDI),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RSI,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%R9),%R12D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R8,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 402080 <@plt_start@+0x60> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %EAX,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 402180 <@plt_start@+0x160> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x78(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %EAX,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x18(%RCX),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
INC %EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SUB %R12D,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CLTD | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %R15D | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
CMP %EDX,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 435c13 <__ideal_gas_kernel_module_MOD_ideal_gas_kernel._omp_fn.0+0x6a3> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
IMUL %EAX,%EDI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %EDX,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %EDI,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMP %EAX,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 435be5 <__ideal_gas_kernel_module_MOD_ideal_gas_kernel._omp_fn.0+0x675> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x8(%RCX),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RCX),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %R12D,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %R12D,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV (%RCX),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x28(%RCX),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %EAX,0x2c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%R8),%R15D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x5a8ba(%RIP),%XMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RSP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVSXD (%R11),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %EDI,0x6c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x1(%R15),%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV 0x40(%RSP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x5a880(%RIP),%XMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15D,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %EAX,0x24(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVSXD %EDI,%RAX | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
ADD %RSI,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x60(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
IMUL %RAX,%R9 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%R13,%RSI,1),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x38(%RSP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RSI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %RAX,%R11 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RSI,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD 0x5a850(%RIP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
IMUL %RAX,%R13 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RSI,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x70(%RSP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD %XMM7,%YMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %R14,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x48(%RSP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R10,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VBROADCASTSD %XMM6,%YMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RBX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %R11,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x20(%RCX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RCX),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
IMUL %R14,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM5,%YMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM7,%ZMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %R13,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VBROADCASTSD %XMM6,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM5,%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R15D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %EBX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %EAX,0x5c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
INC %EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %EAX,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %EAX,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x3,%R13D | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
AND $-0x8,%R11D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SAL $0x6,%R13 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
CMP %R15D,%EBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA (%R11,%RBX,1),%R14D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %R11D,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMOVLE 0x24(%RSP),%EBX | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.50 |
AND $0x7,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %R13,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %R11D,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14D,0x1c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %EBX,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %EAX,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,0x8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x8(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R11B,%R11B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 435c1c <__ideal_gas_kernel_module_MOD_ideal_gas_kernel._omp_fn.0+0x6ac> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x50(%RSP),%R12D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12D,0x80(%RDX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
INC %EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4355fb <__ideal_gas_kernel_module_MOD_ideal_gas_kernel._omp_fn.0+0x8b> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | ideal_gas_kernel.f90:45-55 |
Module | exec |
nb instructions | 142 |
nb uops | 149 |
loop length | 525 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 3 |
used zmm registers | 3 |
nb stack references | 21 |
micro-operation queue | 24.83 cycles |
front end | 24.83 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 9.90 | 9.80 | 15.67 | 15.67 | 15.50 | 9.80 | 9.70 | 15.50 | 15.50 | 15.50 | 9.80 | 15.67 |
cycles | 9.90 | 13.33 | 15.67 | 15.67 | 15.50 | 9.80 | 9.70 | 15.50 | 15.50 | 15.50 | 9.80 | 15.67 |
Cycles executing div or sqrt instructions | 6.00 |
FE+BE cycles | 24.25-25.63 |
Stall cycles | 0.00-1.24 |
Front-end | 24.83 |
Dispatch | 15.67 |
DIV/SQRT | 6.00 |
Overall L1 | 24.83 |
all | 5% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 28% |
all | 0% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 4% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 16% |
all | 10% |
load | 10% |
store | 9% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 11% |
all | 12% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 10% |
load | 10% |
store | 9% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 6% |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x40,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
ADD $-0x80,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x70(%RDI),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x68(%RDI),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDI,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x78(%RDI),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x60(%RDI),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x50(%RDI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x40(%RDI),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RDI),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x58(%RDI),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x48(%RDI),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RSI,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%R9),%R12D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R8,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 402080 <@plt_start@+0x60> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %EAX,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 402180 <@plt_start@+0x160> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x78(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %EAX,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x18(%RCX),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R10),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
INC %EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SUB %R12D,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CLTD | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %R15D | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
CMP %EDX,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 435c13 <__ideal_gas_kernel_module_MOD_ideal_gas_kernel._omp_fn.0+0x6a3> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
IMUL %EAX,%EDI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %EDX,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %EDI,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMP %EAX,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 435be5 <__ideal_gas_kernel_module_MOD_ideal_gas_kernel._omp_fn.0+0x675> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x8(%RCX),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RCX),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %R12D,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %R12D,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV (%RCX),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x28(%RCX),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %EAX,0x2c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%R8),%R15D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x5a8ba(%RIP),%XMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RSP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVSXD (%R11),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %EDI,0x6c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x1(%R15),%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV 0x40(%RSP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x5a880(%RIP),%XMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15D,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %EAX,0x24(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVSXD %EDI,%RAX | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
ADD %RSI,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x60(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
IMUL %RAX,%R9 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%R13,%RSI,1),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x38(%RSP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RSI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %RAX,%R11 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RSI,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD 0x5a850(%RIP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
IMUL %RAX,%R13 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RSI,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x70(%RSP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD %XMM7,%YMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %R14,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x48(%RSP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R10,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VBROADCASTSD %XMM6,%YMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RBX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %R11,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x20(%RCX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RCX),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
IMUL %R14,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM5,%YMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM7,%ZMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %R13,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VBROADCASTSD %XMM6,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM5,%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R15D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %EBX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %EAX,0x5c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
INC %EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %EAX,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %EAX,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x3,%R13D | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
AND $-0x8,%R11D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SAL $0x6,%R13 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
CMP %R15D,%EBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA (%R11,%RBX,1),%R14D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %R11D,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMOVLE 0x24(%RSP),%EBX | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.50 |
AND $0x7,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %R13,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %R11D,%R11D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14D,0x1c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %EBX,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %EAX,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,0x8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x8(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R11B,%R11B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 435c1c <__ideal_gas_kernel_module_MOD_ideal_gas_kernel._omp_fn.0+0x6ac> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x50(%RSP),%R12D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12D,0x80(%RDX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
INC %EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4355fb <__ideal_gas_kernel_module_MOD_ideal_gas_kernel._omp_fn.0+0x8b> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼__ideal_gas_kernel_module_MOD_ideal_gas_kernel._omp_fn.0– | 4.84 | 3.6 |
▼Loop 239 - ideal_gas_kernel.f90:45-55 - exec– | 0 | 0 |
○Loop 240 - ideal_gas_kernel.f90:50-55 - exec | 4.84 | 3.6 |