Function: ideal_gas_kernel._omp_fn.0 | Module: exec | Source: ideal_gas_kernel.f90:45-55 | Coverage: 4.87% |
---|
Function: ideal_gas_kernel._omp_fn.0 | Module: exec | Source: ideal_gas_kernel.f90:45-55 | Coverage: 4.87% |
---|
/scratch_na/users/xoserete/qaas_runs/171-215-0463/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/ideal_gas_kernel.f90: 45 - 55 |
-------------------------------------------------------------------------------- |
45: !$OMP PARALLEL |
46: !$OMP DO PRIVATE(v,pressurebyenergy,pressurebyvolume,sound_speed_squared) |
47: DO k=y_min,y_max |
48: !$OMP SIMD |
49: DO j=x_min,x_max |
50: v=1.0_8/density(j,k) |
51: pressure(j,k)=(1.4_8-1.0_8)*density(j,k)*energy(j,k) |
52: pressurebyenergy=(1.4_8-1.0_8)*density(j,k) |
53: pressurebyvolume=-density(j,k)*pressure(j,k) |
54: sound_speed_squared=v*v*(pressure(j,k)*pressurebyenergy-pressurebyvolume) |
55: soundspeed(j,k)=SQRT(sound_speed_squared) |
0x44ded0 PUSH %RBP |
0x44ded1 MOV %RSP,%RBP |
0x44ded4 PUSH %R15 |
0x44ded6 PUSH %R14 |
0x44ded8 PUSH %R13 |
0x44deda PUSH %R12 |
0x44dedc PUSH %RBX |
0x44dedd AND $-0x40,%RSP |
0x44dee1 ADD $-0x80,%RSP |
0x44dee5 MOV 0x68(%RDI),%RDX |
0x44dee9 MOV 0x50(%RDI),%RBX |
0x44deed MOV %RDI,0x78(%RSP) |
0x44def2 MOV 0x40(%RDI),%RSI |
0x44def6 MOV 0x70(%RDI),%RAX |
0x44defa MOV 0x60(%RDI),%RCX |
0x44defe MOV 0x10(%RDI),%R8 |
0x44df02 MOV %RDX,0x70(%RSP) |
0x44df07 MOV 0x78(%RDI),%R15 |
0x44df0b MOV 0x58(%RDI),%R13 |
0x44df0f MOV %RSI,0x30(%RSP) |
0x44df14 MOV 0x48(%RDI),%R14 |
0x44df18 MOV %RCX,0x40(%RSP) |
0x44df1d MOV %RBX,0x38(%RSP) |
0x44df22 MOV (%R8),%EBX |
0x44df25 MOV %RAX,0x48(%RSP) |
0x44df2a CALL 402080 <@plt_start@+0x60> |
0x44df2f MOV %EAX,%R12D |
0x44df32 CALL 402180 <@plt_start@+0x160> |
0x44df37 MOV 0x78(%RSP),%R11 |
0x44df3c MOV %EAX,%ESI |
0x44df3e MOV 0x18(%R11),%RDI |
0x44df42 MOV (%RDI),%EAX |
0x44df44 INC %EAX |
0x44df46 SUB %EBX,%EAX |
0x44df48 CLTD |
0x44df49 IDIV %R12D |
0x44df4c CMP %EDX,%ESI |
0x44df4e JL 44e51b |
0x44df54 IMUL %EAX,%ESI |
0x44df57 ADD %EDX,%ESI |
0x44df59 ADD %ESI,%EAX |
0x44df5b CMP %EAX,%ESI |
0x44df5d JGE 44e501 |
0x44df63 MOV 0x8(%R11),%R10 |
0x44df67 ADD %EBX,%ESI |
0x44df69 ADD %EBX,%EAX |
0x44df6b MOV (%R11),%R9 |
0x44df6e VMOVSD 0x5e7a2(%RIP),%XMM7 |
0x44df76 VMOVSD 0x5ec82(%RIP),%XMM6 |
0x44df7e MOV %ESI,0x5c(%RSP) |
0x44df82 MOV (%R10),%ECX |
0x44df85 MOVSXD (%R9),%R8 |
0x44df88 MOV %EAX,0x1c(%RSP) |
0x44df8c MOVSXD %ESI,%RAX |
0x44df8f MOV 0x30(%RSP),%RSI |
0x44df94 VMOVSD 0x5ec6c(%RIP),%XMM5 |
0x44df9c VBROADCASTSD %XMM7,%YMM10 |
0x44dfa1 VBROADCASTSD %XMM6,%YMM9 |
0x44dfa6 MOV %ECX,0x60(%RSP) |
0x44dfaa LEA 0x1(%RCX),%R12D |
0x44dfae MOV 0x38(%RSP),%RCX |
0x44dfb3 ADD %R8,%R14 |
0x44dfb6 IMUL %RAX,%RSI |
0x44dfba ADD %R8,%R13 |
0x44dfbd MOV %R8D,0x24(%RSP) |
0x44dfc2 LEA (%R15,%R8,1),%R15 |
0x44dfc6 IMUL %RAX,%RCX |
0x44dfca MOV %R8,0x28(%RSP) |
0x44dfcf MOV 0x20(%R11),%RDX |
0x44dfd3 VBROADCASTSD %XMM5,%YMM8 |
0x44dfd8 MOV %R12D,0x18(%RSP) |
0x44dfdd MOV 0x60(%RSP),%R12D |
0x44dfe2 VBROADCASTSD %XMM7,%ZMM4 |
0x44dfe8 VBROADCASTSD %XMM6,%ZMM3 |
0x44dfee ADD %R14,%RSI |
0x44dff1 MOV 0x70(%RSP),%R14 |
0x44dff6 MOV 0x24(%RSP),%EBX |
0x44dffa VBROADCASTSD %XMM5,%ZMM2 |
0x44e000 ADD %RCX,%R13 |
0x44e003 MOV 0x40(%RSP),%RCX |
0x44e008 MOV 0x28(%R11),%R10 |
0x44e00c ADD %R8,%R14 |
0x44e00f MOV 0x48(%RSP),%R8 |
0x44e014 MOV 0x30(%R11),%R9 |
0x44e018 MOV %R13,0x78(%RSP) |
0x44e01d IMUL %RAX,%RCX |
0x44e021 MOV 0x38(%R11),%RDI |
0x44e025 IMUL %R8,%RAX |
0x44e029 LEA (%R14,%RCX,1),%R13 |
0x44e02d LEA (%R15,%RAX,1),%R8 |
0x44e031 MOV %R12D,%EAX |
0x44e034 MOV %R13,0x70(%RSP) |
0x44e039 SUB %EBX,%EAX |
0x44e03b MOV %EAX,0x64(%RSP) |
0x44e03f INC %EAX |
0x44e041 MOV %EAX,%R14D |
0x44e044 MOV %EAX,%ECX |
0x44e046 SHR $0x3,%R14D |
0x44e04a AND $-0x8,%ECX |
0x44e04d MOV %R14D,%R15D |
0x44e050 LEA (%RCX,%RBX,1),%R13D |
0x44e054 MOV %ECX,0x54(%RSP) |
0x44e058 SAL $0x6,%R15 |
0x44e05c CMP %R12D,%EBX |
0x44e05f MOV %R13D,0x50(%RSP) |
0x44e064 CMOVLE 0x18(%RSP),%EBX |
0x44e069 AND $0x7,%EAX |
0x44e06c MOV %R15,0x68(%RSP) |
0x44e071 XOR %ECX,%ECX |
0x44e073 MOV %EBX,0x20(%RSP) |
0x44e077 MOV %EAX,0x58(%RSP) |
0x44e07b MOV %R11,0x8(%RSP) |
0x44e080 MOV 0x10(%RSP),%R11D |
(254) 0x44e085 MOV 0x60(%RSP),%R12D |
(254) 0x44e08a CMP %R12D,0x24(%RSP) |
(254) 0x44e08f JG 44e524 |
(254) 0x44e095 CMPL $0x6,0x64(%RSP) |
(254) 0x44e09a JBE 44e510 |
(254) 0x44e0a0 MOV 0x78(%RSP),%R13 |
(254) 0x44e0a5 MOV 0x68(%RSP),%R11 |
(254) 0x44e0aa LEA (%RDX,%RSI,8),%R15 |
(254) 0x44e0ae LEA (%RDI,%R8,8),%RBX |
(254) 0x44e0b2 MOV 0x70(%RSP),%R14 |
(254) 0x44e0b7 XOR %EAX,%EAX |
(254) 0x44e0b9 LEA (%R10,%R13,8),%RCX |
(254) 0x44e0bd LEA -0x40(%R11),%R13 |
(254) 0x44e0c1 SHR $0x6,%R13 |
(254) 0x44e0c5 LEA (%R9,%R14,8),%R12 |
(254) 0x44e0c9 INC %R13 |
(254) 0x44e0cc AND $0x3,%R13D |
(254) 0x44e0d0 JE 44e1cf |
(254) 0x44e0d6 CMP $0x1,%R13 |
(254) 0x44e0da JE 44e179 |
(254) 0x44e0e0 CMP $0x2,%R13 |
(254) 0x44e0e4 JE 44e12e |
(254) 0x44e0e6 VMOVUPD (%R15),%ZMM1 |
(254) 0x44e0ec MOV $0x40,%EAX |
(254) 0x44e0f1 VMULPD (%RCX),%ZMM1,%ZMM0 |
(254) 0x44e0f7 VDIVPD %ZMM1,%ZMM4,%ZMM11 |
(254) 0x44e0fd VMULPD %ZMM11,%ZMM11,%ZMM14 |
(254) 0x44e103 VMULPD %ZMM3,%ZMM0,%ZMM12 |
(254) 0x44e109 VMOVUPD %ZMM12,(%R12) |
(254) 0x44e110 VMULPD (%R15),%ZMM2,%ZMM13 |
(254) 0x44e116 VMULPD %ZMM14,%ZMM13,%ZMM15 |
(254) 0x44e11c VMULPD %ZMM12,%ZMM15,%ZMM1 |
(254) 0x44e122 VSQRTPD %ZMM1,%ZMM11 |
(254) 0x44e128 VMOVUPD %ZMM11,(%RBX) |
(254) 0x44e12e VMOVUPD (%R15,%RAX,1),%ZMM0 |
(254) 0x44e135 VMULPD (%RCX,%RAX,1),%ZMM0,%ZMM13 |
(254) 0x44e13c VDIVPD %ZMM0,%ZMM4,%ZMM12 |
(254) 0x44e142 VMULPD %ZMM12,%ZMM12,%ZMM1 |
(254) 0x44e148 VMULPD %ZMM3,%ZMM13,%ZMM14 |
(254) 0x44e14e VMOVUPD %ZMM14,(%R12,%RAX,1) |
(254) 0x44e155 VMULPD (%R15,%RAX,1),%ZMM2,%ZMM15 |
(254) 0x44e15c VMULPD %ZMM1,%ZMM15,%ZMM11 |
(254) 0x44e162 VMULPD %ZMM14,%ZMM11,%ZMM0 |
(254) 0x44e168 VSQRTPD %ZMM0,%ZMM12 |
(254) 0x44e16e VMOVUPD %ZMM12,(%RBX,%RAX,1) |
(254) 0x44e175 ADD $0x40,%RAX |
(254) 0x44e179 VMOVUPD (%R15,%RAX,1),%ZMM13 |
(254) 0x44e180 VMULPD (%RCX,%RAX,1),%ZMM13,%ZMM15 |
(254) 0x44e187 VDIVPD %ZMM13,%ZMM4,%ZMM14 |
(254) 0x44e18d VMULPD %ZMM14,%ZMM14,%ZMM11 |
(254) 0x44e193 VMULPD %ZMM3,%ZMM15,%ZMM1 |
(254) 0x44e199 VMOVUPD %ZMM1,(%R12,%RAX,1) |
(254) 0x44e1a0 VMULPD (%R15,%RAX,1),%ZMM2,%ZMM0 |
(254) 0x44e1a7 VMULPD %ZMM11,%ZMM0,%ZMM12 |
(254) 0x44e1ad VMULPD %ZMM1,%ZMM12,%ZMM13 |
(254) 0x44e1b3 VSQRTPD %ZMM13,%ZMM14 |
(254) 0x44e1b9 VMOVUPD %ZMM14,(%RBX,%RAX,1) |
(254) 0x44e1c0 ADD $0x40,%RAX |
(254) 0x44e1c4 CMP %RAX,0x68(%RSP) |
(254) 0x44e1c9 JE 44e30b |
(256) 0x44e1cf VMOVUPD (%R15,%RAX,1),%ZMM15 |
(256) 0x44e1d6 VMULPD (%RCX,%RAX,1),%ZMM15,%ZMM1 |
(256) 0x44e1dd VDIVPD %ZMM15,%ZMM4,%ZMM11 |
(256) 0x44e1e3 VMULPD %ZMM11,%ZMM11,%ZMM13 |
(256) 0x44e1e9 VMULPD %ZMM3,%ZMM1,%ZMM12 |
(256) 0x44e1ef VMOVUPD %ZMM12,(%R12,%RAX,1) |
(256) 0x44e1f6 VMULPD (%R15,%RAX,1),%ZMM2,%ZMM0 |
(256) 0x44e1fd VMULPD %ZMM13,%ZMM0,%ZMM14 |
(256) 0x44e203 VMULPD %ZMM12,%ZMM14,%ZMM15 |
(256) 0x44e209 VSQRTPD %ZMM15,%ZMM11 |
(256) 0x44e20f VMOVUPD %ZMM11,(%RBX,%RAX,1) |
(256) 0x44e216 VMOVUPD 0x40(%R15,%RAX,1),%ZMM1 |
(256) 0x44e21e VMULPD 0x40(%RCX,%RAX,1),%ZMM1,%ZMM0 |
(256) 0x44e226 VDIVPD %ZMM1,%ZMM4,%ZMM12 |
(256) 0x44e22c VMULPD %ZMM12,%ZMM12,%ZMM15 |
(256) 0x44e232 VMULPD %ZMM3,%ZMM0,%ZMM13 |
(256) 0x44e238 VMOVUPD %ZMM13,0x40(%R12,%RAX,1) |
(256) 0x44e240 VMULPD 0x40(%R15,%RAX,1),%ZMM2,%ZMM14 |
(256) 0x44e248 VMULPD %ZMM15,%ZMM14,%ZMM11 |
(256) 0x44e24e VMULPD %ZMM13,%ZMM11,%ZMM1 |
(256) 0x44e254 VSQRTPD %ZMM1,%ZMM12 |
(256) 0x44e25a VMOVUPD %ZMM12,0x40(%RBX,%RAX,1) |
(256) 0x44e262 VMOVUPD 0x80(%R15,%RAX,1),%ZMM0 |
(256) 0x44e26a VMULPD 0x80(%RCX,%RAX,1),%ZMM0,%ZMM14 |
(256) 0x44e272 VDIVPD %ZMM0,%ZMM4,%ZMM13 |
(256) 0x44e278 VMULPD %ZMM13,%ZMM13,%ZMM11 |
(256) 0x44e27e VMULPD %ZMM3,%ZMM14,%ZMM15 |
(256) 0x44e284 VMOVUPD %ZMM15,0x80(%R12,%RAX,1) |
(256) 0x44e28c VMULPD 0x80(%R15,%RAX,1),%ZMM2,%ZMM1 |
(256) 0x44e294 VMULPD %ZMM11,%ZMM1,%ZMM12 |
(256) 0x44e29a VMULPD %ZMM15,%ZMM12,%ZMM0 |
(256) 0x44e2a0 VSQRTPD %ZMM0,%ZMM13 |
(256) 0x44e2a6 VMOVUPD %ZMM13,0x80(%RBX,%RAX,1) |
(256) 0x44e2ae VMOVUPD 0xc0(%R15,%RAX,1),%ZMM14 |
(256) 0x44e2b6 VMULPD 0xc0(%RCX,%RAX,1),%ZMM14,%ZMM1 |
(256) 0x44e2be VDIVPD %ZMM14,%ZMM4,%ZMM15 |
(256) 0x44e2c4 VMULPD %ZMM15,%ZMM15,%ZMM11 |
(256) 0x44e2ca VMULPD %ZMM3,%ZMM1,%ZMM12 |
(256) 0x44e2d0 VMOVUPD %ZMM12,0xc0(%R12,%RAX,1) |
(256) 0x44e2d8 VMULPD 0xc0(%R15,%RAX,1),%ZMM2,%ZMM0 |
(256) 0x44e2e0 VMULPD %ZMM11,%ZMM0,%ZMM13 |
(256) 0x44e2e6 VMULPD %ZMM12,%ZMM13,%ZMM14 |
(256) 0x44e2ec VSQRTPD %ZMM14,%ZMM15 |
(256) 0x44e2f2 VMOVUPD %ZMM15,0xc0(%RBX,%RAX,1) |
(256) 0x44e2fa ADD $0x100,%RAX |
(256) 0x44e300 CMP %RAX,0x68(%RSP) |
(256) 0x44e305 JNE 44e1cf |
(254) 0x44e30b MOV 0x58(%RSP),%R15D |
(254) 0x44e310 TEST %R15D,%R15D |
(254) 0x44e313 JE 44e4ac |
(254) 0x44e319 MOV 0x54(%RSP),%ECX |
(254) 0x44e31d MOV 0x50(%RSP),%EAX |
(254) 0x44e321 MOV 0x64(%RSP),%R14D |
(254) 0x44e326 SUB %ECX,%R14D |
(254) 0x44e329 LEA 0x1(%R14),%R11D |
(254) 0x44e32d CMP $0x2,%R14D |
(254) 0x44e331 JBE 44e398 |
(254) 0x44e333 LEA (%RSI,%RCX,1),%R12 |
(254) 0x44e337 MOV 0x78(%RSP),%R13 |
(254) 0x44e33c MOV 0x70(%RSP),%R14 |
(254) 0x44e341 LEA (%RDX,%R12,8),%RBX |
(254) 0x44e345 LEA (%RCX,%R8,1),%R12 |
(254) 0x44e349 VMOVUPD (%RBX),%YMM1 |
(254) 0x44e34d LEA (%R13,%RCX,1),%R15 |
(254) 0x44e352 ADD %R14,%RCX |
(254) 0x44e355 VDIVPD %YMM1,%YMM10,%YMM12 |
(254) 0x44e359 VMULPD (%R10,%R15,8),%YMM1,%YMM0 |
(254) 0x44e35f VMULPD %YMM9,%YMM0,%YMM13 |
(254) 0x44e364 VMOVUPD %YMM13,(%R9,%RCX,8) |
(254) 0x44e36a VMULPD (%RBX),%YMM8,%YMM14 |
(254) 0x44e36e VMULPD %YMM12,%YMM12,%YMM11 |
(254) 0x44e373 VMULPD %YMM11,%YMM14,%YMM15 |
(254) 0x44e378 VMULPD %YMM13,%YMM15,%YMM1 |
(254) 0x44e37d VSQRTPD %YMM1,%YMM12 |
(254) 0x44e381 VMOVUPD %YMM12,(%RDI,%R12,8) |
(254) 0x44e387 TEST $0x3,%R11B |
(254) 0x44e38b JE 44e4ac |
(254) 0x44e391 AND $-0x4,%R11D |
(254) 0x44e395 ADD %R11D,%EAX |
(254) 0x44e398 MOV 0x28(%RSP),%RCX |
(254) 0x44e39d MOV 0x78(%RSP),%R13 |
(254) 0x44e3a2 MOV %RSI,%R11 |
(254) 0x44e3a5 MOV %R8,%RBX |
(254) 0x44e3a8 MOV 0x70(%RSP),%R12 |
(254) 0x44e3ad SUB %RCX,%R11 |
(254) 0x44e3b0 SUB %RCX,%R13 |
(254) 0x44e3b3 SUB %RCX,%RBX |
(254) 0x44e3b6 SUB %RCX,%R12 |
(254) 0x44e3b9 MOVSXD %EAX,%RCX |
(254) 0x44e3bc LEA (%R11,%RCX,1),%R14 |
(254) 0x44e3c0 LEA (%RCX,%R13,1),%R15 |
(254) 0x44e3c4 VMOVSD (%RDX,%R14,8),%XMM0 |
(254) 0x44e3ca VDIVSD %XMM0,%XMM7,%XMM13 |
(254) 0x44e3ce VMULSD (%R10,%R15,8),%XMM0,%XMM14 |
(254) 0x44e3d4 LEA (%RCX,%R12,1),%R15 |
(254) 0x44e3d8 ADD %RBX,%RCX |
(254) 0x44e3db VMULSD %XMM6,%XMM14,%XMM11 |
(254) 0x44e3df VMOVSD %XMM11,(%R9,%R15,8) |
(254) 0x44e3e5 VMULSD (%RDX,%R14,8),%XMM5,%XMM15 |
(254) 0x44e3eb VMULSD %XMM11,%XMM15,%XMM1 |
(254) 0x44e3f0 VMULSD %XMM13,%XMM13,%XMM12 |
(254) 0x44e3f5 VMULSD %XMM12,%XMM1,%XMM0 |
(254) 0x44e3fa VSQRTSD %XMM0,%XMM0,%XMM0 |
(254) 0x44e3fe VMOVSD %XMM0,(%RDI,%RCX,8) |
(254) 0x44e403 LEA 0x1(%RAX),%ECX |
(254) 0x44e406 CMP %ECX,0x60(%RSP) |
(254) 0x44e40a JL 44e4ac |
(254) 0x44e410 MOVSXD %ECX,%RCX |
(254) 0x44e413 ADD $0x2,%EAX |
(254) 0x44e416 LEA (%R11,%RCX,1),%R14 |
(254) 0x44e41a LEA (%R13,%RCX,1),%R15 |
(254) 0x44e41f VMOVSD (%RDX,%R14,8),%XMM13 |
(254) 0x44e425 VDIVSD %XMM13,%XMM7,%XMM14 |
(254) 0x44e42a VMULSD (%R10,%R15,8),%XMM13,%XMM11 |
(254) 0x44e430 LEA (%R12,%RCX,1),%R15 |
(254) 0x44e434 ADD %RBX,%RCX |
(254) 0x44e437 VMULSD %XMM6,%XMM11,%XMM15 |
(254) 0x44e43b VMOVSD %XMM15,(%R9,%R15,8) |
(254) 0x44e441 VMULSD (%RDX,%R14,8),%XMM5,%XMM1 |
(254) 0x44e447 VMULSD %XMM15,%XMM1,%XMM12 |
(254) 0x44e44c VMULSD %XMM14,%XMM14,%XMM0 |
(254) 0x44e451 VMULSD %XMM0,%XMM12,%XMM13 |
(254) 0x44e455 VSQRTSD %XMM13,%XMM13,%XMM13 |
(254) 0x44e45a VMOVSD %XMM13,(%RDI,%RCX,8) |
(254) 0x44e45f CMP %EAX,0x60(%RSP) |
(254) 0x44e463 JL 44e4ac |
(254) 0x44e465 CLTQ |
(254) 0x44e467 ADD %RAX,%R11 |
(254) 0x44e46a ADD %RAX,%R13 |
(254) 0x44e46d ADD %RAX,%R12 |
(254) 0x44e470 ADD %RAX,%RBX |
(254) 0x44e473 VMOVSD (%RDX,%R11,8),%XMM14 |
(254) 0x44e479 VDIVSD %XMM14,%XMM7,%XMM11 |
(254) 0x44e47e VMULSD (%R10,%R13,8),%XMM14,%XMM15 |
(254) 0x44e484 VMULSD %XMM6,%XMM15,%XMM1 |
(254) 0x44e488 VMOVSD %XMM1,(%R9,%R12,8) |
(254) 0x44e48e VMULSD (%RDX,%R11,8),%XMM5,%XMM12 |
(254) 0x44e494 VMULSD %XMM1,%XMM12,%XMM0 |
(254) 0x44e498 VMULSD %XMM11,%XMM11,%XMM13 |
(254) 0x44e49d VMULSD %XMM13,%XMM0,%XMM14 |
(254) 0x44e4a2 VSQRTSD %XMM14,%XMM14,%XMM14 |
(254) 0x44e4a7 VMOVSD %XMM14,(%RDI,%RBX,8) |
(254) 0x44e4ac INCL 0x5c(%RSP) |
(254) 0x44e4b0 MOV 0x30(%RSP),%R11 |
(254) 0x44e4b5 MOV $0x1,%ECX |
(254) 0x44e4ba MOV 0x38(%RSP),%R13 |
(254) 0x44e4bf MOV 0x40(%RSP),%R12 |
(254) 0x44e4c4 MOV 0x48(%RSP),%RBX |
(254) 0x44e4c9 ADD %R11,%RSI |
(254) 0x44e4cc ADD %R13,0x78(%RSP) |
(254) 0x44e4d1 MOV 0x5c(%RSP),%EAX |
(254) 0x44e4d5 ADD %R12,0x70(%RSP) |
(254) 0x44e4da ADD %RBX,%R8 |
(254) 0x44e4dd CMP %EAX,0x1c(%RSP) |
(254) 0x44e4e1 JLE 44e4ed |
(254) 0x44e4e3 MOV 0x20(%RSP),%R11D |
(254) 0x44e4e8 JMP 44e085 |
0x44e4ed MOV 0x8(%RSP),%RSI |
0x44e4f2 MOV 0x20(%RSP),%R9D |
0x44e4f7 MOV %R9D,0x80(%RSI) |
0x44e4fe VZEROUPPER |
0x44e501 LEA -0x28(%RBP),%RSP |
0x44e505 POP %RBX |
0x44e506 POP %R12 |
0x44e508 POP %R13 |
0x44e50a POP %R14 |
0x44e50c POP %R15 |
0x44e50e POP %RBP |
0x44e50f RET |
(254) 0x44e510 MOV 0x24(%RSP),%EAX |
(254) 0x44e514 XOR %ECX,%ECX |
(254) 0x44e516 JMP 44e321 |
0x44e51b INC %EAX |
0x44e51d XOR %EDX,%EDX |
0x44e51f JMP 44df54 |
(254) 0x44e524 MOV 0x5c(%RSP),%EAX |
(254) 0x44e528 MOV 0x1c(%RSP),%EBX |
(254) 0x44e52c MOV 0x20(%RSP),%R14D |
(254) 0x44e531 NOT %EAX |
(254) 0x44e533 ADD %EBX,%EAX |
(254) 0x44e535 AND $0x7,%EAX |
(254) 0x44e538 CMP %R14D,0x18(%RSP) |
(254) 0x44e53d JE 44e4ac |
(254) 0x44e543 MOV 0x38(%RSP),%R15 |
(254) 0x44e548 MOV 0x40(%RSP),%R12 |
(254) 0x44e54d INCL 0x5c(%RSP) |
(254) 0x44e551 MOV 0x30(%RSP),%R13 |
(254) 0x44e556 ADD %R15,0x78(%RSP) |
(254) 0x44e55b ADD %R12,0x70(%RSP) |
(254) 0x44e560 MOV 0x48(%RSP),%R12 |
(254) 0x44e565 ADD %R13,%RSI |
(254) 0x44e568 MOV 0x5c(%RSP),%EBX |
(254) 0x44e56c ADD %R12,%R8 |
(254) 0x44e56f MOV 0x78(%RSP),%R14 |
(254) 0x44e574 MOV 0x70(%RSP),%R15 |
(254) 0x44e579 CMP %EBX,0x1c(%RSP) |
(254) 0x44e57d JLE 44e7b2 |
(254) 0x44e583 TEST %EAX,%EAX |
(254) 0x44e585 JE 44e7d2 |
(254) 0x44e58b CMP $0x1,%EAX |
(254) 0x44e58e JE 44e706 |
(254) 0x44e594 CMP $0x2,%EAX |
(254) 0x44e597 JE 44e6d0 |
(254) 0x44e59d CMP $0x3,%EAX |
(254) 0x44e5a0 JE 44e69a |
(254) 0x44e5a6 CMP $0x4,%EAX |
(254) 0x44e5a9 JE 44e662 |
(254) 0x44e5af CMP $0x5,%EAX |
(254) 0x44e5b2 JE 44e62a |
(254) 0x44e5b4 CMP $0x6,%EAX |
(254) 0x44e5b7 JE 44e5f2 |
(254) 0x44e5b9 MOV 0x20(%RSP),%EAX |
(254) 0x44e5bd CMP %EAX,0x18(%RSP) |
(254) 0x44e5c1 JE 44e4ac |
(254) 0x44e5c7 INC %EBX |
(254) 0x44e5c9 ADD %R13,%RSI |
(254) 0x44e5cc MOV 0x40(%RSP),%R13 |
(254) 0x44e5d1 MOV %EBX,0x5c(%RSP) |
(254) 0x44e5d5 MOV 0x38(%RSP),%RBX |
(254) 0x44e5da ADD %R13,%R15 |
(254) 0x44e5dd ADD %RBX,%R14 |
(254) 0x44e5e0 MOV %R15,0x70(%RSP) |
(254) 0x44e5e5 MOV %R14,0x78(%RSP) |
(254) 0x44e5ea MOV 0x48(%RSP),%R14 |
(254) 0x44e5ef ADD %R14,%R8 |
(254) 0x44e5f2 MOV 0x20(%RSP),%R15D |
(254) 0x44e5f7 CMP %R15D,0x18(%RSP) |
(254) 0x44e5fc JE 44e4ac |
(254) 0x44e602 MOV 0x38(%RSP),%RAX |
(254) 0x44e607 MOV 0x40(%RSP),%RBX |
(254) 0x44e60c INCL 0x5c(%RSP) |
(254) 0x44e610 MOV 0x30(%RSP),%R12 |
(254) 0x44e615 ADD %RAX,0x78(%RSP) |
(254) 0x44e61a MOV 0x48(%RSP),%R13 |
(254) 0x44e61f ADD %RBX,0x70(%RSP) |
(254) 0x44e624 ADD %R12,%RSI |
(254) 0x44e627 ADD %R13,%R8 |
(254) 0x44e62a MOV 0x20(%RSP),%R14D |
(254) 0x44e62f CMP %R14D,0x18(%RSP) |
(254) 0x44e634 JE 44e4ac |
(254) 0x44e63a MOV 0x38(%RSP),%R12 |
(254) 0x44e63f MOV 0x40(%RSP),%RAX |
(254) 0x44e644 INCL 0x5c(%RSP) |
(254) 0x44e648 MOV 0x30(%RSP),%R15 |
(254) 0x44e64d ADD %R12,0x78(%RSP) |
(254) 0x44e652 MOV 0x48(%RSP),%RBX |
(254) 0x44e657 ADD %RAX,0x70(%RSP) |
(254) 0x44e65c ADD %R15,%RSI |
(254) 0x44e65f ADD %RBX,%R8 |
(254) 0x44e662 MOV 0x20(%RSP),%R13D |
(254) 0x44e667 CMP %R13D,0x18(%RSP) |
(254) 0x44e66c JE 44e4ac |
(254) 0x44e672 MOV 0x38(%RSP),%R15 |
(254) 0x44e677 MOV 0x40(%RSP),%R12 |
(254) 0x44e67c INCL 0x5c(%RSP) |
(254) 0x44e680 MOV 0x30(%RSP),%R14 |
(254) 0x44e685 ADD %R15,0x78(%RSP) |
(254) 0x44e68a MOV 0x48(%RSP),%RAX |
(254) 0x44e68f ADD %R12,0x70(%RSP) |
(254) 0x44e694 ADD %R14,%RSI |
(254) 0x44e697 ADD %RAX,%R8 |
(254) 0x44e69a MOV 0x20(%RSP),%EBX |
(254) 0x44e69e CMP %EBX,0x18(%RSP) |
(254) 0x44e6a2 JE 44e4ac |
(254) 0x44e6a8 MOV 0x38(%RSP),%R14 |
(254) 0x44e6ad MOV 0x40(%RSP),%R15 |
(254) 0x44e6b2 INCL 0x5c(%RSP) |
(254) 0x44e6b6 MOV 0x30(%RSP),%R13 |
(254) 0x44e6bb ADD %R14,0x78(%RSP) |
(254) 0x44e6c0 MOV 0x48(%RSP),%R12 |
(254) 0x44e6c5 ADD %R15,0x70(%RSP) |
(254) 0x44e6ca ADD %R13,%RSI |
(254) 0x44e6cd ADD %R12,%R8 |
(254) 0x44e6d0 MOV 0x20(%RSP),%EAX |
(254) 0x44e6d4 CMP %EAX,0x18(%RSP) |
(254) 0x44e6d8 JE 44e4ac |
(254) 0x44e6de MOV 0x38(%RSP),%R13 |
(254) 0x44e6e3 MOV 0x40(%RSP),%R14 |
(254) 0x44e6e8 INCL 0x5c(%RSP) |
(254) 0x44e6ec MOV 0x30(%RSP),%RBX |
(254) 0x44e6f1 ADD %R13,0x78(%RSP) |
(254) 0x44e6f6 MOV 0x48(%RSP),%R15 |
(254) 0x44e6fb ADD %R14,0x70(%RSP) |
(254) 0x44e700 ADD %RBX,%RSI |
(254) 0x44e703 ADD %R15,%R8 |
(254) 0x44e706 MOV 0x20(%RSP),%R12D |
(254) 0x44e70b CMP %R12D,0x18(%RSP) |
(254) 0x44e710 JE 44e4ac |
(254) 0x44e716 INCL 0x5c(%RSP) |
(254) 0x44e71a MOV 0x30(%RSP),%RBX |
(254) 0x44e71f MOV 0x38(%RSP),%R13 |
(254) 0x44e724 MOV 0x40(%RSP),%R14 |
(254) 0x44e729 MOV 0x48(%RSP),%R15 |
(254) 0x44e72e ADD %RBX,%RSI |
(254) 0x44e731 ADD %R13,0x78(%RSP) |
(254) 0x44e736 MOV 0x5c(%RSP),%EAX |
(254) 0x44e73a ADD %R14,0x70(%RSP) |
(254) 0x44e73f ADD %R15,%R8 |
(254) 0x44e742 CMP %EAX,0x1c(%RSP) |
(254) 0x44e746 JLE 44e7b2 |
(254) 0x44e748 MOV %R11D,0x5c(%RSP) |
(254) 0x44e74d MOV %R15,%R12 |
(254) 0x44e750 MOV %R14,%R13 |
(254) 0x44e753 MOV 0x30(%RSP),%R15 |
(254) 0x44e758 MOV 0x38(%RSP),%R14 |
(254) 0x44e75d MOV 0x78(%RSP),%R11 |
(254) 0x44e762 MOV 0x70(%RSP),%RBX |
(254) 0x44e767 MOV %RDI,0x10(%RSP) |
(254) 0x44e76c MOV %RDX,%RDI |
(254) 0x44e76f MOV 0x20(%RSP),%EDX |
(255) 0x44e773 CMP %EDX,0x18(%RSP) |
(255) 0x44e777 JE 44e7eb |
(255) 0x44e779 ADD $0x8,%EAX |
(255) 0x44e77c LEA (%RSI,%R15,8),%RSI |
(255) 0x44e780 LEA (%R11,%R14,8),%R11 |
(255) 0x44e784 LEA (%RBX,%R13,8),%RBX |
(255) 0x44e788 LEA (%R8,%R12,8),%R8 |
(255) 0x44e78c CMP %EAX,0x1c(%RSP) |
(255) 0x44e790 JG 44e773 |
0x44e792 MOV 0x5c(%RSP),%R12D |
0x44e797 MOV 0x8(%RSP),%RSI |
0x44e79c MOV %R12D,0x10(%RSP) |
0x44e7a1 TEST %CL,%CL |
0x44e7a3 JE 44e7c0 |
0x44e7a5 MOV 0x10(%RSP),%ECX |
0x44e7a9 MOV %ECX,0x20(%RSP) |
0x44e7ad JMP 44e4f2 |
0x44e7b2 MOV %R11D,0x10(%RSP) |
0x44e7b7 MOV 0x8(%RSP),%RSI |
0x44e7bc JMP 44e7a1 |
0x44e7be XCHG %AX,%AX |
0x44e7c0 VZEROUPPER |
0x44e7c3 LEA -0x28(%RBP),%RSP |
0x44e7c7 POP %RBX |
0x44e7c8 POP %R12 |
0x44e7ca POP %R13 |
0x44e7cc POP %R14 |
0x44e7ce POP %R15 |
0x44e7d0 POP %RBP |
0x44e7d1 RET |
(254) 0x44e7d2 MOV %R13,%R15 |
(254) 0x44e7d5 MOV %R11D,0x5c(%RSP) |
(254) 0x44e7da MOV 0x40(%RSP),%R13 |
(254) 0x44e7df MOV %EBX,%EAX |
(254) 0x44e7e1 MOV 0x38(%RSP),%R14 |
(254) 0x44e7e6 JMP 44e75d |
(254) 0x44e7eb MOV %RDI,%RDX |
(254) 0x44e7ee MOV %EAX,0x5c(%RSP) |
(254) 0x44e7f2 MOV 0x10(%RSP),%RDI |
(254) 0x44e7f7 MOV %R11,0x78(%RSP) |
(254) 0x44e7fc MOV %RBX,0x70(%RSP) |
(254) 0x44e801 JMP 44e4ac |
0x44e806 NOPW %CS:(%RAX,%RAX,1) |
Path / |
Source file and lines | ideal_gas_kernel.f90:45-55 |
Module | exec |
nb instructions | 150 |
nb uops | 157 |
loop length | 555 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 3 |
used zmm registers | 3 |
nb stack references | 21 |
micro-operation queue | 26.17 cycles |
front end | 26.17 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 9.50 | 9.40 | 17.67 | 17.67 | 16.50 | 9.40 | 9.30 | 16.50 | 16.50 | 16.50 | 9.40 | 17.67 |
cycles | 9.50 | 12.93 | 17.67 | 17.67 | 16.50 | 9.40 | 9.30 | 16.50 | 16.50 | 16.50 | 9.40 | 17.67 |
Cycles executing div or sqrt instructions | 6.00 |
FE+BE cycles | 25.55-25.56 |
Stall cycles | 0.00 |
Front-end | 26.17 |
Dispatch | 17.67 |
DIV/SQRT | 6.00 |
Overall L1 | 26.17 |
Vectorization ratio - INT |
all | 4% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 22% |
Vectorization ratio - FP |
all | 0% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
Vectorization ratio - INT+FP |
all | 4% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 14% |
Vector efficiency ratio - INT |
all | 9% |
load | 10% |
store | 9% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 10% |
Vector efficiency ratio - FP |
all | 12% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Vector efficiency ratio - INT+FP |
all | 10% |
load | 10% |
store | 9% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 6% |
other | 11% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x40,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
ADD $-0x80,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x68(%RDI),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x50(%RDI),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDI,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RDI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x70(%RDI),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x60(%RDI),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RDI),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x78(%RDI),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x58(%RDI),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RSI,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x48(%RDI),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%R8),%EBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 402080 <@plt_start@+0x60> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %EAX,%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 402180 <@plt_start@+0x160> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x78(%RSP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %EAX,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x18(%R11),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDI),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
INC %EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SUB %EBX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CLTD | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %R12D | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
CMP %EDX,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 44e51b <__ideal_gas_kernel_module_MOD_ideal_gas_kernel._omp_fn.0+0x64b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
IMUL %EAX,%ESI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %EDX,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %ESI,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMP %EAX,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 44e501 <__ideal_gas_kernel_module_MOD_ideal_gas_kernel._omp_fn.0+0x631> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x8(%R11),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %EBX,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %EBX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV (%R11),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x5e7a2(%RIP),%XMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x5ec82(%RIP),%XMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %ESI,0x5c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%R10),%ECX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVSXD (%R9),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %EAX,0x1c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVSXD %ESI,%RAX | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
MOV 0x30(%RSP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x5ec6c(%RIP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD %XMM7,%YMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM6,%YMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %ECX,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x1(%RCX),%R12D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV 0x38(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %R8,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
IMUL %RAX,%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %R8,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R8D,0x24(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R15,%R8,1),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
IMUL %RAX,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R8,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%R11),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD %XMM5,%YMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R12D,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x60(%RSP),%R12D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD %XMM7,%ZMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM6,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %R14,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x70(%RSP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x24(%RSP),%EBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD %XMM5,%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RCX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x40(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x28(%R11),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %R8,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x48(%RSP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%R11),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
IMUL %RAX,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0x38(%R11),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
IMUL %R8,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%R14,%RCX,1),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R15,%RAX,1),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R12D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R13,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %EBX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %EAX,0x64(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
INC %EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %EAX,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %EAX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x3,%R14D | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
AND $-0x8,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %R14D,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA (%RCX,%RBX,1),%R13D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %ECX,0x54(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SAL $0x6,%R15 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
CMP %R12D,%EBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R13D,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMOVLE 0x18(%RSP),%EBX | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.50 |
AND $0x7,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %R15,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %EBX,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %EAX,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,0x8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RSP),%R11D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RSP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RSP),%R9D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9D,0x80(%RSI) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
INC %EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 44df54 <__ideal_gas_kernel_module_MOD_ideal_gas_kernel._omp_fn.0+0x84> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV 0x5c(%RSP),%R12D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RSP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12D,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %CL,%CL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 44e7c0 <__ideal_gas_kernel_module_MOD_ideal_gas_kernel._omp_fn.0+0x8f0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x10(%RSP),%ECX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %ECX,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 44e4f2 <__ideal_gas_kernel_module_MOD_ideal_gas_kernel._omp_fn.0+0x622> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R11D,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x8(%RSP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 44e7a1 <__ideal_gas_kernel_module_MOD_ideal_gas_kernel._omp_fn.0+0x8d1> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | ideal_gas_kernel.f90:45-55 |
Module | exec |
nb instructions | 150 |
nb uops | 157 |
loop length | 555 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 3 |
used zmm registers | 3 |
nb stack references | 21 |
micro-operation queue | 26.17 cycles |
front end | 26.17 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 9.50 | 9.40 | 17.67 | 17.67 | 16.50 | 9.40 | 9.30 | 16.50 | 16.50 | 16.50 | 9.40 | 17.67 |
cycles | 9.50 | 12.93 | 17.67 | 17.67 | 16.50 | 9.40 | 9.30 | 16.50 | 16.50 | 16.50 | 9.40 | 17.67 |
Cycles executing div or sqrt instructions | 6.00 |
FE+BE cycles | 25.55-25.56 |
Stall cycles | 0.00 |
Front-end | 26.17 |
Dispatch | 17.67 |
DIV/SQRT | 6.00 |
Overall L1 | 26.17 |
all | 4% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 22% |
all | 0% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 4% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 14% |
all | 9% |
load | 10% |
store | 9% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 10% |
all | 12% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 10% |
load | 10% |
store | 9% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 6% |
other | 11% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x40,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
ADD $-0x80,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x68(%RDI),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x50(%RDI),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDI,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RDI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x70(%RDI),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x60(%RDI),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RDI),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x78(%RDI),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x58(%RDI),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RSI,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x48(%RDI),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%R8),%EBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 402080 <@plt_start@+0x60> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %EAX,%R12D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 402180 <@plt_start@+0x160> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x78(%RSP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %EAX,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x18(%R11),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDI),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
INC %EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SUB %EBX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CLTD | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %R12D | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
CMP %EDX,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 44e51b <__ideal_gas_kernel_module_MOD_ideal_gas_kernel._omp_fn.0+0x64b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
IMUL %EAX,%ESI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %EDX,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %ESI,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMP %EAX,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 44e501 <__ideal_gas_kernel_module_MOD_ideal_gas_kernel._omp_fn.0+0x631> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x8(%R11),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %EBX,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %EBX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV (%R11),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x5e7a2(%RIP),%XMM7 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x5ec82(%RIP),%XMM6 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %ESI,0x5c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%R10),%ECX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVSXD (%R9),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %EAX,0x1c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVSXD %ESI,%RAX | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
MOV 0x30(%RSP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x5ec6c(%RIP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD %XMM7,%YMM10 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM6,%YMM9 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %ECX,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x1(%RCX),%R12D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV 0x38(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %R8,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
IMUL %RAX,%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %R8,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R8D,0x24(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R15,%R8,1),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
IMUL %RAX,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R8,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%R11),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD %XMM5,%YMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R12D,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x60(%RSP),%R12D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD %XMM7,%ZMM4 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM6,%ZMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %R14,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x70(%RSP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x24(%RSP),%EBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD %XMM5,%ZMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RCX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x40(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x28(%R11),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %R8,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x48(%RSP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%R11),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
IMUL %RAX,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0x38(%R11),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
IMUL %R8,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%R14,%RCX,1),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R15,%RAX,1),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R12D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R13,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %EBX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %EAX,0x64(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
INC %EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %EAX,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %EAX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x3,%R14D | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
AND $-0x8,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %R14D,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA (%RCX,%RBX,1),%R13D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %ECX,0x54(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SAL $0x6,%R15 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
CMP %R12D,%EBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R13D,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMOVLE 0x18(%RSP),%EBX | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.50 |
AND $0x7,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %R15,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %EBX,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %EAX,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,0x8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RSP),%R11D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RSP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RSP),%R9D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9D,0x80(%RSI) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
INC %EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 44df54 <__ideal_gas_kernel_module_MOD_ideal_gas_kernel._omp_fn.0+0x84> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV 0x5c(%RSP),%R12D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x8(%RSP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12D,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %CL,%CL | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 44e7c0 <__ideal_gas_kernel_module_MOD_ideal_gas_kernel._omp_fn.0+0x8f0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x10(%RSP),%ECX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %ECX,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 44e4f2 <__ideal_gas_kernel_module_MOD_ideal_gas_kernel._omp_fn.0+0x622> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R11D,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x8(%RSP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 44e7a1 <__ideal_gas_kernel_module_MOD_ideal_gas_kernel._omp_fn.0+0x8d1> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼ideal_gas_kernel._omp_fn.0– | 4.87 | 3.6 |
▼Loop 254 - ideal_gas_kernel.f90:45-55 - exec– | 0 | 0 |
○Loop 256 - ideal_gas_kernel.f90:50-55 - exec | 4.86 | 3.59 |
○Loop 255 - ideal_gas_kernel.f90:46-46 - exec | 0 | 0 |