Function: __pack_kernel_module_MOD_clover_unpack_message_left._omp_fn.0.lto_priv.0 | Module: exec | Source: pack_kernel.f90:108-113 | Coverage: 0.03% |
---|
Function: __pack_kernel_module_MOD_clover_unpack_message_left._omp_fn.0.lto_priv.0 | Module: exec | Source: pack_kernel.f90:108-113 | Coverage: 0.03% |
---|
/home/eoseret/qaas_runs_CPU_9468/171-137-7698/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/pack_kernel.f90: 108 - 113 |
-------------------------------------------------------------------------------- |
108: !$OMP PARALLEL DO PRIVATE(index) |
109: DO k=y_min-depth,y_max+y_inc+depth |
110: !$OMP SIMD |
111: DO j=1,depth |
112: index= buffer_offset + j+(k+depth-1)*depth |
113: field(x_min-j,k)=left_rcv_buffer(index) |
0x42a7d0 PUSH %RBP |
0x42a7d1 MOV %RSP,%RBP |
0x42a7d4 PUSH %R15 |
0x42a7d6 PUSH %R14 |
0x42a7d8 PUSH %R13 |
0x42a7da PUSH %R12 |
0x42a7dc PUSH %RBX |
0x42a7dd SUB $0x98,%RSP |
0x42a7e4 MOV %RDI,-0x38(%RBP) |
0x42a7e8 MOV 0x28(%RDI),%RDX |
0x42a7ec MOV 0x30(%RDI),%RAX |
0x42a7f0 MOV 0x54(%RDI),%R13D |
0x42a7f4 MOV 0x48(%RDI),%R15 |
0x42a7f8 MOV 0x40(%RDI),%RBX |
0x42a7fc MOV 0x20(%RDI),%R12 |
0x42a800 MOV %RDX,-0x70(%RBP) |
0x42a804 MOV %RAX,-0x40(%RBP) |
0x42a808 CALL 402080 <@plt_start@+0x60> |
0x42a80d MOV %EAX,%R14D |
0x42a810 CALL 402180 <@plt_start@+0x160> |
0x42a815 MOV -0x38(%RBP),%RCX |
0x42a819 MOV %EAX,%ESI |
0x42a81b MOV 0x58(%RCX),%EAX |
0x42a81e INC %EAX |
0x42a820 SUB %R13D,%EAX |
0x42a823 CLTD |
0x42a824 IDIV %R14D |
0x42a827 CMP %EDX,%ESI |
0x42a829 JL 42acbc |
0x42a82f IMUL %EAX,%ESI |
0x42a832 ADD %EDX,%ESI |
0x42a834 ADD %ESI,%EAX |
0x42a836 CMP %EAX,%ESI |
0x42a838 JGE 42ac98 |
0x42a83e MOV 0x8(%RCX),%R8 |
0x42a842 LEA (%R13,%RSI,1),%EDI |
0x42a847 ADD %R13D,%EAX |
0x42a84a MOV (%RCX),%R13 |
0x42a84d KXORB %K0,%K0,%K0 |
0x42a851 MOV -0x70(%RBP),%RDX |
0x42a855 MOV 0x10(%RCX),%R9 |
0x42a859 MOV %EAX,-0x7c(%RBP) |
0x42a85c MOVSXD %EDI,%RAX |
0x42a85f MOV (%R8),%R11D |
0x42a862 MOV 0x38(%RCX),%R10 |
0x42a866 MOV %R13,-0x90(%RBP) |
0x42a86d MOV %R12,%R13 |
0x42a870 IMUL %RDX,%RAX |
0x42a874 NEG %R13 |
0x42a877 MOV %R9,-0x88(%RBP) |
0x42a87e MOV -0x40(%RBP),%R8 |
0x42a882 LEA -0x1(%R11),%ESI |
0x42a886 MOV %R10,-0x38(%RBP) |
0x42a88a LEA (,%RBX,8),%R10 |
0x42a892 MOV 0x18(%RCX),%R14 |
0x42a896 LEA (%RDI,%RSI,1),%R9D |
0x42a89a MOV %ESI,-0x94(%RBP) |
0x42a8a0 MOV %R13,%RSI |
0x42a8a3 LEA (,%R12,4),%RDX |
0x42a8ab SAL $0x5,%RSI |
0x42a8af MOV %EDI,-0x48(%RBP) |
0x42a8b2 MOV %R11D,%EDI |
0x42a8b5 ADD %RAX,%R8 |
0x42a8b8 MOV %R10,-0x78(%RBP) |
0x42a8bc LEA (,%R13,8),%R10 |
0x42a8c4 SAL $0x4,%R13 |
0x42a8c8 SHR $0x2,%EDI |
0x42a8cb MOV %RSI,-0x58(%RBP) |
0x42a8cf MOV %RBX,%RAX |
0x42a8d2 IMUL %R11D,%R9D |
0x42a8d6 MOV %R11D,%ESI |
0x42a8d9 MOV %R13,-0x60(%RBP) |
0x42a8dd MOV %R12,%R13 |
0x42a8e0 SAL $0x4,%RAX |
0x42a8e4 AND $-0x4,%ESI |
0x42a8e7 SUB %RDX,%R13 |
0x42a8ea MOV %EDI,-0x4c(%RBP) |
0x42a8ed MOV %RBX,%RDI |
0x42a8f0 SAL $0x3,%R13 |
0x42a8f4 MOV %RAX,-0xa8(%RBP) |
0x42a8fb SAL $0x5,%RDI |
0x42a8ff XOR %EAX,%EAX |
0x42a901 MOV %ESI,-0x98(%RBP) |
0x42a907 INC %ESI |
0x42a909 TEST %R11D,%R11D |
0x42a90c CMOVNS %R11D,%EAX |
0x42a910 MOV %R13,-0x68(%RBP) |
0x42a914 MOV %ESI,-0xb4(%RBP) |
0x42a91a INC %EAX |
0x42a91c MOV %RCX,-0xc0(%RBP) |
0x42a923 MOV %EAX,-0x80(%RBP) |
0x42a926 MOV %R11D,-0x44(%RBP) |
0x42a92a MOV $0x1,%R11D |
0x42a930 KMOVB %R11D,%K1 |
0x42a935 NOPL (%RAX) |
(187) 0x42a938 MOV -0x44(%RBP),%ECX |
(187) 0x42a93b TEST %ECX,%ECX |
(187) 0x42a93d JLE 42ac49 |
(187) 0x42a943 MOV -0x90(%RBP),%R13 |
(187) 0x42a94a MOV -0x88(%RBP),%RDX |
(187) 0x42a951 CMPL $0x2,-0x94(%RBP) |
(187) 0x42a958 MOV (%R13),%ESI |
(187) 0x42a95c MOV (%RDX),%EAX |
(187) 0x42a95e MOV %ESI,-0x40(%RBP) |
(187) 0x42a961 JBE 42acb0 |
(187) 0x42a967 MOVSXD %EAX,%R11 |
(187) 0x42a96a MOVSXD %R9D,%RCX |
(187) 0x42a96d MOVSXD %ESI,%RSI |
(187) 0x42a970 MOV -0x38(%RBP),%RDX |
(187) 0x42a974 LEA 0x1(%R11,%RCX,1),%R13 |
(187) 0x42a979 DEC %RSI |
(187) 0x42a97c MOV -0xa8(%RBP),%RCX |
(187) 0x42a983 IMUL %RBX,%R13 |
(187) 0x42a987 IMUL %R12,%RSI |
(187) 0x42a98b ADD %R15,%R13 |
(187) 0x42a98e LEA (%RDX,%R13,8),%R11 |
(187) 0x42a992 MOV -0x4c(%RBP),%R13D |
(187) 0x42a996 ADD %R8,%RSI |
(187) 0x42a999 LEA (%R14,%RSI,8),%RDX |
(187) 0x42a99d MOV %R11,-0xa0(%RBP) |
(187) 0x42a9a4 LEA (%R11,%RCX,1),%RCX |
(187) 0x42a9a8 XOR %ESI,%ESI |
(187) 0x42a9aa AND $0x3,%R13D |
(187) 0x42a9ae JE 42aa97 |
(187) 0x42a9b4 CMP $0x1,%R13D |
(187) 0x42a9b8 JE 42aa4d |
(187) 0x42a9be CMP $0x2,%R13D |
(187) 0x42a9c2 JE 42aa0c |
(187) 0x42a9c4 MOV -0xa0(%RBP),%RSI |
(187) 0x42a9cb VMOVSD (%RCX),%XMM1 |
(187) 0x42a9cf ADD %RDI,%R11 |
(187) 0x42a9d2 MOV -0x60(%RBP),%R13 |
(187) 0x42a9d6 VMOVSD (%RCX,%RBX,8),%XMM0 |
(187) 0x42a9db ADD %RDI,%RCX |
(187) 0x42a9de VMOVSD (%RSI),%XMM3 |
(187) 0x42a9e2 VMOVSD (%RSI,%RBX,8),%XMM2 |
(187) 0x42a9e7 MOV -0x68(%RBP),%RSI |
(187) 0x42a9eb VMOVSD %XMM3,(%RDX) |
(187) 0x42a9ef VMOVSD %XMM2,(%RDX,%R10,1) |
(187) 0x42a9f5 VMOVSD %XMM1,(%RDX,%R13,1) |
(187) 0x42a9fb MOV -0x58(%RBP),%R13 |
(187) 0x42a9ff VMOVSD %XMM0,(%RDX,%RSI,1) |
(187) 0x42aa04 MOV $0x1,%ESI |
(187) 0x42aa09 ADD %R13,%RDX |
(187) 0x42aa0c VMOVSD (%R11),%XMM4 |
(187) 0x42aa11 VMOVSD (%R11,%RBX,8),%XMM5 |
(187) 0x42aa17 INC %ESI |
(187) 0x42aa19 ADD %RDI,%R11 |
(187) 0x42aa1c VMOVSD (%RCX),%XMM6 |
(187) 0x42aa20 MOV -0x60(%RBP),%R13 |
(187) 0x42aa24 VMOVSD (%RCX,%RBX,8),%XMM7 |
(187) 0x42aa29 VMOVSD %XMM4,(%RDX) |
(187) 0x42aa2d ADD %RDI,%RCX |
(187) 0x42aa30 VMOVSD %XMM5,(%RDX,%R10,1) |
(187) 0x42aa36 VMOVSD %XMM6,(%RDX,%R13,1) |
(187) 0x42aa3c MOV -0x68(%RBP),%R13 |
(187) 0x42aa40 VMOVSD %XMM7,(%RDX,%R13,1) |
(187) 0x42aa46 MOV -0x58(%RBP),%R13 |
(187) 0x42aa4a ADD %R13,%RDX |
(187) 0x42aa4d VMOVSD (%R11),%XMM8 |
(187) 0x42aa52 VMOVSD (%R11,%RBX,8),%XMM9 |
(187) 0x42aa58 INC %ESI |
(187) 0x42aa5a ADD %RDI,%R11 |
(187) 0x42aa5d VMOVSD (%RCX),%XMM10 |
(187) 0x42aa61 MOV -0x60(%RBP),%R13 |
(187) 0x42aa65 VMOVSD (%RCX,%RBX,8),%XMM11 |
(187) 0x42aa6a VMOVSD %XMM8,(%RDX) |
(187) 0x42aa6e ADD %RDI,%RCX |
(187) 0x42aa71 VMOVSD %XMM9,(%RDX,%R10,1) |
(187) 0x42aa77 VMOVSD %XMM10,(%RDX,%R13,1) |
(187) 0x42aa7d MOV -0x68(%RBP),%R13 |
(187) 0x42aa81 VMOVSD %XMM11,(%RDX,%R13,1) |
(187) 0x42aa87 MOV -0x58(%RBP),%R13 |
(187) 0x42aa8b ADD %R13,%RDX |
(187) 0x42aa8e CMP %ESI,-0x4c(%RBP) |
(187) 0x42aa91 JE 42ab95 |
(187) 0x42aa97 MOV %EAX,-0xa0(%RBP) |
(187) 0x42aa9d MOV -0x68(%RBP),%R13 |
(187) 0x42aaa1 MOV %R8,-0xb0(%RBP) |
(187) 0x42aaa8 MOV -0x58(%RBP),%RAX |
(187) 0x42aaac MOV -0x60(%RBP),%R8 |
(188) 0x42aab0 VMOVSD (%R11),%XMM12 |
(188) 0x42aab5 VMOVSD (%R11,%RBX,8),%XMM13 |
(188) 0x42aabb ADD %RDI,%R11 |
(188) 0x42aabe ADD $0x4,%ESI |
(188) 0x42aac1 VMOVSD (%RCX),%XMM14 |
(188) 0x42aac5 VMOVSD (%RCX,%RBX,8),%XMM15 |
(188) 0x42aaca ADD %RDI,%RCX |
(188) 0x42aacd VMOVSD %XMM12,(%RDX) |
(188) 0x42aad1 VMOVSD %XMM13,(%RDX,%R10,1) |
(188) 0x42aad7 VMOVSD %XMM14,(%RDX,%R8,1) |
(188) 0x42aadd VMOVSD %XMM15,(%RDX,%R13,1) |
(188) 0x42aae3 ADD %RAX,%RDX |
(188) 0x42aae6 VMOVSD (%R11),%XMM3 |
(188) 0x42aaeb VMOVSD (%R11,%RBX,8),%XMM2 |
(188) 0x42aaf1 ADD %RDI,%R11 |
(188) 0x42aaf4 VMOVSD (%RCX),%XMM1 |
(188) 0x42aaf8 VMOVSD (%RCX,%RBX,8),%XMM0 |
(188) 0x42aafd ADD %RDI,%RCX |
(188) 0x42ab00 VMOVSD %XMM3,(%RDX) |
(188) 0x42ab04 VMOVSD %XMM2,(%RDX,%R10,1) |
(188) 0x42ab0a VMOVSD %XMM1,(%RDX,%R8,1) |
(188) 0x42ab10 VMOVSD %XMM0,(%RDX,%R13,1) |
(188) 0x42ab16 ADD %RAX,%RDX |
(188) 0x42ab19 VMOVSD (%R11),%XMM4 |
(188) 0x42ab1e VMOVSD (%R11,%RBX,8),%XMM5 |
(188) 0x42ab24 ADD %RDI,%R11 |
(188) 0x42ab27 VMOVSD (%RCX),%XMM6 |
(188) 0x42ab2b VMOVSD (%RCX,%RBX,8),%XMM7 |
(188) 0x42ab30 ADD %RDI,%RCX |
(188) 0x42ab33 VMOVSD %XMM4,(%RDX) |
(188) 0x42ab37 VMOVSD %XMM5,(%RDX,%R10,1) |
(188) 0x42ab3d VMOVSD %XMM6,(%RDX,%R8,1) |
(188) 0x42ab43 VMOVSD %XMM7,(%RDX,%R13,1) |
(188) 0x42ab49 ADD %RAX,%RDX |
(188) 0x42ab4c VMOVSD (%R11),%XMM8 |
(188) 0x42ab51 VMOVSD (%R11,%RBX,8),%XMM9 |
(188) 0x42ab57 ADD %RDI,%R11 |
(188) 0x42ab5a VMOVSD (%RCX),%XMM10 |
(188) 0x42ab5e VMOVSD (%RCX,%RBX,8),%XMM11 |
(188) 0x42ab63 ADD %RDI,%RCX |
(188) 0x42ab66 VMOVSD %XMM8,(%RDX) |
(188) 0x42ab6a VMOVSD %XMM9,(%RDX,%R10,1) |
(188) 0x42ab70 VMOVSD %XMM10,(%RDX,%R8,1) |
(188) 0x42ab76 VMOVSD %XMM11,(%RDX,%R13,1) |
(188) 0x42ab7c ADD %RAX,%RDX |
(188) 0x42ab7f CMP %ESI,-0x4c(%RBP) |
(188) 0x42ab82 JNE 42aab0 |
(187) 0x42ab88 MOV -0xa0(%RBP),%EAX |
(187) 0x42ab8e MOV -0xb0(%RBP),%R8 |
(187) 0x42ab95 MOV -0x98(%RBP),%ESI |
(187) 0x42ab9b CMP %ESI,-0x44(%RBP) |
(187) 0x42ab9e JE 42ac49 |
(187) 0x42aba4 MOV -0xb4(%RBP),%EDX |
(187) 0x42abaa MOV -0x44(%RBP),%R11D |
(187) 0x42abae SUB %ESI,%R11D |
(187) 0x42abb1 CMP $0x1,%R11D |
(187) 0x42abb5 JE 42ac1d |
(187) 0x42abb7 MOVSXD %R9D,%R13 |
(187) 0x42abba MOVSXD %EAX,%RCX |
(187) 0x42abbd LEA 0x1(%RCX,%R13,1),%RCX |
(187) 0x42abc2 MOV %RBX,%R13 |
(187) 0x42abc5 IMUL %RBX,%RCX |
(187) 0x42abc9 IMUL %RSI,%R13 |
(187) 0x42abcd IMUL %R10,%RSI |
(187) 0x42abd1 ADD %R15,%RCX |
(187) 0x42abd4 ADD %R13,%RCX |
(187) 0x42abd7 MOV -0x38(%RBP),%R13 |
(187) 0x42abdb LEA (%R13,%RCX,8),%R13 |
(187) 0x42abe0 MOVSXD -0x40(%RBP),%RCX |
(187) 0x42abe4 VMOVSD (%R13),%XMM12 |
(187) 0x42abea DEC %RCX |
(187) 0x42abed IMUL %R12,%RCX |
(187) 0x42abf1 ADD %R8,%RCX |
(187) 0x42abf4 LEA (%RSI,%RCX,8),%RCX |
(187) 0x42abf8 MOV -0x78(%RBP),%RSI |
(187) 0x42abfc ADD %R14,%RCX |
(187) 0x42abff VMOVSD (%R13,%RSI,1),%XMM13 |
(187) 0x42ac06 VMOVSD %XMM12,(%RCX) |
(187) 0x42ac0a VMOVSD %XMM13,(%RCX,%R10,1) |
(187) 0x42ac10 TEST $0x1,%R11B |
(187) 0x42ac14 JE 42ac49 |
(187) 0x42ac16 AND $-0x2,%R11D |
(187) 0x42ac1a ADD %R11D,%EDX |
(187) 0x42ac1d ADD %EDX,%EAX |
(187) 0x42ac1f MOV -0x38(%RBP),%R11 |
(187) 0x42ac23 ADD %R9D,%EAX |
(187) 0x42ac26 CLTQ |
(187) 0x42ac28 IMUL %RBX,%RAX |
(187) 0x42ac2c ADD %R15,%RAX |
(187) 0x42ac2f VMOVSD (%R11,%RAX,8),%XMM14 |
(187) 0x42ac35 MOV -0x40(%RBP),%EAX |
(187) 0x42ac38 SUB %EDX,%EAX |
(187) 0x42ac3a CLTQ |
(187) 0x42ac3c IMUL %R12,%RAX |
(187) 0x42ac40 ADD %R8,%RAX |
(187) 0x42ac43 VMOVSD %XMM14,(%R14,%RAX,8) |
(187) 0x42ac49 MOV -0x44(%RBP),%R13D |
(187) 0x42ac4d MOV -0x50(%RBP),%EDX |
(187) 0x42ac50 KMOVB %K0,%ECX |
(187) 0x42ac54 KMOVB %K1,%ESI |
(187) 0x42ac58 MOV -0x70(%RBP),%RAX |
(187) 0x42ac5c TEST %R13D,%R13D |
(187) 0x42ac5f CMOVNS -0x80(%RBP),%EDX |
(187) 0x42ac63 CMOVNS %ESI,%ECX |
(187) 0x42ac66 INCL -0x48(%RBP) |
(187) 0x42ac69 ADD %R13D,%R9D |
(187) 0x42ac6c ADD %RAX,%R8 |
(187) 0x42ac6f MOV %EDX,-0x50(%RBP) |
(187) 0x42ac72 KMOVB %ECX,%K0 |
(187) 0x42ac76 MOV -0x48(%RBP),%R11D |
(187) 0x42ac7a CMP %R11D,-0x7c(%RBP) |
(187) 0x42ac7e JG 42a938 |
0x42ac84 MOV -0xc0(%RBP),%R15 |
0x42ac8b KORTESTB %K0,%K0 |
0x42ac8f JE 42ac98 |
0x42ac91 MOV -0x50(%RBP),%EBX |
0x42ac94 MOV %EBX,0x50(%R15) |
0x42ac98 ADD $0x98,%RSP |
0x42ac9f POP %RBX |
0x42aca0 POP %R12 |
0x42aca2 POP %R13 |
0x42aca4 POP %R14 |
0x42aca6 POP %R15 |
0x42aca8 POP %RBP |
0x42aca9 RET |
0x42acaa NOPW (%RAX,%RAX,1) |
(187) 0x42acb0 XOR %ESI,%ESI |
(187) 0x42acb2 MOV $0x1,%EDX |
(187) 0x42acb7 JMP 42abaa |
0x42acbc INC %EAX |
0x42acbe XOR %EDX,%EDX |
0x42acc0 JMP 42a82f |
0x42acc5 NOPW %CS:(%RAX,%RAX,1) |
Path / |
Source file and lines | pack_kernel.f90:108-113 |
Module | exec |
nb instructions | 113 |
nb uops | 118 |
loop length | 424 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 20 |
micro-operation queue | 19.67 cycles |
front end | 19.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 8.60 | 8.60 | 8.33 | 8.33 | 14.50 | 8.60 | 8.60 | 14.50 | 14.50 | 14.50 | 8.60 | 8.33 |
cycles | 8.60 | 10.53 | 8.33 | 8.33 | 14.50 | 8.60 | 8.60 | 14.50 | 14.50 | 14.50 | 8.60 | 8.33 |
Cycles executing div or sqrt instructions | 6.00 |
FE+BE cycles | 19.35-19.36 |
Stall cycles | 0.00 |
Front-end | 19.67 |
Dispatch | 14.50 |
DIV/SQRT | 6.00 |
Overall L1 | 19.67 |
all | 0% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 0% |
all | 9% |
load | 12% |
store | 9% |
mul | 6% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 6% |
other | 6% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x98,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RDI),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RDI),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x54(%RDI),%R13D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RDI),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x40(%RDI),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RDI),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 402080 <@plt_start@+0x60> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %EAX,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 402180 <@plt_start@+0x160> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x38(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %EAX,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x58(%RCX),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
INC %EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SUB %R13D,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CLTD | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %R14D | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
CMP %EDX,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 42acbc <__pack_kernel_module_MOD_clover_unpack_message_left._omp_fn.0.lto_priv.0+0x4ec> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
IMUL %EAX,%ESI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %EDX,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %ESI,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMP %EAX,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 42ac98 <__pack_kernel_module_MOD_clover_unpack_message_left._omp_fn.0.lto_priv.0+0x4c8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x8(%RCX),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R13,%RSI,1),%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
ADD %R13D,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV (%RCX),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KXORB %K0,%K0,%K0 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV -0x70(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RCX),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %EAX,-0x7c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVSXD %EDI,%RAX | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
MOV (%R8),%R11D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RCX),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R12,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %RDX,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
NEG %R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x40(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x1(%R11),%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %R10,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (,%RBX,8),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x18(%RCX),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RDI,%RSI,1),%R9D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %ESI,-0x94(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA (,%R12,4),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAL $0x5,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %EDI,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11D,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
ADD %RAX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R10,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (,%R13,8),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAL $0x4,%R13 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
SHR $0x2,%EDI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RSI,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R11D,%R9D | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R11D,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R13,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R12,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SAL $0x4,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
AND $-0x4,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB %RDX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %EDI,-0x4c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SAL $0x3,%R13 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RAX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SAL $0x5,%RDI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %ESI,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
INC %ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
TEST %R11D,%R11D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
CMOVNS %R11D,%EAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R13,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %ESI,-0xb4(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
INC %EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %EAX,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11D,-0x44(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x1,%R11D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
KMOVB %R11D,%K1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0xc0(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K0,%K0 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 42ac98 <__pack_kernel_module_MOD_clover_unpack_message_left._omp_fn.0.lto_priv.0+0x4c8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x50(%RBP),%EBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %EBX,0x50(%R15) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $0x98,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
INC %EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 42a82f <__pack_kernel_module_MOD_clover_unpack_message_left._omp_fn.0.lto_priv.0+0x5f> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | pack_kernel.f90:108-113 |
Module | exec |
nb instructions | 113 |
nb uops | 118 |
loop length | 424 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 20 |
micro-operation queue | 19.67 cycles |
front end | 19.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 8.60 | 8.60 | 8.33 | 8.33 | 14.50 | 8.60 | 8.60 | 14.50 | 14.50 | 14.50 | 8.60 | 8.33 |
cycles | 8.60 | 10.53 | 8.33 | 8.33 | 14.50 | 8.60 | 8.60 | 14.50 | 14.50 | 14.50 | 8.60 | 8.33 |
Cycles executing div or sqrt instructions | 6.00 |
FE+BE cycles | 19.35-19.36 |
Stall cycles | 0.00 |
Front-end | 19.67 |
Dispatch | 14.50 |
DIV/SQRT | 6.00 |
Overall L1 | 19.67 |
all | 0% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 0% |
all | 9% |
load | 12% |
store | 9% |
mul | 6% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 6% |
other | 6% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x98,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RDI),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RDI),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x54(%RDI),%R13D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RDI),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x40(%RDI),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RDI),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 402080 <@plt_start@+0x60> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %EAX,%R14D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 402180 <@plt_start@+0x160> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x38(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %EAX,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x58(%RCX),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
INC %EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SUB %R13D,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CLTD | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %R14D | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
CMP %EDX,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 42acbc <__pack_kernel_module_MOD_clover_unpack_message_left._omp_fn.0.lto_priv.0+0x4ec> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
IMUL %EAX,%ESI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %EDX,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %ESI,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMP %EAX,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 42ac98 <__pack_kernel_module_MOD_clover_unpack_message_left._omp_fn.0.lto_priv.0+0x4c8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x8(%RCX),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R13,%RSI,1),%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
ADD %R13D,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV (%RCX),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KXORB %K0,%K0,%K0 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV -0x70(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RCX),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %EAX,-0x7c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVSXD %EDI,%RAX | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
MOV (%R8),%R11D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RCX),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R12,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %RDX,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
NEG %R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x40(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x1(%R11),%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %R10,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (,%RBX,8),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x18(%RCX),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RDI,%RSI,1),%R9D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %ESI,-0x94(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA (,%R12,4),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAL $0x5,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %EDI,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11D,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
ADD %RAX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R10,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (,%R13,8),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAL $0x4,%R13 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
SHR $0x2,%EDI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RSI,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R11D,%R9D | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R11D,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R13,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R12,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SAL $0x4,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
AND $-0x4,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB %RDX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %EDI,-0x4c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SAL $0x3,%R13 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RAX,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SAL $0x5,%RDI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %ESI,-0x98(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
INC %ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
TEST %R11D,%R11D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
CMOVNS %R11D,%EAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R13,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %ESI,-0xb4(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
INC %EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %EAX,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11D,-0x44(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x1,%R11D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
KMOVB %R11D,%K1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0xc0(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
KORTESTB %K0,%K0 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JE 42ac98 <__pack_kernel_module_MOD_clover_unpack_message_left._omp_fn.0.lto_priv.0+0x4c8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x50(%RBP),%EBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %EBX,0x50(%R15) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $0x98,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
INC %EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 42a82f <__pack_kernel_module_MOD_clover_unpack_message_left._omp_fn.0.lto_priv.0+0x5f> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼__pack_kernel_module_MOD_clover_unpack_message_left._omp_fn.0.lto_priv.0– | 0.03 | 0.01 |
▼Loop 187 - pack_kernel.f90:110-113 - exec– | 0.02 | 0.02 |
○Loop 188 - pack_kernel.f90:113-113 - exec | 0 | 0 |