Function: clover_unpack_message_right_.DIR.OMP.PARALLEL.LOOP.2.split103 | Module: exec | Source: pack_kernel.f90:202-210 | Coverage: 0.01% |
---|
Function: clover_unpack_message_right_.DIR.OMP.PARALLEL.LOOP.2.split103 | Module: exec | Source: pack_kernel.f90:202-210 | Coverage: 0.01% |
---|
/beegfs/hackathon/users/eoseret/qaas_runs/170-861-0321/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/pack_kernel.f90: 202 - 210 |
-------------------------------------------------------------------------------- |
202: !$OMP PARALLEL DO PRIVATE(index) |
203: DO k=y_min-depth,y_max+y_inc+depth |
204: !$OMP SIMD |
205: DO j=1,depth |
206: index= buffer_offset + j+(k+depth-1)*depth |
207: field(x_max+x_inc+j,k)=right_rcv_buffer(index) |
208: ENDDO |
209: ENDDO |
210: !$OMP END PARALLEL DO |
0x441f50 PUSH %RBP |
0x441f51 MOV %RSP,%RBP |
0x441f54 PUSH %R15 |
0x441f56 PUSH %R14 |
0x441f58 PUSH %R13 |
0x441f5a PUSH %R12 |
0x441f5c PUSH %RBX |
0x441f5d SUB $0x78,%RSP |
0x441f61 MOV %R9,-0x58(%RBP) |
0x441f65 MOV %R8,-0x68(%RBP) |
0x441f69 MOV %RCX,-0x50(%RBP) |
0x441f6d MOV 0x30(%RBP),%EAX |
0x441f70 MOVL $0,-0x44(%RBP) |
0x441f77 TEST %EAX,%EAX |
0x441f79 JS 441fda |
0x441f7b MOV %RDX,%R13 |
0x441f7e MOV (%RDI),%ESI |
0x441f80 MOVL $0,-0x30(%RBP) |
0x441f87 MOV %EAX,-0x2c(%RBP) |
0x441f8a MOVL $0x1,-0x40(%RBP) |
0x441f91 SUB $0x8,%RSP |
0x441f95 LEA -0x40(%RBP),%RAX |
0x441f99 LEA -0x44(%RBP),%RCX |
0x441f9d LEA -0x30(%RBP),%R8 |
0x441fa1 LEA -0x2c(%RBP),%R9 |
0x441fa5 MOV $0x573600,%EDI |
0x441faa MOV %ESI,-0x34(%RBP) |
0x441fad MOV $0x22,%EDX |
0x441fb2 PUSH $0x1 |
0x441fb4 PUSH $0x1 |
0x441fb6 PUSH %RAX |
0x441fb7 CALL 404670 <__kmpc_for_static_init_4@plt> |
0x441fbc ADD $0x20,%RSP |
0x441fc0 MOV -0x30(%RBP),%EAX |
0x441fc3 MOV -0x2c(%RBP),%EDX |
0x441fc6 SUB %EAX,%EDX |
0x441fc8 MOV %EDX,-0x3c(%RBP) |
0x441fcb JAE 441fe9 |
0x441fcd MOV $0x573620,%EDI |
0x441fd2 MOV -0x34(%RBP),%ESI |
0x441fd5 CALL 404230 <__kmpc_for_static_fini@plt> |
0x441fda ADD $0x78,%RSP |
0x441fde POP %RBX |
0x441fdf POP %R12 |
0x441fe1 POP %R13 |
0x441fe3 POP %R14 |
0x441fe5 POP %R15 |
0x441fe7 POP %RBP |
0x441fe8 RET |
0x441fe9 MOV %RAX,%RCX |
0x441fec MOV -0x58(%RBP),%RAX |
0x441ff0 MOV (%RAX),%EAX |
0x441ff2 MOV %RCX,%RDX |
0x441ff5 LEA (%RCX,%R13,1),%R9D |
0x441ff9 DEC %R9D |
0x441ffc MOV -0x50(%RBP),%RCX |
0x442000 INC %ECX |
0x442002 MOV %ECX,-0x38(%RBP) |
0x442005 XOR %R10D,%R10D |
0x442008 ADD %R13D,%EDX |
0x44200b MOV %RDX,-0x60(%RBP) |
0x44200f MOVDQA 0xeb6d9(%RIP),%XMM0 |
0x442017 MOVDQA 0xeb631(%RIP),%XMM1 |
0x44201f MOVDQA 0xeb709(%RIP),%XMM2 |
0x442027 PCMPEQD %XMM3,%XMM3 |
0x44202b JMP 442043 |
0x44202d NOPL (%RAX) |
(441) 0x442030 MOV %R11D,%EAX |
(441) 0x442033 LEA 0x1(%R10),%ECX |
(441) 0x442037 INC %R9D |
(441) 0x44203a CMP -0x3c(%RBP),%R10D |
(441) 0x44203e MOV %ECX,%R10D |
(441) 0x442041 JE 441fcd |
(441) 0x442043 TEST %EAX,%EAX |
(441) 0x442045 JLE 442033 |
(441) 0x442047 MOV -0x60(%RBP),%RCX |
(441) 0x44204b ADD %R10D,%ECX |
(441) 0x44204e MOV -0x68(%RBP),%RDX |
(441) 0x442052 MOVSXD (%RDX),%RSI |
(441) 0x442055 MOV -0x58(%RBP),%RDX |
(441) 0x442059 MOV (%RDX),%R11D |
(441) 0x44205c MOV 0x136b8d(%RIP),%R13 |
(441) 0x442063 MOV 0x136bbe(%RIP),%R12 |
(441) 0x44206a MOV 0x18(%RBP),%R8 |
(441) 0x44206e MOV (%R8),%RDX |
(441) 0x442071 MOV 0x38(%R8),%RBX |
(441) 0x442075 MOV 0x20(%RBP),%RDI |
(441) 0x442079 MOV (%RDI),%EDI |
(441) 0x44207b MOV 0x50(%R8),%R14 |
(441) 0x44207f MOV %EAX,%R8D |
(441) 0x442082 MOV %R8,%R15 |
(441) 0x442085 MOVSXD %ECX,%RAX |
(441) 0x442088 MOV $-0x4,%ECX |
(441) 0x44208d AND %RCX,%R15 |
(441) 0x442090 MOV %RSI,-0x98(%RBP) |
(441) 0x442097 JE 442300 |
(441) 0x44209d MOV %R10,-0x88(%RBP) |
(441) 0x4420a4 MOV %R9,-0x90(%RBP) |
(441) 0x4420ab LEA (%R11,%R9,1),%ECX |
(441) 0x4420af MOV %R11,-0x80(%RBP) |
(441) 0x4420b3 IMUL %R11D,%ECX |
(441) 0x4420b7 MOVSXD %ECX,%RCX |
(441) 0x4420ba ADD %RSI,%RCX |
(441) 0x4420bd MOV -0x50(%RBP),%RSI |
(441) 0x4420c1 MOV %RDI,%R9 |
(441) 0x4420c4 MOV %RBX,%RDI |
(441) 0x4420c7 MOV %R9,-0x70(%RBP) |
(441) 0x4420cb LEA (%RSI,%R9,1),%EBX |
(441) 0x4420cf MOVQ %R13,%XMM4 |
(441) 0x4420d4 PSHUFD $0x44,%XMM4,%XMM4 |
(441) 0x4420d9 MOVQ %R12,%XMM5 |
(441) 0x4420de PSHUFD $0x44,%XMM5,%XMM5 |
(441) 0x4420e3 MOVDQA %XMM5,%XMM6 |
(441) 0x4420e7 PSRLQ $0x20,%XMM6 |
(441) 0x4420ec MOVQ %RDX,%XMM7 |
(441) 0x4420f1 MOV %RDI,-0x78(%RBP) |
(441) 0x4420f5 MOVQ %RDI,%XMM8 |
(441) 0x4420fa PSHUFD $0x44,%XMM8,%XMM8 |
(441) 0x442100 MOVDQA %XMM8,%XMM9 |
(441) 0x442105 PSRLQ $0x20,%XMM9 |
(441) 0x44210b XOR %ESI,%ESI |
(441) 0x44210d NOPL (%RAX) |
(443) 0x442110 LEA (%RCX,%RSI,1),%RDI |
(443) 0x442114 MOVQ %RDI,%XMM10 |
(443) 0x442119 PSHUFD $0x44,%XMM10,%XMM10 |
(443) 0x44211f MOVDQA %XMM10,%XMM11 |
(443) 0x442124 PADDQ %XMM0,%XMM11 |
(443) 0x442129 PADDQ %XMM1,%XMM10 |
(443) 0x44212e MOVDQA %XMM6,%XMM12 |
(443) 0x442133 PMULUDQ %XMM10,%XMM12 |
(443) 0x442138 MOVDQA %XMM5,%XMM13 |
(443) 0x44213d PMULUDQ %XMM10,%XMM13 |
(443) 0x442142 PSRLQ $0x20,%XMM10 |
(443) 0x442148 PMULUDQ %XMM5,%XMM10 |
(443) 0x44214d PADDQ %XMM12,%XMM10 |
(443) 0x442152 PSLLQ $0x20,%XMM10 |
(443) 0x442158 MOVDQA %XMM6,%XMM12 |
(443) 0x44215d PMULUDQ %XMM11,%XMM12 |
(443) 0x442162 MOVDQA %XMM5,%XMM14 |
(443) 0x442167 PMULUDQ %XMM11,%XMM14 |
(443) 0x44216c PSRLQ $0x20,%XMM11 |
(443) 0x442172 PMULUDQ %XMM5,%XMM11 |
(443) 0x442177 PADDQ %XMM12,%XMM11 |
(443) 0x44217c PSLLQ $0x20,%XMM11 |
(443) 0x442182 PADDQ %XMM4,%XMM14 |
(443) 0x442187 PADDQ %XMM11,%XMM14 |
(443) 0x44218c PADDQ %XMM4,%XMM13 |
(443) 0x442191 PADDQ %XMM10,%XMM13 |
(443) 0x442196 MOVQ %XMM13,%RDI |
(443) 0x44219b MOVSD (%RDI),%XMM10 |
(443) 0x4421a0 PSHUFD $-0x12,%XMM13,%XMM11 |
(443) 0x4421a6 MOVQ %XMM11,%R11 |
(443) 0x4421ab MOVQ %XMM14,%R10 |
(443) 0x4421b0 PSHUFD $-0x12,%XMM14,%XMM11 |
(443) 0x4421b6 MOVQ %XMM11,%RDI |
(443) 0x4421bb LEA (%RBX,%RSI,1),%R9D |
(443) 0x4421bf MOVD %R9D,%XMM11 |
(443) 0x4421c4 LEA 0x1(%RAX),%R9 |
(443) 0x4421c8 IMUL %R14,%R9 |
(443) 0x4421cc PSHUFD $0,%XMM11,%XMM11 |
(443) 0x4421d2 PADDD %XMM2,%XMM11 |
(443) 0x4421d7 PXOR %XMM13,%XMM13 |
(443) 0x4421dc PCMPGTD %XMM11,%XMM13 |
(443) 0x4421e1 PSHUFD $-0x12,%XMM11,%XMM12 |
(443) 0x4421e7 PUNPCKLDQ %XMM13,%XMM11 |
(443) 0x4421ec PXOR %XMM13,%XMM13 |
(443) 0x4421f1 PCMPGTD %XMM12,%XMM13 |
(443) 0x4421f6 PUNPCKLDQ %XMM13,%XMM12 |
(443) 0x4421fb PSUBQ %XMM3,%XMM12 |
(443) 0x442200 PSUBQ %XMM3,%XMM11 |
(443) 0x442205 MOVDQA %XMM9,%XMM13 |
(443) 0x44220a PMULUDQ %XMM11,%XMM13 |
(443) 0x44220f MOVDQA %XMM8,%XMM14 |
(443) 0x442214 PMULUDQ %XMM11,%XMM14 |
(443) 0x442219 PSRLQ $0x20,%XMM11 |
(443) 0x44221f PMULUDQ %XMM8,%XMM11 |
(443) 0x442224 PADDQ %XMM13,%XMM11 |
(443) 0x442229 MOVDQA %XMM9,%XMM13 |
(443) 0x44222e PMULUDQ %XMM12,%XMM13 |
(443) 0x442233 MOVDQA %XMM8,%XMM15 |
(443) 0x442238 PMULUDQ %XMM12,%XMM15 |
(443) 0x44223d PSRLQ $0x20,%XMM12 |
(443) 0x442243 PMULUDQ %XMM8,%XMM12 |
(443) 0x442248 PADDQ %XMM13,%XMM12 |
(443) 0x44224d MOVQ %R9,%XMM13 |
(443) 0x442252 PADDQ %XMM7,%XMM13 |
(443) 0x442257 PSHUFD $0x44,%XMM13,%XMM13 |
(443) 0x44225d PSLLQ $0x20,%XMM12 |
(443) 0x442263 PADDQ %XMM13,%XMM15 |
(443) 0x442268 PADDQ %XMM12,%XMM15 |
(443) 0x44226d MOVSD (%R11),%XMM12 |
(443) 0x442272 PADDQ %XMM13,%XMM14 |
(443) 0x442277 MOVSD (%R10),%XMM13 |
(443) 0x44227c PSLLQ $0x20,%XMM11 |
(443) 0x442282 PADDQ %XMM11,%XMM14 |
(443) 0x442287 MOVSD (%RDI),%XMM11 |
(443) 0x44228c MOVQ %XMM14,%RDI |
(443) 0x442291 MOVSD %XMM10,(%RDI) |
(443) 0x442296 PSHUFD $-0x12,%XMM14,%XMM10 |
(443) 0x44229c MOVQ %XMM10,%RDI |
(443) 0x4422a1 MOVSD %XMM12,(%RDI) |
(443) 0x4422a6 MOVQ %XMM15,%RDI |
(443) 0x4422ab MOVSD %XMM13,(%RDI) |
(443) 0x4422b0 PSHUFD $-0x12,%XMM15,%XMM10 |
(443) 0x4422b6 MOVQ %XMM10,%RDI |
(443) 0x4422bb MOVSD %XMM11,(%RDI) |
(443) 0x4422c0 ADD $0x4,%RSI |
(443) 0x4422c4 CMP %R15,%RSI |
(443) 0x4422c7 JB 442110 |
(441) 0x4422cd CMP %R8,%R15 |
(441) 0x4422d0 MOV -0x90(%RBP),%R9 |
(441) 0x4422d7 MOV -0x88(%RBP),%R10 |
(441) 0x4422de MOV -0x80(%RBP),%R11 |
(441) 0x4422e2 MOV -0x78(%RBP),%RBX |
(441) 0x4422e6 MOV -0x70(%RBP),%RDI |
(441) 0x4422ea JE 442030 |
(441) 0x4422f0 JMP 442303 |
0x4422f2 NOPW %CS:(%RAX,%RAX,1) |
(441) 0x442300 XOR %R15D,%R15D |
(441) 0x442303 SUB %R15,%R8 |
(441) 0x442306 MOV -0x98(%RBP),%RSI |
(441) 0x44230d ADD %R15,%RSI |
(441) 0x442310 LEA (%R11,%R9,1),%ECX |
(441) 0x442314 IMUL %R11D,%ECX |
(441) 0x442318 MOVSXD %ECX,%RCX |
(441) 0x44231b ADD %RSI,%RCX |
(441) 0x44231e IMUL %R12,%RCX |
(441) 0x442322 ADD %RCX,%R13 |
(441) 0x442325 ADD -0x38(%RBP),%EDI |
(441) 0x442328 ADD %EDI,%R15D |
(441) 0x44232b INC %RAX |
(441) 0x44232e IMUL %RAX,%R14 |
(441) 0x442332 ADD %R14,%RDX |
(441) 0x442335 NOPW %CS:(%RAX,%RAX,1) |
(442) 0x442340 MOVSXD %R15D,%R15 |
(442) 0x442343 LEA 0x1(%R15),%RAX |
(442) 0x442347 IMUL %RBX,%RAX |
(442) 0x44234b MOVQ (%R13),%XMM4 |
(442) 0x442351 MOVQ %XMM4,(%RAX,%RDX,1) |
(442) 0x442356 ADD %R12,%R13 |
(442) 0x442359 INC %R15D |
(442) 0x44235c DEC %R8 |
(442) 0x44235f JNE 442340 |
(441) 0x442361 JMP 442030 |
0x442366 NOPW %CS:(%RAX,%RAX,1) |
Path / |
Source file and lines | pack_kernel.f90:202-210 |
Module | exec |
nb instructions | 69 |
nb uops | 68 |
loop length | 248 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 4 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 12 |
micro-operation queue | 11.33 cycles |
front end | 11.33 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 5.00 | 5.00 | 5.00 | 5.00 | 3.00 | 8.00 | 8.00 | 8.00 | 0.25 | 0.25 | 0.25 | 0.25 | 0.00 | 0.00 |
cycles | 5.00 | 5.00 | 5.00 | 5.00 | 3.00 | 8.00 | 8.00 | 8.00 | 0.25 | 0.25 | 0.25 | 0.25 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 11.33 |
Dispatch | 8.00 |
Overall L1 | 11.33 |
all | 16% |
load | 60% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 33% |
all | 11% |
load | 17% |
store | 8% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 11% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB $0x78,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R9,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R8,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RCX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x30(%RBP),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVL $0,-0x44(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
TEST %EAX,%EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JS 441fda <pack_kernel_module_mp_clover_unpack_message_right_.DIR.OMP.PARALLEL.LOOP.2.split103+0x8a> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVL $0,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %EAX,-0x2c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVL $0x1,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x40(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x44(%RBP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x30(%RBP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x2c(%RBP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x573600,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %ESI,-0x34(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CALL 404670 <__kmpc_for_static_init_4@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0x30(%RBP),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x2c(%RBP),%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %EAX,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %EDX,-0x3c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
JAE 441fe9 <pack_kernel_module_mp_clover_unpack_message_right_.DIR.OMP.PARALLEL.LOOP.2.split103+0x99> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV $0x573620,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0x34(%RBP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CALL 404230 <__kmpc_for_static_fini@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x78,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x58(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RAX),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RCX,%R13,1),%R9D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
DEC %R9D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0x50(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
INC %ECX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %ECX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
XOR %R10D,%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
ADD %R13D,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVDQA 0xeb6d9(%RIP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOVDQA 0xeb631(%RIP),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOVDQA 0xeb709(%RIP),%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
PCMPEQD %XMM3,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
JMP 442043 <pack_kernel_module_mp_clover_unpack_message_right_.DIR.OMP.PARALLEL.LOOP.2.split103+0xf3> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
Source file and lines | pack_kernel.f90:202-210 |
Module | exec |
nb instructions | 69 |
nb uops | 68 |
loop length | 248 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 4 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 12 |
micro-operation queue | 11.33 cycles |
front end | 11.33 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 5.00 | 5.00 | 5.00 | 5.00 | 3.00 | 8.00 | 8.00 | 8.00 | 0.25 | 0.25 | 0.25 | 0.25 | 0.00 | 0.00 |
cycles | 5.00 | 5.00 | 5.00 | 5.00 | 3.00 | 8.00 | 8.00 | 8.00 | 0.25 | 0.25 | 0.25 | 0.25 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 11.33 |
Dispatch | 8.00 |
Overall L1 | 11.33 |
all | 16% |
load | 60% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 33% |
all | 11% |
load | 17% |
store | 8% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 11% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB $0x78,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R9,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %R8,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RCX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x30(%RBP),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVL $0,-0x44(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
TEST %EAX,%EAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JS 441fda <pack_kernel_module_mp_clover_unpack_message_right_.DIR.OMP.PARALLEL.LOOP.2.split103+0x8a> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOVL $0,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %EAX,-0x2c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVL $0x1,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
SUB $0x8,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x40(%RBP),%RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x44(%RBP),%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x30(%RBP),%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LEA -0x2c(%RBP),%R9 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV $0x573600,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %ESI,-0x34(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV $0x22,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CALL 404670 <__kmpc_for_static_init_4@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x20,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0x30(%RBP),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x2c(%RBP),%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
SUB %EAX,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %EDX,-0x3c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
JAE 441fe9 <pack_kernel_module_mp_clover_unpack_message_right_.DIR.OMP.PARALLEL.LOOP.2.split103+0x99> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV $0x573620,%EDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0x34(%RBP),%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CALL 404230 <__kmpc_for_static_fini@plt> | 2 | 0.50 | 0 | 0 | 0 | 0.50 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD $0x78,%RSP | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
POP %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
RET | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x58(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RAX),%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RCX,%R13,1),%R9D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
DEC %R9D | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV -0x50(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
INC %ECX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %ECX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
XOR %R10D,%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 |
ADD %R13D,%EDX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RDX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOVDQA 0xeb6d9(%RIP),%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOVDQA 0xeb631(%RIP),%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOVDQA 0xeb709(%RIP),%XMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
PCMPEQD %XMM3,%XMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 1 | 0.25 |
JMP 442043 <pack_kernel_module_mp_clover_unpack_message_right_.DIR.OMP.PARALLEL.LOOP.2.split103+0xf3> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
NOPW %CS:(%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼clover_unpack_message_right_.DIR.OMP.PARALLEL.LOOP.2.split103– | 0.01 | 0 |
▼Loop 441 - pack_kernel.f90:203-207 - exec– | 0 | 0 |
○Loop 442 - pack_kernel.f90:205-207 - exec | 0.01 | 0.01 |
○Loop 443 - pack_kernel.f90:205-207 - exec | 0 | 0 |