Function: initialise_chunk(int, global_variables&) [clone .extracted.7] | Module: exec | Source: initialise_chunk.cpp:77-83 [...] | Coverage: 0.01% |
---|
Function: initialise_chunk(int, global_variables&) [clone .extracted.7] | Module: exec | Source: initialise_chunk.cpp:77-83 [...] | Coverage: 0.01% |
---|
/scratch_na/users/xoserete/qaas_runs/171-415-4687/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/context.h: 46 - 69 |
-------------------------------------------------------------------------------- |
46: T &operator[](size_t i) const { return data[i]; } |
[...] |
69: T &operator()(size_t i, size_t j) const { return data[i + j * sizeX]; } |
/scratch_na/users/xoserete/qaas_runs/171-415-4687/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/initialise_chunk.cpp: 77 - 83 |
-------------------------------------------------------------------------------- |
77: #pragma omp parallel for simd collapse(2) |
78: for (int j = (0); j < (yrange1); j++) { |
79: for (int i = (0); i < (xrange1); i++) { |
80: field.volume(i, j) = dx * dy; |
81: field.xarea(i, j) = field.celldy[j]; |
82: field.yarea(i, j) = field.celldx[i]; |
83: } |
0x42e8a0 PUSH %RBP |
0x42e8a1 MOV %RSP,%RBP |
0x42e8a4 PUSH %R15 |
0x42e8a6 PUSH %R14 |
0x42e8a8 PUSH %R13 |
0x42e8aa PUSH %R12 |
0x42e8ac PUSH %RBX |
0x42e8ad SUB $0x68,%RSP |
0x42e8b1 MOVL $0,-0x30(%RBP) |
0x42e8b8 MOV %R9,%RBX |
0x42e8bb MOV %R8,%R15 |
0x42e8be MOV %RCX,%R12 |
0x42e8c1 MOV %RDX,%R13 |
0x42e8c4 MOV (%RDI),%ESI |
0x42e8c6 MOVQ $0,-0x38(%RBP) |
0x42e8ce MOVQ $0x1,-0x88(%RBP) |
0x42e8d9 SUB $0x8,%RSP |
0x42e8dd LEA -0x88(%RBP),%RAX |
0x42e8e4 LEA -0x30(%RBP),%RCX |
0x42e8e8 LEA -0x38(%RBP),%R8 |
0x42e8ec LEA 0x18(%RBP),%R9 |
0x42e8f0 MOV $0x683250,%EDI |
0x42e8f5 MOV %ESI,-0x2c(%RBP) |
0x42e8f8 MOV $0x22,%EDX |
0x42e8fd PUSH $0x1 |
0x42e8ff PUSH $0x1 |
0x42e901 PUSH %RAX |
0x42e902 CALL 403020 <__kmpc_for_static_init_8@plt> |
0x42e907 ADD $0x20,%RSP |
0x42e90b MOV -0x38(%RBP),%RSI |
0x42e90f MOV 0x18(%RBP),%R9 |
0x42e913 CMP %R9,%RSI |
0x42e916 JA 42ecb7 |
0x42e91c MOV %RBX,%R8 |
0x42e91f VMOVQ %R13,%XMM0 |
0x42e924 VMOVQ %R12,%XMM1 |
0x42e929 VMULSD %XMM0,%XMM1,%XMM16 |
0x42e92f MOV 0x2a0(%R15),%R12 |
0x42e936 MOV 0x290(%R15),%R10 |
0x42e93d MOV 0x228(%R15),%R14 |
0x42e944 MOV 0x248(%R15),%R13 |
0x42e94b MOV 0x2b8(%R15),%RDI |
0x42e952 MOV 0x2a8(%R15),%R11 |
0x42e959 MOV 0x2d0(%R15),%RBX |
0x42e960 MOV 0x2c0(%R15),%R15 |
0x42e967 LEA 0x1(%RSI),%RAX |
0x42e96b INC %R9 |
0x42e96e CMP %R9,%RAX |
0x42e971 CMOVG %RAX,%R9 |
0x42e975 MOV %R9,%RCX |
0x42e978 SUB %RSI,%RCX |
0x42e97b MOV %RCX,%RAX |
0x42e97e AND $-0x10,%RAX |
0x42e982 JE 42ecd5 |
0x42e988 MOV %RCX,-0x40(%RBP) |
0x42e98c MOV %R9,-0x68(%RBP) |
0x42e990 MOV %RAX,-0x48(%RBP) |
0x42e994 DEC %RAX |
0x42e997 MOV %RAX,-0x80(%RBP) |
0x42e99b MOV %R8,-0x70(%RBP) |
0x42e99f VPBROADCASTQ %R8,%YMM8 |
0x42e9a5 MOV %R10,-0x60(%RBP) |
0x42e9a9 VPBROADCASTQ %R10,%YMM17 |
0x42e9af VBROADCASTSD %XMM16,%YMM18 |
0x42e9b5 MOV %R11,-0x58(%RBP) |
0x42e9b9 VPBROADCASTQ %R11,%YMM19 |
0x42e9bf MOV %R15,-0x50(%RBP) |
0x42e9c3 VPBROADCASTQ %R15,%YMM20 |
0x42e9c9 XOR %R15D,%R15D |
0x42e9cc VMOVDQU64 0x397ea(%RIP),%YMM21 |
0x42e9d6 VMOVDQU64 0x39800(%RIP),%YMM22 |
0x42e9e0 VMOVDQU64 0x37896(%RIP),%YMM23 |
0x42e9ea VMOVDQU64 0x3770c(%RIP),%YMM24 |
0x42e9f4 MOV %RSI,-0x78(%RBP) |
0x42e9f8 NOPL (%RAX,%RAX,1) |
(196) 0x42ea00 LEA (%RSI,%R15,1),%RAX |
(196) 0x42ea04 VPBROADCASTQ %RAX,%YMM0 |
(196) 0x42ea0a VPADDQ %YMM21,%YMM0,%YMM9 |
(196) 0x42ea10 VPADDQ %YMM22,%YMM0,%YMM10 |
(196) 0x42ea16 VPADDQ %YMM23,%YMM0,%YMM11 |
(196) 0x42ea1c VPADDQ %YMM24,%YMM0,%YMM12 |
(196) 0x42ea22 VMOVDQA %YMM12,%YMM0 |
(196) 0x42ea26 VMOVDQA %YMM8,%YMM1 |
(196) 0x42ea2a MOV $0x454200,%RAX |
(196) 0x42ea31 MOV %RBX,%RSI |
(196) 0x42ea34 MOV %RDI,%RBX |
(196) 0x42ea37 MOV %R13,%RDI |
(196) 0x42ea3a MOV %R14,%R13 |
(196) 0x42ea3d MOV %R12,%R14 |
(196) 0x42ea40 MOV %RAX,%R12 |
(196) 0x42ea43 CALL %RAX |
(196) 0x42ea45 VMOVDQA %YMM0,%YMM13 |
(196) 0x42ea49 VMOVDQA %YMM11,%YMM0 |
(196) 0x42ea4d VMOVDQA %YMM8,%YMM1 |
(196) 0x42ea51 CALL %R12 |
(196) 0x42ea54 VMOVDQA %YMM0,%YMM14 |
(196) 0x42ea58 VMOVDQA %YMM10,%YMM0 |
(196) 0x42ea5c VMOVDQA %YMM8,%YMM1 |
(196) 0x42ea60 CALL %R12 |
(196) 0x42ea63 VMOVDQA %YMM0,%YMM15 |
(196) 0x42ea67 VMOVDQA %YMM9,%YMM0 |
(196) 0x42ea6b VMOVDQA %YMM8,%YMM1 |
(196) 0x42ea6f CALL %R12 |
(196) 0x42ea72 MOV %R14,%R12 |
(196) 0x42ea75 MOV %R13,%R14 |
(196) 0x42ea78 MOV %RDI,%R13 |
(196) 0x42ea7b MOV %RBX,%RDI |
(196) 0x42ea7e MOV %RSI,%RBX |
(196) 0x42ea81 MOV -0x78(%RBP),%RSI |
(196) 0x42ea85 VXORPS %XMM4,%XMM4,%XMM4 |
(196) 0x42ea89 VPMULLQ %YMM8,%YMM0,%YMM4 |
(196) 0x42ea8f VPMULLQ %YMM8,%YMM15,%YMM5 |
(196) 0x42ea95 VPMULLQ %YMM8,%YMM14,%YMM6 |
(196) 0x42ea9b VXORPS %XMM2,%XMM2,%XMM2 |
(196) 0x42ea9f VPMULLQ %YMM8,%YMM13,%YMM2 |
(196) 0x42eaa5 VPSLLQ $0x20,%YMM14,%YMM1 |
(196) 0x42eaab VPSRAQ $0x20,%YMM1,%YMM1 |
(196) 0x42eab2 VPSLLQ $0x20,%YMM13,%YMM3 |
(196) 0x42eab8 VPSRAQ $0x20,%YMM3,%YMM3 |
(196) 0x42eabf VPMULLQ %YMM3,%YMM17,%YMM7 |
(196) 0x42eac5 VXORPS %XMM13,%XMM13,%XMM13 |
(196) 0x42eaca VPMULLQ %YMM1,%YMM17,%YMM13 |
(196) 0x42ead0 VPSLLQ $0x20,%YMM15,%YMM14 |
(196) 0x42ead6 VPSRAQ $0x20,%YMM14,%YMM14 |
(196) 0x42eadd VXORPS %XMM15,%XMM15,%XMM15 |
(196) 0x42eae2 VPMULLQ %YMM14,%YMM17,%YMM15 |
(196) 0x42eae8 VPSUBQ %YMM2,%YMM12,%YMM2 |
(196) 0x42eaec VPSLLQ $0x20,%YMM0,%YMM0 |
(196) 0x42eaf1 VPSRAQ $0x20,%YMM0,%YMM0 |
(196) 0x42eaf8 VXORPS %XMM12,%XMM12,%XMM12 |
(196) 0x42eafd VPMULLQ %YMM0,%YMM17,%YMM12 |
(196) 0x42eb03 VPSUBQ %YMM6,%YMM11,%YMM6 |
(196) 0x42eb07 VPSUBQ %YMM5,%YMM10,%YMM5 |
(196) 0x42eb0b VPSUBQ %YMM4,%YMM9,%YMM4 |
(196) 0x42eb0f VPADDQ %YMM4,%YMM12,%YMM9 |
(196) 0x42eb13 VPADDQ %YMM5,%YMM15,%YMM10 |
(196) 0x42eb17 VPADDQ %YMM6,%YMM13,%YMM11 |
(196) 0x42eb1b VPADDQ %YMM7,%YMM2,%YMM7 |
(196) 0x42eb1f KXNORW %K0,%K0,%K1 |
(196) 0x42eb23 VSCATTERQPD %YMM18,(%R12,%YMM7,8){%K1} |
(196) 0x42eb2a KXNORW %K0,%K0,%K1 |
(196) 0x42eb2e VSCATTERQPD %YMM18,(%R12,%YMM11,8){%K1} |
(196) 0x42eb35 KXNORW %K0,%K0,%K1 |
(196) 0x42eb39 VSCATTERQPD %YMM18,(%R12,%YMM10,8){%K1} |
(196) 0x42eb40 KXNORW %K0,%K0,%K1 |
(196) 0x42eb44 VSCATTERQPD %YMM18,(%R12,%YMM9,8){%K1} |
(196) 0x42eb4b KXNORW %K0,%K0,%K1 |
(196) 0x42eb4f VXORPD %XMM7,%XMM7,%XMM7 |
(196) 0x42eb53 VGATHERQPD (%R13,%YMM0,8),%YMM7{%K1} |
(196) 0x42eb5b KXNORW %K0,%K0,%K1 |
(196) 0x42eb5f VXORPD %XMM9,%XMM9,%XMM9 |
(196) 0x42eb64 VGATHERQPD (%R13,%YMM14,8),%YMM9{%K1} |
(196) 0x42eb6c KXNORW %K0,%K0,%K1 |
(196) 0x42eb70 VXORPD %XMM10,%XMM10,%XMM10 |
(196) 0x42eb75 VGATHERQPD (%R13,%YMM1,8),%YMM10{%K1} |
(196) 0x42eb7d KXNORW %K0,%K0,%K1 |
(196) 0x42eb81 VXORPD %XMM11,%XMM11,%XMM11 |
(196) 0x42eb86 VGATHERQPD (%R13,%YMM3,8),%YMM11{%K1} |
(196) 0x42eb8e VXORPS %XMM12,%XMM12,%XMM12 |
(196) 0x42eb93 VPMULLQ %YMM3,%YMM19,%YMM12 |
(196) 0x42eb99 VXORPS %XMM13,%XMM13,%XMM13 |
(196) 0x42eb9e VPMULLQ %YMM1,%YMM19,%YMM13 |
(196) 0x42eba4 VXORPS %XMM15,%XMM15,%XMM15 |
(196) 0x42eba9 VPMULLQ %YMM14,%YMM19,%YMM15 |
(196) 0x42ebaf VPMULLQ %YMM0,%YMM19,%YMM25 |
(196) 0x42ebb5 VPADDQ %YMM25,%YMM4,%YMM25 |
(196) 0x42ebbb VPADDQ %YMM5,%YMM15,%YMM15 |
(196) 0x42ebbf VPADDQ %YMM6,%YMM13,%YMM13 |
(196) 0x42ebc3 VPADDQ %YMM2,%YMM12,%YMM12 |
(196) 0x42ebc7 KXNORW %K0,%K0,%K1 |
(196) 0x42ebcb VSCATTERQPD %YMM11,(%RDI,%YMM12,8){%K1} |
(196) 0x42ebd2 KXNORW %K0,%K0,%K1 |
(196) 0x42ebd6 VSCATTERQPD %YMM10,(%RDI,%YMM13,8){%K1} |
(196) 0x42ebdd KXNORW %K0,%K0,%K1 |
(196) 0x42ebe1 VSCATTERQPD %YMM9,(%RDI,%YMM15,8){%K1} |
(196) 0x42ebe8 KXNORW %K0,%K0,%K1 |
(196) 0x42ebec VSCATTERQPD %YMM7,(%RDI,%YMM25,8){%K1} |
(196) 0x42ebf3 KXNORW %K0,%K0,%K1 |
(196) 0x42ebf7 VXORPD %XMM7,%XMM7,%XMM7 |
(196) 0x42ebfb VGATHERQPD (%R14,%YMM4,8),%YMM7{%K1} |
(196) 0x42ec02 KXNORW %K0,%K0,%K1 |
(196) 0x42ec06 VXORPD %XMM9,%XMM9,%XMM9 |
(196) 0x42ec0b VGATHERQPD (%R14,%YMM5,8),%YMM9{%K1} |
(196) 0x42ec12 KXNORW %K0,%K0,%K1 |
(196) 0x42ec16 VXORPD %XMM10,%XMM10,%XMM10 |
(196) 0x42ec1b VGATHERQPD (%R14,%YMM6,8),%YMM10{%K1} |
(196) 0x42ec22 KXNORW %K0,%K0,%K1 |
(196) 0x42ec26 VXORPD %XMM11,%XMM11,%XMM11 |
(196) 0x42ec2b VGATHERQPD (%R14,%YMM2,8),%YMM11{%K1} |
(196) 0x42ec32 VPMULLQ %YMM3,%YMM20,%YMM3 |
(196) 0x42ec38 VPMULLQ %YMM1,%YMM20,%YMM1 |
(196) 0x42ec3e VXORPS %XMM12,%XMM12,%XMM12 |
(196) 0x42ec43 VPMULLQ %YMM14,%YMM20,%YMM12 |
(196) 0x42ec49 VPMULLQ %YMM0,%YMM20,%YMM0 |
(196) 0x42ec4f VPADDQ %YMM0,%YMM4,%YMM0 |
(196) 0x42ec53 VPADDQ %YMM5,%YMM12,%YMM4 |
(196) 0x42ec57 VPADDQ %YMM1,%YMM6,%YMM1 |
(196) 0x42ec5b VPADDQ %YMM3,%YMM2,%YMM2 |
(196) 0x42ec5f KXNORW %K0,%K0,%K1 |
(196) 0x42ec63 VSCATTERQPD %YMM11,(%RBX,%YMM2,8){%K1} |
(196) 0x42ec6a KXNORW %K0,%K0,%K1 |
(196) 0x42ec6e VSCATTERQPD %YMM10,(%RBX,%YMM1,8){%K1} |
(196) 0x42ec75 KXNORW %K0,%K0,%K1 |
(196) 0x42ec79 VSCATTERQPD %YMM9,(%RBX,%YMM4,8){%K1} |
(196) 0x42ec80 KXNORW %K0,%K0,%K1 |
(196) 0x42ec84 VSCATTERQPD %YMM7,(%RBX,%YMM0,8){%K1} |
(196) 0x42ec8b ADD $0x10,%R15 |
(196) 0x42ec8f CMP -0x80(%RBP),%R15 |
(196) 0x42ec93 JBE 42ea00 |
0x42ec99 MOV -0x48(%RBP),%RAX |
0x42ec9d CMP %RAX,-0x40(%RBP) |
0x42eca1 MOV -0x70(%RBP),%R8 |
0x42eca5 MOV -0x68(%RBP),%R9 |
0x42eca9 MOV -0x60(%RBP),%R10 |
0x42ecad MOV -0x58(%RBP),%R11 |
0x42ecb1 MOV -0x50(%RBP),%R15 |
0x42ecb5 JNE 42ecd7 |
0x42ecb7 MOV $0x683270,%EDI |
0x42ecbc MOV -0x2c(%RBP),%ESI |
0x42ecbf ADD $0x68,%RSP |
0x42ecc3 POP %RBX |
0x42ecc4 POP %R12 |
0x42ecc6 POP %R13 |
0x42ecc8 POP %R14 |
0x42ecca POP %R15 |
0x42eccc POP %RBP |
0x42eccd VZEROUPPER |
0x42ecd0 JMP 402e90 |
0x42ecd5 XOR %EAX,%EAX |
0x42ecd7 ADD %RAX,%RSI |
0x42ecda JMP 42ed2b |
0x42ecdc NOPL (%RAX) |
(195) 0x42ece0 MOV %RSI,%RAX |
(195) 0x42ece3 CQTO |
(195) 0x42ece5 IDIV %R8 |
(195) 0x42ece8 CLTQ |
(195) 0x42ecea MOV %R10,%RCX |
(195) 0x42eced IMUL %RAX,%RCX |
(195) 0x42ecf1 ADD %RDX,%RCX |
(195) 0x42ecf4 VMOVSD %XMM16,(%R12,%RCX,8) |
(195) 0x42ecfb MOV %R11,%RCX |
(195) 0x42ecfe IMUL %RAX,%RCX |
(195) 0x42ed02 ADD %RDX,%RCX |
(195) 0x42ed05 VMOVSD (%R13,%RAX,8),%XMM0 |
(195) 0x42ed0c VMOVSD %XMM0,(%RDI,%RCX,8) |
(195) 0x42ed11 IMUL %R15,%RAX |
(195) 0x42ed15 ADD %RDX,%RAX |
(195) 0x42ed18 VMOVSD (%R14,%RDX,8),%XMM0 |
(195) 0x42ed1e VMOVSD %XMM0,(%RBX,%RAX,8) |
(195) 0x42ed23 INC %RSI |
(195) 0x42ed26 CMP %RSI,%R9 |
(195) 0x42ed29 JE 42ecb7 |
(195) 0x42ed2b MOV %RSI,%RAX |
(195) 0x42ed2e OR %R8,%RAX |
(195) 0x42ed31 SHR $0x20,%RAX |
(195) 0x42ed35 JNE 42ece0 |
(195) 0x42ed37 MOV %ESI,%EAX |
(195) 0x42ed39 XOR %EDX,%EDX |
(195) 0x42ed3b DIV %R8D |
(195) 0x42ed3e JMP 42ece8 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►100.00+ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Path / |
Source file and lines | initialise_chunk.cpp:77-83 |
Module | exec |
nb instructions | 98 |
nb uops | 100 |
loop length | 423 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 9 |
used zmm registers | 0 |
nb stack references | 14 |
micro-operation queue | 16.67 cycles |
front end | 16.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 3.50 | 3.50 | 9.67 | 9.67 | 11.50 | 7.00 | 3.40 | 11.50 | 11.50 | 11.50 | 3.60 | 9.67 |
cycles | 3.50 | 3.50 | 9.67 | 9.67 | 11.50 | 7.00 | 3.40 | 11.50 | 11.50 | 11.50 | 3.60 | 9.67 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 16.43-16.44 |
Stall cycles | 0.00 |
Front-end | 16.67 |
Dispatch | 11.50 |
Overall L1 | 16.67 |
all | 9% |
load | 25% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 5% |
all | 0% |
load | NA (no load vectorizable/vectorized instructions) |
store | NA (no store vectorizable/vectorized instructions) |
mul | 0% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 9% |
load | 25% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 5% |
all | 15% |
load | 21% |
store | 10% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 12% |
load | NA (no load vectorizable/vectorized instructions) |
store | NA (no store vectorizable/vectorized instructions) |
mul | 12% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 14% |
load | 21% |
store | 10% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x68,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOVL $0,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R8,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVQ $0x1,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x88(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x30(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x38(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x18(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x683250,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,-0x2c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x22,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
CALL 403020 <__kmpc_for_static_init_8@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x20,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x38(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R9,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JA 42ecb7 <_Z16initialise_chunkiR16global_variables.extracted.7+0x417> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RBX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VMOVQ %R13,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VMOVQ %R12,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VMULSD %XMM0,%XMM1,%XMM16 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x2a0(%R15),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x290(%R15),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x228(%R15),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x248(%R15),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x2b8(%R15),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x2a8(%R15),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x2d0(%R15),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x2c0(%R15),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%RSI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
INC %R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %R9,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %RAX,%R9 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R9,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RSI,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x10,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 42ecd5 <_Z16initialise_chunkiR16global_variables.extracted.7+0x435> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RCX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
DEC %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ %R8,%YMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R10,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ %R10,%YMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM16,%YMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R11,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ %R11,%YMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R15,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ %R15,%YMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
XOR %R15D,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDQU64 0x397ea(%RIP),%YMM21 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVDQU64 0x39800(%RIP),%YMM22 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVDQU64 0x37896(%RIP),%YMM23 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVDQU64 0x3770c(%RIP),%YMM24 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV %RSI,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RAX,-0x40(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV -0x70(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x68(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x60(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x58(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x50(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 42ecd7 <_Z16initialise_chunkiR16global_variables.extracted.7+0x437> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x683270,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x2c(%RBP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD $0x68,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JMP 402e90 <__kmpc_for_static_fini@plt> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JMP 42ed2b <_Z16initialise_chunkiR16global_variables.extracted.7+0x48b> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | initialise_chunk.cpp:77-83 |
Module | exec |
nb instructions | 98 |
nb uops | 100 |
loop length | 423 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 9 |
used zmm registers | 0 |
nb stack references | 14 |
micro-operation queue | 16.67 cycles |
front end | 16.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 3.50 | 3.50 | 9.67 | 9.67 | 11.50 | 7.00 | 3.40 | 11.50 | 11.50 | 11.50 | 3.60 | 9.67 |
cycles | 3.50 | 3.50 | 9.67 | 9.67 | 11.50 | 7.00 | 3.40 | 11.50 | 11.50 | 11.50 | 3.60 | 9.67 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 16.43-16.44 |
Stall cycles | 0.00 |
Front-end | 16.67 |
Dispatch | 11.50 |
Overall L1 | 16.67 |
all | 9% |
load | 25% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 5% |
all | 0% |
load | NA (no load vectorizable/vectorized instructions) |
store | NA (no store vectorizable/vectorized instructions) |
mul | 0% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 9% |
load | 25% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 5% |
all | 15% |
load | 21% |
store | 10% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 12% |
load | NA (no load vectorizable/vectorized instructions) |
store | NA (no store vectorizable/vectorized instructions) |
mul | 12% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 14% |
load | 21% |
store | 10% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x68,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOVL $0,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R8,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVQ $0x1,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x88(%RBP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x30(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x38(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x18(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x683250,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,-0x2c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x22,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
CALL 403020 <__kmpc_for_static_init_8@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x20,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x38(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %R9,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JA 42ecb7 <_Z16initialise_chunkiR16global_variables.extracted.7+0x417> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RBX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VMOVQ %R13,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VMOVQ %R12,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VMULSD %XMM0,%XMM1,%XMM16 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV 0x2a0(%R15),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x290(%R15),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x228(%R15),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x248(%R15),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x2b8(%R15),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x2a8(%R15),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x2d0(%R15),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x2c0(%R15),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%RSI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
INC %R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %R9,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %RAX,%R9 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R9,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RSI,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x10,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 42ecd5 <_Z16initialise_chunkiR16global_variables.extracted.7+0x435> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RCX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
DEC %RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,-0x80(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x70(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ %R8,%YMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R10,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ %R10,%YMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM16,%YMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R11,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ %R11,%YMM19 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R15,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ %R15,%YMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
XOR %R15D,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDQU64 0x397ea(%RIP),%YMM21 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVDQU64 0x39800(%RIP),%YMM22 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVDQU64 0x37896(%RIP),%YMM23 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
VMOVDQU64 0x3770c(%RIP),%YMM24 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV %RSI,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x48(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RAX,-0x40(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV -0x70(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x68(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x60(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x58(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x50(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 42ecd7 <_Z16initialise_chunkiR16global_variables.extracted.7+0x437> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x683270,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x2c(%RBP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD $0x68,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JMP 402e90 <__kmpc_for_static_fini@plt> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JMP 42ed2b <_Z16initialise_chunkiR16global_variables.extracted.7+0x48b> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼initialise_chunk(int, global_variables&) [clone .extracted.7]– | 0.01 | 0.01 |
○Loop 196 - initialise_chunk.cpp:78-83 - exec | 0.01 | 0.01 |
○Loop 195 - initialise_chunk.cpp:78-83 - exec | 0 | 0 |