Function: PdV_kernel(bool, int, int, int, int, double, clover::Buffer2D<double>&, clover::Buffer2D<d ... | Module: exec | Source: PdV.cpp:48-64 [...] | Coverage: 1.61% |
---|
Function: PdV_kernel(bool, int, int, int, int, double, clover::Buffer2D<double>&, clover::Buffer2D<d ... | Module: exec | Source: PdV.cpp:48-64 [...] | Coverage: 1.61% |
---|
/scratch_na/users/xoserete/qaas_runs/171-291-1828/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/context.h: 69 - 69 |
-------------------------------------------------------------------------------- |
69: T &operator()(size_t i, size_t j) const { return data[i + j * sizeX]; } |
/scratch_na/users/xoserete/qaas_runs/171-291-1828/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/PdV.cpp: 48 - 64 |
-------------------------------------------------------------------------------- |
48: #pragma omp parallel for simd collapse(2) |
49: for (int j = (y_min + 1); j < (y_max + 2); j++) { |
50: for (int i = (x_min + 1); i < (x_max + 2); i++) { |
51: double left_flux = (xarea(i, j) * (xvel0(i, j) + xvel0(i + 0, j + 1) + xvel0(i, j) + xvel0(i + 0, j + 1))) * 0.25 * dt * 0.5; |
52: double right_flux = |
53: (xarea(i + 1, j + 0) * (xvel0(i + 1, j + 0) + xvel0(i + 1, j + 1) + xvel0(i + 1, j + 0) + xvel0(i + 1, j + 1))) * 0.25 * dt * |
54: 0.5; |
55: double bottom_flux = (yarea(i, j) * (yvel0(i, j) + yvel0(i + 1, j + 0) + yvel0(i, j) + yvel0(i + 1, j + 0))) * 0.25 * dt * 0.5; |
56: double top_flux = (yarea(i + 0, j + 1) * (yvel0(i + 0, j + 1) + yvel0(i + 1, j + 1) + yvel0(i + 0, j + 1) + yvel0(i + 1, j + 1))) * |
57: 0.25 * dt * 0.5; |
58: double total_flux = right_flux - left_flux + top_flux - bottom_flux; |
59: double volume_change_s = volume(i, j) / (volume(i, j) + total_flux); |
60: double recip_volume = 1.0 / volume(i, j); |
61: double energy_change = (pressure(i, j) / density0(i, j) + viscosity(i, j) / density0(i, j)) * total_flux * recip_volume; |
62: energy1(i, j) = energy0(i, j) - energy_change; |
63: density1(i, j) = density0(i, j) * volume_change_s; |
64: } |
0x434c50 PUSH %RBP |
0x434c51 MOV %RSP,%RBP |
0x434c54 PUSH %R15 |
0x434c56 PUSH %R14 |
0x434c58 PUSH %R13 |
0x434c5a PUSH %R12 |
0x434c5c PUSH %RBX |
0x434c5d AND $-0x20,%RSP |
0x434c61 SUB $0x420,%RSP |
0x434c68 MOV %R8,0xe0(%RSP) |
0x434c70 MOV %RCX,%R12 |
0x434c73 MOV %RDX,%R13 |
0x434c76 MOV 0x70(%RBP),%RAX |
0x434c7a MOV 0x60(%RBP),%R10 |
0x434c7e MOV 0x58(%RBP),%R11 |
0x434c82 MOV 0x48(%RBP),%RCX |
0x434c86 MOV %RCX,0x30(%RSP) |
0x434c8b MOV 0x40(%RBP),%R15 |
0x434c8f MOV 0x38(%RBP),%R8 |
0x434c93 MOV 0x30(%RBP),%RCX |
0x434c97 MOV %RCX,0x28(%RSP) |
0x434c9c MOV 0x28(%RBP),%RSI |
0x434ca0 MOV 0x20(%RBP),%RBX |
0x434ca4 MOV 0x18(%RBP),%RDX |
0x434ca8 MOV 0x10(%RBP),%R14 |
0x434cac MOV 0x50(%RBP),%ECX |
0x434caf MOV %ECX,0x4(%RSP) |
0x434cb3 MOVL $0,0x4c(%RSP) |
0x434cbb TEST %RAX,%RAX |
0x434cbe JS 43571f |
0x434cc4 MOV %RBX,0x40(%RSP) |
0x434cc9 MOV %R8,0x18(%RSP) |
0x434cce MOV %RSI,0x10(%RSP) |
0x434cd3 MOV %RDX,0x100(%RSP) |
0x434cdb MOV %R9,0x20(%RSP) |
0x434ce0 MOV (%RDI),%ESI |
0x434ce2 MOVQ $0,0x98(%RSP) |
0x434cee MOV %RAX,0x90(%RSP) |
0x434cf6 MOVQ $0x1,0xd8(%RSP) |
0x434d02 SUB $0x8,%RSP |
0x434d06 LEA 0xe0(%RSP),%RAX |
0x434d0e LEA 0x54(%RSP),%RCX |
0x434d13 LEA 0xa0(%RSP),%R8 |
0x434d1b LEA 0x98(%RSP),%R9 |
0x434d23 MOV $0x683730,%EDI |
0x434d28 MOV %ESI,0x50(%RSP) |
0x434d2c MOV $0x22,%EDX |
0x434d31 PUSH $0x1 |
0x434d33 PUSH $0x1 |
0x434d35 PUSH %RAX |
0x434d36 MOV %R11,0x28(%RSP) |
0x434d3b MOV %R10,%RBX |
0x434d3e CALL 403020 <__kmpc_for_static_init_8@plt> |
0x434d43 ADD $0x20,%RSP |
0x434d47 MOV 0x98(%RSP),%RSI |
0x434d4f MOV 0x90(%RSP),%RAX |
0x434d57 MOV %RAX,0x80(%RSP) |
0x434d5f CMP %RAX,%RSI |
0x434d62 JA 435700 |
0x434d68 MOV %RBX,%R11 |
0x434d6b VMOVQ %R13,%XMM0 |
0x434d70 SUB 0x8(%RSP),%R11D |
0x434d75 LEA 0x1(%RSI),%RAX |
0x434d79 MOV 0x80(%RSP),%RCX |
0x434d81 INC %RCX |
0x434d84 CMP %RCX,%RAX |
0x434d87 CMOVG %RAX,%RCX |
0x434d8b MOV (%R12),%RAX |
0x434d8f MOV %RAX,0x78(%RSP) |
0x434d94 MOV 0x10(%R12),%RAX |
0x434d99 MOV %RAX,0x88(%RSP) |
0x434da1 MOV (%R15),%RAX |
0x434da4 MOV %RAX,0x38(%RSP) |
0x434da9 MOV 0x10(%R15),%RDI |
0x434dad MOV 0xe0(%RSP),%RAX |
0x434db5 MOV (%RAX),%RDX |
0x434db8 MOV %RDX,0x70(%RSP) |
0x434dbd MOV 0x10(%RAX),%R15 |
0x434dc1 VMULSD 0x31327(%RIP),%XMM0,%XMM4 |
0x434dc9 MOV 0x30(%RSP),%RAX |
0x434dce MOV (%RAX),%RDX |
0x434dd1 MOV %RDX,0x68(%RSP) |
0x434dd6 MOV 0x10(%RAX),%R13 |
0x434dda MOV 0x20(%RSP),%RAX |
0x434ddf MOV (%RAX),%RDX |
0x434de2 MOV %RDX,0x60(%RSP) |
0x434de7 MOV 0x10(%RAX),%RAX |
0x434deb MOV %RAX,0x30(%RSP) |
0x434df0 MOV 0x28(%RSP),%RAX |
0x434df5 MOV (%RAX),%RBX |
0x434df8 MOV 0x10(%RAX),%RAX |
0x434dfc MOV %RAX,0x28(%RSP) |
0x434e01 MOV (%R14),%RAX |
0x434e04 MOV %RAX,0x58(%RSP) |
0x434e09 MOV 0x10(%R14),%R14 |
0x434e0d MOV 0x18(%RSP),%RAX |
0x434e12 MOV (%RAX),%RDX |
0x434e15 MOV 0x10(%RAX),%RAX |
0x434e19 MOV %RAX,0x20(%RSP) |
0x434e1e MOV 0x40(%RSP),%RAX |
0x434e23 MOV (%RAX),%R8 |
0x434e26 MOV 0x10(%RAX),%RAX |
0x434e2a MOV %RAX,0x18(%RSP) |
0x434e2f MOV 0x10(%RSP),%RAX |
0x434e34 MOV (%RAX),%R9 |
0x434e37 MOV 0x10(%RAX),%RAX |
0x434e3b MOV %RAX,0x10(%RSP) |
0x434e40 MOV 0x100(%RSP),%RAX |
0x434e48 MOV (%RAX),%R10 |
0x434e4b MOV 0x10(%RAX),%R12 |
0x434e4f SUB %RSI,%RCX |
0x434e52 MOV $-0x8,%EAX |
0x434e57 MOV %RCX,0xa8(%RSP) |
0x434e5f AND %RCX,%RAX |
0x434e62 MOV %RBX,0xd0(%RSP) |
0x434e6a MOV %RDX,0xc8(%RSP) |
0x434e72 MOV %R8,0xc0(%RSP) |
0x434e7a MOV %R9,0xb8(%RSP) |
0x434e82 MOV %R10,0xb0(%RSP) |
0x434e8a JE 4358ec |
0x434e90 MOV %RAX,%RCX |
0x434e93 MOV %R11,0xa0(%RSP) |
0x434e9b VPBROADCASTQ %R11,%YMM0 |
0x434ea1 VMOVDQU %YMM0,0x300(%RSP) |
0x434eaa MOV %R12,0x50(%RSP) |
0x434eaf MOV 0x4(%RSP),%EAX |
0x434eb3 VPBROADCASTD %EAX,%YMM0 |
0x434eb9 VMOVDQU %YMM0,0x2e0(%RSP) |
0x434ec2 MOV 0x8(%RSP),%RAX |
0x434ec7 VPBROADCASTD %EAX,%YMM0 |
0x434ecd VMOVDQU %YMM0,0x2c0(%RSP) |
0x434ed6 MOV 0x78(%RSP),%RAX |
0x434edb VPBROADCASTQ %RAX,%YMM0 |
0x434ee1 VMOVDQU %YMM0,0x2a0(%RSP) |
0x434eea MOV 0x38(%RSP),%RAX |
0x434eef VPBROADCASTQ %RAX,%YMM0 |
0x434ef5 VMOVDQU %YMM0,0x280(%RSP) |
0x434efe MOV 0x70(%RSP),%RAX |
0x434f03 VPBROADCASTQ %RAX,%YMM0 |
0x434f09 VMOVDQU %YMM0,0x260(%RSP) |
0x434f12 MOV 0x68(%RSP),%RAX |
0x434f17 VPBROADCASTQ %RAX,%YMM0 |
0x434f1d VMOVDQU %YMM0,0x240(%RSP) |
0x434f26 VMOVUPD %XMM4,0x130(%RSP) |
0x434f2f VBROADCASTSD %XMM4,%YMM0 |
0x434f34 VMOVUPD %YMM0,0x220(%RSP) |
0x434f3d MOV 0x60(%RSP),%RAX |
0x434f42 VPBROADCASTQ %RAX,%YMM0 |
0x434f48 VMOVDQU %YMM0,0x200(%RSP) |
0x434f51 VPBROADCASTQ %RBX,%YMM0 |
0x434f57 VMOVDQU %YMM0,0x1e0(%RSP) |
0x434f60 MOV 0x58(%RSP),%RAX |
0x434f65 VPBROADCASTQ %RAX,%YMM0 |
0x434f6b VMOVDQU %YMM0,0x1c0(%RSP) |
0x434f74 VPBROADCASTQ %RDX,%YMM0 |
0x434f7a VMOVDQU %YMM0,0x1a0(%RSP) |
0x434f83 VPBROADCASTQ %R8,%YMM0 |
0x434f89 VMOVDQU %YMM0,0x180(%RSP) |
0x434f92 VPBROADCASTQ %R9,%YMM0 |
0x434f98 VMOVDQU %YMM0,0x160(%RSP) |
0x434fa1 VPBROADCASTQ %RSI,%YMM0 |
0x434fa7 VPADDQ 0x312d1(%RIP),%YMM0,%YMM9 |
0x434faf VPADDQ 0x31149(%RIP),%YMM0,%YMM0 |
0x434fb7 VPBROADCASTQ %R10,%YMM1 |
0x434fbd VMOVDQU %YMM1,0x140(%RSP) |
0x434fc6 XOR %EAX,%EAX |
0x434fc8 NOPL (%RAX,%RAX,1) |
(247) 0x434fd0 MOV %RAX,0x40(%RSP) |
(247) 0x434fd5 VMOVDQU %YMM0,0xe0(%RSP) |
(247) 0x434fde VMOVDQU %YMM9,0x100(%RSP) |
(247) 0x434fe7 VMOVDQU 0xe0(%RSP),%YMM0 |
(247) 0x434ff0 VMOVUPS 0x300(%RSP),%YMM8 |
(247) 0x434ff9 VMOVAPS %YMM8,%YMM1 |
(247) 0x434ffd MOV %RCX,%R12 |
(247) 0x435000 MOV $0x454690,%RBX |
(247) 0x435007 CALL %RBX |
(247) 0x435009 VMOVDQA %YMM0,%YMM11 |
(247) 0x43500d VMOVDQA %YMM9,%YMM0 |
(247) 0x435011 VMOVAPS %YMM8,%YMM1 |
(247) 0x435015 CALL %RBX |
(247) 0x435017 VPMOVQD %YMM11,%XMM1 |
(247) 0x43501d VPMOVQD %YMM0,%XMM0 |
(247) 0x435023 VINSERTI128 $0x1,%XMM0,%YMM1,%YMM0 |
(247) 0x435029 VPADDD 0x2e0(%RSP),%YMM0,%YMM29 |
(247) 0x435031 VMOVDQU 0xe0(%RSP),%YMM0 |
(247) 0x43503a VMOVAPS %YMM8,%YMM1 |
(247) 0x43503e MOV $0x454460,%RBX |
(247) 0x435045 CALL %RBX |
(247) 0x435047 VMOVDQA %YMM0,%YMM11 |
(247) 0x43504b VMOVDQA %YMM9,%YMM0 |
(247) 0x43504f VMOVAPS %YMM8,%YMM1 |
(247) 0x435053 CALL %RBX |
(247) 0x435055 MOV %R12,%RCX |
(247) 0x435058 VPMOVQD %YMM11,%XMM1 |
(247) 0x43505e VPMOVQD %YMM0,%XMM0 |
(247) 0x435064 VINSERTI128 $0x1,%XMM0,%YMM1,%YMM0 |
(247) 0x43506a VPADDD 0x2c0(%RSP),%YMM0,%YMM11 |
(247) 0x435073 VPMOVSXDQ %XMM11,%YMM13 |
(247) 0x435078 VPMOVSXDQ %XMM29,%YMM15 |
(247) 0x43507e VMOVDQU 0x2a0(%RSP),%YMM9 |
(247) 0x435087 VXORPS %XMM4,%XMM4,%XMM4 |
(247) 0x43508b VPMULLQ %YMM15,%YMM9,%YMM4 |
(247) 0x435091 VPXOR %XMM1,%XMM1,%XMM1 |
(247) 0x435095 VPADDQ %YMM4,%YMM13,%YMM6 |
(247) 0x435099 KXNORW %K0,%K0,%K1 |
(247) 0x43509d VMOVDQU 0x280(%RSP),%YMM3 |
(247) 0x4350a6 VPMULLQ %YMM15,%YMM3,%YMM7 |
(247) 0x4350ac VXORPD %XMM2,%XMM2,%XMM2 |
(247) 0x4350b0 VPADDQ %YMM7,%YMM13,%YMM8 |
(247) 0x4350b4 VPCMPEQD %YMM0,%YMM0,%YMM0 |
(247) 0x4350b8 VPSUBD %YMM0,%YMM29,%YMM5 |
(247) 0x4350be VMOVDQU %YMM5,0x3a0(%RSP) |
(247) 0x4350c7 VPMOVSXDQ %XMM5,%YMM10 |
(247) 0x4350cc VPMULLQ %YMM10,%YMM3,%YMM12 |
(247) 0x4350d2 MOV 0x88(%RSP),%R10 |
(247) 0x4350da VGATHERQPD (%R10,%YMM6,8),%YMM1{%K1} |
(247) 0x4350e1 VMOVUPD %YMM1,0x3e0(%RSP) |
(247) 0x4350ea KXNORW %K0,%K0,%K1 |
(247) 0x4350ee VPSUBD %YMM0,%YMM11,%YMM17 |
(247) 0x4350f4 VPMOVSXDQ %XMM17,%YMM14 |
(247) 0x4350fa VPADDQ %YMM4,%YMM14,%YMM6 |
(247) 0x4350fe VPXOR %XMM0,%XMM0,%XMM0 |
(247) 0x435102 VGATHERQPD (%RDI,%YMM8,8),%YMM2{%K1} |
(247) 0x435109 VMOVUPD %YMM2,0x3c0(%RSP) |
(247) 0x435112 KXNORW %K0,%K0,%K1 |
(247) 0x435116 VPADDQ %YMM7,%YMM14,%YMM8 |
(247) 0x43511a VMOVDQU 0x260(%RSP),%YMM5 |
(247) 0x435123 VXORPS %XMM7,%XMM7,%XMM7 |
(247) 0x435127 VPMULLQ %YMM15,%YMM5,%YMM7 |
(247) 0x43512d VGATHERQPD (%R10,%YMM6,8),%YMM0{%K1} |
(247) 0x435134 VMOVUPD %YMM0,0x380(%RSP) |
(247) 0x43513d VXORPD %XMM0,%XMM0,%XMM0 |
(247) 0x435141 KXNORW %K0,%K0,%K1 |
(247) 0x435145 VPADDQ %YMM13,%YMM7,%YMM16 |
(247) 0x43514b VXORPD %XMM2,%XMM2,%XMM2 |
(247) 0x43514f KXNORW %K0,%K0,%K2 |
(247) 0x435153 VGATHERQPD (%RDI,%YMM8,8),%YMM0{%K1} |
(247) 0x43515a VMOVUPD %YMM0,0x360(%RSP) |
(247) 0x435163 VMOVDQU 0x240(%RSP),%YMM4 |
(247) 0x43516c VXORPS %XMM8,%XMM8,%XMM8 |
(247) 0x435171 VPMULLQ %YMM15,%YMM4,%YMM8 |
(247) 0x435177 VPADDQ %YMM13,%YMM8,%YMM1 |
(247) 0x43517c VXORPD %XMM0,%XMM0,%XMM0 |
(247) 0x435180 VGATHERQPD (%R15,%YMM16,8),%YMM2{%K2} |
(247) 0x435187 VMOVUPD %YMM2,0x340(%RSP) |
(247) 0x435190 KXNORW %K0,%K0,%K1 |
(247) 0x435194 VPADDQ %YMM14,%YMM8,%YMM8 |
(247) 0x435199 VMOVDQU 0x200(%RSP),%YMM2 |
(247) 0x4351a2 VPXORD %XMM16,%XMM16,%XMM16 |
(247) 0x4351a8 VPMULLQ %YMM15,%YMM2,%YMM16 |
(247) 0x4351ae VGATHERQPD (%R13,%YMM1,8),%YMM0{%K1} |
(247) 0x4351b6 VMOVUPD %YMM0,0x320(%RSP) |
(247) 0x4351bf VXORPD %XMM28,%XMM28,%XMM28 |
(247) 0x4351c5 KXNORW %K0,%K0,%K1 |
(247) 0x4351c9 VPADDQ %YMM13,%YMM16,%YMM16 |
(247) 0x4351cf VXORPD %XMM31,%XMM31,%XMM31 |
(247) 0x4351d5 KXNORW %K0,%K0,%K2 |
(247) 0x4351d9 VGATHERQPD (%R13,%YMM8,8),%YMM28{%K1} |
(247) 0x4351e1 VMOVDQU64 0x1e0(%RSP),%YMM27 |
(247) 0x4351e9 VXORPS %XMM8,%XMM8,%XMM8 |
(247) 0x4351ee VPMULLQ %YMM15,%YMM27,%YMM8 |
(247) 0x4351f4 VPADDQ %YMM13,%YMM8,%YMM8 |
(247) 0x4351f9 VPXOR %XMM7,%XMM7,%XMM7 |
(247) 0x4351fd MOV 0x30(%RSP),%RAX |
(247) 0x435202 VGATHERQPD (%RAX,%YMM16,8),%YMM31{%K2} |
(247) 0x435209 KXNORW %K0,%K0,%K1 |
(247) 0x43520d VMOVDQU 0x1a0(%RSP),%YMM1 |
(247) 0x435216 VPXORD %XMM16,%XMM16,%XMM16 |
(247) 0x43521c VPMULLQ %YMM15,%YMM1,%YMM16 |
(247) 0x435222 VPADDQ %YMM13,%YMM16,%YMM16 |
(247) 0x435228 MOV 0x28(%RSP),%RDX |
(247) 0x43522d VGATHERQPD (%RDX,%YMM8,8),%YMM7{%K1} |
(247) 0x435234 VXORPD %XMM19,%XMM19,%XMM19 |
(247) 0x43523a KXNORW %K0,%K0,%K1 |
(247) 0x43523e VMOVDQU 0x180(%RSP),%YMM0 |
(247) 0x435247 VXORPS %XMM8,%XMM8,%XMM8 |
(247) 0x43524c VPMULLQ %YMM15,%YMM0,%YMM8 |
(247) 0x435252 MOV 0x20(%RSP),%R8 |
(247) 0x435257 VGATHERQPD (%R8,%YMM16,8),%YMM19{%K1} |
(247) 0x43525e VPADDQ %YMM13,%YMM8,%YMM8 |
(247) 0x435263 VXORPD %XMM20,%XMM20,%XMM20 |
(247) 0x435269 KXNORW %K0,%K0,%K1 |
(247) 0x43526d MOV 0x18(%RSP),%R9 |
(247) 0x435272 VGATHERQPD (%R9,%YMM8,8),%YMM20{%K1} |
(247) 0x435279 VPADDQ %YMM13,%YMM12,%YMM8 |
(247) 0x43527e VXORPD %XMM23,%XMM23,%XMM23 |
(247) 0x435284 KXNORW %K0,%K0,%K1 |
(247) 0x435288 VPADDQ %YMM14,%YMM12,%YMM12 |
(247) 0x43528d VXORPD %XMM22,%XMM22,%XMM22 |
(247) 0x435293 VGATHERQPD (%RDI,%YMM8,8),%YMM23{%K1} |
(247) 0x43529a KXNORW %K0,%K0,%K1 |
(247) 0x43529e VXORPS %XMM8,%XMM8,%XMM8 |
(247) 0x4352a3 VPMULLQ %YMM10,%YMM5,%YMM8 |
(247) 0x4352a9 VPADDQ %YMM13,%YMM8,%YMM8 |
(247) 0x4352ae VGATHERQPD (%RDI,%YMM12,8),%YMM22{%K1} |
(247) 0x4352b5 VXORPD %XMM21,%XMM21,%XMM21 |
(247) 0x4352bb KXNORW %K0,%K0,%K1 |
(247) 0x4352bf VXORPS %XMM12,%XMM12,%XMM12 |
(247) 0x4352c4 VPMULLQ %YMM10,%YMM4,%YMM12 |
(247) 0x4352ca VGATHERQPD (%R15,%YMM8,8),%YMM21{%K1} |
(247) 0x4352d1 VPADDQ %YMM13,%YMM12,%YMM8 |
(247) 0x4352d6 VXORPD %XMM6,%XMM6,%XMM6 |
(247) 0x4352da KXNORW %K0,%K0,%K1 |
(247) 0x4352de VGATHERQPD (%R13,%YMM8,8),%YMM6{%K1} |
(247) 0x4352e6 VEXTRACTI128 $0x1,%YMM11,%XMM8 |
(247) 0x4352ec VPMOVSXDQ %XMM8,%YMM11 |
(247) 0x4352f1 VPADDQ %YMM14,%YMM12,%YMM8 |
(247) 0x4352f6 VXORPD %XMM24,%XMM24,%XMM24 |
(247) 0x4352fc KXNORW %K0,%K0,%K1 |
(247) 0x435300 VGATHERQPD (%R13,%YMM8,8),%YMM24{%K1} |
(247) 0x435308 VEXTRACTI32X4 $0x1,%YMM29,%XMM8 |
(247) 0x43530f VPMOVSXDQ %XMM8,%YMM12 |
(247) 0x435314 VXORPS %XMM8,%XMM8,%XMM8 |
(247) 0x435319 VPMULLQ %YMM12,%YMM9,%YMM8 |
(247) 0x43531f VPADDQ %YMM11,%YMM8,%YMM14 |
(247) 0x435324 VPXORD %XMM29,%XMM29,%XMM29 |
(247) 0x43532a KXNORW %K0,%K0,%K1 |
(247) 0x43532e VPXORD %XMM16,%XMM16,%XMM16 |
(247) 0x435334 VPMULLQ %YMM12,%YMM3,%YMM16 |
(247) 0x43533a VGATHERQPD (%R10,%YMM14,8),%YMM29{%K1} |
(247) 0x435341 VPADDQ %YMM11,%YMM16,%YMM14 |
(247) 0x435347 VXORPD %XMM25,%XMM25,%XMM25 |
(247) 0x43534d KXNORW %K0,%K0,%K1 |
(247) 0x435351 VEXTRACTI32X4 $0x1,%YMM17,%XMM17 |
(247) 0x435358 VPMOVSXDQ %XMM17,%YMM18 |
(247) 0x43535e VGATHERQPD (%RDI,%YMM14,8),%YMM25{%K1} |
(247) 0x435365 VPADDQ %YMM18,%YMM8,%YMM8 |
(247) 0x43536b VXORPD %XMM26,%XMM26,%XMM26 |
(247) 0x435371 KXNORW %K0,%K0,%K1 |
(247) 0x435375 VPADDQ %YMM18,%YMM16,%YMM14 |
(247) 0x43537b VPXORD %XMM17,%XMM17,%XMM17 |
(247) 0x435381 VGATHERQPD (%R10,%YMM8,8),%YMM26{%K1} |
(247) 0x435388 KXNORW %K0,%K0,%K1 |
(247) 0x43538c VXORPS %XMM8,%XMM8,%XMM8 |
(247) 0x435391 VPMULLQ %YMM12,%YMM5,%YMM8 |
(247) 0x435397 VPADDQ %YMM11,%YMM8,%YMM8 |
(247) 0x43539c VGATHERQPD (%RDI,%YMM14,8),%YMM17{%K1} |
(247) 0x4353a3 VPXOR %XMM9,%XMM9,%XMM9 |
(247) 0x4353a8 KXNORW %K0,%K0,%K1 |
(247) 0x4353ac VXORPS %XMM14,%XMM14,%XMM14 |
(247) 0x4353b1 VPMULLQ %YMM12,%YMM4,%YMM14 |
(247) 0x4353b7 VGATHERQPD (%R15,%YMM8,8),%YMM9{%K1} |
(247) 0x4353be VPADDQ %YMM11,%YMM14,%YMM8 |
(247) 0x4353c3 VXORPD %XMM30,%XMM30,%XMM30 |
(247) 0x4353c9 KXNORW %K0,%K0,%K1 |
(247) 0x4353cd VPADDQ %YMM18,%YMM14,%YMM14 |
(247) 0x4353d3 VPXOR %XMM10,%XMM10,%XMM10 |
(247) 0x4353d8 VGATHERQPD (%R13,%YMM8,8),%YMM30{%K1} |
(247) 0x4353e0 KXNORW %K0,%K0,%K1 |
(247) 0x4353e4 VXORPS %XMM8,%XMM8,%XMM8 |
(247) 0x4353e9 VPMULLQ %YMM12,%YMM2,%YMM8 |
(247) 0x4353ef VPADDQ %YMM11,%YMM8,%YMM8 |
(247) 0x4353f4 VGATHERQPD (%R13,%YMM14,8),%YMM10{%K1} |
(247) 0x4353fc VXORPD %XMM14,%XMM14,%XMM14 |
(247) 0x435401 KXNORW %K0,%K0,%K1 |
(247) 0x435405 VPXORD %XMM16,%XMM16,%XMM16 |
(247) 0x43540b VPMULLQ %YMM12,%YMM27,%YMM16 |
(247) 0x435411 VGATHERQPD (%RAX,%YMM8,8),%YMM14{%K1} |
(247) 0x435418 VPADDQ %YMM11,%YMM16,%YMM8 |
(247) 0x43541e VPXORD %XMM27,%XMM27,%XMM27 |
(247) 0x435424 KXNORW %K0,%K0,%K1 |
(247) 0x435428 VGATHERQPD (%RDX,%YMM8,8),%YMM27{%K1} |
(247) 0x43542f VXORPS %XMM8,%XMM8,%XMM8 |
(247) 0x435434 VPMULLQ %YMM12,%YMM1,%YMM8 |
(247) 0x43543a VPADDQ %YMM11,%YMM8,%YMM8 |
(247) 0x43543f KXNORW %K0,%K0,%K1 |
(247) 0x435443 VPXORD %XMM16,%XMM16,%XMM16 |
(247) 0x435449 VGATHERQPD (%R8,%YMM8,8),%YMM16{%K1} |
(247) 0x435450 VXORPS %XMM8,%XMM8,%XMM8 |
(247) 0x435455 VPMULLQ %YMM12,%YMM0,%YMM8 |
(247) 0x43545b VPADDQ %YMM11,%YMM8,%YMM0 |
(247) 0x435460 KXNORW %K0,%K0,%K1 |
(247) 0x435464 VPXOR %XMM8,%XMM8,%XMM8 |
(247) 0x435469 VGATHERQPD (%R9,%YMM0,8),%YMM8{%K1} |
(247) 0x435470 VMOVDQU 0x3a0(%RSP),%YMM0 |
(247) 0x435479 VEXTRACTI128 $0x1,%YMM0,%XMM0 |
(247) 0x43547f VPMOVSXDQ %XMM0,%YMM1 |
(247) 0x435484 KXNORW %K0,%K0,%K1 |
(247) 0x435488 VXORPS %XMM0,%XMM0,%XMM0 |
(247) 0x43548c VPMULLQ %YMM1,%YMM3,%YMM0 |
(247) 0x435492 VPADDQ %YMM0,%YMM11,%YMM3 |
(247) 0x435496 VPXOR %XMM2,%XMM2,%XMM2 |
(247) 0x43549a VGATHERQPD (%RDI,%YMM3,8),%YMM2{%K1} |
(247) 0x4354a1 VPADDQ %YMM18,%YMM0,%YMM0 |
(247) 0x4354a7 KXNORW %K0,%K0,%K1 |
(247) 0x4354ab VXORPD %XMM3,%XMM3,%XMM3 |
(247) 0x4354af VGATHERQPD (%RDI,%YMM0,8),%YMM3{%K1} |
(247) 0x4354b6 VXORPS %XMM0,%XMM0,%XMM0 |
(247) 0x4354ba VPMULLQ %YMM1,%YMM5,%YMM0 |
(247) 0x4354c0 VPADDQ %YMM0,%YMM11,%YMM0 |
(247) 0x4354c4 KXNORW %K0,%K0,%K1 |
(247) 0x4354c8 VPXOR %XMM5,%XMM5,%XMM5 |
(247) 0x4354cc VGATHERQPD (%R15,%YMM0,8),%YMM5{%K1} |
(247) 0x4354d3 VXORPS %XMM0,%XMM0,%XMM0 |
(247) 0x4354d7 VPMULLQ %YMM1,%YMM4,%YMM0 |
(247) 0x4354dd KXNORW %K0,%K0,%K1 |
(247) 0x4354e1 VPADDQ %YMM0,%YMM11,%YMM1 |
(247) 0x4354e5 VPXOR %XMM4,%XMM4,%XMM4 |
(247) 0x4354e9 VGATHERQPD (%R13,%YMM1,8),%YMM4{%K1} |
(247) 0x4354f1 VPADDQ %YMM18,%YMM0,%YMM0 |
(247) 0x4354f7 KXNORW %K0,%K0,%K1 |
(247) 0x4354fb VXORPD %XMM1,%XMM1,%XMM1 |
(247) 0x4354ff VGATHERQPD (%R13,%YMM0,8),%YMM1{%K1} |
(247) 0x435507 VADDPD %YMM30,%YMM10,%YMM0 |
(247) 0x43550d VADDPD %YMM25,%YMM2,%YMM2 |
(247) 0x435513 VMULPD %YMM0,%YMM9,%YMM0 |
(247) 0x435517 VFMADD231PD %YMM2,%YMM29,%YMM0 |
(247) 0x43551d VADDPD 0x3c0(%RSP),%YMM23,%YMM2 |
(247) 0x435525 VADDPD %YMM17,%YMM3,%YMM3 |
(247) 0x43552b VADDPD 0x320(%RSP),%YMM28,%YMM9 |
(247) 0x435533 VFNMADD231PD %YMM3,%YMM26,%YMM0 |
(247) 0x435539 VMOVDQU 0x1c0(%RSP),%YMM10 |
(247) 0x435542 VXORPS %XMM3,%XMM3,%XMM3 |
(247) 0x435546 VPMULLQ %YMM15,%YMM10,%YMM3 |
(247) 0x43554c VPMULLQ %YMM12,%YMM10,%YMM10 |
(247) 0x435552 VMULPD 0x340(%RSP),%YMM9,%YMM9 |
(247) 0x43555b VFMADD231PD 0x3e0(%RSP),%YMM2,%YMM9 |
(247) 0x435565 VPADDQ %YMM3,%YMM13,%YMM2 |
(247) 0x435569 VPXOR %XMM3,%XMM3,%XMM3 |
(247) 0x43556d KXNORW %K0,%K0,%K1 |
(247) 0x435571 VGATHERQPD (%R14,%YMM2,8),%YMM3{%K1} |
(247) 0x435578 VADDPD 0x360(%RSP),%YMM22,%YMM17 |
(247) 0x435580 VFNMADD231PD 0x380(%RSP),%YMM17,%YMM9 |
(247) 0x435588 VPADDQ %YMM11,%YMM10,%YMM10 |
(247) 0x43558d VXORPD %XMM17,%XMM17,%XMM17 |
(247) 0x435593 KXNORW %K0,%K0,%K1 |
(247) 0x435597 VGATHERQPD (%R14,%YMM10,8),%YMM17{%K1} |
(247) 0x43559e VADDPD %YMM6,%YMM24,%YMM6 |
(247) 0x4355a4 VFMSUB213PD %YMM9,%YMM21,%YMM6 |
(247) 0x4355aa VADDPD %YMM7,%YMM19,%YMM7 |
(247) 0x4355b0 VMOVUPD 0x220(%RSP),%YMM9 |
(247) 0x4355b9 VMULPD %YMM6,%YMM9,%YMM6 |
(247) 0x4355bd VMULPD %YMM31,%YMM3,%YMM3 |
(247) 0x4355c3 VMULPD %YMM6,%YMM7,%YMM7 |
(247) 0x4355c7 VDIVPD %YMM3,%YMM7,%YMM3 |
(247) 0x4355cb VSUBPD %YMM3,%YMM20,%YMM3 |
(247) 0x4355d1 VMOVDQU64 0x160(%RSP),%YMM18 |
(247) 0x4355d9 VXORPS %XMM7,%XMM7,%XMM7 |
(247) 0x4355dd VPMULLQ %YMM15,%YMM18,%YMM7 |
(247) 0x4355e3 VPADDQ %YMM7,%YMM13,%YMM7 |
(247) 0x4355e7 KXNORW %K0,%K0,%K1 |
(247) 0x4355eb MOV 0x10(%RSP),%RAX |
(247) 0x4355f0 VSCATTERQPD %YMM3,(%RAX,%YMM7,8){%K1} |
(247) 0x4355f7 VADDPD %YMM4,%YMM1,%YMM1 |
(247) 0x4355fb VFMSUB213PD %YMM0,%YMM5,%YMM1 |
(247) 0x435600 VADDPD %YMM27,%YMM16,%YMM0 |
(247) 0x435606 VMULPD %YMM1,%YMM9,%YMM1 |
(247) 0x43560a VMOVDQU 0x100(%RSP),%YMM9 |
(247) 0x435613 VMULPD %YMM14,%YMM17,%YMM3 |
(247) 0x435619 VMULPD %YMM1,%YMM0,%YMM0 |
(247) 0x43561d VDIVPD %YMM3,%YMM0,%YMM0 |
(247) 0x435621 VSUBPD %YMM0,%YMM8,%YMM0 |
(247) 0x435625 VXORPS %XMM3,%XMM3,%XMM3 |
(247) 0x435629 VPMULLQ %YMM12,%YMM18,%YMM3 |
(247) 0x43562f VPADDQ %YMM3,%YMM11,%YMM3 |
(247) 0x435633 KXNORW %K0,%K0,%K1 |
(247) 0x435637 VSCATTERQPD %YMM0,(%RAX,%YMM3,8){%K1} |
(247) 0x43563e VXORPD %XMM0,%XMM0,%XMM0 |
(247) 0x435642 KXNORW %K0,%K0,%K1 |
(247) 0x435646 VGATHERQPD (%R14,%YMM10,8),%YMM0{%K1} |
(247) 0x43564d VXORPD %XMM3,%XMM3,%XMM3 |
(247) 0x435651 KXNORW %K0,%K0,%K1 |
(247) 0x435655 VGATHERQPD (%R14,%YMM2,8),%YMM3{%K1} |
(247) 0x43565c VADDPD %YMM31,%YMM6,%YMM2 |
(247) 0x435662 VMULPD %YMM31,%YMM3,%YMM3 |
(247) 0x435668 VMOVDQU 0x140(%RSP),%YMM5 |
(247) 0x435671 VPMULLQ %YMM15,%YMM5,%YMM4 |
(247) 0x435677 VPADDQ %YMM4,%YMM13,%YMM4 |
(247) 0x43567b VDIVPD %YMM2,%YMM3,%YMM2 |
(247) 0x43567f KXNORW %K0,%K0,%K1 |
(247) 0x435683 MOV 0x50(%RSP),%RAX |
(247) 0x435688 VSCATTERQPD %YMM2,(%RAX,%YMM4,8){%K1} |
(247) 0x43568f VADDPD %YMM1,%YMM14,%YMM1 |
(247) 0x435693 VMULPD %YMM0,%YMM14,%YMM0 |
(247) 0x435697 VDIVPD %YMM1,%YMM0,%YMM0 |
(247) 0x43569b VXORPS %XMM1,%XMM1,%XMM1 |
(247) 0x43569f VPMULLQ %YMM12,%YMM5,%YMM1 |
(247) 0x4356a5 VPADDQ %YMM1,%YMM11,%YMM1 |
(247) 0x4356a9 KXNORW %K0,%K0,%K1 |
(247) 0x4356ad VSCATTERQPD %YMM0,(%RAX,%YMM1,8){%K1} |
(247) 0x4356b4 MOV 0x40(%RSP),%RAX |
(247) 0x4356b9 VMOVDQU 0xe0(%RSP),%YMM0 |
(247) 0x4356c2 VPBROADCASTQ 0x30bd5(%RIP),%YMM1 |
(247) 0x4356cb VPADDQ %YMM1,%YMM0,%YMM0 |
(247) 0x4356cf VPADDQ %YMM1,%YMM9,%YMM9 |
(247) 0x4356d3 ADD $0x8,%RAX |
(247) 0x4356d7 CMP %R12,%RAX |
(247) 0x4356da JB 434fd0 |
0x4356e0 CMP %RCX,0xa8(%RSP) |
0x4356e8 MOV 0xa0(%RSP),%R11 |
0x4356f0 VMOVUPD 0x130(%RSP),%XMM4 |
0x4356f9 MOV 0x50(%RSP),%R12 |
0x4356fe JNE 43572e |
0x435700 MOV $0x683750,%EDI |
0x435705 MOV 0x48(%RSP),%ESI |
0x435709 LEA -0x28(%RBP),%RSP |
0x43570d POP %RBX |
0x43570e POP %R12 |
0x435710 POP %R13 |
0x435712 POP %R14 |
0x435714 POP %R15 |
0x435716 POP %RBP |
0x435717 VZEROUPPER |
0x43571a JMP 402e90 |
0x43571f LEA -0x28(%RBP),%RSP |
0x435723 POP %RBX |
0x435724 POP %R12 |
0x435726 POP %R13 |
0x435728 POP %R14 |
0x43572a POP %R15 |
0x43572c POP %RBP |
0x43572d RET |
0x43572e ADD %RCX,%RSI |
0x435731 JMP 4358ec |
0x435736 NOPW %CS:(%RAX,%RAX,1) |
(246) 0x435740 MOV %RSI,%RAX |
(246) 0x435743 CQTO |
(246) 0x435745 IDIV %R11 |
(246) 0x435748 MOV 0x8(%RSP),%RAX |
(246) 0x43574d ADD 0x4(%RSP),%ECX |
(246) 0x435751 ADD %EAX,%EDX |
(246) 0x435753 MOVSXD %EDX,%RDX |
(246) 0x435756 MOVSXD %ECX,%RAX |
(246) 0x435759 MOV %R9,%R8 |
(246) 0x43575c IMUL %RAX,%R8 |
(246) 0x435760 LEA 0x1(%RAX),%ECX |
(246) 0x435763 MOVSXD %ECX,%RCX |
(246) 0x435766 IMUL %RCX,%R9 |
(246) 0x43576a LEA (%R9,%RDX,1),%R10 |
(246) 0x43576e VMOVSD (%RDI,%R10,8),%XMM0 |
(246) 0x435774 LEA (%R8,%RDX,1),%R10 |
(246) 0x435778 VADDSD (%RDI,%R10,8),%XMM0,%XMM0 |
(246) 0x43577e LEA 0x1(%R8,%RDX,1),%R8 |
(246) 0x435783 LEA 0x1(%R9,%RDX,1),%R9 |
(246) 0x435788 VMOVSD (%RDI,%R9,8),%XMM1 |
(246) 0x43578e VADDSD (%RDI,%R8,8),%XMM1,%XMM1 |
(246) 0x435794 MOV 0x68(%RSP),%RBX |
(246) 0x435799 MOV %RBX,%R8 |
(246) 0x43579c IMUL %RAX,%R8 |
(246) 0x4357a0 LEA 0x1(%R8,%RDX,1),%R9 |
(246) 0x4357a5 ADD %RDX,%R8 |
(246) 0x4357a8 VMOVSD (%R13,%R9,8),%XMM2 |
(246) 0x4357af VADDSD (%R13,%R8,8),%XMM2,%XMM2 |
(246) 0x4357b6 MOV 0x70(%RSP),%R10 |
(246) 0x4357bb MOV %R10,%R8 |
(246) 0x4357be IMUL %RCX,%R8 |
(246) 0x4357c2 IMUL %RBX,%RCX |
(246) 0x4357c6 LEA 0x1(%RCX,%RDX,1),%R9 |
(246) 0x4357cb VMOVSD (%R13,%R9,8),%XMM3 |
(246) 0x4357d2 MOV 0x78(%RSP),%R9 |
(246) 0x4357d7 ADD %RDX,%RCX |
(246) 0x4357da VADDSD (%R13,%RCX,8),%XMM3,%XMM3 |
(246) 0x4357e1 IMUL %RAX,%R9 |
(246) 0x4357e5 MOV %R10,%RCX |
(246) 0x4357e8 IMUL %RAX,%RCX |
(246) 0x4357ec ADD %RDX,%RCX |
(246) 0x4357ef VMULSD (%R15,%RCX,8),%XMM2,%XMM2 |
(246) 0x4357f5 LEA 0x1(%R9,%RDX,1),%RCX |
(246) 0x4357fa ADD %RDX,%R9 |
(246) 0x4357fd MOV 0x88(%RSP),%R10 |
(246) 0x435805 VFMADD231SD (%R10,%R9,8),%XMM0,%XMM2 |
(246) 0x43580b ADD %RDX,%R8 |
(246) 0x43580e VFNMADD231SD (%R10,%RCX,8),%XMM1,%XMM2 |
(246) 0x435814 VFMSUB231SD (%R15,%R8,8),%XMM3,%XMM2 |
(246) 0x43581a VMULSD %XMM2,%XMM4,%XMM0 |
(246) 0x43581e MOV 0x60(%RSP),%RCX |
(246) 0x435823 IMUL %RAX,%RCX |
(246) 0x435827 ADD %RDX,%RCX |
(246) 0x43582a MOV 0x30(%RSP),%R8 |
(246) 0x43582f VMOVSD (%R8,%RCX,8),%XMM1 |
(246) 0x435835 MOV 0xd0(%RSP),%RCX |
(246) 0x43583d IMUL %RAX,%RCX |
(246) 0x435841 ADD %RDX,%RCX |
(246) 0x435844 MOV 0xc8(%RSP),%R8 |
(246) 0x43584c IMUL %RAX,%R8 |
(246) 0x435850 ADD %RDX,%R8 |
(246) 0x435853 MOV 0x20(%RSP),%R9 |
(246) 0x435858 VMOVSD (%R9,%R8,8),%XMM2 |
(246) 0x43585e MOV 0x58(%RSP),%R8 |
(246) 0x435863 IMUL %RAX,%R8 |
(246) 0x435867 ADD %RDX,%R8 |
(246) 0x43586a MOV 0x28(%RSP),%R9 |
(246) 0x43586f VADDSD (%R9,%RCX,8),%XMM2,%XMM2 |
(246) 0x435875 VMULSD %XMM0,%XMM2,%XMM2 |
(246) 0x435879 VMULSD (%R14,%R8,8),%XMM1,%XMM3 |
(246) 0x43587f VDIVSD %XMM3,%XMM2,%XMM2 |
(246) 0x435883 MOV 0xc0(%RSP),%RCX |
(246) 0x43588b IMUL %RAX,%RCX |
(246) 0x43588f ADD %RDX,%RCX |
(246) 0x435892 MOV 0x18(%RSP),%R9 |
(246) 0x435897 VMOVSD (%R9,%RCX,8),%XMM3 |
(246) 0x43589d VSUBSD %XMM2,%XMM3,%XMM2 |
(246) 0x4358a1 MOV 0xb8(%RSP),%RCX |
(246) 0x4358a9 IMUL %RAX,%RCX |
(246) 0x4358ad ADD %RDX,%RCX |
(246) 0x4358b0 MOV 0x10(%RSP),%R9 |
(246) 0x4358b5 VMOVSD %XMM2,(%R9,%RCX,8) |
(246) 0x4358bb VMULSD (%R14,%R8,8),%XMM1,%XMM2 |
(246) 0x4358c1 IMUL 0xb0(%RSP),%RAX |
(246) 0x4358ca ADD %RDX,%RAX |
(246) 0x4358cd VADDSD %XMM1,%XMM0,%XMM0 |
(246) 0x4358d1 VDIVSD %XMM0,%XMM2,%XMM0 |
(246) 0x4358d5 VMOVSD %XMM0,(%R12,%RAX,8) |
(246) 0x4358db INC %RSI |
(246) 0x4358de CMP 0x80(%RSP),%RSI |
(246) 0x4358e6 JG 435700 |
(246) 0x4358ec MOV %RSI,%R8 |
(246) 0x4358ef SHR $0x20,%R8 |
(246) 0x4358f3 JE 435910 |
(246) 0x4358f5 MOV %RSI,%RAX |
(246) 0x4358f8 XOR %EDX,%EDX |
(246) 0x4358fa DIV %R11 |
(246) 0x4358fd MOV %RAX,%RCX |
(246) 0x435900 MOV 0x38(%RSP),%R9 |
(246) 0x435905 TEST %R8,%R8 |
(246) 0x435908 JNE 435740 |
(246) 0x43590e JMP 435927 |
(246) 0x435910 MOV %ESI,%EAX |
(246) 0x435912 XOR %EDX,%EDX |
(246) 0x435914 DIV %R11D |
(246) 0x435917 MOV %EAX,%ECX |
(246) 0x435919 MOV 0x38(%RSP),%R9 |
(246) 0x43591e TEST %R8,%R8 |
(246) 0x435921 JNE 435740 |
(246) 0x435927 MOV %ESI,%EAX |
(246) 0x435929 XOR %EDX,%EDX |
(246) 0x43592b DIV %R11D |
(246) 0x43592e JMP 435748 |
0x435933 NOPW %CS:(%RAX,%RAX,1) |
0x43593d NOPL (%RAX) |
Path / |
Source file and lines | PdV.cpp:48-64 |
Module | exec |
nb instructions | 196 |
nb uops | 198 |
loop length | 1005 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 3 |
used zmm registers | 0 |
nb stack references | 61 |
micro-operation queue | 33.00 cycles |
front end | 33.00 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 5.80 | 5.80 | 25.33 | 25.33 | 31.00 | 17.00 | 5.80 | 31.00 | 31.00 | 31.00 | 5.60 | 25.33 |
cycles | 5.80 | 5.80 | 25.33 | 25.33 | 31.00 | 17.00 | 5.80 | 31.00 | 31.00 | 31.00 | 5.60 | 25.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 32.85 |
Stall cycles | 0.00 |
Front-end | 33.00 |
Dispatch | 31.00 |
Overall L1 | 33.00 |
all | 18% |
load | 10% |
store | 28% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 66% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 4% |
all | 60% |
load | 50% |
store | 100% |
mul | 0% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 20% |
load | 14% |
store | 30% |
mul | 0% |
add-sub | 66% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 3% |
all | 18% |
load | 16% |
store | 22% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 35% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 25% |
load | 18% |
store | 37% |
mul | 12% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 18% |
load | 16% |
store | 22% |
mul | 12% |
add-sub | 35% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x420,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R8,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x70(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x60(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x58(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x50(%RBP),%ECX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %ECX,0x4(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVL $0,0x4c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 43571f <_Z10PdV_kernelbiiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_.extracted.8+0xacf> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RBX,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,0x100(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVQ $0x1,0xd8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0xe0(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x54(%RSP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0xa0(%RSP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x98(%RSP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x683730,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x22,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %R11,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 403020 <__kmpc_for_static_init_8@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x20,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x98(%RSP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x90(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JA 435700 <_Z10PdV_kernelbiiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_.extracted.8+0xab0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RBX,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VMOVQ %R13,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
SUB 0x8(%RSP),%R11D | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
LEA 0x1(%RSI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x80(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
INC %RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RCX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %RAX,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV (%R12),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R12),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R15),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xe0(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RAX),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD 0x31327(%RIP),%XMM0,%XMM4 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
MOV 0x30(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RAX),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%R14),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R14),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x100(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %RSI,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $-0x8,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
AND %RCX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %RBX,0xd0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,0xc8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,0xb8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 4358ec <_Z10PdV_kernelbiiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_.extracted.8+0xc9c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R11,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ %R11,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x300(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV %R12,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x4(%RSP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTD %EAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x2e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV 0x8(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTD %EAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x2c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV 0x78(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %RAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x2a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV 0x38(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %RAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x280(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV 0x70(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %RAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x260(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV 0x68(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %RAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x240(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM4,0x130(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM4,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x220(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV 0x60(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %RAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x200(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPBROADCASTQ %RBX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x1e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV 0x58(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %RAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x1c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPBROADCASTQ %RDX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x1a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPBROADCASTQ %R8,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x180(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPBROADCASTQ %R9,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x160(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPBROADCASTQ %RSI,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ 0x312d1(%RIP),%YMM0,%YMM9 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.40 |
VPADDQ 0x31149(%RIP),%YMM0,%YMM0 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.40 |
VPBROADCASTQ %R10,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM1,0x140(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RCX,0xa8(%RSP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV 0xa0(%RSP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPD 0x130(%RSP),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV 0x50(%RSP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 43572e <_Z10PdV_kernelbiiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_.extracted.8+0xade> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x683750,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x48(%RSP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JMP 402e90 <__kmpc_for_static_fini@plt> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
ADD %RCX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JMP 4358ec <_Z10PdV_kernelbiiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_.extracted.8+0xc9c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | PdV.cpp:48-64 |
Module | exec |
nb instructions | 196 |
nb uops | 198 |
loop length | 1005 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 3 |
used zmm registers | 0 |
nb stack references | 61 |
micro-operation queue | 33.00 cycles |
front end | 33.00 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 5.80 | 5.80 | 25.33 | 25.33 | 31.00 | 17.00 | 5.80 | 31.00 | 31.00 | 31.00 | 5.60 | 25.33 |
cycles | 5.80 | 5.80 | 25.33 | 25.33 | 31.00 | 17.00 | 5.80 | 31.00 | 31.00 | 31.00 | 5.60 | 25.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 32.85 |
Stall cycles | 0.00 |
Front-end | 33.00 |
Dispatch | 31.00 |
Overall L1 | 33.00 |
all | 18% |
load | 10% |
store | 28% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 66% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 4% |
all | 60% |
load | 50% |
store | 100% |
mul | 0% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 20% |
load | 14% |
store | 30% |
mul | 0% |
add-sub | 66% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 3% |
all | 18% |
load | 16% |
store | 22% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 35% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 25% |
load | 18% |
store | 37% |
mul | 12% |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 18% |
load | 16% |
store | 22% |
mul | 12% |
add-sub | 35% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x420,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R8,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x70(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x60(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x58(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x50(%RBP),%ECX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %ECX,0x4(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVL $0,0x4c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 43571f <_Z10PdV_kernelbiiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_.extracted.8+0xacf> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RBX,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,0x100(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVQ $0x1,0xd8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0xe0(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x54(%RSP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0xa0(%RSP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x98(%RSP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x683730,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x22,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %R11,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 403020 <__kmpc_for_static_init_8@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x20,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x98(%RSP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x90(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JA 435700 <_Z10PdV_kernelbiiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_.extracted.8+0xab0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RBX,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
VMOVQ %R13,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
SUB 0x8(%RSP),%R11D | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
LEA 0x1(%RSI),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x80(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
INC %RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RCX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %RAX,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV (%R12),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R12),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R15),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xe0(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RAX),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMULSD 0x31327(%RIP),%XMM0,%XMM4 | 1 | 0.50 | 0.50 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 4 | 0.50 |
MOV 0x30(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RAX),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%R14),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R14),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x100(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %RSI,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $-0x8,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
AND %RCX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %RBX,0xd0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,0xc8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,0xb8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 4358ec <_Z10PdV_kernelbiiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_.extracted.8+0xc9c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R11,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ %R11,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x300(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV %R12,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x4(%RSP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTD %EAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x2e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV 0x8(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTD %EAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x2c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV 0x78(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %RAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x2a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV 0x38(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %RAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x280(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV 0x70(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %RAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x260(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV 0x68(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %RAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x240(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VMOVUPD %XMM4,0x130(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VBROADCASTSD %XMM4,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %YMM0,0x220(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV 0x60(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %RAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x200(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPBROADCASTQ %RBX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x1e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV 0x58(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %RAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x1c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPBROADCASTQ %RDX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x1a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPBROADCASTQ %R8,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x180(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPBROADCASTQ %R9,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x160(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPBROADCASTQ %RSI,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ 0x312d1(%RIP),%YMM0,%YMM9 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.40 |
VPADDQ 0x31149(%RIP),%YMM0,%YMM0 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.40 |
VPBROADCASTQ %R10,%YMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM1,0x140(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RCX,0xa8(%RSP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV 0xa0(%RSP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVUPD 0x130(%RSP),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV 0x50(%RSP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 43572e <_Z10PdV_kernelbiiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_.extracted.8+0xade> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x683750,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x48(%RSP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JMP 402e90 <__kmpc_for_static_fini@plt> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
ADD %RCX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JMP 4358ec <_Z10PdV_kernelbiiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_S2_.extracted.8+0xc9c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼PdV_kernel(bool, int, int, int, int, double, clover::Buffer2D | 1.61 | 2.57 |
○Loop 247 - PdV.cpp:48-64 - exec | 1.61 | 2.57 |
○Loop 246 - PdV.cpp:49-64 - exec | 0 | 0 |