Function: _Z17accelerate_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_.extracted | Module: exec | Source: accelerate.cpp:40-53 [...] | Coverage: 3.49% |
---|
Function: _Z17accelerate_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_.extracted | Module: exec | Source: accelerate.cpp:40-53 [...] | Coverage: 3.49% |
---|
/home/eoseret/qaas_runs_CPU_9468/171-112-9712/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/context.h: 69 - 69 |
-------------------------------------------------------------------------------- |
69: T &operator()(size_t i, size_t j) const { return data[i + j * sizeX]; } |
/home/eoseret/qaas_runs_CPU_9468/171-112-9712/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/accelerate.cpp: 40 - 53 |
-------------------------------------------------------------------------------- |
40: #pragma omp parallel for simd collapse(2) |
41: for (int j = (y_min + 1); j < (y_max + 1 + 2); j++) { |
42: for (int i = (x_min + 1); i < (x_max + 1 + 2); i++) { |
43: double stepbymass_s = halfdt / ((density0(i - 1, j - 1) * volume(i - 1, j - 1) + density0(i - 1, j + 0) * volume(i - 1, j + 0) + |
44: density0(i, j) * volume(i, j) + density0(i + 0, j - 1) * volume(i + 0, j - 1)) * |
45: 0.25); |
46: xvel1(i, j) = xvel0(i, j) - stepbymass_s * (xarea(i, j) * (pressure(i, j) - pressure(i - 1, j + 0)) + |
47: xarea(i + 0, j - 1) * (pressure(i + 0, j - 1) - pressure(i - 1, j - 1))); |
48: yvel1(i, j) = yvel0(i, j) - stepbymass_s * (yarea(i, j) * (pressure(i, j) - pressure(i + 0, j - 1)) + |
49: yarea(i - 1, j + 0) * (pressure(i - 1, j + 0) - pressure(i - 1, j - 1))); |
50: xvel1(i, j) = xvel1(i, j) - stepbymass_s * (xarea(i, j) * (viscosity(i, j) - viscosity(i - 1, j + 0)) + |
51: xarea(i + 0, j - 1) * (viscosity(i + 0, j - 1) - viscosity(i - 1, j - 1))); |
52: yvel1(i, j) = yvel1(i, j) - stepbymass_s * (yarea(i, j) * (viscosity(i, j) - viscosity(i + 0, j - 1)) + |
53: yarea(i - 1, j + 0) * (viscosity(i - 1, j + 0) - viscosity(i - 1, j - 1))); |
0x424d80 PUSH %RBP |
0x424d81 MOV %RSP,%RBP |
0x424d84 PUSH %R15 |
0x424d86 PUSH %R14 |
0x424d88 PUSH %R13 |
0x424d8a PUSH %R12 |
0x424d8c PUSH %RBX |
0x424d8d AND $-0x40,%RSP |
0x424d91 SUB $0x280,%RSP |
0x424d98 MOV 0x68(%RBP),%RAX |
0x424d9c MOV 0x58(%RBP),%R12 |
0x424da0 MOV 0x50(%RBP),%RSI |
0x424da4 MOV 0x38(%RBP),%R11 |
0x424da8 MOV 0x30(%RBP),%R13 |
0x424dac MOV 0x28(%RBP),%R10 |
0x424db0 MOV %R10,0x40(%RSP) |
0x424db5 MOV 0x20(%RBP),%RBX |
0x424db9 MOV 0x18(%RBP),%R15 |
0x424dbd VMOVQ 0x40(%RBP),%XMM0 |
0x424dc2 MOV 0x10(%RBP),%R14 |
0x424dc6 MOV 0x48(%RBP),%R10D |
0x424dca MOV %R10D,0x54(%RSP) |
0x424dcf MOVL $0,0x84(%RSP) |
0x424dda TEST %RAX,%RAX |
0x424ddd JS 4255c0 |
0x424de3 MOV %R15,0x58(%RSP) |
0x424de8 MOV %R11,0x68(%RSP) |
0x424ded MOV %RSI,0x60(%RSP) |
0x424df2 MOV %R9,%R15 |
0x424df5 MOV %R8,0x70(%RSP) |
0x424dfa MOV %RDX,0x48(%RSP) |
0x424dff MOV %RCX,0x38(%RSP) |
0x424e04 MOV (%RDI),%ESI |
0x424e06 MOVQ $0,0xf0(%RSP) |
0x424e12 MOV %RAX,0xe8(%RSP) |
0x424e1a MOVQ $0x1,0x128(%RSP) |
0x424e26 SUB $0x8,%RSP |
0x424e2a LEA 0x130(%RSP),%RAX |
0x424e32 LEA 0x8c(%RSP),%RCX |
0x424e3a LEA 0xf8(%RSP),%R8 |
0x424e42 LEA 0xf0(%RSP),%R9 |
0x424e4a MOV $0x48f3b0,%EDI |
0x424e4f MOV %ESI,0x88(%RSP) |
0x424e56 MOV $0x22,%EDX |
0x424e5b PUSH $0x1 |
0x424e5d PUSH $0x1 |
0x424e5f PUSH %RAX |
0x424e60 VMOVDQU %XMM0,0x150(%RSP) |
0x424e69 CALL 4031f0 <__kmpc_for_static_init_8@plt> |
0x424e6e VMOVUPD 0x150(%RSP),%XMM3 |
0x424e77 ADD $0x20,%RSP |
0x424e7b MOV 0xf0(%RSP),%R11 |
0x424e83 MOV 0xe8(%RSP),%RAX |
0x424e8b MOV %RAX,0xd8(%RSP) |
0x424e93 CMP %RAX,%R11 |
0x424e96 JA 42559c |
0x424e9c MOV %R12,%RCX |
0x424e9f SUB 0x60(%RSP),%ECX |
0x424ea3 MOV (%R15),%RAX |
0x424ea6 MOV %RAX,0x78(%RSP) |
0x424eab MOV 0x10(%R15),%R15 |
0x424eaf LEA 0x1(%R11),%RAX |
0x424eb3 MOV 0xd8(%RSP),%RDI |
0x424ebb INC %RDI |
0x424ebe CMP %RDI,%RAX |
0x424ec1 CMOVG %RAX,%RDI |
0x424ec5 MOV 0x70(%RSP),%R12 |
0x424eca MOV (%R12),%R8 |
0x424ece MOV 0x10(%R12),%R12 |
0x424ed3 MOV (%RBX),%R9 |
0x424ed6 MOV 0x10(%RBX),%RAX |
0x424eda MOV %RAX,0x70(%RSP) |
0x424edf MOV 0x48(%RSP),%RAX |
0x424ee4 MOV (%RAX),%R10 |
0x424ee7 MOV 0x10(%RAX),%RAX |
0x424eeb MOV %RAX,0xd0(%RSP) |
0x424ef3 MOV (%R14),%RDX |
0x424ef6 MOV 0x10(%R14),%RBX |
0x424efa MOV (%R13),%RAX |
0x424efe MOV %RAX,0xc8(%RSP) |
0x424f06 MOV 0x10(%R13),%RAX |
0x424f0a MOV %RAX,0x48(%RSP) |
0x424f0f MOV 0x40(%RSP),%RAX |
0x424f14 MOV (%RAX),%RSI |
0x424f17 MOV %RSI,0xc0(%RSP) |
0x424f1f MOV 0x10(%RAX),%RAX |
0x424f23 MOV %RAX,0xe0(%RSP) |
0x424f2b MOV 0x38(%RSP),%RAX |
0x424f30 MOV (%RAX),%RSI |
0x424f33 MOV %RSI,0xb8(%RSP) |
0x424f3b MOV 0x10(%RAX),%RAX |
0x424f3f MOV %RAX,0xb0(%RSP) |
0x424f47 MOV 0x68(%RSP),%RAX |
0x424f4c MOV (%RAX),%RSI |
0x424f4f MOV 0x10(%RAX),%RAX |
0x424f53 MOV 0x58(%RSP),%R13 |
0x424f58 MOV (%R13),%R14 |
0x424f5c MOV %R14,0xa8(%RSP) |
0x424f64 MOV 0x10(%R13),%R13 |
0x424f68 MOV %R13,0x58(%RSP) |
0x424f6d SUB %R11,%RDI |
0x424f70 MOV $-0x8,%R13D |
0x424f76 MOV %RDI,0xf8(%RSP) |
0x424f7e AND %RDI,%R13 |
0x424f81 MOV 0xd0(%RSP),%R14 |
0x424f89 MOV %RCX,0xa0(%RSP) |
0x424f91 MOV %R15,0x98(%RSP) |
0x424f99 MOV %R8,0x120(%RSP) |
0x424fa1 MOV %R12,0x118(%RSP) |
0x424fa9 MOV %R10,0x108(%RSP) |
0x424fb1 MOV %RDX,0x90(%RSP) |
0x424fb9 MOV %RBX,0x88(%RSP) |
0x424fc1 MOV %RAX,0x68(%RSP) |
0x424fc6 MOV %R9,0x110(%RSP) |
0x424fce MOV %RSI,0x100(%RSP) |
0x424fd6 JE 425892 |
0x424fdc VPBROADCASTQ %RCX,%ZMM16 |
0x424fe2 MOV 0x54(%RSP),%EAX |
0x424fe6 VPBROADCASTD %EAX,%YMM0 |
0x424fec VMOVDQU %YMM0,0x160(%RSP) |
0x424ff5 MOV 0x60(%RSP),%RAX |
0x424ffa VPBROADCASTD %EAX,%YMM0 |
0x425000 VMOVDQU %YMM0,0x140(%RSP) |
0x425009 MOV 0x78(%RSP),%RAX |
0x42500e VPBROADCASTQ %RAX,%ZMM20 |
0x425014 VPBROADCASTQ %R8,%ZMM21 |
0x42501a VBROADCASTSD %XMM3,%ZMM0 |
0x425020 VMOVUPD %ZMM0,0x200(%RSP) |
0x425028 VPBROADCASTQ %R9,%ZMM0 |
0x42502e VMOVDQU64 %ZMM0,0x1c0(%RSP) |
0x425036 VPBROADCASTQ %R10,%ZMM24 |
0x42503c VPBROADCASTQ %RDX,%ZMM25 |
0x425042 MOV 0xc8(%RSP),%RAX |
0x42504a VPBROADCASTQ %RAX,%ZMM0 |
0x425050 VMOVDQU64 %ZMM0,0x180(%RSP) |
0x425058 MOV 0xc0(%RSP),%RAX |
0x425060 VPBROADCASTQ %RAX,%ZMM27 |
0x425066 MOV 0xb8(%RSP),%RAX |
0x42506e VPBROADCASTQ %RAX,%ZMM28 |
0x425074 VPBROADCASTQ %RSI,%ZMM29 |
0x42507a MOV 0xa8(%RSP),%RAX |
0x425082 VPBROADCASTQ %RAX,%ZMM30 |
0x425088 MOV %R11,0x40(%RSP) |
0x42508d VPBROADCASTQ %R11,%ZMM0 |
0x425093 VPADDQ 0x4d4a3(%RIP),%ZMM0,%ZMM17 |
0x42509d MOV %R13,0x38(%RSP) |
0x4250a2 XOR %R13D,%R13D |
0x4250a5 MOV 0xb0(%RSP),%RDI |
0x4250ad MOV 0x58(%RSP),%RSI |
0x4250b2 NOPW %CS:(%RAX,%RAX,1) |
(149) 0x4250c0 VMOVDQA64 %ZMM17,%ZMM0 |
(149) 0x4250c6 VMOVDQA64 %ZMM16,%ZMM1 |
(149) 0x4250cc MOV $0x4603a0,%RAX |
(149) 0x4250d3 CALL %RAX |
(149) 0x4250d5 VPMOVQD %ZMM0,%YMM0 |
(149) 0x4250db VPADDD 0x160(%RSP),%YMM0,%YMM31 |
(149) 0x4250e3 VMOVDQA64 %ZMM17,%ZMM0 |
(149) 0x4250e9 VMOVDQA64 %ZMM16,%ZMM1 |
(149) 0x4250ef CALL 460220 <__svml_i64rem8_z0> |
(149) 0x4250f5 VPMOVQD %ZMM0,%YMM0 |
(149) 0x4250fb VPADDD 0x140(%RSP),%YMM0,%YMM2 |
(149) 0x425104 VPCMPEQD %YMM1,%YMM1,%YMM1 |
(149) 0x425108 VPADDD %YMM1,%YMM2,%YMM0 |
(149) 0x42510c VPADDD %YMM1,%YMM31,%YMM1 |
(149) 0x425112 VPMOVSXDQ %YMM1,%ZMM1 |
(149) 0x425118 VPXOR %XMM5,%XMM5,%XMM5 |
(149) 0x42511c VPMULLQ %ZMM1,%ZMM20,%ZMM5 |
(149) 0x425122 VPMOVSXDQ %YMM0,%ZMM0 |
(149) 0x425128 KXNORW %K0,%K0,%K1 |
(149) 0x42512c VXORPD %XMM4,%XMM4,%XMM4 |
(149) 0x425130 VPMULLQ %ZMM1,%ZMM21,%ZMM8 |
(149) 0x425136 VPADDQ %ZMM0,%ZMM5,%ZMM7 |
(149) 0x42513c KXNORW %K0,%K0,%K2 |
(149) 0x425140 VPMOVSXDQ %YMM31,%ZMM3 |
(149) 0x425146 VPMULLQ %ZMM3,%ZMM20,%ZMM9 |
(149) 0x42514c VPADDQ %ZMM0,%ZMM8,%ZMM10 |
(149) 0x425152 VXORPD %XMM6,%XMM6,%XMM6 |
(149) 0x425156 VGATHERQPD (%R15,%ZMM7,8),%ZMM4{%K1} |
(149) 0x42515d VPADDQ %ZMM0,%ZMM9,%ZMM11 |
(149) 0x425163 VGATHERQPD (%R12,%ZMM10,8),%ZMM6{%K2} |
(149) 0x42516a KXNORW %K0,%K0,%K1 |
(149) 0x42516e VXORPD %XMM7,%XMM7,%XMM7 |
(149) 0x425172 VPXOR %XMM10,%XMM10,%XMM10 |
(149) 0x425177 VPMULLQ %ZMM3,%ZMM21,%ZMM10 |
(149) 0x42517d VPADDQ %ZMM0,%ZMM10,%ZMM12 |
(149) 0x425183 KXNORW %K0,%K0,%K2 |
(149) 0x425187 VGATHERQPD (%R15,%ZMM11,8),%ZMM7{%K1} |
(149) 0x42518e VXORPD %XMM11,%XMM11,%XMM11 |
(149) 0x425193 VGATHERQPD (%R12,%ZMM12,8),%ZMM11{%K2} |
(149) 0x42519a VPMOVSXDQ %YMM2,%ZMM2 |
(149) 0x4251a0 VPADDQ %ZMM2,%ZMM9,%ZMM9 |
(149) 0x4251a6 KXNORW %K0,%K0,%K1 |
(149) 0x4251aa VXORPD %XMM12,%XMM12,%XMM12 |
(149) 0x4251af VPADDQ %ZMM2,%ZMM10,%ZMM10 |
(149) 0x4251b5 KXNORW %K0,%K0,%K2 |
(149) 0x4251b9 VGATHERQPD (%R15,%ZMM9,8),%ZMM12{%K1} |
(149) 0x4251c0 VXORPD %XMM9,%XMM9,%XMM9 |
(149) 0x4251c5 VGATHERQPD (%R12,%ZMM10,8),%ZMM9{%K2} |
(149) 0x4251cc VPADDQ %ZMM2,%ZMM5,%ZMM5 |
(149) 0x4251d2 KXNORW %K0,%K0,%K1 |
(149) 0x4251d6 VXORPD %XMM10,%XMM10,%XMM10 |
(149) 0x4251db VPADDQ %ZMM2,%ZMM8,%ZMM8 |
(149) 0x4251e1 KXNORW %K0,%K0,%K2 |
(149) 0x4251e5 VGATHERQPD (%R15,%ZMM5,8),%ZMM10{%K1} |
(149) 0x4251ec VXORPD %XMM13,%XMM13,%XMM13 |
(149) 0x4251f1 VGATHERQPD (%R12,%ZMM8,8),%ZMM13{%K2} |
(149) 0x4251f8 VPXOR %XMM5,%XMM5,%XMM5 |
(149) 0x4251fc VPMULLQ %ZMM3,%ZMM24,%ZMM5 |
(149) 0x425202 KXNORW %K0,%K0,%K1 |
(149) 0x425206 VXORPD %XMM8,%XMM8,%XMM8 |
(149) 0x42520b VPADDQ %ZMM2,%ZMM5,%ZMM5 |
(149) 0x425211 VPMULLQ %ZMM3,%ZMM25,%ZMM14 |
(149) 0x425217 KXNORW %K0,%K0,%K2 |
(149) 0x42521b VXORPD %XMM15,%XMM15,%XMM15 |
(149) 0x425220 VPADDQ %ZMM2,%ZMM14,%ZMM31 |
(149) 0x425226 VPADDQ %ZMM0,%ZMM14,%ZMM14 |
(149) 0x42522c VGATHERQPD (%R14,%ZMM5,8),%ZMM8{%K1} |
(149) 0x425233 KXNORW %K0,%K0,%K1 |
(149) 0x425237 VGATHERQPD (%RBX,%ZMM31,8),%ZMM15{%K2} |
(149) 0x42523e VXORPD %XMM18,%XMM18,%XMM18 |
(149) 0x425244 VGATHERQPD (%RBX,%ZMM14,8),%ZMM18{%K1} |
(149) 0x42524b VPMULLQ %ZMM1,%ZMM25,%ZMM19 |
(149) 0x425251 KXNORW %K0,%K0,%K1 |
(149) 0x425255 VPADDQ %ZMM2,%ZMM19,%ZMM22 |
(149) 0x42525b VXORPD %XMM23,%XMM23,%XMM23 |
(149) 0x425261 VGATHERQPD (%RBX,%ZMM22,8),%ZMM23{%K1} |
(149) 0x425268 VPADDQ %ZMM0,%ZMM19,%ZMM19 |
(149) 0x42526e KXNORW %K0,%K0,%K1 |
(149) 0x425272 VMULPD %ZMM4,%ZMM6,%ZMM4 |
(149) 0x425278 VXORPD %XMM26,%XMM26,%XMM26 |
(149) 0x42527e VGATHERQPD (%RBX,%ZMM19,8),%ZMM26{%K1} |
(149) 0x425285 VFMADD213PD %ZMM4,%ZMM7,%ZMM11 |
(149) 0x42528b VMOVDQU64 0x1c0(%RSP),%ZMM4 |
(149) 0x425293 VPMULLQ %ZMM3,%ZMM4,%ZMM4 |
(149) 0x425299 KXNORW %K0,%K0,%K1 |
(149) 0x42529d VFMADD213PD %ZMM11,%ZMM12,%ZMM9 |
(149) 0x4252a3 VXORPD %XMM7,%XMM7,%XMM7 |
(149) 0x4252a7 VPXOR %XMM6,%XMM6,%XMM6 |
(149) 0x4252ab VPMULLQ %ZMM1,%ZMM24,%ZMM6 |
(149) 0x4252b1 VPADDQ %ZMM2,%ZMM6,%ZMM6 |
(149) 0x4252b7 VPADDQ %ZMM2,%ZMM4,%ZMM4 |
(149) 0x4252bd KXNORW %K0,%K0,%K2 |
(149) 0x4252c1 MOV 0x70(%RSP),%RAX |
(149) 0x4252c6 VGATHERQPD (%RAX,%ZMM4,8),%ZMM7{%K1} |
(149) 0x4252cd VXORPD %XMM11,%XMM11,%XMM11 |
(149) 0x4252d2 VGATHERQPD (%R14,%ZMM6,8),%ZMM11{%K2} |
(149) 0x4252d9 VFMADD213PD %ZMM9,%ZMM10,%ZMM13 |
(149) 0x4252df VSUBPD %ZMM15,%ZMM18,%ZMM9 |
(149) 0x4252e5 VMULPD 0x4d221(%RIP){1to8},%ZMM13,%ZMM4 |
(149) 0x4252ef VMOVUPD 0x200(%RSP),%ZMM10 |
(149) 0x4252f7 VDIVPD %ZMM4,%ZMM10,%ZMM4 |
(149) 0x4252fd VMULPD %ZMM8,%ZMM9,%ZMM8 |
(149) 0x425303 VSUBPD %ZMM23,%ZMM26,%ZMM9 |
(149) 0x425309 VMOVDQU64 0x180(%RSP),%ZMM10 |
(149) 0x425311 VPMULLQ %ZMM3,%ZMM10,%ZMM10 |
(149) 0x425317 VFMADD213PD %ZMM8,%ZMM11,%ZMM9 |
(149) 0x42531d VPADDQ %ZMM2,%ZMM10,%ZMM8 |
(149) 0x425323 KXNORW %K0,%K0,%K1 |
(149) 0x425327 VPXOR %XMM10,%XMM10,%XMM10 |
(149) 0x42532c VPMULLQ %ZMM3,%ZMM27,%ZMM10 |
(149) 0x425332 VFMADD213PD %ZMM7,%ZMM4,%ZMM9 |
(149) 0x425338 VPXOR %XMM11,%XMM11,%XMM11 |
(149) 0x42533d VPMULLQ %ZMM3,%ZMM28,%ZMM11 |
(149) 0x425343 KXNORW %K0,%K0,%K2 |
(149) 0x425347 VXORPD %XMM12,%XMM12,%XMM12 |
(149) 0x42534c MOV 0x48(%RSP),%RCX |
(149) 0x425351 VSCATTERQPD %ZMM9,(%RCX,%ZMM8,8){%K1} |
(149) 0x425358 KXNORW %K0,%K0,%K1 |
(149) 0x42535c VGATHERQPD (%RBX,%ZMM31,8),%ZMM12{%K2} |
(149) 0x425363 VXORPD %XMM13,%XMM13,%XMM13 |
(149) 0x425368 VGATHERQPD (%RBX,%ZMM22,8),%ZMM13{%K1} |
(149) 0x42536f VPADDQ %ZMM2,%ZMM11,%ZMM7 |
(149) 0x425375 KXNORW %K0,%K0,%K1 |
(149) 0x425379 VXORPD %XMM15,%XMM15,%XMM15 |
(149) 0x42537e KXNORW %K0,%K0,%K2 |
(149) 0x425382 VXORPD %XMM18,%XMM18,%XMM18 |
(149) 0x425388 VGATHERQPD (%RDI,%ZMM7,8),%ZMM15{%K1} |
(149) 0x42538f KXNORW %K0,%K0,%K1 |
(149) 0x425393 VGATHERQPD (%RBX,%ZMM14,8),%ZMM18{%K2} |
(149) 0x42539a VXORPD %XMM14,%XMM14,%XMM14 |
(149) 0x42539f VGATHERQPD (%RBX,%ZMM19,8),%ZMM14{%K1} |
(149) 0x4253a6 KXNORW %K0,%K0,%K1 |
(149) 0x4253aa VXORPD %XMM19,%XMM19,%XMM19 |
(149) 0x4253b0 VPADDQ %ZMM0,%ZMM11,%ZMM9 |
(149) 0x4253b6 VPADDQ %ZMM2,%ZMM10,%ZMM10 |
(149) 0x4253bc KXNORW %K0,%K0,%K2 |
(149) 0x4253c0 MOV 0xe0(%RSP),%RAX |
(149) 0x4253c8 VGATHERQPD (%RAX,%ZMM10,8),%ZMM19{%K1} |
(149) 0x4253cf VXORPD %XMM10,%XMM10,%XMM10 |
(149) 0x4253d4 VGATHERQPD (%RDI,%ZMM9,8),%ZMM10{%K2} |
(149) 0x4253db VSUBPD %ZMM12,%ZMM13,%ZMM11 |
(149) 0x4253e1 VMULPD %ZMM15,%ZMM11,%ZMM11 |
(149) 0x4253e7 VSUBPD %ZMM18,%ZMM14,%ZMM12 |
(149) 0x4253ed VPXOR %XMM13,%XMM13,%XMM13 |
(149) 0x4253f2 VPMULLQ %ZMM3,%ZMM29,%ZMM13 |
(149) 0x4253f8 VFMADD213PD %ZMM11,%ZMM10,%ZMM12 |
(149) 0x4253fe VPADDQ %ZMM2,%ZMM13,%ZMM10 |
(149) 0x425404 VPMULLQ %ZMM3,%ZMM30,%ZMM3 |
(149) 0x42540a VFMADD213PD %ZMM19,%ZMM4,%ZMM12 |
(149) 0x425410 KXNORW %K0,%K0,%K1 |
(149) 0x425414 VPADDQ %ZMM2,%ZMM3,%ZMM11 |
(149) 0x42541a KXNORW %K0,%K0,%K2 |
(149) 0x42541e VPXOR %XMM13,%XMM13,%XMM13 |
(149) 0x425423 VPADDQ %ZMM0,%ZMM3,%ZMM3 |
(149) 0x425429 MOV 0x68(%RSP),%RAX |
(149) 0x42542e VSCATTERQPD %ZMM12,(%RAX,%ZMM10,8){%K1} |
(149) 0x425435 KXNORW %K0,%K0,%K1 |
(149) 0x425439 VGATHERQPD (%RSI,%ZMM11,8),%ZMM13{%K2} |
(149) 0x425440 VXORPD %XMM12,%XMM12,%XMM12 |
(149) 0x425445 VGATHERQPD (%RSI,%ZMM3,8),%ZMM12{%K1} |
(149) 0x42544c VPMULLQ %ZMM1,%ZMM30,%ZMM1 |
(149) 0x425452 KXNORW %K0,%K0,%K1 |
(149) 0x425456 VXORPD %XMM14,%XMM14,%XMM14 |
(149) 0x42545b VGATHERQPD (%R14,%ZMM5,8),%ZMM14{%K1} |
(149) 0x425462 KXNORW %K0,%K0,%K1 |
(149) 0x425466 VPADDQ %ZMM2,%ZMM1,%ZMM2 |
(149) 0x42546c KXNORW %K0,%K0,%K2 |
(149) 0x425470 VPADDQ %ZMM0,%ZMM1,%ZMM0 |
(149) 0x425476 VPXOR %XMM1,%XMM1,%XMM1 |
(149) 0x42547a VXORPD %XMM5,%XMM5,%XMM5 |
(149) 0x42547e VGATHERQPD (%R14,%ZMM6,8),%ZMM1{%K1} |
(149) 0x425485 KXNORW %K0,%K0,%K1 |
(149) 0x425489 VGATHERQPD (%RSI,%ZMM2,8),%ZMM5{%K2} |
(149) 0x425490 VXORPD %XMM6,%XMM6,%XMM6 |
(149) 0x425494 VGATHERQPD (%RSI,%ZMM0,8),%ZMM6{%K1} |
(149) 0x42549b KXNORW %K0,%K0,%K1 |
(149) 0x42549f VSUBPD %ZMM13,%ZMM12,%ZMM12 |
(149) 0x4254a5 VXORPD %XMM13,%XMM13,%XMM13 |
(149) 0x4254aa VGATHERQPD (%RCX,%ZMM8,8),%ZMM13{%K1} |
(149) 0x4254b1 VMULPD %ZMM14,%ZMM12,%ZMM12 |
(149) 0x4254b7 VSUBPD %ZMM5,%ZMM6,%ZMM5 |
(149) 0x4254bd VFMADD213PD %ZMM12,%ZMM1,%ZMM5 |
(149) 0x4254c3 VFMADD213PD %ZMM13,%ZMM4,%ZMM5 |
(149) 0x4254c9 KXNORW %K0,%K0,%K1 |
(149) 0x4254cd VSCATTERQPD %ZMM5,(%RCX,%ZMM8,8){%K1} |
(149) 0x4254d4 KXNORW %K0,%K0,%K1 |
(149) 0x4254d8 VXORPD %XMM1,%XMM1,%XMM1 |
(149) 0x4254dc KXNORW %K0,%K0,%K2 |
(149) 0x4254e0 VGATHERQPD (%RSI,%ZMM11,8),%ZMM1{%K1} |
(149) 0x4254e7 VXORPD %XMM5,%XMM5,%XMM5 |
(149) 0x4254eb VGATHERQPD (%RSI,%ZMM2,8),%ZMM5{%K2} |
(149) 0x4254f2 KXNORW %K0,%K0,%K1 |
(149) 0x4254f6 VXORPD %XMM2,%XMM2,%XMM2 |
(149) 0x4254fa VGATHERQPD (%RDI,%ZMM7,8),%ZMM2{%K1} |
(149) 0x425501 KXNORW %K0,%K0,%K1 |
(149) 0x425505 VXORPD %XMM6,%XMM6,%XMM6 |
(149) 0x425509 KXNORW %K0,%K0,%K2 |
(149) 0x42550d VGATHERQPD (%RSI,%ZMM3,8),%ZMM6{%K1} |
(149) 0x425514 VXORPD %XMM3,%XMM3,%XMM3 |
(149) 0x425518 VGATHERQPD (%RSI,%ZMM0,8),%ZMM3{%K2} |
(149) 0x42551f KXNORW %K0,%K0,%K1 |
(149) 0x425523 VXORPD %XMM0,%XMM0,%XMM0 |
(149) 0x425527 VGATHERQPD (%RDI,%ZMM9,8),%ZMM0{%K1} |
(149) 0x42552e KXNORW %K0,%K0,%K1 |
(149) 0x425532 VSUBPD %ZMM1,%ZMM5,%ZMM1 |
(149) 0x425538 VXORPD %XMM5,%XMM5,%XMM5 |
(149) 0x42553c VGATHERQPD (%RAX,%ZMM10,8),%ZMM5{%K1} |
(149) 0x425543 VMULPD %ZMM2,%ZMM1,%ZMM1 |
(149) 0x425549 VSUBPD %ZMM6,%ZMM3,%ZMM2 |
(149) 0x42554f VFMADD213PD %ZMM1,%ZMM0,%ZMM2 |
(149) 0x425555 VFMADD213PD %ZMM5,%ZMM4,%ZMM2 |
(149) 0x42555b KXNORW %K0,%K0,%K1 |
(149) 0x42555f VSCATTERQPD %ZMM2,(%RAX,%ZMM10,8){%K1} |
(149) 0x425566 VPADDQ 0x4cfa8(%RIP){1to8},%ZMM17,%ZMM17 |
(149) 0x425570 ADD $0x8,%R13 |
(149) 0x425574 CMP 0x38(%RSP),%R13 |
(149) 0x425579 JB 4250c0 |
0x42557f MOV 0x38(%RSP),%RAX |
0x425584 CMP %RAX,0xf8(%RSP) |
0x42558c VMOVUPD 0x130(%RSP),%XMM3 |
0x425595 MOV 0x40(%RSP),%R11 |
0x42559a JNE 425600 |
0x42559c MOV $0x48f3d0,%EDI |
0x4255a1 MOV 0x80(%RSP),%ESI |
0x4255a8 LEA -0x28(%RBP),%RSP |
0x4255ac POP %RBX |
0x4255ad POP %R12 |
0x4255af POP %R13 |
0x4255b1 POP %R14 |
0x4255b3 POP %R15 |
0x4255b5 POP %RBP |
0x4255b6 VZEROUPPER |
0x4255b9 JMP 403050 |
0x4255be XCHG %AX,%AX |
0x4255c0 LEA -0x28(%RBP),%RSP |
0x4255c4 POP %RBX |
0x4255c5 POP %R12 |
0x4255c7 POP %R13 |
0x4255c9 POP %R14 |
0x4255cb POP %R15 |
0x4255cd POP %RBP |
0x4255ce RET |
0x4255cf NOPW %CS:(%RAX,%RAX,1) |
0x4255de NOPW %CS:(%RAX,%RAX,1) |
0x4255ed NOPW %CS:(%RAX,%RAX,1) |
0x4255fc NOPL (%RAX) |
0x425600 ADD %RAX,%R11 |
0x425603 JMP 425892 |
0x425608 NOPW %CS:(%RAX,%RAX,1) |
0x425617 NOPW %CS:(%RAX,%RAX,1) |
0x425626 NOPW %CS:(%RAX,%RAX,1) |
0x425635 NOPW %CS:(%RAX,%RAX,1) |
(148) 0x425640 MOV %R11,%RAX |
(148) 0x425643 CQTO |
(148) 0x425645 IDIV %R9 |
(148) 0x425648 ADD %R10D,%EDX |
(148) 0x42564b LEA -0x1(%RCX),%EAX |
(148) 0x42564e MOVSXD %EAX,%RDI |
(148) 0x425651 MOV %R13,%R8 |
(148) 0x425654 IMUL %RDI,%R8 |
(148) 0x425658 MOVSXD %EDX,%RDX |
(148) 0x42565b LEA -0x1(%R8,%RDX,1),%R9 |
(148) 0x425660 MOV 0x120(%RSP),%R12 |
(148) 0x425668 MOV %R12,%R10 |
(148) 0x42566b IMUL %RDI,%R10 |
(148) 0x42566f LEA -0x1(%R10,%RDX,1),%R11 |
(148) 0x425674 MOV 0x118(%RSP),%R15 |
(148) 0x42567c VMOVSD (%R15,%R11,8),%XMM0 |
(148) 0x425682 VMULSD (%R14,%R9,8),%XMM0,%XMM0 |
(148) 0x425688 MOVSXD %ECX,%RCX |
(148) 0x42568b MOV %R13,%R9 |
(148) 0x42568e IMUL %RCX,%R9 |
(148) 0x425692 LEA -0x1(%R9,%RDX,1),%R11 |
(148) 0x425697 IMUL %RCX,%R12 |
(148) 0x42569b LEA -0x1(%R12,%RDX,1),%R13 |
(148) 0x4256a0 VMOVSD (%R15,%R13,8),%XMM1 |
(148) 0x4256a6 VFMADD132SD (%R14,%R11,8),%XMM0,%XMM1 |
(148) 0x4256ac ADD %RDX,%R9 |
(148) 0x4256af ADD %RDX,%R12 |
(148) 0x4256b2 VMOVSD (%R15,%R12,8),%XMM0 |
(148) 0x4256b8 VFMADD132SD (%R14,%R9,8),%XMM1,%XMM0 |
(148) 0x4256be ADD %RDX,%R8 |
(148) 0x4256c1 ADD %RDX,%R10 |
(148) 0x4256c4 VMOVSD (%R15,%R10,8),%XMM1 |
(148) 0x4256ca VFMADD132SD (%R14,%R8,8),%XMM0,%XMM1 |
(148) 0x4256d0 VMULSD 0x4ce38(%RIP),%XMM1,%XMM0 |
(148) 0x4256d8 VDIVSD %XMM0,%XMM3,%XMM0 |
(148) 0x4256dc MOV 0x110(%RSP),%R11 |
(148) 0x4256e4 IMUL %RCX,%R11 |
(148) 0x4256e8 ADD %RDX,%R11 |
(148) 0x4256eb MOV 0x108(%RSP),%R10 |
(148) 0x4256f3 MOV %R10,%R9 |
(148) 0x4256f6 IMUL %RCX,%R9 |
(148) 0x4256fa ADD %RDX,%R9 |
(148) 0x4256fd MOV %RSI,%R8 |
(148) 0x425700 IMUL %RCX,%R8 |
(148) 0x425704 LEA -0x1(%R8,%RDX,1),%R13 |
(148) 0x425709 ADD %RDX,%R8 |
(148) 0x42570c VMOVSD (%RBX,%R13,8),%XMM1 |
(148) 0x425712 VSUBSD (%RBX,%R8,8),%XMM1,%XMM1 |
(148) 0x425718 MOV %RSI,%R12 |
(148) 0x42571b MOV 0xd0(%RSP),%RSI |
(148) 0x425723 VMULSD (%RSI,%R9,8),%XMM1,%XMM1 |
(148) 0x425729 IMUL %RDI,%R10 |
(148) 0x42572d ADD %RDX,%R10 |
(148) 0x425730 IMUL %RDI,%R12 |
(148) 0x425734 LEA -0x1(%R12,%RDX,1),%R15 |
(148) 0x425739 ADD %RDX,%R12 |
(148) 0x42573c VMOVSD (%RBX,%R15,8),%XMM2 |
(148) 0x425742 VSUBSD (%RBX,%R12,8),%XMM2,%XMM2 |
(148) 0x425748 VFMADD132SD (%RSI,%R10,8),%XMM1,%XMM2 |
(148) 0x42574e MOV 0x70(%RSP),%R14 |
(148) 0x425753 VFMADD213SD (%R14,%R11,8),%XMM0,%XMM2 |
(148) 0x425759 MOV 0xc8(%RSP),%R11 |
(148) 0x425761 IMUL %RCX,%R11 |
(148) 0x425765 ADD %RDX,%R11 |
(148) 0x425768 MOV 0x48(%RSP),%RAX |
(148) 0x42576d VMOVSD %XMM2,(%RAX,%R11,8) |
(148) 0x425773 VMOVSD (%RBX,%R12,8),%XMM1 |
(148) 0x425779 MOV 0xc0(%RSP),%R14 |
(148) 0x425781 IMUL %RCX,%R14 |
(148) 0x425785 ADD %RDX,%R14 |
(148) 0x425788 VSUBSD (%RBX,%R8,8),%XMM1,%XMM1 |
(148) 0x42578e MOV 0xb8(%RSP),%R8 |
(148) 0x425796 IMUL %RCX,%R8 |
(148) 0x42579a VMOVSD (%RBX,%R15,8),%XMM2 |
(148) 0x4257a0 LEA (%R8,%RDX,1),%R12 |
(148) 0x4257a4 MOV 0xb0(%RSP),%R15 |
(148) 0x4257ac VMULSD (%R15,%R12,8),%XMM1,%XMM1 |
(148) 0x4257b2 LEA -0x1(%R8,%RDX,1),%RAX |
(148) 0x4257b7 MOV %RAX,0x38(%RSP) |
(148) 0x4257bc VSUBSD (%RBX,%R13,8),%XMM2,%XMM2 |
(148) 0x4257c2 VFMADD132SD (%R15,%RAX,8),%XMM1,%XMM2 |
(148) 0x4257c8 MOV 0xe0(%RSP),%RBX |
(148) 0x4257d0 VFMADD213SD (%RBX,%R14,8),%XMM0,%XMM2 |
(148) 0x4257d6 MOV 0x100(%RSP),%R13 |
(148) 0x4257de IMUL %RCX,%R13 |
(148) 0x4257e2 ADD %RDX,%R13 |
(148) 0x4257e5 MOV 0x68(%RSP),%R8 |
(148) 0x4257ea VMOVSD %XMM2,(%R8,%R13,8) |
(148) 0x4257f0 MOV 0xa8(%RSP),%RBX |
(148) 0x4257f8 IMUL %RBX,%RCX |
(148) 0x4257fc LEA -0x1(%RCX,%RDX,1),%R14 |
(148) 0x425801 ADD %RDX,%RCX |
(148) 0x425804 MOV 0x58(%RSP),%RAX |
(148) 0x425809 VMOVSD (%RAX,%R14,8),%XMM1 |
(148) 0x42580f VSUBSD (%RAX,%RCX,8),%XMM1,%XMM1 |
(148) 0x425814 VMULSD (%RSI,%R9,8),%XMM1,%XMM1 |
(148) 0x42581a IMUL %RBX,%RDI |
(148) 0x42581e LEA (%RDI,%RDX,1),%R9 |
(148) 0x425822 LEA -0x1(%RDI,%RDX,1),%RDX |
(148) 0x425827 VMOVSD (%RAX,%RDX,8),%XMM2 |
(148) 0x42582c VSUBSD (%RAX,%R9,8),%XMM2,%XMM2 |
(148) 0x425832 VFMADD132SD (%RSI,%R10,8),%XMM1,%XMM2 |
(148) 0x425838 MOV 0x48(%RSP),%RBX |
(148) 0x42583d VFMADD213SD (%RBX,%R11,8),%XMM0,%XMM2 |
(148) 0x425843 VMOVSD %XMM2,(%RBX,%R11,8) |
(148) 0x425849 VMOVSD (%RAX,%R9,8),%XMM1 |
(148) 0x42584f VSUBSD (%RAX,%RCX,8),%XMM1,%XMM1 |
(148) 0x425854 VMULSD (%R15,%R12,8),%XMM1,%XMM1 |
(148) 0x42585a VMOVSD (%RAX,%RDX,8),%XMM2 |
(148) 0x42585f VSUBSD (%RAX,%R14,8),%XMM2,%XMM2 |
(148) 0x425865 MOV 0x38(%RSP),%RAX |
(148) 0x42586a VFMADD132SD (%R15,%RAX,8),%XMM1,%XMM2 |
(148) 0x425870 VFMADD213SD (%R8,%R13,8),%XMM0,%XMM2 |
(148) 0x425876 VMOVSD %XMM2,(%R8,%R13,8) |
(148) 0x42587c MOV 0x40(%RSP),%R11 |
(148) 0x425881 INC %R11 |
(148) 0x425884 CMP 0xd8(%RSP),%R11 |
(148) 0x42588c JG 42559c |
(148) 0x425892 MOV %R11,%R8 |
(148) 0x425895 SHR $0x20,%R8 |
(148) 0x425899 JE 4258c0 |
(148) 0x42589b MOV %R11,%RAX |
(148) 0x42589e XOR %EDX,%EDX |
(148) 0x4258a0 MOV 0xa0(%RSP),%R9 |
(148) 0x4258a8 DIV %R9 |
(148) 0x4258ab MOV %RAX,%RCX |
(148) 0x4258ae JMP 4258d2 |
0x4258b0 NOPW %CS:(%RAX,%RAX,1) |
0x4258bf NOP |
(148) 0x4258c0 MOV %R11D,%EAX |
(148) 0x4258c3 XOR %EDX,%EDX |
(148) 0x4258c5 MOV 0xa0(%RSP),%R9 |
(148) 0x4258cd DIV %R9D |
(148) 0x4258d0 MOV %EAX,%ECX |
(148) 0x4258d2 MOV 0x60(%RSP),%R10 |
(148) 0x4258d7 MOV 0x98(%RSP),%R14 |
(148) 0x4258df MOV 0x90(%RSP),%RSI |
(148) 0x4258e7 MOV 0x88(%RSP),%RBX |
(148) 0x4258ef MOV 0x78(%RSP),%R13 |
(148) 0x4258f4 ADD 0x54(%RSP),%ECX |
(148) 0x4258f8 TEST %R8,%R8 |
(148) 0x4258fb MOV %R11,0x40(%RSP) |
(148) 0x425900 JNE 425640 |
(148) 0x425906 MOV %R11D,%EAX |
(148) 0x425909 XOR %EDX,%EDX |
(148) 0x42590b DIV %R9D |
(148) 0x42590e JMP 425648 |
0x425913 NOPW %CS:(%RAX,%RAX,1) |
0x42591d NOPW %CS:(%RAX,%RAX,1) |
0x425927 NOPW %CS:(%RAX,%RAX,1) |
0x425931 NOPW %CS:(%RAX,%RAX,1) |
0x42593b NOPL (%RAX,%RAX,1) |
Path / |
Source file and lines | accelerate.cpp:40-53 |
Module | exec |
nb instructions | 192 |
nb uops | 194 |
loop length | 1086 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 1 |
used zmm registers | 11 |
nb stack references | 52 |
micro-operation queue | 32.33 cycles |
front end | 32.33 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 5.30 | 5.20 | 24.00 | 24.00 | 27.00 | 15.00 | 5.30 | 27.00 | 27.00 | 27.00 | 5.20 | 24.00 |
cycles | 5.30 | 5.20 | 24.00 | 24.00 | 27.00 | 15.00 | 5.30 | 27.00 | 27.00 | 27.00 | 5.20 | 24.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 32.16 |
Stall cycles | 0.00 |
Front-end | 32.33 |
Dispatch | 27.00 |
Overall L1 | 32.33 |
all | 8% |
load | 5% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 50% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 4% |
all | 75% |
load | 100% |
store | 100% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 11% |
load | 15% |
store | 13% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 50% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 4% |
all | 16% |
load | 16% |
store | 17% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 53% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 40% |
load | 25% |
store | 100% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 17% |
load | 17% |
store | 19% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 53% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x40,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x280,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x68(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x58(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x50(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x28(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R10,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVQ 0x40(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RBP),%R10D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R10D,0x54(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVL $0,0x84(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4255c0 <_Z17accelerate_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_.extracted+0x840> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R15,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R8,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,0xf0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0xe8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVQ $0x1,0x128(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0x130(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x8c(%RSP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0xf8(%RSP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0xf0(%RSP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x48f3b0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x22,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
VMOVDQU %XMM0,0x150(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
CALL 4031f0 <__kmpc_for_static_init_8@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVUPD 0x150(%RSP),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
ADD $0x20,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0xf0(%RSP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xe8(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0xd8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %RAX,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JA 42559c <_Z17accelerate_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_.extracted+0x81c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB 0x60(%RSP),%ECX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV (%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R15),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%R11),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xd8(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
INC %RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RDI,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %RAX,%RDI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV 0x70(%RSP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R12),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%R12),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x48(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0xd0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%R14),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%R14),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R13),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0xc8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R13),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RSI,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x38(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RSI,0xb8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x68(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x58(%RSP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R13),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R13),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %R11,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $-0x8,%R13D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDI,0xf8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
AND %RDI,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV 0xd0(%RSP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,0x120(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R12,0x118(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,0x108(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,0x110(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,0x100(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 425892 <_Z17accelerate_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_.extracted+0xb12> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VPBROADCASTQ %RCX,%ZMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0x54(%RSP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTD %EAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x160(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV 0x60(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTD %EAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x140(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV 0x78(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %RAX,%ZMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %R8,%ZMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM3,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM0,0x200(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 1 |
VPBROADCASTQ %R9,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU64 %ZMM0,0x1c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 1 |
VPBROADCASTQ %R10,%ZMM24 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %RDX,%ZMM25 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0xc8(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %RAX,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU64 %ZMM0,0x180(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 1 |
MOV 0xc0(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %RAX,%ZMM27 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0xb8(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %RAX,%ZMM28 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %RSI,%ZMM29 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0xa8(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %RAX,%ZMM30 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R11,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ %R11,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ 0x4d4a3(%RIP),%ZMM0,%ZMM17 | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.67 |
MOV %R13,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %R13D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xb0(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x58(%RSP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x38(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RAX,0xf8(%RSP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
VMOVUPD 0x130(%RSP),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV 0x40(%RSP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 425600 <_Z17accelerate_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_.extracted+0x880> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x48f3d0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x80(%RSP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JMP 403050 <__kmpc_for_static_fini@plt> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD %RAX,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JMP 425892 <_Z17accelerate_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_.extracted+0xb12> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | accelerate.cpp:40-53 |
Module | exec |
nb instructions | 192 |
nb uops | 194 |
loop length | 1086 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 1 |
used zmm registers | 11 |
nb stack references | 52 |
micro-operation queue | 32.33 cycles |
front end | 32.33 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 5.30 | 5.20 | 24.00 | 24.00 | 27.00 | 15.00 | 5.30 | 27.00 | 27.00 | 27.00 | 5.20 | 24.00 |
cycles | 5.30 | 5.20 | 24.00 | 24.00 | 27.00 | 15.00 | 5.30 | 27.00 | 27.00 | 27.00 | 5.20 | 24.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 32.16 |
Stall cycles | 0.00 |
Front-end | 32.33 |
Dispatch | 27.00 |
Overall L1 | 32.33 |
all | 8% |
load | 5% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 50% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 4% |
all | 75% |
load | 100% |
store | 100% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 11% |
load | 15% |
store | 13% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 50% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 4% |
all | 16% |
load | 16% |
store | 17% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 53% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 40% |
load | 25% |
store | 100% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 17% |
load | 17% |
store | 19% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 53% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x40,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x280,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x68(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x58(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x50(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x28(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R10,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVQ 0x40(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RBP),%R10D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R10D,0x54(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVL $0,0x84(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4255c0 <_Z17accelerate_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_.extracted+0x840> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R15,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R8,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,0xf0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0xe8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVQ $0x1,0x128(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0x130(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x8c(%RSP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0xf8(%RSP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0xf0(%RSP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x48f3b0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x22,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
VMOVDQU %XMM0,0x150(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
CALL 4031f0 <__kmpc_for_static_init_8@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVUPD 0x150(%RSP),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
ADD $0x20,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0xf0(%RSP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xe8(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0xd8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %RAX,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JA 42559c <_Z17accelerate_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_.extracted+0x81c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB 0x60(%RSP),%ECX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV (%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R15),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%R11),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xd8(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
INC %RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RDI,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %RAX,%RDI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV 0x70(%RSP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R12),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%R12),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x48(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0xd0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%R14),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%R14),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R13),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0xc8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R13),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RSI,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x38(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RSI,0xb8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x68(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x58(%RSP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R13),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R13),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %R11,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $-0x8,%R13D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDI,0xf8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
AND %RDI,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV 0xd0(%RSP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,0x120(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R12,0x118(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,0x108(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,0x110(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,0x100(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 425892 <_Z17accelerate_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_.extracted+0xb12> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VPBROADCASTQ %RCX,%ZMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0x54(%RSP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTD %EAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x160(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV 0x60(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTD %EAX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x140(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV 0x78(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %RAX,%ZMM20 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %R8,%ZMM21 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VBROADCASTSD %XMM3,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVUPD %ZMM0,0x200(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 1 |
VPBROADCASTQ %R9,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU64 %ZMM0,0x1c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 1 |
VPBROADCASTQ %R10,%ZMM24 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %RDX,%ZMM25 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0xc8(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %RAX,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU64 %ZMM0,0x180(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 1 |
MOV 0xc0(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %RAX,%ZMM27 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0xb8(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %RAX,%ZMM28 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %RSI,%ZMM29 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0xa8(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %RAX,%ZMM30 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R11,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ %R11,%ZMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ 0x4d4a3(%RIP),%ZMM0,%ZMM17 | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.67 |
MOV %R13,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %R13D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xb0(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x58(%RSP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x38(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RAX,0xf8(%RSP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
VMOVUPD 0x130(%RSP),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV 0x40(%RSP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 425600 <_Z17accelerate_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_.extracted+0x880> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x48f3d0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x80(%RSP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JMP 403050 <__kmpc_for_static_fini@plt> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD %RAX,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JMP 425892 <_Z17accelerate_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_.extracted+0xb12> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼_Z17accelerate_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_.extracted– | 3.49 | 2.39 |
○Loop 149 - accelerate.cpp:40-53 - exec | 3.49 | 2.39 |
○Loop 148 - accelerate.cpp:40-53 - exec | 0 | 0 |