Function: accelerate_kernel(int, int, int, int, double, clover::Buffer2D<double>&, clover::Buffer2D< ... | Module: exec | Source: accelerate.cpp:40-54 [...] | Coverage: 2.31% |
---|
Function: accelerate_kernel(int, int, int, int, double, clover::Buffer2D<double>&, clover::Buffer2D< ... | Module: exec | Source: accelerate.cpp:40-54 [...] | Coverage: 2.31% |
---|
/scratch_na/users/xoserete/qaas_runs/171-415-4969/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/accelerate.cpp: 40 - 54 |
-------------------------------------------------------------------------------- |
40: #pragma omp parallel for simd collapse(2) |
41: for (int j = (y_min + 1); j < (y_max + 1 + 2); j++) { |
42: for (int i = (x_min + 1); i < (x_max + 1 + 2); i++) { |
43: double stepbymass_s = halfdt / ((density0(i - 1, j - 1) * volume(i - 1, j - 1) + density0(i - 1, j + 0) * volume(i - 1, j + 0) + |
44: density0(i, j) * volume(i, j) + density0(i + 0, j - 1) * volume(i + 0, j - 1)) * |
45: 0.25); |
46: xvel1(i, j) = xvel0(i, j) - stepbymass_s * (xarea(i, j) * (pressure(i, j) - pressure(i - 1, j + 0)) + |
47: xarea(i + 0, j - 1) * (pressure(i + 0, j - 1) - pressure(i - 1, j - 1))); |
48: yvel1(i, j) = yvel0(i, j) - stepbymass_s * (yarea(i, j) * (pressure(i, j) - pressure(i + 0, j - 1)) + |
49: yarea(i - 1, j + 0) * (pressure(i - 1, j + 0) - pressure(i - 1, j - 1))); |
50: xvel1(i, j) = xvel1(i, j) - stepbymass_s * (xarea(i, j) * (viscosity(i, j) - viscosity(i - 1, j + 0)) + |
51: xarea(i + 0, j - 1) * (viscosity(i + 0, j - 1) - viscosity(i - 1, j - 1))); |
52: yvel1(i, j) = yvel1(i, j) - stepbymass_s * (yarea(i, j) * (viscosity(i, j) - viscosity(i + 0, j - 1)) + |
53: yarea(i - 1, j + 0) * (viscosity(i - 1, j + 0) - viscosity(i - 1, j - 1))); |
54: } |
/scratch_na/users/xoserete/qaas_runs/171-415-4969/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/context.h: 69 - 69 |
-------------------------------------------------------------------------------- |
69: T &operator()(size_t i, size_t j) const { return data[i + j * sizeX]; } |
0x41d030 PUSH %RBP |
0x41d031 MOV %RSP,%RBP |
0x41d034 PUSH %R15 |
0x41d036 PUSH %R14 |
0x41d038 PUSH %R13 |
0x41d03a PUSH %R12 |
0x41d03c PUSH %RBX |
0x41d03d AND $-0x20,%RSP |
0x41d041 SUB $0x220,%RSP |
0x41d048 MOV %R9,%R13 |
0x41d04b MOV %R8,%R12 |
0x41d04e MOV %RDX,%R10 |
0x41d051 MOV 0x68(%RBP),%RAX |
0x41d055 MOV 0x58(%RBP),%R15 |
0x41d059 MOV 0x50(%RBP),%RSI |
0x41d05d MOV 0x38(%RBP),%R8 |
0x41d061 MOV 0x30(%RBP),%RDX |
0x41d065 MOV %RDX,0x28(%RSP) |
0x41d06a MOV 0x28(%RBP),%R11 |
0x41d06e MOV 0x20(%RBP),%R14 |
0x41d072 MOV 0x18(%RBP),%R9 |
0x41d076 VMOVQ 0x40(%RBP),%XMM0 |
0x41d07b MOV 0x10(%RBP),%RBX |
0x41d07f MOV 0x48(%RBP),%EDX |
0x41d082 MOV %EDX,0x34(%RSP) |
0x41d086 MOVL $0,0x5c(%RSP) |
0x41d08e TEST %RAX,%RAX |
0x41d091 JS 41d864 |
0x41d097 MOV %R11,0x40(%RSP) |
0x41d09c MOV %R10,0x20(%RSP) |
0x41d0a1 MOV %R9,0x38(%RSP) |
0x41d0a6 MOV %R8,0x60(%RSP) |
0x41d0ab MOV %RCX,0x18(%RSP) |
0x41d0b0 MOV %RSI,0x50(%RSP) |
0x41d0b5 MOV (%RDI),%ESI |
0x41d0b7 MOVQ $0,0xc8(%RSP) |
0x41d0c3 MOV %RAX,0xc0(%RSP) |
0x41d0cb MOVQ $0x1,0x118(%RSP) |
0x41d0d7 SUB $0x8,%RSP |
0x41d0db LEA 0x120(%RSP),%RAX |
0x41d0e3 LEA 0x64(%RSP),%RCX |
0x41d0e8 LEA 0xd0(%RSP),%R8 |
0x41d0f0 LEA 0xc8(%RSP),%R9 |
0x41d0f8 MOV $0x682390,%EDI |
0x41d0fd MOV %ESI,0x60(%RSP) |
0x41d101 MOV $0x22,%EDX |
0x41d106 PUSH $0x1 |
0x41d108 PUSH $0x1 |
0x41d10a PUSH %RAX |
0x41d10b VMOVDQU %XMM0,0x140(%RSP) |
0x41d114 CALL 403020 <__kmpc_for_static_init_8@plt> |
0x41d119 VMOVDQU 0x140(%RSP),%XMM3 |
0x41d122 ADD $0x20,%RSP |
0x41d126 MOV 0xc8(%RSP),%R11 |
0x41d12e MOV 0xc0(%RSP),%RAX |
0x41d136 MOV %RAX,0xa0(%RSP) |
0x41d13e CMP %RAX,%R11 |
0x41d141 JA 41d845 |
0x41d147 MOV %R15,%RCX |
0x41d14a SUB 0x50(%RSP),%ECX |
0x41d14e MOV (%R13),%RAX |
0x41d152 MOV %RAX,0x48(%RSP) |
0x41d157 MOV 0x10(%R13),%RAX |
0x41d15b MOV %RAX,0x98(%RSP) |
0x41d163 LEA 0x1(%R11),%RAX |
0x41d167 MOV 0xa0(%RSP),%RDI |
0x41d16f LEA 0x1(%RDI),%R10 |
0x41d173 CMP %R10,%RAX |
0x41d176 CMOVG %RAX,%R10 |
0x41d17a MOV (%R12),%RAX |
0x41d17e MOV %RAX,0x90(%RSP) |
0x41d186 MOV 0x10(%R12),%R12 |
0x41d18b MOV (%R14),%R9 |
0x41d18e MOV 0x10(%R14),%RAX |
0x41d192 MOV %RAX,0xb8(%RSP) |
0x41d19a MOV 0x20(%RSP),%RAX |
0x41d19f MOV (%RAX),%RDX |
0x41d1a2 MOV %RDX,0x88(%RSP) |
0x41d1aa MOV 0x10(%RAX),%RAX |
0x41d1ae MOV %RAX,0x20(%RSP) |
0x41d1b3 MOV (%RBX),%R14 |
0x41d1b6 MOV 0x10(%RBX),%RAX |
0x41d1ba MOV %RAX,0x80(%RSP) |
0x41d1c2 MOV 0x28(%RSP),%RAX |
0x41d1c7 MOV (%RAX),%RBX |
0x41d1ca MOV 0x10(%RAX),%RAX |
0x41d1ce MOV %RAX,0x28(%RSP) |
0x41d1d3 MOV 0x40(%RSP),%RAX |
0x41d1d8 MOV (%RAX),%RDX |
0x41d1db MOV 0x10(%RAX),%RAX |
0x41d1df MOV %RAX,0x40(%RSP) |
0x41d1e4 MOV 0x18(%RSP),%RAX |
0x41d1e9 MOV (%RAX),%R13 |
0x41d1ec MOV 0x10(%RAX),%R15 |
0x41d1f0 MOV 0x60(%RSP),%RAX |
0x41d1f5 MOV (%RAX),%R8 |
0x41d1f8 MOV 0x10(%RAX),%RAX |
0x41d1fc MOV 0x38(%RSP),%RDI |
0x41d201 MOV (%RDI),%RSI |
0x41d204 MOV 0x10(%RDI),%RDI |
0x41d208 MOV %RDI,0x38(%RSP) |
0x41d20d SUB %R11,%R10 |
0x41d210 MOV $-0x4,%EDI |
0x41d215 MOV %R10,0xd0(%RSP) |
0x41d21d AND %R10,%RDI |
0x41d220 MOV %RDI,%R10 |
0x41d223 MOV 0x48(%RSP),%RDI |
0x41d228 MOV %RCX,0x78(%RSP) |
0x41d22d MOV %R12,0x110(%RSP) |
0x41d235 MOV %R14,0x100(%RSP) |
0x41d23d MOV %RSI,0xd8(%RSP) |
0x41d245 MOV %R9,0x108(%RSP) |
0x41d24d MOV %RBX,0xf8(%RSP) |
0x41d255 MOV %RDX,0xf0(%RSP) |
0x41d25d MOV %R13,0xe8(%RSP) |
0x41d265 MOV %R15,0xb0(%RSP) |
0x41d26d MOV %R8,0xe0(%RSP) |
0x41d275 MOV %RAX,0xa8(%RSP) |
0x41d27d JE 41dafe |
0x41d283 VPBROADCASTQ %RCX,%YMM8 |
0x41d289 MOV 0x34(%RSP),%EAX |
0x41d28d VPBROADCASTD %EAX,%XMM0 |
0x41d293 VMOVDQU %XMM0,0x60(%RSP) |
0x41d299 MOV 0x50(%RSP),%RAX |
0x41d29e VPBROADCASTD %EAX,%XMM0 |
0x41d2a4 VMOVDQU %XMM0,0x130(%RSP) |
0x41d2ad VPBROADCASTQ %RDI,%YMM12 |
0x41d2b3 MOV 0x90(%RSP),%RAX |
0x41d2bb VPBROADCASTQ %RAX,%YMM13 |
0x41d2c1 VPBROADCASTQ %XMM3,%YMM0 |
0x41d2c6 VMOVDQU %YMM0,0x1e0(%RSP) |
0x41d2cf VPBROADCASTQ %R9,%YMM0 |
0x41d2d5 VMOVDQU %YMM0,0x1c0(%RSP) |
0x41d2de MOV 0x88(%RSP),%RAX |
0x41d2e6 VPBROADCASTQ %RAX,%YMM16 |
0x41d2ec VPBROADCASTQ %R14,%YMM17 |
0x41d2f2 VPBROADCASTQ %RBX,%YMM0 |
0x41d2f8 VMOVDQU %YMM0,0x1a0(%RSP) |
0x41d301 VPBROADCASTQ %RDX,%YMM0 |
0x41d307 VMOVDQU %YMM0,0x180(%RSP) |
0x41d310 VPBROADCASTQ %R13,%YMM0 |
0x41d316 VMOVDQU %YMM0,0x160(%RSP) |
0x41d31f VPBROADCASTQ %R8,%YMM0 |
0x41d325 VMOVDQU %YMM0,0x140(%RSP) |
0x41d32e VPBROADCASTQ %RSI,%YMM22 |
0x41d334 MOV %R11,0x18(%RSP) |
0x41d339 VPBROADCASTQ %R11,%YMM0 |
0x41d33f VPADDQ 0x48db9(%RIP),%YMM0,%YMM9 |
0x41d347 XOR %R13D,%R13D |
0x41d34a MOV 0x98(%RSP),%R15 |
0x41d352 MOV 0x20(%RSP),%RBX |
0x41d357 MOV 0x80(%RSP),%RSI |
0x41d35f MOV 0x38(%RSP),%R14 |
0x41d364 NOPW %CS:(%RAX,%RAX,1) |
(101) 0x41d370 VMOVDQA %YMM9,%YMM0 |
(101) 0x41d374 VMOVDQA %YMM8,%YMM1 |
(101) 0x41d378 MOV %R12,%RDI |
(101) 0x41d37b MOV %R10,%R12 |
(101) 0x41d37e MOV $0x454690,%RAX |
(101) 0x41d385 CALL %RAX |
(101) 0x41d387 VPMOVQD %YMM0,%XMM0 |
(101) 0x41d38d VPADDD 0x60(%RSP),%XMM0,%XMM26 |
(101) 0x41d395 VMOVDQA %YMM9,%YMM0 |
(101) 0x41d399 VMOVDQA %YMM8,%YMM1 |
(101) 0x41d39d CALL 454460 <__svml_i64rem4_l9> |
(101) 0x41d3a3 MOV %R12,%R10 |
(101) 0x41d3a6 MOV %RDI,%R12 |
(101) 0x41d3a9 VPMOVQD %YMM0,%XMM0 |
(101) 0x41d3af VPCMPEQD %XMM3,%XMM3,%XMM3 |
(101) 0x41d3b3 VPADDD %XMM3,%XMM26,%XMM1 |
(101) 0x41d3b9 VPMOVSXDQ %XMM1,%YMM1 |
(101) 0x41d3be VXORPS %XMM6,%XMM6,%XMM6 |
(101) 0x41d3c2 VPMULLQ %YMM1,%YMM12,%YMM6 |
(101) 0x41d3c8 VPADDD 0x130(%RSP),%XMM0,%XMM2 |
(101) 0x41d3d1 VPADDD %XMM3,%XMM2,%XMM0 |
(101) 0x41d3d5 VPMOVSXDQ %XMM0,%YMM0 |
(101) 0x41d3da VPMULLQ %YMM1,%YMM13,%YMM30 |
(101) 0x41d3e0 VPADDQ %YMM0,%YMM6,%YMM3 |
(101) 0x41d3e4 KXNORW %K0,%K0,%K1 |
(101) 0x41d3e8 VXORPD %XMM4,%XMM4,%XMM4 |
(101) 0x41d3ec VPADDQ %YMM0,%YMM30,%YMM5 |
(101) 0x41d3f2 KXNORW %K0,%K0,%K2 |
(101) 0x41d3f6 VXORPD %XMM7,%XMM7,%XMM7 |
(101) 0x41d3fa VGATHERQPD (%R15,%YMM3,8),%YMM4{%K1} |
(101) 0x41d401 VPMOVSXDQ %XMM26,%YMM3 |
(101) 0x41d407 VPMULLQ %YMM3,%YMM12,%YMM28 |
(101) 0x41d40d VPADDQ %YMM0,%YMM28,%YMM27 |
(101) 0x41d413 VGATHERQPD (%RDI,%YMM5,8),%YMM7{%K2} |
(101) 0x41d41a KXNORW %K0,%K0,%K1 |
(101) 0x41d41e VPXORD %XMM26,%XMM26,%XMM26 |
(101) 0x41d424 VXORPS %XMM5,%XMM5,%XMM5 |
(101) 0x41d428 VPMULLQ %YMM3,%YMM13,%YMM5 |
(101) 0x41d42e VGATHERQPD (%R15,%YMM27,8),%YMM26{%K1} |
(101) 0x41d435 VPADDQ %YMM0,%YMM5,%YMM29 |
(101) 0x41d43b KXNORW %K0,%K0,%K1 |
(101) 0x41d43f VXORPD %XMM27,%XMM27,%XMM27 |
(101) 0x41d445 VPMOVSXDQ %XMM2,%YMM2 |
(101) 0x41d44a VGATHERQPD (%RDI,%YMM29,8),%YMM27{%K1} |
(101) 0x41d451 VPADDQ %YMM2,%YMM28,%YMM29 |
(101) 0x41d457 KXNORW %K0,%K0,%K2 |
(101) 0x41d45b VPXORD %XMM28,%XMM28,%XMM28 |
(101) 0x41d461 VPADDQ %YMM2,%YMM5,%YMM24 |
(101) 0x41d467 KXNORW %K0,%K0,%K1 |
(101) 0x41d46b VGATHERQPD (%R15,%YMM29,8),%YMM28{%K2} |
(101) 0x41d472 VXORPD %XMM31,%XMM31,%XMM31 |
(101) 0x41d478 VXORPS %XMM5,%XMM5,%XMM5 |
(101) 0x41d47c VPMULLQ %YMM3,%YMM16,%YMM5 |
(101) 0x41d482 VPADDQ %YMM2,%YMM5,%YMM5 |
(101) 0x41d486 VGATHERQPD (%RDI,%YMM24,8),%YMM31{%K1} |
(101) 0x41d48d KXNORW %K0,%K0,%K1 |
(101) 0x41d491 VXORPD %XMM24,%XMM24,%XMM24 |
(101) 0x41d497 VPMULLQ %YMM3,%YMM17,%YMM25 |
(101) 0x41d49d VGATHERQPD (%RBX,%YMM5,8),%YMM24{%K1} |
(101) 0x41d4a4 VPADDQ %YMM2,%YMM25,%YMM29 |
(101) 0x41d4aa KXNORW %K0,%K0,%K1 |
(101) 0x41d4ae VXORPD %XMM23,%XMM23,%XMM23 |
(101) 0x41d4b4 VGATHERQPD (%RSI,%YMM29,8),%YMM23{%K1} |
(101) 0x41d4bb VPADDQ %YMM2,%YMM6,%YMM6 |
(101) 0x41d4bf KXNORW %K0,%K0,%K1 |
(101) 0x41d4c3 VXORPD %XMM11,%XMM11,%XMM11 |
(101) 0x41d4c8 VPADDQ %YMM2,%YMM30,%YMM14 |
(101) 0x41d4ce KXNORW %K0,%K0,%K2 |
(101) 0x41d4d2 VGATHERQPD (%R15,%YMM6,8),%YMM11{%K1} |
(101) 0x41d4d9 VXORPD %XMM15,%XMM15,%XMM15 |
(101) 0x41d4de VMOVDQU 0x1c0(%RSP),%YMM6 |
(101) 0x41d4e7 VPMULLQ %YMM3,%YMM6,%YMM6 |
(101) 0x41d4ed VPADDQ %YMM0,%YMM25,%YMM30 |
(101) 0x41d4f3 VGATHERQPD (%RDI,%YMM14,8),%YMM15{%K2} |
(101) 0x41d4fa KXNORW %K0,%K0,%K1 |
(101) 0x41d4fe VXORPD %XMM14,%XMM14,%XMM14 |
(101) 0x41d503 VPXORD %XMM25,%XMM25,%XMM25 |
(101) 0x41d509 VPMULLQ %YMM1,%YMM17,%YMM25 |
(101) 0x41d50f VGATHERQPD (%RSI,%YMM30,8),%YMM14{%K1} |
(101) 0x41d516 VPADDQ %YMM2,%YMM25,%YMM18 |
(101) 0x41d51c KXNORW %K0,%K0,%K1 |
(101) 0x41d520 VXORPD %XMM19,%XMM19,%XMM19 |
(101) 0x41d526 VGATHERQPD (%RSI,%YMM18,8),%YMM19{%K1} |
(101) 0x41d52d VPADDQ %YMM2,%YMM6,%YMM6 |
(101) 0x41d531 VPADDQ %YMM0,%YMM25,%YMM25 |
(101) 0x41d537 KXNORW %K0,%K0,%K1 |
(101) 0x41d53b VXORPD %XMM20,%XMM20,%XMM20 |
(101) 0x41d541 VGATHERQPD (%RSI,%YMM25,8),%YMM20{%K1} |
(101) 0x41d548 KXNORW %K0,%K0,%K1 |
(101) 0x41d54c VXORPD %XMM21,%XMM21,%XMM21 |
(101) 0x41d552 VPMULLQ %YMM1,%YMM16,%YMM10 |
(101) 0x41d558 MOV 0xb8(%RSP),%RAX |
(101) 0x41d560 VGATHERQPD (%RAX,%YMM6,8),%YMM21{%K1} |
(101) 0x41d567 VPADDQ %YMM2,%YMM10,%YMM6 |
(101) 0x41d56b KXNORW %K0,%K0,%K1 |
(101) 0x41d56f VPXOR %XMM10,%XMM10,%XMM10 |
(101) 0x41d574 VGATHERQPD (%RBX,%YMM6,8),%YMM10{%K1} |
(101) 0x41d57b VMULPD %YMM4,%YMM7,%YMM4 |
(101) 0x41d57f VFMADD213PD %YMM4,%YMM26,%YMM27 |
(101) 0x41d585 VFMADD213PD %YMM27,%YMM28,%YMM31 |
(101) 0x41d58b VFMADD213PD %YMM31,%YMM11,%YMM15 |
(101) 0x41d591 VSUBPD %YMM23,%YMM14,%YMM7 |
(101) 0x41d597 VMULPD 0x48b4f(%RIP){1to4},%YMM15,%YMM4 |
(101) 0x41d5a1 VMOVUPD 0x1e0(%RSP),%YMM11 |
(101) 0x41d5aa VDIVPD %YMM4,%YMM11,%YMM4 |
(101) 0x41d5ae VMULPD %YMM24,%YMM7,%YMM7 |
(101) 0x41d5b4 VMOVDQU 0x1a0(%RSP),%YMM11 |
(101) 0x41d5bd VPMULLQ %YMM3,%YMM11,%YMM11 |
(101) 0x41d5c3 VSUBPD %YMM19,%YMM20,%YMM14 |
(101) 0x41d5c9 VFMADD213PD %YMM7,%YMM10,%YMM14 |
(101) 0x41d5ce VFMADD213PD %YMM21,%YMM4,%YMM14 |
(101) 0x41d5d4 VMOVDQU 0x160(%RSP),%YMM7 |
(101) 0x41d5dd VXORPS %XMM10,%XMM10,%XMM10 |
(101) 0x41d5e2 VPMULLQ %YMM3,%YMM7,%YMM10 |
(101) 0x41d5e8 VPADDQ %YMM2,%YMM11,%YMM26 |
(101) 0x41d5ee KXNORW %K0,%K0,%K1 |
(101) 0x41d5f2 MOV 0x28(%RSP),%RDX |
(101) 0x41d5f7 VSCATTERQPD %YMM14,(%RDX,%YMM26,8){%K1} |
(101) 0x41d5fe VPADDQ %YMM2,%YMM10,%YMM7 |
(101) 0x41d602 KXNORW %K0,%K0,%K1 |
(101) 0x41d606 VPXOR %XMM11,%XMM11,%XMM11 |
(101) 0x41d60b MOV 0xb0(%RSP),%RCX |
(101) 0x41d613 VGATHERQPD (%RCX,%YMM7,8),%YMM11{%K1} |
(101) 0x41d61a KXNORW %K0,%K0,%K1 |
(101) 0x41d61e VXORPD %XMM14,%XMM14,%XMM14 |
(101) 0x41d623 VGATHERQPD (%RSI,%YMM29,8),%YMM14{%K1} |
(101) 0x41d62a KXNORW %K0,%K0,%K1 |
(101) 0x41d62e VXORPD %XMM15,%XMM15,%XMM15 |
(101) 0x41d633 VGATHERQPD (%RSI,%YMM18,8),%YMM15{%K1} |
(101) 0x41d63a KXNORW %K0,%K0,%K1 |
(101) 0x41d63e VXORPD %XMM18,%XMM18,%XMM18 |
(101) 0x41d644 VGATHERQPD (%RSI,%YMM30,8),%YMM18{%K1} |
(101) 0x41d64b VMOVDQU64 0x180(%RSP),%YMM19 |
(101) 0x41d653 VPMULLQ %YMM3,%YMM19,%YMM19 |
(101) 0x41d659 KXNORW %K0,%K0,%K1 |
(101) 0x41d65d VXORPD %XMM20,%XMM20,%XMM20 |
(101) 0x41d663 VGATHERQPD (%RSI,%YMM25,8),%YMM20{%K1} |
(101) 0x41d66a VPADDQ %YMM2,%YMM19,%YMM19 |
(101) 0x41d670 KXNORW %K0,%K0,%K1 |
(101) 0x41d674 VXORPD %XMM21,%XMM21,%XMM21 |
(101) 0x41d67a MOV 0x40(%RSP),%RAX |
(101) 0x41d67f VGATHERQPD (%RAX,%YMM19,8),%YMM21{%K1} |
(101) 0x41d686 VPADDQ %YMM0,%YMM10,%YMM27 |
(101) 0x41d68c KXNORW %K0,%K0,%K1 |
(101) 0x41d690 VPXOR %XMM10,%XMM10,%XMM10 |
(101) 0x41d695 VGATHERQPD (%RCX,%YMM27,8),%YMM10{%K1} |
(101) 0x41d69c VSUBPD %YMM14,%YMM15,%YMM14 |
(101) 0x41d6a1 VSUBPD %YMM18,%YMM20,%YMM15 |
(101) 0x41d6a7 VMOVDQU64 0x140(%RSP),%YMM18 |
(101) 0x41d6af VPMULLQ %YMM3,%YMM18,%YMM18 |
(101) 0x41d6b5 VMULPD %YMM11,%YMM14,%YMM11 |
(101) 0x41d6ba VFMADD213PD %YMM11,%YMM10,%YMM15 |
(101) 0x41d6bf VPADDQ %YMM2,%YMM18,%YMM28 |
(101) 0x41d6c5 VPMULLQ %YMM3,%YMM22,%YMM3 |
(101) 0x41d6cb VFMADD213PD %YMM21,%YMM4,%YMM15 |
(101) 0x41d6d1 KXNORW %K0,%K0,%K1 |
(101) 0x41d6d5 MOV 0xa8(%RSP),%RAX |
(101) 0x41d6dd VSCATTERQPD %YMM15,(%RAX,%YMM28,8){%K1} |
(101) 0x41d6e4 VPADDQ %YMM2,%YMM3,%YMM10 |
(101) 0x41d6e8 KXNORW %K0,%K0,%K1 |
(101) 0x41d6ec VXORPD %XMM11,%XMM11,%XMM11 |
(101) 0x41d6f1 VGATHERQPD (%R14,%YMM10,8),%YMM11{%K1} |
(101) 0x41d6f8 VPADDQ %YMM0,%YMM3,%YMM3 |
(101) 0x41d6fc KXNORW %K0,%K0,%K1 |
(101) 0x41d700 VXORPD %XMM14,%XMM14,%XMM14 |
(101) 0x41d705 VGATHERQPD (%R14,%YMM3,8),%YMM14{%K1} |
(101) 0x41d70c KXNORW %K0,%K0,%K1 |
(101) 0x41d710 VXORPD %XMM15,%XMM15,%XMM15 |
(101) 0x41d715 VPMULLQ %YMM1,%YMM22,%YMM1 |
(101) 0x41d71b VGATHERQPD (%RBX,%YMM5,8),%YMM15{%K1} |
(101) 0x41d722 VPADDQ %YMM2,%YMM1,%YMM2 |
(101) 0x41d726 KXNORW %K0,%K0,%K1 |
(101) 0x41d72a VXORPD %XMM5,%XMM5,%XMM5 |
(101) 0x41d72e VGATHERQPD (%R14,%YMM2,8),%YMM5{%K1} |
(101) 0x41d735 VPADDQ %YMM0,%YMM1,%YMM0 |
(101) 0x41d739 KXNORW %K0,%K0,%K1 |
(101) 0x41d73d VPXOR %XMM1,%XMM1,%XMM1 |
(101) 0x41d741 VGATHERQPD (%R14,%YMM0,8),%YMM1{%K1} |
(101) 0x41d748 KXNORW %K0,%K0,%K1 |
(101) 0x41d74c VPXORD %XMM18,%XMM18,%XMM18 |
(101) 0x41d752 VGATHERQPD (%RBX,%YMM6,8),%YMM18{%K1} |
(101) 0x41d759 KXNORW %K0,%K0,%K1 |
(101) 0x41d75d VXORPD %XMM6,%XMM6,%XMM6 |
(101) 0x41d761 VGATHERQPD (%RDX,%YMM26,8),%YMM6{%K1} |
(101) 0x41d768 VSUBPD %YMM11,%YMM14,%YMM11 |
(101) 0x41d76d VMULPD %YMM15,%YMM11,%YMM11 |
(101) 0x41d772 VSUBPD %YMM5,%YMM1,%YMM1 |
(101) 0x41d776 VFMADD213PD %YMM11,%YMM18,%YMM1 |
(101) 0x41d77c VFMADD213PD %YMM6,%YMM4,%YMM1 |
(101) 0x41d781 KXNORW %K0,%K0,%K1 |
(101) 0x41d785 VSCATTERQPD %YMM1,(%RDX,%YMM26,8){%K1} |
(101) 0x41d78c KXNORW %K0,%K0,%K1 |
(101) 0x41d790 VXORPD %XMM1,%XMM1,%XMM1 |
(101) 0x41d794 VGATHERQPD (%R14,%YMM10,8),%YMM1{%K1} |
(101) 0x41d79b KXNORW %K0,%K0,%K1 |
(101) 0x41d79f VXORPD %XMM5,%XMM5,%XMM5 |
(101) 0x41d7a3 VGATHERQPD (%R14,%YMM2,8),%YMM5{%K1} |
(101) 0x41d7aa KXNORW %K0,%K0,%K1 |
(101) 0x41d7ae VXORPD %XMM2,%XMM2,%XMM2 |
(101) 0x41d7b2 VGATHERQPD (%RCX,%YMM7,8),%YMM2{%K1} |
(101) 0x41d7b9 KXNORW %K0,%K0,%K1 |
(101) 0x41d7bd VXORPD %XMM6,%XMM6,%XMM6 |
(101) 0x41d7c1 VGATHERQPD (%R14,%YMM3,8),%YMM6{%K1} |
(101) 0x41d7c8 KXNORW %K0,%K0,%K1 |
(101) 0x41d7cc VXORPD %XMM3,%XMM3,%XMM3 |
(101) 0x41d7d0 VGATHERQPD (%R14,%YMM0,8),%YMM3{%K1} |
(101) 0x41d7d7 KXNORW %K0,%K0,%K1 |
(101) 0x41d7db VXORPD %XMM0,%XMM0,%XMM0 |
(101) 0x41d7df VGATHERQPD (%RCX,%YMM27,8),%YMM0{%K1} |
(101) 0x41d7e6 KXNORW %K0,%K0,%K1 |
(101) 0x41d7ea VXORPD %XMM7,%XMM7,%XMM7 |
(101) 0x41d7ee VGATHERQPD (%RAX,%YMM28,8),%YMM7{%K1} |
(101) 0x41d7f5 VSUBPD %YMM1,%YMM5,%YMM1 |
(101) 0x41d7f9 VMULPD %YMM2,%YMM1,%YMM1 |
(101) 0x41d7fd VSUBPD %YMM6,%YMM3,%YMM2 |
(101) 0x41d801 VFMADD213PD %YMM1,%YMM0,%YMM2 |
(101) 0x41d806 VFMADD213PD %YMM7,%YMM4,%YMM2 |
(101) 0x41d80b KXNORW %K0,%K0,%K1 |
(101) 0x41d80f VSCATTERQPD %YMM2,(%RAX,%YMM28,8){%K1} |
(101) 0x41d816 VPADDQ 0x488d8(%RIP){1to4},%YMM9,%YMM9 |
(101) 0x41d820 ADD $0x4,%R13 |
(101) 0x41d824 CMP %R10,%R13 |
(101) 0x41d827 JB 41d370 |
0x41d82d CMP %R10,0xd0(%RSP) |
0x41d835 VMOVDQU 0x120(%RSP),%XMM3 |
0x41d83e MOV 0x18(%RSP),%R11 |
0x41d843 JNE 41d873 |
0x41d845 MOV $0x6823b0,%EDI |
0x41d84a MOV 0x58(%RSP),%ESI |
0x41d84e LEA -0x28(%RBP),%RSP |
0x41d852 POP %RBX |
0x41d853 POP %R12 |
0x41d855 POP %R13 |
0x41d857 POP %R14 |
0x41d859 POP %R15 |
0x41d85b POP %RBP |
0x41d85c VZEROUPPER |
0x41d85f JMP 402e90 |
0x41d864 LEA -0x28(%RBP),%RSP |
0x41d868 POP %RBX |
0x41d869 POP %R12 |
0x41d86b POP %R13 |
0x41d86d POP %R14 |
0x41d86f POP %R15 |
0x41d871 POP %RBP |
0x41d872 RET |
0x41d873 ADD %R10,%R11 |
0x41d876 JMP 41dafe |
0x41d87b NOPL (%RAX,%RAX,1) |
(100) 0x41d880 MOV %R11,%RAX |
(100) 0x41d883 CQTO |
(100) 0x41d885 IDIV %RDI |
(100) 0x41d888 ADD 0x34(%RSP),%ECX |
(100) 0x41d88c ADD 0x50(%RSP),%EDX |
(100) 0x41d890 LEA -0x1(%RCX),%EAX |
(100) 0x41d893 CLTQ |
(100) 0x41d895 MOV %R12,%R8 |
(100) 0x41d898 IMUL %RAX,%R8 |
(100) 0x41d89c MOVSXD %EDX,%RDX |
(100) 0x41d89f LEA -0x1(%R8,%RDX,1),%R9 |
(100) 0x41d8a4 MOV 0x90(%RSP),%R13 |
(100) 0x41d8ac MOV %R13,%R10 |
(100) 0x41d8af IMUL %RAX,%R10 |
(100) 0x41d8b3 LEA -0x1(%R10,%RDX,1),%R11 |
(100) 0x41d8b8 MOV 0x110(%RSP),%RBX |
(100) 0x41d8c0 VMOVSD (%RBX,%R11,8),%XMM0 |
(100) 0x41d8c6 MOV 0x98(%RSP),%RDI |
(100) 0x41d8ce VMULSD (%RDI,%R9,8),%XMM0,%XMM0 |
(100) 0x41d8d4 MOVSXD %ECX,%RCX |
(100) 0x41d8d7 MOV %R12,%R9 |
(100) 0x41d8da IMUL %RCX,%R9 |
(100) 0x41d8de LEA -0x1(%R9,%RDX,1),%R11 |
(100) 0x41d8e3 MOV %R13,%R12 |
(100) 0x41d8e6 IMUL %RCX,%R12 |
(100) 0x41d8ea LEA -0x1(%R12,%RDX,1),%R13 |
(100) 0x41d8ef VMOVSD (%RBX,%R13,8),%XMM1 |
(100) 0x41d8f5 VFMADD132SD (%RDI,%R11,8),%XMM0,%XMM1 |
(100) 0x41d8fb ADD %RDX,%R9 |
(100) 0x41d8fe ADD %RDX,%R12 |
(100) 0x41d901 VMOVSD (%RBX,%R12,8),%XMM0 |
(100) 0x41d907 VFMADD132SD (%RDI,%R9,8),%XMM1,%XMM0 |
(100) 0x41d90d ADD %RDX,%R8 |
(100) 0x41d910 ADD %RDX,%R10 |
(100) 0x41d913 VMOVSD (%RBX,%R10,8),%XMM1 |
(100) 0x41d919 VFMADD132SD (%RDI,%R8,8),%XMM0,%XMM1 |
(100) 0x41d91f VMULSD 0x487c9(%RIP),%XMM1,%XMM0 |
(100) 0x41d927 VDIVSD %XMM0,%XMM3,%XMM0 |
(100) 0x41d92b MOV 0x108(%RSP),%R10 |
(100) 0x41d933 IMUL %RCX,%R10 |
(100) 0x41d937 ADD %RDX,%R10 |
(100) 0x41d93a MOV 0x88(%RSP),%R9 |
(100) 0x41d942 MOV %R9,%R8 |
(100) 0x41d945 IMUL %RCX,%R8 |
(100) 0x41d949 ADD %RDX,%R8 |
(100) 0x41d94c MOV 0x100(%RSP),%RDI |
(100) 0x41d954 MOV %RDI,%R13 |
(100) 0x41d957 IMUL %RCX,%R13 |
(100) 0x41d95b LEA -0x1(%R13,%RDX,1),%R11 |
(100) 0x41d960 ADD %RDX,%R13 |
(100) 0x41d963 MOV 0x80(%RSP),%R15 |
(100) 0x41d96b VMOVSD (%R15,%R11,8),%XMM1 |
(100) 0x41d971 VSUBSD (%R15,%R13,8),%XMM1,%XMM1 |
(100) 0x41d977 MOV 0x20(%RSP),%RSI |
(100) 0x41d97c VMULSD (%RSI,%R8,8),%XMM1,%XMM1 |
(100) 0x41d982 MOV %RAX,%R12 |
(100) 0x41d985 IMUL %RAX,%R9 |
(100) 0x41d989 ADD %RDX,%R9 |
(100) 0x41d98c IMUL %RAX,%RDI |
(100) 0x41d990 LEA -0x1(%RDI,%RDX,1),%RAX |
(100) 0x41d995 ADD %RDX,%RDI |
(100) 0x41d998 VMOVSD (%R15,%RAX,8),%XMM2 |
(100) 0x41d99e VSUBSD (%R15,%RDI,8),%XMM2,%XMM2 |
(100) 0x41d9a4 VFMADD132SD (%RSI,%R9,8),%XMM1,%XMM2 |
(100) 0x41d9aa MOV 0xb8(%RSP),%RBX |
(100) 0x41d9b2 VFMADD213SD (%RBX,%R10,8),%XMM0,%XMM2 |
(100) 0x41d9b8 MOV 0xf8(%RSP),%R10 |
(100) 0x41d9c0 IMUL %RCX,%R10 |
(100) 0x41d9c4 ADD %RDX,%R10 |
(100) 0x41d9c7 MOV 0x28(%RSP),%RSI |
(100) 0x41d9cc VMOVSD %XMM2,(%RSI,%R10,8) |
(100) 0x41d9d2 VMOVSD (%R15,%RDI,8),%XMM1 |
(100) 0x41d9d8 MOV 0xf0(%RSP),%RDI |
(100) 0x41d9e0 IMUL %RCX,%RDI |
(100) 0x41d9e4 ADD %RDX,%RDI |
(100) 0x41d9e7 VSUBSD (%R15,%R13,8),%XMM1,%XMM1 |
(100) 0x41d9ed MOV 0xe8(%RSP),%R13 |
(100) 0x41d9f5 IMUL %RCX,%R13 |
(100) 0x41d9f9 VMOVSD (%R15,%RAX,8),%XMM2 |
(100) 0x41d9ff LEA (%R13,%RDX,1),%RAX |
(100) 0x41da04 MOV %RAX,0x60(%RSP) |
(100) 0x41da09 MOV 0xb0(%RSP),%R14 |
(100) 0x41da11 VMULSD (%R14,%RAX,8),%XMM1,%XMM1 |
(100) 0x41da17 LEA -0x1(%R13,%RDX,1),%R13 |
(100) 0x41da1c VSUBSD (%R15,%R11,8),%XMM2,%XMM2 |
(100) 0x41da22 VFMADD132SD (%R14,%R13,8),%XMM1,%XMM2 |
(100) 0x41da28 MOV 0x40(%RSP),%R11 |
(100) 0x41da2d VFMADD213SD (%R11,%RDI,8),%XMM0,%XMM2 |
(100) 0x41da33 MOV 0xe0(%RSP),%R11 |
(100) 0x41da3b IMUL %RCX,%R11 |
(100) 0x41da3f ADD %RDX,%R11 |
(100) 0x41da42 MOV 0xa8(%RSP),%R15 |
(100) 0x41da4a VMOVSD %XMM2,(%R15,%R11,8) |
(100) 0x41da50 MOV 0xd8(%RSP),%RSI |
(100) 0x41da58 IMUL %RSI,%RCX |
(100) 0x41da5c LEA -0x1(%RCX,%RDX,1),%RBX |
(100) 0x41da61 ADD %RDX,%RCX |
(100) 0x41da64 MOV 0x38(%RSP),%RAX |
(100) 0x41da69 VMOVSD (%RAX,%RBX,8),%XMM1 |
(100) 0x41da6e VSUBSD (%RAX,%RCX,8),%XMM1,%XMM1 |
(100) 0x41da73 MOV 0x20(%RSP),%RDI |
(100) 0x41da78 VMULSD (%RDI,%R8,8),%XMM1,%XMM1 |
(100) 0x41da7e IMUL %RSI,%R12 |
(100) 0x41da82 LEA (%R12,%RDX,1),%R8 |
(100) 0x41da86 LEA -0x1(%R12,%RDX,1),%RDX |
(100) 0x41da8b VMOVSD (%RAX,%RDX,8),%XMM2 |
(100) 0x41da90 VSUBSD (%RAX,%R8,8),%XMM2,%XMM2 |
(100) 0x41da96 VFMADD132SD (%RDI,%R9,8),%XMM1,%XMM2 |
(100) 0x41da9c MOV 0x28(%RSP),%RSI |
(100) 0x41daa1 VFMADD213SD (%RSI,%R10,8),%XMM0,%XMM2 |
(100) 0x41daa7 VMOVSD %XMM2,(%RSI,%R10,8) |
(100) 0x41daad VMOVSD (%RAX,%R8,8),%XMM1 |
(100) 0x41dab3 VSUBSD (%RAX,%RCX,8),%XMM1,%XMM1 |
(100) 0x41dab8 MOV %RAX,%RCX |
(100) 0x41dabb MOV 0x60(%RSP),%RAX |
(100) 0x41dac0 VMULSD (%R14,%RAX,8),%XMM1,%XMM1 |
(100) 0x41dac6 VMOVSD (%RCX,%RDX,8),%XMM2 |
(100) 0x41dacb MOV %R15,%RAX |
(100) 0x41dace MOV %R14,%R15 |
(100) 0x41dad1 VSUBSD (%RCX,%RBX,8),%XMM2,%XMM2 |
(100) 0x41dad6 VFMADD132SD (%R14,%R13,8),%XMM1,%XMM2 |
(100) 0x41dadc VFMADD213SD (%RAX,%R11,8),%XMM0,%XMM2 |
(100) 0x41dae2 VMOVSD %XMM2,(%RAX,%R11,8) |
(100) 0x41dae8 MOV 0x18(%RSP),%R11 |
(100) 0x41daed INC %R11 |
(100) 0x41daf0 CMP 0xa0(%RSP),%R11 |
(100) 0x41daf8 JG 41d845 |
(100) 0x41dafe MOV %R11,%R8 |
(100) 0x41db01 SHR $0x20,%R8 |
(100) 0x41db05 JE 41db30 |
(100) 0x41db07 MOV %R11,%RAX |
(100) 0x41db0a XOR %EDX,%EDX |
(100) 0x41db0c MOV 0x78(%RSP),%RDI |
(100) 0x41db11 DIV %RDI |
(100) 0x41db14 MOV %RAX,%RCX |
(100) 0x41db17 MOV 0x48(%RSP),%R12 |
(100) 0x41db1c TEST %R8,%R8 |
(100) 0x41db1f MOV %R11,0x18(%RSP) |
(100) 0x41db24 JNE 41d880 |
(100) 0x41db2a JMP 41db51 |
0x41db2c NOPL (%RAX) |
(100) 0x41db30 MOV %R11D,%EAX |
(100) 0x41db33 XOR %EDX,%EDX |
(100) 0x41db35 MOV 0x78(%RSP),%RDI |
(100) 0x41db3a DIV %EDI |
(100) 0x41db3c MOV %EAX,%ECX |
(100) 0x41db3e MOV 0x48(%RSP),%R12 |
(100) 0x41db43 TEST %R8,%R8 |
(100) 0x41db46 MOV %R11,0x18(%RSP) |
(100) 0x41db4b JNE 41d880 |
(100) 0x41db51 MOV %R11D,%EAX |
(100) 0x41db54 XOR %EDX,%EDX |
(100) 0x41db56 DIV %EDI |
(100) 0x41db58 JMP 41d888 |
0x41db5d NOPL (%RAX) |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►100.00+ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Path / |
Source file and lines | accelerate.cpp:40-54 |
Module | exec |
nb instructions | 182 |
nb uops | 184 |
loop length | 922 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 8 |
used zmm registers | 0 |
nb stack references | 53 |
micro-operation queue | 30.67 cycles |
front end | 30.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 5.40 | 5.20 | 23.33 | 23.33 | 28.00 | 15.00 | 5.20 | 28.00 | 28.00 | 28.00 | 5.20 | 23.33 |
cycles | 5.40 | 5.20 | 23.33 | 23.33 | 28.00 | 15.00 | 5.20 | 28.00 | 28.00 | 28.00 | 5.20 | 23.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 30.49 |
Stall cycles | 0.00 |
Front-end | 30.67 |
Dispatch | 28.00 |
Overall L1 | 30.67 |
all | 14% |
load | 13% |
store | 19% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 50% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 4% |
all | 15% |
load | 14% |
store | 17% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 28% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x220,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R8,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x68(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x58(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x50(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVQ 0x40(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RBP),%EDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %EDX,0x34(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVL $0,0x5c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 41d864 <_Z17accelerate_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_.extracted+0x834> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R11,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,0xc8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVQ $0x1,0x118(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0x120(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x64(%RSP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0xd0(%RSP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0xc8(%RSP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x682390,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x22,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
VMOVDQU %XMM0,0x140(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
CALL 403020 <__kmpc_for_static_init_8@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVDQU 0x140(%RSP),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
ADD $0x20,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0xc8(%RSP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xc0(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %RAX,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JA 41d845 <_Z17accelerate_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_.extracted+0x815> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R15,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB 0x50(%RSP),%ECX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV (%R13),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R13),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x1(%R11),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xa0(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%RDI),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R10,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %RAX,%R10 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV (%R12),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R12),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R14),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%R14),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0xb8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RBX),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x18(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x60(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RDI),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDI,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %R11,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $-0x4,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R10,0xd0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
AND %R10,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %RDI,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x48(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R12,0x110(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,0x100(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,0xd8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,0x108(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,0xf8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,0xf0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,0xe8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 41dafe <_Z17accelerate_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_.extracted+0xace> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VPBROADCASTQ %RCX,%YMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0x34(%RSP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTD %EAX,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %XMM0,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV 0x50(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTD %EAX,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %XMM0,0x130(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPBROADCASTQ %RDI,%YMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0x90(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %RAX,%YMM13 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %XMM3,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x1e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPBROADCASTQ %R9,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x1c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV 0x88(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %RAX,%YMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %R14,%YMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %RBX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x1a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPBROADCASTQ %RDX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x180(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPBROADCASTQ %R13,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x160(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPBROADCASTQ %R8,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x140(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPBROADCASTQ %RSI,%YMM22 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R11,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ %R11,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ 0x48db9(%RIP),%YMM0,%YMM9 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.40 |
XOR %R13D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x98(%RSP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RSP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x80(%RSP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RSP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R10,0xd0(%RSP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
VMOVDQU 0x120(%RSP),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV 0x18(%RSP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 41d873 <_Z17accelerate_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_.extracted+0x843> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x6823b0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x58(%RSP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JMP 402e90 <__kmpc_for_static_fini@plt> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
ADD %R10,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JMP 41dafe <_Z17accelerate_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_.extracted+0xace> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | accelerate.cpp:40-54 |
Module | exec |
nb instructions | 182 |
nb uops | 184 |
loop length | 922 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 8 |
used zmm registers | 0 |
nb stack references | 53 |
micro-operation queue | 30.67 cycles |
front end | 30.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 5.40 | 5.20 | 23.33 | 23.33 | 28.00 | 15.00 | 5.20 | 28.00 | 28.00 | 28.00 | 5.20 | 23.33 |
cycles | 5.40 | 5.20 | 23.33 | 23.33 | 28.00 | 15.00 | 5.20 | 28.00 | 28.00 | 28.00 | 5.20 | 23.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 30.49 |
Stall cycles | 0.00 |
Front-end | 30.67 |
Dispatch | 28.00 |
Overall L1 | 30.67 |
all | 14% |
load | 13% |
store | 19% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 50% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 4% |
all | 15% |
load | 14% |
store | 17% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 28% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x220,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R8,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x68(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x58(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x50(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVQ 0x40(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RBP),%EDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %EDX,0x34(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVL $0,0x5c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 41d864 <_Z17accelerate_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_.extracted+0x834> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R11,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVQ $0,0xc8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVQ $0x1,0x118(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0x120(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x64(%RSP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0xd0(%RSP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0xc8(%RSP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x682390,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x22,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
VMOVDQU %XMM0,0x140(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
CALL 403020 <__kmpc_for_static_init_8@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVDQU 0x140(%RSP),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
ADD $0x20,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0xc8(%RSP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xc0(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %RAX,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JA 41d845 <_Z17accelerate_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_.extracted+0x815> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R15,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB 0x50(%RSP),%ECX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV (%R13),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R13),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x1(%R11),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0xa0(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%RDI),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R10,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %RAX,%R10 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV (%R12),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R12),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R14),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%R14),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0xb8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RBX),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x18(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x60(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RDI),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDI,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %R11,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $-0x4,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R10,0xd0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
AND %R10,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %RDI,%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x48(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R12,0x110(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,0x100(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,0xd8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,0x108(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,0xf8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,0xf0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,0xe8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JE 41dafe <_Z17accelerate_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_.extracted+0xace> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VPBROADCASTQ %RCX,%YMM8 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0x34(%RSP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTD %EAX,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %XMM0,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV 0x50(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTD %EAX,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %XMM0,0x130(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPBROADCASTQ %RDI,%YMM12 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0x90(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %RAX,%YMM13 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %XMM3,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x1e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPBROADCASTQ %R9,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x1c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
MOV 0x88(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VPBROADCASTQ %RAX,%YMM16 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %R14,%YMM17 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPBROADCASTQ %RBX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x1a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPBROADCASTQ %RDX,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x180(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPBROADCASTQ %R13,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x160(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPBROADCASTQ %R8,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VMOVDQU %YMM0,0x140(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0-1 | 0.50 |
VPBROADCASTQ %RSI,%YMM22 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R11,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VPBROADCASTQ %R11,%YMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ 0x48db9(%RIP),%YMM0,%YMM9 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.40 |
XOR %R13D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x98(%RSP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RSP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x80(%RSP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RSP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R10,0xd0(%RSP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
VMOVDQU 0x120(%RSP),%XMM3 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV 0x18(%RSP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 41d873 <_Z17accelerate_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_.extracted+0x843> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x6823b0,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x58(%RSP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
JMP 402e90 <__kmpc_for_static_fini@plt> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
ADD %R10,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JMP 41dafe <_Z17accelerate_kerneliiiidRN6clover8Buffer2DIdEES2_S2_S2_S2_S2_S2_S2_S2_S2_.extracted+0xace> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼accelerate_kernel(int, int, int, int, double, clover::Buffer2D | 2.31 | 2.82 |
○Loop 101 - accelerate.cpp:41-54 - exec | 2.31 | 2.8 |
○Loop 100 - accelerate.cpp:41-54 - exec | 0 | 0 |