Name | Module | Coverage (%) | Inclusive Time w.r.t. Wall Time(s) | Max Inc. Time over Threads(s) | Nb Threads | GFLOP/s | Deviation (coverage) | Deviation (time) |
Neoverse V1 ACFL Ofast Manual Unroll ONLY (no Hoisting) (250 iterations, 64 threads) | Neoverse V1 ACFL Ofast Hoisting ONLY (no Unroll) (250 iterations, 64 threads) | Neoverse V1 ACFL Ofast Manual Unroll ONLY (no Hoisting) (250 iterations, 64 threads) | Neoverse V1 ACFL Ofast Hoisting ONLY (no Unroll) (250 iterations, 64 threads) | Neoverse V1 ACFL Ofast Manual Unroll ONLY (no Hoisting) (250 iterations, 64 threads) | Neoverse V1 ACFL Ofast Hoisting ONLY (no Unroll) (250 iterations, 64 threads) | Neoverse V1 ACFL Ofast Manual Unroll ONLY (no Hoisting) (250 iterations, 64 threads) | Neoverse V1 ACFL Ofast Hoisting ONLY (no Unroll) (250 iterations, 64 threads) | Neoverse V1 ACFL Ofast Manual Unroll ONLY (no Hoisting) (250 iterations, 64 threads) | Neoverse V1 ACFL Ofast Hoisting ONLY (no Unroll) (250 iterations, 64 threads) | Neoverse V1 ACFL Ofast Manual Unroll ONLY (no Hoisting) (250 iterations, 64 threads) | Neoverse V1 ACFL Ofast Hoisting ONLY (no Unroll) (250 iterations, 64 threads) | Neoverse V1 ACFL Ofast Manual Unroll ONLY (no Hoisting) (250 iterations, 64 threads) | Neoverse V1 ACFL Ofast Hoisting ONLY (no Unroll) (250 iterations, 64 threads) |
k_means(int, point_t*, point_t*, int*, int, int) [clone .omp_outlined] | binary | 72.09 | 72.87 | 13.27 | 14.78 | 16.49 | 17.97 | 64 | 64 | 5.66 | 5.05 | 7.98 | 6.04 | 1.43 | 1.08 |
kmp_flag_64<false, true>::wait(kmp_info*, int, void*) | libomp.so | 18.39 | 19.12 | 3.38 | 3.88 | 5.63 | 4.20 | 64 | 64 | 0.00 | 0.00 | 5.50 | 2.84 | 0.95 | 0.57 |
k_means(int, point_t*, point_t*, int*, int, int) [clone .omp_outlined.3] | binary | 7.44 | 5.83 | 1.37 | 1.18 | 1.76 | 1.76 | 64 | 64 | 1.72 | 0.94 | 3.20 | 3.51 | 0.57 | 0.70 |
kmp_flag_native<unsigned long long, (flag_type)1, true>::notdone_check() | libomp.so | 1.10 | 1.16 | 0.20 | 0.24 | 0.31 | 0.28 | 64 | 63 | 0.00 | 0.00 | 0.34 | 0.11 | 0.06 | 0.02 |
__sched_yield | libc.so.6 | 0.89 | 0.91 | 0.16 | 0.19 | 0.28 | 0.22 | 64 | 63 | 0.00 | 0.00 | 0.27 | 0.10 | 0.05 | 0.02 |
@plt_start@ | libomp.so | 0.06 | 0.07 | 0.01 | 0.01 | 0.02 | 0.02 | 64 | 63 | 0.00 | 0.00 | 0.03 | 0.02 | 0.00 | 0.00 |
__kmp_yield | libomp.so | 0.03 | 0.03 | 0.01 | 0.01 | 0.01 | 0.01 | 64 | 63 | 0.00 | 0.00 | 0.02 | 0.01 | 0.00 | 0.00 |
__kmp_finish_implicit_task | libomp.so | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 4 | 6 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
__kmp_invoke_task_func | libomp.so | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 4 | 5 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
__kmp_hyper_barrier_gather(barrier_type, kmp_info*, int, int, void (*)(void*, void*), void*) | libomp.so | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 5 | 4 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
__kmp_hyper_barrier_release(barrier_type, kmp_info*, int, int, int, void*) | libomp.so | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 4 | 5 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
__kmpc_for_static_fini | libomp.so | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 5 | 3 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
unknown_function | binary | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 5 | 3 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
__aarch64_ldadd8_acq_rel | libomp.so | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 4 | 4 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
__kmpc_reduce_nowait | libomp.so | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 1 | 5 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
kmp_flag_native<unsigned long long, (flag_type)1, true>::done_check() | libomp.so | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 4 | 1 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
__kmpc_for_static_init_4 | libomp.so | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 3 | 1 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
__kmp_join_barrier(int) | libomp.so | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 2 | 2 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
__kmp_barrier | libomp.so | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 1 | 3 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
__kmp_determine_reduction_method | libomp.so | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 1 | 2 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
__kmp_invoke_microtask | libomp.so | 0.00 | NA | 0.00 | NA | 0.00 | NA | 3 | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA |
k_means(int, point_t*, point_t*, int*, int, int) [clone .omp_outlined_debug__.2] [clone .omp] [clone .reduction] [clone .reduction_func] | binary | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 1 | 1 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
__kmp_launch_thread | libomp.so | 0.00 | NA | 0.00 | NA | 0.00 | NA | 1 | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA |
__kmpc_end_reduce_nowait | libomp.so | 0.00 | NA | 0.00 | NA | 0.00 | NA | 1 | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA |
__memset | libastring.so | 0.00 | NA | 0.00 | NA | 0.00 | NA | 1 | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA |
__vfscanf_internal | libc.so.6 | 0.00 | NA | 0.00 | NA | 0.00 | NA | 1 | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA |
__kmp_get_global_thread_id_reg | libomp.so | 0.00 | NA | 0.00 | NA | 0.00 | NA | 1 | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA |
__kmp_fork_call | libomp.so | 0.00 | NA | 0.00 | NA | 0.00 | NA | 1 | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA |
__kmp_resume_if_soft_paused | libomp.so | 0.00 | NA | 0.00 | NA | 0.00 | NA | 1 | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA |
__kmp_join_call | libomp.so | 0.00 | NA | 0.00 | NA | 0.00 | NA | 1 | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA |
unknown_kernel_region | kernel | 0.00 | NA | 0.00 | NA | 0.00 | NA | 8 | NA | NA | NA | 0.00 | NA | 0.00 | NA |