Name | Module | Coverage (%) | Inclusive Time w.r.t. Wall Time(s) | Max Inc. Time over Threads(s) | Nb Threads | GFLOP/s | Deviation (coverage) | Deviation (time) |
Neoverse V1 GCC O3 Manual Unroll (250 iterations, 64 threads) | Neoverse V1 ACFL Ofast Manual Unroll (250 iterations, 64 threads) | Neoverse V1 GCC O3 Manual Unroll (250 iterations, 64 threads) | Neoverse V1 ACFL Ofast Manual Unroll (250 iterations, 64 threads) | Neoverse V1 GCC O3 Manual Unroll (250 iterations, 64 threads) | Neoverse V1 ACFL Ofast Manual Unroll (250 iterations, 64 threads) | Neoverse V1 GCC O3 Manual Unroll (250 iterations, 64 threads) | Neoverse V1 ACFL Ofast Manual Unroll (250 iterations, 64 threads) | Neoverse V1 GCC O3 Manual Unroll (250 iterations, 64 threads) | Neoverse V1 ACFL Ofast Manual Unroll (250 iterations, 64 threads) | Neoverse V1 GCC O3 Manual Unroll (250 iterations, 64 threads) | Neoverse V1 ACFL Ofast Manual Unroll (250 iterations, 64 threads) | Neoverse V1 GCC O3 Manual Unroll (250 iterations, 64 threads) | Neoverse V1 ACFL Ofast Manual Unroll (250 iterations, 64 threads) |
k_means(int, point_t*, point_t*, int*, int, int) [clone ._omp_fn.0] | binary | 83.57 | NA | 27.39 | NA | 31.04 | NA | 64 | NA | 0.97 | NA | 6.02 | NA | 1.78 | NA |
k_means(int, point_t*, point_t*, int*, int, int) [clone .omp_outlined] | binary | NA | 66.55 | NA | 10.80 | NA | 12.53 | NA | 64 | NA | 2.26 | NA | 6.32 | NA | 0.92 |
kmp_flag_64<false, true>::wait(kmp_info*, int, void*) | libomp.so | NA | 23.21 | NA | 3.77 | NA | 4.05 | NA | 64 | NA | 0.00 | NA | 3.06 | NA | 0.50 |
gomp_team_barrier_wait_end | libgomp.so.1.0.0 | 10.67 | NA | 3.50 | NA | 6.12 | NA | 64 | NA | 0.00 | NA | 4.10 | NA | 1.33 | NA |
k_means(int, point_t*, point_t*, int*, int, int) [clone .omp_outlined.3] | binary | NA | 7.63 | NA | 1.24 | NA | 1.71 | NA | 64 | NA | 2.03 | NA | 3.86 | NA | 0.61 |
k_means(int, point_t*, point_t*, int*, int, int) [clone ._omp_fn.1] | binary | 3.55 | NA | 1.16 | NA | 1.75 | NA | 64 | NA | 1.54 | NA | 2.21 | NA | 0.72 | NA |
gomp_barrier_wait_end | libgomp.so.1.0.0 | 2.20 | NA | 0.72 | NA | 0.87 | NA | 63 | NA | 0.00 | NA | 0.70 | NA | 0.23 | NA |
kmp_flag_native<unsigned long long, (flag_type)1, true>::notdone_check() | libomp.so | NA | 1.39 | NA | 0.23 | NA | 0.28 | NA | 64 | NA | 0.00 | NA | 0.20 | NA | 0.03 |
__sched_yield | libc.so.6 | NA | 1.11 | NA | 0.18 | NA | 0.22 | NA | 64 | NA | 0.00 | NA | 0.16 | NA | 0.03 |
@plt_start@ | libomp.so | NA | 0.07 | NA | 0.01 | NA | 0.02 | NA | 63 | NA | 0.00 | NA | 0.02 | NA | 0.00 |
__kmp_yield | libomp.so | NA | 0.04 | NA | 0.01 | NA | 0.01 | NA | 64 | NA | 0.00 | NA | 0.02 | NA | 0.00 |
__kmpc_for_static_fini | libomp.so | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA | 10 | NA | 0.00 | NA | 0.00 | NA | 0.00 |
__aarch64_ldadd8_acq_rel | libomp.so | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA | 8 | NA | 0.00 | NA | 0.00 | NA | 0.00 |
__aarch64_ldadd4_acq_rel | libgomp.so.1.0.0 | 0.00 | NA | 0.00 | NA | 0.00 | NA | 9 | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA |
__kmp_hyper_barrier_release(barrier_type, kmp_info*, int, int, int, void*) | libomp.so | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA | 5 | NA | 0.00 | NA | 0.00 | NA | 0.00 |
__kmp_hyper_barrier_gather(barrier_type, kmp_info*, int, int, void (*)(void*, void*), void*) | libomp.so | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA | 4 | NA | 0.00 | NA | 0.00 | NA | 0.00 |
unknown_function | binary | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 2 | 3 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
__kmp_join_barrier(int) | libomp.so | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA | 3 | NA | 0.00 | NA | 0.00 | NA | 0.00 |
__kmpc_reduce_nowait | libomp.so | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA | 3 | NA | 0.00 | NA | 0.00 | NA | 0.00 |
__kmp_invoke_task_func | libomp.so | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA | 3 | NA | 0.00 | NA | 0.00 | NA | 0.00 |
__kmp_init_implicit_task | libomp.so | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA | 2 | NA | 0.00 | NA | 0.00 | NA | 0.00 |
kmp_flag_native<unsigned long long, (flag_type)1, true>::done_check() | libomp.so | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA | 2 | NA | 0.00 | NA | 0.00 | NA | 0.00 |
__kmpc_for_static_init_4 | libomp.so | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA | 2 | NA | 0.00 | NA | 0.00 | NA | 0.00 |
__kmp_launch_thread | libomp.so | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA | 2 | NA | 0.00 | NA | 0.00 | NA | 0.00 |
k_means(int, point_t*, point_t*, int*, int, int) [clone .omp_outlined_debug__.2] [clone .omp] [clone .reduction] [clone .reduction_func] | binary | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA | 2 | NA | 0.00 | NA | 0.00 | NA | 0.00 |
getenv | libc.so.6 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 1 | 1 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
gomp_thread_start | libgomp.so.1.0.0 | 0.00 | NA | 0.00 | NA | 0.00 | NA | 3 | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA |
gomp_ialias_omp_get_num_threads | libgomp.so.1.0.0 | 0.00 | NA | 0.00 | NA | 0.00 | NA | 3 | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA |
__aarch64_ldadd4_rel | libomp.so | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA | 1 | NA | 0.00 | NA | 0.00 | NA | 0.00 |
__kmp_fork_barrier(int, int) | libomp.so | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA | 1 | NA | 0.00 | NA | 0.00 | NA | 0.00 |
__kmp_task_team_sync | libomp.so | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA | 1 | NA | 0.00 | NA | 0.00 | NA | 0.00 |
__kmp_join_call | libomp.so | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA | 1 | NA | 0.00 | NA | 0.00 | NA | 0.00 |
__kmp_finish_implicit_task | libomp.so | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA | 1 | NA | 0.00 | NA | 0.00 | NA | 0.00 |
gomp_team_barrier_wait_final | libgomp.so.1.0.0 | 0.00 | NA | 0.00 | NA | 0.00 | NA | 2 | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA |
gomp_team_start | libgomp.so.1.0.0 | 0.00 | NA | 0.00 | NA | 0.00 | NA | 1 | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA |
GOMP_atomic_start | libgomp.so.1.0.0 | 0.00 | NA | 0.00 | NA | 0.00 | NA | 1 | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA |
k_means(int, point_t*, point_t*, int*, int, int) | binary | 0.00 | NA | 0.00 | NA | 0.00 | NA | 1 | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA |
__aarch64_swp4_rel | libgomp.so.1.0.0 | 0.00 | NA | 0.00 | NA | 0.00 | NA | 1 | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA |
__aarch64_cas4_acq | libgomp.so.1.0.0 | 0.00 | NA | 0.00 | NA | 0.00 | NA | 1 | NA | 0.00 | NA | 0.00 | NA | 0.00 | NA |
unknown_kernel_region | kernel | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 2 | 5 | NA | NA | 0.00 | 0.00 | 0.00 | 0.00 |