|  | // SPDX-License-Identifier: GPL-2.0 | 
|  | /* | 
|  | * Benchmark scanning sysfs files for PMU information. | 
|  | * | 
|  | * Copyright 2023 Google LLC. | 
|  | */ | 
|  | #include <stdio.h> | 
|  | #include "bench.h" | 
|  | #include "util/debug.h" | 
|  | #include "util/pmu.h" | 
|  | #include "util/pmus.h" | 
|  | #include "util/stat.h" | 
|  | #include <linux/atomic.h> | 
|  | #include <linux/err.h> | 
|  | #include <linux/time64.h> | 
|  | #include <subcmd/parse-options.h> | 
|  |  | 
|  | static unsigned int iterations = 100; | 
|  |  | 
|  | struct pmu_scan_result { | 
|  | char *name; | 
|  | int nr_aliases; | 
|  | int nr_formats; | 
|  | int nr_caps; | 
|  | bool is_core; | 
|  | }; | 
|  |  | 
|  | static const struct option options[] = { | 
|  | OPT_UINTEGER('i', "iterations", &iterations, | 
|  | "Number of iterations used to compute average"), | 
|  | OPT_END() | 
|  | }; | 
|  |  | 
|  | static const char *const bench_usage[] = { | 
|  | "perf bench internals pmu-scan <options>", | 
|  | NULL | 
|  | }; | 
|  |  | 
|  | static int nr_pmus; | 
|  | static struct pmu_scan_result *results; | 
|  |  | 
|  | static int save_result(void) | 
|  | { | 
|  | struct perf_pmu *pmu = NULL; | 
|  | struct list_head *list; | 
|  | struct pmu_scan_result *r; | 
|  |  | 
|  | while ((pmu = perf_pmus__scan(pmu)) != NULL) { | 
|  | r = realloc(results, (nr_pmus + 1) * sizeof(*r)); | 
|  | if (r == NULL) | 
|  | return -ENOMEM; | 
|  |  | 
|  | results = r; | 
|  | r = results + nr_pmus; | 
|  |  | 
|  | r->name = strdup(pmu->name); | 
|  | r->is_core = pmu->is_core; | 
|  | r->nr_caps = pmu->nr_caps; | 
|  |  | 
|  | r->nr_aliases = perf_pmu__num_events(pmu); | 
|  |  | 
|  | r->nr_formats = 0; | 
|  | list_for_each(list, &pmu->format) | 
|  | r->nr_formats++; | 
|  |  | 
|  | pr_debug("pmu[%d] name=%s, nr_caps=%d, nr_aliases=%d, nr_formats=%d\n", | 
|  | nr_pmus, r->name, r->nr_caps, r->nr_aliases, r->nr_formats); | 
|  | nr_pmus++; | 
|  | } | 
|  |  | 
|  | perf_pmus__destroy(); | 
|  | return 0; | 
|  | } | 
|  |  | 
|  | static int check_result(bool core_only) | 
|  | { | 
|  | struct pmu_scan_result *r; | 
|  | struct perf_pmu *pmu; | 
|  | struct list_head *list; | 
|  | int nr; | 
|  |  | 
|  | for (int i = 0; i < nr_pmus; i++) { | 
|  | r = &results[i]; | 
|  | if (core_only && !r->is_core) | 
|  | continue; | 
|  |  | 
|  | pmu = perf_pmus__find(r->name); | 
|  | if (pmu == NULL) { | 
|  | pr_err("Cannot find PMU %s\n", r->name); | 
|  | return -1; | 
|  | } | 
|  |  | 
|  | if (pmu->nr_caps != (u32)r->nr_caps) { | 
|  | pr_err("Unmatched number of event caps in %s: expect %d vs got %d\n", | 
|  | pmu->name, r->nr_caps, pmu->nr_caps); | 
|  | return -1; | 
|  | } | 
|  |  | 
|  | nr = perf_pmu__num_events(pmu); | 
|  | if (nr != r->nr_aliases) { | 
|  | pr_err("Unmatched number of event aliases in %s: expect %d vs got %d\n", | 
|  | pmu->name, r->nr_aliases, nr); | 
|  | return -1; | 
|  | } | 
|  |  | 
|  | nr = 0; | 
|  | list_for_each(list, &pmu->format) | 
|  | nr++; | 
|  | if (nr != r->nr_formats) { | 
|  | pr_err("Unmatched number of event formats in %s: expect %d vs got %d\n", | 
|  | pmu->name, r->nr_formats, nr); | 
|  | return -1; | 
|  | } | 
|  | } | 
|  | return 0; | 
|  | } | 
|  |  | 
|  | static void delete_result(void) | 
|  | { | 
|  | for (int i = 0; i < nr_pmus; i++) | 
|  | free(results[i].name); | 
|  | free(results); | 
|  |  | 
|  | results = NULL; | 
|  | nr_pmus = 0; | 
|  | } | 
|  |  | 
|  | static int run_pmu_scan(void) | 
|  | { | 
|  | struct stats stats; | 
|  | struct timeval start, end, diff; | 
|  | double time_average, time_stddev; | 
|  | u64 runtime_us; | 
|  | int ret; | 
|  |  | 
|  | init_stats(&stats); | 
|  | pr_info("Computing performance of sysfs PMU event scan for %u times\n", | 
|  | iterations); | 
|  |  | 
|  | if (save_result() < 0) { | 
|  | pr_err("Failed to initialize PMU scan result\n"); | 
|  | return -1; | 
|  | } | 
|  |  | 
|  | for (int j = 0; j < 2; j++) { | 
|  | bool core_only = (j == 0); | 
|  |  | 
|  | for (unsigned int i = 0; i < iterations; i++) { | 
|  | gettimeofday(&start, NULL); | 
|  | if (core_only) | 
|  | perf_pmus__scan_core(NULL); | 
|  | else | 
|  | perf_pmus__scan(NULL); | 
|  | gettimeofday(&end, NULL); | 
|  | timersub(&end, &start, &diff); | 
|  | runtime_us = diff.tv_sec * USEC_PER_SEC + diff.tv_usec; | 
|  | update_stats(&stats, runtime_us); | 
|  |  | 
|  | ret = check_result(core_only); | 
|  | perf_pmus__destroy(); | 
|  | if (ret < 0) | 
|  | break; | 
|  | } | 
|  | time_average = avg_stats(&stats); | 
|  | time_stddev = stddev_stats(&stats); | 
|  | pr_info("  Average%s PMU scanning took: %.3f usec (+- %.3f usec)\n", | 
|  | core_only ? " core" : "", time_average, time_stddev); | 
|  | } | 
|  | delete_result(); | 
|  | return 0; | 
|  | } | 
|  |  | 
|  | int bench_pmu_scan(int argc, const char **argv) | 
|  | { | 
|  | int err = 0; | 
|  |  | 
|  | argc = parse_options(argc, argv, options, bench_usage, 0); | 
|  | if (argc) { | 
|  | usage_with_options(bench_usage, options); | 
|  | exit(EXIT_FAILURE); | 
|  | } | 
|  |  | 
|  | err = run_pmu_scan(); | 
|  |  | 
|  | return err; | 
|  | } |