linux/tools/perf/util/bpf_kwork.c
Namhyung Kim 066fd84087 perf kwork: Constify control data for BPF
The control knobs set before loading BPF programs should be declared as
'const volatile' so that they can be optimized by the BPF core.
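
As background, the libbpf pattern looks roughly like the sketch below
(hypothetical 'knob' names, not the actual kwork sources): a 'const
volatile' global is placed in the skeleton's .rodata, user space may
write it only between open and load, and after load the verifier sees a
known constant and can dead-code eliminate the guarded paths.

  /* knob.bpf.c - BPF side */
  #include "vmlinux.h"
  #include <bpf/bpf_helpers.h>

  const volatile int has_cpu_filter;      /* ends up in .rodata */

  SEC("tracepoint/irq/irq_handler_entry")
  int on_irq_entry(void *ctx)
  {
          if (!has_cpu_filter)
                  return 0;       /* branch resolved at verification time */
          /* ... consult the cpu filter map ... */
          return 0;
  }

  char LICENSE[] SEC("license") = "GPL";

  /* user side - writable only between knob_bpf__open() and __load() */
  struct knob_bpf *skel = knob_bpf__open();

  skel->rodata->has_cpu_filter = 1;
  knob_bpf__load(skel);                   /* .rodata is frozen from here on */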

Committer testing:

  root@x1:~# perf kwork report --use-bpf
  Starting trace, Hit <Ctrl+C> to stop and report
  ^C
    Kwork Name                     | Cpu  | Total Runtime | Count     | Max runtime   | Max runtime start   | Max runtime end     |
   --------------------------------------------------------------------------------------------------------------------------------
    (w)intel_atomic_commit_work [  | 0009 |     18.680 ms |         2 |     18.553 ms |     362410.681580 s |     362410.700133 s |
    (w)pm_runtime_work             | 0007 |     13.300 ms |         1 |     13.300 ms |     362410.254996 s |     362410.268295 s |
    (w)intel_atomic_commit_work [  | 0009 |      9.846 ms |         2 |      9.717 ms |     362410.172352 s |     362410.182069 s |
    (w)acpi_ec_event_processor     | 0002 |      8.106 ms |         1 |      8.106 ms |     362410.463187 s |     362410.471293 s |
    (s)SCHED:7                     | 0000 |      1.351 ms |       106 |      0.063 ms |     362410.658017 s |     362410.658080 s |
    i915:157                       | 0008 |      0.994 ms |        13 |      0.361 ms |     362411.222125 s |     362411.222486 s |
    (s)SCHED:7                     | 0001 |      0.703 ms |        98 |      0.047 ms |     362410.245004 s |     362410.245051 s |
    (s)SCHED:7                     | 0005 |      0.674 ms |        42 |      0.074 ms |     362411.483039 s |     362411.483113 s |
    (s)NET_RX:3                    | 0001 |      0.556 ms |        10 |      0.079 ms |     362411.066388 s |     362411.066467 s |
  <SNIP>

  root@x1:~# perf trace -e bpf --max-events 5 perf kwork report --use-bpf
       0.000 ( 0.016 ms): perf/2948007 bpf(cmd: 36, uattr: 0x7ffededa6660, size: 8)          = -1 EOPNOTSUPP (Operation not supported)
       0.026 ( 0.106 ms): perf/2948007 bpf(cmd: PROG_LOAD, uattr: 0x7ffededa6390, size: 148) = 12
       0.152 ( 0.032 ms): perf/2948007 bpf(cmd: PROG_LOAD, uattr: 0x7ffededa6450, size: 148) = 12
      26.247 ( 0.138 ms): perf/2948007 bpf(cmd: PROG_LOAD, uattr: 0x7ffededa6300, size: 148) = 12
      26.396 ( 0.012 ms): perf/2948007 bpf(uattr: 0x7ffededa64b0, size: 80)                  = 12
  Starting trace, Hit <Ctrl+C> to stop and report
  root@x1:~#

Signed-off-by: Namhyung Kim <namhyung@kernel.org>
Tested-by: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Adrian Hunter <adrian.hunter@intel.com>
Cc: Ian Rogers <irogers@google.com>
Cc: Ingo Molnar <mingo@kernel.org>
Cc: Jiri Olsa <jolsa@kernel.org>
Cc: Kan Liang <kan.liang@linux.intel.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Song Liu <song@kernel.org>
Cc: Yang Jihong <yangjihong@bytedance.com>
Link: https://lore.kernel.org/r/20240902200515.2103769-4-namhyung@kernel.org
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2024-09-03 11:50:20 -03:00

// SPDX-License-Identifier: GPL-2.0
/*
 * bpf_kwork.c
 *
 * Copyright (c) 2022 Huawei Inc, Yang Jihong <yangjihong1@huawei.com>
 */

#include <time.h>
#include <fcntl.h>
#include <signal.h>
#include <stdio.h>
#include <unistd.h>

#include <linux/time64.h>

#include "util/debug.h"
#include "util/evsel.h"
#include "util/kwork.h"

#include <bpf/bpf.h>
#include <perf/cpumap.h>

#include "util/bpf_skel/kwork_trace.skel.h"

/*
 * This should be in sync with "util/kwork_trace.bpf.c"
 */
#define MAX_KWORKNAME 128

struct work_key {
	u32 type;
	u32 cpu;
	u64 id;
};

struct report_data {
	u64 nr;
	u64 total_time;
	u64 max_time;
	u64 max_time_start;
	u64 max_time_end;
};

struct kwork_class_bpf {
	struct kwork_class *class;

	void (*load_prepare)(struct perf_kwork *kwork);
	int (*get_work_name)(struct work_key *key, char **ret_name);
};

static struct kwork_trace_bpf *skel;

static struct timespec ts_start;
static struct timespec ts_end;
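
/*
 * 'enabled' lives in the skeleton's .bss; the BPF-side programs are
 * expected to check it and only collect events while it is non-zero.
 */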
void perf_kwork__trace_start(void)
{
	clock_gettime(CLOCK_MONOTONIC, &ts_start);
	skel->bss->enabled = 1;
}

void perf_kwork__trace_finish(void)
{
	clock_gettime(CLOCK_MONOTONIC, &ts_end);
	skel->bss->enabled = 0;
}

static int get_work_name_from_map(struct work_key *key, char **ret_name)
{
	char name[MAX_KWORKNAME] = { 0 };
	int fd = bpf_map__fd(skel->maps.perf_kwork_names);

	*ret_name = NULL;

	if (fd < 0) {
		pr_debug("Invalid names map fd\n");
		return 0;
	}

	if ((bpf_map_lookup_elem(fd, key, name) == 0) && (strlen(name) != 0)) {
		*ret_name = strdup(name);
		if (*ret_name == NULL) {
			pr_err("Failed to copy work name\n");
			return -1;
		}
	}

	return 0;
}

static void irq_load_prepare(struct perf_kwork *kwork)
{
	if (kwork->report == KWORK_REPORT_RUNTIME) {
		bpf_program__set_autoload(skel->progs.report_irq_handler_entry, true);
		bpf_program__set_autoload(skel->progs.report_irq_handler_exit, true);
	}
}

static struct kwork_class_bpf kwork_irq_bpf = {
	.load_prepare  = irq_load_prepare,
	.get_work_name = get_work_name_from_map,
};

static void softirq_load_prepare(struct perf_kwork *kwork)
{
	if (kwork->report == KWORK_REPORT_RUNTIME) {
		bpf_program__set_autoload(skel->progs.report_softirq_entry, true);
		bpf_program__set_autoload(skel->progs.report_softirq_exit, true);
	} else if (kwork->report == KWORK_REPORT_LATENCY) {
		bpf_program__set_autoload(skel->progs.latency_softirq_raise, true);
		bpf_program__set_autoload(skel->progs.latency_softirq_entry, true);
	}
}

static struct kwork_class_bpf kwork_softirq_bpf = {
	.load_prepare  = softirq_load_prepare,
	.get_work_name = get_work_name_from_map,
};

static void workqueue_load_prepare(struct perf_kwork *kwork)
{
	if (kwork->report == KWORK_REPORT_RUNTIME) {
		bpf_program__set_autoload(skel->progs.report_workqueue_execute_start, true);
		bpf_program__set_autoload(skel->progs.report_workqueue_execute_end, true);
	} else if (kwork->report == KWORK_REPORT_LATENCY) {
		bpf_program__set_autoload(skel->progs.latency_workqueue_activate_work, true);
		bpf_program__set_autoload(skel->progs.latency_workqueue_execute_start, true);
	}
}

static struct kwork_class_bpf kwork_workqueue_bpf = {
	.load_prepare  = workqueue_load_prepare,
	.get_work_name = get_work_name_from_map,
};

static struct kwork_class_bpf *
kwork_class_bpf_supported_list[KWORK_CLASS_MAX] = {
	[KWORK_CLASS_IRQ]       = &kwork_irq_bpf,
	[KWORK_CLASS_SOFTIRQ]   = &kwork_softirq_bpf,
	[KWORK_CLASS_WORKQUEUE] = &kwork_workqueue_bpf,
};

static bool valid_kwork_class_type(enum kwork_class_type type)
{
	return type >= 0 && type < KWORK_CLASS_MAX ? true : false;
}
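
/*
 * Copy the user-requested cpu list and name filter into the
 * corresponding BPF filter maps.
 */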
static int setup_filters(struct perf_kwork *kwork)
{
	if (kwork->cpu_list != NULL) {
		int idx, nr_cpus;
		struct perf_cpu_map *map;
		struct perf_cpu cpu;
		int fd = bpf_map__fd(skel->maps.perf_kwork_cpu_filter);

		if (fd < 0) {
			pr_debug("Invalid cpu filter fd\n");
			return -1;
		}

		map = perf_cpu_map__new(kwork->cpu_list);
		if (map == NULL) {
			pr_debug("Invalid cpu_list\n");
			return -1;
		}

		nr_cpus = libbpf_num_possible_cpus();
		perf_cpu_map__for_each_cpu(cpu, idx, map) {
			u8 val = 1;

			if (cpu.cpu >= nr_cpus) {
				perf_cpu_map__put(map);
				pr_err("Requested cpu %d too large\n", cpu.cpu);
				return -1;
			}
			bpf_map_update_elem(fd, &cpu.cpu, &val, BPF_ANY);
		}
		perf_cpu_map__put(map);
	}

	if (kwork->profile_name != NULL) {
		int key, fd;

		if (strlen(kwork->profile_name) >= MAX_KWORKNAME) {
			pr_err("Requested name filter %s too large, limit to %d\n",
			       kwork->profile_name, MAX_KWORKNAME - 1);
			return -1;
		}

		fd = bpf_map__fd(skel->maps.perf_kwork_name_filter);
		if (fd < 0) {
			pr_debug("Invalid name filter fd\n");
			return -1;
		}

		key = 0;
		bpf_map_update_elem(fd, &key, kwork->profile_name, BPF_ANY);
	}

	return 0;
}

int perf_kwork__trace_prepare_bpf(struct perf_kwork *kwork)
{
	struct bpf_program *prog;
	struct kwork_class *class;
	struct kwork_class_bpf *class_bpf;
	enum kwork_class_type type;

	skel = kwork_trace_bpf__open();
	if (!skel) {
		pr_debug("Failed to open kwork trace skeleton\n");
		return -1;
	}

	/*
	 * set all progs to non-autoload,
	 * then set corresponding progs according to config
	 */
	bpf_object__for_each_program(prog, skel->obj)
		bpf_program__set_autoload(prog, false);

	list_for_each_entry(class, &kwork->class_list, list) {
		type = class->type;
		if (!valid_kwork_class_type(type) ||
		    (kwork_class_bpf_supported_list[type] == NULL)) {
			pr_err("Unsupported bpf trace class %s\n", class->name);
			goto out;
		}

		class_bpf = kwork_class_bpf_supported_list[type];
		class_bpf->class = class;

		if (class_bpf->load_prepare != NULL)
			class_bpf->load_prepare(kwork);
	}
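
	/*
	 * These rodata knobs are the 'const volatile' controls this patch
	 * constifies; .rodata is only writable between open and load, so
	 * they must be set before kwork_trace_bpf__load().
	 */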
	if (kwork->cpu_list != NULL)
		skel->rodata->has_cpu_filter = 1;

	if (kwork->profile_name != NULL)
		skel->rodata->has_name_filter = 1;

	if (kwork_trace_bpf__load(skel)) {
		pr_debug("Failed to load kwork trace skeleton\n");
		goto out;
	}

	if (setup_filters(kwork))
		goto out;

	if (kwork_trace_bpf__attach(skel)) {
		pr_debug("Failed to attach kwork trace skeleton\n");
		goto out;
	}

	return 0;

out:
	kwork_trace_bpf__destroy(skel);
	return -1;
}
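
/*
 * Convert one entry of the BPF report map into a struct kwork_work and
 * fill in either the runtime or the latency statistics.
 */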
static int add_work(struct perf_kwork *kwork,
		    struct work_key *key,
		    struct report_data *data)
{
	struct kwork_work *work;
	struct kwork_class_bpf *bpf_trace;
	struct kwork_work tmp = {
		.id = key->id,
		.name = NULL,
		.cpu = key->cpu,
	};
	enum kwork_class_type type = key->type;

	if (!valid_kwork_class_type(type)) {
		pr_debug("Invalid class type %d to add work\n", type);
		return -1;
	}

	bpf_trace = kwork_class_bpf_supported_list[type];
	tmp.class = bpf_trace->class;

	if ((bpf_trace->get_work_name != NULL) &&
	    (bpf_trace->get_work_name(key, &tmp.name)))
		return -1;

	work = perf_kwork_add_work(kwork, tmp.class, &tmp);
	if (work == NULL)
		return -1;

	if (kwork->report == KWORK_REPORT_RUNTIME) {
		work->nr_atoms = data->nr;
		work->total_runtime = data->total_time;
		work->max_runtime = data->max_time;
		work->max_runtime_start = data->max_time_start;
		work->max_runtime_end = data->max_time_end;
	} else if (kwork->report == KWORK_REPORT_LATENCY) {
		work->nr_atoms = data->nr;
		work->total_latency = data->total_time;
		work->max_latency = data->max_time;
		work->max_latency_start = data->max_time_start;
		work->max_latency_end = data->max_time_end;
	} else {
		pr_debug("Invalid bpf report type %d\n", kwork->report);
		return -1;
	}

	kwork->timestart = (u64)ts_start.tv_sec * NSEC_PER_SEC + ts_start.tv_nsec;
	kwork->timeend = (u64)ts_end.tv_sec * NSEC_PER_SEC + ts_end.tv_nsec;

	return 0;
}

int perf_kwork__report_read_bpf(struct perf_kwork *kwork)
{
	struct report_data data;
	struct work_key key = {
		.type = 0,
		.cpu  = 0,
		.id   = 0,
	};
	struct work_key prev = {
		.type = 0,
		.cpu  = 0,
		.id   = 0,
	};
	int fd = bpf_map__fd(skel->maps.perf_kwork_report);

	if (fd < 0) {
		pr_debug("Invalid report fd\n");
		return -1;
	}

	while (!bpf_map_get_next_key(fd, &prev, &key)) {
		if ((bpf_map_lookup_elem(fd, &key, &data)) != 0) {
			pr_debug("Failed to lookup report elem\n");
			return -1;
		}

		if ((data.nr != 0) && (add_work(kwork, &key, &data) != 0))
			return -1;

		prev = key;
	}

	return 0;
}

void perf_kwork__report_cleanup_bpf(void)
{
	kwork_trace_bpf__destroy(skel);
}