root/samples/bpf/cpustat_user.c
// SPDX-License-Identifier: GPL-2.0

#define _GNU_SOURCE
#include <errno.h>
#include <stdio.h>
#include <stdlib.h>
#include <signal.h>
#include <sched.h>
#include <string.h>
#include <unistd.h>
#include <fcntl.h>
#include <locale.h>
#include <sys/types.h>
#include <sys/stat.h>
#include <sys/time.h>
#include <sys/wait.h>

#include <bpf/bpf.h>
#include <bpf/libbpf.h>

/*
 * File descriptors of the two BPF maps. main() fills them in; the refresh
 * loop in main() and the int_exit() signal handler both read them.
 */
static int cstate_map_fd, pstate_map_fd;

/* Dimensions of the statistics table: CPUs sampled and states kept per CPU */
#define MAX_CPU                 8
#define MAX_PSTATE_ENTRIES      5
#define MAX_CSTATE_ENTRIES      3
/* NOTE(review): MAX_STARS is not referenced in the visible part of this file */
#define MAX_STARS               40

/*
 * sysfs file and the two values cpu_stat_inject_cpu_frequency_event() writes
 * to it, lowest first and highest second.
 * NOTE(review): the comment on that function describes the maximum as 1.2GHz,
 * yet CPUFREQ_HIGHEST_FREQ has one more digit than "1200000" -- confirm the
 * intended value and the unit expected by scaling_max_freq.
 */
#define CPUFREQ_MAX_SYSFS_PATH  "/sys/devices/system/cpu/cpu0/cpufreq/scaling_max_freq"
#define CPUFREQ_LOWEST_FREQ     "208000"
#define CPUFREQ_HIGHEST_FREQ    "12000000"

/*
 * Per-CPU snapshot of the values read from the BPF maps.
 *
 * cpu_stat_print() divides every entry by 1000000 and labels the result
 * "state(ms)", so the raw values are presumably nanoseconds -- confirm
 * against the kernel-side program.
 */
struct cpu_stat_data {
        unsigned long cstate[MAX_CSTATE_ENTRIES];
        unsigned long pstate[MAX_PSTATE_ENTRIES];
};

/* One entry per CPU; filled by cpu_stat_update(), shown by cpu_stat_print() */
static struct cpu_stat_data stat_data[MAX_CPU];

/*
 * Clear the terminal and print the contents of stat_data as a table.
 *
 * The header row names every cstate-N and pstate-N column; each following
 * row shows one CPU. Stored values are divided by 1000000 before printing,
 * matching the "state(ms)" column title.
 */
static void cpu_stat_print(void)
{
        int i, j;
        /* Large enough for the prefix plus any non-negative 32-bit index */
        char state_str[sizeof("cstate-2147483647")];
        struct cpu_stat_data *data;

        /* Clear screen */
        printf("\033[2J");

        /* Header */
        printf("\nCPU states statistics:\n");
        printf("%-10s ", "state(ms)");

        /*
         * snprintf() bounds the write, so raising MAX_*_ENTRIES to two or
         * more digits can never overrun state_str.
         */
        for (i = 0; i < MAX_CSTATE_ENTRIES; i++) {
                snprintf(state_str, sizeof(state_str), "cstate-%d", i);
                printf("%-11s ", state_str);
        }

        for (i = 0; i < MAX_PSTATE_ENTRIES; i++) {
                snprintf(state_str, sizeof(state_str), "pstate-%d", i);
                printf("%-11s ", state_str);
        }

        printf("\n");

        /* One row per CPU: C-state columns first, then P-state columns */
        for (j = 0; j < MAX_CPU; j++) {
                data = &stat_data[j];

                printf("CPU-%-6d ", j);
                for (i = 0; i < MAX_CSTATE_ENTRIES; i++)
                        printf("%-11lu ", data->cstate[i] / 1000000);

                for (i = 0; i < MAX_PSTATE_ENTRIES; i++)
                        printf("%-11lu ", data->pstate[i] / 1000000);

                printf("\n");
        }
}

/*
 * Refresh stat_data from the two BPF maps.
 *
 * @cstate_fd: file descriptor of the map holding C-state values
 * @pstate_fd: file descriptor of the map holding P-state values
 *
 * Both maps are indexed as cpu * <entries per cpu> + state. If a lookup
 * fails, the corresponding stat_data entry keeps its previous value (zero
 * initially, as stat_data has static storage) instead of receiving whatever
 * happened to be in the local buffer.
 *
 * NOTE(review): key and value are passed as 'unsigned long'; their sizes
 * must match the key/value sizes declared by the kernel-side maps --
 * confirm against the BPF program.
 */
static void cpu_stat_update(int cstate_fd, int pstate_fd)
{
        unsigned long key, value;
        int c, i;

        for (c = 0; c < MAX_CPU; c++) {
                for (i = 0; i < MAX_CSTATE_ENTRIES; i++) {
                        key = c * MAX_CSTATE_ENTRIES + i;
                        /* Only trust 'value' when the lookup succeeded */
                        if (bpf_map_lookup_elem(cstate_fd, &key, &value) == 0)
                                stat_data[c].cstate[i] = value;
                }

                for (i = 0; i < MAX_PSTATE_ENTRIES; i++) {
                        key = c * MAX_PSTATE_ENTRIES + i;
                        if (bpf_map_lookup_elem(pstate_fd, &key, &value) == 0)
                                stat_data[c].pstate[i] = value;
                }
        }
}

/*
 * This function is copied from the 'idlestat' tool function
 * idlestat_wake_all() in idlestate.c.
 *
 * It sets the affinity of the running task to each CPU in turn, so that
 * every CPU is woken up once to handle scheduling and produces the ftrace
 * event 'trace_cpu_idle'. The original affinity mask is restored at the end.
 *
 * Returns 0 on success, or -1 when the number of CPUs, the current CPU or
 * the current affinity mask cannot be obtained. Failures of the individual
 * sched_setaffinity() calls are deliberately ignored (best effort).
 */
static int cpu_stat_inject_cpu_idle_event(void)
{
        long nr_cpus;
        int rcpu, i;
        cpu_set_t cpumask;
        cpu_set_t original_cpumask;

        nr_cpus = sysconf(_SC_NPROCESSORS_CONF);
        if (nr_cpus < 0)
                return -1;

        rcpu = sched_getcpu();
        if (rcpu < 0)
                return -1;

        /*
         * Keep track of the CPUs we will run on. Bail out if the mask cannot
         * be read: it would otherwise be used uninitialised below, both for
         * filtering and for the final restore.
         */
        if (sched_getaffinity(0, sizeof(original_cpumask),
                              &original_cpumask) < 0)
                return -1;

        for (i = 0; i < nr_cpus; i++) {

                /* Pointless to wake up ourself */
                if (i == rcpu)
                        continue;

                /* Pointless to wake CPUs we will not run on */
                if (!CPU_ISSET(i, &original_cpumask))
                        continue;

                CPU_ZERO(&cpumask);
                CPU_SET(i, &cpumask);

                sched_setaffinity(0, sizeof(cpumask), &cpumask);
        }

        /* Enable all the CPUs of the original mask */
        sched_setaffinity(0, sizeof(original_cpumask), &original_cpumask);
        return 0;
}

/*
 * The CPU frequency may stay unchanged for a long time, in which case no
 * ftrace event 'trace_cpu_frequency' arrives for a long period; this
 * introduces a big deviation in the pstate statistics.
 *
 * To solve this issue, the code below forces 'scaling_max_freq' to
 * CPUFREQ_LOWEST_FREQ (208MHz) to trigger the ftrace event
 * 'trace_cpu_frequency' and then writes CPUFREQ_HIGHEST_FREQ to restore the
 * maximum frequency.
 *
 * NOTE(review): this comment originally gave the restored maximum as 1.2GHz,
 * but CPUFREQ_HIGHEST_FREQ is "12000000" -- confirm the intended value.
 *
 * Returns a negative value if the sysfs file cannot be opened or written;
 * otherwise the result of the last write().
 */
static int cpu_stat_inject_cpu_frequency_event(void)
{
        int len, fd;

        fd = open(CPUFREQ_MAX_SYSFS_PATH, O_WRONLY);
        if (fd < 0) {
                printf("failed to open scaling_max_freq, errno=%d\n", errno);
                return fd;
        }

        len = write(fd, CPUFREQ_LOWEST_FREQ, strlen(CPUFREQ_LOWEST_FREQ));
        if (len < 0) {
                /* Report the operation that actually failed */
                printf("failed to write scaling_max_freq, errno=%d\n", errno);
                goto err;
        }

        len = write(fd, CPUFREQ_HIGHEST_FREQ, strlen(CPUFREQ_HIGHEST_FREQ));
        if (len < 0) {
                printf("failed to write scaling_max_freq, errno=%d\n", errno);
                goto err;
        }

err:
        /* Reached on success as well: the descriptor is always closed */
        close(fd);
        return len;
}

/*
 * Handler that main() installs for SIGINT and SIGTERM.
 *
 * Injects one more idle event and one more frequency event, takes a final
 * reading of both maps, prints the table and terminates the process with
 * status 0. The signal number itself is not used.
 *
 * NOTE(review): printf() and exit() are not async-signal-safe; tolerable in
 * a sample, but confirm before reusing this pattern elsewhere.
 */
static void int_exit(int sig)
{
        (void)sig;

        /* Refresh the event-driven statistics before the last reading */
        cpu_stat_inject_cpu_idle_event();
        cpu_stat_inject_cpu_frequency_event();

        /* Final snapshot and report */
        cpu_stat_update(cstate_map_fd, pstate_map_fd);
        cpu_stat_print();

        exit(0);
}

/*
 * Load "<argv[0]>_kern.o", attach its "bpf_prog1" program and then refresh
 * and print the C-state/P-state table every five seconds.
 *
 * Returns 1 when any setup step fails; every failure after the object has
 * been opened releases the link and the object first. There is no normal
 * return: the refresh loop only ends through int_exit(), which is installed
 * for SIGINT and SIGTERM and calls exit(0).
 */
int main(int argc, char **argv)
{
        struct bpf_link *link = NULL;
        struct bpf_program *prog;
        struct bpf_object *obj;
        char filename[256];

        snprintf(filename, sizeof(filename), "%s_kern.o", argv[0]);
        obj = bpf_object__open_file(filename, NULL);
        if (libbpf_get_error(obj)) {
                fprintf(stderr, "ERROR: opening BPF object file failed\n");
                return 1;
        }

        prog = bpf_object__find_program_by_name(obj, "bpf_prog1");
        if (!prog) {
                printf("finding a prog in obj file failed\n");
                goto cleanup;
        }

        /* load BPF program */
        if (bpf_object__load(obj)) {
                fprintf(stderr, "ERROR: loading BPF object file failed\n");
                goto cleanup;
        }

        cstate_map_fd = bpf_object__find_map_fd_by_name(obj, "cstate_duration");
        pstate_map_fd = bpf_object__find_map_fd_by_name(obj, "pstate_duration");
        if (cstate_map_fd < 0 || pstate_map_fd < 0) {
                fprintf(stderr, "ERROR: finding a map in obj file failed\n");
                goto cleanup;
        }

        link = bpf_program__attach(prog);
        if (libbpf_get_error(link)) {
                fprintf(stderr, "ERROR: bpf_program__attach failed\n");
                /* Do not hand an error pointer to bpf_link__destroy() */
                link = NULL;
                goto cleanup;
        }

        /* Seed the statistics with one idle and one frequency event */
        if (cpu_stat_inject_cpu_idle_event() < 0)
                goto cleanup;

        if (cpu_stat_inject_cpu_frequency_event() < 0)
                goto cleanup;

        signal(SIGINT, int_exit);
        signal(SIGTERM, int_exit);

        while (1) {
                cpu_stat_update(cstate_map_fd, pstate_map_fd);
                cpu_stat_print();
                sleep(5);
        }

cleanup:
        /* Only failure paths reach this label, hence the non-zero status */
        bpf_link__destroy(link);
        bpf_object__close(obj);
        return 1;
}