| // SPDX-License-Identifier: GPL-2.0 |
| |
| #define _GNU_SOURCE |
| #include <errno.h> |
| #include <stdio.h> |
| #include <stdlib.h> |
| #include <signal.h> |
| #include <sched.h> |
| #include <string.h> |
| #include <unistd.h> |
| #include <fcntl.h> |
| #include <linux/bpf.h> |
| #include <locale.h> |
| #include <sys/types.h> |
| #include <sys/stat.h> |
| #include <sys/time.h> |
| #include <sys/resource.h> |
| #include <sys/wait.h> |
| |
| #include "libbpf.h" |
| #include "bpf_load.h" |
| |
| #define MAX_CPU 8 |
| #define MAX_PSTATE_ENTRIES 5 |
| #define MAX_CSTATE_ENTRIES 3 |
| #define MAX_STARS 40 |
| |
| #define CPUFREQ_MAX_SYSFS_PATH "/sys/devices/system/cpu/cpu0/cpufreq/scaling_max_freq" |
| #define CPUFREQ_LOWEST_FREQ "208000" |
| #define CPUFREQ_HIGHEST_FREQ "12000000" |
| |
| struct cpu_stat_data { |
| unsigned long cstate[MAX_CSTATE_ENTRIES]; |
| unsigned long pstate[MAX_PSTATE_ENTRIES]; |
| }; |
| |
| static struct cpu_stat_data stat_data[MAX_CPU]; |
| |
| static void cpu_stat_print(void) |
| { |
| int i, j; |
| char state_str[sizeof("cstate-9")]; |
| struct cpu_stat_data *data; |
| |
| /* Clear screen */ |
| printf("\033[2J"); |
| |
| /* Header */ |
| printf("\nCPU states statistics:\n"); |
| printf("%-10s ", "state(ms)"); |
| |
| for (i = 0; i < MAX_CSTATE_ENTRIES; i++) { |
| sprintf(state_str, "cstate-%d", i); |
| printf("%-11s ", state_str); |
| } |
| |
| for (i = 0; i < MAX_PSTATE_ENTRIES; i++) { |
| sprintf(state_str, "pstate-%d", i); |
| printf("%-11s ", state_str); |
| } |
| |
| printf("\n"); |
| |
| for (j = 0; j < MAX_CPU; j++) { |
| data = &stat_data[j]; |
| |
| printf("CPU-%-6d ", j); |
| for (i = 0; i < MAX_CSTATE_ENTRIES; i++) |
| printf("%-11ld ", data->cstate[i] / 1000000); |
| |
| for (i = 0; i < MAX_PSTATE_ENTRIES; i++) |
| printf("%-11ld ", data->pstate[i] / 1000000); |
| |
| printf("\n"); |
| } |
| } |
| |
| static void cpu_stat_update(int cstate_fd, int pstate_fd) |
| { |
| unsigned long key, value; |
| int c, i; |
| |
| for (c = 0; c < MAX_CPU; c++) { |
| for (i = 0; i < MAX_CSTATE_ENTRIES; i++) { |
| key = c * MAX_CSTATE_ENTRIES + i; |
| bpf_map_lookup_elem(cstate_fd, &key, &value); |
| stat_data[c].cstate[i] = value; |
| } |
| |
| for (i = 0; i < MAX_PSTATE_ENTRIES; i++) { |
| key = c * MAX_PSTATE_ENTRIES + i; |
| bpf_map_lookup_elem(pstate_fd, &key, &value); |
| stat_data[c].pstate[i] = value; |
| } |
| } |
| } |
| |
| /* |
| * This function is copied from 'idlestat' tool function |
| * idlestat_wake_all() in idlestate.c. |
| * |
| * It sets the self running task affinity to cpus one by one so can wake up |
| * the specific CPU to handle scheduling; this results in all cpus can be |
| * waken up once and produce ftrace event 'trace_cpu_idle'. |
| */ |
| static int cpu_stat_inject_cpu_idle_event(void) |
| { |
| int rcpu, i, ret; |
| cpu_set_t cpumask; |
| cpu_set_t original_cpumask; |
| |
| ret = sysconf(_SC_NPROCESSORS_CONF); |
| if (ret < 0) |
| return -1; |
| |
| rcpu = sched_getcpu(); |
| if (rcpu < 0) |
| return -1; |
| |
| /* Keep track of the CPUs we will run on */ |
| sched_getaffinity(0, sizeof(original_cpumask), &original_cpumask); |
| |
| for (i = 0; i < ret; i++) { |
| |
| /* Pointless to wake up ourself */ |
| if (i == rcpu) |
| continue; |
| |
| /* Pointless to wake CPUs we will not run on */ |
| if (!CPU_ISSET(i, &original_cpumask)) |
| continue; |
| |
| CPU_ZERO(&cpumask); |
| CPU_SET(i, &cpumask); |
| |
| sched_setaffinity(0, sizeof(cpumask), &cpumask); |
| } |
| |
| /* Enable all the CPUs of the original mask */ |
| sched_setaffinity(0, sizeof(original_cpumask), &original_cpumask); |
| return 0; |
| } |
| |
| /* |
| * It's possible to have no any frequency change for long time and cannot |
| * get ftrace event 'trace_cpu_frequency' for long period, this introduces |
| * big deviation for pstate statistics. |
| * |
| * To solve this issue, below code forces to set 'scaling_max_freq' to 208MHz |
| * for triggering ftrace event 'trace_cpu_frequency' and then recovery back to |
| * the maximum frequency value 1.2GHz. |
| */ |
| static int cpu_stat_inject_cpu_frequency_event(void) |
| { |
| int len, fd; |
| |
| fd = open(CPUFREQ_MAX_SYSFS_PATH, O_WRONLY); |
| if (fd < 0) { |
| printf("failed to open scaling_max_freq, errno=%d\n", errno); |
| return fd; |
| } |
| |
| len = write(fd, CPUFREQ_LOWEST_FREQ, strlen(CPUFREQ_LOWEST_FREQ)); |
| if (len < 0) { |
| printf("failed to open scaling_max_freq, errno=%d\n", errno); |
| goto err; |
| } |
| |
| len = write(fd, CPUFREQ_HIGHEST_FREQ, strlen(CPUFREQ_HIGHEST_FREQ)); |
| if (len < 0) { |
| printf("failed to open scaling_max_freq, errno=%d\n", errno); |
| goto err; |
| } |
| |
| err: |
| close(fd); |
| return len; |
| } |
| |
| static void int_exit(int sig) |
| { |
| cpu_stat_inject_cpu_idle_event(); |
| cpu_stat_inject_cpu_frequency_event(); |
| cpu_stat_update(map_fd[1], map_fd[2]); |
| cpu_stat_print(); |
| exit(0); |
| } |
| |
| int main(int argc, char **argv) |
| { |
| char filename[256]; |
| int ret; |
| |
| snprintf(filename, sizeof(filename), "%s_kern.o", argv[0]); |
| |
| if (load_bpf_file(filename)) { |
| printf("%s", bpf_log_buf); |
| return 1; |
| } |
| |
| ret = cpu_stat_inject_cpu_idle_event(); |
| if (ret < 0) |
| return 1; |
| |
| ret = cpu_stat_inject_cpu_frequency_event(); |
| if (ret < 0) |
| return 1; |
| |
| signal(SIGINT, int_exit); |
| signal(SIGTERM, int_exit); |
| |
| while (1) { |
| cpu_stat_update(map_fd[1], map_fd[2]); |
| cpu_stat_print(); |
| sleep(5); |
| } |
| |
| return 0; |
| } |