| // SPDX-License-Identifier: GPL-2.0 | 
 |  | 
 | #define _GNU_SOURCE | 
 | #include <errno.h> | 
 | #include <stdio.h> | 
 | #include <stdlib.h> | 
 | #include <signal.h> | 
 | #include <sched.h> | 
 | #include <string.h> | 
 | #include <unistd.h> | 
 | #include <fcntl.h> | 
 | #include <linux/bpf.h> | 
 | #include <locale.h> | 
 | #include <sys/types.h> | 
 | #include <sys/stat.h> | 
 | #include <sys/time.h> | 
 | #include <sys/resource.h> | 
 | #include <sys/wait.h> | 
 |  | 
 | #include <bpf/bpf.h> | 
 | #include "bpf_load.h" | 
 |  | 
 | #define MAX_CPU			8 | 
 | #define MAX_PSTATE_ENTRIES	5 | 
 | #define MAX_CSTATE_ENTRIES	3 | 
 | #define MAX_STARS		40 | 
 |  | 
 | #define CPUFREQ_MAX_SYSFS_PATH	"/sys/devices/system/cpu/cpu0/cpufreq/scaling_max_freq" | 
 | #define CPUFREQ_LOWEST_FREQ	"208000" | 
 | #define CPUFREQ_HIGHEST_FREQ	"12000000" | 
 |  | 
 | struct cpu_stat_data { | 
 | 	unsigned long cstate[MAX_CSTATE_ENTRIES]; | 
 | 	unsigned long pstate[MAX_PSTATE_ENTRIES]; | 
 | }; | 
 |  | 
 | static struct cpu_stat_data stat_data[MAX_CPU]; | 
 |  | 
 | static void cpu_stat_print(void) | 
 | { | 
 | 	int i, j; | 
 | 	char state_str[sizeof("cstate-9")]; | 
 | 	struct cpu_stat_data *data; | 
 |  | 
 | 	/* Clear screen */ | 
 | 	printf("\033[2J"); | 
 |  | 
 | 	/* Header */ | 
 | 	printf("\nCPU states statistics:\n"); | 
 | 	printf("%-10s ", "state(ms)"); | 
 |  | 
 | 	for (i = 0; i < MAX_CSTATE_ENTRIES; i++) { | 
 | 		sprintf(state_str, "cstate-%d", i); | 
 | 		printf("%-11s ", state_str); | 
 | 	} | 
 |  | 
 | 	for (i = 0; i < MAX_PSTATE_ENTRIES; i++) { | 
 | 		sprintf(state_str, "pstate-%d", i); | 
 | 		printf("%-11s ", state_str); | 
 | 	} | 
 |  | 
 | 	printf("\n"); | 
 |  | 
 | 	for (j = 0; j < MAX_CPU; j++) { | 
 | 		data = &stat_data[j]; | 
 |  | 
 | 		printf("CPU-%-6d ", j); | 
 | 		for (i = 0; i < MAX_CSTATE_ENTRIES; i++) | 
 | 			printf("%-11ld ", data->cstate[i] / 1000000); | 
 |  | 
 | 		for (i = 0; i < MAX_PSTATE_ENTRIES; i++) | 
 | 			printf("%-11ld ", data->pstate[i] / 1000000); | 
 |  | 
 | 		printf("\n"); | 
 | 	} | 
 | } | 
 |  | 
 | static void cpu_stat_update(int cstate_fd, int pstate_fd) | 
 | { | 
 | 	unsigned long key, value; | 
 | 	int c, i; | 
 |  | 
 | 	for (c = 0; c < MAX_CPU; c++) { | 
 | 		for (i = 0; i < MAX_CSTATE_ENTRIES; i++) { | 
 | 			key = c * MAX_CSTATE_ENTRIES + i; | 
 | 			bpf_map_lookup_elem(cstate_fd, &key, &value); | 
 | 			stat_data[c].cstate[i] = value; | 
 | 		} | 
 |  | 
 | 		for (i = 0; i < MAX_PSTATE_ENTRIES; i++) { | 
 | 			key = c * MAX_PSTATE_ENTRIES + i; | 
 | 			bpf_map_lookup_elem(pstate_fd, &key, &value); | 
 | 			stat_data[c].pstate[i] = value; | 
 | 		} | 
 | 	} | 
 | } | 
 |  | 
 | /* | 
 |  * This function is copied from 'idlestat' tool function | 
 |  * idlestat_wake_all() in idlestate.c. | 
 |  * | 
 |  * It sets the self running task affinity to cpus one by one so can wake up | 
 |  * the specific CPU to handle scheduling; this results in all cpus can be | 
 |  * waken up once and produce ftrace event 'trace_cpu_idle'. | 
 |  */ | 
 | static int cpu_stat_inject_cpu_idle_event(void) | 
 | { | 
 | 	int rcpu, i, ret; | 
 | 	cpu_set_t cpumask; | 
 | 	cpu_set_t original_cpumask; | 
 |  | 
 | 	ret = sysconf(_SC_NPROCESSORS_CONF); | 
 | 	if (ret < 0) | 
 | 		return -1; | 
 |  | 
 | 	rcpu = sched_getcpu(); | 
 | 	if (rcpu < 0) | 
 | 		return -1; | 
 |  | 
 | 	/* Keep track of the CPUs we will run on */ | 
 | 	sched_getaffinity(0, sizeof(original_cpumask), &original_cpumask); | 
 |  | 
 | 	for (i = 0; i < ret; i++) { | 
 |  | 
 | 		/* Pointless to wake up ourself */ | 
 | 		if (i == rcpu) | 
 | 			continue; | 
 |  | 
 | 		/* Pointless to wake CPUs we will not run on */ | 
 | 		if (!CPU_ISSET(i, &original_cpumask)) | 
 | 			continue; | 
 |  | 
 | 		CPU_ZERO(&cpumask); | 
 | 		CPU_SET(i, &cpumask); | 
 |  | 
 | 		sched_setaffinity(0, sizeof(cpumask), &cpumask); | 
 | 	} | 
 |  | 
 | 	/* Enable all the CPUs of the original mask */ | 
 | 	sched_setaffinity(0, sizeof(original_cpumask), &original_cpumask); | 
 | 	return 0; | 
 | } | 
 |  | 
 | /* | 
 |  * It's possible to have no any frequency change for long time and cannot | 
 |  * get ftrace event 'trace_cpu_frequency' for long period, this introduces | 
 |  * big deviation for pstate statistics. | 
 |  * | 
 |  * To solve this issue, below code forces to set 'scaling_max_freq' to 208MHz | 
 |  * for triggering ftrace event 'trace_cpu_frequency' and then recovery back to | 
 |  * the maximum frequency value 1.2GHz. | 
 |  */ | 
 | static int cpu_stat_inject_cpu_frequency_event(void) | 
 | { | 
 | 	int len, fd; | 
 |  | 
 | 	fd = open(CPUFREQ_MAX_SYSFS_PATH, O_WRONLY); | 
 | 	if (fd < 0) { | 
 | 		printf("failed to open scaling_max_freq, errno=%d\n", errno); | 
 | 		return fd; | 
 | 	} | 
 |  | 
 | 	len = write(fd, CPUFREQ_LOWEST_FREQ, strlen(CPUFREQ_LOWEST_FREQ)); | 
 | 	if (len < 0) { | 
 | 		printf("failed to open scaling_max_freq, errno=%d\n", errno); | 
 | 		goto err; | 
 | 	} | 
 |  | 
 | 	len = write(fd, CPUFREQ_HIGHEST_FREQ, strlen(CPUFREQ_HIGHEST_FREQ)); | 
 | 	if (len < 0) { | 
 | 		printf("failed to open scaling_max_freq, errno=%d\n", errno); | 
 | 		goto err; | 
 | 	} | 
 |  | 
 | err: | 
 | 	close(fd); | 
 | 	return len; | 
 | } | 
 |  | 
 | static void int_exit(int sig) | 
 | { | 
 | 	cpu_stat_inject_cpu_idle_event(); | 
 | 	cpu_stat_inject_cpu_frequency_event(); | 
 | 	cpu_stat_update(map_fd[1], map_fd[2]); | 
 | 	cpu_stat_print(); | 
 | 	exit(0); | 
 | } | 
 |  | 
 | int main(int argc, char **argv) | 
 | { | 
 | 	char filename[256]; | 
 | 	int ret; | 
 |  | 
 | 	snprintf(filename, sizeof(filename), "%s_kern.o", argv[0]); | 
 |  | 
 | 	if (load_bpf_file(filename)) { | 
 | 		printf("%s", bpf_log_buf); | 
 | 		return 1; | 
 | 	} | 
 |  | 
 | 	ret = cpu_stat_inject_cpu_idle_event(); | 
 | 	if (ret < 0) | 
 | 		return 1; | 
 |  | 
 | 	ret = cpu_stat_inject_cpu_frequency_event(); | 
 | 	if (ret < 0) | 
 | 		return 1; | 
 |  | 
 | 	signal(SIGINT, int_exit); | 
 | 	signal(SIGTERM, int_exit); | 
 |  | 
 | 	while (1) { | 
 | 		cpu_stat_update(map_fd[1], map_fd[2]); | 
 | 		cpu_stat_print(); | 
 | 		sleep(5); | 
 | 	} | 
 |  | 
 | 	return 0; | 
 | } |