1 // SPDX-License-Identifier: GPL-2.0
12 #include <linux/bpf.h>
14 #include <sys/types.h>
17 #include <sys/resource.h>
24 #define MAX_PSTATE_ENTRIES 5
25 #define MAX_CSTATE_ENTRIES 3
28 #define CPUFREQ_MAX_SYSFS_PATH "/sys/devices/system/cpu/cpu0/cpufreq/scaling_max_freq"
29 #define CPUFREQ_LOWEST_FREQ "208000"
30 #define CPUFREQ_HIGHEST_FREQ "12000000"
32 struct cpu_stat_data
{
33 unsigned long cstate
[MAX_CSTATE_ENTRIES
];
34 unsigned long pstate
[MAX_PSTATE_ENTRIES
];
37 static struct cpu_stat_data stat_data
[MAX_CPU
];
39 static void cpu_stat_print(void)
42 char state_str
[sizeof("cstate-9")];
43 struct cpu_stat_data
*data
;
49 printf("\nCPU states statistics:\n");
50 printf("%-10s ", "state(ms)");
52 for (i
= 0; i
< MAX_CSTATE_ENTRIES
; i
++) {
53 sprintf(state_str
, "cstate-%d", i
);
54 printf("%-11s ", state_str
);
57 for (i
= 0; i
< MAX_PSTATE_ENTRIES
; i
++) {
58 sprintf(state_str
, "pstate-%d", i
);
59 printf("%-11s ", state_str
);
64 for (j
= 0; j
< MAX_CPU
; j
++) {
67 printf("CPU-%-6d ", j
);
68 for (i
= 0; i
< MAX_CSTATE_ENTRIES
; i
++)
69 printf("%-11ld ", data
->cstate
[i
] / 1000000);
71 for (i
= 0; i
< MAX_PSTATE_ENTRIES
; i
++)
72 printf("%-11ld ", data
->pstate
[i
] / 1000000);
78 static void cpu_stat_update(int cstate_fd
, int pstate_fd
)
80 unsigned long key
, value
;
83 for (c
= 0; c
< MAX_CPU
; c
++) {
84 for (i
= 0; i
< MAX_CSTATE_ENTRIES
; i
++) {
85 key
= c
* MAX_CSTATE_ENTRIES
+ i
;
86 bpf_map_lookup_elem(cstate_fd
, &key
, &value
);
87 stat_data
[c
].cstate
[i
] = value
;
90 for (i
= 0; i
< MAX_PSTATE_ENTRIES
; i
++) {
91 key
= c
* MAX_PSTATE_ENTRIES
+ i
;
92 bpf_map_lookup_elem(pstate_fd
, &key
, &value
);
93 stat_data
[c
].pstate
[i
] = value
;
99 * This function is copied from 'idlestat' tool function
100 * idlestat_wake_all() in idlestate.c.
102 * It sets the self running task affinity to cpus one by one so can wake up
103 * the specific CPU to handle scheduling; this results in all cpus can be
104 * waken up once and produce ftrace event 'trace_cpu_idle'.
106 static int cpu_stat_inject_cpu_idle_event(void)
110 cpu_set_t original_cpumask
;
112 ret
= sysconf(_SC_NPROCESSORS_CONF
);
116 rcpu
= sched_getcpu();
120 /* Keep track of the CPUs we will run on */
121 sched_getaffinity(0, sizeof(original_cpumask
), &original_cpumask
);
123 for (i
= 0; i
< ret
; i
++) {
125 /* Pointless to wake up ourself */
129 /* Pointless to wake CPUs we will not run on */
130 if (!CPU_ISSET(i
, &original_cpumask
))
134 CPU_SET(i
, &cpumask
);
136 sched_setaffinity(0, sizeof(cpumask
), &cpumask
);
139 /* Enable all the CPUs of the original mask */
140 sched_setaffinity(0, sizeof(original_cpumask
), &original_cpumask
);
145 * It's possible to have no any frequency change for long time and cannot
146 * get ftrace event 'trace_cpu_frequency' for long period, this introduces
147 * big deviation for pstate statistics.
149 * To solve this issue, below code forces to set 'scaling_max_freq' to 208MHz
150 * for triggering ftrace event 'trace_cpu_frequency' and then recovery back to
151 * the maximum frequency value 1.2GHz.
153 static int cpu_stat_inject_cpu_frequency_event(void)
157 fd
= open(CPUFREQ_MAX_SYSFS_PATH
, O_WRONLY
);
159 printf("failed to open scaling_max_freq, errno=%d\n", errno
);
163 len
= write(fd
, CPUFREQ_LOWEST_FREQ
, strlen(CPUFREQ_LOWEST_FREQ
));
165 printf("failed to open scaling_max_freq, errno=%d\n", errno
);
169 len
= write(fd
, CPUFREQ_HIGHEST_FREQ
, strlen(CPUFREQ_HIGHEST_FREQ
));
171 printf("failed to open scaling_max_freq, errno=%d\n", errno
);
180 static void int_exit(int sig
)
182 cpu_stat_inject_cpu_idle_event();
183 cpu_stat_inject_cpu_frequency_event();
184 cpu_stat_update(map_fd
[1], map_fd
[2]);
189 int main(int argc
, char **argv
)
194 snprintf(filename
, sizeof(filename
), "%s_kern.o", argv
[0]);
196 if (load_bpf_file(filename
)) {
197 printf("%s", bpf_log_buf
);
201 ret
= cpu_stat_inject_cpu_idle_event();
205 ret
= cpu_stat_inject_cpu_frequency_event();
209 signal(SIGINT
, int_exit
);
210 signal(SIGTERM
, int_exit
);
213 cpu_stat_update(map_fd
[1], map_fd
[2]);