/*
 * turbostat -- show CPU frequency and C-state residency
 * on modern Intel turbo-capable processors.
 *
 * Copyright (c) 2010, Intel Corporation.
 * Len Brown <len.brown@intel.com>
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License along with
 * this program; if not, write to the Free Software Foundation, Inc.,
 * 51 Franklin St - Fifth Floor, Boston, MA 02110-1301 USA.
 */
24 #include <sys/types.h>
27 #include <sys/resource.h>
/*
 * MSR addresses handed to get_msr() as its offset argument.
 *
 * PLATFORM_INFO and TURBO_RATIO_LIMIT are read by print_nehalem_info();
 * APERF/MPERF and the core/package C-state residency addresses are read
 * by get_counters().  Entries tagged "SNB only" carry that restriction
 * from the original author.
 *
 * NOTE(review): get_counters() also uses MSR_TSC, which is not defined in
 * this group -- confirm it is defined elsewhere in the file.
 */
37 #define MSR_NEHALEM_PLATFORM_INFO 0xCE
38 #define MSR_NEHALEM_TURBO_RATIO_LIMIT 0x1AD
39 #define MSR_APERF 0xE8
40 #define MSR_MPERF 0xE7
41 #define MSR_PKG_C2_RESIDENCY 0x60D /* SNB only */
42 #define MSR_PKG_C3_RESIDENCY 0x3F8
43 #define MSR_PKG_C6_RESIDENCY 0x3F9
44 #define MSR_PKG_C7_RESIDENCY 0x3FA /* SNB only */
45 #define MSR_CORE_C3_RESIDENCY 0x3FC
46 #define MSR_CORE_C6_RESIDENCY 0x3FD
47 #define MSR_CORE_C7_RESIDENCY 0x3FE /* SNB only */
49 char *proc_stat
= "/proc/stat";
50 unsigned int interval_sec
= 5; /* set with -i interval_sec */
51 unsigned int verbose
; /* set with -v */
54 unsigned int do_nhm_cstates
;
55 unsigned int do_snb_cstates
;
56 unsigned int has_aperf
;
57 unsigned int units
= 1000000000; /* Ghz etc */
58 unsigned int genuine_intel
;
59 unsigned int has_invariant_tsc
;
60 unsigned int do_nehalem_platform_info
;
61 unsigned int do_nehalem_turbo_ratio_limit
;
62 unsigned int extra_msr_offset
;
64 unsigned int show_pkg
;
65 unsigned int show_core
;
66 unsigned int show_cpu
;
68 int aperf_mperf_unstable
;
71 int need_reinitialize
;
76 unsigned long long tsc
; /* per thread */
77 unsigned long long aperf
; /* per thread */
78 unsigned long long mperf
; /* per thread */
79 unsigned long long c1
; /* per thread (calculated) */
80 unsigned long long c3
; /* per core */
81 unsigned long long c6
; /* per core */
82 unsigned long long c7
; /* per core */
83 unsigned long long pc2
; /* per package */
84 unsigned long long pc3
; /* per package */
85 unsigned long long pc6
; /* per package */
86 unsigned long long pc7
; /* per package */
87 unsigned long long extra_msr
; /* per thread */
91 struct counters
*next
;
94 struct counters
*cnt_even
;
95 struct counters
*cnt_odd
;
96 struct counters
*cnt_delta
;
97 struct counters
*cnt_average
;
98 struct timeval tv_even
;
99 struct timeval tv_odd
;
100 struct timeval tv_delta
;
/*
 * get_msr - read one MSR value for a CPU through /dev/cpu/<cpu>/msr.
 * @cpu:    CPU number substituted into the device path.
 * @offset: file offset passed to pread(); callers in this file pass an
 *          MSR address here.
 *
 * The visible statements format the device path, open it read-only,
 * pread() sizeof(msr) bytes at @offset into msr, and print a diagnostic
 * to stderr when the read does not return sizeof(msr) bytes.
 *
 * NOTE(review): several lines of this function (local declarations, the
 * check on fd, the return statements) are not visible in this excerpt.
 */
102 unsigned long long get_msr(int cpu
, off_t offset
)
105 unsigned long long msr
;
/* NOTE(review): unbounded sprintf(); the size of pathname is not visible here -- confirm it fits the longest path. */
109 sprintf(pathname
, "/dev/cpu/%d/msr", cpu
);
110 fd
= open(pathname
, O_RDONLY
);
/* Requests a topology re-initialization; presumably on the open() failure path -- the guarding condition is not visible, confirm. */
113 need_reinitialize
= 1;
117 retval
= pread(fd
, &msr
, sizeof msr
, offset
);
118 if (retval
!= sizeof msr
) {
/*
 * NOTE(review): "%zx" expects a size_t but is given offset (an off_t),
 * and "%jd" expects an intmax_t but is given retval; neither matches
 * without a cast -- confirm retval's declared type and cast both.
 */
119 fprintf(stderr
, "cpu%d pread(..., 0x%zx) = %jd\n",
120 cpu
, offset
, retval
);
128 void print_header(void)
131 fprintf(stderr
, "pk");
133 fprintf(stderr
, " cr");
135 fprintf(stderr
, " CPU");
137 fprintf(stderr
, " %%c0 ");
139 fprintf(stderr
, " GHz");
140 fprintf(stderr
, " TSC");
142 fprintf(stderr
, " %%c1");
144 fprintf(stderr
, " %%c3");
146 fprintf(stderr
, " %%c6");
148 fprintf(stderr
, " %%c7");
150 fprintf(stderr
, " %%pc2");
152 fprintf(stderr
, " %%pc3");
154 fprintf(stderr
, " %%pc6");
156 fprintf(stderr
, " %%pc7");
157 if (extra_msr_offset
)
158 fprintf(stderr
, " MSR 0x%x ", extra_msr_offset
);
163 void dump_cnt(struct counters
*cnt
)
167 if (cnt
->pkg
) fprintf(stderr
, "package: %d ", cnt
->pkg
);
168 if (cnt
->core
) fprintf(stderr
, "core:: %d ", cnt
->core
);
169 if (cnt
->cpu
) fprintf(stderr
, "CPU: %d ", cnt
->cpu
);
170 if (cnt
->tsc
) fprintf(stderr
, "TSC: %016llX\n", cnt
->tsc
);
171 if (cnt
->c3
) fprintf(stderr
, "c3: %016llX\n", cnt
->c3
);
172 if (cnt
->c6
) fprintf(stderr
, "c6: %016llX\n", cnt
->c6
);
173 if (cnt
->c7
) fprintf(stderr
, "c7: %016llX\n", cnt
->c7
);
174 if (cnt
->aperf
) fprintf(stderr
, "aperf: %016llX\n", cnt
->aperf
);
175 if (cnt
->pc2
) fprintf(stderr
, "pc2: %016llX\n", cnt
->pc2
);
176 if (cnt
->pc3
) fprintf(stderr
, "pc3: %016llX\n", cnt
->pc3
);
177 if (cnt
->pc6
) fprintf(stderr
, "pc6: %016llX\n", cnt
->pc6
);
178 if (cnt
->pc7
) fprintf(stderr
, "pc7: %016llX\n", cnt
->pc7
);
179 if (cnt
->extra_msr
) fprintf(stderr
, "msr0x%x: %016llX\n", extra_msr_offset
, cnt
->extra_msr
);
/*
 * dump_list - debug helper that walks a counters list.
 * @cnt: head of the list; traversal follows ->next until NULL.
 *
 * Prints the head pointer to stdout, then iterates over every node.
 *
 * NOTE(review): the loop body is not visible in this excerpt; presumably
 * it dumps each node -- confirm.
 */
182 void dump_list(struct counters
*cnt
)
/*
 * NOTE(review): "%p" requires a void * argument, so cnt should be cast;
 * the literal "0x" prefix may also duplicate a prefix the C library
 * already emits for "%p" (the output format is implementation-defined).
 */
184 printf("dump_list 0x%p\n", cnt
);
186 for (; cnt
; cnt
= cnt
->next
)
190 void print_cnt(struct counters
*p
)
192 double interval_float
;
194 interval_float
= tv_delta
.tv_sec
+ tv_delta
.tv_usec
/1000000.0;
196 /* topology columns, print blanks on 1st (average) line */
197 if (p
== cnt_average
) {
199 fprintf(stderr
, " ");
201 fprintf(stderr
, " ");
203 fprintf(stderr
, " ");
206 fprintf(stderr
, "%d", p
->pkg
);
208 fprintf(stderr
, "%4d", p
->core
);
210 fprintf(stderr
, "%4d", p
->cpu
);
214 if (do_nhm_cstates
) {
216 fprintf(stderr
, "%7.2f", 100.0 * p
->mperf
/p
->tsc
);
218 fprintf(stderr
, " ****");
223 if (!aperf_mperf_unstable
) {
224 fprintf(stderr
, "%5.2f",
225 1.0 * p
->tsc
/ units
* p
->aperf
/
226 p
->mperf
/ interval_float
);
228 if (p
->aperf
> p
->tsc
|| p
->mperf
> p
->tsc
) {
229 fprintf(stderr
, " ****");
231 fprintf(stderr
, "%4.1f*",
234 p
->mperf
/ interval_float
);
240 fprintf(stderr
, "%5.2f", 1.0 * p
->tsc
/units
/interval_float
);
242 if (do_nhm_cstates
) {
244 fprintf(stderr
, "%7.2f", 100.0 * p
->c1
/p
->tsc
);
246 fprintf(stderr
, " ****");
249 fprintf(stderr
, " %6.2f", 100.0 * p
->c3
/p
->tsc
);
251 fprintf(stderr
, " %6.2f", 100.0 * p
->c6
/p
->tsc
);
253 fprintf(stderr
, " %6.2f", 100.0 * p
->c7
/p
->tsc
);
255 fprintf(stderr
, " %5.2f", 100.0 * p
->pc2
/p
->tsc
);
257 fprintf(stderr
, " %5.2f", 100.0 * p
->pc3
/p
->tsc
);
259 fprintf(stderr
, " %5.2f", 100.0 * p
->pc6
/p
->tsc
);
261 fprintf(stderr
, " %5.2f", 100.0 * p
->pc7
/p
->tsc
);
262 if (extra_msr_offset
)
263 fprintf(stderr
, " 0x%016llx", p
->extra_msr
);
267 void print_counters(struct counters
*counters
)
269 struct counters
*cnt
;
274 print_cnt(cnt_average
);
276 for (cnt
= counters
; cnt
!= NULL
; cnt
= cnt
->next
)
/*
 * SUBTRACT_COUNTER - store (after - before) in delta and report a wrap.
 *
 * The expression evaluates to nonzero when before > after, i.e. when the
 * counter appears to have gone backwards; delta is assigned either way.
 * delta must be a modifiable lvalue.  Every argument is parenthesized so
 * that expression arguments expand with the intended precedence.  after
 * and before are each evaluated twice, so do not pass expressions with
 * side effects.
 */
#define SUBTRACT_COUNTER(after, before, delta) \
	((delta) = ((after) - (before)), ((before) > (after)))
283 int compute_delta(struct counters
*after
,
284 struct counters
*before
, struct counters
*delta
)
289 skip_c0
= skip_c1
= 0;
291 for ( ; after
&& before
&& delta
;
292 after
= after
->next
, before
= before
->next
, delta
= delta
->next
) {
293 if (before
->cpu
!= after
->cpu
) {
294 printf("cpu configuration changed: %d != %d\n",
295 before
->cpu
, after
->cpu
);
299 if (SUBTRACT_COUNTER(after
->tsc
, before
->tsc
, delta
->tsc
)) {
300 fprintf(stderr
, "cpu%d TSC went backwards %llX to %llX\n",
301 before
->cpu
, before
->tsc
, after
->tsc
);
304 /* check for TSC < 1 Mcycles over interval */
305 if (delta
->tsc
< (1000 * 1000)) {
306 fprintf(stderr
, "Insanely slow TSC rate,"
307 " TSC stops in idle?\n");
308 fprintf(stderr
, "You can disable all c-states"
309 " by booting with \"idle=poll\"\n");
310 fprintf(stderr
, "or just the deep ones with"
311 " \"processor.max_cstate=1\"\n");
314 if (SUBTRACT_COUNTER(after
->c3
, before
->c3
, delta
->c3
)) {
315 fprintf(stderr
, "cpu%d c3 counter went backwards %llX to %llX\n",
316 before
->cpu
, before
->c3
, after
->c3
);
319 if (SUBTRACT_COUNTER(after
->c6
, before
->c6
, delta
->c6
)) {
320 fprintf(stderr
, "cpu%d c6 counter went backwards %llX to %llX\n",
321 before
->cpu
, before
->c6
, after
->c6
);
324 if (SUBTRACT_COUNTER(after
->c7
, before
->c7
, delta
->c7
)) {
325 fprintf(stderr
, "cpu%d c7 counter went backwards %llX to %llX\n",
326 before
->cpu
, before
->c7
, after
->c7
);
329 if (SUBTRACT_COUNTER(after
->pc2
, before
->pc2
, delta
->pc2
)) {
330 fprintf(stderr
, "cpu%d pc2 counter went backwards %llX to %llX\n",
331 before
->cpu
, before
->pc2
, after
->pc2
);
334 if (SUBTRACT_COUNTER(after
->pc3
, before
->pc3
, delta
->pc3
)) {
335 fprintf(stderr
, "cpu%d pc3 counter went backwards %llX to %llX\n",
336 before
->cpu
, before
->pc3
, after
->pc3
);
339 if (SUBTRACT_COUNTER(after
->pc6
, before
->pc6
, delta
->pc6
)) {
340 fprintf(stderr
, "cpu%d pc6 counter went backwards %llX to %llX\n",
341 before
->cpu
, before
->pc6
, after
->pc6
);
344 if (SUBTRACT_COUNTER(after
->pc7
, before
->pc7
, delta
->pc7
)) {
345 fprintf(stderr
, "cpu%d pc7 counter went backwards %llX to %llX\n",
346 before
->cpu
, before
->pc7
, after
->pc7
);
350 perf_err
= SUBTRACT_COUNTER(after
->aperf
, before
->aperf
, delta
->aperf
);
352 fprintf(stderr
, "cpu%d aperf counter went backwards %llX to %llX\n",
353 before
->cpu
, before
->aperf
, after
->aperf
);
355 perf_err
|= SUBTRACT_COUNTER(after
->mperf
, before
->mperf
, delta
->mperf
);
357 fprintf(stderr
, "cpu%d mperf counter went backwards %llX to %llX\n",
358 before
->cpu
, before
->mperf
, after
->mperf
);
361 if (!aperf_mperf_unstable
) {
362 fprintf(stderr
, "%s: APERF or MPERF went backwards *\n", progname
);
363 fprintf(stderr
, "* Frequency results do not cover entire interval *\n");
364 fprintf(stderr
, "* fix this by running Linux-2.6.30 or later *\n");
366 aperf_mperf_unstable
= 1;
369 * mperf delta is likely a huge "positive" number
370 * can not use it for calculating c0 time
377 * As mperf and tsc collection are not atomic,
378 * it is possible for mperf's non-halted cycles
379 * to exceed TSC's all cycles: show c1 = 0% in that case.
381 if (delta
->mperf
> delta
->tsc
)
383 else /* normal case, derive c1 */
384 delta
->c1
= delta
->tsc
- delta
->mperf
385 - delta
->c3
- delta
->c6
- delta
->c7
;
387 if (delta
->mperf
== 0)
388 delta
->mperf
= 1; /* divide by 0 protection */
391 * for "extra msr", just copy the latest w/o subtracting
393 delta
->extra_msr
= after
->extra_msr
;
395 fprintf(stderr
, "ERROR cpu%d before:\n", before
->cpu
);
397 fprintf(stderr
, "ERROR cpu%d after:\n", before
->cpu
);
405 void compute_average(struct counters
*delta
, struct counters
*avg
)
407 struct counters
*sum
;
409 sum
= calloc(1, sizeof(struct counters
));
411 perror("calloc sum");
415 for (; delta
; delta
= delta
->next
) {
416 sum
->tsc
+= delta
->tsc
;
417 sum
->c1
+= delta
->c1
;
418 sum
->c3
+= delta
->c3
;
419 sum
->c6
+= delta
->c6
;
420 sum
->c7
+= delta
->c7
;
421 sum
->aperf
+= delta
->aperf
;
422 sum
->mperf
+= delta
->mperf
;
423 sum
->pc2
+= delta
->pc2
;
424 sum
->pc3
+= delta
->pc3
;
425 sum
->pc6
+= delta
->pc6
;
426 sum
->pc7
+= delta
->pc7
;
428 avg
->tsc
= sum
->tsc
/num_cpus
;
429 avg
->c1
= sum
->c1
/num_cpus
;
430 avg
->c3
= sum
->c3
/num_cpus
;
431 avg
->c6
= sum
->c6
/num_cpus
;
432 avg
->c7
= sum
->c7
/num_cpus
;
433 avg
->aperf
= sum
->aperf
/num_cpus
;
434 avg
->mperf
= sum
->mperf
/num_cpus
;
435 avg
->pc2
= sum
->pc2
/num_cpus
;
436 avg
->pc3
= sum
->pc3
/num_cpus
;
437 avg
->pc6
= sum
->pc6
/num_cpus
;
438 avg
->pc7
= sum
->pc7
/num_cpus
;
443 void get_counters(struct counters
*cnt
)
445 for ( ; cnt
; cnt
= cnt
->next
) {
446 cnt
->tsc
= get_msr(cnt
->cpu
, MSR_TSC
);
448 cnt
->c3
= get_msr(cnt
->cpu
, MSR_CORE_C3_RESIDENCY
);
450 cnt
->c6
= get_msr(cnt
->cpu
, MSR_CORE_C6_RESIDENCY
);
452 cnt
->c7
= get_msr(cnt
->cpu
, MSR_CORE_C7_RESIDENCY
);
454 cnt
->aperf
= get_msr(cnt
->cpu
, MSR_APERF
);
456 cnt
->mperf
= get_msr(cnt
->cpu
, MSR_MPERF
);
458 cnt
->pc2
= get_msr(cnt
->cpu
, MSR_PKG_C2_RESIDENCY
);
460 cnt
->pc3
= get_msr(cnt
->cpu
, MSR_PKG_C3_RESIDENCY
);
462 cnt
->pc6
= get_msr(cnt
->cpu
, MSR_PKG_C6_RESIDENCY
);
464 cnt
->pc7
= get_msr(cnt
->cpu
, MSR_PKG_C7_RESIDENCY
);
465 if (extra_msr_offset
)
466 cnt
->extra_msr
= get_msr(cnt
->cpu
, extra_msr_offset
);
470 void print_nehalem_info(void)
472 unsigned long long msr
;
475 if (!do_nehalem_platform_info
)
478 msr
= get_msr(0, MSR_NEHALEM_PLATFORM_INFO
);
480 ratio
= (msr
>> 40) & 0xFF;
481 fprintf(stderr
, "%d * %.0f = %.0f MHz max efficiency\n",
482 ratio
, bclk
, ratio
* bclk
);
484 ratio
= (msr
>> 8) & 0xFF;
485 fprintf(stderr
, "%d * %.0f = %.0f MHz TSC frequency\n",
486 ratio
, bclk
, ratio
* bclk
);
489 fprintf(stderr
, "MSR_NEHALEM_PLATFORM_INFO: 0x%llx\n", msr
);
491 if (!do_nehalem_turbo_ratio_limit
)
494 msr
= get_msr(0, MSR_NEHALEM_TURBO_RATIO_LIMIT
);
496 ratio
= (msr
>> 24) & 0xFF;
498 fprintf(stderr
, "%d * %.0f = %.0f MHz max turbo 4 active cores\n",
499 ratio
, bclk
, ratio
* bclk
);
501 ratio
= (msr
>> 16) & 0xFF;
503 fprintf(stderr
, "%d * %.0f = %.0f MHz max turbo 3 active cores\n",
504 ratio
, bclk
, ratio
* bclk
);
506 ratio
= (msr
>> 8) & 0xFF;
508 fprintf(stderr
, "%d * %.0f = %.0f MHz max turbo 2 active cores\n",
509 ratio
, bclk
, ratio
* bclk
);
511 ratio
= (msr
>> 0) & 0xFF;
513 fprintf(stderr
, "%d * %.0f = %.0f MHz max turbo 1 active cores\n",
514 ratio
, bclk
, ratio
* bclk
);
518 void free_counter_list(struct counters
*list
)
522 for (p
= list
; p
; ) {
523 struct counters
*free_me
;
/*
 * free_all_counters - hand each of the four global counter lists
 * (cnt_even, cnt_odd, cnt_delta, cnt_average) to free_counter_list().
 *
 * NOTE(review): the statements between these calls are not visible in
 * this excerpt; confirm the list heads are reset before the lists are
 * rebuilt by re_initialize().
 */
531 void free_all_counters(void)
533 free_counter_list(cnt_even
);
536 free_counter_list(cnt_odd
);
539 free_counter_list(cnt_delta
);
542 free_counter_list(cnt_average
);
546 void insert_counters(struct counters
**list
,
547 struct counters
*new)
549 struct counters
*prev
;
560 show_cpu
= 1; /* there is more than one CPU */
563 * insert on front of list.
564 * It is sorted by ascending package#, core#, cpu#
566 if (((*list
)->pkg
> new->pkg
) ||
567 (((*list
)->pkg
== new->pkg
) && ((*list
)->core
> new->core
)) ||
568 (((*list
)->pkg
== new->pkg
) && ((*list
)->core
== new->core
) && ((*list
)->cpu
> new->cpu
))) {
576 while (prev
->next
&& (prev
->next
->pkg
< new->pkg
)) {
578 show_pkg
= 1; /* there is more than 1 package */
581 while (prev
->next
&& (prev
->next
->pkg
== new->pkg
)
582 && (prev
->next
->core
< new->core
)) {
584 show_core
= 1; /* there is more than 1 core */
587 while (prev
->next
&& (prev
->next
->pkg
== new->pkg
)
588 && (prev
->next
->core
== new->core
)
589 && (prev
->next
->cpu
< new->cpu
)) {
594 * insert after "prev"
596 new->next
= prev
->next
;
600 void alloc_new_counters(int pkg
, int core
, int cpu
)
602 struct counters
*new;
605 printf("pkg%d core%d, cpu%d\n", pkg
, core
, cpu
);
607 new = (struct counters
*)calloc(1, sizeof(struct counters
));
615 insert_counters(&cnt_odd
, new);
617 new = (struct counters
*)calloc(1,
618 sizeof(struct counters
));
626 insert_counters(&cnt_even
, new);
628 new = (struct counters
*)calloc(1, sizeof(struct counters
));
636 insert_counters(&cnt_delta
, new);
638 new = (struct counters
*)calloc(1, sizeof(struct counters
));
/*
 * get_physical_package_id - read a CPU's package id from sysfs.
 * @cpu: CPU number substituted into the sysfs path.
 *
 * Formats the topology/physical_package_id path for @cpu, opens it for
 * reading and parses one decimal integer into pkg.
 *
 * NOTE(review): the declarations, any check on filep, the fclose() and
 * the return statement are not visible in this excerpt.
 */
649 int get_physical_package_id(int cpu
)
/* NOTE(review): unbounded sprintf(); the size of path is not visible here -- confirm it fits. */
655 sprintf(path
, "/sys/devices/system/cpu/cpu%d/topology/physical_package_id", cpu
);
656 filep
= fopen(path
, "r");
/* NOTE(review): the fscanf() result is discarded, so pkg is whatever it held before if parsing fails. */
661 fscanf(filep
, "%d", &pkg
);
/*
 * get_core_id - read a CPU's core id from sysfs.
 * @cpu: CPU number substituted into the sysfs path.
 *
 * Formats the topology/core_id path for @cpu, opens it for reading and
 * parses one decimal integer into core.
 *
 * NOTE(review): the declarations, any check on filep, the fclose() and
 * the return statement are not visible in this excerpt.
 */
666 int get_core_id(int cpu
)
/* NOTE(review): unbounded sprintf(); the size of path is not visible here -- confirm it fits. */
672 sprintf(path
, "/sys/devices/system/cpu/cpu%d/topology/core_id", cpu
);
673 filep
= fopen(path
, "r");
/* NOTE(review): the fscanf() result is discarded, so core is whatever it held before if parsing fails. */
678 fscanf(filep
, "%d", &core
);
684 * run func(index, cpu) on every cpu in /proc/stat
/*
 * for_all_cpus - invoke a callback for every "cpuN" line of proc_stat.
 * @func: callback invoked as func(package id, core id, cpu number); the
 *        ids come from get_physical_package_id() and get_core_id().
 *
 * Opens the file named by proc_stat, consumes the aggregate "cpu " line,
 * then parses "cpuN ..." lines in a loop that counts iterations in
 * cpu_count.  Callers in this file store the return value as num_cpus.
 *
 * NOTE(review): the loop exit test, the error checks around fopen() and
 * fscanf(), and the return statement are not visible in this excerpt.
 */
687 int for_all_cpus(void (func
)(int, int, int))
693 fp
= fopen(proc_stat
, "r");
/* Skip the first, aggregate line: all ten fields are parsed and discarded. */
699 retval
= fscanf(fp
, "cpu %*d %*d %*d %*d %*d %*d %*d %*d %*d %*d\n");
701 perror("/proc/stat format");
705 for (cpu_count
= 0; ; cpu_count
++) {
/* Only the CPU number is stored; "%u" requires cpu to be an unsigned int -- declaration not visible, confirm. */
708 retval
= fscanf(fp
, "cpu%u %*d %*d %*d %*d %*d %*d %*d %*d %*d %*d\n", &cpu
);
712 func(get_physical_package_id(cpu
), get_core_id(cpu
), cpu
);
/*
 * re_initialize - rebuild the counter lists after a topology change.
 *
 * Announces the change on stdout, re-runs for_all_cpus() with
 * alloc_new_counters as the callback, stores the result in num_cpus,
 * clears need_reinitialize and prints the new CPU count.
 *
 * NOTE(review): one statement between the first printf() and the
 * for_all_cpus() call is not visible in this excerpt; presumably it
 * releases the old lists -- confirm.
 */
718 void re_initialize(void)
720 printf("turbostat: topology changed, re-initializing.\n");
722 num_cpus
= for_all_cpus(alloc_new_counters
);
723 need_reinitialize
= 0;
724 printf("num_cpus is now %d\n", num_cpus
);
/*
 * dummy - no-op callback with the (pkg, core, cpu) signature taken by
 * for_all_cpus(); passing it lets a caller obtain the CPU count without
 * doing any per-CPU work.
 */
void dummy(int pkg, int core, int cpu)
{
	/* nothing to do: the arguments are deliberately ignored */
	(void)pkg;
	(void)core;
	(void)cpu;
}
729 * check to see if a cpu came on-line
/*
 * verify_num_cpus - detect a change in the number of CPUs.
 *
 * Recounts the CPUs by running for_all_cpus() with the no-op callback
 * dummy, compares the result with num_cpus, and on a mismatch prints
 * both counts and sets need_reinitialize to 1.
 *
 * NOTE(review): the declaration of new_num_cpus and any condition
 * guarding the printf() are not visible in this excerpt.
 */
731 void verify_num_cpus(void)
735 new_num_cpus
= for_all_cpus(dummy
);
737 if (new_num_cpus
!= num_cpus
) {
739 printf("num_cpus was %d, is now %d\n",
740 num_cpus
, new_num_cpus
);
741 need_reinitialize
= 1;
745 void turbostat_loop()
748 get_counters(cnt_even
);
749 gettimeofday(&tv_even
, (struct timezone
*)NULL
);
753 if (need_reinitialize
) {
758 get_counters(cnt_odd
);
759 gettimeofday(&tv_odd
, (struct timezone
*)NULL
);
761 compute_delta(cnt_odd
, cnt_even
, cnt_delta
);
762 timersub(&tv_odd
, &tv_even
, &tv_delta
);
763 compute_average(cnt_delta
, cnt_average
);
764 print_counters(cnt_delta
);
765 if (need_reinitialize
) {
770 get_counters(cnt_even
);
771 gettimeofday(&tv_even
, (struct timezone
*)NULL
);
772 compute_delta(cnt_even
, cnt_odd
, cnt_delta
);
773 timersub(&tv_even
, &tv_odd
, &tv_delta
);
774 compute_average(cnt_delta
, cnt_average
);
775 print_counters(cnt_delta
);
783 if (stat("/dev/cpu/0/msr", &sb
)) {
784 fprintf(stderr
, "no /dev/cpu/0/msr\n");
785 fprintf(stderr
, "Try \"# modprobe msr\"\n");
790 void check_super_user()
793 fprintf(stderr
, "must be root\n");
798 int has_nehalem_turbo_ratio_limit(unsigned int family
, unsigned int model
)
807 case 0x1A: /* Core i7, Xeon 5500 series - Bloomfield, Gainstown NHM-EP */
808 case 0x1E: /* Core i7 and i5 Processor - Clarksfield, Lynnfield, Jasper Forest */
809 case 0x1F: /* Core i7 and i5 Processor - Nehalem */
810 case 0x25: /* Westmere Client - Clarkdale, Arrandale */
811 case 0x2C: /* Westmere EP - Gulftown */
813 case 0x2D: /* SNB Xeon */
815 case 0x2E: /* Nehalem-EX Xeon - Beckton */
816 case 0x2F: /* Westmere-EX Xeon - Eagleton */
822 int is_snb(unsigned int family
, unsigned int model
)
835 double discover_bclk(unsigned int family
, unsigned int model
)
837 if (is_snb(family
, model
))
845 unsigned int eax
, ebx
, ecx
, edx
, max_level
;
846 unsigned int fms
, family
, model
, stepping
;
848 eax
= ebx
= ecx
= edx
= 0;
850 asm("cpuid" : "=a" (max_level
), "=b" (ebx
), "=c" (ecx
), "=d" (edx
) : "a" (0));
852 if (ebx
== 0x756e6547 && edx
== 0x49656e69 && ecx
== 0x6c65746e)
856 fprintf(stderr
, "%.4s%.4s%.4s ",
857 (char *)&ebx
, (char *)&edx
, (char *)&ecx
);
859 asm("cpuid" : "=a" (fms
), "=c" (ecx
), "=d" (edx
) : "a" (1) : "ebx");
860 family
= (fms
>> 8) & 0xf;
861 model
= (fms
>> 4) & 0xf;
862 stepping
= fms
& 0xf;
863 if (family
== 6 || family
== 0xf)
864 model
+= ((fms
>> 16) & 0xf) << 4;
867 fprintf(stderr
, "%d CPUID levels; family:model:stepping 0x%x:%x:%x (%d:%d:%d)\n",
868 max_level
, family
, model
, stepping
, family
, model
, stepping
);
870 if (!(edx
& (1 << 5))) {
871 fprintf(stderr
, "CPUID: no MSR\n");
876 * check max extended function levels of CPUID.
877 * This is needed to check for invariant TSC.
878 * This check is valid for both Intel and AMD.
881 asm("cpuid" : "=a" (max_level
), "=b" (ebx
), "=c" (ecx
), "=d" (edx
) : "a" (0x80000000));
883 if (max_level
< 0x80000007) {
884 fprintf(stderr
, "CPUID: no invariant TSC (max_level 0x%x)\n", max_level
);
889 * Non-Stop TSC is advertised by CPUID.EAX=0x80000007: EDX.bit8
890 * this check is valid for both Intel and AMD
892 asm("cpuid" : "=a" (eax
), "=b" (ebx
), "=c" (ecx
), "=d" (edx
) : "a" (0x80000007));
893 has_invariant_tsc
= edx
& (1 << 8);
895 if (!has_invariant_tsc
) {
896 fprintf(stderr
, "No invariant TSC\n");
901 * APERF/MPERF is advertised by CPUID.EAX=0x6: ECX.bit0
902 * this check is valid for both Intel and AMD
905 asm("cpuid" : "=a" (eax
), "=b" (ebx
), "=c" (ecx
), "=d" (edx
) : "a" (0x6));
906 has_aperf
= ecx
& (1 << 0);
908 fprintf(stderr
, "No APERF MSR\n");
912 do_nehalem_platform_info
= genuine_intel
&& has_invariant_tsc
;
913 do_nhm_cstates
= genuine_intel
; /* all Intel w/ non-stop TSC have NHM counters */
914 do_snb_cstates
= is_snb(family
, model
);
915 bclk
= discover_bclk(family
, model
);
917 do_nehalem_turbo_ratio_limit
= has_nehalem_turbo_ratio_limit(family
, model
);
923 fprintf(stderr
, "%s: [-v] [-M MSR#] [-i interval_sec | command ...]\n",
930 * in /dev/cpu/ return success for names that are numbers
931 * ie. filter out ".", "..", "microcode".
/*
 * dir_filter - directory-entry predicate keyed on the first character
 * of the entry name.
 * @dirp: directory entry to test.
 *
 * Tests whether d_name[0] is a decimal digit.
 *
 * NOTE(review): the return statements are not visible in this excerpt.
 * NOTE(review): isdigit() takes an int that must be representable as
 * unsigned char (or EOF); d_name[0] is a plain char, so cast it to
 * unsigned char before the call.
 */
933 int dir_filter(const struct dirent
*dirp
)
935 if (isdigit(dirp
->d_name
[0]))
941 int open_dev_cpu_msr(int dummy1
)
946 void turbostat_init()
953 num_cpus
= for_all_cpus(alloc_new_counters
);
956 print_nehalem_info();
959 int fork_it(char **argv
)
963 get_counters(cnt_even
);
964 gettimeofday(&tv_even
, (struct timezone
*)NULL
);
969 execvp(argv
[0], argv
);
974 if (child_pid
== -1) {
979 signal(SIGINT
, SIG_IGN
);
980 signal(SIGQUIT
, SIG_IGN
);
981 if (waitpid(child_pid
, &status
, 0) == -1) {
986 get_counters(cnt_odd
);
987 gettimeofday(&tv_odd
, (struct timezone
*)NULL
);
988 retval
= compute_delta(cnt_odd
, cnt_even
, cnt_delta
);
990 timersub(&tv_odd
, &tv_even
, &tv_delta
);
991 compute_average(cnt_delta
, cnt_average
);
993 print_counters(cnt_delta
);
995 fprintf(stderr
, "%.6f sec\n", tv_delta
.tv_sec
+ tv_delta
.tv_usec
/1000000.0);
/*
 * cmdline - parse the command-line options.
 * @argc: argument count as received by main().
 * @argv: argument vector as received by main().
 *
 * Loops over getopt() with the option string "+vi:M:".  The visible
 * statements store the -i argument in interval_sec and parse the -M
 * argument as hexadecimal into extra_msr_offset, then echo it to stderr.
 *
 * NOTE(review): the switch skeleton, the -v handling and the default
 * case are not visible in this excerpt.
 */
1000 void cmdline(int argc
, char **argv
)
1006 while ((opt
= getopt(argc
, argv
, "+vi:M:")) != -1) {
/*
 * NOTE(review): atoi() reports no errors, and a negative or non-numeric
 * argument is silently converted into the unsigned interval_sec;
 * strtoul() with an end-pointer check would reject bad input.
 */
1012 interval_sec
= atoi(optarg
);
/* NOTE(review): the sscanf() result is discarded, so a malformed -M value leaves extra_msr_offset unchanged without a diagnostic. */
1015 sscanf(optarg
, "%x", &extra_msr_offset
);
1017 fprintf(stderr
, "MSR 0x%X\n", extra_msr_offset
);
1025 int main(int argc
, char **argv
)
1027 cmdline(argc
, argv
);
1030 fprintf(stderr
, "turbostat Dec 6, 2010"
1031 " - Len Brown <lenb@kernel.org>\n");
1033 fprintf(stderr
, "http://userweb.kernel.org/~lenb/acpi/utils/pmtools/turbostat/\n");
1038 * if any params left, it must be a command to fork
1041 return fork_it(argv
+ optind
);