| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 1 | /* | 
|  | 2 | * turbostat -- show CPU frequency and C-state residency | 
|  | 3 | * on modern Intel turbo-capable processors. | 
|  | 4 | * | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 5 | * Copyright (c) 2012 Intel Corporation. | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 6 | * Len Brown <len.brown@intel.com> | 
|  | 7 | * | 
|  | 8 | * This program is free software; you can redistribute it and/or modify it | 
|  | 9 | * under the terms and conditions of the GNU General Public License, | 
|  | 10 | * version 2, as published by the Free Software Foundation. | 
|  | 11 | * | 
|  | 12 | * This program is distributed in the hope it will be useful, but WITHOUT | 
|  | 13 | * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or | 
|  | 14 | * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for | 
|  | 15 | * more details. | 
|  | 16 | * | 
|  | 17 | * You should have received a copy of the GNU General Public License along with | 
|  | 18 | * this program; if not, write to the Free Software Foundation, Inc., | 
|  | 19 | * 51 Franklin St - Fifth Floor, Boston, MA 02110-1301 USA. | 
|  | 20 | */ | 
|  | 21 |  | 
| Len Brown | 88c3281 | 2012-03-29 21:44:40 -0400 | [diff] [blame] | 22 | #define _GNU_SOURCE | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 23 | #include <stdio.h> | 
|  | 24 | #include <unistd.h> | 
|  | 25 | #include <sys/types.h> | 
|  | 26 | #include <sys/wait.h> | 
|  | 27 | #include <sys/stat.h> | 
|  | 28 | #include <sys/resource.h> | 
|  | 29 | #include <fcntl.h> | 
|  | 30 | #include <signal.h> | 
|  | 31 | #include <sys/time.h> | 
|  | 32 | #include <stdlib.h> | 
|  | 33 | #include <dirent.h> | 
|  | 34 | #include <string.h> | 
|  | 35 | #include <ctype.h> | 
| Len Brown | 88c3281 | 2012-03-29 21:44:40 -0400 | [diff] [blame] | 36 | #include <sched.h> | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 37 |  | 
/*
 * Model-specific register (MSR) offsets read by this tool,
 * grouped by what they are used for.
 */

/* cycle counters */
#define MSR_TSC				0x10
#define MSR_MPERF			0xE7
#define MSR_APERF			0xE8

/* platform / turbo ratio information */
#define MSR_NEHALEM_PLATFORM_INFO	0xCE
#define MSR_NEHALEM_TURBO_RATIO_LIMIT	0x1AD

/* core C-state residency */
#define MSR_CORE_C3_RESIDENCY		0x3FC
#define MSR_CORE_C6_RESIDENCY		0x3FD
#define MSR_CORE_C7_RESIDENCY		0x3FE	/* SNB only */

/* package C-state residency */
#define MSR_PKG_C2_RESIDENCY		0x60D	/* SNB only */
#define MSR_PKG_C3_RESIDENCY		0x3F8
#define MSR_PKG_C6_RESIDENCY		0x3F9
#define MSR_PKG_C7_RESIDENCY		0x3FA	/* SNB only */
|  | 50 |  | 
char *proc_stat = "/proc/stat";
char *progname;			/* used as a prefix in diagnostics */

/* command-line settings */
unsigned int interval_sec = 5;	/* set with -i interval_sec */
unsigned int verbose;		/* set with -v */
unsigned int summary_only;	/* set with -s */

/*
 * Set by compute_delta() when APERF/MPERF went backwards;
 * print_cnt() then prints a "****" placeholder for %c0 / %c1.
 */
unsigned int skip_c0, skip_c1;

/* select which residency MSRs are read and which columns are printed */
unsigned int do_nhm_cstates, do_snb_cstates;

/* non-zero: APERF/MPERF are read and the GHz column is printed */
unsigned int has_aperf;

/* divisor applied to cycle counts before printing (Ghz etc) */
unsigned int units = 1000000000;

unsigned int genuine_intel;
unsigned int has_invariant_tsc;

/* gate the two sections of print_nehalem_info() */
unsigned int do_nehalem_platform_info;
unsigned int do_nehalem_turbo_ratio_limit;

/* non-zero: offset of one additional MSR to read for every CPU */
unsigned int extra_msr_offset;

/* multiplied with the MSR ratio fields to print MHz values */
double bclk;

/* which topology columns to print */
unsigned int show_pkg, show_core, show_cpu;

/* latched to 1 by compute_delta() once APERF or MPERF went backwards */
int aperf_mperf_unstable;
int backwards_count;

/* divisor used by compute_average() */
int num_cpus;

/* CPU sets and their sizes in bytes, managed by cpu_mask_init()/cpu_mask_uninit() */
cpu_set_t *cpu_present_set;
cpu_set_t *cpu_mask;
size_t cpu_present_setsize;
size_t cpu_mask_size;
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 78 |  | 
/*
 * One set of counter values for one CPU, chained into a
 * singly linked list through ->next.
 */
struct counters {
	/* per thread */
	unsigned long long tsc, aperf, mperf;
	unsigned long long c1;			/* per thread (calculated) */

	/* per core */
	unsigned long long c3, c6, c7;

	/* per package */
	unsigned long long pc2, pc3, pc6, pc7;

	unsigned long long extra_msr;		/* per thread */

	/* topology: package, core and CPU number */
	int pkg, core, cpu;

	struct counters *next;
};
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 97 |  | 
/*
 * Heads of the counter lists.
 * cnt_average is the summary entry: print_counters() prints it first and
 * print_cnt() leaves its topology columns blank.
 * NOTE(review): cnt_even/cnt_odd look like alternating sample lists and
 * cnt_delta their difference -- confirm against the main loop.
 */
struct counters *cnt_even, *cnt_odd;
struct counters *cnt_delta, *cnt_average;

/* tv_delta supplies the interval length used by print_cnt() */
struct timeval tv_even, tv_odd, tv_delta;
|  | 105 |  | 
| Len Brown | d15cf7c | 2012-06-03 23:24:00 -0400 | [diff] [blame] | 106 | int mark_cpu_present(int pkg, int core, int cpu) | 
|  | 107 | { | 
|  | 108 | CPU_SET_S(cpu, cpu_present_setsize, cpu_present_set); | 
|  | 109 | return 0; | 
|  | 110 | } | 
|  | 111 |  | 
| Len Brown | 88c3281 | 2012-03-29 21:44:40 -0400 | [diff] [blame] | 112 | /* | 
|  | 113 | * cpu_mask_init(ncpus) | 
|  | 114 | * | 
|  | 115 | * allocate and clear cpu_mask | 
|  | 116 | * set cpu_mask_size | 
|  | 117 | */ | 
|  | 118 | void cpu_mask_init(int ncpus) | 
|  | 119 | { | 
|  | 120 | cpu_mask = CPU_ALLOC(ncpus); | 
|  | 121 | if (cpu_mask == NULL) { | 
|  | 122 | perror("CPU_ALLOC"); | 
|  | 123 | exit(3); | 
|  | 124 | } | 
|  | 125 | cpu_mask_size = CPU_ALLOC_SIZE(ncpus); | 
|  | 126 | CPU_ZERO_S(cpu_mask_size, cpu_mask); | 
| Len Brown | d15cf7c | 2012-06-03 23:24:00 -0400 | [diff] [blame] | 127 |  | 
|  | 128 | /* | 
|  | 129 | * Allocate and initialize cpu_present_set | 
|  | 130 | */ | 
|  | 131 | cpu_present_set = CPU_ALLOC(ncpus); | 
|  | 132 | if (cpu_present_set == NULL) { | 
|  | 133 | perror("CPU_ALLOC"); | 
|  | 134 | exit(3); | 
|  | 135 | } | 
|  | 136 | cpu_present_setsize = CPU_ALLOC_SIZE(ncpus); | 
|  | 137 | CPU_ZERO_S(cpu_present_setsize, cpu_present_set); | 
|  | 138 | for_all_cpus(mark_cpu_present); | 
| Len Brown | 88c3281 | 2012-03-29 21:44:40 -0400 | [diff] [blame] | 139 | } | 
|  | 140 |  | 
|  | 141 | void cpu_mask_uninit() | 
|  | 142 | { | 
|  | 143 | CPU_FREE(cpu_mask); | 
|  | 144 | cpu_mask = NULL; | 
|  | 145 | cpu_mask_size = 0; | 
| Len Brown | d15cf7c | 2012-06-03 23:24:00 -0400 | [diff] [blame] | 146 | CPU_FREE(cpu_present_set); | 
|  | 147 | cpu_present_set = NULL; | 
|  | 148 | cpu_present_setsize = 0; | 
| Len Brown | 88c3281 | 2012-03-29 21:44:40 -0400 | [diff] [blame] | 149 | } | 
|  | 150 |  | 
|  | 151 | int cpu_migrate(int cpu) | 
|  | 152 | { | 
|  | 153 | CPU_ZERO_S(cpu_mask_size, cpu_mask); | 
|  | 154 | CPU_SET_S(cpu, cpu_mask_size, cpu_mask); | 
|  | 155 | if (sched_setaffinity(0, cpu_mask_size, cpu_mask) == -1) | 
|  | 156 | return -1; | 
|  | 157 | else | 
|  | 158 | return 0; | 
|  | 159 | } | 
|  | 160 |  | 
/*
 * get_msr(cpu, offset, msr)
 *
 * read sizeof(*msr) bytes at 'offset' from /dev/cpu/<cpu>/msr into *msr
 *
 * returns 0 on success
 * returns -1 if the path does not fit the buffer, the device cannot be
 * opened, or the read is short/failed; *msr is not meaningful then
 */
int get_msr(int cpu, off_t offset, unsigned long long *msr)
{
	char pathname[32];
	ssize_t retval;
	int len;
	int fd;

	/* bounded formatting: never write past pathname[] */
	len = snprintf(pathname, sizeof(pathname), "/dev/cpu/%d/msr", cpu);
	if (len < 0 || (size_t)len >= sizeof(pathname))
		return -1;

	fd = open(pathname, O_RDONLY);
	if (fd < 0)
		return -1;

	retval = pread(fd, msr, sizeof *msr, offset);
	close(fd);

	if (retval != (ssize_t)sizeof *msr)
		return -1;

	return 0;
}
|  | 180 |  | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 181 | void print_header(void) | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 182 | { | 
|  | 183 | if (show_pkg) | 
| Len Brown | d30c4b7 | 2011-07-31 18:19:33 -0400 | [diff] [blame] | 184 | fprintf(stderr, "pk"); | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 185 | if (show_pkg) | 
|  | 186 | fprintf(stderr, " "); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 187 | if (show_core) | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 188 | fprintf(stderr, "cor"); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 189 | if (show_cpu) | 
|  | 190 | fprintf(stderr, " CPU"); | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 191 | if (show_pkg || show_core || show_cpu) | 
|  | 192 | fprintf(stderr, " "); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 193 | if (do_nhm_cstates) | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 194 | fprintf(stderr, "   %%c0"); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 195 | if (has_aperf) | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 196 | fprintf(stderr, "  GHz"); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 197 | fprintf(stderr, "  TSC"); | 
|  | 198 | if (do_nhm_cstates) | 
| Len Brown | d30c4b7 | 2011-07-31 18:19:33 -0400 | [diff] [blame] | 199 | fprintf(stderr, "    %%c1"); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 200 | if (do_nhm_cstates) | 
| Len Brown | d30c4b7 | 2011-07-31 18:19:33 -0400 | [diff] [blame] | 201 | fprintf(stderr, "    %%c3"); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 202 | if (do_nhm_cstates) | 
| Len Brown | d30c4b7 | 2011-07-31 18:19:33 -0400 | [diff] [blame] | 203 | fprintf(stderr, "    %%c6"); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 204 | if (do_snb_cstates) | 
| Len Brown | d30c4b7 | 2011-07-31 18:19:33 -0400 | [diff] [blame] | 205 | fprintf(stderr, "    %%c7"); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 206 | if (do_snb_cstates) | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 207 | fprintf(stderr, "   %%pc2"); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 208 | if (do_nhm_cstates) | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 209 | fprintf(stderr, "   %%pc3"); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 210 | if (do_nhm_cstates) | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 211 | fprintf(stderr, "   %%pc6"); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 212 | if (do_snb_cstates) | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 213 | fprintf(stderr, "   %%pc7"); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 214 | if (extra_msr_offset) | 
| Len Brown | d30c4b7 | 2011-07-31 18:19:33 -0400 | [diff] [blame] | 215 | fprintf(stderr, "        MSR 0x%x ", extra_msr_offset); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 216 |  | 
|  | 217 | putc('\n', stderr); | 
|  | 218 | } | 
|  | 219 |  | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 220 | void dump_cnt(struct counters *cnt) | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 221 | { | 
| Len Brown | aeae1e9 | 2011-07-03 21:41:33 -0400 | [diff] [blame] | 222 | if (!cnt) | 
|  | 223 | return; | 
|  | 224 | if (cnt->pkg) fprintf(stderr, "package: %d ", cnt->pkg); | 
|  | 225 | if (cnt->core) fprintf(stderr, "core:: %d ", cnt->core); | 
|  | 226 | if (cnt->cpu) fprintf(stderr, "CPU: %d ", cnt->cpu); | 
|  | 227 | if (cnt->tsc) fprintf(stderr, "TSC: %016llX\n", cnt->tsc); | 
|  | 228 | if (cnt->c3) fprintf(stderr, "c3: %016llX\n", cnt->c3); | 
|  | 229 | if (cnt->c6) fprintf(stderr, "c6: %016llX\n", cnt->c6); | 
|  | 230 | if (cnt->c7) fprintf(stderr, "c7: %016llX\n", cnt->c7); | 
|  | 231 | if (cnt->aperf) fprintf(stderr, "aperf: %016llX\n", cnt->aperf); | 
|  | 232 | if (cnt->pc2) fprintf(stderr, "pc2: %016llX\n", cnt->pc2); | 
|  | 233 | if (cnt->pc3) fprintf(stderr, "pc3: %016llX\n", cnt->pc3); | 
|  | 234 | if (cnt->pc6) fprintf(stderr, "pc6: %016llX\n", cnt->pc6); | 
|  | 235 | if (cnt->pc7) fprintf(stderr, "pc7: %016llX\n", cnt->pc7); | 
|  | 236 | if (cnt->extra_msr) fprintf(stderr, "msr0x%x: %016llX\n", extra_msr_offset, cnt->extra_msr); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 237 | } | 
|  | 238 |  | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 239 | void dump_list(struct counters *cnt) | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 240 | { | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 241 | printf("dump_list 0x%p\n", cnt); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 242 |  | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 243 | for (; cnt; cnt = cnt->next) | 
|  | 244 | dump_cnt(cnt); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 245 | } | 
|  | 246 |  | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 247 | /* | 
|  | 248 | * column formatting convention & formats | 
|  | 249 | * package: "pk" 2 columns %2d | 
|  | 250 | * core: "cor" 3 columns %3d | 
|  | 251 | * CPU: "CPU" 3 columns %3d | 
|  | 252 | * GHz: "GHz" 3 columns %3.2 | 
|  | 253 | * TSC: "TSC" 3 columns %3.2 | 
|  | 254 | * percentage " %pc3" %6.2 | 
|  | 255 | */ | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 256 | void print_cnt(struct counters *p) | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 257 | { | 
|  | 258 | double interval_float; | 
|  | 259 |  | 
|  | 260 | interval_float = tv_delta.tv_sec + tv_delta.tv_usec/1000000.0; | 
|  | 261 |  | 
|  | 262 | /* topology columns, print blanks on 1st (average) line */ | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 263 | if (p == cnt_average) { | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 264 | if (show_pkg) | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 265 | fprintf(stderr, "  "); | 
|  | 266 | if (show_pkg && show_core) | 
| Len Brown | d30c4b7 | 2011-07-31 18:19:33 -0400 | [diff] [blame] | 267 | fprintf(stderr, " "); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 268 | if (show_core) | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 269 | fprintf(stderr, "   "); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 270 | if (show_cpu) | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 271 | fprintf(stderr, " " "   "); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 272 | } else { | 
|  | 273 | if (show_pkg) | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 274 | fprintf(stderr, "%2d", p->pkg); | 
|  | 275 | if (show_pkg && show_core) | 
|  | 276 | fprintf(stderr, " "); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 277 | if (show_core) | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 278 | fprintf(stderr, "%3d", p->core); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 279 | if (show_cpu) | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 280 | fprintf(stderr, " %3d", p->cpu); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 281 | } | 
|  | 282 |  | 
|  | 283 | /* %c0 */ | 
|  | 284 | if (do_nhm_cstates) { | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 285 | if (show_pkg || show_core || show_cpu) | 
|  | 286 | fprintf(stderr, " "); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 287 | if (!skip_c0) | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 288 | fprintf(stderr, "%6.2f", 100.0 * p->mperf/p->tsc); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 289 | else | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 290 | fprintf(stderr, "  ****"); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 291 | } | 
|  | 292 |  | 
|  | 293 | /* GHz */ | 
|  | 294 | if (has_aperf) { | 
|  | 295 | if (!aperf_mperf_unstable) { | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 296 | fprintf(stderr, " %3.2f", | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 297 | 1.0 * p->tsc / units * p->aperf / | 
|  | 298 | p->mperf / interval_float); | 
|  | 299 | } else { | 
|  | 300 | if (p->aperf > p->tsc || p->mperf > p->tsc) { | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 301 | fprintf(stderr, " ***"); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 302 | } else { | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 303 | fprintf(stderr, "%3.1f*", | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 304 | 1.0 * p->tsc / | 
|  | 305 | units * p->aperf / | 
|  | 306 | p->mperf / interval_float); | 
|  | 307 | } | 
|  | 308 | } | 
|  | 309 | } | 
|  | 310 |  | 
|  | 311 | /* TSC */ | 
|  | 312 | fprintf(stderr, "%5.2f", 1.0 * p->tsc/units/interval_float); | 
|  | 313 |  | 
|  | 314 | if (do_nhm_cstates) { | 
|  | 315 | if (!skip_c1) | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 316 | fprintf(stderr, " %6.2f", 100.0 * p->c1/p->tsc); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 317 | else | 
| Len Brown | d30c4b7 | 2011-07-31 18:19:33 -0400 | [diff] [blame] | 318 | fprintf(stderr, "  ****"); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 319 | } | 
|  | 320 | if (do_nhm_cstates) | 
| Len Brown | d30c4b7 | 2011-07-31 18:19:33 -0400 | [diff] [blame] | 321 | fprintf(stderr, " %6.2f", 100.0 * p->c3/p->tsc); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 322 | if (do_nhm_cstates) | 
| Len Brown | d30c4b7 | 2011-07-31 18:19:33 -0400 | [diff] [blame] | 323 | fprintf(stderr, " %6.2f", 100.0 * p->c6/p->tsc); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 324 | if (do_snb_cstates) | 
| Len Brown | d30c4b7 | 2011-07-31 18:19:33 -0400 | [diff] [blame] | 325 | fprintf(stderr, " %6.2f", 100.0 * p->c7/p->tsc); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 326 | if (do_snb_cstates) | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 327 | fprintf(stderr, " %6.2f", 100.0 * p->pc2/p->tsc); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 328 | if (do_nhm_cstates) | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 329 | fprintf(stderr, " %6.2f", 100.0 * p->pc3/p->tsc); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 330 | if (do_nhm_cstates) | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 331 | fprintf(stderr, " %6.2f", 100.0 * p->pc6/p->tsc); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 332 | if (do_snb_cstates) | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 333 | fprintf(stderr, " %6.2f", 100.0 * p->pc7/p->tsc); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 334 | if (extra_msr_offset) | 
|  | 335 | fprintf(stderr, "  0x%016llx", p->extra_msr); | 
|  | 336 | putc('\n', stderr); | 
|  | 337 | } | 
|  | 338 |  | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 339 | void print_counters(struct counters *counters) | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 340 | { | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 341 | struct counters *cnt; | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 342 | static int printed; | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 343 |  | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 344 |  | 
|  | 345 | if (!printed || !summary_only) | 
|  | 346 | print_header(); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 347 |  | 
|  | 348 | if (num_cpus > 1) | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 349 | print_cnt(cnt_average); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 350 |  | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 351 | printed = 1; | 
|  | 352 |  | 
|  | 353 | if (summary_only) | 
|  | 354 | return; | 
|  | 355 |  | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 356 | for (cnt = counters; cnt != NULL; cnt = cnt->next) | 
|  | 357 | print_cnt(cnt); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 358 |  | 
|  | 359 | } | 
|  | 360 |  | 
/*
 * SUBTRACT_COUNTER(after, before, delta)
 *
 * Store (after - before) in delta.  The expression evaluates to
 * non-zero when before > after, i.e. the counter went backwards.
 * Every argument is parenthesized so compound expressions are safe;
 * after and before are evaluated twice, so avoid side effects.
 */
#define SUBTRACT_COUNTER(after, before, delta) \
	((delta) = ((after) - (before)), ((before) > (after)))
|  | 362 |  | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 363 | int compute_delta(struct counters *after, | 
|  | 364 | struct counters *before, struct counters *delta) | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 365 | { | 
|  | 366 | int errors = 0; | 
|  | 367 | int perf_err = 0; | 
|  | 368 |  | 
|  | 369 | skip_c0 = skip_c1 = 0; | 
|  | 370 |  | 
|  | 371 | for ( ; after && before && delta; | 
|  | 372 | after = after->next, before = before->next, delta = delta->next) { | 
|  | 373 | if (before->cpu != after->cpu) { | 
|  | 374 | printf("cpu configuration changed: %d != %d\n", | 
|  | 375 | before->cpu, after->cpu); | 
|  | 376 | return -1; | 
|  | 377 | } | 
|  | 378 |  | 
|  | 379 | if (SUBTRACT_COUNTER(after->tsc, before->tsc, delta->tsc)) { | 
|  | 380 | fprintf(stderr, "cpu%d TSC went backwards %llX to %llX\n", | 
|  | 381 | before->cpu, before->tsc, after->tsc); | 
|  | 382 | errors++; | 
|  | 383 | } | 
|  | 384 | /* check for TSC < 1 Mcycles over interval */ | 
|  | 385 | if (delta->tsc < (1000 * 1000)) { | 
|  | 386 | fprintf(stderr, "Insanely slow TSC rate," | 
|  | 387 | " TSC stops in idle?\n"); | 
|  | 388 | fprintf(stderr, "You can disable all c-states" | 
|  | 389 | " by booting with \"idle=poll\"\n"); | 
|  | 390 | fprintf(stderr, "or just the deep ones with" | 
|  | 391 | " \"processor.max_cstate=1\"\n"); | 
|  | 392 | exit(-3); | 
|  | 393 | } | 
|  | 394 | if (SUBTRACT_COUNTER(after->c3, before->c3, delta->c3)) { | 
|  | 395 | fprintf(stderr, "cpu%d c3 counter went backwards %llX to %llX\n", | 
|  | 396 | before->cpu, before->c3, after->c3); | 
|  | 397 | errors++; | 
|  | 398 | } | 
|  | 399 | if (SUBTRACT_COUNTER(after->c6, before->c6, delta->c6)) { | 
|  | 400 | fprintf(stderr, "cpu%d c6 counter went backwards %llX to %llX\n", | 
|  | 401 | before->cpu, before->c6, after->c6); | 
|  | 402 | errors++; | 
|  | 403 | } | 
|  | 404 | if (SUBTRACT_COUNTER(after->c7, before->c7, delta->c7)) { | 
|  | 405 | fprintf(stderr, "cpu%d c7 counter went backwards %llX to %llX\n", | 
|  | 406 | before->cpu, before->c7, after->c7); | 
|  | 407 | errors++; | 
|  | 408 | } | 
|  | 409 | if (SUBTRACT_COUNTER(after->pc2, before->pc2, delta->pc2)) { | 
|  | 410 | fprintf(stderr, "cpu%d pc2 counter went backwards %llX to %llX\n", | 
|  | 411 | before->cpu, before->pc2, after->pc2); | 
|  | 412 | errors++; | 
|  | 413 | } | 
|  | 414 | if (SUBTRACT_COUNTER(after->pc3, before->pc3, delta->pc3)) { | 
|  | 415 | fprintf(stderr, "cpu%d pc3 counter went backwards %llX to %llX\n", | 
|  | 416 | before->cpu, before->pc3, after->pc3); | 
|  | 417 | errors++; | 
|  | 418 | } | 
|  | 419 | if (SUBTRACT_COUNTER(after->pc6, before->pc6, delta->pc6)) { | 
|  | 420 | fprintf(stderr, "cpu%d pc6 counter went backwards %llX to %llX\n", | 
|  | 421 | before->cpu, before->pc6, after->pc6); | 
|  | 422 | errors++; | 
|  | 423 | } | 
|  | 424 | if (SUBTRACT_COUNTER(after->pc7, before->pc7, delta->pc7)) { | 
|  | 425 | fprintf(stderr, "cpu%d pc7 counter went backwards %llX to %llX\n", | 
|  | 426 | before->cpu, before->pc7, after->pc7); | 
|  | 427 | errors++; | 
|  | 428 | } | 
|  | 429 |  | 
|  | 430 | perf_err = SUBTRACT_COUNTER(after->aperf, before->aperf, delta->aperf); | 
|  | 431 | if (perf_err) { | 
|  | 432 | fprintf(stderr, "cpu%d aperf counter went backwards %llX to %llX\n", | 
|  | 433 | before->cpu, before->aperf, after->aperf); | 
|  | 434 | } | 
|  | 435 | perf_err |= SUBTRACT_COUNTER(after->mperf, before->mperf, delta->mperf); | 
|  | 436 | if (perf_err) { | 
|  | 437 | fprintf(stderr, "cpu%d mperf counter went backwards %llX to %llX\n", | 
|  | 438 | before->cpu, before->mperf, after->mperf); | 
|  | 439 | } | 
|  | 440 | if (perf_err) { | 
|  | 441 | if (!aperf_mperf_unstable) { | 
|  | 442 | fprintf(stderr, "%s: APERF or MPERF went backwards *\n", progname); | 
|  | 443 | fprintf(stderr, "* Frequency results do not cover entire interval *\n"); | 
|  | 444 | fprintf(stderr, "* fix this by running Linux-2.6.30 or later *\n"); | 
|  | 445 |  | 
|  | 446 | aperf_mperf_unstable = 1; | 
|  | 447 | } | 
|  | 448 | /* | 
|  | 449 | * mperf delta is likely a huge "positive" number | 
|  | 450 | * can not use it for calculating c0 time | 
|  | 451 | */ | 
|  | 452 | skip_c0 = 1; | 
|  | 453 | skip_c1 = 1; | 
|  | 454 | } | 
|  | 455 |  | 
|  | 456 | /* | 
|  | 457 | * As mperf and tsc collection are not atomic, | 
|  | 458 | * it is possible for mperf's non-halted cycles | 
|  | 459 | * to exceed TSC's all cycles: show c1 = 0% in that case. | 
|  | 460 | */ | 
|  | 461 | if (delta->mperf > delta->tsc) | 
|  | 462 | delta->c1 = 0; | 
|  | 463 | else /* normal case, derive c1 */ | 
|  | 464 | delta->c1 = delta->tsc - delta->mperf | 
|  | 465 | - delta->c3 - delta->c6 - delta->c7; | 
|  | 466 |  | 
|  | 467 | if (delta->mperf == 0) | 
|  | 468 | delta->mperf = 1;	/* divide by 0 protection */ | 
|  | 469 |  | 
|  | 470 | /* | 
|  | 471 | * for "extra msr", just copy the latest w/o subtracting | 
|  | 472 | */ | 
|  | 473 | delta->extra_msr = after->extra_msr; | 
|  | 474 | if (errors) { | 
|  | 475 | fprintf(stderr, "ERROR cpu%d before:\n", before->cpu); | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 476 | dump_cnt(before); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 477 | fprintf(stderr, "ERROR cpu%d after:\n", before->cpu); | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 478 | dump_cnt(after); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 479 | errors = 0; | 
|  | 480 | } | 
|  | 481 | } | 
|  | 482 | return 0; | 
|  | 483 | } | 
|  | 484 |  | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 485 | void compute_average(struct counters *delta, struct counters *avg) | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 486 | { | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 487 | struct counters *sum; | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 488 |  | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 489 | sum = calloc(1, sizeof(struct counters)); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 490 | if (sum == NULL) { | 
|  | 491 | perror("calloc sum"); | 
|  | 492 | exit(1); | 
|  | 493 | } | 
|  | 494 |  | 
|  | 495 | for (; delta; delta = delta->next) { | 
|  | 496 | sum->tsc += delta->tsc; | 
|  | 497 | sum->c1 += delta->c1; | 
|  | 498 | sum->c3 += delta->c3; | 
|  | 499 | sum->c6 += delta->c6; | 
|  | 500 | sum->c7 += delta->c7; | 
|  | 501 | sum->aperf += delta->aperf; | 
|  | 502 | sum->mperf += delta->mperf; | 
|  | 503 | sum->pc2 += delta->pc2; | 
|  | 504 | sum->pc3 += delta->pc3; | 
|  | 505 | sum->pc6 += delta->pc6; | 
|  | 506 | sum->pc7 += delta->pc7; | 
|  | 507 | } | 
|  | 508 | avg->tsc = sum->tsc/num_cpus; | 
|  | 509 | avg->c1 = sum->c1/num_cpus; | 
|  | 510 | avg->c3 = sum->c3/num_cpus; | 
|  | 511 | avg->c6 = sum->c6/num_cpus; | 
|  | 512 | avg->c7 = sum->c7/num_cpus; | 
|  | 513 | avg->aperf = sum->aperf/num_cpus; | 
|  | 514 | avg->mperf = sum->mperf/num_cpus; | 
|  | 515 | avg->pc2 = sum->pc2/num_cpus; | 
|  | 516 | avg->pc3 = sum->pc3/num_cpus; | 
|  | 517 | avg->pc6 = sum->pc6/num_cpus; | 
|  | 518 | avg->pc7 = sum->pc7/num_cpus; | 
|  | 519 |  | 
|  | 520 | free(sum); | 
|  | 521 | } | 
|  | 522 |  | 
| Len Brown | 15aaa34 | 2012-03-29 22:19:58 -0400 | [diff] [blame] | 523 | int get_counters(struct counters *cnt) | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 524 | { | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 525 | for ( ; cnt; cnt = cnt->next) { | 
| Len Brown | 15aaa34 | 2012-03-29 22:19:58 -0400 | [diff] [blame] | 526 |  | 
|  | 527 | if (cpu_migrate(cnt->cpu)) | 
|  | 528 | return -1; | 
|  | 529 |  | 
|  | 530 | if (get_msr(cnt->cpu, MSR_TSC, &cnt->tsc)) | 
|  | 531 | return -1; | 
|  | 532 |  | 
|  | 533 | if (has_aperf) { | 
|  | 534 | if (get_msr(cnt->cpu, MSR_APERF, &cnt->aperf)) | 
|  | 535 | return -1; | 
|  | 536 | if (get_msr(cnt->cpu, MSR_MPERF, &cnt->mperf)) | 
|  | 537 | return -1; | 
| Len Brown | 88c3281 | 2012-03-29 21:44:40 -0400 | [diff] [blame] | 538 | } | 
|  | 539 |  | 
| Len Brown | 15aaa34 | 2012-03-29 22:19:58 -0400 | [diff] [blame] | 540 | if (do_nhm_cstates) { | 
|  | 541 | if (get_msr(cnt->cpu, MSR_CORE_C3_RESIDENCY, &cnt->c3)) | 
|  | 542 | return -1; | 
|  | 543 | if (get_msr(cnt->cpu, MSR_CORE_C6_RESIDENCY, &cnt->c6)) | 
|  | 544 | return -1; | 
|  | 545 | } | 
|  | 546 |  | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 547 | if (do_snb_cstates) | 
| Len Brown | 15aaa34 | 2012-03-29 22:19:58 -0400 | [diff] [blame] | 548 | if (get_msr(cnt->cpu, MSR_CORE_C7_RESIDENCY, &cnt->c7)) | 
|  | 549 | return -1; | 
|  | 550 |  | 
|  | 551 | if (do_nhm_cstates) { | 
|  | 552 | if (get_msr(cnt->cpu, MSR_PKG_C3_RESIDENCY, &cnt->pc3)) | 
|  | 553 | return -1; | 
|  | 554 | if (get_msr(cnt->cpu, MSR_PKG_C6_RESIDENCY, &cnt->pc6)) | 
|  | 555 | return -1; | 
|  | 556 | } | 
|  | 557 | if (do_snb_cstates) { | 
|  | 558 | if (get_msr(cnt->cpu, MSR_PKG_C2_RESIDENCY, &cnt->pc2)) | 
|  | 559 | return -1; | 
|  | 560 | if (get_msr(cnt->cpu, MSR_PKG_C7_RESIDENCY, &cnt->pc7)) | 
|  | 561 | return -1; | 
|  | 562 | } | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 563 | if (extra_msr_offset) | 
| Len Brown | 15aaa34 | 2012-03-29 22:19:58 -0400 | [diff] [blame] | 564 | if (get_msr(cnt->cpu, extra_msr_offset, &cnt->extra_msr)) | 
|  | 565 | return -1; | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 566 | } | 
| Len Brown | 15aaa34 | 2012-03-29 22:19:58 -0400 | [diff] [blame] | 567 | return 0; | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 568 | } | 
|  | 569 |  | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 570 | void print_nehalem_info(void) | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 571 | { | 
|  | 572 | unsigned long long msr; | 
|  | 573 | unsigned int ratio; | 
|  | 574 |  | 
|  | 575 | if (!do_nehalem_platform_info) | 
|  | 576 | return; | 
|  | 577 |  | 
| Len Brown | 15aaa34 | 2012-03-29 22:19:58 -0400 | [diff] [blame] | 578 | get_msr(0, MSR_NEHALEM_PLATFORM_INFO, &msr); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 579 |  | 
|  | 580 | ratio = (msr >> 40) & 0xFF; | 
|  | 581 | fprintf(stderr, "%d * %.0f = %.0f MHz max efficiency\n", | 
|  | 582 | ratio, bclk, ratio * bclk); | 
|  | 583 |  | 
|  | 584 | ratio = (msr >> 8) & 0xFF; | 
|  | 585 | fprintf(stderr, "%d * %.0f = %.0f MHz TSC frequency\n", | 
|  | 586 | ratio, bclk, ratio * bclk); | 
|  | 587 |  | 
|  | 588 | if (verbose > 1) | 
|  | 589 | fprintf(stderr, "MSR_NEHALEM_PLATFORM_INFO: 0x%llx\n", msr); | 
|  | 590 |  | 
|  | 591 | if (!do_nehalem_turbo_ratio_limit) | 
|  | 592 | return; | 
|  | 593 |  | 
| Len Brown | 15aaa34 | 2012-03-29 22:19:58 -0400 | [diff] [blame] | 594 | get_msr(0, MSR_NEHALEM_TURBO_RATIO_LIMIT, &msr); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 595 |  | 
|  | 596 | ratio = (msr >> 24) & 0xFF; | 
|  | 597 | if (ratio) | 
|  | 598 | fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 4 active cores\n", | 
|  | 599 | ratio, bclk, ratio * bclk); | 
|  | 600 |  | 
|  | 601 | ratio = (msr >> 16) & 0xFF; | 
|  | 602 | if (ratio) | 
|  | 603 | fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 3 active cores\n", | 
|  | 604 | ratio, bclk, ratio * bclk); | 
|  | 605 |  | 
|  | 606 | ratio = (msr >> 8) & 0xFF; | 
|  | 607 | if (ratio) | 
|  | 608 | fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 2 active cores\n", | 
|  | 609 | ratio, bclk, ratio * bclk); | 
|  | 610 |  | 
|  | 611 | ratio = (msr >> 0) & 0xFF; | 
|  | 612 | if (ratio) | 
|  | 613 | fprintf(stderr, "%d * %.0f = %.0f MHz max turbo 1 active cores\n", | 
|  | 614 | ratio, bclk, ratio * bclk); | 
|  | 615 |  | 
|  | 616 | } | 
|  | 617 |  | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 618 | void free_counter_list(struct counters *list) | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 619 | { | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 620 | struct counters *p; | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 621 |  | 
|  | 622 | for (p = list; p; ) { | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 623 | struct counters *free_me; | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 624 |  | 
|  | 625 | free_me = p; | 
|  | 626 | p = p->next; | 
|  | 627 | free(free_me); | 
|  | 628 | } | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 629 | } | 
|  | 630 |  | 
|  | 631 | void free_all_counters(void) | 
|  | 632 | { | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 633 | free_counter_list(cnt_even); | 
|  | 634 | cnt_even = NULL; | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 635 |  | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 636 | free_counter_list(cnt_odd); | 
|  | 637 | cnt_odd = NULL; | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 638 |  | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 639 | free_counter_list(cnt_delta); | 
|  | 640 | cnt_delta = NULL; | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 641 |  | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 642 | free_counter_list(cnt_average); | 
|  | 643 | cnt_average = NULL; | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 644 | } | 
|  | 645 |  | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 646 | void insert_counters(struct counters **list, | 
|  | 647 | struct counters *new) | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 648 | { | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 649 | struct counters *prev; | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 650 |  | 
|  | 651 | /* | 
|  | 652 | * list was empty | 
|  | 653 | */ | 
|  | 654 | if (*list == NULL) { | 
|  | 655 | new->next = *list; | 
|  | 656 | *list = new; | 
|  | 657 | return; | 
|  | 658 | } | 
|  | 659 |  | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 660 | if (!summary_only) | 
|  | 661 | show_cpu = 1;	/* there is more than one CPU */ | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 662 |  | 
|  | 663 | /* | 
|  | 664 | * insert on front of list. | 
|  | 665 | * It is sorted by ascending package#, core#, cpu# | 
|  | 666 | */ | 
|  | 667 | if (((*list)->pkg > new->pkg) || | 
|  | 668 | (((*list)->pkg == new->pkg) && ((*list)->core > new->core)) || | 
|  | 669 | (((*list)->pkg == new->pkg) && ((*list)->core == new->core) && ((*list)->cpu > new->cpu))) { | 
|  | 670 | new->next = *list; | 
|  | 671 | *list = new; | 
|  | 672 | return; | 
|  | 673 | } | 
|  | 674 |  | 
|  | 675 | prev = *list; | 
|  | 676 |  | 
|  | 677 | while (prev->next && (prev->next->pkg < new->pkg)) { | 
|  | 678 | prev = prev->next; | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 679 | if (!summary_only) | 
|  | 680 | show_pkg = 1;	/* there is more than 1 package */ | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 681 | } | 
|  | 682 |  | 
|  | 683 | while (prev->next && (prev->next->pkg == new->pkg) | 
|  | 684 | && (prev->next->core < new->core)) { | 
|  | 685 | prev = prev->next; | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 686 | if (!summary_only) | 
|  | 687 | show_core = 1;	/* there is more than 1 core */ | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 688 | } | 
|  | 689 |  | 
|  | 690 | while (prev->next && (prev->next->pkg == new->pkg) | 
|  | 691 | && (prev->next->core == new->core) | 
|  | 692 | && (prev->next->cpu < new->cpu)) { | 
|  | 693 | prev = prev->next; | 
|  | 694 | } | 
|  | 695 |  | 
|  | 696 | /* | 
|  | 697 | * insert after "prev" | 
|  | 698 | */ | 
|  | 699 | new->next = prev->next; | 
|  | 700 | prev->next = new; | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 701 | } | 
|  | 702 |  | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 703 | void alloc_new_counters(int pkg, int core, int cpu) | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 704 | { | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 705 | struct counters *new; | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 706 |  | 
|  | 707 | if (verbose > 1) | 
|  | 708 | printf("pkg%d core%d, cpu%d\n", pkg, core, cpu); | 
|  | 709 |  | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 710 | new = (struct counters *)calloc(1, sizeof(struct counters)); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 711 | if (new == NULL) { | 
|  | 712 | perror("calloc"); | 
|  | 713 | exit(1); | 
|  | 714 | } | 
|  | 715 | new->pkg = pkg; | 
|  | 716 | new->core = core; | 
|  | 717 | new->cpu = cpu; | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 718 | insert_counters(&cnt_odd, new); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 719 |  | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 720 | new = (struct counters *)calloc(1, | 
|  | 721 | sizeof(struct counters)); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 722 | if (new == NULL) { | 
|  | 723 | perror("calloc"); | 
|  | 724 | exit(1); | 
|  | 725 | } | 
|  | 726 | new->pkg = pkg; | 
|  | 727 | new->core = core; | 
|  | 728 | new->cpu = cpu; | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 729 | insert_counters(&cnt_even, new); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 730 |  | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 731 | new = (struct counters *)calloc(1, sizeof(struct counters)); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 732 | if (new == NULL) { | 
|  | 733 | perror("calloc"); | 
|  | 734 | exit(1); | 
|  | 735 | } | 
|  | 736 | new->pkg = pkg; | 
|  | 737 | new->core = core; | 
|  | 738 | new->cpu = cpu; | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 739 | insert_counters(&cnt_delta, new); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 740 |  | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 741 | new = (struct counters *)calloc(1, sizeof(struct counters)); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 742 | if (new == NULL) { | 
|  | 743 | perror("calloc"); | 
|  | 744 | exit(1); | 
|  | 745 | } | 
|  | 746 | new->pkg = pkg; | 
|  | 747 | new->core = core; | 
|  | 748 | new->cpu = cpu; | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 749 | cnt_average = new; | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 750 | } | 
|  | 751 |  | 
/*
 * Return the physical package id that sysfs reports for "cpu".
 *
 * Exits the program if the topology file cannot be opened or does not
 * contain an integer, instead of returning an uninitialized value.
 */
int get_physical_package_id(int cpu)
{
	char path[80];	/* fixed text plus any int value fits with room to spare */
	FILE *filep;
	int pkg;

	snprintf(path, sizeof(path),
		"/sys/devices/system/cpu/cpu%d/topology/physical_package_id", cpu);
	filep = fopen(path, "r");
	if (filep == NULL) {
		perror(path);
		exit(1);
	}
	if (fscanf(filep, "%d", &pkg) != 1) {
		fprintf(stderr, "%s: could not parse package id\n", path);
		exit(1);
	}
	fclose(filep);
	return pkg;
}
|  | 768 |  | 
/*
 * Return the core id that sysfs reports for "cpu".
 *
 * Exits the program if the topology file cannot be opened or does not
 * contain an integer, instead of returning an uninitialized value.
 */
int get_core_id(int cpu)
{
	char path[80];	/* fixed text plus any int value fits with room to spare */
	FILE *filep;
	int core;

	snprintf(path, sizeof(path),
		"/sys/devices/system/cpu/cpu%d/topology/core_id", cpu);
	filep = fopen(path, "r");
	if (filep == NULL) {
		perror(path);
		exit(1);
	}
	if (fscanf(filep, "%d", &core) != 1) {
		fprintf(stderr, "%s: could not parse core id\n", path);
		exit(1);
	}
	fclose(filep);
	return core;
}
|  | 785 |  | 
|  | 786 | /* | 
| Len Brown | 15aaa34 | 2012-03-29 22:19:58 -0400 | [diff] [blame] | 787 | * run func(pkg, core, cpu) on every cpu in /proc/stat | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 788 | */ | 
|  | 789 |  | 
|  | 790 | int for_all_cpus(void (func)(int, int, int)) | 
|  | 791 | { | 
|  | 792 | FILE *fp; | 
|  | 793 | int cpu_count; | 
|  | 794 | int retval; | 
|  | 795 |  | 
|  | 796 | fp = fopen(proc_stat, "r"); | 
|  | 797 | if (fp == NULL) { | 
|  | 798 | perror(proc_stat); | 
|  | 799 | exit(1); | 
|  | 800 | } | 
|  | 801 |  | 
|  | 802 | retval = fscanf(fp, "cpu %*d %*d %*d %*d %*d %*d %*d %*d %*d %*d\n"); | 
|  | 803 | if (retval != 0) { | 
|  | 804 | perror("/proc/stat format"); | 
|  | 805 | exit(1); | 
|  | 806 | } | 
|  | 807 |  | 
|  | 808 | for (cpu_count = 0; ; cpu_count++) { | 
|  | 809 | int cpu; | 
|  | 810 |  | 
|  | 811 | retval = fscanf(fp, "cpu%u %*d %*d %*d %*d %*d %*d %*d %*d %*d %*d\n", &cpu); | 
|  | 812 | if (retval != 1) | 
|  | 813 | break; | 
|  | 814 |  | 
|  | 815 | func(get_physical_package_id(cpu), get_core_id(cpu), cpu); | 
|  | 816 | } | 
|  | 817 | fclose(fp); | 
|  | 818 | return cpu_count; | 
|  | 819 | } | 
|  | 820 |  | 
|  | 821 | void re_initialize(void) | 
|  | 822 | { | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 823 | free_all_counters(); | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 824 | num_cpus = for_all_cpus(alloc_new_counters); | 
| Len Brown | 88c3281 | 2012-03-29 21:44:40 -0400 | [diff] [blame] | 825 | cpu_mask_uninit(); | 
|  | 826 | cpu_mask_init(num_cpus); | 
| Len Brown | 15aaa34 | 2012-03-29 22:19:58 -0400 | [diff] [blame] | 827 | printf("turbostat: re-initialized with num_cpus %d\n", num_cpus); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 828 | } | 
|  | 829 |  | 
/*
 * Do-nothing callback with the for_all_cpus() signature; verify_num_cpus()
 * passes it when only the cpu count is wanted.
 */
void dummy(int pkg, int core, int cpu)
{
	(void)pkg;
	(void)core;
	(void)cpu;
}
|  | 831 | /* | 
|  | 832 | * check to see if a cpu came on-line | 
|  | 833 | */ | 
| Len Brown | 15aaa34 | 2012-03-29 22:19:58 -0400 | [diff] [blame] | 834 | int verify_num_cpus(void) | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 835 | { | 
|  | 836 | int new_num_cpus; | 
|  | 837 |  | 
|  | 838 | new_num_cpus = for_all_cpus(dummy); | 
|  | 839 |  | 
|  | 840 | if (new_num_cpus != num_cpus) { | 
|  | 841 | if (verbose) | 
|  | 842 | printf("num_cpus was %d, is now  %d\n", | 
|  | 843 | num_cpus, new_num_cpus); | 
| Len Brown | 15aaa34 | 2012-03-29 22:19:58 -0400 | [diff] [blame] | 844 | return -1; | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 845 | } | 
| Len Brown | 15aaa34 | 2012-03-29 22:19:58 -0400 | [diff] [blame] | 846 | return 0; | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 847 | } | 
|  | 848 |  | 
|  | 849 | void turbostat_loop() | 
|  | 850 | { | 
|  | 851 | restart: | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 852 | get_counters(cnt_even); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 853 | gettimeofday(&tv_even, (struct timezone *)NULL); | 
|  | 854 |  | 
|  | 855 | while (1) { | 
| Len Brown | 15aaa34 | 2012-03-29 22:19:58 -0400 | [diff] [blame] | 856 | if (verify_num_cpus()) { | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 857 | re_initialize(); | 
|  | 858 | goto restart; | 
|  | 859 | } | 
|  | 860 | sleep(interval_sec); | 
| Len Brown | 15aaa34 | 2012-03-29 22:19:58 -0400 | [diff] [blame] | 861 | if (get_counters(cnt_odd)) { | 
|  | 862 | re_initialize(); | 
|  | 863 | goto restart; | 
|  | 864 | } | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 865 | gettimeofday(&tv_odd, (struct timezone *)NULL); | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 866 | compute_delta(cnt_odd, cnt_even, cnt_delta); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 867 | timersub(&tv_odd, &tv_even, &tv_delta); | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 868 | compute_average(cnt_delta, cnt_average); | 
|  | 869 | print_counters(cnt_delta); | 
| Len Brown | 15aaa34 | 2012-03-29 22:19:58 -0400 | [diff] [blame] | 870 | sleep(interval_sec); | 
|  | 871 | if (get_counters(cnt_even)) { | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 872 | re_initialize(); | 
|  | 873 | goto restart; | 
|  | 874 | } | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 875 | gettimeofday(&tv_even, (struct timezone *)NULL); | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 876 | compute_delta(cnt_even, cnt_odd, cnt_delta); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 877 | timersub(&tv_even, &tv_odd, &tv_delta); | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 878 | compute_average(cnt_delta, cnt_average); | 
|  | 879 | print_counters(cnt_delta); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 880 | } | 
|  | 881 | } | 
|  | 882 |  | 
/*
 * Make sure the msr device node for cpu0 exists; otherwise print a hint
 * about loading the msr module and exit with status -5.
 */
void check_dev_msr()
{
	struct stat sb;

	if (stat("/dev/cpu/0/msr", &sb) == 0)
		return;

	fprintf(stderr, "no /dev/cpu/0/msr\n");
	fprintf(stderr, "Try \"# modprobe msr\"\n");
	exit(-5);
}
|  | 893 |  | 
/*
 * Exit with status -6 unless the real user id of the process is 0.
 */
void check_super_user()
{
	if (getuid() == 0)
		return;

	fprintf(stderr, "must be root\n");
	exit(-6);
}
|  | 901 |  | 
|  | 902 | int has_nehalem_turbo_ratio_limit(unsigned int family, unsigned int model) | 
|  | 903 | { | 
|  | 904 | if (!genuine_intel) | 
|  | 905 | return 0; | 
|  | 906 |  | 
|  | 907 | if (family != 6) | 
|  | 908 | return 0; | 
|  | 909 |  | 
|  | 910 | switch (model) { | 
|  | 911 | case 0x1A:	/* Core i7, Xeon 5500 series - Bloomfield, Gainstown NHM-EP */ | 
|  | 912 | case 0x1E:	/* Core i7 and i5 Processor - Clarksfield, Lynnfield, Jasper Forest */ | 
|  | 913 | case 0x1F:	/* Core i7 and i5 Processor - Nehalem */ | 
|  | 914 | case 0x25:	/* Westmere Client - Clarkdale, Arrandale */ | 
|  | 915 | case 0x2C:	/* Westmere EP - Gulftown */ | 
|  | 916 | case 0x2A:	/* SNB */ | 
|  | 917 | case 0x2D:	/* SNB Xeon */ | 
| Len Brown | 553575f | 2011-11-18 03:32:01 -0500 | [diff] [blame] | 918 | case 0x3A:	/* IVB */ | 
|  | 919 | case 0x3D:	/* IVB Xeon */ | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 920 | return 1; | 
|  | 921 | case 0x2E:	/* Nehalem-EX Xeon - Beckton */ | 
|  | 922 | case 0x2F:	/* Westmere-EX Xeon - Eagleton */ | 
|  | 923 | default: | 
|  | 924 | return 0; | 
|  | 925 | } | 
|  | 926 | } | 
|  | 927 |  | 
|  | 928 | int is_snb(unsigned int family, unsigned int model) | 
|  | 929 | { | 
|  | 930 | if (!genuine_intel) | 
|  | 931 | return 0; | 
|  | 932 |  | 
|  | 933 | switch (model) { | 
|  | 934 | case 0x2A: | 
|  | 935 | case 0x2D: | 
| Len Brown | 650a37f | 2012-06-03 23:34:44 -0400 | [diff] [blame] | 936 | case 0x3A:	/* IVB */ | 
|  | 937 | case 0x3D:	/* IVB Xeon */ | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 938 | return 1; | 
|  | 939 | } | 
|  | 940 | return 0; | 
|  | 941 | } | 
|  | 942 |  | 
/*
 * Return the base clock in MHz used to turn ratios into frequencies:
 * 100.00 for models accepted by is_snb(), 133.33 for everything else.
 */
double discover_bclk(unsigned int family, unsigned int model)
{
	return is_snb(family, model) ? 100.00 : 133.33;
}
|  | 950 |  | 
|  | 951 | void check_cpuid() | 
|  | 952 | { | 
|  | 953 | unsigned int eax, ebx, ecx, edx, max_level; | 
|  | 954 | unsigned int fms, family, model, stepping; | 
|  | 955 |  | 
|  | 956 | eax = ebx = ecx = edx = 0; | 
|  | 957 |  | 
|  | 958 | asm("cpuid" : "=a" (max_level), "=b" (ebx), "=c" (ecx), "=d" (edx) : "a" (0)); | 
|  | 959 |  | 
|  | 960 | if (ebx == 0x756e6547 && edx == 0x49656e69 && ecx == 0x6c65746e) | 
|  | 961 | genuine_intel = 1; | 
|  | 962 |  | 
|  | 963 | if (verbose) | 
|  | 964 | fprintf(stderr, "%.4s%.4s%.4s ", | 
|  | 965 | (char *)&ebx, (char *)&edx, (char *)&ecx); | 
|  | 966 |  | 
|  | 967 | asm("cpuid" : "=a" (fms), "=c" (ecx), "=d" (edx) : "a" (1) : "ebx"); | 
|  | 968 | family = (fms >> 8) & 0xf; | 
|  | 969 | model = (fms >> 4) & 0xf; | 
|  | 970 | stepping = fms & 0xf; | 
|  | 971 | if (family == 6 || family == 0xf) | 
|  | 972 | model += ((fms >> 16) & 0xf) << 4; | 
|  | 973 |  | 
|  | 974 | if (verbose) | 
|  | 975 | fprintf(stderr, "%d CPUID levels; family:model:stepping 0x%x:%x:%x (%d:%d:%d)\n", | 
|  | 976 | max_level, family, model, stepping, family, model, stepping); | 
|  | 977 |  | 
|  | 978 | if (!(edx & (1 << 5))) { | 
|  | 979 | fprintf(stderr, "CPUID: no MSR\n"); | 
|  | 980 | exit(1); | 
|  | 981 | } | 
|  | 982 |  | 
|  | 983 | /* | 
|  | 984 | * check max extended function levels of CPUID. | 
|  | 985 | * This is needed to check for invariant TSC. | 
|  | 986 | * This check is valid for both Intel and AMD. | 
|  | 987 | */ | 
|  | 988 | ebx = ecx = edx = 0; | 
|  | 989 | asm("cpuid" : "=a" (max_level), "=b" (ebx), "=c" (ecx), "=d" (edx) : "a" (0x80000000)); | 
|  | 990 |  | 
|  | 991 | if (max_level < 0x80000007) { | 
|  | 992 | fprintf(stderr, "CPUID: no invariant TSC (max_level 0x%x)\n", max_level); | 
|  | 993 | exit(1); | 
|  | 994 | } | 
|  | 995 |  | 
|  | 996 | /* | 
|  | 997 | * Non-Stop TSC is advertised by CPUID.EAX=0x80000007: EDX.bit8 | 
|  | 998 | * this check is valid for both Intel and AMD | 
|  | 999 | */ | 
|  | 1000 | asm("cpuid" : "=a" (eax), "=b" (ebx), "=c" (ecx), "=d" (edx) : "a" (0x80000007)); | 
| Thomas Renninger | 8209e05 | 2011-01-21 15:11:19 +0100 | [diff] [blame] | 1001 | has_invariant_tsc = edx & (1 << 8); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 1002 |  | 
|  | 1003 | if (!has_invariant_tsc) { | 
|  | 1004 | fprintf(stderr, "No invariant TSC\n"); | 
|  | 1005 | exit(1); | 
|  | 1006 | } | 
|  | 1007 |  | 
|  | 1008 | /* | 
|  | 1009 | * APERF/MPERF is advertised by CPUID.EAX=0x6: ECX.bit0 | 
|  | 1010 | * this check is valid for both Intel and AMD | 
|  | 1011 | */ | 
|  | 1012 |  | 
|  | 1013 | asm("cpuid" : "=a" (eax), "=b" (ebx), "=c" (ecx), "=d" (edx) : "a" (0x6)); | 
| Thomas Renninger | 8209e05 | 2011-01-21 15:11:19 +0100 | [diff] [blame] | 1014 | has_aperf = ecx & (1 << 0); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 1015 | if (!has_aperf) { | 
|  | 1016 | fprintf(stderr, "No APERF MSR\n"); | 
|  | 1017 | exit(1); | 
|  | 1018 | } | 
|  | 1019 |  | 
|  | 1020 | do_nehalem_platform_info = genuine_intel && has_invariant_tsc; | 
|  | 1021 | do_nhm_cstates = genuine_intel;	/* all Intel w/ non-stop TSC have NHM counters */ | 
|  | 1022 | do_snb_cstates = is_snb(family, model); | 
|  | 1023 | bclk = discover_bclk(family, model); | 
|  | 1024 |  | 
|  | 1025 | do_nehalem_turbo_ratio_limit = has_nehalem_turbo_ratio_limit(family, model); | 
|  | 1026 | } | 
|  | 1027 |  | 
|  | 1028 |  | 
|  | 1029 | void usage() | 
|  | 1030 | { | 
|  | 1031 | fprintf(stderr, "%s: [-v] [-M MSR#] [-i interval_sec | command ...]\n", | 
|  | 1032 | progname); | 
|  | 1033 | exit(1); | 
|  | 1034 | } | 
|  | 1035 |  | 
|  | 1036 |  | 
/*
 * in /dev/cpu/ return success for names that are numbers
 * ie. filter out ".", "..", "microcode".
 *
 * Returns 1 when the entry name starts with a decimal digit, 0 otherwise.
 */
int dir_filter(const struct dirent *dirp)
{
	/*
	 * The <ctype.h> functions require a value representable as
	 * unsigned char; plain char may be negative for bytes >= 0x80.
	 */
	return isdigit((unsigned char)dirp->d_name[0]) ? 1 : 0;
}
|  | 1048 |  | 
/*
 * Placeholder: ignores its argument and always returns 0.
 */
int open_dev_cpu_msr(int dummy1)
{
	(void)dummy1;

	return 0;
}
|  | 1053 |  | 
|  | 1054 | void turbostat_init() | 
|  | 1055 | { | 
|  | 1056 | check_cpuid(); | 
|  | 1057 |  | 
|  | 1058 | check_dev_msr(); | 
|  | 1059 | check_super_user(); | 
|  | 1060 |  | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 1061 | num_cpus = for_all_cpus(alloc_new_counters); | 
| Len Brown | 88c3281 | 2012-03-29 21:44:40 -0400 | [diff] [blame] | 1062 | cpu_mask_init(num_cpus); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 1063 |  | 
|  | 1064 | if (verbose) | 
|  | 1065 | print_nehalem_info(); | 
|  | 1066 | } | 
|  | 1067 |  | 
|  | 1068 | int fork_it(char **argv) | 
|  | 1069 | { | 
|  | 1070 | int retval; | 
|  | 1071 | pid_t child_pid; | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 1072 | get_counters(cnt_even); | 
| Len Brown | d15cf7c | 2012-06-03 23:24:00 -0400 | [diff] [blame] | 1073 |  | 
|  | 1074 | /* clear affinity side-effect of get_counters() */ | 
|  | 1075 | sched_setaffinity(0, cpu_present_setsize, cpu_present_set); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 1076 | gettimeofday(&tv_even, (struct timezone *)NULL); | 
|  | 1077 |  | 
|  | 1078 | child_pid = fork(); | 
|  | 1079 | if (!child_pid) { | 
|  | 1080 | /* child */ | 
|  | 1081 | execvp(argv[0], argv); | 
|  | 1082 | } else { | 
|  | 1083 | int status; | 
|  | 1084 |  | 
|  | 1085 | /* parent */ | 
|  | 1086 | if (child_pid == -1) { | 
|  | 1087 | perror("fork"); | 
|  | 1088 | exit(1); | 
|  | 1089 | } | 
|  | 1090 |  | 
|  | 1091 | signal(SIGINT, SIG_IGN); | 
|  | 1092 | signal(SIGQUIT, SIG_IGN); | 
|  | 1093 | if (waitpid(child_pid, &status, 0) == -1) { | 
|  | 1094 | perror("wait"); | 
|  | 1095 | exit(1); | 
|  | 1096 | } | 
|  | 1097 | } | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 1098 | get_counters(cnt_odd); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 1099 | gettimeofday(&tv_odd, (struct timezone *)NULL); | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 1100 | retval = compute_delta(cnt_odd, cnt_even, cnt_delta); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 1101 |  | 
|  | 1102 | timersub(&tv_odd, &tv_even, &tv_delta); | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 1103 | compute_average(cnt_delta, cnt_average); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 1104 | if (!retval) | 
| Len Brown | a829eb4 | 2011-02-10 23:36:34 -0500 | [diff] [blame] | 1105 | print_counters(cnt_delta); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 1106 |  | 
| Justin P. Mattock | 6eab04a | 2011-04-08 19:49:08 -0700 | [diff] [blame] | 1107 | fprintf(stderr, "%.6f sec\n", tv_delta.tv_sec + tv_delta.tv_usec/1000000.0); | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 1108 |  | 
|  | 1109 | return 0; | 
|  | 1110 | } | 
|  | 1111 |  | 
|  | 1112 | void cmdline(int argc, char **argv) | 
|  | 1113 | { | 
|  | 1114 | int opt; | 
|  | 1115 |  | 
|  | 1116 | progname = argv[0]; | 
|  | 1117 |  | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 1118 | while ((opt = getopt(argc, argv, "+svi:M:")) != -1) { | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 1119 | switch (opt) { | 
| Len Brown | e23da03 | 2012-02-06 18:37:16 -0500 | [diff] [blame] | 1120 | case 's': | 
|  | 1121 | summary_only++; | 
|  | 1122 | break; | 
| Len Brown | 103a8fe | 2010-10-22 23:53:03 -0400 | [diff] [blame] | 1123 | case 'v': | 
|  | 1124 | verbose++; | 
|  | 1125 | break; | 
|  | 1126 | case 'i': | 
|  | 1127 | interval_sec = atoi(optarg); | 
|  | 1128 | break; | 
|  | 1129 | case 'M': | 
|  | 1130 | sscanf(optarg, "%x", &extra_msr_offset); | 
|  | 1131 | if (verbose > 1) | 
|  | 1132 | fprintf(stderr, "MSR 0x%X\n", extra_msr_offset); | 
|  | 1133 | break; | 
|  | 1134 | default: | 
|  | 1135 | usage(); | 
|  | 1136 | } | 
|  | 1137 | } | 
|  | 1138 | } | 
|  | 1139 |  | 
|  | 1140 | int main(int argc, char **argv) | 
|  | 1141 | { | 
|  | 1142 | cmdline(argc, argv); | 
|  | 1143 |  | 
|  | 1144 | if (verbose > 1) | 
|  | 1145 | fprintf(stderr, "turbostat Dec 6, 2010" | 
|  | 1146 | " - Len Brown <lenb@kernel.org>\n"); | 
|  | 1147 | if (verbose > 1) | 
|  | 1148 | fprintf(stderr, "http://userweb.kernel.org/~lenb/acpi/utils/pmtools/turbostat/\n"); | 
|  | 1149 |  | 
|  | 1150 | turbostat_init(); | 
|  | 1151 |  | 
|  | 1152 | /* | 
|  | 1153 | * if any params left, it must be a command to fork | 
|  | 1154 | */ | 
|  | 1155 | if (argc - optind) | 
|  | 1156 | return fork_it(argv + optind); | 
|  | 1157 | else | 
|  | 1158 | turbostat_loop(); | 
|  | 1159 |  | 
|  | 1160 | return 0; | 
|  | 1161 | } |