john stultz | 539eb11 | 2006-06-26 00:25:10 -0700 | [diff] [blame] | 1 | /* |
| 2 | * This code largely moved from arch/i386/kernel/timer/timer_tsc.c |
| 3 | * which was originally moved from arch/i386/kernel/time.c. |
| 4 | * See comments there for proper credits. |
| 5 | */ |
| 6 | |
john stultz | 5d0cf41 | 2006-06-26 00:25:12 -0700 | [diff] [blame] | 7 | #include <linux/clocksource.h> |
john stultz | 539eb11 | 2006-06-26 00:25:10 -0700 | [diff] [blame] | 8 | #include <linux/workqueue.h> |
| 9 | #include <linux/cpufreq.h> |
| 10 | #include <linux/jiffies.h> |
| 11 | #include <linux/init.h> |
john stultz | 5d0cf41 | 2006-06-26 00:25:12 -0700 | [diff] [blame] | 12 | #include <linux/dmi.h> |
john stultz | 539eb11 | 2006-06-26 00:25:10 -0700 | [diff] [blame] | 13 | |
john stultz | 5d0cf41 | 2006-06-26 00:25:12 -0700 | [diff] [blame] | 14 | #include <asm/delay.h> |
john stultz | 539eb11 | 2006-06-26 00:25:10 -0700 | [diff] [blame] | 15 | #include <asm/tsc.h> |
| 16 | #include <asm/io.h> |
Zachary Amsden | 6cb9a83 | 2007-03-05 00:30:35 -0800 | [diff] [blame] | 17 | #include <asm/timer.h> |
john stultz | 539eb11 | 2006-06-26 00:25:10 -0700 | [diff] [blame] | 18 | |
| 19 | #include "mach_timer.h" |
| 20 | |
/*
 * Non-zero once tsc_init() has calibrated the TSC and it is not known
 * to be unstable; cleared again by mark_tsc_unstable().  sched_clock()
 * falls back to jiffies while this is zero.
 */
static int tsc_enabled;

/*
 * TSC frequency in kHz.  It is kept separately from cpu_khz because on
 * some systems the TSC rate does not follow the CPU frequency.
 */
unsigned int tsc_khz;

/*
 * Non-zero when the TSC must not be used: set by the "notsc" boot
 * option (kernels built without CONFIG_X86_TSC) and by tsc_init() when
 * no usable TSC is available.
 */
int tsc_disable;
john stultz | 539eb11 | 2006-06-26 00:25:10 -0700 | [diff] [blame] | 31 | |
| 32 | #ifdef CONFIG_X86_TSC |
| 33 | static int __init tsc_setup(char *str) |
| 34 | { |
| 35 | printk(KERN_WARNING "notsc: Kernel compiled with CONFIG_X86_TSC, " |
| 36 | "cannot disable TSC.\n"); |
| 37 | return 1; |
| 38 | } |
| 39 | #else |
| 40 | /* |
| 41 | * disable flag for tsc. Takes effect by clearing the TSC cpu flag |
| 42 | * in cpu/common.c |
| 43 | */ |
| 44 | static int __init tsc_setup(char *str) |
| 45 | { |
| 46 | tsc_disable = 1; |
| 47 | |
| 48 | return 1; |
| 49 | } |
| 50 | #endif |
| 51 | |
| 52 | __setup("notsc", tsc_setup); |
| 53 | |
/*
 * Tracks whether the TSC has been judged unstable, either because of
 * cpufreq changes or because the TSCs are not synchronized.
 */
static int tsc_unstable;

/* Returns non-zero if the TSC has been marked unstable. */
static inline int check_tsc_unstable(void)
{
	const int unstable = tsc_unstable;

	return unstable;
}
| 64 | |
john stultz | 539eb11 | 2006-06-26 00:25:10 -0700 | [diff] [blame] | 65 | /* Accelerators for sched_clock() |
| 66 | * convert from cycles(64bits) => nanoseconds (64bits) |
| 67 | * basic equation: |
| 68 | * ns = cycles / (freq / ns_per_sec) |
| 69 | * ns = cycles * (ns_per_sec / freq) |
| 70 | * ns = cycles * (10^9 / (cpu_khz * 10^3)) |
| 71 | * ns = cycles * (10^6 / cpu_khz) |
| 72 | * |
| 73 | * Then we use scaling math (suggested by george@mvista.com) to get: |
| 74 | * ns = cycles * (10^6 * SC / cpu_khz) / SC |
| 75 | * ns = cycles * cyc2ns_scale / SC |
| 76 | * |
| 77 | * And since SC is a constant power of two, we can convert the div |
| 78 | * into a shift. |
| 79 | * |
| 80 | * We can use khz divisor instead of mhz to keep a better precision, since |
| 81 | * cyc2ns_scale is limited to 10^6 * 2^10, which fits in 32 bits. |
| 82 | * (mathieu.desnoyers@polymtl.ca) |
| 83 | * |
| 84 | * -johnstul@us.ibm.com "math is hard, lets go shopping!" |
| 85 | */ |
| 86 | static unsigned long cyc2ns_scale __read_mostly; |
| 87 | |
| 88 | #define CYC2NS_SCALE_FACTOR 10 /* 2^10, carefully chosen */ |
| 89 | |
| 90 | static inline void set_cyc2ns_scale(unsigned long cpu_khz) |
| 91 | { |
| 92 | cyc2ns_scale = (1000000 << CYC2NS_SCALE_FACTOR)/cpu_khz; |
| 93 | } |
| 94 | |
| 95 | static inline unsigned long long cycles_2_ns(unsigned long long cyc) |
| 96 | { |
| 97 | return (cyc * cyc2ns_scale) >> CYC2NS_SCALE_FACTOR; |
| 98 | } |
| 99 | |
| 100 | /* |
| 101 | * Scheduler clock - returns current time in nanosec units. |
| 102 | */ |
| 103 | unsigned long long sched_clock(void) |
| 104 | { |
| 105 | unsigned long long this_offset; |
| 106 | |
| 107 | /* |
Ingo Molnar | f969098 | 2007-02-13 13:26:22 +0100 | [diff] [blame] | 108 | * Fall back to jiffies if there's no TSC available: |
john stultz | 539eb11 | 2006-06-26 00:25:10 -0700 | [diff] [blame] | 109 | */ |
Thomas Gleixner | d9a5c0a | 2007-03-24 23:02:49 +0100 | [diff] [blame] | 110 | if (unlikely(!tsc_enabled)) |
Ingo Molnar | f969098 | 2007-02-13 13:26:22 +0100 | [diff] [blame] | 111 | /* No locking but a rare wrong value is not a big deal: */ |
john stultz | 539eb11 | 2006-06-26 00:25:10 -0700 | [diff] [blame] | 112 | return (jiffies_64 - INITIAL_JIFFIES) * (1000000000 / HZ); |
| 113 | |
| 114 | /* read the Time Stamp Counter: */ |
Zachary Amsden | 6cb9a83 | 2007-03-05 00:30:35 -0800 | [diff] [blame] | 115 | get_scheduled_cycles(this_offset); |
john stultz | 539eb11 | 2006-06-26 00:25:10 -0700 | [diff] [blame] | 116 | |
| 117 | /* return the value in ns */ |
| 118 | return cycles_2_ns(this_offset); |
| 119 | } |
| 120 | |
Zachary Amsden | 1182d85 | 2007-03-05 00:30:36 -0800 | [diff] [blame] | 121 | unsigned long native_calculate_cpu_khz(void) |
john stultz | 539eb11 | 2006-06-26 00:25:10 -0700 | [diff] [blame] | 122 | { |
| 123 | unsigned long long start, end; |
| 124 | unsigned long count; |
| 125 | u64 delta64; |
| 126 | int i; |
| 127 | unsigned long flags; |
| 128 | |
| 129 | local_irq_save(flags); |
| 130 | |
| 131 | /* run 3 times to ensure the cache is warm */ |
| 132 | for (i = 0; i < 3; i++) { |
| 133 | mach_prepare_counter(); |
| 134 | rdtscll(start); |
| 135 | mach_countup(&count); |
| 136 | rdtscll(end); |
| 137 | } |
| 138 | /* |
| 139 | * Error: ECTCNEVERSET |
| 140 | * The CTC wasn't reliable: we got a hit on the very first read, |
| 141 | * or the CPU was so fast/slow that the quotient wouldn't fit in |
| 142 | * 32 bits.. |
| 143 | */ |
| 144 | if (count <= 1) |
| 145 | goto err; |
| 146 | |
| 147 | delta64 = end - start; |
| 148 | |
| 149 | /* cpu freq too fast: */ |
| 150 | if (delta64 > (1ULL<<32)) |
| 151 | goto err; |
| 152 | |
| 153 | /* cpu freq too slow: */ |
| 154 | if (delta64 <= CALIBRATE_TIME_MSEC) |
| 155 | goto err; |
| 156 | |
| 157 | delta64 += CALIBRATE_TIME_MSEC/2; /* round for do_div */ |
| 158 | do_div(delta64,CALIBRATE_TIME_MSEC); |
| 159 | |
| 160 | local_irq_restore(flags); |
| 161 | return (unsigned long)delta64; |
| 162 | err: |
| 163 | local_irq_restore(flags); |
| 164 | return 0; |
| 165 | } |
| 166 | |
| 167 | int recalibrate_cpu_khz(void) |
| 168 | { |
| 169 | #ifndef CONFIG_SMP |
| 170 | unsigned long cpu_khz_old = cpu_khz; |
| 171 | |
| 172 | if (cpu_has_tsc) { |
| 173 | cpu_khz = calculate_cpu_khz(); |
| 174 | tsc_khz = cpu_khz; |
| 175 | cpu_data[0].loops_per_jiffy = |
| 176 | cpufreq_scale(cpu_data[0].loops_per_jiffy, |
| 177 | cpu_khz_old, cpu_khz); |
| 178 | return 0; |
| 179 | } else |
| 180 | return -ENODEV; |
| 181 | #else |
| 182 | return -ENODEV; |
| 183 | #endif |
| 184 | } |
| 185 | |
| 186 | EXPORT_SYMBOL(recalibrate_cpu_khz); |
| 187 | |
john stultz | 539eb11 | 2006-06-26 00:25:10 -0700 | [diff] [blame] | 188 | #ifdef CONFIG_CPU_FREQ |
| 189 | |
/*
 * If the CPU frequency is scaled, TSC-based delays need a different
 * loops_per_jiffy value to function properly.  These hold the reference
 * point (frequency, loops_per_jiffy and cpu_khz) captured by the cpufreq
 * notifier; all of them start out as zero.
 */
static unsigned int ref_freq;
static unsigned long loops_per_jiffy_ref;
static unsigned long cpu_khz_ref;
| 197 | |
| 198 | static int |
| 199 | time_cpufreq_notifier(struct notifier_block *nb, unsigned long val, void *data) |
| 200 | { |
| 201 | struct cpufreq_freqs *freq = data; |
| 202 | |
| 203 | if (val != CPUFREQ_RESUMECHANGE && val != CPUFREQ_SUSPENDCHANGE) |
| 204 | write_seqlock_irq(&xtime_lock); |
| 205 | |
| 206 | if (!ref_freq) { |
| 207 | if (!freq->old){ |
| 208 | ref_freq = freq->new; |
| 209 | goto end; |
| 210 | } |
| 211 | ref_freq = freq->old; |
| 212 | loops_per_jiffy_ref = cpu_data[freq->cpu].loops_per_jiffy; |
| 213 | cpu_khz_ref = cpu_khz; |
| 214 | } |
| 215 | |
| 216 | if ((val == CPUFREQ_PRECHANGE && freq->old < freq->new) || |
| 217 | (val == CPUFREQ_POSTCHANGE && freq->old > freq->new) || |
| 218 | (val == CPUFREQ_RESUMECHANGE)) { |
| 219 | if (!(freq->flags & CPUFREQ_CONST_LOOPS)) |
| 220 | cpu_data[freq->cpu].loops_per_jiffy = |
| 221 | cpufreq_scale(loops_per_jiffy_ref, |
| 222 | ref_freq, freq->new); |
| 223 | |
| 224 | if (cpu_khz) { |
| 225 | |
| 226 | if (num_online_cpus() == 1) |
| 227 | cpu_khz = cpufreq_scale(cpu_khz_ref, |
| 228 | ref_freq, freq->new); |
| 229 | if (!(freq->flags & CPUFREQ_CONST_LOOPS)) { |
| 230 | tsc_khz = cpu_khz; |
| 231 | set_cyc2ns_scale(cpu_khz); |
| 232 | /* |
| 233 | * TSC based sched_clock turns |
| 234 | * to junk w/ cpufreq |
| 235 | */ |
john stultz | 5a90cf2 | 2007-05-02 19:27:08 +0200 | [diff] [blame^] | 236 | mark_tsc_unstable("cpufreq changes"); |
john stultz | 539eb11 | 2006-06-26 00:25:10 -0700 | [diff] [blame] | 237 | } |
| 238 | } |
| 239 | } |
| 240 | end: |
| 241 | if (val != CPUFREQ_RESUMECHANGE && val != CPUFREQ_SUSPENDCHANGE) |
| 242 | write_sequnlock_irq(&xtime_lock); |
| 243 | |
| 244 | return 0; |
| 245 | } |
| 246 | |
| 247 | static struct notifier_block time_cpufreq_notifier_block = { |
| 248 | .notifier_call = time_cpufreq_notifier |
| 249 | }; |
| 250 | |
| 251 | static int __init cpufreq_tsc(void) |
| 252 | { |
Thomas Gleixner | 26a08eb | 2007-02-16 01:27:32 -0800 | [diff] [blame] | 253 | return cpufreq_register_notifier(&time_cpufreq_notifier_block, |
| 254 | CPUFREQ_TRANSITION_NOTIFIER); |
john stultz | 539eb11 | 2006-06-26 00:25:10 -0700 | [diff] [blame] | 255 | } |
john stultz | 539eb11 | 2006-06-26 00:25:10 -0700 | [diff] [blame] | 256 | core_initcall(cpufreq_tsc); |
| 257 | |
| 258 | #endif |
john stultz | 5d0cf41 | 2006-06-26 00:25:12 -0700 | [diff] [blame] | 259 | |
/* clock source code */

/* TSC frequency (kHz) used to compute the clocksource multiplier. */
static unsigned long current_tsc_khz;
john stultz | 5d0cf41 | 2006-06-26 00:25:12 -0700 | [diff] [blame] | 263 | |
| 264 | static cycle_t read_tsc(void) |
| 265 | { |
| 266 | cycle_t ret; |
| 267 | |
| 268 | rdtscll(ret); |
| 269 | |
| 270 | return ret; |
| 271 | } |
| 272 | |
| 273 | static struct clocksource clocksource_tsc = { |
| 274 | .name = "tsc", |
| 275 | .rating = 300, |
| 276 | .read = read_tsc, |
Jim Cromie | 7f9f303 | 2006-06-26 00:25:15 -0700 | [diff] [blame] | 277 | .mask = CLOCKSOURCE_MASK(64), |
john stultz | 5d0cf41 | 2006-06-26 00:25:12 -0700 | [diff] [blame] | 278 | .mult = 0, /* to be set */ |
| 279 | .shift = 22, |
Thomas Gleixner | 73b08d2 | 2007-02-16 01:27:36 -0800 | [diff] [blame] | 280 | .flags = CLOCK_SOURCE_IS_CONTINUOUS | |
| 281 | CLOCK_SOURCE_MUST_VERIFY, |
john stultz | 5d0cf41 | 2006-06-26 00:25:12 -0700 | [diff] [blame] | 282 | }; |
| 283 | |
john stultz | 5a90cf2 | 2007-05-02 19:27:08 +0200 | [diff] [blame^] | 284 | void mark_tsc_unstable(char *reason) |
john stultz | 5d0cf41 | 2006-06-26 00:25:12 -0700 | [diff] [blame] | 285 | { |
Thomas Gleixner | 7e69f2b | 2007-02-16 01:27:42 -0800 | [diff] [blame] | 286 | if (!tsc_unstable) { |
| 287 | tsc_unstable = 1; |
Thomas Gleixner | d9a5c0a | 2007-03-24 23:02:49 +0100 | [diff] [blame] | 288 | tsc_enabled = 0; |
john stultz | 5a90cf2 | 2007-05-02 19:27:08 +0200 | [diff] [blame^] | 289 | printk("Marking TSC unstable due to: %s.\n", reason); |
Thomas Gleixner | 7e69f2b | 2007-02-16 01:27:42 -0800 | [diff] [blame] | 290 | /* Can be called before registration */ |
| 291 | if (clocksource_tsc.mult) |
| 292 | clocksource_change_rating(&clocksource_tsc, 0); |
| 293 | else |
| 294 | clocksource_tsc.rating = 0; |
john stultz | 5d0cf41 | 2006-06-26 00:25:12 -0700 | [diff] [blame] | 295 | } |
john stultz | 5d0cf41 | 2006-06-26 00:25:12 -0700 | [diff] [blame] | 296 | } |
Thomas Gleixner | 7e69f2b | 2007-02-16 01:27:42 -0800 | [diff] [blame] | 297 | EXPORT_SYMBOL_GPL(mark_tsc_unstable); |
john stultz | 5d0cf41 | 2006-06-26 00:25:12 -0700 | [diff] [blame] | 298 | |
| 299 | static int __init dmi_mark_tsc_unstable(struct dmi_system_id *d) |
| 300 | { |
| 301 | printk(KERN_NOTICE "%s detected: marking TSC unstable.\n", |
| 302 | d->ident); |
Thomas Gleixner | 7e69f2b | 2007-02-16 01:27:42 -0800 | [diff] [blame] | 303 | tsc_unstable = 1; |
john stultz | 5d0cf41 | 2006-06-26 00:25:12 -0700 | [diff] [blame] | 304 | return 0; |
| 305 | } |
| 306 | |
| 307 | /* List of systems that have known TSC problems */ |
| 308 | static struct dmi_system_id __initdata bad_tsc_dmi_table[] = { |
| 309 | { |
| 310 | .callback = dmi_mark_tsc_unstable, |
| 311 | .ident = "IBM Thinkpad 380XD", |
| 312 | .matches = { |
| 313 | DMI_MATCH(DMI_BOARD_VENDOR, "IBM"), |
| 314 | DMI_MATCH(DMI_BOARD_NAME, "2635FA0"), |
| 315 | }, |
| 316 | }, |
| 317 | {} |
| 318 | }; |
| 319 | |
john stultz | 5d0cf41 | 2006-06-26 00:25:12 -0700 | [diff] [blame] | 320 | /* |
| 321 | * Make an educated guess if the TSC is trustworthy and synchronized |
| 322 | * over all CPUs. |
| 323 | */ |
Ingo Molnar | 95492e4 | 2007-02-16 01:27:34 -0800 | [diff] [blame] | 324 | __cpuinit int unsynchronized_tsc(void) |
john stultz | 5d0cf41 | 2006-06-26 00:25:12 -0700 | [diff] [blame] | 325 | { |
Ingo Molnar | 95492e4 | 2007-02-16 01:27:34 -0800 | [diff] [blame] | 326 | if (!cpu_has_tsc || tsc_unstable) |
| 327 | return 1; |
john stultz | 5d0cf41 | 2006-06-26 00:25:12 -0700 | [diff] [blame] | 328 | /* |
| 329 | * Intel systems are normally all synchronized. |
| 330 | * Exceptions must mark TSC as unstable: |
| 331 | */ |
Thomas Gleixner | 7e69f2b | 2007-02-16 01:27:42 -0800 | [diff] [blame] | 332 | if (boot_cpu_data.x86_vendor != X86_VENDOR_INTEL) { |
| 333 | /* assume multi socket systems are not synchronized: */ |
| 334 | if (num_possible_cpus() > 1) |
| 335 | tsc_unstable = 1; |
| 336 | } |
| 337 | return tsc_unstable; |
john stultz | 5d0cf41 | 2006-06-26 00:25:12 -0700 | [diff] [blame] | 338 | } |
| 339 | |
/*
 * Geode_LX - the OLPC CPU possibly has a very reliable TSC.
 */
#ifdef CONFIG_MGEODE_LX
/* RTSC counts during suspend */
#define RTSC_SUSP 0x100

/*
 * If the RTSC_SUSP bit is set in MSR_GEODE_BUSCONT_CONF0, drop the
 * MUST_VERIFY flag from the TSC clocksource.
 */
static void __init check_geode_tsc_reliable(void)
{
	unsigned long busconf;

	rdmsrl(MSR_GEODE_BUSCONT_CONF0, busconf);
	if (!(busconf & RTSC_SUSP))
		return;

	clocksource_tsc.flags &= ~CLOCK_SOURCE_MUST_VERIFY;
}
#else
/* Not a Geode LX build: nothing to check. */
static inline void check_geode_tsc_reliable(void) { }
#endif
| 358 | |
john stultz | 6bb74df | 2007-03-05 00:30:50 -0800 | [diff] [blame] | 359 | |
| 360 | void __init tsc_init(void) |
john stultz | 5d0cf41 | 2006-06-26 00:25:12 -0700 | [diff] [blame] | 361 | { |
john stultz | 6bb74df | 2007-03-05 00:30:50 -0800 | [diff] [blame] | 362 | if (!cpu_has_tsc || tsc_disable) |
| 363 | goto out_no_tsc; |
john stultz | 5d0cf41 | 2006-06-26 00:25:12 -0700 | [diff] [blame] | 364 | |
john stultz | 6bb74df | 2007-03-05 00:30:50 -0800 | [diff] [blame] | 365 | cpu_khz = calculate_cpu_khz(); |
| 366 | tsc_khz = cpu_khz; |
john stultz | 5d0cf41 | 2006-06-26 00:25:12 -0700 | [diff] [blame] | 367 | |
john stultz | 6bb74df | 2007-03-05 00:30:50 -0800 | [diff] [blame] | 368 | if (!cpu_khz) |
| 369 | goto out_no_tsc; |
| 370 | |
| 371 | printk("Detected %lu.%03lu MHz processor.\n", |
| 372 | (unsigned long)cpu_khz / 1000, |
| 373 | (unsigned long)cpu_khz % 1000); |
| 374 | |
| 375 | set_cyc2ns_scale(cpu_khz); |
| 376 | use_tsc_delay(); |
| 377 | |
| 378 | /* Check and install the TSC clocksource */ |
| 379 | dmi_check_system(bad_tsc_dmi_table); |
| 380 | |
| 381 | unsynchronized_tsc(); |
| 382 | check_geode_tsc_reliable(); |
| 383 | current_tsc_khz = tsc_khz; |
| 384 | clocksource_tsc.mult = clocksource_khz2mult(current_tsc_khz, |
john stultz | 5d0cf41 | 2006-06-26 00:25:12 -0700 | [diff] [blame] | 385 | clocksource_tsc.shift); |
john stultz | 6bb74df | 2007-03-05 00:30:50 -0800 | [diff] [blame] | 386 | /* lower the rating if we already know its unstable: */ |
| 387 | if (check_tsc_unstable()) { |
| 388 | clocksource_tsc.rating = 0; |
| 389 | clocksource_tsc.flags &= ~CLOCK_SOURCE_IS_CONTINUOUS; |
Thomas Gleixner | d9a5c0a | 2007-03-24 23:02:49 +0100 | [diff] [blame] | 390 | } else |
| 391 | tsc_enabled = 1; |
| 392 | |
john stultz | 6bb74df | 2007-03-05 00:30:50 -0800 | [diff] [blame] | 393 | clocksource_register(&clocksource_tsc); |
john stultz | 5d0cf41 | 2006-06-26 00:25:12 -0700 | [diff] [blame] | 394 | |
john stultz | 6bb74df | 2007-03-05 00:30:50 -0800 | [diff] [blame] | 395 | return; |
| 396 | |
| 397 | out_no_tsc: |
| 398 | /* |
| 399 | * Set the tsc_disable flag if there's no TSC support, this |
| 400 | * makes it a fast flag for the kernel to see whether it |
| 401 | * should be using the TSC. |
| 402 | */ |
| 403 | tsc_disable = 1; |
john stultz | 5d0cf41 | 2006-06-26 00:25:12 -0700 | [diff] [blame] | 404 | } |