blob: 216fc9d742478902ca0109faa3aaf432a73381a8 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * linux/arch/x86-64/kernel/time.c
3 *
4 * "High Precision Event Timer" based timekeeping.
5 *
6 * Copyright (c) 1991,1992,1995 Linus Torvalds
7 * Copyright (c) 1994 Alan Modra
8 * Copyright (c) 1995 Markus Kuhn
9 * Copyright (c) 1996 Ingo Molnar
10 * Copyright (c) 1998 Andrea Arcangeli
Vojtech Pavlik2f82bde42006-06-26 13:58:38 +020011 * Copyright (c) 2002,2006 Vojtech Pavlik
Linus Torvalds1da177e2005-04-16 15:20:36 -070012 * Copyright (c) 2003 Andi Kleen
13 * RTC support code taken from arch/i386/kernel/timers/time_hpet.c
14 */
15
16#include <linux/kernel.h>
17#include <linux/sched.h>
18#include <linux/interrupt.h>
19#include <linux/init.h>
20#include <linux/mc146818rtc.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070021#include <linux/time.h>
22#include <linux/ioport.h>
23#include <linux/module.h>
24#include <linux/device.h>
25#include <linux/sysdev.h>
26#include <linux/bcd.h>
Vojtech Pavlika670fad2006-09-26 10:52:28 +020027#include <linux/notifier.h>
28#include <linux/cpu.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070029#include <linux/kallsyms.h>
Andi Kleen312df5f2005-05-16 21:53:28 -070030#include <linux/acpi.h>
Andi Kleen8d916402005-05-31 14:39:26 -070031#ifdef CONFIG_ACPI
Andi Kleen312df5f2005-05-16 21:53:28 -070032#include <acpi/achware.h> /* for PM timer frequency */
Andi Kleen0e5f61b2006-07-29 21:42:37 +020033#include <acpi/acpi_bus.h>
Andi Kleen8d916402005-05-31 14:39:26 -070034#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -070035#include <asm/8253pit.h>
36#include <asm/pgtable.h>
37#include <asm/vsyscall.h>
38#include <asm/timex.h>
39#include <asm/proto.h>
40#include <asm/hpet.h>
41#include <asm/sections.h>
42#include <linux/cpufreq.h>
43#include <linux/hpet.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070044#include <asm/apic.h>
john stultzc37e7bb2007-02-16 01:28:19 -080045#include <asm/hpet.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070046
Linus Torvalds1da177e2005-04-16 15:20:36 -070047#ifdef CONFIG_CPU_FREQ
john stultzc37e7bb2007-02-16 01:28:19 -080048extern void cpufreq_delayed_get(void);
Linus Torvalds1da177e2005-04-16 15:20:36 -070049#endif
50extern void i8254_timer_resume(void);
51extern int using_apic_timer;
52
Vojtech Pavlika670fad2006-09-26 10:52:28 +020053static char *timename = NULL;
Andi Kleene8b91772006-02-26 04:18:49 +010054
Linus Torvalds1da177e2005-04-16 15:20:36 -070055DEFINE_SPINLOCK(rtc_lock);
Andi Kleen2ee60e172006-06-26 13:59:44 +020056EXPORT_SYMBOL(rtc_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -070057DEFINE_SPINLOCK(i8253_lock);
58
Linus Torvalds1da177e2005-04-16 15:20:36 -070059unsigned long vxtime_hz = PIT_TICK_RATE;
60int report_lost_ticks; /* command line option */
61unsigned long long monotonic_base;
62
63struct vxtime_data __vxtime __section_vxtime; /* for vsyscalls */
64
65volatile unsigned long __jiffies __section_jiffies = INITIAL_JIFFIES;
Linus Torvalds1da177e2005-04-16 15:20:36 -070066struct timespec __xtime __section_xtime;
67struct timezone __sys_tz __section_sys_tz;
68
Linus Torvalds1da177e2005-04-16 15:20:36 -070069unsigned int (*do_gettimeoffset)(void) = do_gettimeoffset_tsc;
70
71/*
72 * This version of gettimeofday() has microsecond resolution and better than
73 * microsecond precision, as we're using at least a 10 MHz (usually 14.31818
74 * MHz) HPET timer.
75 */
76
77void do_gettimeofday(struct timeval *tv)
78{
Atsushi Nemoto8ef38602006-09-30 23:28:31 -070079 unsigned long seq;
Linus Torvalds1da177e2005-04-16 15:20:36 -070080 unsigned int sec, usec;
81
82 do {
83 seq = read_seqbegin(&xtime_lock);
84
85 sec = xtime.tv_sec;
Vojtech Pavlik42211332006-06-26 13:58:32 +020086 usec = xtime.tv_nsec / NSEC_PER_USEC;
Linus Torvalds1da177e2005-04-16 15:20:36 -070087
88 /* i386 does some correction here to keep the clock
89 monotonous even when ntpd is fixing drift.
90 But they didn't work for me, there is a non monotonic
91 clock anyways with ntp.
92 I dropped all corrections now until a real solution can
93 be found. Note when you fix it here you need to do the same
94 in arch/x86_64/kernel/vsyscall.c and export all needed
95 variables in vmlinux.lds. -AK */
Atsushi Nemoto8ef38602006-09-30 23:28:31 -070096 usec += do_gettimeoffset();
Linus Torvalds1da177e2005-04-16 15:20:36 -070097
98 } while (read_seqretry(&xtime_lock, seq));
99
Vojtech Pavlik42211332006-06-26 13:58:32 +0200100 tv->tv_sec = sec + usec / USEC_PER_SEC;
101 tv->tv_usec = usec % USEC_PER_SEC;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700102}
103
104EXPORT_SYMBOL(do_gettimeofday);
105
106/*
107 * settimeofday() first undoes the correction that gettimeofday would do
108 * on the time, and then saves it. This is ugly, but has been like this for
109 * ages already.
110 */
111
112int do_settimeofday(struct timespec *tv)
113{
114 time_t wtm_sec, sec = tv->tv_sec;
115 long wtm_nsec, nsec = tv->tv_nsec;
116
117 if ((unsigned long)tv->tv_nsec >= NSEC_PER_SEC)
118 return -EINVAL;
119
120 write_seqlock_irq(&xtime_lock);
121
Atsushi Nemoto8ef38602006-09-30 23:28:31 -0700122 nsec -= do_gettimeoffset() * NSEC_PER_USEC;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700123
124 wtm_sec = wall_to_monotonic.tv_sec + (xtime.tv_sec - sec);
125 wtm_nsec = wall_to_monotonic.tv_nsec + (xtime.tv_nsec - nsec);
126
127 set_normalized_timespec(&xtime, sec, nsec);
128 set_normalized_timespec(&wall_to_monotonic, wtm_sec, wtm_nsec);
129
john stultzb149ee22005-09-06 15:17:46 -0700130 ntp_clear();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700131
132 write_sequnlock_irq(&xtime_lock);
133 clock_was_set();
134 return 0;
135}
136
137EXPORT_SYMBOL(do_settimeofday);
138
139unsigned long profile_pc(struct pt_regs *regs)
140{
141 unsigned long pc = instruction_pointer(regs);
142
Andi Kleen31679f32006-09-26 10:52:28 +0200143 /* Assume the lock function has either no stack frame or a copy
144 of eflags from PUSHF
145 Eflags always has bits 22 and up cleared unlike kernel addresses. */
Andi Kleend5a26012006-07-28 14:44:42 +0200146 if (!user_mode(regs) && in_lock_functions(pc)) {
Andi Kleen31679f32006-09-26 10:52:28 +0200147 unsigned long *sp = (unsigned long *)regs->rsp;
148 if (sp[0] >> 22)
149 return sp[0];
150 if (sp[1] >> 22)
151 return sp[1];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700152 }
153 return pc;
154}
155EXPORT_SYMBOL(profile_pc);
156
157/*
158 * In order to set the CMOS clock precisely, set_rtc_mmss has to be called 500
159 * ms after the second nowtime has started, because when nowtime is written
160 * into the registers of the CMOS clock, it will jump to the next second
161 * precisely 500 ms later. Check the Motorola MC146818A or Dallas DS12887 data
162 * sheet for details.
163 */
164
165static void set_rtc_mmss(unsigned long nowtime)
166{
167 int real_seconds, real_minutes, cmos_minutes;
168 unsigned char control, freq_select;
169
170/*
171 * IRQs are disabled when we're called from the timer interrupt,
172 * no need for spin_lock_irqsave()
173 */
174
175 spin_lock(&rtc_lock);
176
177/*
178 * Tell the clock it's being set and stop it.
179 */
180
181 control = CMOS_READ(RTC_CONTROL);
182 CMOS_WRITE(control | RTC_SET, RTC_CONTROL);
183
184 freq_select = CMOS_READ(RTC_FREQ_SELECT);
185 CMOS_WRITE(freq_select | RTC_DIV_RESET2, RTC_FREQ_SELECT);
186
187 cmos_minutes = CMOS_READ(RTC_MINUTES);
188 BCD_TO_BIN(cmos_minutes);
189
190/*
191 * since we're only adjusting minutes and seconds, don't interfere with hour
192 * overflow. This avoids messing with unknown time zones but requires your RTC
193 * not to be off by more than 15 minutes. Since we're calling it only when
194 * our clock is externally synchronized using NTP, this shouldn't be a problem.
195 */
196
197 real_seconds = nowtime % 60;
198 real_minutes = nowtime / 60;
199 if (((abs(real_minutes - cmos_minutes) + 15) / 30) & 1)
200 real_minutes += 30; /* correct for half hour time zone */
201 real_minutes %= 60;
202
Linus Torvalds1da177e2005-04-16 15:20:36 -0700203 if (abs(real_minutes - cmos_minutes) >= 30) {
204 printk(KERN_WARNING "time.c: can't update CMOS clock "
205 "from %d to %d\n", cmos_minutes, real_minutes);
Andi Kleen28456ed2006-03-25 16:30:37 +0100206 } else {
Andi Kleen0b913172006-01-11 22:45:33 +0100207 BIN_TO_BCD(real_seconds);
208 BIN_TO_BCD(real_minutes);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700209 CMOS_WRITE(real_seconds, RTC_SECONDS);
210 CMOS_WRITE(real_minutes, RTC_MINUTES);
211 }
212
213/*
214 * The following flags have to be released exactly in this order, otherwise the
215 * DS12887 (popular MC146818A clone with integrated battery and quartz) will
216 * not reset the oscillator and will not update precisely 500 ms later. You
217 * won't find this mentioned in the Dallas Semiconductor data sheets, but who
218 * believes data sheets anyway ... -- Markus Kuhn
219 */
220
221 CMOS_WRITE(control, RTC_CONTROL);
222 CMOS_WRITE(freq_select, RTC_FREQ_SELECT);
223
224 spin_unlock(&rtc_lock);
225}
226
227
228/* monotonic_clock(): returns # of nanoseconds passed since time_init()
229 * Note: This function is required to return accurate
230 * time even in the absence of multiple timer ticks.
231 */
john stultzc37e7bb2007-02-16 01:28:19 -0800232extern unsigned long long cycles_2_ns(unsigned long long cyc);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700233unsigned long long monotonic_clock(void)
234{
235 unsigned long seq;
236 u32 last_offset, this_offset, offset;
237 unsigned long long base;
238
239 if (vxtime.mode == VXTIME_HPET) {
240 do {
241 seq = read_seqbegin(&xtime_lock);
242
243 last_offset = vxtime.last;
244 base = monotonic_base;
john stultza3a00752005-06-23 00:08:36 -0700245 this_offset = hpet_readl(HPET_COUNTER);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700246 } while (read_seqretry(&xtime_lock, seq));
247 offset = (this_offset - last_offset);
Vojtech Pavlik42211332006-06-26 13:58:32 +0200248 offset *= NSEC_PER_TICK / hpet_tick;
Andi Kleen0b913172006-01-11 22:45:33 +0100249 } else {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700250 do {
251 seq = read_seqbegin(&xtime_lock);
252
253 last_offset = vxtime.last_tsc;
254 base = monotonic_base;
255 } while (read_seqretry(&xtime_lock, seq));
Andi Kleenc818a182006-01-11 22:45:24 +0100256 this_offset = get_cycles_sync();
Dimitri Sivanichcbf9b4b2006-09-26 10:52:34 +0200257 offset = cycles_2_ns(this_offset - last_offset);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700258 }
Andi Kleen7351c0b2006-03-25 16:30:34 +0100259 return base + offset;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700260}
261EXPORT_SYMBOL(monotonic_clock);
262
David Howells7d12e782006-10-05 14:55:46 +0100263static noinline void handle_lost_ticks(int lost)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700264{
Andi Kleen7351c0b2006-03-25 16:30:34 +0100265 static long lost_count;
266 static int warned;
267 if (report_lost_ticks) {
268 printk(KERN_WARNING "time.c: Lost %d timer tick(s)! ", lost);
David Howells7d12e782006-10-05 14:55:46 +0100269 print_symbol("rip %s)\n", get_irq_regs()->rip);
Andi Kleen7351c0b2006-03-25 16:30:34 +0100270 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700271
Andi Kleen7351c0b2006-03-25 16:30:34 +0100272 if (lost_count == 1000 && !warned) {
273 printk(KERN_WARNING "warning: many lost ticks.\n"
274 KERN_WARNING "Your time source seems to be instable or "
Linus Torvalds1da177e2005-04-16 15:20:36 -0700275 "some driver is hogging interupts\n");
David Howells7d12e782006-10-05 14:55:46 +0100276 print_symbol("rip %s\n", get_irq_regs()->rip);
john stultz2d0c87c2007-02-16 01:28:18 -0800277 if (vxtime.mode == VXTIME_TSC && hpet_address) {
Andi Kleen7351c0b2006-03-25 16:30:34 +0100278 printk(KERN_WARNING "Falling back to HPET\n");
279 if (hpet_use_timer)
280 vxtime.last = hpet_readl(HPET_T0_CMP) -
281 hpet_tick;
282 else
283 vxtime.last = hpet_readl(HPET_COUNTER);
284 vxtime.mode = VXTIME_HPET;
john stultz2d0c87c2007-02-16 01:28:18 -0800285 vxtime.hpet_address = hpet_address;
Andi Kleen7351c0b2006-03-25 16:30:34 +0100286 do_gettimeoffset = do_gettimeoffset_hpet;
287 }
288 /* else should fall back to PIT, but code missing. */
289 warned = 1;
290 } else
291 lost_count++;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700292
293#ifdef CONFIG_CPU_FREQ
Andi Kleen7351c0b2006-03-25 16:30:34 +0100294 /* In some cases the CPU can change frequency without us noticing
295 Give cpufreq a change to catch up. */
296 if ((lost_count+1) % 25 == 0)
297 cpufreq_delayed_get();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700298#endif
299}
300
David Howells7d12e782006-10-05 14:55:46 +0100301void main_timer_handler(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700302{
303 static unsigned long rtc_update = 0;
304 unsigned long tsc;
Andi Kleen9ede6b02006-03-25 16:29:31 +0100305 int delay = 0, offset = 0, lost = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700306
307/*
308 * Here we are in the timer irq handler. We have irqs locally disabled (so we
309 * don't need spin_lock_irqsave()) but we don't know if the timer_bh is running
310 * on the other CPU, so we need a lock. We also need to lock the vsyscall
311 * variables, because both do_timer() and us change them -arca+vojtech
312 */
313
314 write_seqlock(&xtime_lock);
315
john stultz2d0c87c2007-02-16 01:28:18 -0800316 if (hpet_address)
john stultza3a00752005-06-23 00:08:36 -0700317 offset = hpet_readl(HPET_COUNTER);
318
319 if (hpet_use_timer) {
320 /* if we're using the hpet timer functionality,
321 * we can more accurately know the counter value
322 * when the timer interrupt occured.
323 */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700324 offset = hpet_readl(HPET_T0_CMP) - hpet_tick;
325 delay = hpet_readl(HPET_COUNTER) - offset;
Andi Kleen9ede6b02006-03-25 16:29:31 +0100326 } else if (!pmtmr_ioport) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700327 spin_lock(&i8253_lock);
328 outb_p(0x00, 0x43);
329 delay = inb_p(0x40);
330 delay |= inb(0x40) << 8;
331 spin_unlock(&i8253_lock);
332 delay = LATCH - 1 - delay;
333 }
334
Andi Kleenc818a182006-01-11 22:45:24 +0100335 tsc = get_cycles_sync();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700336
337 if (vxtime.mode == VXTIME_HPET) {
338 if (offset - vxtime.last > hpet_tick) {
339 lost = (offset - vxtime.last) / hpet_tick - 1;
340 }
341
342 monotonic_base +=
Vojtech Pavlik42211332006-06-26 13:58:32 +0200343 (offset - vxtime.last) * NSEC_PER_TICK / hpet_tick;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700344
345 vxtime.last = offset;
Andi Kleen312df5f2005-05-16 21:53:28 -0700346#ifdef CONFIG_X86_PM_TIMER
347 } else if (vxtime.mode == VXTIME_PMTMR) {
348 lost = pmtimer_mark_offset();
349#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700350 } else {
351 offset = (((tsc - vxtime.last_tsc) *
Vojtech Pavlik42211332006-06-26 13:58:32 +0200352 vxtime.tsc_quot) >> US_SCALE) - USEC_PER_TICK;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700353
354 if (offset < 0)
355 offset = 0;
356
Vojtech Pavlik42211332006-06-26 13:58:32 +0200357 if (offset > USEC_PER_TICK) {
358 lost = offset / USEC_PER_TICK;
359 offset %= USEC_PER_TICK;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700360 }
361
Dimitri Sivanichcbf9b4b2006-09-26 10:52:34 +0200362 monotonic_base += cycles_2_ns(tsc - vxtime.last_tsc);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700363
364 vxtime.last_tsc = tsc - vxtime.quot * delay / vxtime.tsc_quot;
365
366 if ((((tsc - vxtime.last_tsc) *
Vojtech Pavlik42211332006-06-26 13:58:32 +0200367 vxtime.tsc_quot) >> US_SCALE) < offset)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700368 vxtime.last_tsc = tsc -
Vojtech Pavlik42211332006-06-26 13:58:32 +0200369 (((long) offset << US_SCALE) / vxtime.tsc_quot) - 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700370 }
371
Atsushi Nemoto3171a032006-09-29 02:00:32 -0700372 if (lost > 0)
David Howells7d12e782006-10-05 14:55:46 +0100373 handle_lost_ticks(lost);
Atsushi Nemoto3171a032006-09-29 02:00:32 -0700374 else
375 lost = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700376
377/*
378 * Do the timer stuff.
379 */
380
Atsushi Nemoto3171a032006-09-29 02:00:32 -0700381 do_timer(lost + 1);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700382#ifndef CONFIG_SMP
David Howells7d12e782006-10-05 14:55:46 +0100383 update_process_times(user_mode(get_irq_regs()));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700384#endif
385
386/*
387 * In the SMP case we use the local APIC timer interrupt to do the profiling,
388 * except when we simulate SMP mode on a uniprocessor system, in that case we
389 * have to call the local interrupt handler.
390 */
391
Linus Torvalds1da177e2005-04-16 15:20:36 -0700392 if (!using_apic_timer)
David Howells7d12e782006-10-05 14:55:46 +0100393 smp_local_timer_interrupt();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700394
395/*
396 * If we have an externally synchronized Linux clock, then update CMOS clock
397 * accordingly every ~11 minutes. set_rtc_mmss() will be called in the jiffy
398 * closest to exactly 500 ms before the next second. If the update fails, we
399 * don't care, as it'll be updated on the next turn, and the problem (time way
400 * off) isn't likely to go away much sooner anyway.
401 */
402
john stultzb149ee22005-09-06 15:17:46 -0700403 if (ntp_synced() && xtime.tv_sec > rtc_update &&
Linus Torvalds1da177e2005-04-16 15:20:36 -0700404 abs(xtime.tv_nsec - 500000000) <= tick_nsec / 2) {
405 set_rtc_mmss(xtime.tv_sec);
406 rtc_update = xtime.tv_sec + 660;
407 }
408
409 write_sequnlock(&xtime_lock);
Andi Kleen73dea472006-02-03 21:50:50 +0100410}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700411
David Howells7d12e782006-10-05 14:55:46 +0100412static irqreturn_t timer_interrupt(int irq, void *dev_id)
Andi Kleen73dea472006-02-03 21:50:50 +0100413{
414 if (apic_runs_main_timer > 1)
415 return IRQ_HANDLED;
David Howells7d12e782006-10-05 14:55:46 +0100416 main_timer_handler();
Venkatesh Pallipadid25bf7e2006-01-11 22:44:24 +0100417 if (using_apic_timer)
418 smp_send_timer_broadcast_ipi();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700419 return IRQ_HANDLED;
420}
421
Andi Kleenbdf2b1c2006-01-11 22:46:39 +0100422static unsigned long get_cmos_time(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700423{
Matt Mackall641f71f2006-03-28 01:56:01 -0800424 unsigned int year, mon, day, hour, min, sec;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700425 unsigned long flags;
Alexey Starikovskiyad718602007-02-02 19:48:19 +0300426 unsigned century = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700427
Linus Torvalds1da177e2005-04-16 15:20:36 -0700428 spin_lock_irqsave(&rtc_lock, flags);
429
Matt Mackall641f71f2006-03-28 01:56:01 -0800430 do {
431 sec = CMOS_READ(RTC_SECONDS);
432 min = CMOS_READ(RTC_MINUTES);
433 hour = CMOS_READ(RTC_HOURS);
434 day = CMOS_READ(RTC_DAY_OF_MONTH);
435 mon = CMOS_READ(RTC_MONTH);
436 year = CMOS_READ(RTC_YEAR);
Andi Kleen6954bee2006-03-25 16:30:31 +0100437#ifdef CONFIG_ACPI
Alexey Starikovskiyad718602007-02-02 19:48:19 +0300438 if (acpi_gbl_FADT.header.revision >= FADT2_REVISION_ID &&
439 acpi_gbl_FADT.century)
440 century = CMOS_READ(acpi_gbl_FADT.century);
Andi Kleen6954bee2006-03-25 16:30:31 +0100441#endif
Matt Mackall641f71f2006-03-28 01:56:01 -0800442 } while (sec != CMOS_READ(RTC_SECONDS));
Andi Kleen6954bee2006-03-25 16:30:31 +0100443
Linus Torvalds1da177e2005-04-16 15:20:36 -0700444 spin_unlock_irqrestore(&rtc_lock, flags);
445
Andi Kleen0b913172006-01-11 22:45:33 +0100446 /*
447 * We know that x86-64 always uses BCD format, no need to check the
448 * config register.
Andi Kleen7351c0b2006-03-25 16:30:34 +0100449 */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700450
Andi Kleen0b913172006-01-11 22:45:33 +0100451 BCD_TO_BIN(sec);
452 BCD_TO_BIN(min);
453 BCD_TO_BIN(hour);
454 BCD_TO_BIN(day);
455 BCD_TO_BIN(mon);
456 BCD_TO_BIN(year);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700457
Alexey Starikovskiyad718602007-02-02 19:48:19 +0300458 if (century) {
459 BCD_TO_BIN(century);
460 year += century * 100;
461 printk(KERN_INFO "Extended CMOS year: %d\n", century * 100);
Andi Kleen6954bee2006-03-25 16:30:31 +0100462 } else {
463 /*
464 * x86-64 systems only exists since 2002.
465 * This will work up to Dec 31, 2100
466 */
467 year += 2000;
468 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700469
470 return mktime(year, mon, day, hour, min, sec);
471}
472
Linus Torvalds1da177e2005-04-16 15:20:36 -0700473
474/*
475 * pit_calibrate_tsc() uses the speaker output (channel 2) of
476 * the PIT. This is better than using the timer interrupt output,
477 * because we can read the value of the speaker with just one inb(),
478 * where we need three i/o operations for the interrupt channel.
479 * We count how many ticks the TSC does in 50 ms.
480 */
481
482static unsigned int __init pit_calibrate_tsc(void)
483{
484 unsigned long start, end;
485 unsigned long flags;
486
487 spin_lock_irqsave(&i8253_lock, flags);
488
489 outb((inb(0x61) & ~0x02) | 0x01, 0x61);
490
491 outb(0xb0, 0x43);
492 outb((PIT_TICK_RATE / (1000 / 50)) & 0xff, 0x42);
493 outb((PIT_TICK_RATE / (1000 / 50)) >> 8, 0x42);
Andi Kleenc818a182006-01-11 22:45:24 +0100494 start = get_cycles_sync();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700495 while ((inb(0x61) & 0x20) == 0);
Andi Kleenc818a182006-01-11 22:45:24 +0100496 end = get_cycles_sync();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700497
498 spin_unlock_irqrestore(&i8253_lock, flags);
499
500 return (end - start) / 50;
501}
502
Andi Kleen73dea472006-02-03 21:50:50 +0100503#define PIT_MODE 0x43
504#define PIT_CH0 0x40
505
506static void __init __pit_init(int val, u8 mode)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700507{
508 unsigned long flags;
509
510 spin_lock_irqsave(&i8253_lock, flags);
Andi Kleen73dea472006-02-03 21:50:50 +0100511 outb_p(mode, PIT_MODE);
512 outb_p(val & 0xff, PIT_CH0); /* LSB */
513 outb_p(val >> 8, PIT_CH0); /* MSB */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700514 spin_unlock_irqrestore(&i8253_lock, flags);
515}
516
Andi Kleen73dea472006-02-03 21:50:50 +0100517void __init pit_init(void)
518{
519 __pit_init(LATCH, 0x34); /* binary, mode 2, LSB/MSB, ch 0 */
520}
521
522void __init pit_stop_interrupt(void)
523{
524 __pit_init(0, 0x30); /* mode 0 */
525}
526
527void __init stop_timer_interrupt(void)
528{
529 char *name;
john stultz2d0c87c2007-02-16 01:28:18 -0800530 if (hpet_address) {
Andi Kleen73dea472006-02-03 21:50:50 +0100531 name = "HPET";
532 hpet_timer_stop_set_go(0);
533 } else {
534 name = "PIT";
535 pit_stop_interrupt();
536 }
537 printk(KERN_INFO "timer: %s interrupt stopped.\n", name);
538}
539
Linus Torvalds1da177e2005-04-16 15:20:36 -0700540int __init time_setup(char *str)
541{
542 report_lost_ticks = 1;
543 return 1;
544}
545
546static struct irqaction irq0 = {
Thomas Gleixnerb1e05aa2006-07-01 19:29:29 -0700547 timer_interrupt, IRQF_DISABLED, CPU_MASK_NONE, "timer", NULL, NULL
Linus Torvalds1da177e2005-04-16 15:20:36 -0700548};
549
Linus Torvalds1da177e2005-04-16 15:20:36 -0700550void __init time_init(void)
551{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700552 if (nohpet)
john stultz2d0c87c2007-02-16 01:28:18 -0800553 hpet_address = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700554 xtime.tv_sec = get_cmos_time();
555 xtime.tv_nsec = 0;
556
557 set_normalized_timespec(&wall_to_monotonic,
558 -xtime.tv_sec, -xtime.tv_nsec);
559
john stultzc37e7bb2007-02-16 01:28:19 -0800560 if (!hpet_arch_init())
Vojtech Pavlik42211332006-06-26 13:58:32 +0200561 vxtime_hz = (FSEC_PER_SEC + hpet_period / 2) / hpet_period;
Andi Kleen68e18892005-12-12 22:17:07 -0800562 else
john stultz2d0c87c2007-02-16 01:28:18 -0800563 hpet_address = 0;
john stultza3a00752005-06-23 00:08:36 -0700564
565 if (hpet_use_timer) {
Jordan Hargraveb20367a2006-04-07 19:50:18 +0200566 /* set tick_nsec to use the proper rate for HPET */
567 tick_nsec = TICK_NSEC_HPET;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700568 cpu_khz = hpet_calibrate_tsc();
569 timename = "HPET";
Andi Kleen312df5f2005-05-16 21:53:28 -0700570#ifdef CONFIG_X86_PM_TIMER
john stultz2d0c87c2007-02-16 01:28:18 -0800571 } else if (pmtmr_ioport && !hpet_address) {
Andi Kleen312df5f2005-05-16 21:53:28 -0700572 vxtime_hz = PM_TIMER_FREQUENCY;
573 timename = "PM";
574 pit_init();
575 cpu_khz = pit_calibrate_tsc();
576#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700577 } else {
578 pit_init();
579 cpu_khz = pit_calibrate_tsc();
580 timename = "PIT";
581 }
582
Andi Kleene8b91772006-02-26 04:18:49 +0100583 vxtime.mode = VXTIME_TSC;
Vojtech Pavlik42211332006-06-26 13:58:32 +0200584 vxtime.quot = (USEC_PER_SEC << US_SCALE) / vxtime_hz;
585 vxtime.tsc_quot = (USEC_PER_MSEC << US_SCALE) / cpu_khz;
Andi Kleenc818a182006-01-11 22:45:24 +0100586 vxtime.last_tsc = get_cycles_sync();
Mathieu Desnoyersdacb16b2005-10-30 14:59:25 -0800587 set_cyc2ns_scale(cpu_khz);
Dimitri Sivanichcbf9b4b2006-09-26 10:52:34 +0200588 setup_irq(0, &irq0);
Vojtech Pavlika670fad2006-09-26 10:52:28 +0200589
590#ifndef CONFIG_SMP
591 time_init_gtod();
592#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700593}
594
Andi Kleen312df5f2005-05-16 21:53:28 -0700595/*
Andi Kleene8b91772006-02-26 04:18:49 +0100596 * Decide what mode gettimeofday should use.
Andi Kleena8ab26f2005-04-16 15:25:19 -0700597 */
Vojtech Pavlika670fad2006-09-26 10:52:28 +0200598void time_init_gtod(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700599{
600 char *timetype;
601
Andi Kleen312df5f2005-05-16 21:53:28 -0700602 if (unsynchronized_tsc())
Linus Torvalds1da177e2005-04-16 15:20:36 -0700603 notsc = 1;
Vojtech Pavlika670fad2006-09-26 10:52:28 +0200604
john stultz2d0c87c2007-02-16 01:28:18 -0800605 if (cpu_has(&boot_cpu_data, X86_FEATURE_RDTSCP))
Vojtech Pavlikc08c8202006-09-26 10:52:28 +0200606 vgetcpu_mode = VGETCPU_RDTSCP;
607 else
608 vgetcpu_mode = VGETCPU_LSL;
609
john stultz2d0c87c2007-02-16 01:28:18 -0800610 if (hpet_address && notsc) {
john stultza3a00752005-06-23 00:08:36 -0700611 timetype = hpet_use_timer ? "HPET" : "PIT/HPET";
Chris McDermott33042a92006-02-11 17:55:50 -0800612 if (hpet_use_timer)
613 vxtime.last = hpet_readl(HPET_T0_CMP) - hpet_tick;
614 else
615 vxtime.last = hpet_readl(HPET_COUNTER);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700616 vxtime.mode = VXTIME_HPET;
john stultz2d0c87c2007-02-16 01:28:18 -0800617 vxtime.hpet_address = hpet_address;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700618 do_gettimeoffset = do_gettimeoffset_hpet;
Andi Kleen312df5f2005-05-16 21:53:28 -0700619#ifdef CONFIG_X86_PM_TIMER
620 /* Using PM for gettimeofday is quite slow, but we have no other
621 choice because the TSC is too unreliable on some systems. */
john stultz2d0c87c2007-02-16 01:28:18 -0800622 } else if (pmtmr_ioport && !hpet_address && notsc) {
Andi Kleen312df5f2005-05-16 21:53:28 -0700623 timetype = "PM";
624 do_gettimeoffset = do_gettimeoffset_pm;
625 vxtime.mode = VXTIME_PMTMR;
626 sysctl_vsyscall = 0;
627 printk(KERN_INFO "Disabling vsyscall due to use of PM timer\n");
628#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700629 } else {
john stultza3a00752005-06-23 00:08:36 -0700630 timetype = hpet_use_timer ? "HPET/TSC" : "PIT/TSC";
Linus Torvalds1da177e2005-04-16 15:20:36 -0700631 vxtime.mode = VXTIME_TSC;
632 }
Vojtech Pavlika670fad2006-09-26 10:52:28 +0200633
634 printk(KERN_INFO "time.c: Using %ld.%06ld MHz WALL %s GTOD %s timer.\n",
635 vxtime_hz / 1000000, vxtime_hz % 1000000, timename, timetype);
636 printk(KERN_INFO "time.c: Detected %d.%03d MHz processor.\n",
637 cpu_khz / 1000, cpu_khz % 1000);
638 vxtime.quot = (USEC_PER_SEC << US_SCALE) / vxtime_hz;
639 vxtime.tsc_quot = (USEC_PER_MSEC << US_SCALE) / cpu_khz;
640 vxtime.last_tsc = get_cycles_sync();
641
642 set_cyc2ns_scale(cpu_khz);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700643}
644
645__setup("report_lost_ticks", time_setup);
646
647static long clock_cmos_diff;
648static unsigned long sleep_start;
649
Andi Kleen0b913172006-01-11 22:45:33 +0100650/*
651 * sysfs support for the timer.
652 */
653
Pavel Machek0b9c33a2005-04-16 15:25:31 -0700654static int timer_suspend(struct sys_device *dev, pm_message_t state)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700655{
656 /*
657 * Estimate time zone so that set_time can update the clock
658 */
659 long cmos_time = get_cmos_time();
660
661 clock_cmos_diff = -cmos_time;
662 clock_cmos_diff += get_seconds();
663 sleep_start = cmos_time;
664 return 0;
665}
666
667static int timer_resume(struct sys_device *dev)
668{
669 unsigned long flags;
670 unsigned long sec;
671 unsigned long ctime = get_cmos_time();
Rafael J. Wysocki34464a52006-09-26 10:52:37 +0200672 long sleep_length = (ctime - sleep_start) * HZ;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700673
Rafael J. Wysocki34464a52006-09-26 10:52:37 +0200674 if (sleep_length < 0) {
675 printk(KERN_WARNING "Time skew detected in timer resume!\n");
676 /* The time after the resume must not be earlier than the time
677 * before the suspend or some nasty things will happen
678 */
679 sleep_length = 0;
680 ctime = sleep_start;
681 }
john stultz2d0c87c2007-02-16 01:28:18 -0800682 if (hpet_address)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700683 hpet_reenable();
684 else
685 i8254_timer_resume();
686
687 sec = ctime + clock_cmos_diff;
688 write_seqlock_irqsave(&xtime_lock,flags);
689 xtime.tv_sec = sec;
690 xtime.tv_nsec = 0;
Shaohua Li0dd2ea92006-02-03 21:50:56 +0100691 if (vxtime.mode == VXTIME_HPET) {
692 if (hpet_use_timer)
693 vxtime.last = hpet_readl(HPET_T0_CMP) - hpet_tick;
694 else
695 vxtime.last = hpet_readl(HPET_COUNTER);
696#ifdef CONFIG_X86_PM_TIMER
697 } else if (vxtime.mode == VXTIME_PMTMR) {
698 pmtimer_resume();
699#endif
700 } else
701 vxtime.last_tsc = get_cycles_sync();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700702 write_sequnlock_irqrestore(&xtime_lock,flags);
703 jiffies += sleep_length;
Shaohua Li0dd2ea92006-02-03 21:50:56 +0100704 monotonic_base += sleep_length * (NSEC_PER_SEC/HZ);
Ingo Molnar8446f1d2005-09-06 15:16:27 -0700705 touch_softlockup_watchdog();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700706 return 0;
707}
708
709static struct sysdev_class timer_sysclass = {
710 .resume = timer_resume,
711 .suspend = timer_suspend,
712 set_kset_name("timer"),
713};
714
Linus Torvalds1da177e2005-04-16 15:20:36 -0700715/* XXX this driverfs stuff should probably go elsewhere later -john */
716static struct sys_device device_timer = {
717 .id = 0,
718 .cls = &timer_sysclass,
719};
720
721static int time_init_device(void)
722{
723 int error = sysdev_class_register(&timer_sysclass);
724 if (!error)
725 error = sysdev_register(&device_timer);
726 return error;
727}
728
729device_initcall(time_init_device);