blob: 06f40ae13b7bb45006a1851d19595fe136a973d9 [file] [log] [blame]
john stultz85240702007-05-08 00:27:59 -07001/*
2 * linux/kernel/time/timekeeping.c
3 *
4 * Kernel timekeeping code and accessor functions
5 *
6 * This code was moved from linux/kernel/timer.c.
7 * Please see that file for copyright and history logs.
8 *
9 */
10
11#include <linux/module.h>
12#include <linux/interrupt.h>
13#include <linux/percpu.h>
14#include <linux/init.h>
15#include <linux/mm.h>
Alexey Dobriyand43c36d2009-10-07 17:09:06 +040016#include <linux/sched.h>
Rafael J. Wysockie1a85b22011-03-23 22:16:04 +010017#include <linux/syscore_ops.h>
john stultz85240702007-05-08 00:27:59 -070018#include <linux/clocksource.h>
19#include <linux/jiffies.h>
20#include <linux/time.h>
21#include <linux/tick.h>
Martin Schwidefsky75c51582009-08-14 15:47:30 +020022#include <linux/stop_machine.h>
john stultz85240702007-05-08 00:27:59 -070023
Martin Schwidefsky155ec602009-08-14 15:47:26 +020024/* Structure holding internal timekeeping values. */
25struct timekeeper {
26 /* Current clocksource used for timekeeping. */
27 struct clocksource *clock;
Thomas Gleixner058892e2011-11-13 23:19:48 +000028 /* NTP adjusted clock multiplier */
29 u32 mult;
Martin Schwidefsky23ce7212009-08-14 15:47:27 +020030 /* The shift value of the current clocksource. */
31 int shift;
Martin Schwidefsky155ec602009-08-14 15:47:26 +020032
33 /* Number of clock cycles in one NTP interval. */
34 cycle_t cycle_interval;
35 /* Number of clock shifted nano seconds in one NTP interval. */
36 u64 xtime_interval;
Kasper Pedersena386b5a2010-10-20 15:55:15 -070037 /* shifted nano seconds left over when rounding cycle_interval */
38 s64 xtime_remainder;
Martin Schwidefsky155ec602009-08-14 15:47:26 +020039 /* Raw nano seconds accumulated per NTP interval. */
40 u32 raw_interval;
41
42 /* Clock shifted nano seconds remainder not stored in xtime.tv_nsec. */
43 u64 xtime_nsec;
44 /* Difference between accumulated time and NTP time in ntp
45 * shifted nano seconds. */
46 s64 ntp_error;
Martin Schwidefsky23ce7212009-08-14 15:47:27 +020047 /* Shift conversion between clock shifted nano seconds and
48 * ntp shifted nano seconds. */
49 int ntp_error_shift;
John Stultz00c5fb72011-11-14 11:23:15 -080050
John Stultz8ff2cb92011-11-14 11:40:54 -080051 /* The current time */
52 struct timespec xtime;
John Stultzd9f72172011-11-14 11:29:32 -080053 /*
54 * wall_to_monotonic is what we need to add to xtime (or xtime corrected
55 * for sub jiffie times) to get to monotonic time. Monotonic is pegged
56 * at zero at system boot time, so wall_to_monotonic will be negative,
57 * however, we will ALWAYS keep the tv_nsec part positive so we can use
58 * the usual normalization.
59 *
60 * wall_to_monotonic is moved after resume from suspend for the
61 * monotonic time not to jump. We need to add total_sleep_time to
62 * wall_to_monotonic to get the real boot based time offset.
63 *
64 * - wall_to_monotonic is no longer the boot time, getboottime must be
65 * used instead.
66 */
67 struct timespec wall_to_monotonic;
John Stultz00c5fb72011-11-14 11:23:15 -080068 /* time spent in suspend */
69 struct timespec total_sleep_time;
John Stultz01f71b42011-11-14 11:43:49 -080070 /* The raw monotonic time for the CLOCK_MONOTONIC_RAW posix clock. */
71 struct timespec raw_time;
John Stultz70471f22011-11-14 12:48:10 -080072
73 /* Seqlock for all timekeeper values */
74 seqlock_t lock;
Martin Schwidefsky155ec602009-08-14 15:47:26 +020075};
76
H Hartley Sweetenafa14e72011-01-11 17:59:38 -060077static struct timekeeper timekeeper;
Martin Schwidefsky155ec602009-08-14 15:47:26 +020078
John Stultz8fcce542011-11-14 11:46:39 -080079/*
80 * This read-write spinlock protects us from races in SMP while
81 * playing with xtime.
82 */
83__cacheline_aligned_in_smp DEFINE_SEQLOCK(xtime_lock);
84
85
86/* flag for if timekeeping is suspended */
87int __read_mostly timekeeping_suspended;
88
89
90
Martin Schwidefsky155ec602009-08-14 15:47:26 +020091/**
92 * timekeeper_setup_internals - Set up internals to use clocksource clock.
93 *
94 * @clock: Pointer to clocksource.
95 *
96 * Calculates a fixed cycle/nsec interval for a given clocksource/adjustment
97 * pair and interval request.
98 *
99 * Unless you're the timekeeping code, you should not be using this!
100 */
101static void timekeeper_setup_internals(struct clocksource *clock)
102{
103 cycle_t interval;
Kasper Pedersena386b5a2010-10-20 15:55:15 -0700104 u64 tmp, ntpinterval;
Martin Schwidefsky155ec602009-08-14 15:47:26 +0200105
106 timekeeper.clock = clock;
107 clock->cycle_last = clock->read(clock);
108
109 /* Do the ns -> cycle conversion first, using original mult */
110 tmp = NTP_INTERVAL_LENGTH;
111 tmp <<= clock->shift;
Kasper Pedersena386b5a2010-10-20 15:55:15 -0700112 ntpinterval = tmp;
Martin Schwidefsky0a544192009-08-14 15:47:28 +0200113 tmp += clock->mult/2;
114 do_div(tmp, clock->mult);
Martin Schwidefsky155ec602009-08-14 15:47:26 +0200115 if (tmp == 0)
116 tmp = 1;
117
118 interval = (cycle_t) tmp;
119 timekeeper.cycle_interval = interval;
120
121 /* Go back from cycles -> shifted ns */
122 timekeeper.xtime_interval = (u64) interval * clock->mult;
Kasper Pedersena386b5a2010-10-20 15:55:15 -0700123 timekeeper.xtime_remainder = ntpinterval - timekeeper.xtime_interval;
Martin Schwidefsky155ec602009-08-14 15:47:26 +0200124 timekeeper.raw_interval =
Martin Schwidefsky0a544192009-08-14 15:47:28 +0200125 ((u64) interval * clock->mult) >> clock->shift;
Martin Schwidefsky155ec602009-08-14 15:47:26 +0200126
127 timekeeper.xtime_nsec = 0;
Martin Schwidefsky23ce7212009-08-14 15:47:27 +0200128 timekeeper.shift = clock->shift;
Martin Schwidefsky155ec602009-08-14 15:47:26 +0200129
130 timekeeper.ntp_error = 0;
Martin Schwidefsky23ce7212009-08-14 15:47:27 +0200131 timekeeper.ntp_error_shift = NTP_SCALE_SHIFT - clock->shift;
Martin Schwidefsky0a544192009-08-14 15:47:28 +0200132
133 /*
134 * The timekeeper keeps its own mult values for the currently
135 * active clocksource. These value will be adjusted via NTP
136 * to counteract clock drifting.
137 */
138 timekeeper.mult = clock->mult;
Martin Schwidefsky155ec602009-08-14 15:47:26 +0200139}
john stultz85240702007-05-08 00:27:59 -0700140
Martin Schwidefsky2ba2a302009-08-14 15:47:29 +0200141/* Timekeeper helper functions. */
142static inline s64 timekeeping_get_ns(void)
143{
144 cycle_t cycle_now, cycle_delta;
145 struct clocksource *clock;
146
147 /* read clocksource: */
148 clock = timekeeper.clock;
149 cycle_now = clock->read(clock);
150
151 /* calculate the delta since the last update_wall_time: */
152 cycle_delta = (cycle_now - clock->cycle_last) & clock->mask;
153
154 /* return delta convert to nanoseconds using ntp adjusted mult. */
155 return clocksource_cyc2ns(cycle_delta, timekeeper.mult,
156 timekeeper.shift);
157}
158
159static inline s64 timekeeping_get_ns_raw(void)
160{
161 cycle_t cycle_now, cycle_delta;
162 struct clocksource *clock;
163
164 /* read clocksource: */
165 clock = timekeeper.clock;
166 cycle_now = clock->read(clock);
167
168 /* calculate the delta since the last update_wall_time: */
169 cycle_delta = (cycle_now - clock->cycle_last) & clock->mask;
170
Dan McGeec9fad422011-10-17 13:58:43 -0500171 /* return delta convert to nanoseconds. */
Martin Schwidefsky2ba2a302009-08-14 15:47:29 +0200172 return clocksource_cyc2ns(cycle_delta, clock->mult, clock->shift);
173}
174
John Stultz31089c12009-08-14 15:47:18 +0200175void timekeeping_leap_insert(int leapsecond)
176{
John Stultz70471f22011-11-14 12:48:10 -0800177 unsigned long flags;
178
179 write_seqlock_irqsave(&timekeeper.lock, flags);
180
John Stultz8ff2cb92011-11-14 11:40:54 -0800181 timekeeper.xtime.tv_sec += leapsecond;
John Stultzd9f72172011-11-14 11:29:32 -0800182 timekeeper.wall_to_monotonic.tv_sec -= leapsecond;
John Stultz8ff2cb92011-11-14 11:40:54 -0800183 update_vsyscall(&timekeeper.xtime, &timekeeper.wall_to_monotonic,
184 timekeeper.clock, timekeeper.mult);
John Stultz70471f22011-11-14 12:48:10 -0800185
186 write_sequnlock_irqrestore(&timekeeper.lock, flags);
187
John Stultz31089c12009-08-14 15:47:18 +0200188}
john stultz85240702007-05-08 00:27:59 -0700189
john stultz85240702007-05-08 00:27:59 -0700190/**
Martin Schwidefsky155ec602009-08-14 15:47:26 +0200191 * timekeeping_forward_now - update clock to the current time
john stultz85240702007-05-08 00:27:59 -0700192 *
Roman Zippel9a055112008-08-20 16:37:28 -0700193 * Forward the current clock to update its state since the last call to
194 * update_wall_time(). This is useful before significant clock changes,
195 * as it avoids having to deal with this time offset explicitly.
john stultz85240702007-05-08 00:27:59 -0700196 */
Martin Schwidefsky155ec602009-08-14 15:47:26 +0200197static void timekeeping_forward_now(void)
john stultz85240702007-05-08 00:27:59 -0700198{
199 cycle_t cycle_now, cycle_delta;
Martin Schwidefsky155ec602009-08-14 15:47:26 +0200200 struct clocksource *clock;
Roman Zippel9a055112008-08-20 16:37:28 -0700201 s64 nsec;
john stultz85240702007-05-08 00:27:59 -0700202
Martin Schwidefsky155ec602009-08-14 15:47:26 +0200203 clock = timekeeper.clock;
Martin Schwidefskya0f7d482009-08-14 15:47:19 +0200204 cycle_now = clock->read(clock);
john stultz85240702007-05-08 00:27:59 -0700205 cycle_delta = (cycle_now - clock->cycle_last) & clock->mask;
Roman Zippel9a055112008-08-20 16:37:28 -0700206 clock->cycle_last = cycle_now;
john stultz85240702007-05-08 00:27:59 -0700207
Martin Schwidefsky0a544192009-08-14 15:47:28 +0200208 nsec = clocksource_cyc2ns(cycle_delta, timekeeper.mult,
209 timekeeper.shift);
john stultz7d275582009-05-01 13:10:26 -0700210
211 /* If arch requires, add in gettimeoffset() */
212 nsec += arch_gettimeoffset();
213
John Stultz8ff2cb92011-11-14 11:40:54 -0800214 timespec_add_ns(&timekeeper.xtime, nsec);
John Stultz2d422442008-08-20 16:37:30 -0700215
Martin Schwidefsky0a544192009-08-14 15:47:28 +0200216 nsec = clocksource_cyc2ns(cycle_delta, clock->mult, clock->shift);
John Stultz01f71b42011-11-14 11:43:49 -0800217 timespec_add_ns(&timekeeper.raw_time, nsec);
john stultz85240702007-05-08 00:27:59 -0700218}
219
220/**
Geert Uytterhoevenefd9ac82008-01-30 13:30:01 +0100221 * getnstimeofday - Returns the time of day in a timespec
john stultz85240702007-05-08 00:27:59 -0700222 * @ts: pointer to the timespec to be set
223 *
Geert Uytterhoevenefd9ac82008-01-30 13:30:01 +0100224 * Returns the time of day in a timespec.
john stultz85240702007-05-08 00:27:59 -0700225 */
Geert Uytterhoevenefd9ac82008-01-30 13:30:01 +0100226void getnstimeofday(struct timespec *ts)
john stultz85240702007-05-08 00:27:59 -0700227{
228 unsigned long seq;
229 s64 nsecs;
230
Thomas Gleixner1c5745a2008-12-22 23:05:28 +0100231 WARN_ON(timekeeping_suspended);
232
john stultz85240702007-05-08 00:27:59 -0700233 do {
John Stultz70471f22011-11-14 12:48:10 -0800234 seq = read_seqbegin(&timekeeper.lock);
john stultz85240702007-05-08 00:27:59 -0700235
John Stultz8ff2cb92011-11-14 11:40:54 -0800236 *ts = timekeeper.xtime;
Martin Schwidefsky2ba2a302009-08-14 15:47:29 +0200237 nsecs = timekeeping_get_ns();
john stultz85240702007-05-08 00:27:59 -0700238
john stultz7d275582009-05-01 13:10:26 -0700239 /* If arch requires, add in gettimeoffset() */
240 nsecs += arch_gettimeoffset();
241
John Stultz70471f22011-11-14 12:48:10 -0800242 } while (read_seqretry(&timekeeper.lock, seq));
john stultz85240702007-05-08 00:27:59 -0700243
244 timespec_add_ns(ts, nsecs);
245}
246
john stultz85240702007-05-08 00:27:59 -0700247EXPORT_SYMBOL(getnstimeofday);
248
Martin Schwidefsky951ed4d2009-07-07 11:27:28 +0200249ktime_t ktime_get(void)
250{
Martin Schwidefsky951ed4d2009-07-07 11:27:28 +0200251 unsigned int seq;
252 s64 secs, nsecs;
253
254 WARN_ON(timekeeping_suspended);
255
256 do {
John Stultz70471f22011-11-14 12:48:10 -0800257 seq = read_seqbegin(&timekeeper.lock);
John Stultz8ff2cb92011-11-14 11:40:54 -0800258 secs = timekeeper.xtime.tv_sec +
259 timekeeper.wall_to_monotonic.tv_sec;
260 nsecs = timekeeper.xtime.tv_nsec +
261 timekeeper.wall_to_monotonic.tv_nsec;
Martin Schwidefsky2ba2a302009-08-14 15:47:29 +0200262 nsecs += timekeeping_get_ns();
Hector Palaciosd004e022011-11-14 11:15:25 +0100263 /* If arch requires, add in gettimeoffset() */
264 nsecs += arch_gettimeoffset();
Martin Schwidefsky951ed4d2009-07-07 11:27:28 +0200265
John Stultz70471f22011-11-14 12:48:10 -0800266 } while (read_seqretry(&timekeeper.lock, seq));
Martin Schwidefsky951ed4d2009-07-07 11:27:28 +0200267 /*
268 * Use ktime_set/ktime_add_ns to create a proper ktime on
269 * 32-bit architectures without CONFIG_KTIME_SCALAR.
270 */
271 return ktime_add_ns(ktime_set(secs, 0), nsecs);
272}
273EXPORT_SYMBOL_GPL(ktime_get);
274
275/**
276 * ktime_get_ts - get the monotonic clock in timespec format
277 * @ts: pointer to timespec variable
278 *
279 * The function calculates the monotonic clock from the realtime
280 * clock and the wall_to_monotonic offset and stores the result
281 * in normalized timespec format in the variable pointed to by @ts.
282 */
283void ktime_get_ts(struct timespec *ts)
284{
Martin Schwidefsky951ed4d2009-07-07 11:27:28 +0200285 struct timespec tomono;
286 unsigned int seq;
287 s64 nsecs;
288
289 WARN_ON(timekeeping_suspended);
290
291 do {
John Stultz70471f22011-11-14 12:48:10 -0800292 seq = read_seqbegin(&timekeeper.lock);
John Stultz8ff2cb92011-11-14 11:40:54 -0800293 *ts = timekeeper.xtime;
John Stultzd9f72172011-11-14 11:29:32 -0800294 tomono = timekeeper.wall_to_monotonic;
Martin Schwidefsky2ba2a302009-08-14 15:47:29 +0200295 nsecs = timekeeping_get_ns();
Hector Palaciosd004e022011-11-14 11:15:25 +0100296 /* If arch requires, add in gettimeoffset() */
297 nsecs += arch_gettimeoffset();
Martin Schwidefsky951ed4d2009-07-07 11:27:28 +0200298
John Stultz70471f22011-11-14 12:48:10 -0800299 } while (read_seqretry(&timekeeper.lock, seq));
Martin Schwidefsky951ed4d2009-07-07 11:27:28 +0200300
301 set_normalized_timespec(ts, ts->tv_sec + tomono.tv_sec,
302 ts->tv_nsec + tomono.tv_nsec + nsecs);
303}
304EXPORT_SYMBOL_GPL(ktime_get_ts);
305
#ifdef CONFIG_NTP_PPS

/**
 * getnstime_raw_and_real - get day and raw monotonic time in timespec format
 * @ts_raw:	pointer to the timespec to be set to raw monotonic time
 * @ts_real:	pointer to the timespec to be set to the time of day
 *
 * This function reads both the time of day and raw monotonic time at the
 * same time atomically and stores the resulting timestamps in timespec
 * format.
 */
void getnstime_raw_and_real(struct timespec *ts_raw, struct timespec *ts_real)
{
	unsigned long seqcount;
	s64 raw_ns, real_ns;

	WARN_ON_ONCE(timekeeping_suspended);

	do {
		u32 arch_ns;

		seqcount = read_seqbegin(&timekeeper.lock);

		*ts_raw = timekeeper.raw_time;
		*ts_real = timekeeper.xtime;

		raw_ns = timekeeping_get_ns_raw();
		real_ns = timekeeping_get_ns();

		/* If arch requires, add in gettimeoffset() (to both clocks) */
		arch_ns = arch_gettimeoffset();
		raw_ns += arch_ns;
		real_ns += arch_ns;

	} while (read_seqretry(&timekeeper.lock, seqcount));

	timespec_add_ns(ts_raw, raw_ns);
	timespec_add_ns(ts_real, real_ns);
}
EXPORT_SYMBOL(getnstime_raw_and_real);

#endif /* CONFIG_NTP_PPS */
348
john stultz85240702007-05-08 00:27:59 -0700349/**
350 * do_gettimeofday - Returns the time of day in a timeval
351 * @tv: pointer to the timeval to be set
352 *
Geert Uytterhoevenefd9ac82008-01-30 13:30:01 +0100353 * NOTE: Users should be converted to using getnstimeofday()
john stultz85240702007-05-08 00:27:59 -0700354 */
355void do_gettimeofday(struct timeval *tv)
356{
357 struct timespec now;
358
Geert Uytterhoevenefd9ac82008-01-30 13:30:01 +0100359 getnstimeofday(&now);
john stultz85240702007-05-08 00:27:59 -0700360 tv->tv_sec = now.tv_sec;
361 tv->tv_usec = now.tv_nsec/1000;
362}
363
364EXPORT_SYMBOL(do_gettimeofday);
365/**
366 * do_settimeofday - Sets the time of day
367 * @tv: pointer to the timespec variable containing the new time
368 *
369 * Sets the time of day to the new time and update NTP and notify hrtimers
370 */
Richard Cochran1e6d7672011-02-01 13:50:58 +0000371int do_settimeofday(const struct timespec *tv)
john stultz85240702007-05-08 00:27:59 -0700372{
Roman Zippel9a055112008-08-20 16:37:28 -0700373 struct timespec ts_delta;
John Stultz92c1d3e2011-11-14 14:05:44 -0800374 unsigned long flags;
john stultz85240702007-05-08 00:27:59 -0700375
376 if ((unsigned long)tv->tv_nsec >= NSEC_PER_SEC)
377 return -EINVAL;
378
John Stultz92c1d3e2011-11-14 14:05:44 -0800379 write_seqlock_irqsave(&timekeeper.lock, flags);
john stultz85240702007-05-08 00:27:59 -0700380
Martin Schwidefsky155ec602009-08-14 15:47:26 +0200381 timekeeping_forward_now();
john stultz85240702007-05-08 00:27:59 -0700382
John Stultz8ff2cb92011-11-14 11:40:54 -0800383 ts_delta.tv_sec = tv->tv_sec - timekeeper.xtime.tv_sec;
384 ts_delta.tv_nsec = tv->tv_nsec - timekeeper.xtime.tv_nsec;
John Stultzd9f72172011-11-14 11:29:32 -0800385 timekeeper.wall_to_monotonic =
386 timespec_sub(timekeeper.wall_to_monotonic, ts_delta);
john stultz85240702007-05-08 00:27:59 -0700387
John Stultz8ff2cb92011-11-14 11:40:54 -0800388 timekeeper.xtime = *tv;
Roman Zippel9a055112008-08-20 16:37:28 -0700389
Martin Schwidefsky155ec602009-08-14 15:47:26 +0200390 timekeeper.ntp_error = 0;
john stultz85240702007-05-08 00:27:59 -0700391 ntp_clear();
392
John Stultz8ff2cb92011-11-14 11:40:54 -0800393 update_vsyscall(&timekeeper.xtime, &timekeeper.wall_to_monotonic,
394 timekeeper.clock, timekeeper.mult);
john stultz85240702007-05-08 00:27:59 -0700395
John Stultz92c1d3e2011-11-14 14:05:44 -0800396 write_sequnlock_irqrestore(&timekeeper.lock, flags);
john stultz85240702007-05-08 00:27:59 -0700397
398 /* signal hrtimers about time change */
399 clock_was_set();
400
401 return 0;
402}
403
404EXPORT_SYMBOL(do_settimeofday);
405
John Stultzc528f7c2011-02-01 13:52:17 +0000406
407/**
408 * timekeeping_inject_offset - Adds or subtracts from the current time.
409 * @tv: pointer to the timespec variable containing the offset
410 *
411 * Adds or subtracts an offset value from the current time.
412 */
413int timekeeping_inject_offset(struct timespec *ts)
414{
John Stultz92c1d3e2011-11-14 14:05:44 -0800415 unsigned long flags;
John Stultzc528f7c2011-02-01 13:52:17 +0000416
417 if ((unsigned long)ts->tv_nsec >= NSEC_PER_SEC)
418 return -EINVAL;
419
John Stultz92c1d3e2011-11-14 14:05:44 -0800420 write_seqlock_irqsave(&timekeeper.lock, flags);
John Stultzc528f7c2011-02-01 13:52:17 +0000421
422 timekeeping_forward_now();
423
John Stultz8ff2cb92011-11-14 11:40:54 -0800424 timekeeper.xtime = timespec_add(timekeeper.xtime, *ts);
John Stultzd9f72172011-11-14 11:29:32 -0800425 timekeeper.wall_to_monotonic =
426 timespec_sub(timekeeper.wall_to_monotonic, *ts);
John Stultzc528f7c2011-02-01 13:52:17 +0000427
428 timekeeper.ntp_error = 0;
429 ntp_clear();
430
John Stultz8ff2cb92011-11-14 11:40:54 -0800431 update_vsyscall(&timekeeper.xtime, &timekeeper.wall_to_monotonic,
432 timekeeper.clock, timekeeper.mult);
John Stultzc528f7c2011-02-01 13:52:17 +0000433
John Stultz92c1d3e2011-11-14 14:05:44 -0800434 write_sequnlock_irqrestore(&timekeeper.lock, flags);
John Stultzc528f7c2011-02-01 13:52:17 +0000435
436 /* signal hrtimers about time change */
437 clock_was_set();
438
439 return 0;
440}
441EXPORT_SYMBOL(timekeeping_inject_offset);
442
john stultz85240702007-05-08 00:27:59 -0700443/**
444 * change_clocksource - Swaps clocksources if a new one is available
445 *
446 * Accumulates current time interval and initializes new clocksource
447 */
Martin Schwidefsky75c51582009-08-14 15:47:30 +0200448static int change_clocksource(void *data)
john stultz85240702007-05-08 00:27:59 -0700449{
Magnus Damm4614e6a2009-04-21 12:24:02 -0700450 struct clocksource *new, *old;
john stultz85240702007-05-08 00:27:59 -0700451
Martin Schwidefsky75c51582009-08-14 15:47:30 +0200452 new = (struct clocksource *) data;
john stultz85240702007-05-08 00:27:59 -0700453
Martin Schwidefsky155ec602009-08-14 15:47:26 +0200454 timekeeping_forward_now();
Martin Schwidefsky75c51582009-08-14 15:47:30 +0200455 if (!new->enable || new->enable(new) == 0) {
456 old = timekeeper.clock;
457 timekeeper_setup_internals(new);
458 if (old->disable)
459 old->disable(old);
460 }
461 return 0;
462}
john stultz85240702007-05-08 00:27:59 -0700463
Martin Schwidefsky75c51582009-08-14 15:47:30 +0200464/**
465 * timekeeping_notify - Install a new clock source
466 * @clock: pointer to the clock source
467 *
468 * This function is called from clocksource.c after a new, better clock
469 * source has been registered. The caller holds the clocksource_mutex.
470 */
471void timekeeping_notify(struct clocksource *clock)
472{
473 if (timekeeper.clock == clock)
Magnus Damm4614e6a2009-04-21 12:24:02 -0700474 return;
Martin Schwidefsky75c51582009-08-14 15:47:30 +0200475 stop_machine(change_clocksource, clock, NULL);
john stultz85240702007-05-08 00:27:59 -0700476 tick_clock_notify();
john stultz85240702007-05-08 00:27:59 -0700477}
Martin Schwidefsky75c51582009-08-14 15:47:30 +0200478
Thomas Gleixnera40f2622009-07-07 13:00:31 +0200479/**
480 * ktime_get_real - get the real (wall-) time in ktime_t format
481 *
482 * returns the time in ktime_t format
483 */
484ktime_t ktime_get_real(void)
485{
486 struct timespec now;
487
488 getnstimeofday(&now);
489
490 return timespec_to_ktime(now);
491}
492EXPORT_SYMBOL_GPL(ktime_get_real);
john stultz85240702007-05-08 00:27:59 -0700493
494/**
John Stultz2d422442008-08-20 16:37:30 -0700495 * getrawmonotonic - Returns the raw monotonic time in a timespec
496 * @ts: pointer to the timespec to be set
497 *
498 * Returns the raw monotonic time (completely un-modified by ntp)
499 */
500void getrawmonotonic(struct timespec *ts)
501{
502 unsigned long seq;
503 s64 nsecs;
John Stultz2d422442008-08-20 16:37:30 -0700504
505 do {
John Stultz70471f22011-11-14 12:48:10 -0800506 seq = read_seqbegin(&timekeeper.lock);
Martin Schwidefsky2ba2a302009-08-14 15:47:29 +0200507 nsecs = timekeeping_get_ns_raw();
John Stultz01f71b42011-11-14 11:43:49 -0800508 *ts = timekeeper.raw_time;
John Stultz2d422442008-08-20 16:37:30 -0700509
John Stultz70471f22011-11-14 12:48:10 -0800510 } while (read_seqretry(&timekeeper.lock, seq));
John Stultz2d422442008-08-20 16:37:30 -0700511
512 timespec_add_ns(ts, nsecs);
513}
514EXPORT_SYMBOL(getrawmonotonic);
515
516
517/**
Li Zefancf4fc6c2008-02-08 04:19:24 -0800518 * timekeeping_valid_for_hres - Check if timekeeping is suitable for hres
john stultz85240702007-05-08 00:27:59 -0700519 */
Li Zefancf4fc6c2008-02-08 04:19:24 -0800520int timekeeping_valid_for_hres(void)
john stultz85240702007-05-08 00:27:59 -0700521{
522 unsigned long seq;
523 int ret;
524
525 do {
John Stultz70471f22011-11-14 12:48:10 -0800526 seq = read_seqbegin(&timekeeper.lock);
john stultz85240702007-05-08 00:27:59 -0700527
Martin Schwidefsky155ec602009-08-14 15:47:26 +0200528 ret = timekeeper.clock->flags & CLOCK_SOURCE_VALID_FOR_HRES;
john stultz85240702007-05-08 00:27:59 -0700529
John Stultz70471f22011-11-14 12:48:10 -0800530 } while (read_seqretry(&timekeeper.lock, seq));
john stultz85240702007-05-08 00:27:59 -0700531
532 return ret;
533}
534
535/**
Jon Hunter98962462009-08-18 12:45:10 -0500536 * timekeeping_max_deferment - Returns max time the clocksource can be deferred
Jon Hunter98962462009-08-18 12:45:10 -0500537 */
538u64 timekeeping_max_deferment(void)
539{
John Stultz70471f22011-11-14 12:48:10 -0800540 unsigned long seq;
541 u64 ret;
542 do {
543 seq = read_seqbegin(&timekeeper.lock);
544
545 ret = timekeeper.clock->max_idle_ns;
546
547 } while (read_seqretry(&timekeeper.lock, seq));
548
549 return ret;
Jon Hunter98962462009-08-18 12:45:10 -0500550}
551
/**
 * read_persistent_clock -  Return time from the persistent clock.
 * @ts:		pointer to the timespec to be filled in
 *
 * Weak dummy function for arches that do not yet support it.
 * Reads the time from the battery backed persistent clock.
 * Returns a timespec with tv_sec=0 and tv_nsec=0 if unsupported,
 * which is all this default implementation ever does.
 *
 *  XXX - Do be sure to remove it once all arches implement it.
 */
void __attribute__((weak)) read_persistent_clock(struct timespec *ts)
{
	/* "unsupported" marker: all-zero time */
	ts->tv_nsec = 0;
	ts->tv_sec = 0;
}
566
/**
 * read_boot_clock -  Return time of the system start.
 * @ts:		pointer to the timespec to be filled in
 *
 * Weak dummy function for arches that do not yet support it.
 * Function to read the exact time the system has been started.
 * Returns a timespec with tv_sec=0 and tv_nsec=0 if unsupported,
 * which is all this default implementation ever does.
 *
 *  XXX - Do be sure to remove it once all arches implement it.
 */
void __attribute__((weak)) read_boot_clock(struct timespec *ts)
{
	/* "unsupported" marker: all-zero time */
	ts->tv_nsec = 0;
	ts->tv_sec = 0;
}
581
john stultz85240702007-05-08 00:27:59 -0700582/*
583 * timekeeping_init - Initializes the clocksource and common timekeeping values
584 */
585void __init timekeeping_init(void)
586{
Martin Schwidefsky155ec602009-08-14 15:47:26 +0200587 struct clocksource *clock;
john stultz85240702007-05-08 00:27:59 -0700588 unsigned long flags;
Martin Schwidefsky23970e32009-08-14 15:47:32 +0200589 struct timespec now, boot;
Martin Schwidefskyd4f587c2009-08-14 15:47:31 +0200590
591 read_persistent_clock(&now);
Martin Schwidefsky23970e32009-08-14 15:47:32 +0200592 read_boot_clock(&boot);
john stultz85240702007-05-08 00:27:59 -0700593
John Stultz70471f22011-11-14 12:48:10 -0800594 seqlock_init(&timekeeper.lock);
595
Roman Zippel7dffa3c2008-05-01 04:34:41 -0700596 ntp_init();
john stultz85240702007-05-08 00:27:59 -0700597
John Stultz70471f22011-11-14 12:48:10 -0800598 write_seqlock_irqsave(&timekeeper.lock, flags);
Martin Schwidefskyf1b82742009-08-14 15:47:21 +0200599 clock = clocksource_default_clock();
Martin Schwidefskya0f7d482009-08-14 15:47:19 +0200600 if (clock->enable)
601 clock->enable(clock);
Martin Schwidefsky155ec602009-08-14 15:47:26 +0200602 timekeeper_setup_internals(clock);
john stultz85240702007-05-08 00:27:59 -0700603
John Stultz8ff2cb92011-11-14 11:40:54 -0800604 timekeeper.xtime.tv_sec = now.tv_sec;
605 timekeeper.xtime.tv_nsec = now.tv_nsec;
John Stultz01f71b42011-11-14 11:43:49 -0800606 timekeeper.raw_time.tv_sec = 0;
607 timekeeper.raw_time.tv_nsec = 0;
Martin Schwidefsky23970e32009-08-14 15:47:32 +0200608 if (boot.tv_sec == 0 && boot.tv_nsec == 0) {
John Stultz8ff2cb92011-11-14 11:40:54 -0800609 boot.tv_sec = timekeeper.xtime.tv_sec;
610 boot.tv_nsec = timekeeper.xtime.tv_nsec;
Martin Schwidefsky23970e32009-08-14 15:47:32 +0200611 }
John Stultzd9f72172011-11-14 11:29:32 -0800612 set_normalized_timespec(&timekeeper.wall_to_monotonic,
Martin Schwidefsky23970e32009-08-14 15:47:32 +0200613 -boot.tv_sec, -boot.tv_nsec);
John Stultz00c5fb72011-11-14 11:23:15 -0800614 timekeeper.total_sleep_time.tv_sec = 0;
615 timekeeper.total_sleep_time.tv_nsec = 0;
John Stultz70471f22011-11-14 12:48:10 -0800616 write_sequnlock_irqrestore(&timekeeper.lock, flags);
john stultz85240702007-05-08 00:27:59 -0700617}
618
john stultz85240702007-05-08 00:27:59 -0700619/* time in seconds when suspend began */
Martin Schwidefskyd4f587c2009-08-14 15:47:31 +0200620static struct timespec timekeeping_suspend_time;
john stultz85240702007-05-08 00:27:59 -0700621
622/**
John Stultz304529b2011-04-01 14:32:09 -0700623 * __timekeeping_inject_sleeptime - Internal function to add sleep interval
624 * @delta: pointer to a timespec delta value
625 *
626 * Takes a timespec offset measuring a suspend interval and properly
627 * adds the sleep offset to the timekeeping variables.
628 */
629static void __timekeeping_inject_sleeptime(struct timespec *delta)
630{
John Stultzcb5de2f8d2011-06-01 18:18:09 -0700631 if (!timespec_valid(delta)) {
John Stultzcbaa5152011-07-20 15:42:55 -0700632 printk(KERN_WARNING "__timekeeping_inject_sleeptime: Invalid "
John Stultzcb5de2f8d2011-06-01 18:18:09 -0700633 "sleep delta value!\n");
634 return;
635 }
636
John Stultz8ff2cb92011-11-14 11:40:54 -0800637 timekeeper.xtime = timespec_add(timekeeper.xtime, *delta);
John Stultzd9f72172011-11-14 11:29:32 -0800638 timekeeper.wall_to_monotonic =
639 timespec_sub(timekeeper.wall_to_monotonic, *delta);
John Stultz00c5fb72011-11-14 11:23:15 -0800640 timekeeper.total_sleep_time = timespec_add(
641 timekeeper.total_sleep_time, *delta);
John Stultz304529b2011-04-01 14:32:09 -0700642}
643
644
645/**
646 * timekeeping_inject_sleeptime - Adds suspend interval to timeekeeping values
647 * @delta: pointer to a timespec delta value
648 *
649 * This hook is for architectures that cannot support read_persistent_clock
650 * because their RTC/persistent clock is only accessible when irqs are enabled.
651 *
652 * This function should only be called by rtc_resume(), and allows
653 * a suspend offset to be injected into the timekeeping values.
654 */
655void timekeeping_inject_sleeptime(struct timespec *delta)
656{
John Stultz92c1d3e2011-11-14 14:05:44 -0800657 unsigned long flags;
John Stultz304529b2011-04-01 14:32:09 -0700658 struct timespec ts;
659
660 /* Make sure we don't set the clock twice */
661 read_persistent_clock(&ts);
662 if (!(ts.tv_sec == 0 && ts.tv_nsec == 0))
663 return;
664
John Stultz92c1d3e2011-11-14 14:05:44 -0800665 write_seqlock_irqsave(&timekeeper.lock, flags);
John Stultz70471f22011-11-14 12:48:10 -0800666
John Stultz304529b2011-04-01 14:32:09 -0700667 timekeeping_forward_now();
668
669 __timekeeping_inject_sleeptime(delta);
670
671 timekeeper.ntp_error = 0;
672 ntp_clear();
John Stultz8ff2cb92011-11-14 11:40:54 -0800673 update_vsyscall(&timekeeper.xtime, &timekeeper.wall_to_monotonic,
674 timekeeper.clock, timekeeper.mult);
John Stultz304529b2011-04-01 14:32:09 -0700675
John Stultz92c1d3e2011-11-14 14:05:44 -0800676 write_sequnlock_irqrestore(&timekeeper.lock, flags);
John Stultz304529b2011-04-01 14:32:09 -0700677
678 /* signal hrtimers about time change */
679 clock_was_set();
680}
681
682
683/**
john stultz85240702007-05-08 00:27:59 -0700684 * timekeeping_resume - Resumes the generic timekeeping subsystem.
john stultz85240702007-05-08 00:27:59 -0700685 *
686 * This is for the generic clocksource timekeeping.
687 * xtime/wall_to_monotonic/jiffies/etc are
688 * still managed by arch specific suspend/resume code.
689 */
Rafael J. Wysockie1a85b22011-03-23 22:16:04 +0100690static void timekeeping_resume(void)
john stultz85240702007-05-08 00:27:59 -0700691{
John Stultz92c1d3e2011-11-14 14:05:44 -0800692 unsigned long flags;
Martin Schwidefskyd4f587c2009-08-14 15:47:31 +0200693 struct timespec ts;
694
695 read_persistent_clock(&ts);
john stultz85240702007-05-08 00:27:59 -0700696
Thomas Gleixnerd10ff3f2007-05-14 11:10:02 +0200697 clocksource_resume();
698
John Stultz92c1d3e2011-11-14 14:05:44 -0800699 write_seqlock_irqsave(&timekeeper.lock, flags);
john stultz85240702007-05-08 00:27:59 -0700700
Martin Schwidefskyd4f587c2009-08-14 15:47:31 +0200701 if (timespec_compare(&ts, &timekeeping_suspend_time) > 0) {
702 ts = timespec_sub(ts, timekeeping_suspend_time);
John Stultz304529b2011-04-01 14:32:09 -0700703 __timekeeping_inject_sleeptime(&ts);
john stultz85240702007-05-08 00:27:59 -0700704 }
705 /* re-base the last cycle value */
Martin Schwidefsky155ec602009-08-14 15:47:26 +0200706 timekeeper.clock->cycle_last = timekeeper.clock->read(timekeeper.clock);
707 timekeeper.ntp_error = 0;
john stultz85240702007-05-08 00:27:59 -0700708 timekeeping_suspended = 0;
John Stultz92c1d3e2011-11-14 14:05:44 -0800709 write_sequnlock_irqrestore(&timekeeper.lock, flags);
john stultz85240702007-05-08 00:27:59 -0700710
711 touch_softlockup_watchdog();
712
713 clockevents_notify(CLOCK_EVT_NOTIFY_RESUME, NULL);
714
715 /* Resume hrtimers */
Thomas Gleixnerb12a03c2011-05-02 16:48:57 +0200716 hrtimers_resume();
john stultz85240702007-05-08 00:27:59 -0700717}
718
Rafael J. Wysockie1a85b22011-03-23 22:16:04 +0100719static int timekeeping_suspend(void)
john stultz85240702007-05-08 00:27:59 -0700720{
John Stultz92c1d3e2011-11-14 14:05:44 -0800721 unsigned long flags;
John Stultzcb332172011-05-31 22:53:23 -0700722 struct timespec delta, delta_delta;
723 static struct timespec old_delta;
john stultz85240702007-05-08 00:27:59 -0700724
Martin Schwidefskyd4f587c2009-08-14 15:47:31 +0200725 read_persistent_clock(&timekeeping_suspend_time);
Thomas Gleixner3be90952007-09-16 15:36:43 +0200726
John Stultz92c1d3e2011-11-14 14:05:44 -0800727 write_seqlock_irqsave(&timekeeper.lock, flags);
Martin Schwidefsky155ec602009-08-14 15:47:26 +0200728 timekeeping_forward_now();
john stultz85240702007-05-08 00:27:59 -0700729 timekeeping_suspended = 1;
John Stultzcb332172011-05-31 22:53:23 -0700730
731 /*
732 * To avoid drift caused by repeated suspend/resumes,
733 * which each can add ~1 second drift error,
734 * try to compensate so the difference in system time
735 * and persistent_clock time stays close to constant.
736 */
John Stultz8ff2cb92011-11-14 11:40:54 -0800737 delta = timespec_sub(timekeeper.xtime, timekeeping_suspend_time);
John Stultzcb332172011-05-31 22:53:23 -0700738 delta_delta = timespec_sub(delta, old_delta);
739 if (abs(delta_delta.tv_sec) >= 2) {
740 /*
741 * if delta_delta is too large, assume time correction
742 * has occured and set old_delta to the current delta.
743 */
744 old_delta = delta;
745 } else {
746 /* Otherwise try to adjust old_system to compensate */
747 timekeeping_suspend_time =
748 timespec_add(timekeeping_suspend_time, delta_delta);
749 }
John Stultz92c1d3e2011-11-14 14:05:44 -0800750 write_sequnlock_irqrestore(&timekeeper.lock, flags);
john stultz85240702007-05-08 00:27:59 -0700751
752 clockevents_notify(CLOCK_EVT_NOTIFY_SUSPEND, NULL);
Magnus Dammc54a42b2010-02-02 14:41:41 -0800753 clocksource_suspend();
john stultz85240702007-05-08 00:27:59 -0700754
755 return 0;
756}
757
758/* sysfs resume/suspend bits for timekeeping */
Rafael J. Wysockie1a85b22011-03-23 22:16:04 +0100759static struct syscore_ops timekeeping_syscore_ops = {
john stultz85240702007-05-08 00:27:59 -0700760 .resume = timekeeping_resume,
761 .suspend = timekeeping_suspend,
john stultz85240702007-05-08 00:27:59 -0700762};
763
Rafael J. Wysockie1a85b22011-03-23 22:16:04 +0100764static int __init timekeeping_init_ops(void)
john stultz85240702007-05-08 00:27:59 -0700765{
Rafael J. Wysockie1a85b22011-03-23 22:16:04 +0100766 register_syscore_ops(&timekeeping_syscore_ops);
767 return 0;
john stultz85240702007-05-08 00:27:59 -0700768}
769
Rafael J. Wysockie1a85b22011-03-23 22:16:04 +0100770device_initcall(timekeeping_init_ops);
john stultz85240702007-05-08 00:27:59 -0700771
772/*
773 * If the error is already larger, we look ahead even further
774 * to compensate for late or lost adjustments.
775 */
Martin Schwidefsky155ec602009-08-14 15:47:26 +0200776static __always_inline int timekeeping_bigadjust(s64 error, s64 *interval,
john stultz85240702007-05-08 00:27:59 -0700777 s64 *offset)
778{
779 s64 tick_error, i;
780 u32 look_ahead, adj;
781 s32 error2, mult;
782
783 /*
784 * Use the current error value to determine how much to look ahead.
785 * The larger the error the slower we adjust for it to avoid problems
786 * with losing too many ticks, otherwise we would overadjust and
787 * produce an even larger error. The smaller the adjustment the
788 * faster we try to adjust for it, as lost ticks can do less harm
Li Zefan3eb05672008-02-08 04:19:25 -0800789 * here. This is tuned so that an error of about 1 msec is adjusted
john stultz85240702007-05-08 00:27:59 -0700790 * within about 1 sec (or 2^20 nsec in 2^SHIFT_HZ ticks).
791 */
Martin Schwidefsky155ec602009-08-14 15:47:26 +0200792 error2 = timekeeper.ntp_error >> (NTP_SCALE_SHIFT + 22 - 2 * SHIFT_HZ);
john stultz85240702007-05-08 00:27:59 -0700793 error2 = abs(error2);
794 for (look_ahead = 0; error2 > 0; look_ahead++)
795 error2 >>= 2;
796
797 /*
798 * Now calculate the error in (1 << look_ahead) ticks, but first
799 * remove the single look ahead already included in the error.
800 */
John Stultzea7cf49a2011-11-14 13:18:07 -0800801 tick_error = ntp_tick_length() >> (timekeeper.ntp_error_shift + 1);
Martin Schwidefsky155ec602009-08-14 15:47:26 +0200802 tick_error -= timekeeper.xtime_interval >> 1;
john stultz85240702007-05-08 00:27:59 -0700803 error = ((error - tick_error) >> look_ahead) + tick_error;
804
805 /* Finally calculate the adjustment shift value. */
806 i = *interval;
807 mult = 1;
808 if (error < 0) {
809 error = -error;
810 *interval = -*interval;
811 *offset = -*offset;
812 mult = -1;
813 }
814 for (adj = 0; error > i; adj++)
815 error >>= 1;
816
817 *interval <<= adj;
818 *offset <<= adj;
819 return mult << adj;
820}
821
822/*
823 * Adjust the multiplier to reduce the error value,
824 * this is optimized for the most common adjustments of -1,0,1,
825 * for other values we can do a bit more work.
826 */
Martin Schwidefsky155ec602009-08-14 15:47:26 +0200827static void timekeeping_adjust(s64 offset)
john stultz85240702007-05-08 00:27:59 -0700828{
Martin Schwidefsky155ec602009-08-14 15:47:26 +0200829 s64 error, interval = timekeeper.cycle_interval;
john stultz85240702007-05-08 00:27:59 -0700830 int adj;
831
John Stultzc2bc1112011-10-27 18:12:42 -0700832 /*
833 * The point of this is to check if the error is greater then half
834 * an interval.
835 *
836 * First we shift it down from NTP_SHIFT to clocksource->shifted nsecs.
837 *
838 * Note we subtract one in the shift, so that error is really error*2.
John Stultz3f86f282011-10-27 17:41:17 -0700839 * This "saves" dividing(shifting) interval twice, but keeps the
840 * (error > interval) comparison as still measuring if error is
John Stultzc2bc1112011-10-27 18:12:42 -0700841 * larger then half an interval.
842 *
John Stultz3f86f282011-10-27 17:41:17 -0700843 * Note: It does not "save" on aggravation when reading the code.
John Stultzc2bc1112011-10-27 18:12:42 -0700844 */
Martin Schwidefsky23ce7212009-08-14 15:47:27 +0200845 error = timekeeper.ntp_error >> (timekeeper.ntp_error_shift - 1);
john stultz85240702007-05-08 00:27:59 -0700846 if (error > interval) {
John Stultzc2bc1112011-10-27 18:12:42 -0700847 /*
848 * We now divide error by 4(via shift), which checks if
849 * the error is greater then twice the interval.
850 * If it is greater, we need a bigadjust, if its smaller,
851 * we can adjust by 1.
852 */
john stultz85240702007-05-08 00:27:59 -0700853 error >>= 2;
John Stultzc2bc1112011-10-27 18:12:42 -0700854 /*
855 * XXX - In update_wall_time, we round up to the next
856 * nanosecond, and store the amount rounded up into
857 * the error. This causes the likely below to be unlikely.
858 *
John Stultz3f86f282011-10-27 17:41:17 -0700859 * The proper fix is to avoid rounding up by using
John Stultzc2bc1112011-10-27 18:12:42 -0700860 * the high precision timekeeper.xtime_nsec instead of
861 * xtime.tv_nsec everywhere. Fixing this will take some
862 * time.
863 */
john stultz85240702007-05-08 00:27:59 -0700864 if (likely(error <= interval))
865 adj = 1;
866 else
Martin Schwidefsky155ec602009-08-14 15:47:26 +0200867 adj = timekeeping_bigadjust(error, &interval, &offset);
john stultz85240702007-05-08 00:27:59 -0700868 } else if (error < -interval) {
John Stultzc2bc1112011-10-27 18:12:42 -0700869 /* See comment above, this is just switched for the negative */
john stultz85240702007-05-08 00:27:59 -0700870 error >>= 2;
871 if (likely(error >= -interval)) {
872 adj = -1;
873 interval = -interval;
874 offset = -offset;
875 } else
Martin Schwidefsky155ec602009-08-14 15:47:26 +0200876 adj = timekeeping_bigadjust(error, &interval, &offset);
John Stultzc2bc1112011-10-27 18:12:42 -0700877 } else /* No adjustment needed */
john stultz85240702007-05-08 00:27:59 -0700878 return;
879
John Stultzd65670a2011-10-31 17:06:35 -0400880 WARN_ONCE(timekeeper.clock->maxadj &&
881 (timekeeper.mult + adj > timekeeper.clock->mult +
882 timekeeper.clock->maxadj),
883 "Adjusting %s more then 11%% (%ld vs %ld)\n",
884 timekeeper.clock->name, (long)timekeeper.mult + adj,
885 (long)timekeeper.clock->mult +
886 timekeeper.clock->maxadj);
John Stultzc2bc1112011-10-27 18:12:42 -0700887 /*
888 * So the following can be confusing.
889 *
890 * To keep things simple, lets assume adj == 1 for now.
891 *
892 * When adj != 1, remember that the interval and offset values
893 * have been appropriately scaled so the math is the same.
894 *
895 * The basic idea here is that we're increasing the multiplier
896 * by one, this causes the xtime_interval to be incremented by
897 * one cycle_interval. This is because:
898 * xtime_interval = cycle_interval * mult
899 * So if mult is being incremented by one:
900 * xtime_interval = cycle_interval * (mult + 1)
901 * Its the same as:
902 * xtime_interval = (cycle_interval * mult) + cycle_interval
903 * Which can be shortened to:
904 * xtime_interval += cycle_interval
905 *
906 * So offset stores the non-accumulated cycles. Thus the current
907 * time (in shifted nanoseconds) is:
908 * now = (offset * adj) + xtime_nsec
909 * Now, even though we're adjusting the clock frequency, we have
910 * to keep time consistent. In other words, we can't jump back
911 * in time, and we also want to avoid jumping forward in time.
912 *
913 * So given the same offset value, we need the time to be the same
914 * both before and after the freq adjustment.
915 * now = (offset * adj_1) + xtime_nsec_1
916 * now = (offset * adj_2) + xtime_nsec_2
917 * So:
918 * (offset * adj_1) + xtime_nsec_1 =
919 * (offset * adj_2) + xtime_nsec_2
920 * And we know:
921 * adj_2 = adj_1 + 1
922 * So:
923 * (offset * adj_1) + xtime_nsec_1 =
924 * (offset * (adj_1+1)) + xtime_nsec_2
925 * (offset * adj_1) + xtime_nsec_1 =
926 * (offset * adj_1) + offset + xtime_nsec_2
927 * Canceling the sides:
928 * xtime_nsec_1 = offset + xtime_nsec_2
929 * Which gives us:
930 * xtime_nsec_2 = xtime_nsec_1 - offset
931 * Which simplfies to:
932 * xtime_nsec -= offset
933 *
934 * XXX - TODO: Doc ntp_error calculation.
935 */
Martin Schwidefsky0a544192009-08-14 15:47:28 +0200936 timekeeper.mult += adj;
Martin Schwidefsky155ec602009-08-14 15:47:26 +0200937 timekeeper.xtime_interval += interval;
938 timekeeper.xtime_nsec -= offset;
939 timekeeper.ntp_error -= (interval - offset) <<
Martin Schwidefsky23ce7212009-08-14 15:47:27 +0200940 timekeeper.ntp_error_shift;
john stultz85240702007-05-08 00:27:59 -0700941}
942
Linus Torvalds83f57a12009-12-22 14:10:37 -0800943
john stultz85240702007-05-08 00:27:59 -0700944/**
john stultza092ff02009-10-02 16:17:53 -0700945 * logarithmic_accumulation - shifted accumulation of cycles
946 *
947 * This functions accumulates a shifted interval of cycles into
948 * into a shifted interval nanoseconds. Allows for O(log) accumulation
949 * loop.
950 *
951 * Returns the unconsumed cycles.
952 */
953static cycle_t logarithmic_accumulation(cycle_t offset, int shift)
954{
955 u64 nsecps = (u64)NSEC_PER_SEC << timekeeper.shift;
Jason Wesseldeda2e82010-08-09 14:20:09 -0700956 u64 raw_nsecs;
john stultza092ff02009-10-02 16:17:53 -0700957
958 /* If the offset is smaller then a shifted interval, do nothing */
959 if (offset < timekeeper.cycle_interval<<shift)
960 return offset;
961
962 /* Accumulate one shifted interval */
963 offset -= timekeeper.cycle_interval << shift;
964 timekeeper.clock->cycle_last += timekeeper.cycle_interval << shift;
965
966 timekeeper.xtime_nsec += timekeeper.xtime_interval << shift;
967 while (timekeeper.xtime_nsec >= nsecps) {
968 timekeeper.xtime_nsec -= nsecps;
John Stultz8ff2cb92011-11-14 11:40:54 -0800969 timekeeper.xtime.tv_sec++;
john stultza092ff02009-10-02 16:17:53 -0700970 second_overflow();
971 }
972
Jason Wesseldeda2e82010-08-09 14:20:09 -0700973 /* Accumulate raw time */
974 raw_nsecs = timekeeper.raw_interval << shift;
John Stultz01f71b42011-11-14 11:43:49 -0800975 raw_nsecs += timekeeper.raw_time.tv_nsec;
John Stultzc7dcf872010-08-13 11:30:58 -0700976 if (raw_nsecs >= NSEC_PER_SEC) {
977 u64 raw_secs = raw_nsecs;
978 raw_nsecs = do_div(raw_secs, NSEC_PER_SEC);
John Stultz01f71b42011-11-14 11:43:49 -0800979 timekeeper.raw_time.tv_sec += raw_secs;
john stultza092ff02009-10-02 16:17:53 -0700980 }
John Stultz01f71b42011-11-14 11:43:49 -0800981 timekeeper.raw_time.tv_nsec = raw_nsecs;
john stultza092ff02009-10-02 16:17:53 -0700982
983 /* Accumulate error between NTP and clock interval */
John Stultzea7cf49a2011-11-14 13:18:07 -0800984 timekeeper.ntp_error += ntp_tick_length() << shift;
Kasper Pedersena386b5a2010-10-20 15:55:15 -0700985 timekeeper.ntp_error -=
986 (timekeeper.xtime_interval + timekeeper.xtime_remainder) <<
john stultza092ff02009-10-02 16:17:53 -0700987 (timekeeper.ntp_error_shift + shift);
988
989 return offset;
990}
991
Linus Torvalds83f57a12009-12-22 14:10:37 -0800992
john stultz85240702007-05-08 00:27:59 -0700993/**
994 * update_wall_time - Uses the current clocksource to increment the wall time
995 *
john stultz85240702007-05-08 00:27:59 -0700996 */
Torben Hohn871cf1e2011-01-27 15:58:55 +0100997static void update_wall_time(void)
john stultz85240702007-05-08 00:27:59 -0700998{
Martin Schwidefsky155ec602009-08-14 15:47:26 +0200999 struct clocksource *clock;
john stultz85240702007-05-08 00:27:59 -07001000 cycle_t offset;
john stultza092ff02009-10-02 16:17:53 -07001001 int shift = 0, maxshift;
John Stultz70471f22011-11-14 12:48:10 -08001002 unsigned long flags;
1003
1004 write_seqlock_irqsave(&timekeeper.lock, flags);
john stultz85240702007-05-08 00:27:59 -07001005
1006 /* Make sure we're fully resumed: */
1007 if (unlikely(timekeeping_suspended))
John Stultz70471f22011-11-14 12:48:10 -08001008 goto out;
john stultz85240702007-05-08 00:27:59 -07001009
Martin Schwidefsky155ec602009-08-14 15:47:26 +02001010 clock = timekeeper.clock;
John Stultz592913e2010-07-13 17:56:20 -07001011
1012#ifdef CONFIG_ARCH_USES_GETTIMEOFFSET
Martin Schwidefsky155ec602009-08-14 15:47:26 +02001013 offset = timekeeper.cycle_interval;
John Stultz592913e2010-07-13 17:56:20 -07001014#else
1015 offset = (clock->read(clock) - clock->cycle_last) & clock->mask;
john stultz85240702007-05-08 00:27:59 -07001016#endif
John Stultz8ff2cb92011-11-14 11:40:54 -08001017 timekeeper.xtime_nsec = (s64)timekeeper.xtime.tv_nsec <<
1018 timekeeper.shift;
john stultz85240702007-05-08 00:27:59 -07001019
john stultza092ff02009-10-02 16:17:53 -07001020 /*
1021 * With NO_HZ we may have to accumulate many cycle_intervals
1022 * (think "ticks") worth of time at once. To do this efficiently,
1023 * we calculate the largest doubling multiple of cycle_intervals
1024 * that is smaller then the offset. We then accumulate that
1025 * chunk in one go, and then try to consume the next smaller
1026 * doubled multiple.
john stultz85240702007-05-08 00:27:59 -07001027 */
john stultza092ff02009-10-02 16:17:53 -07001028 shift = ilog2(offset) - ilog2(timekeeper.cycle_interval);
1029 shift = max(0, shift);
1030 /* Bound shift to one less then what overflows tick_length */
John Stultzea7cf49a2011-11-14 13:18:07 -08001031 maxshift = (64 - (ilog2(ntp_tick_length())+1)) - 1;
john stultza092ff02009-10-02 16:17:53 -07001032 shift = min(shift, maxshift);
Martin Schwidefsky155ec602009-08-14 15:47:26 +02001033 while (offset >= timekeeper.cycle_interval) {
john stultza092ff02009-10-02 16:17:53 -07001034 offset = logarithmic_accumulation(offset, shift);
John Stultz830ec042010-03-18 14:47:30 -07001035 if(offset < timekeeper.cycle_interval<<shift)
1036 shift--;
john stultz85240702007-05-08 00:27:59 -07001037 }
1038
1039 /* correct the clock when NTP error is too big */
Martin Schwidefsky155ec602009-08-14 15:47:26 +02001040 timekeeping_adjust(offset);
john stultz85240702007-05-08 00:27:59 -07001041
john stultz6c9bacb2008-12-01 18:34:41 -08001042 /*
1043 * Since in the loop above, we accumulate any amount of time
1044 * in xtime_nsec over a second into xtime.tv_sec, its possible for
1045 * xtime_nsec to be fairly small after the loop. Further, if we're
Martin Schwidefsky155ec602009-08-14 15:47:26 +02001046 * slightly speeding the clocksource up in timekeeping_adjust(),
john stultz6c9bacb2008-12-01 18:34:41 -08001047 * its possible the required corrective factor to xtime_nsec could
1048 * cause it to underflow.
1049 *
1050 * Now, we cannot simply roll the accumulated second back, since
1051 * the NTP subsystem has been notified via second_overflow. So
1052 * instead we push xtime_nsec forward by the amount we underflowed,
1053 * and add that amount into the error.
1054 *
1055 * We'll correct this error next time through this function, when
1056 * xtime_nsec is not as small.
1057 */
Martin Schwidefsky155ec602009-08-14 15:47:26 +02001058 if (unlikely((s64)timekeeper.xtime_nsec < 0)) {
1059 s64 neg = -(s64)timekeeper.xtime_nsec;
1060 timekeeper.xtime_nsec = 0;
Martin Schwidefsky23ce7212009-08-14 15:47:27 +02001061 timekeeper.ntp_error += neg << timekeeper.ntp_error_shift;
john stultz6c9bacb2008-12-01 18:34:41 -08001062 }
1063
John Stultz6a867a32010-04-06 14:30:51 -07001064
1065 /*
1066 * Store full nanoseconds into xtime after rounding it up and
Roman Zippel5cd1c9c2008-09-22 14:42:43 -07001067 * add the remainder to the error difference.
1068 */
John Stultz8ff2cb92011-11-14 11:40:54 -08001069 timekeeper.xtime.tv_nsec = ((s64)timekeeper.xtime_nsec >>
1070 timekeeper.shift) + 1;
1071 timekeeper.xtime_nsec -= (s64)timekeeper.xtime.tv_nsec <<
1072 timekeeper.shift;
Martin Schwidefsky23ce7212009-08-14 15:47:27 +02001073 timekeeper.ntp_error += timekeeper.xtime_nsec <<
1074 timekeeper.ntp_error_shift;
john stultz85240702007-05-08 00:27:59 -07001075
John Stultz6a867a32010-04-06 14:30:51 -07001076 /*
1077 * Finally, make sure that after the rounding
1078 * xtime.tv_nsec isn't larger then NSEC_PER_SEC
1079 */
John Stultz8ff2cb92011-11-14 11:40:54 -08001080 if (unlikely(timekeeper.xtime.tv_nsec >= NSEC_PER_SEC)) {
1081 timekeeper.xtime.tv_nsec -= NSEC_PER_SEC;
1082 timekeeper.xtime.tv_sec++;
John Stultz6a867a32010-04-06 14:30:51 -07001083 second_overflow();
1084 }
Linus Torvalds83f57a12009-12-22 14:10:37 -08001085
john stultz85240702007-05-08 00:27:59 -07001086 /* check to see if there is a new clocksource to use */
John Stultz8ff2cb92011-11-14 11:40:54 -08001087 update_vsyscall(&timekeeper.xtime, &timekeeper.wall_to_monotonic,
1088 timekeeper.clock, timekeeper.mult);
John Stultz70471f22011-11-14 12:48:10 -08001089
1090out:
1091 write_sequnlock_irqrestore(&timekeeper.lock, flags);
1092
john stultz85240702007-05-08 00:27:59 -07001093}
Tomas Janousek7c3f1a52007-07-15 23:39:41 -07001094
1095/**
1096 * getboottime - Return the real time of system boot.
1097 * @ts: pointer to the timespec to be set
1098 *
John Stultzabb3a4e2011-02-14 17:52:09 -08001099 * Returns the wall-time of boot in a timespec.
Tomas Janousek7c3f1a52007-07-15 23:39:41 -07001100 *
1101 * This is based on the wall_to_monotonic offset and the total suspend
1102 * time. Calls to settimeofday will affect the value returned (which
1103 * basically means that however wrong your real time clock is at boot time,
1104 * you get the right time here).
1105 */
1106void getboottime(struct timespec *ts)
1107{
Hiroshi Shimamoto36d47482009-08-25 15:08:30 +09001108 struct timespec boottime = {
John Stultzd9f72172011-11-14 11:29:32 -08001109 .tv_sec = timekeeper.wall_to_monotonic.tv_sec +
John Stultz00c5fb72011-11-14 11:23:15 -08001110 timekeeper.total_sleep_time.tv_sec,
John Stultzd9f72172011-11-14 11:29:32 -08001111 .tv_nsec = timekeeper.wall_to_monotonic.tv_nsec +
John Stultz00c5fb72011-11-14 11:23:15 -08001112 timekeeper.total_sleep_time.tv_nsec
Hiroshi Shimamoto36d47482009-08-25 15:08:30 +09001113 };
Martin Schwidefskyd4f587c2009-08-14 15:47:31 +02001114
Martin Schwidefskyd4f587c2009-08-14 15:47:31 +02001115 set_normalized_timespec(ts, -boottime.tv_sec, -boottime.tv_nsec);
Tomas Janousek7c3f1a52007-07-15 23:39:41 -07001116}
Jason Wangc93d89f2010-01-27 19:13:40 +08001117EXPORT_SYMBOL_GPL(getboottime);
Tomas Janousek7c3f1a52007-07-15 23:39:41 -07001118
John Stultzabb3a4e2011-02-14 17:52:09 -08001119
1120/**
1121 * get_monotonic_boottime - Returns monotonic time since boot
1122 * @ts: pointer to the timespec to be set
1123 *
1124 * Returns the monotonic time since boot in a timespec.
1125 *
1126 * This is similar to CLOCK_MONTONIC/ktime_get_ts, but also
1127 * includes the time spent in suspend.
1128 */
1129void get_monotonic_boottime(struct timespec *ts)
1130{
1131 struct timespec tomono, sleep;
1132 unsigned int seq;
1133 s64 nsecs;
1134
1135 WARN_ON(timekeeping_suspended);
1136
1137 do {
John Stultz70471f22011-11-14 12:48:10 -08001138 seq = read_seqbegin(&timekeeper.lock);
John Stultz8ff2cb92011-11-14 11:40:54 -08001139 *ts = timekeeper.xtime;
John Stultzd9f72172011-11-14 11:29:32 -08001140 tomono = timekeeper.wall_to_monotonic;
John Stultz00c5fb72011-11-14 11:23:15 -08001141 sleep = timekeeper.total_sleep_time;
John Stultzabb3a4e2011-02-14 17:52:09 -08001142 nsecs = timekeeping_get_ns();
1143
John Stultz70471f22011-11-14 12:48:10 -08001144 } while (read_seqretry(&timekeeper.lock, seq));
John Stultzabb3a4e2011-02-14 17:52:09 -08001145
1146 set_normalized_timespec(ts, ts->tv_sec + tomono.tv_sec + sleep.tv_sec,
1147 ts->tv_nsec + tomono.tv_nsec + sleep.tv_nsec + nsecs);
1148}
1149EXPORT_SYMBOL_GPL(get_monotonic_boottime);
1150
1151/**
1152 * ktime_get_boottime - Returns monotonic time since boot in a ktime
1153 *
1154 * Returns the monotonic time since boot in a ktime
1155 *
1156 * This is similar to CLOCK_MONTONIC/ktime_get, but also
1157 * includes the time spent in suspend.
1158 */
1159ktime_t ktime_get_boottime(void)
1160{
1161 struct timespec ts;
1162
1163 get_monotonic_boottime(&ts);
1164 return timespec_to_ktime(ts);
1165}
1166EXPORT_SYMBOL_GPL(ktime_get_boottime);
1167
Tomas Janousek7c3f1a52007-07-15 23:39:41 -07001168/**
1169 * monotonic_to_bootbased - Convert the monotonic time to boot based.
1170 * @ts: pointer to the timespec to be converted
1171 */
1172void monotonic_to_bootbased(struct timespec *ts)
1173{
John Stultz00c5fb72011-11-14 11:23:15 -08001174 *ts = timespec_add(*ts, timekeeper.total_sleep_time);
Tomas Janousek7c3f1a52007-07-15 23:39:41 -07001175}
Jason Wangc93d89f2010-01-27 19:13:40 +08001176EXPORT_SYMBOL_GPL(monotonic_to_bootbased);
john stultz2c6b47d2007-07-24 17:47:43 -07001177
john stultz17c38b72007-07-24 18:38:34 -07001178unsigned long get_seconds(void)
1179{
John Stultz8ff2cb92011-11-14 11:40:54 -08001180 return timekeeper.xtime.tv_sec;
john stultz17c38b72007-07-24 18:38:34 -07001181}
1182EXPORT_SYMBOL(get_seconds);
1183
john stultzda15cfd2009-08-19 19:13:34 -07001184struct timespec __current_kernel_time(void)
1185{
John Stultz8ff2cb92011-11-14 11:40:54 -08001186 return timekeeper.xtime;
john stultzda15cfd2009-08-19 19:13:34 -07001187}
john stultz17c38b72007-07-24 18:38:34 -07001188
john stultz2c6b47d2007-07-24 17:47:43 -07001189struct timespec current_kernel_time(void)
1190{
1191 struct timespec now;
1192 unsigned long seq;
1193
1194 do {
John Stultz70471f22011-11-14 12:48:10 -08001195 seq = read_seqbegin(&timekeeper.lock);
Linus Torvalds83f57a12009-12-22 14:10:37 -08001196
John Stultz8ff2cb92011-11-14 11:40:54 -08001197 now = timekeeper.xtime;
John Stultz70471f22011-11-14 12:48:10 -08001198 } while (read_seqretry(&timekeeper.lock, seq));
john stultz2c6b47d2007-07-24 17:47:43 -07001199
1200 return now;
1201}
john stultz2c6b47d2007-07-24 17:47:43 -07001202EXPORT_SYMBOL(current_kernel_time);
john stultzda15cfd2009-08-19 19:13:34 -07001203
1204struct timespec get_monotonic_coarse(void)
1205{
1206 struct timespec now, mono;
1207 unsigned long seq;
1208
1209 do {
John Stultz70471f22011-11-14 12:48:10 -08001210 seq = read_seqbegin(&timekeeper.lock);
Linus Torvalds83f57a12009-12-22 14:10:37 -08001211
John Stultz8ff2cb92011-11-14 11:40:54 -08001212 now = timekeeper.xtime;
John Stultzd9f72172011-11-14 11:29:32 -08001213 mono = timekeeper.wall_to_monotonic;
John Stultz70471f22011-11-14 12:48:10 -08001214 } while (read_seqretry(&timekeeper.lock, seq));
john stultzda15cfd2009-08-19 19:13:34 -07001215
1216 set_normalized_timespec(&now, now.tv_sec + mono.tv_sec,
1217 now.tv_nsec + mono.tv_nsec);
1218 return now;
1219}
Torben Hohn871cf1e2011-01-27 15:58:55 +01001220
1221/*
1222 * The 64-bit jiffies value is not atomic - you MUST NOT read it
1223 * without sampling the sequence number in xtime_lock.
1224 * jiffies is defined in the linker script...
1225 */
1226void do_timer(unsigned long ticks)
1227{
1228 jiffies_64 += ticks;
1229 update_wall_time();
1230 calc_global_load(ticks);
1231}
Torben Hohn48cf76f72011-01-27 15:59:05 +01001232
1233/**
John Stultz314ac372011-02-14 18:43:08 -08001234 * get_xtime_and_monotonic_and_sleep_offset() - get xtime, wall_to_monotonic,
1235 * and sleep offsets.
Torben Hohn48cf76f72011-01-27 15:59:05 +01001236 * @xtim: pointer to timespec to be set with xtime
1237 * @wtom: pointer to timespec to be set with wall_to_monotonic
John Stultz314ac372011-02-14 18:43:08 -08001238 * @sleep: pointer to timespec to be set with time in suspend
Torben Hohn48cf76f72011-01-27 15:59:05 +01001239 */
John Stultz314ac372011-02-14 18:43:08 -08001240void get_xtime_and_monotonic_and_sleep_offset(struct timespec *xtim,
1241 struct timespec *wtom, struct timespec *sleep)
Torben Hohn48cf76f72011-01-27 15:59:05 +01001242{
1243 unsigned long seq;
1244
1245 do {
John Stultz70471f22011-11-14 12:48:10 -08001246 seq = read_seqbegin(&timekeeper.lock);
John Stultz8ff2cb92011-11-14 11:40:54 -08001247 *xtim = timekeeper.xtime;
John Stultzd9f72172011-11-14 11:29:32 -08001248 *wtom = timekeeper.wall_to_monotonic;
John Stultz00c5fb72011-11-14 11:23:15 -08001249 *sleep = timekeeper.total_sleep_time;
John Stultz70471f22011-11-14 12:48:10 -08001250 } while (read_seqretry(&timekeeper.lock, seq));
Torben Hohn48cf76f72011-01-27 15:59:05 +01001251}
Torben Hohnf0af911a92011-01-27 15:59:10 +01001252
1253/**
Thomas Gleixner99ee5312011-04-27 14:16:42 +02001254 * ktime_get_monotonic_offset() - get wall_to_monotonic in ktime_t format
1255 */
1256ktime_t ktime_get_monotonic_offset(void)
1257{
1258 unsigned long seq;
1259 struct timespec wtom;
1260
1261 do {
John Stultz70471f22011-11-14 12:48:10 -08001262 seq = read_seqbegin(&timekeeper.lock);
John Stultzd9f72172011-11-14 11:29:32 -08001263 wtom = timekeeper.wall_to_monotonic;
John Stultz70471f22011-11-14 12:48:10 -08001264 } while (read_seqretry(&timekeeper.lock, seq));
1265
Thomas Gleixner99ee5312011-04-27 14:16:42 +02001266 return timespec_to_ktime(wtom);
1267}
1268
1269/**
Torben Hohnf0af911a92011-01-27 15:59:10 +01001270 * xtime_update() - advances the timekeeping infrastructure
1271 * @ticks: number of ticks, that have elapsed since the last call.
1272 *
1273 * Must be called with interrupts disabled.
1274 */
1275void xtime_update(unsigned long ticks)
1276{
1277 write_seqlock(&xtime_lock);
1278 do_timer(ticks);
1279 write_sequnlock(&xtime_lock);
1280}