blob: 9b8451a4330fc51430b74be032096dc22752c78b [file] [log] [blame]
Russell King112f38a42010-12-15 19:23:07 +00001/*
2 * sched_clock.c: support for extending counters to full 64-bit ns counter
3 *
4 * This program is free software; you can redistribute it and/or modify
5 * it under the terms of the GNU General Public License version 2 as
6 * published by the Free Software Foundation.
7 */
8#include <linux/clocksource.h>
9#include <linux/init.h>
10#include <linux/jiffies.h>
11#include <linux/kernel.h>
Russell Kinga42c3622012-09-09 18:39:28 +010012#include <linux/moduleparam.h>
Russell King112f38a42010-12-15 19:23:07 +000013#include <linux/sched.h>
Russell Kingf153d012012-02-04 12:31:27 +000014#include <linux/syscore_ops.h>
Russell King112f38a42010-12-15 19:23:07 +000015#include <linux/timer.h>
16
17#include <asm/sched_clock.h>
18
Marc Zyngier2f0778af2011-12-15 12:19:23 +010019struct clock_data {
20 u64 epoch_ns;
21 u32 epoch_cyc;
22 u32 epoch_cyc_copy;
23 u32 mult;
24 u32 shift;
25};
26
Russell King112f38a42010-12-15 19:23:07 +000027static void sched_clock_poll(unsigned long wrap_ticks);
28static DEFINE_TIMER(sched_clock_timer, sched_clock_poll, 0, 0);
Russell Kinga42c3622012-09-09 18:39:28 +010029static int irqtime = -1;
30
31core_param(irqtime, irqtime, int, 0400);
Marc Zyngier2f0778af2011-12-15 12:19:23 +010032
33static struct clock_data cd = {
34 .mult = NSEC_PER_SEC / HZ,
35};
36
37static u32 __read_mostly sched_clock_mask = 0xffffffff;
38
39static u32 notrace jiffy_sched_clock_read(void)
40{
41 return (u32)(jiffies - INITIAL_JIFFIES);
42}
43
44static u32 __read_mostly (*read_sched_clock)(void) = jiffy_sched_clock_read;
45
46static inline u64 cyc_to_ns(u64 cyc, u32 mult, u32 shift)
47{
48 return (cyc * mult) >> shift;
49}
50
51static unsigned long long cyc_to_sched_clock(u32 cyc, u32 mask)
52{
53 u64 epoch_ns;
54 u32 epoch_cyc;
55
56 /*
57 * Load the epoch_cyc and epoch_ns atomically. We do this by
58 * ensuring that we always write epoch_cyc, epoch_ns and
59 * epoch_cyc_copy in strict order, and read them in strict order.
60 * If epoch_cyc and epoch_cyc_copy are not equal, then we're in
61 * the middle of an update, and we should repeat the load.
62 */
63 do {
64 epoch_cyc = cd.epoch_cyc;
65 smp_rmb();
66 epoch_ns = cd.epoch_ns;
67 smp_rmb();
68 } while (epoch_cyc != cd.epoch_cyc_copy);
69
70 return epoch_ns + cyc_to_ns((cyc - epoch_cyc) & mask, cd.mult, cd.shift);
71}
72
73/*
74 * Atomically update the sched_clock epoch.
75 */
76static void notrace update_sched_clock(void)
77{
78 unsigned long flags;
79 u32 cyc;
80 u64 ns;
81
82 cyc = read_sched_clock();
83 ns = cd.epoch_ns +
84 cyc_to_ns((cyc - cd.epoch_cyc) & sched_clock_mask,
85 cd.mult, cd.shift);
86 /*
87 * Write epoch_cyc and epoch_ns in a way that the update is
88 * detectable in cyc_to_fixed_sched_clock().
89 */
90 raw_local_irq_save(flags);
91 cd.epoch_cyc = cyc;
92 smp_wmb();
93 cd.epoch_ns = ns;
94 smp_wmb();
95 cd.epoch_cyc_copy = cyc;
96 raw_local_irq_restore(flags);
97}
Russell King112f38a42010-12-15 19:23:07 +000098
99static void sched_clock_poll(unsigned long wrap_ticks)
100{
101 mod_timer(&sched_clock_timer, round_jiffies(jiffies + wrap_ticks));
Marc Zyngier2f0778af2011-12-15 12:19:23 +0100102 update_sched_clock();
Russell King112f38a42010-12-15 19:23:07 +0000103}
104
Marc Zyngier2f0778af2011-12-15 12:19:23 +0100105void __init setup_sched_clock(u32 (*read)(void), int bits, unsigned long rate)
Russell King112f38a42010-12-15 19:23:07 +0000106{
107 unsigned long r, w;
108 u64 res, wrap;
109 char r_unit;
110
Marc Zyngier2f0778af2011-12-15 12:19:23 +0100111 BUG_ON(bits > 32);
112 WARN_ON(!irqs_disabled());
113 WARN_ON(read_sched_clock != jiffy_sched_clock_read);
114 read_sched_clock = read;
115 sched_clock_mask = (1 << bits) - 1;
Russell King112f38a42010-12-15 19:23:07 +0000116
117 /* calculate the mult/shift to convert counter ticks to ns. */
Marc Zyngier2f0778af2011-12-15 12:19:23 +0100118 clocks_calc_mult_shift(&cd.mult, &cd.shift, rate, NSEC_PER_SEC, 0);
Russell King112f38a42010-12-15 19:23:07 +0000119
120 r = rate;
121 if (r >= 4000000) {
122 r /= 1000000;
123 r_unit = 'M';
Marc Zyngier2f0778af2011-12-15 12:19:23 +0100124 } else if (r >= 1000) {
Russell King112f38a42010-12-15 19:23:07 +0000125 r /= 1000;
126 r_unit = 'k';
Marc Zyngier2f0778af2011-12-15 12:19:23 +0100127 } else
128 r_unit = ' ';
Russell King112f38a42010-12-15 19:23:07 +0000129
130 /* calculate how many ns until we wrap */
Marc Zyngier2f0778af2011-12-15 12:19:23 +0100131 wrap = cyc_to_ns((1ULL << bits) - 1, cd.mult, cd.shift);
Russell King112f38a42010-12-15 19:23:07 +0000132 do_div(wrap, NSEC_PER_MSEC);
133 w = wrap;
134
135 /* calculate the ns resolution of this counter */
Marc Zyngier2f0778af2011-12-15 12:19:23 +0100136 res = cyc_to_ns(1ULL, cd.mult, cd.shift);
Russell King112f38a42010-12-15 19:23:07 +0000137 pr_info("sched_clock: %u bits at %lu%cHz, resolution %lluns, wraps every %lums\n",
Marc Zyngier2f0778af2011-12-15 12:19:23 +0100138 bits, r, r_unit, res, w);
Russell King112f38a42010-12-15 19:23:07 +0000139
140 /*
141 * Start the timer to keep sched_clock() properly updated and
142 * sets the initial epoch.
143 */
144 sched_clock_timer.data = msecs_to_jiffies(w - (w / 10));
Marc Zyngier2f0778af2011-12-15 12:19:23 +0100145 update_sched_clock();
Russell King112f38a42010-12-15 19:23:07 +0000146
147 /*
148 * Ensure that sched_clock() starts off at 0ns
149 */
Marc Zyngier2f0778af2011-12-15 12:19:23 +0100150 cd.epoch_ns = 0;
151
Russell Kinga42c3622012-09-09 18:39:28 +0100152 /* Enable IRQ time accounting if we have a fast enough sched_clock */
153 if (irqtime > 0 || (irqtime == -1 && rate >= 1000000))
154 enable_sched_clock_irqtime();
155
Marc Zyngier2f0778af2011-12-15 12:19:23 +0100156 pr_debug("Registered %pF as sched_clock source\n", read);
157}
158
159unsigned long long notrace sched_clock(void)
160{
161 u32 cyc = read_sched_clock();
162 return cyc_to_sched_clock(cyc, sched_clock_mask);
Russell King112f38a42010-12-15 19:23:07 +0000163}
Russell King211baa702011-01-11 16:23:04 +0000164
165void __init sched_clock_postinit(void)
166{
Marc Zyngier2f0778af2011-12-15 12:19:23 +0100167 /*
168 * If no sched_clock function has been provided at that point,
169 * make it the final one one.
170 */
171 if (read_sched_clock == jiffy_sched_clock_read)
172 setup_sched_clock(jiffy_sched_clock_read, 32, HZ);
173
Russell King211baa702011-01-11 16:23:04 +0000174 sched_clock_poll(sched_clock_timer.data);
175}
Russell Kingf153d012012-02-04 12:31:27 +0000176
177static int sched_clock_suspend(void)
178{
179 sched_clock_poll(sched_clock_timer.data);
180 return 0;
181}
182
183static struct syscore_ops sched_clock_ops = {
184 .suspend = sched_clock_suspend,
185};
186
187static int __init sched_clock_syscore_init(void)
188{
189 register_syscore_ops(&sched_clock_ops);
190 return 0;
191}
192device_initcall(sched_clock_syscore_init);