sched_clock: Fix integer overflow
[linux-2.6-block.git] / kernel / time / sched_clock.c
CommitLineData
112f38a4
RK
/*
 * sched_clock.c: support for extending counters to full 64-bit ns counter
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License version 2 as
 * published by the Free Software Foundation.
 */
8#include <linux/clocksource.h>
9#include <linux/init.h>
10#include <linux/jiffies.h>
11#include <linux/kernel.h>
a42c3629 12#include <linux/moduleparam.h>
112f38a4 13#include <linux/sched.h>
f153d017 14#include <linux/syscore_ops.h>
112f38a4 15#include <linux/timer.h>
38ff87f7 16#include <linux/sched_clock.h>
112f38a4 17
2f0778af
MZ
18struct clock_data {
19 u64 epoch_ns;
20 u32 epoch_cyc;
21 u32 epoch_cyc_copy;
c115739d 22 unsigned long rate;
2f0778af
MZ
23 u32 mult;
24 u32 shift;
237ec6f2 25 bool suspended;
2f0778af
MZ
26};
27
112f38a4
RK
28static void sched_clock_poll(unsigned long wrap_ticks);
29static DEFINE_TIMER(sched_clock_timer, sched_clock_poll, 0, 0);
a42c3629
RK
30static int irqtime = -1;
31
32core_param(irqtime, irqtime, int, 0400);
2f0778af
MZ
33
34static struct clock_data cd = {
35 .mult = NSEC_PER_SEC / HZ,
36};
37
38static u32 __read_mostly sched_clock_mask = 0xffffffff;
39
40static u32 notrace jiffy_sched_clock_read(void)
41{
42 return (u32)(jiffies - INITIAL_JIFFIES);
43}
44
45static u32 __read_mostly (*read_sched_clock)(void) = jiffy_sched_clock_read;
46
cea15092 47static inline u64 notrace cyc_to_ns(u64 cyc, u32 mult, u32 shift)
2f0778af
MZ
48{
49 return (cyc * mult) >> shift;
50}
51
336ae118 52static unsigned long long notrace sched_clock_32(void)
2f0778af
MZ
53{
54 u64 epoch_ns;
55 u32 epoch_cyc;
336ae118
SB
56 u32 cyc;
57
58 if (cd.suspended)
59 return cd.epoch_ns;
2f0778af
MZ
60
61 /*
62 * Load the epoch_cyc and epoch_ns atomically. We do this by
63 * ensuring that we always write epoch_cyc, epoch_ns and
64 * epoch_cyc_copy in strict order, and read them in strict order.
65 * If epoch_cyc and epoch_cyc_copy are not equal, then we're in
66 * the middle of an update, and we should repeat the load.
67 */
68 do {
69 epoch_cyc = cd.epoch_cyc;
70 smp_rmb();
71 epoch_ns = cd.epoch_ns;
72 smp_rmb();
73 } while (epoch_cyc != cd.epoch_cyc_copy);
74
336ae118
SB
75 cyc = read_sched_clock();
76 cyc = (cyc - epoch_cyc) & sched_clock_mask;
77 return epoch_ns + cyc_to_ns(cyc, cd.mult, cd.shift);
2f0778af
MZ
78}
79
80/*
81 * Atomically update the sched_clock epoch.
82 */
83static void notrace update_sched_clock(void)
84{
85 unsigned long flags;
86 u32 cyc;
87 u64 ns;
88
89 cyc = read_sched_clock();
90 ns = cd.epoch_ns +
91 cyc_to_ns((cyc - cd.epoch_cyc) & sched_clock_mask,
92 cd.mult, cd.shift);
93 /*
94 * Write epoch_cyc and epoch_ns in a way that the update is
95 * detectable in cyc_to_fixed_sched_clock().
96 */
97 raw_local_irq_save(flags);
7c4e9ced 98 cd.epoch_cyc_copy = cyc;
2f0778af
MZ
99 smp_wmb();
100 cd.epoch_ns = ns;
101 smp_wmb();
7c4e9ced 102 cd.epoch_cyc = cyc;
2f0778af
MZ
103 raw_local_irq_restore(flags);
104}
112f38a4
RK
105
106static void sched_clock_poll(unsigned long wrap_ticks)
107{
108 mod_timer(&sched_clock_timer, round_jiffies(jiffies + wrap_ticks));
2f0778af 109 update_sched_clock();
112f38a4
RK
110}
111
2f0778af 112void __init setup_sched_clock(u32 (*read)(void), int bits, unsigned long rate)
112f38a4
RK
113{
114 unsigned long r, w;
115 u64 res, wrap;
116 char r_unit;
117
c115739d
RH
118 if (cd.rate > rate)
119 return;
120
2f0778af
MZ
121 BUG_ON(bits > 32);
122 WARN_ON(!irqs_disabled());
2f0778af 123 read_sched_clock = read;
53c03520 124 sched_clock_mask = (1ULL << bits) - 1;
c115739d 125 cd.rate = rate;
112f38a4
RK
126
127 /* calculate the mult/shift to convert counter ticks to ns. */
2f0778af 128 clocks_calc_mult_shift(&cd.mult, &cd.shift, rate, NSEC_PER_SEC, 0);
112f38a4
RK
129
130 r = rate;
131 if (r >= 4000000) {
132 r /= 1000000;
133 r_unit = 'M';
2f0778af 134 } else if (r >= 1000) {
112f38a4
RK
135 r /= 1000;
136 r_unit = 'k';
2f0778af
MZ
137 } else
138 r_unit = ' ';
112f38a4
RK
139
140 /* calculate how many ns until we wrap */
2f0778af 141 wrap = cyc_to_ns((1ULL << bits) - 1, cd.mult, cd.shift);
112f38a4
RK
142 do_div(wrap, NSEC_PER_MSEC);
143 w = wrap;
144
145 /* calculate the ns resolution of this counter */
2f0778af 146 res = cyc_to_ns(1ULL, cd.mult, cd.shift);
112f38a4 147 pr_info("sched_clock: %u bits at %lu%cHz, resolution %lluns, wraps every %lums\n",
2f0778af 148 bits, r, r_unit, res, w);
112f38a4
RK
149
150 /*
151 * Start the timer to keep sched_clock() properly updated and
152 * sets the initial epoch.
153 */
154 sched_clock_timer.data = msecs_to_jiffies(w - (w / 10));
2f0778af 155 update_sched_clock();
112f38a4
RK
156
157 /*
158 * Ensure that sched_clock() starts off at 0ns
159 */
2f0778af
MZ
160 cd.epoch_ns = 0;
161
a42c3629
RK
162 /* Enable IRQ time accounting if we have a fast enough sched_clock */
163 if (irqtime > 0 || (irqtime == -1 && rate >= 1000000))
164 enable_sched_clock_irqtime();
165
2f0778af
MZ
166 pr_debug("Registered %pF as sched_clock source\n", read);
167}
168
7e48c0b9
RH
169unsigned long long __read_mostly (*sched_clock_func)(void) = sched_clock_32;
170
171unsigned long long notrace sched_clock(void)
172{
173 return sched_clock_func();
174}
175
211baa70
RK
176void __init sched_clock_postinit(void)
177{
2f0778af
MZ
178 /*
179 * If no sched_clock function has been provided at that point,
180 * make it the final one one.
181 */
182 if (read_sched_clock == jiffy_sched_clock_read)
183 setup_sched_clock(jiffy_sched_clock_read, 32, HZ);
184
211baa70
RK
185 sched_clock_poll(sched_clock_timer.data);
186}
f153d017
RK
187
188static int sched_clock_suspend(void)
189{
190 sched_clock_poll(sched_clock_timer.data);
6a4dae5e 191 cd.suspended = true;
f153d017
RK
192 return 0;
193}
194
237ec6f2
CC
195static void sched_clock_resume(void)
196{
6a4dae5e
FB
197 cd.epoch_cyc = read_sched_clock();
198 cd.epoch_cyc_copy = cd.epoch_cyc;
199 cd.suspended = false;
237ec6f2
CC
200}
201
f153d017
RK
202static struct syscore_ops sched_clock_ops = {
203 .suspend = sched_clock_suspend,
237ec6f2 204 .resume = sched_clock_resume,
f153d017
RK
205};
206
207static int __init sched_clock_syscore_init(void)
208{
209 register_syscore_ops(&sched_clock_ops);
210 return 0;
211}
212device_initcall(sched_clock_syscore_init);