/*
 * sched_clock.c: support for extending counters to full 64-bit ns counter
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License version 2 as
 * published by the Free Software Foundation.
 */
#include <linux/clocksource.h>
#include <linux/init.h>
#include <linux/jiffies.h>
#include <linux/kernel.h>
#include <linux/moduleparam.h>
#include <linux/sched.h>
#include <linux/syscore_ops.h>
#include <linux/timer.h>

#include <asm/sched_clock.h>

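/*
 * Conversion state: epoch_ns/epoch_cyc anchor the last update,
 * epoch_cyc_copy lets lockless readers detect an update in progress,
 * and mult/shift scale counter cycles to nanoseconds.
 */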
struct clock_data {
	u64 epoch_ns;
	u32 epoch_cyc;
	u32 epoch_cyc_copy;
	unsigned long rate;
	u32 mult;
	u32 shift;
	bool suspended;
	bool needs_suspend;
};

static void sched_clock_poll(unsigned long wrap_ticks);
static DEFINE_TIMER(sched_clock_timer, sched_clock_poll, 0, 0);
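
/*
 * "irqtime" boot parameter: 1 forces IRQ time accounting on, 0 off;
 * -1 (the default) enables it only for clocks of 1MHz or better (see
 * the check in setup_sched_clock()).
 */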
static int irqtime = -1;

core_param(irqtime, irqtime, int, 0400);

static struct clock_data cd = {
	.mult	= NSEC_PER_SEC / HZ,
};

static u32 __read_mostly sched_clock_mask = 0xffffffff;

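/* Default source: count jiffies until a platform registers a real counter. */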
static u32 notrace jiffy_sched_clock_read(void)
{
	return (u32)(jiffies - INITIAL_JIFFIES);
}

static u32 __read_mostly (*read_sched_clock)(void) = jiffy_sched_clock_read;

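/* Fixed-point scaling: ns = (cyc * mult) >> shift. */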
static inline u64 cyc_to_ns(u64 cyc, u32 mult, u32 shift)
{
	return (cyc * mult) >> shift;
}

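/*
 * Extend a raw counter sample to a 64-bit ns count: add the cycles
 * elapsed since the last epoch update, masked to the counter width.
 */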
static unsigned long long cyc_to_sched_clock(u32 cyc, u32 mask)
{
	u64 epoch_ns;
	u32 epoch_cyc;

	if (cd.suspended)
		return cd.epoch_ns;

	/*
	 * Load the epoch_cyc and epoch_ns atomically. We do this by
	 * ensuring that we always write epoch_cyc, epoch_ns and
	 * epoch_cyc_copy in strict order, and read them in strict order.
	 * If epoch_cyc and epoch_cyc_copy are not equal, then we're in
	 * the middle of an update, and we should repeat the load.
	 */
	do {
		epoch_cyc = cd.epoch_cyc;
		smp_rmb();
		epoch_ns = cd.epoch_ns;
		smp_rmb();
	} while (epoch_cyc != cd.epoch_cyc_copy);

	return epoch_ns + cyc_to_ns((cyc - epoch_cyc) & mask, cd.mult, cd.shift);
}

/*
 * Atomically update the sched_clock epoch.
 */
static void notrace update_sched_clock(void)
{
	unsigned long flags;
	u32 cyc;
	u64 ns;

	cyc = read_sched_clock();
	ns = cd.epoch_ns +
		cyc_to_ns((cyc - cd.epoch_cyc) & sched_clock_mask,
			  cd.mult, cd.shift);
	/*
	 * Write epoch_cyc and epoch_ns in a way that the update is
	 * detectable in cyc_to_sched_clock().
	 */
	raw_local_irq_save(flags);
	cd.epoch_cyc_copy = cyc;
	smp_wmb();
	cd.epoch_ns = ns;
	smp_wmb();
	cd.epoch_cyc = cyc;
	raw_local_irq_restore(flags);
}

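/*
 * Periodic update: re-arm the timer and refresh the epoch well before
 * the raw counter wraps, so (cyc - epoch_cyc) never exceeds one wrap.
 */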
static void sched_clock_poll(unsigned long wrap_ticks)
{
	mod_timer(&sched_clock_timer, round_jiffies(jiffies + wrap_ticks));
	update_sched_clock();
}

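/*
 * Register a platform counter as the sched_clock source: @read returns
 * the raw counter, @bits is its width (at most 32) and @rate is its
 * frequency in Hz.  A later call is ignored if it offers a lower rate.
 */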
void __init setup_sched_clock(u32 (*read)(void), int bits, unsigned long rate)
{
	unsigned long r, w;
	u64 res, wrap;
	char r_unit;

	if (cd.rate > rate)
		return;

	BUG_ON(bits > 32);
	WARN_ON(!irqs_disabled());
	read_sched_clock = read;
	sched_clock_mask = (1ULL << bits) - 1;	/* 1ULL avoids undefined 1 << 32 */
	cd.rate = rate;

	/* calculate the mult/shift to convert counter ticks to ns. */
	clocks_calc_mult_shift(&cd.mult, &cd.shift, rate, NSEC_PER_SEC, 0);

	r = rate;
	if (r >= 4000000) {
		r /= 1000000;
		r_unit = 'M';
	} else if (r >= 1000) {
		r /= 1000;
		r_unit = 'k';
	} else
		r_unit = ' ';

	/* calculate how many ns until we wrap */
	wrap = cyc_to_ns((1ULL << bits) - 1, cd.mult, cd.shift);
	do_div(wrap, NSEC_PER_MSEC);
	w = wrap;

	/* calculate the ns resolution of this counter */
	res = cyc_to_ns(1ULL, cd.mult, cd.shift);
	pr_info("sched_clock: %u bits at %lu%cHz, resolution %lluns, wraps every %lums\n",
		bits, r, r_unit, res, w);

	/*
	 * Start the timer to keep sched_clock() properly updated and
	 * set the initial epoch.
	 */
	sched_clock_timer.data = msecs_to_jiffies(w - (w / 10));
	update_sched_clock();

	/*
	 * Ensure that sched_clock() starts off at 0ns
	 */
	cd.epoch_ns = 0;

	/* Enable IRQ time accounting if we have a fast enough sched_clock */
	if (irqtime > 0 || (irqtime == -1 && rate >= 1000000))
		enable_sched_clock_irqtime();

	pr_debug("Registered %pF as sched_clock source\n", read);
}

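/*
 * Illustrative use only (not part of this file): a platform with a
 * free-running 32-bit counter at, say, 24MHz might register it from
 * its early timer setup while IRQs are still disabled.  The names
 * mach_sched_clock_read, timer_base and TIMER_COUNT are invented for
 * the sketch:
 *
 *	static u32 notrace mach_sched_clock_read(void)
 *	{
 *		return readl_relaxed(timer_base + TIMER_COUNT);
 *	}
 *
 *	setup_sched_clock(mach_sched_clock_read, 32, 24000000);
 */
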
unsigned long long notrace sched_clock(void)
{
	u32 cyc = read_sched_clock();
	return cyc_to_sched_clock(cyc, sched_clock_mask);
}

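/* Complete initialization: pick the final clock source and start polling. */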
void __init sched_clock_postinit(void)
{
	/*
	 * If no sched_clock function has been provided at this point,
	 * make it the final one.
	 */
	if (read_sched_clock == jiffy_sched_clock_read)
		setup_sched_clock(jiffy_sched_clock_read, 32, HZ);

	sched_clock_poll(sched_clock_timer.data);
}

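/* Bring the epoch up to date, then hold sched_clock() at that value. */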
static int sched_clock_suspend(void)
{
	sched_clock_poll(sched_clock_timer.data);
	cd.suspended = true;
	return 0;
}

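/*
 * The counter may have stopped or reset across suspend: re-anchor the
 * epoch at the current reading so no time is accounted while suspended.
 */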
static void sched_clock_resume(void)
{
	cd.epoch_cyc = read_sched_clock();
	cd.epoch_cyc_copy = cd.epoch_cyc;
	cd.suspended = false;
}

static struct syscore_ops sched_clock_ops = {
	.suspend = sched_clock_suspend,
	.resume = sched_clock_resume,
};

static int __init sched_clock_syscore_init(void)
{
	register_syscore_ops(&sched_clock_ops);
	return 0;
}
device_initcall(sched_clock_syscore_init);