blob: 5697155f1868037fa0fd1863cfabc6ee69399b98 [file] [log] [blame]
john stultz734efb42006-06-26 00:25:05 -07001/*
2 * linux/kernel/time/clocksource.c
3 *
4 * This file contains the functions which manage clocksource drivers.
5 *
6 * Copyright (C) 2004, 2005 IBM, John Stultz (johnstul@us.ibm.com)
7 *
8 * This program is free software; you can redistribute it and/or modify
9 * it under the terms of the GNU General Public License as published by
10 * the Free Software Foundation; either version 2 of the License, or
11 * (at your option) any later version.
12 *
13 * This program is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 * GNU General Public License for more details.
17 *
18 * You should have received a copy of the GNU General Public License
19 * along with this program; if not, write to the Free Software
20 * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
21 *
22 * TODO WishList:
23 * o Allow clocksource drivers to be unregistered
john stultz734efb42006-06-26 00:25:05 -070024 */
25
26#include <linux/clocksource.h>
27#include <linux/sysdev.h>
28#include <linux/init.h>
29#include <linux/module.h>
Mathieu Desnoyersdc29a362007-02-10 01:43:43 -080030#include <linux/sched.h> /* for spin_unlock_irq() using preempt_count() m68k */
Thomas Gleixner79bf2bb2007-02-16 01:28:03 -080031#include <linux/tick.h>
Martin Schwidefsky01548f42009-08-18 17:09:42 +020032#include <linux/kthread.h>
john stultz734efb42006-06-26 00:25:05 -070033
Patrick Ohlya038a352009-02-12 05:03:34 +000034void timecounter_init(struct timecounter *tc,
35 const struct cyclecounter *cc,
36 u64 start_tstamp)
37{
38 tc->cc = cc;
39 tc->cycle_last = cc->read(cc);
40 tc->nsec = start_tstamp;
41}
42EXPORT_SYMBOL(timecounter_init);
43
44/**
45 * timecounter_read_delta - get nanoseconds since last call of this function
46 * @tc: Pointer to time counter
47 *
48 * When the underlying cycle counter runs over, this will be handled
49 * correctly as long as it does not run over more than once between
50 * calls.
51 *
52 * The first call to this function for a new time counter initializes
53 * the time tracking and returns an undefined result.
54 */
55static u64 timecounter_read_delta(struct timecounter *tc)
56{
57 cycle_t cycle_now, cycle_delta;
58 u64 ns_offset;
59
60 /* read cycle counter: */
61 cycle_now = tc->cc->read(tc->cc);
62
63 /* calculate the delta since the last timecounter_read_delta(): */
64 cycle_delta = (cycle_now - tc->cycle_last) & tc->cc->mask;
65
66 /* convert to nanoseconds: */
67 ns_offset = cyclecounter_cyc2ns(tc->cc, cycle_delta);
68
69 /* update time stamp of timecounter_read_delta() call: */
70 tc->cycle_last = cycle_now;
71
72 return ns_offset;
73}
74
75u64 timecounter_read(struct timecounter *tc)
76{
77 u64 nsec;
78
79 /* increment time by nanoseconds since last call */
80 nsec = timecounter_read_delta(tc);
81 nsec += tc->nsec;
82 tc->nsec = nsec;
83
84 return nsec;
85}
86EXPORT_SYMBOL(timecounter_read);
87
88u64 timecounter_cyc2time(struct timecounter *tc,
89 cycle_t cycle_tstamp)
90{
91 u64 cycle_delta = (cycle_tstamp - tc->cycle_last) & tc->cc->mask;
92 u64 nsec;
93
94 /*
95 * Instead of always treating cycle_tstamp as more recent
96 * than tc->cycle_last, detect when it is too far in the
97 * future and treat it as old time stamp instead.
98 */
99 if (cycle_delta > tc->cc->mask / 2) {
100 cycle_delta = (tc->cycle_last - cycle_tstamp) & tc->cc->mask;
101 nsec = tc->nsec - cyclecounter_cyc2ns(tc->cc, cycle_delta);
102 } else {
103 nsec = cyclecounter_cyc2ns(tc->cc, cycle_delta) + tc->nsec;
104 }
105
106 return nsec;
107}
108EXPORT_SYMBOL(timecounter_cyc2time);
109
john stultz734efb42006-06-26 00:25:05 -0700110/*[Clocksource internal variables]---------
111 * curr_clocksource:
Martin Schwidefskyf1b82742009-08-14 15:47:21 +0200112 * currently selected clocksource.
john stultz734efb42006-06-26 00:25:05 -0700113 * clocksource_list:
114 * linked list with the registered clocksources
Martin Schwidefsky75c51582009-08-14 15:47:30 +0200115 * clocksource_mutex:
116 * protects manipulations to curr_clocksource and the clocksource_list
john stultz734efb42006-06-26 00:25:05 -0700117 * override_name:
118 * Name of the user-specified clocksource.
119 */
Martin Schwidefskyf1b82742009-08-14 15:47:21 +0200120static struct clocksource *curr_clocksource;
john stultz734efb42006-06-26 00:25:05 -0700121static LIST_HEAD(clocksource_list);
Martin Schwidefsky75c51582009-08-14 15:47:30 +0200122static DEFINE_MUTEX(clocksource_mutex);
john stultz734efb42006-06-26 00:25:05 -0700123static char override_name[32];
john stultz734efb42006-06-26 00:25:05 -0700124
Thomas Gleixner5d8b34f2007-02-16 01:27:43 -0800125#ifdef CONFIG_CLOCKSOURCE_WATCHDOG
Martin Schwidefskyf79e0252009-09-11 15:33:05 +0200126static void clocksource_watchdog_work(struct work_struct *work);
127
Thomas Gleixner5d8b34f2007-02-16 01:27:43 -0800128static LIST_HEAD(watchdog_list);
129static struct clocksource *watchdog;
130static struct timer_list watchdog_timer;
Martin Schwidefskyf79e0252009-09-11 15:33:05 +0200131static DECLARE_WORK(watchdog_work, clocksource_watchdog_work);
Thomas Gleixner5d8b34f2007-02-16 01:27:43 -0800132static DEFINE_SPINLOCK(watchdog_lock);
133static cycle_t watchdog_last;
Martin Schwidefskyfb63a0e2009-08-14 15:47:24 +0200134static int watchdog_running;
Thomas Gleixnerb52f52a2007-05-09 02:35:15 -0700135
Martin Schwidefsky01548f42009-08-18 17:09:42 +0200136static int clocksource_watchdog_kthread(void *data);
Thomas Gleixnerd0981a12009-08-19 11:26:09 +0200137static void __clocksource_change_rating(struct clocksource *cs, int rating);
Martin Schwidefskyc55c87c2009-08-14 15:47:25 +0200138
Thomas Gleixner5d8b34f2007-02-16 01:27:43 -0800139/*
Daniel Walker35c35d12007-05-09 02:33:40 -0700140 * Interval: 0.5sec Threshold: 0.0625s
Thomas Gleixner5d8b34f2007-02-16 01:27:43 -0800141 */
142#define WATCHDOG_INTERVAL (HZ >> 1)
Daniel Walker35c35d12007-05-09 02:33:40 -0700143#define WATCHDOG_THRESHOLD (NSEC_PER_SEC >> 4)
Thomas Gleixner5d8b34f2007-02-16 01:27:43 -0800144
Martin Schwidefsky01548f42009-08-18 17:09:42 +0200145static void clocksource_watchdog_work(struct work_struct *work)
146{
147 /*
148 * If kthread_run fails the next watchdog scan over the
149 * watchdog_list will find the unstable clock again.
150 */
151 kthread_run(clocksource_watchdog_kthread, NULL, "kwatchdog");
152}
153
Thomas Gleixner7285dd72009-08-28 20:25:24 +0200154static void __clocksource_unstable(struct clocksource *cs)
155{
156 cs->flags &= ~(CLOCK_SOURCE_VALID_FOR_HRES | CLOCK_SOURCE_WATCHDOG);
157 cs->flags |= CLOCK_SOURCE_UNSTABLE;
158 schedule_work(&watchdog_work);
159}
160
Martin Schwidefsky8cf4e752009-08-14 15:47:22 +0200161static void clocksource_unstable(struct clocksource *cs, int64_t delta)
Thomas Gleixner5d8b34f2007-02-16 01:27:43 -0800162{
Thomas Gleixner5d8b34f2007-02-16 01:27:43 -0800163 printk(KERN_WARNING "Clocksource %s unstable (delta = %Ld ns)\n",
164 cs->name, delta);
Thomas Gleixner7285dd72009-08-28 20:25:24 +0200165 __clocksource_unstable(cs);
166}
167
168/**
169 * clocksource_mark_unstable - mark clocksource unstable via watchdog
170 * @cs: clocksource to be marked unstable
171 *
172 * This function is called instead of clocksource_change_rating from
173 * cpu hotplug code to avoid a deadlock between the clocksource mutex
174 * and the cpu hotplug mutex. It defers the update of the clocksource
175 * to the watchdog thread.
176 */
177void clocksource_mark_unstable(struct clocksource *cs)
178{
179 unsigned long flags;
180
181 spin_lock_irqsave(&watchdog_lock, flags);
182 if (!(cs->flags & CLOCK_SOURCE_UNSTABLE)) {
183 if (list_empty(&cs->wd_list))
184 list_add(&cs->wd_list, &watchdog_list);
185 __clocksource_unstable(cs);
186 }
187 spin_unlock_irqrestore(&watchdog_lock, flags);
Thomas Gleixner5d8b34f2007-02-16 01:27:43 -0800188}
189
190static void clocksource_watchdog(unsigned long data)
191{
Martin Schwidefskyc55c87c2009-08-14 15:47:25 +0200192 struct clocksource *cs;
Thomas Gleixner5d8b34f2007-02-16 01:27:43 -0800193 cycle_t csnow, wdnow;
194 int64_t wd_nsec, cs_nsec;
Martin Schwidefskyc55c87c2009-08-14 15:47:25 +0200195 int next_cpu;
Thomas Gleixner5d8b34f2007-02-16 01:27:43 -0800196
197 spin_lock(&watchdog_lock);
Martin Schwidefskyfb63a0e2009-08-14 15:47:24 +0200198 if (!watchdog_running)
199 goto out;
Thomas Gleixner5d8b34f2007-02-16 01:27:43 -0800200
Magnus Damm8e196082009-04-21 12:24:00 -0700201 wdnow = watchdog->read(watchdog);
Martin Schwidefsky155ec602009-08-14 15:47:26 +0200202 wd_nsec = clocksource_cyc2ns((wdnow - watchdog_last) & watchdog->mask,
203 watchdog->mult, watchdog->shift);
Thomas Gleixner5d8b34f2007-02-16 01:27:43 -0800204 watchdog_last = wdnow;
205
Martin Schwidefskyc55c87c2009-08-14 15:47:25 +0200206 list_for_each_entry(cs, &watchdog_list, wd_list) {
207
208 /* Clocksource already marked unstable? */
Martin Schwidefsky01548f42009-08-18 17:09:42 +0200209 if (cs->flags & CLOCK_SOURCE_UNSTABLE) {
210 schedule_work(&watchdog_work);
Martin Schwidefskyc55c87c2009-08-14 15:47:25 +0200211 continue;
Martin Schwidefsky01548f42009-08-18 17:09:42 +0200212 }
Martin Schwidefskyc55c87c2009-08-14 15:47:25 +0200213
Magnus Damm8e196082009-04-21 12:24:00 -0700214 csnow = cs->read(cs);
Thomas Gleixnerb52f52a2007-05-09 02:35:15 -0700215
Martin Schwidefsky8cf4e752009-08-14 15:47:22 +0200216 /* Clocksource initialized ? */
217 if (!(cs->flags & CLOCK_SOURCE_WATCHDOG)) {
218 cs->flags |= CLOCK_SOURCE_WATCHDOG;
Thomas Gleixnerb52f52a2007-05-09 02:35:15 -0700219 cs->wd_last = csnow;
220 continue;
221 }
222
Martin Schwidefsky8cf4e752009-08-14 15:47:22 +0200223 /* Check the deviation from the watchdog clocksource. */
Martin Schwidefsky155ec602009-08-14 15:47:26 +0200224 cs_nsec = clocksource_cyc2ns((csnow - cs->wd_last) &
225 cs->mask, cs->mult, cs->shift);
Martin Schwidefsky8cf4e752009-08-14 15:47:22 +0200226 cs->wd_last = csnow;
227 if (abs(cs_nsec - wd_nsec) > WATCHDOG_THRESHOLD) {
228 clocksource_unstable(cs, cs_nsec - wd_nsec);
229 continue;
230 }
231
232 if (!(cs->flags & CLOCK_SOURCE_VALID_FOR_HRES) &&
233 (cs->flags & CLOCK_SOURCE_IS_CONTINUOUS) &&
234 (watchdog->flags & CLOCK_SOURCE_IS_CONTINUOUS)) {
235 cs->flags |= CLOCK_SOURCE_VALID_FOR_HRES;
236 /*
237 * We just marked the clocksource as highres-capable,
238 * notify the rest of the system as well so that we
239 * transition into high-res mode:
240 */
241 tick_clock_notify();
Thomas Gleixner5d8b34f2007-02-16 01:27:43 -0800242 }
243 }
244
Martin Schwidefskyc55c87c2009-08-14 15:47:25 +0200245 /*
246 * Cycle through CPUs to check if the CPUs stay synchronized
247 * to each other.
248 */
249 next_cpu = cpumask_next(raw_smp_processor_id(), cpu_online_mask);
250 if (next_cpu >= nr_cpu_ids)
251 next_cpu = cpumask_first(cpu_online_mask);
252 watchdog_timer.expires += WATCHDOG_INTERVAL;
253 add_timer_on(&watchdog_timer, next_cpu);
Martin Schwidefskyfb63a0e2009-08-14 15:47:24 +0200254out:
Thomas Gleixner5d8b34f2007-02-16 01:27:43 -0800255 spin_unlock(&watchdog_lock);
256}
Martin Schwidefsky0f8e8ef2009-08-14 15:47:23 +0200257
Martin Schwidefskyfb63a0e2009-08-14 15:47:24 +0200258static inline void clocksource_start_watchdog(void)
259{
260 if (watchdog_running || !watchdog || list_empty(&watchdog_list))
261 return;
262 init_timer(&watchdog_timer);
263 watchdog_timer.function = clocksource_watchdog;
264 watchdog_last = watchdog->read(watchdog);
265 watchdog_timer.expires = jiffies + WATCHDOG_INTERVAL;
266 add_timer_on(&watchdog_timer, cpumask_first(cpu_online_mask));
267 watchdog_running = 1;
268}
269
270static inline void clocksource_stop_watchdog(void)
271{
272 if (!watchdog_running || (watchdog && !list_empty(&watchdog_list)))
273 return;
274 del_timer(&watchdog_timer);
275 watchdog_running = 0;
276}
277
Martin Schwidefsky0f8e8ef2009-08-14 15:47:23 +0200278static inline void clocksource_reset_watchdog(void)
279{
280 struct clocksource *cs;
281
282 list_for_each_entry(cs, &watchdog_list, wd_list)
283 cs->flags &= ~CLOCK_SOURCE_WATCHDOG;
284}
285
Thomas Gleixnerb52f52a2007-05-09 02:35:15 -0700286static void clocksource_resume_watchdog(void)
287{
Martin Schwidefsky0f8e8ef2009-08-14 15:47:23 +0200288 unsigned long flags;
289
290 spin_lock_irqsave(&watchdog_lock, flags);
291 clocksource_reset_watchdog();
292 spin_unlock_irqrestore(&watchdog_lock, flags);
Thomas Gleixnerb52f52a2007-05-09 02:35:15 -0700293}
294
Martin Schwidefskyfb63a0e2009-08-14 15:47:24 +0200295static void clocksource_enqueue_watchdog(struct clocksource *cs)
Thomas Gleixner5d8b34f2007-02-16 01:27:43 -0800296{
Thomas Gleixner5d8b34f2007-02-16 01:27:43 -0800297 unsigned long flags;
298
299 spin_lock_irqsave(&watchdog_lock, flags);
300 if (cs->flags & CLOCK_SOURCE_MUST_VERIFY) {
Martin Schwidefskyfb63a0e2009-08-14 15:47:24 +0200301 /* cs is a clocksource to be watched. */
Thomas Gleixner5d8b34f2007-02-16 01:27:43 -0800302 list_add(&cs->wd_list, &watchdog_list);
Martin Schwidefskyfb63a0e2009-08-14 15:47:24 +0200303 cs->flags &= ~CLOCK_SOURCE_WATCHDOG;
Thomas Gleixner948ac6d2007-03-25 14:42:51 +0200304 } else {
Martin Schwidefskyfb63a0e2009-08-14 15:47:24 +0200305 /* cs is a watchdog. */
Thomas Gleixner948ac6d2007-03-25 14:42:51 +0200306 if (cs->flags & CLOCK_SOURCE_IS_CONTINUOUS)
Thomas Gleixner5d8b34f2007-02-16 01:27:43 -0800307 cs->flags |= CLOCK_SOURCE_VALID_FOR_HRES;
Martin Schwidefskyfb63a0e2009-08-14 15:47:24 +0200308 /* Pick the best watchdog. */
Thomas Gleixner5d8b34f2007-02-16 01:27:43 -0800309 if (!watchdog || cs->rating > watchdog->rating) {
Thomas Gleixner5d8b34f2007-02-16 01:27:43 -0800310 watchdog = cs;
Thomas Gleixner5d8b34f2007-02-16 01:27:43 -0800311 /* Reset watchdog cycles */
Martin Schwidefsky0f8e8ef2009-08-14 15:47:23 +0200312 clocksource_reset_watchdog();
Thomas Gleixner5d8b34f2007-02-16 01:27:43 -0800313 }
314 }
Martin Schwidefskyfb63a0e2009-08-14 15:47:24 +0200315 /* Check if the watchdog timer needs to be started. */
316 clocksource_start_watchdog();
Thomas Gleixner5d8b34f2007-02-16 01:27:43 -0800317 spin_unlock_irqrestore(&watchdog_lock, flags);
318}
Martin Schwidefskyfb63a0e2009-08-14 15:47:24 +0200319
320static void clocksource_dequeue_watchdog(struct clocksource *cs)
321{
322 struct clocksource *tmp;
323 unsigned long flags;
324
325 spin_lock_irqsave(&watchdog_lock, flags);
326 if (cs->flags & CLOCK_SOURCE_MUST_VERIFY) {
327 /* cs is a watched clocksource. */
328 list_del_init(&cs->wd_list);
329 } else if (cs == watchdog) {
330 /* Reset watchdog cycles */
331 clocksource_reset_watchdog();
332 /* Current watchdog is removed. Find an alternative. */
333 watchdog = NULL;
334 list_for_each_entry(tmp, &clocksource_list, list) {
335 if (tmp == cs || tmp->flags & CLOCK_SOURCE_MUST_VERIFY)
336 continue;
337 if (!watchdog || tmp->rating > watchdog->rating)
338 watchdog = tmp;
339 }
340 }
341 cs->flags &= ~CLOCK_SOURCE_WATCHDOG;
342 /* Check if the watchdog timer needs to be stopped. */
343 clocksource_stop_watchdog();
344 spin_unlock_irqrestore(&watchdog_lock, flags);
345}
346
Martin Schwidefsky01548f42009-08-18 17:09:42 +0200347static int clocksource_watchdog_kthread(void *data)
Martin Schwidefskyc55c87c2009-08-14 15:47:25 +0200348{
349 struct clocksource *cs, *tmp;
350 unsigned long flags;
Thomas Gleixner6ea41d22009-08-15 13:20:42 +0200351 LIST_HEAD(unstable);
Martin Schwidefskyc55c87c2009-08-14 15:47:25 +0200352
Thomas Gleixnerd0981a12009-08-19 11:26:09 +0200353 mutex_lock(&clocksource_mutex);
Martin Schwidefskyc55c87c2009-08-14 15:47:25 +0200354 spin_lock_irqsave(&watchdog_lock, flags);
355 list_for_each_entry_safe(cs, tmp, &watchdog_list, wd_list)
356 if (cs->flags & CLOCK_SOURCE_UNSTABLE) {
357 list_del_init(&cs->wd_list);
Thomas Gleixner6ea41d22009-08-15 13:20:42 +0200358 list_add(&cs->wd_list, &unstable);
Martin Schwidefskyc55c87c2009-08-14 15:47:25 +0200359 }
360 /* Check if the watchdog timer needs to be stopped. */
361 clocksource_stop_watchdog();
Thomas Gleixner6ea41d22009-08-15 13:20:42 +0200362 spin_unlock_irqrestore(&watchdog_lock, flags);
363
364 /* Needs to be done outside of watchdog lock */
365 list_for_each_entry_safe(cs, tmp, &unstable, wd_list) {
366 list_del_init(&cs->wd_list);
Thomas Gleixnerd0981a12009-08-19 11:26:09 +0200367 __clocksource_change_rating(cs, 0);
Thomas Gleixner6ea41d22009-08-15 13:20:42 +0200368 }
Thomas Gleixnerd0981a12009-08-19 11:26:09 +0200369 mutex_unlock(&clocksource_mutex);
Martin Schwidefsky01548f42009-08-18 17:09:42 +0200370 return 0;
Martin Schwidefskyc55c87c2009-08-14 15:47:25 +0200371}
372
Martin Schwidefskyfb63a0e2009-08-14 15:47:24 +0200373#else /* CONFIG_CLOCKSOURCE_WATCHDOG */
374
375static void clocksource_enqueue_watchdog(struct clocksource *cs)
Thomas Gleixner5d8b34f2007-02-16 01:27:43 -0800376{
377 if (cs->flags & CLOCK_SOURCE_IS_CONTINUOUS)
378 cs->flags |= CLOCK_SOURCE_VALID_FOR_HRES;
379}
Thomas Gleixnerb52f52a2007-05-09 02:35:15 -0700380
Martin Schwidefskyfb63a0e2009-08-14 15:47:24 +0200381static inline void clocksource_dequeue_watchdog(struct clocksource *cs) { }
Thomas Gleixnerb52f52a2007-05-09 02:35:15 -0700382static inline void clocksource_resume_watchdog(void) { }
Martin Schwidefskyfb63a0e2009-08-14 15:47:24 +0200383
384#endif /* CONFIG_CLOCKSOURCE_WATCHDOG */
Thomas Gleixner5d8b34f2007-02-16 01:27:43 -0800385
john stultz734efb42006-06-26 00:25:05 -0700386/**
Thomas Gleixnerb52f52a2007-05-09 02:35:15 -0700387 * clocksource_resume - resume the clocksource(s)
388 */
389void clocksource_resume(void)
390{
Matthias Kaehlcke2e197582007-10-18 23:39:58 -0700391 struct clocksource *cs;
Thomas Gleixnerb52f52a2007-05-09 02:35:15 -0700392
Martin Schwidefsky75c51582009-08-14 15:47:30 +0200393 mutex_lock(&clocksource_mutex);
Thomas Gleixnerb52f52a2007-05-09 02:35:15 -0700394
Martin Schwidefsky75c51582009-08-14 15:47:30 +0200395 list_for_each_entry(cs, &clocksource_list, list)
Thomas Gleixnerb52f52a2007-05-09 02:35:15 -0700396 if (cs->resume)
397 cs->resume();
Thomas Gleixnerb52f52a2007-05-09 02:35:15 -0700398
399 clocksource_resume_watchdog();
400
Martin Schwidefsky75c51582009-08-14 15:47:30 +0200401 mutex_unlock(&clocksource_mutex);
Thomas Gleixnerb52f52a2007-05-09 02:35:15 -0700402}
403
/**
 * clocksource_touch_watchdog - Update watchdog
 *
 * Resets the watchdog state. Meant to be called after exception
 * contexts such as kgdb, so that the time spent there does not
 * incorrectly trip the watchdog.
 */
void clocksource_touch_watchdog(void)
{
	clocksource_resume_watchdog();
}
415
Martin Schwidefskyf1b82742009-08-14 15:47:21 +0200416#ifdef CONFIG_GENERIC_TIME
john stultz734efb42006-06-26 00:25:05 -0700417
Martin Schwidefsky75c51582009-08-14 15:47:30 +0200418static int finished_booting;
john stultz734efb42006-06-26 00:25:05 -0700419
420/**
Martin Schwidefskyf1b82742009-08-14 15:47:21 +0200421 * clocksource_select - Select the best clocksource available
john stultz734efb42006-06-26 00:25:05 -0700422 *
Martin Schwidefsky75c51582009-08-14 15:47:30 +0200423 * Private function. Must hold clocksource_mutex when called.
john stultz734efb42006-06-26 00:25:05 -0700424 *
Thomas Gleixner92c7e002007-02-16 01:27:33 -0800425 * Select the clocksource with the best rating, or the clocksource,
426 * which is selected by userspace override.
john stultz734efb42006-06-26 00:25:05 -0700427 */
Martin Schwidefskyf1b82742009-08-14 15:47:21 +0200428static void clocksource_select(void)
john stultz734efb42006-06-26 00:25:05 -0700429{
Martin Schwidefskyf1b82742009-08-14 15:47:21 +0200430 struct clocksource *best, *cs;
Thomas Gleixner5d8b34f2007-02-16 01:27:43 -0800431
Martin Schwidefsky75c51582009-08-14 15:47:30 +0200432 if (!finished_booting || list_empty(&clocksource_list))
Martin Schwidefskyf1b82742009-08-14 15:47:21 +0200433 return;
434 /* First clocksource on the list has the best rating. */
435 best = list_first_entry(&clocksource_list, struct clocksource, list);
436 /* Check for the override clocksource. */
437 list_for_each_entry(cs, &clocksource_list, list) {
438 if (strcmp(cs->name, override_name) != 0)
439 continue;
440 /*
441 * Check to make sure we don't switch to a non-highres
442 * capable clocksource if the tick code is in oneshot
443 * mode (highres or nohz)
444 */
445 if (!(cs->flags & CLOCK_SOURCE_VALID_FOR_HRES) &&
446 tick_oneshot_mode_active()) {
447 /* Override clocksource cannot be used. */
448 printk(KERN_WARNING "Override clocksource %s is not "
449 "HRT compatible. Cannot switch while in "
450 "HRT/NOHZ mode\n", cs->name);
451 override_name[0] = 0;
452 } else
453 /* Override clocksource can be used. */
454 best = cs;
455 break;
456 }
Martin Schwidefsky75c51582009-08-14 15:47:30 +0200457 if (curr_clocksource != best) {
458 printk(KERN_INFO "Switching to clocksource %s\n", best->name);
459 curr_clocksource = best;
460 timekeeping_notify(curr_clocksource);
461 }
john stultz734efb42006-06-26 00:25:05 -0700462}
463
Martin Schwidefsky75c51582009-08-14 15:47:30 +0200464/*
465 * clocksource_done_booting - Called near the end of core bootup
466 *
467 * Hack to avoid lots of clocksource churn at boot time.
468 * We use fs_initcall because we want this to start before
469 * device_initcall but after subsys_initcall.
470 */
471static int __init clocksource_done_booting(void)
472{
473 finished_booting = 1;
474 clocksource_select();
475 return 0;
476}
477fs_initcall(clocksource_done_booting);
478
Martin Schwidefskyf1b82742009-08-14 15:47:21 +0200479#else /* CONFIG_GENERIC_TIME */
480
Martin Schwidefsky75c51582009-08-14 15:47:30 +0200481static inline void clocksource_select(void) { }
Martin Schwidefskyf1b82742009-08-14 15:47:21 +0200482
483#endif
484
Thomas Gleixner92c7e002007-02-16 01:27:33 -0800485/*
486 * Enqueue the clocksource sorted by rating
john stultz734efb42006-06-26 00:25:05 -0700487 */
Martin Schwidefskyf1b82742009-08-14 15:47:21 +0200488static void clocksource_enqueue(struct clocksource *cs)
john stultz734efb42006-06-26 00:25:05 -0700489{
Martin Schwidefskyf1b82742009-08-14 15:47:21 +0200490 struct list_head *entry = &clocksource_list;
491 struct clocksource *tmp;
john stultz734efb42006-06-26 00:25:05 -0700492
Martin Schwidefskyf1b82742009-08-14 15:47:21 +0200493 list_for_each_entry(tmp, &clocksource_list, list)
Thomas Gleixner92c7e002007-02-16 01:27:33 -0800494 /* Keep track of the place, where to insert */
Martin Schwidefskyf1b82742009-08-14 15:47:21 +0200495 if (tmp->rating >= cs->rating)
496 entry = &tmp->list;
497 list_add(&cs->list, entry);
john stultz734efb42006-06-26 00:25:05 -0700498}
499
500/**
john stultza2752542006-06-26 00:25:14 -0700501 * clocksource_register - Used to install new clocksources
john stultz734efb42006-06-26 00:25:05 -0700502 * @t: clocksource to be registered
503 *
504 * Returns -EBUSY if registration fails, zero otherwise.
505 */
Martin Schwidefskyf1b82742009-08-14 15:47:21 +0200506int clocksource_register(struct clocksource *cs)
john stultz734efb42006-06-26 00:25:05 -0700507{
Martin Schwidefsky75c51582009-08-14 15:47:30 +0200508 mutex_lock(&clocksource_mutex);
Martin Schwidefskyf1b82742009-08-14 15:47:21 +0200509 clocksource_enqueue(cs);
510 clocksource_select();
Martin Schwidefskyfb63a0e2009-08-14 15:47:24 +0200511 clocksource_enqueue_watchdog(cs);
Martin Schwidefsky75c51582009-08-14 15:47:30 +0200512 mutex_unlock(&clocksource_mutex);
Martin Schwidefskyf1b82742009-08-14 15:47:21 +0200513 return 0;
john stultz734efb42006-06-26 00:25:05 -0700514}
john stultza2752542006-06-26 00:25:14 -0700515EXPORT_SYMBOL(clocksource_register);
john stultz734efb42006-06-26 00:25:05 -0700516
Thomas Gleixnerd0981a12009-08-19 11:26:09 +0200517static void __clocksource_change_rating(struct clocksource *cs, int rating)
518{
519 list_del(&cs->list);
520 cs->rating = rating;
521 clocksource_enqueue(cs);
522 clocksource_select();
523}
524
john stultz734efb42006-06-26 00:25:05 -0700525/**
Thomas Gleixner92c7e002007-02-16 01:27:33 -0800526 * clocksource_change_rating - Change the rating of a registered clocksource
john stultz734efb42006-06-26 00:25:05 -0700527 */
Thomas Gleixner92c7e002007-02-16 01:27:33 -0800528void clocksource_change_rating(struct clocksource *cs, int rating)
john stultz734efb42006-06-26 00:25:05 -0700529{
Martin Schwidefsky75c51582009-08-14 15:47:30 +0200530 mutex_lock(&clocksource_mutex);
Thomas Gleixnerd0981a12009-08-19 11:26:09 +0200531 __clocksource_change_rating(cs, rating);
Martin Schwidefsky75c51582009-08-14 15:47:30 +0200532 mutex_unlock(&clocksource_mutex);
john stultz734efb42006-06-26 00:25:05 -0700533}
Martin Schwidefskyfb63a0e2009-08-14 15:47:24 +0200534EXPORT_SYMBOL(clocksource_change_rating);
john stultz734efb42006-06-26 00:25:05 -0700535
Thomas Gleixner4713e22c2008-01-30 13:30:02 +0100536/**
537 * clocksource_unregister - remove a registered clocksource
538 */
539void clocksource_unregister(struct clocksource *cs)
540{
Martin Schwidefsky75c51582009-08-14 15:47:30 +0200541 mutex_lock(&clocksource_mutex);
Martin Schwidefskyfb63a0e2009-08-14 15:47:24 +0200542 clocksource_dequeue_watchdog(cs);
Thomas Gleixner4713e22c2008-01-30 13:30:02 +0100543 list_del(&cs->list);
Martin Schwidefskyf1b82742009-08-14 15:47:21 +0200544 clocksource_select();
Martin Schwidefsky75c51582009-08-14 15:47:30 +0200545 mutex_unlock(&clocksource_mutex);
Thomas Gleixner4713e22c2008-01-30 13:30:02 +0100546}
Martin Schwidefskyfb63a0e2009-08-14 15:47:24 +0200547EXPORT_SYMBOL(clocksource_unregister);
Thomas Gleixner4713e22c2008-01-30 13:30:02 +0100548
Daniel Walker2b013702006-12-10 02:21:30 -0800549#ifdef CONFIG_SYSFS
john stultz734efb42006-06-26 00:25:05 -0700550/**
551 * sysfs_show_current_clocksources - sysfs interface for current clocksource
552 * @dev: unused
553 * @buf: char buffer to be filled with clocksource list
554 *
555 * Provides sysfs interface for listing current clocksource.
556 */
557static ssize_t
Andi Kleen4a0b2b42008-07-01 18:48:41 +0200558sysfs_show_current_clocksources(struct sys_device *dev,
559 struct sysdev_attribute *attr, char *buf)
john stultz734efb42006-06-26 00:25:05 -0700560{
Miao Xie5e2cb102008-02-06 01:36:53 -0800561 ssize_t count = 0;
john stultz734efb42006-06-26 00:25:05 -0700562
Martin Schwidefsky75c51582009-08-14 15:47:30 +0200563 mutex_lock(&clocksource_mutex);
Miao Xie5e2cb102008-02-06 01:36:53 -0800564 count = snprintf(buf, PAGE_SIZE, "%s\n", curr_clocksource->name);
Martin Schwidefsky75c51582009-08-14 15:47:30 +0200565 mutex_unlock(&clocksource_mutex);
john stultz734efb42006-06-26 00:25:05 -0700566
Miao Xie5e2cb102008-02-06 01:36:53 -0800567 return count;
john stultz734efb42006-06-26 00:25:05 -0700568}
569
570/**
571 * sysfs_override_clocksource - interface for manually overriding clocksource
572 * @dev: unused
573 * @buf: name of override clocksource
574 * @count: length of buffer
575 *
576 * Takes input from sysfs interface for manually overriding the default
577 * clocksource selction.
578 */
579static ssize_t sysfs_override_clocksource(struct sys_device *dev,
Andi Kleen4a0b2b42008-07-01 18:48:41 +0200580 struct sysdev_attribute *attr,
john stultz734efb42006-06-26 00:25:05 -0700581 const char *buf, size_t count)
582{
583 size_t ret = count;
Thomas Gleixner92c7e002007-02-16 01:27:33 -0800584
john stultz734efb42006-06-26 00:25:05 -0700585 /* strings from sysfs write are not 0 terminated! */
586 if (count >= sizeof(override_name))
587 return -EINVAL;
588
589 /* strip of \n: */
590 if (buf[count-1] == '\n')
591 count--;
john stultz734efb42006-06-26 00:25:05 -0700592
Martin Schwidefsky75c51582009-08-14 15:47:30 +0200593 mutex_lock(&clocksource_mutex);
john stultz734efb42006-06-26 00:25:05 -0700594
Thomas Gleixner92c7e002007-02-16 01:27:33 -0800595 if (count > 0)
596 memcpy(override_name, buf, count);
john stultz734efb42006-06-26 00:25:05 -0700597 override_name[count] = 0;
Martin Schwidefskyf1b82742009-08-14 15:47:21 +0200598 clocksource_select();
john stultz734efb42006-06-26 00:25:05 -0700599
Martin Schwidefsky75c51582009-08-14 15:47:30 +0200600 mutex_unlock(&clocksource_mutex);
john stultz734efb42006-06-26 00:25:05 -0700601
602 return ret;
603}
604
605/**
606 * sysfs_show_available_clocksources - sysfs interface for listing clocksource
607 * @dev: unused
608 * @buf: char buffer to be filled with clocksource list
609 *
610 * Provides sysfs interface for listing registered clocksources
611 */
612static ssize_t
Andi Kleen4a0b2b42008-07-01 18:48:41 +0200613sysfs_show_available_clocksources(struct sys_device *dev,
614 struct sysdev_attribute *attr,
615 char *buf)
john stultz734efb42006-06-26 00:25:05 -0700616{
Matthias Kaehlcke2e197582007-10-18 23:39:58 -0700617 struct clocksource *src;
Miao Xie5e2cb102008-02-06 01:36:53 -0800618 ssize_t count = 0;
john stultz734efb42006-06-26 00:25:05 -0700619
Martin Schwidefsky75c51582009-08-14 15:47:30 +0200620 mutex_lock(&clocksource_mutex);
Matthias Kaehlcke2e197582007-10-18 23:39:58 -0700621 list_for_each_entry(src, &clocksource_list, list) {
Thomas Gleixnercd6d95d2009-06-12 11:29:27 +0200622 /*
623 * Don't show non-HRES clocksource if the tick code is
624 * in one shot mode (highres=on or nohz=on)
625 */
626 if (!tick_oneshot_mode_active() ||
627 (src->flags & CLOCK_SOURCE_VALID_FOR_HRES))
john stultz3f685352009-01-21 22:53:22 -0700628 count += snprintf(buf + count,
Miao Xie5e2cb102008-02-06 01:36:53 -0800629 max((ssize_t)PAGE_SIZE - count, (ssize_t)0),
630 "%s ", src->name);
john stultz734efb42006-06-26 00:25:05 -0700631 }
Martin Schwidefsky75c51582009-08-14 15:47:30 +0200632 mutex_unlock(&clocksource_mutex);
john stultz734efb42006-06-26 00:25:05 -0700633
Miao Xie5e2cb102008-02-06 01:36:53 -0800634 count += snprintf(buf + count,
635 max((ssize_t)PAGE_SIZE - count, (ssize_t)0), "\n");
john stultz734efb42006-06-26 00:25:05 -0700636
Miao Xie5e2cb102008-02-06 01:36:53 -0800637 return count;
john stultz734efb42006-06-26 00:25:05 -0700638}
639
640/*
641 * Sysfs setup bits:
642 */
Heiko Carstens4f95f812008-05-03 14:23:14 +0200643static SYSDEV_ATTR(current_clocksource, 0644, sysfs_show_current_clocksources,
Daniel Walkerf5f1a242006-12-10 02:21:33 -0800644 sysfs_override_clocksource);
john stultz734efb42006-06-26 00:25:05 -0700645
Heiko Carstens4f95f812008-05-03 14:23:14 +0200646static SYSDEV_ATTR(available_clocksource, 0444,
Daniel Walkerf5f1a242006-12-10 02:21:33 -0800647 sysfs_show_available_clocksources, NULL);
john stultz734efb42006-06-26 00:25:05 -0700648
649static struct sysdev_class clocksource_sysclass = {
Kay Sieversaf5ca3f2007-12-20 02:09:39 +0100650 .name = "clocksource",
john stultz734efb42006-06-26 00:25:05 -0700651};
652
653static struct sys_device device_clocksource = {
654 .id = 0,
655 .cls = &clocksource_sysclass,
656};
657
john stultzad596172006-06-26 00:25:06 -0700658static int __init init_clocksource_sysfs(void)
john stultz734efb42006-06-26 00:25:05 -0700659{
660 int error = sysdev_class_register(&clocksource_sysclass);
661
662 if (!error)
663 error = sysdev_register(&device_clocksource);
664 if (!error)
665 error = sysdev_create_file(
666 &device_clocksource,
667 &attr_current_clocksource);
668 if (!error)
669 error = sysdev_create_file(
670 &device_clocksource,
671 &attr_available_clocksource);
672 return error;
673}
674
675device_initcall(init_clocksource_sysfs);
Daniel Walker2b013702006-12-10 02:21:30 -0800676#endif /* CONFIG_SYSFS */
john stultz734efb42006-06-26 00:25:05 -0700677
678/**
679 * boot_override_clocksource - boot clock override
680 * @str: override name
681 *
682 * Takes a clocksource= boot argument and uses it
683 * as the clocksource override name.
684 */
685static int __init boot_override_clocksource(char* str)
686{
Martin Schwidefsky75c51582009-08-14 15:47:30 +0200687 mutex_lock(&clocksource_mutex);
john stultz734efb42006-06-26 00:25:05 -0700688 if (str)
689 strlcpy(override_name, str, sizeof(override_name));
Martin Schwidefsky75c51582009-08-14 15:47:30 +0200690 mutex_unlock(&clocksource_mutex);
john stultz734efb42006-06-26 00:25:05 -0700691 return 1;
692}
693
694__setup("clocksource=", boot_override_clocksource);
695
696/**
697 * boot_override_clock - Compatibility layer for deprecated boot option
698 * @str: override name
699 *
700 * DEPRECATED! Takes a clock= boot argument and uses it
701 * as the clocksource override name
702 */
703static int __init boot_override_clock(char* str)
704{
john stultz5d0cf412006-06-26 00:25:12 -0700705 if (!strcmp(str, "pmtmr")) {
706 printk("Warning: clock=pmtmr is deprecated. "
707 "Use clocksource=acpi_pm.\n");
708 return boot_override_clocksource("acpi_pm");
709 }
710 printk("Warning! clock= boot option is deprecated. "
711 "Use clocksource=xyz\n");
john stultz734efb42006-06-26 00:25:05 -0700712 return boot_override_clocksource(str);
713}
714
715__setup("clock=", boot_override_clock);