2 * linux/kernel/time/clocksource.c
4 * This file contains the functions which manage clocksource drivers.
6 * Copyright (C) 2004, 2005 IBM, John Stultz (johnstul@us.ibm.com)
8 * This program is free software; you can redistribute it and/or modify
9 * it under the terms of the GNU General Public License as published by
10 * the Free Software Foundation; either version 2 of the License, or
11 * (at your option) any later version.
13 * This program is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 * GNU General Public License for more details.
18 * You should have received a copy of the GNU General Public License
19 * along with this program; if not, write to the Free Software
20 * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
23 * o Allow clocksource drivers to be unregistered
24 * o get rid of clocksource_jiffies extern
27 #include <linux/clocksource.h>
28 #include <linux/sysdev.h>
29 #include <linux/init.h>
30 #include <linux/module.h>
31 #include <linux/sched.h> /* for spin_unlock_irq() using preempt_count() m68k */
32 #include <linux/tick.h>
34 void timecounter_init(struct timecounter
*tc
,
35 const struct cyclecounter
*cc
,
39 tc
->cycle_last
= cc
->read(cc
);
40 tc
->nsec
= start_tstamp
;
42 EXPORT_SYMBOL(timecounter_init
);
45 * timecounter_read_delta - get nanoseconds since last call of this function
46 * @tc: Pointer to time counter
48 * When the underlying cycle counter runs over, this will be handled
49 * correctly as long as it does not run over more than once between
52 * The first call to this function for a new time counter initializes
53 * the time tracking and returns an undefined result.
55 static u64
timecounter_read_delta(struct timecounter
*tc
)
57 cycle_t cycle_now
, cycle_delta
;
60 /* read cycle counter: */
61 cycle_now
= tc
->cc
->read(tc
->cc
);
63 /* calculate the delta since the last timecounter_read_delta(): */
64 cycle_delta
= (cycle_now
- tc
->cycle_last
) & tc
->cc
->mask
;
66 /* convert to nanoseconds: */
67 ns_offset
= cyclecounter_cyc2ns(tc
->cc
, cycle_delta
);
69 /* update time stamp of timecounter_read_delta() call: */
70 tc
->cycle_last
= cycle_now
;
75 u64
timecounter_read(struct timecounter
*tc
)
79 /* increment time by nanoseconds since last call */
80 nsec
= timecounter_read_delta(tc
);
86 EXPORT_SYMBOL(timecounter_read
);
88 u64
timecounter_cyc2time(struct timecounter
*tc
,
91 u64 cycle_delta
= (cycle_tstamp
- tc
->cycle_last
) & tc
->cc
->mask
;
95 * Instead of always treating cycle_tstamp as more recent
96 * than tc->cycle_last, detect when it is too far in the
97 * future and treat it as old time stamp instead.
99 if (cycle_delta
> tc
->cc
->mask
/ 2) {
100 cycle_delta
= (tc
->cycle_last
- cycle_tstamp
) & tc
->cc
->mask
;
101 nsec
= tc
->nsec
- cyclecounter_cyc2ns(tc
->cc
, cycle_delta
);
103 nsec
= cyclecounter_cyc2ns(tc
->cc
, cycle_delta
) + tc
->nsec
;
108 EXPORT_SYMBOL(timecounter_cyc2time
);
/* XXX - Would like a better way for initializing curr_clocksource */
extern struct clocksource clocksource_jiffies;

/*[Clocksource internal variables]---------
 * curr_clocksource:
 *	currently selected clocksource. Initialized to clocksource_jiffies.
 * next_clocksource:
 *	pending next selected clocksource.
 * clocksource_override:
 *	registered clocksource whose name equals override_name, if any.
 * clocksource_list:
 *	linked list with the registered clocksources
 * clocksource_lock:
 *	protects manipulations to curr_clocksource and next_clocksource
 *	and the clocksource_list
 * override_name:
 *	Name of the user-specified clocksource.
 * finished_booting:
 *	set to 1 by clocksource_done_booting(); clocksource_get_next()
 *	only switches to next_clocksource once it is non-zero.
 */
static struct clocksource *curr_clocksource = &clocksource_jiffies;
static struct clocksource *next_clocksource;
static struct clocksource *clocksource_override;
static LIST_HEAD(clocksource_list);
static DEFINE_SPINLOCK(clocksource_lock);
static char override_name[32];
static int finished_booting;

134 /* clocksource_done_booting - Called near the end of core bootup
136 * Hack to avoid lots of clocksource churn at boot time.
137 * We use fs_initcall because we want this to start before
138 * device_initcall but after subsys_initcall.
140 static int __init
clocksource_done_booting(void)
142 finished_booting
= 1;
145 fs_initcall(clocksource_done_booting
);
147 #ifdef CONFIG_CLOCKSOURCE_WATCHDOG
148 static LIST_HEAD(watchdog_list
);
149 static struct clocksource
*watchdog
;
150 static struct timer_list watchdog_timer
;
151 static DEFINE_SPINLOCK(watchdog_lock
);
152 static cycle_t watchdog_last
;
153 static unsigned long watchdog_resumed
;
156 * Interval: 0.5sec Threshold: 0.0625s
158 #define WATCHDOG_INTERVAL (HZ >> 1)
159 #define WATCHDOG_THRESHOLD (NSEC_PER_SEC >> 4)
161 static void clocksource_ratewd(struct clocksource
*cs
, int64_t delta
)
163 if (delta
> -WATCHDOG_THRESHOLD
&& delta
< WATCHDOG_THRESHOLD
)
166 printk(KERN_WARNING
"Clocksource %s unstable (delta = %Ld ns)\n",
168 cs
->flags
&= ~(CLOCK_SOURCE_VALID_FOR_HRES
| CLOCK_SOURCE_WATCHDOG
);
169 clocksource_change_rating(cs
, 0);
170 list_del(&cs
->wd_list
);
173 static void clocksource_watchdog(unsigned long data
)
175 struct clocksource
*cs
, *tmp
;
176 cycle_t csnow
, wdnow
;
177 int64_t wd_nsec
, cs_nsec
;
180 spin_lock(&watchdog_lock
);
182 resumed
= test_and_clear_bit(0, &watchdog_resumed
);
184 wdnow
= watchdog
->read(watchdog
);
185 wd_nsec
= cyc2ns(watchdog
, (wdnow
- watchdog_last
) & watchdog
->mask
);
186 watchdog_last
= wdnow
;
188 list_for_each_entry_safe(cs
, tmp
, &watchdog_list
, wd_list
) {
189 csnow
= cs
->read(cs
);
191 if (unlikely(resumed
)) {
197 if (!(cs
->flags
& CLOCK_SOURCE_WATCHDOG
)) {
198 if ((cs
->flags
& CLOCK_SOURCE_IS_CONTINUOUS
) &&
199 (watchdog
->flags
& CLOCK_SOURCE_IS_CONTINUOUS
)) {
200 cs
->flags
|= CLOCK_SOURCE_VALID_FOR_HRES
;
202 * We just marked the clocksource as
203 * highres-capable, notify the rest of the
204 * system as well so that we transition
205 * into high-res mode:
209 cs
->flags
|= CLOCK_SOURCE_WATCHDOG
;
212 cs_nsec
= cyc2ns(cs
, (csnow
- cs
->wd_last
) & cs
->mask
);
214 /* Check the delta. Might remove from the list ! */
215 clocksource_ratewd(cs
, cs_nsec
- wd_nsec
);
219 if (!list_empty(&watchdog_list
)) {
221 * Cycle through CPUs to check if the CPUs stay
222 * synchronized to each other.
224 int next_cpu
= cpumask_next(raw_smp_processor_id(),
227 if (next_cpu
>= nr_cpu_ids
)
228 next_cpu
= cpumask_first(cpu_online_mask
);
229 watchdog_timer
.expires
+= WATCHDOG_INTERVAL
;
230 add_timer_on(&watchdog_timer
, next_cpu
);
232 spin_unlock(&watchdog_lock
);
234 static void clocksource_resume_watchdog(void)
236 set_bit(0, &watchdog_resumed
);
239 static void clocksource_check_watchdog(struct clocksource
*cs
)
241 struct clocksource
*cse
;
244 spin_lock_irqsave(&watchdog_lock
, flags
);
245 if (cs
->flags
& CLOCK_SOURCE_MUST_VERIFY
) {
246 int started
= !list_empty(&watchdog_list
);
248 list_add(&cs
->wd_list
, &watchdog_list
);
249 if (!started
&& watchdog
) {
250 watchdog_last
= watchdog
->read(watchdog
);
251 watchdog_timer
.expires
= jiffies
+ WATCHDOG_INTERVAL
;
252 add_timer_on(&watchdog_timer
,
253 cpumask_first(cpu_online_mask
));
256 if (cs
->flags
& CLOCK_SOURCE_IS_CONTINUOUS
)
257 cs
->flags
|= CLOCK_SOURCE_VALID_FOR_HRES
;
259 if (!watchdog
|| cs
->rating
> watchdog
->rating
) {
261 del_timer(&watchdog_timer
);
263 init_timer(&watchdog_timer
);
264 watchdog_timer
.function
= clocksource_watchdog
;
266 /* Reset watchdog cycles */
267 list_for_each_entry(cse
, &watchdog_list
, wd_list
)
268 cse
->flags
&= ~CLOCK_SOURCE_WATCHDOG
;
269 /* Start if list is not empty */
270 if (!list_empty(&watchdog_list
)) {
271 watchdog_last
= watchdog
->read(watchdog
);
272 watchdog_timer
.expires
=
273 jiffies
+ WATCHDOG_INTERVAL
;
274 add_timer_on(&watchdog_timer
,
275 cpumask_first(cpu_online_mask
));
279 spin_unlock_irqrestore(&watchdog_lock
, flags
);
282 static void clocksource_check_watchdog(struct clocksource
*cs
)
284 if (cs
->flags
& CLOCK_SOURCE_IS_CONTINUOUS
)
285 cs
->flags
|= CLOCK_SOURCE_VALID_FOR_HRES
;
288 static inline void clocksource_resume_watchdog(void) { }
292 * clocksource_resume - resume the clocksource(s)
294 void clocksource_resume(void)
296 struct clocksource
*cs
;
299 spin_lock_irqsave(&clocksource_lock
, flags
);
301 list_for_each_entry(cs
, &clocksource_list
, list
) {
306 clocksource_resume_watchdog();
308 spin_unlock_irqrestore(&clocksource_lock
, flags
);
/**
 * clocksource_touch_watchdog - Update watchdog
 *
 * Update the watchdog after exception contexts such as kgdb so as not
 * to incorrectly trip the watchdog.
 *
 * Simply forwards to clocksource_resume_watchdog().
 */
void clocksource_touch_watchdog(void)
{
	clocksource_resume_watchdog();
}

324 * clocksource_get_next - Returns the selected clocksource
327 struct clocksource
*clocksource_get_next(void)
331 spin_lock_irqsave(&clocksource_lock
, flags
);
332 if (next_clocksource
&& finished_booting
) {
333 curr_clocksource
= next_clocksource
;
334 next_clocksource
= NULL
;
336 spin_unlock_irqrestore(&clocksource_lock
, flags
);
338 return curr_clocksource
;
342 * select_clocksource - Selects the best registered clocksource.
344 * Private function. Must hold clocksource_lock when called.
346 * Select the clocksource with the best rating, or the clocksource,
347 * which is selected by userspace override.
349 static struct clocksource
*select_clocksource(void)
351 struct clocksource
*next
;
353 if (list_empty(&clocksource_list
))
356 if (clocksource_override
)
357 next
= clocksource_override
;
359 next
= list_entry(clocksource_list
.next
, struct clocksource
,
362 if (next
== curr_clocksource
)
369 * Enqueue the clocksource sorted by rating
371 static int clocksource_enqueue(struct clocksource
*c
)
373 struct list_head
*tmp
, *entry
= &clocksource_list
;
375 list_for_each(tmp
, &clocksource_list
) {
376 struct clocksource
*cs
;
378 cs
= list_entry(tmp
, struct clocksource
, list
);
381 /* Keep track of the place, where to insert */
382 if (cs
->rating
>= c
->rating
)
385 list_add(&c
->list
, entry
);
387 if (strlen(c
->name
) == strlen(override_name
) &&
388 !strcmp(c
->name
, override_name
))
389 clocksource_override
= c
;
395 * clocksource_register - Used to install new clocksources
396 * @c: clocksource to be registered
398 * Returns -EBUSY if registration fails, zero otherwise.
400 int clocksource_register(struct clocksource
*c
)
405 spin_lock_irqsave(&clocksource_lock
, flags
);
406 ret
= clocksource_enqueue(c
);
408 next_clocksource
= select_clocksource();
409 spin_unlock_irqrestore(&clocksource_lock
, flags
);
411 clocksource_check_watchdog(c
);
414 EXPORT_SYMBOL(clocksource_register
);
417 * clocksource_change_rating - Change the rating of a registered clocksource
420 void clocksource_change_rating(struct clocksource
*cs
, int rating
)
424 spin_lock_irqsave(&clocksource_lock
, flags
);
427 clocksource_enqueue(cs
);
428 next_clocksource
= select_clocksource();
429 spin_unlock_irqrestore(&clocksource_lock
, flags
);
433 * clocksource_unregister - remove a registered clocksource
435 void clocksource_unregister(struct clocksource
*cs
)
439 spin_lock_irqsave(&clocksource_lock
, flags
);
441 if (clocksource_override
== cs
)
442 clocksource_override
= NULL
;
443 next_clocksource
= select_clocksource();
444 spin_unlock_irqrestore(&clocksource_lock
, flags
);
449 * sysfs_show_current_clocksources - sysfs interface for current clocksource
451 * @buf: char buffer to be filled with the current clocksource name
453 * Provides sysfs interface for listing current clocksource.
456 sysfs_show_current_clocksources(struct sys_device
*dev
,
457 struct sysdev_attribute
*attr
, char *buf
)
461 spin_lock_irq(&clocksource_lock
);
462 count
= snprintf(buf
, PAGE_SIZE
, "%s\n", curr_clocksource
->name
);
463 spin_unlock_irq(&clocksource_lock
);
469 * sysfs_override_clocksource - interface for manually overriding clocksource
471 * @buf: name of override clocksource
472 * @count: length of buffer
474 * Takes input from sysfs interface for manually overriding the default
475 * clocksource selection.
477 static ssize_t
sysfs_override_clocksource(struct sys_device
*dev
,
478 struct sysdev_attribute
*attr
,
479 const char *buf
, size_t count
)
481 struct clocksource
*ovr
= NULL
;
485 /* strings from sysfs write are not 0 terminated! */
486 if (count
>= sizeof(override_name
))
490 if (buf
[count
-1] == '\n')
493 spin_lock_irq(&clocksource_lock
);
496 memcpy(override_name
, buf
, count
);
497 override_name
[count
] = 0;
499 len
= strlen(override_name
);
501 struct clocksource
*cs
;
503 ovr
= clocksource_override
;
504 /* try to select it: */
505 list_for_each_entry(cs
, &clocksource_list
, list
) {
506 if (strlen(cs
->name
) == len
&&
507 !strcmp(cs
->name
, override_name
))
513 * Check to make sure we don't switch to a non-highres capable
514 * clocksource if the tick code is in oneshot mode (highres or nohz)
516 if (tick_oneshot_mode_active() && ovr
&&
517 !(ovr
->flags
& CLOCK_SOURCE_VALID_FOR_HRES
)) {
518 printk(KERN_WARNING
"%s clocksource is not HRT compatible. "
519 "Cannot switch while in HRT/NOHZ mode\n", ovr
->name
);
521 override_name
[0] = 0;
524 /* Reselect, when the override name has changed */
525 if (ovr
!= clocksource_override
) {
526 clocksource_override
= ovr
;
527 next_clocksource
= select_clocksource();
530 spin_unlock_irq(&clocksource_lock
);
536 * sysfs_show_available_clocksources - sysfs interface for listing clocksource
538 * @buf: char buffer to be filled with clocksource list
540 * Provides sysfs interface for listing registered clocksources
543 sysfs_show_available_clocksources(struct sys_device
*dev
,
544 struct sysdev_attribute
*attr
,
547 struct clocksource
*src
;
550 spin_lock_irq(&clocksource_lock
);
551 list_for_each_entry(src
, &clocksource_list
, list
) {
553 * Don't show non-HRES clocksource if the tick code is
554 * in one shot mode (highres=on or nohz=on)
556 if (!tick_oneshot_mode_active() ||
557 (src
->flags
& CLOCK_SOURCE_VALID_FOR_HRES
))
558 count
+= snprintf(buf
+ count
,
559 max((ssize_t
)PAGE_SIZE
- count
, (ssize_t
)0),
562 spin_unlock_irq(&clocksource_lock
);
564 count
+= snprintf(buf
+ count
,
565 max((ssize_t
)PAGE_SIZE
- count
, (ssize_t
)0), "\n");
573 static SYSDEV_ATTR(current_clocksource
, 0644, sysfs_show_current_clocksources
,
574 sysfs_override_clocksource
);
576 static SYSDEV_ATTR(available_clocksource
, 0444,
577 sysfs_show_available_clocksources
, NULL
);
579 static struct sysdev_class clocksource_sysclass
= {
580 .name
= "clocksource",
583 static struct sys_device device_clocksource
= {
585 .cls
= &clocksource_sysclass
,
588 static int __init
init_clocksource_sysfs(void)
590 int error
= sysdev_class_register(&clocksource_sysclass
);
593 error
= sysdev_register(&device_clocksource
);
595 error
= sysdev_create_file(
597 &attr_current_clocksource
);
599 error
= sysdev_create_file(
601 &attr_available_clocksource
);
605 device_initcall(init_clocksource_sysfs
);
606 #endif /* CONFIG_SYSFS */
609 * boot_override_clocksource - boot clock override
610 * @str: override name
612 * Takes a clocksource= boot argument and uses it
613 * as the clocksource override name.
615 static int __init
boot_override_clocksource(char* str
)
618 spin_lock_irqsave(&clocksource_lock
, flags
);
620 strlcpy(override_name
, str
, sizeof(override_name
));
621 spin_unlock_irqrestore(&clocksource_lock
, flags
);
625 __setup("clocksource=", boot_override_clocksource
);
628 * boot_override_clock - Compatibility layer for deprecated boot option
629 * @str: override name
631 * DEPRECATED! Takes a clock= boot argument and uses it
632 * as the clocksource override name
634 static int __init
boot_override_clock(char* str
)
636 if (!strcmp(str
, "pmtmr")) {
637 printk("Warning: clock=pmtmr is deprecated. "
638 "Use clocksource=acpi_pm.\n");
639 return boot_override_clocksource("acpi_pm");
641 printk("Warning! clock= boot option is deprecated. "
642 "Use clocksource=xyz\n");
643 return boot_override_clocksource(str
);
646 __setup("clock=", boot_override_clock
);