author	Roman Zippel <zippel@linux-m68k.org>	2006-06-26 03:25:18 -0400
committer	Linus Torvalds <torvalds@g5.osdl.org>	2006-06-26 12:58:21 -0400
commit	19923c190e0932bf0ac1e1d06a48f5c3678dd0de (patch)
tree	2a32f5f16b3bbebd74c0f4910493c7f28a70fd84
parent	6415ce9a922a1446e7ee0ac9b016082232ebe373 (diff)
[PATCH] fix and optimize clock source update
This fixes the clock source updates in update_wall_time() to correctly
track the time coming in via current_tick_length().  Optimize the fast
paths to be as short as possible to keep the overhead low.

Signed-off-by: Roman Zippel <zippel@linux-m68k.org>
Acked-by: John Stultz <johnstul@us.ibm.com>
Signed-off-by: Andrew Morton <akpm@osdl.org>
Signed-off-by: Linus Torvalds <torvalds@osdl.org>
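For readers skimming the diff below: the heart of the change is that current_tick_length() now returns the NTP tick length as nanoseconds scaled by 2^TICK_LENGTH_SHIFT, and update_wall_time() accumulates the difference between that value and what the clocksource actually advanced into clock->error. The following user-space sketch of that bookkeeping is illustrative only; struct clock_sim and accumulate_one_tick() are simplified stand-ins, not kernel names.

    #include <stdio.h>
    #include <stdint.h>
    #include <inttypes.h>

    #define TICK_LENGTH_SHIFT 32

    /* Simplified stand-ins; not the kernel's struct clocksource. */
    struct clock_sim {
    	uint32_t shift;           /* cycle-to-nanosecond shift of the clocksource */
    	uint64_t xtime_interval;  /* nanoseconds per tick, scaled by 2^shift */
    	int64_t  error;           /* error in nanoseconds, scaled by 2^TICK_LENGTH_SHIFT */
    };

    /* One tick: add what NTP asked for, subtract what the clocksource advanced. */
    void accumulate_one_tick(struct clock_sim *c, uint64_t tick_length)
    {
    	c->error += (int64_t)tick_length;
    	c->error -= (int64_t)(c->xtime_interval << (TICK_LENGTH_SHIFT - c->shift));
    }

    int main(void)
    {
    	/* 1 ms tick; the clocksource interval is 10 ppm short of it */
    	struct clock_sim c = { .shift = 10, .xtime_interval = 999990ULL << 10, .error = 0 };
    	uint64_t tick_length = 1000000ULL << TICK_LENGTH_SHIFT;

    	for (int i = 0; i < 3; i++)
    		accumulate_one_tick(&c, tick_length);
    	/* positive error: the clocksource runs slow, so mult would be nudged up */
    	printf("error = %" PRId64 " (ns << %d)\n", c.error, TICK_LENGTH_SHIFT);
    	return 0;
    }

Both terms live in the same fixed-point unit, which is what lets the new code compare them with plain integer arithmetic on the fast path.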
-rw-r--r--	arch/powerpc/kernel/time.c	4
-rw-r--r--	include/linux/clocksource.h	113
-rw-r--r--	include/linux/timex.h	4
-rw-r--r--	kernel/timer.c	151
4 files changed, 123 insertions, 149 deletions
diff --git a/arch/powerpc/kernel/time.c b/arch/powerpc/kernel/time.c
index 742f07a63161..7dd5dab789a1 100644
--- a/arch/powerpc/kernel/time.c
+++ b/arch/powerpc/kernel/time.c
@@ -102,7 +102,7 @@ EXPORT_SYMBOL(tb_ticks_per_sec); /* for cputime_t conversions */
 u64 tb_to_xs;
 unsigned tb_to_us;
 
-#define TICKLEN_SCALE	(SHIFT_SCALE - 10)
+#define TICKLEN_SCALE	TICK_LENGTH_SHIFT
 u64 last_tick_len;	/* units are ns / 2^TICKLEN_SCALE */
 u64 ticklen_to_xs;	/* 0.64 fraction */
 
@@ -534,7 +534,7 @@ static __inline__ void timer_recalc_offset(u64 cur_tb)
 
 	if (__USE_RTC())
 		return;
-	tlen = current_tick_length(SHIFT_SCALE - 10);
+	tlen = current_tick_length();
 	offset = cur_tb - do_gtod.varp->tb_orig_stamp;
 	if (tlen == last_tick_len && offset < 0x80000000u)
 		return;
diff --git a/include/linux/clocksource.h b/include/linux/clocksource.h
index 4bc94282c364..d852024ed095 100644
--- a/include/linux/clocksource.h
+++ b/include/linux/clocksource.h
@@ -46,8 +46,8 @@ typedef u64 cycle_t;
  * @shift:		cycle to nanosecond divisor (power of two)
  * @update_callback:	called when safe to alter clocksource values
  * @is_continuous:	defines if clocksource is free-running.
- * @interval_cycles:	Used internally by timekeeping core, please ignore.
- * @interval_snsecs:	Used internally by timekeeping core, please ignore.
+ * @cycle_interval:	Used internally by timekeeping core, please ignore.
+ * @xtime_interval:	Used internally by timekeeping core, please ignore.
  */
 struct clocksource {
 	char *name;
@@ -61,8 +61,9 @@ struct clocksource {
 	int is_continuous;
 
 	/* timekeeping specific data, ignore */
-	cycle_t interval_cycles;
-	u64 interval_snsecs;
+	cycle_t cycle_last, cycle_interval;
+	u64 xtime_nsec, xtime_interval;
+	s64 error;
 };
 
 /* simplify initialization of mask field */
@@ -168,107 +169,11 @@ static inline void clocksource_calculate_interval(struct clocksource *c,
 	tmp += c->mult/2;
 	do_div(tmp, c->mult);
 
-	c->interval_cycles = (cycle_t)tmp;
-	if(c->interval_cycles == 0)
-		c->interval_cycles = 1;
+	c->cycle_interval = (cycle_t)tmp;
+	if (c->cycle_interval == 0)
+		c->cycle_interval = 1;
 
-	c->interval_snsecs = (u64)c->interval_cycles * c->mult;
-}
-
-
-/**
- * error_aproximation - calculates an error adjustment for a given error
- *
- * @error:	Error value (unsigned)
- * @unit:	Adjustment unit
- *
- * For a given error value, this function takes the adjustment unit
- * and uses binary approximation to return a power of two adjustment value.
- *
- * This function is only for use by the the make_ntp_adj() function
- * and you must hold a write on the xtime_lock when calling.
- */
-static inline int error_aproximation(u64 error, u64 unit)
-{
-	static int saved_adj = 0;
-	u64 adjusted_unit = unit << saved_adj;
-
-	if (error > (adjusted_unit * 2)) {
-		/* large error, so increment the adjustment factor */
-		saved_adj++;
-	} else if (error > adjusted_unit) {
-		/* just right, don't touch it */
-	} else if (saved_adj) {
-		/* small error, so drop the adjustment factor */
-		saved_adj--;
-		return 0;
-	}
-
-	return saved_adj;
-}
-
-
-/**
- * make_ntp_adj - Adjusts the specified clocksource for a given error
- *
- * @clock:		Pointer to clock to be adjusted
- * @cycles_delta:	Current unacounted cycle delta
- * @error:		Pointer to current error value
- *
- * Returns clock shifted nanosecond adjustment to be applied against
- * the accumulated time value (ie: xtime).
- *
- * If the error value is large enough, this function calulates the
- * (power of two) adjustment value, and adjusts the clock's mult and
- * interval_snsecs values accordingly.
- *
- * However, since there may be some unaccumulated cycles, to avoid
- * time inconsistencies we must adjust the accumulation value
- * accordingly.
- *
- * This is not very intuitive, so the following proof should help:
- * The basic timeofday algorithm:  base + cycle * mult
- * Thus:
- *	new_base + cycle * new_mult = old_base + cycle * old_mult
- *	new_base = old_base + cycle * old_mult - cycle * new_mult
- *	new_base = old_base + cycle * (old_mult - new_mult)
- *	new_base - old_base = cycle * (old_mult - new_mult)
- *	base_delta = cycle * (old_mult - new_mult)
- *	base_delta = cycle * (mult_delta)
- *
- * Where mult_delta is the adjustment value made to mult
- *
- */
-static inline s64 make_ntp_adj(struct clocksource *clock,
-				cycles_t cycles_delta, s64* error)
-{
-	s64 ret = 0;
-	if (*error > ((s64)clock->interval_cycles+1)/2) {
-		/* calculate adjustment value */
-		int adjustment = error_aproximation(*error,
-						clock->interval_cycles);
-		/* adjust clock */
-		clock->mult += 1 << adjustment;
-		clock->interval_snsecs += clock->interval_cycles << adjustment;
-
-		/* adjust the base and error for the adjustment */
-		ret = -(cycles_delta << adjustment);
-		*error -= clock->interval_cycles << adjustment;
-		/* XXX adj error for cycle_delta offset? */
-	} else if ((-(*error)) > ((s64)clock->interval_cycles+1)/2) {
-		/* calculate adjustment value */
-		int adjustment = error_aproximation(-(*error),
-						clock->interval_cycles);
-		/* adjust clock */
-		clock->mult -= 1 << adjustment;
-		clock->interval_snsecs -= clock->interval_cycles << adjustment;
-
-		/* adjust the base and error for the adjustment */
-		ret = cycles_delta << adjustment;
-		*error += clock->interval_cycles << adjustment;
-		/* XXX adj error for cycle_delta offset? */
-	}
-	return ret;
-}
+	c->xtime_interval = (u64)c->cycle_interval * c->mult;
 }
 
 
diff --git a/include/linux/timex.h b/include/linux/timex.h
index 1ba3071fcb82..19bb6538b49e 100644
--- a/include/linux/timex.h
+++ b/include/linux/timex.h
@@ -303,8 +303,10 @@ time_interpolator_reset(void)
 
 #endif /* !CONFIG_TIME_INTERPOLATION */
 
+#define TICK_LENGTH_SHIFT	32
+
 /* Returns how long ticks are at present, in ns / 2^(SHIFT_SCALE-10). */
-extern u64 current_tick_length(long);
+extern u64 current_tick_length(void);
 
 extern int do_adjtimex(struct timex *);
 
diff --git a/kernel/timer.c b/kernel/timer.c
index 890a56937cfa..5bb6b7976eec 100644
--- a/kernel/timer.c
+++ b/kernel/timer.c
@@ -770,7 +770,7 @@ static void update_ntp_one_tick(void)
  * specified number of bits to the right of the binary point.
  * This function has no side-effects.
  */
-u64 current_tick_length(long shift)
+u64 current_tick_length(void)
 {
 	long delta_nsec;
 	u64 ret;
@@ -779,14 +779,8 @@ u64 current_tick_length(long shift)
 	 * ie: nanosecond value shifted by (SHIFT_SCALE - 10)
 	 */
 	delta_nsec = tick_nsec + adjtime_adjustment() * 1000;
-	ret = ((u64) delta_nsec << (SHIFT_SCALE - 10)) + time_adj;
-
-	/* convert from (SHIFT_SCALE - 10) to specified shift scale: */
-	shift = shift - (SHIFT_SCALE - 10);
-	if (shift < 0)
-		ret >>= -shift;
-	else
-		ret <<= shift;
+	ret = (u64)delta_nsec << TICK_LENGTH_SHIFT;
+	ret += (s64)time_adj << (TICK_LENGTH_SHIFT - (SHIFT_SCALE - 10));
 
 	return ret;
 }
@@ -794,7 +788,6 @@ u64 current_tick_length(long shift)
 /* XXX - all of this timekeeping code should be later moved to time.c */
 #include <linux/clocksource.h>
 static struct clocksource *clock; /* pointer to current clocksource */
-static cycle_t last_clock_cycle;  /* cycle value at last update_wall_time */
 
 #ifdef CONFIG_GENERIC_TIME
 /**
@@ -813,7 +806,7 @@ static inline s64 __get_nsec_offset(void)
 	cycle_now = clocksource_read(clock);
 
 	/* calculate the delta since the last update_wall_time: */
-	cycle_delta = (cycle_now - last_clock_cycle) & clock->mask;
+	cycle_delta = (cycle_now - clock->cycle_last) & clock->mask;
 
 	/* convert to nanoseconds: */
 	ns_offset = cyc2ns(clock, cycle_delta);
@@ -927,7 +920,7 @@ static int change_clocksource(void)
 	timespec_add_ns(&xtime, nsec);
 
 	clock = new;
-	last_clock_cycle = now;
+	clock->cycle_last = now;
 	printk(KERN_INFO "Time: %s clocksource has been installed.\n",
 	       clock->name);
 	return 1;
@@ -968,7 +961,7 @@ void __init timekeeping_init(void)
 	write_seqlock_irqsave(&xtime_lock, flags);
 	clock = clocksource_get_next();
 	clocksource_calculate_interval(clock, tick_nsec);
-	last_clock_cycle = clocksource_read(clock);
+	clock->cycle_last = clocksource_read(clock);
 	ntp_clear();
 	write_sequnlock_irqrestore(&xtime_lock, flags);
 }
@@ -988,7 +981,7 @@ static int timekeeping_resume(struct sys_device *dev)
 
 	write_seqlock_irqsave(&xtime_lock, flags);
 	/* restart the last cycle value */
-	last_clock_cycle = clocksource_read(clock);
+	clock->cycle_last = clocksource_read(clock);
 	write_sequnlock_irqrestore(&xtime_lock, flags);
 	return 0;
 }
@@ -1015,60 +1008,134 @@ static int __init timekeeping_init_device(void)
 device_initcall(timekeeping_init_device);
 
 /*
+ * If the error is already larger, we look ahead another tick,
+ * to compensate for late or lost adjustments.
+ */
+static __always_inline int clocksource_bigadjust(int sign, s64 error, s64 *interval, s64 *offset)
+{
+	int adj;
+
+	/*
+	 * As soon as the machine is synchronized to the external time
+	 * source this should be the common case.
+	 */
+	error >>= 2;
+	if (likely(sign > 0 ? error <= *interval : error >= *interval))
+		return sign;
+
+	/*
+	 * An extra look ahead dampens the effect of the current error,
+	 * which can grow quite large with continously late updates, as
+	 * it would dominate the adjustment value and can lead to
+	 * oscillation.
+	 */
+	error += current_tick_length() >> (TICK_LENGTH_SHIFT - clock->shift + 1);
+	error -= clock->xtime_interval >> 1;
+
+	adj = 0;
+	while (1) {
+		error >>= 1;
+		if (sign > 0 ? error <= *interval : error >= *interval)
+			break;
+		adj++;
+	}
+
+	/*
+	 * Add the current adjustments to the error and take the offset
+	 * into account, the latter can cause the error to be hardly
+	 * reduced at the next tick. Check the error again if there's
+	 * room for another adjustment, thus further reducing the error
+	 * which otherwise had to be corrected at the next update.
+	 */
+	error = (error << 1) - *interval + *offset;
+	if (sign > 0 ? error > *interval : error < *interval)
+		adj++;
+
+	*interval <<= adj;
+	*offset <<= adj;
+	return sign << adj;
+}
+
+/*
+ * Adjust the multiplier to reduce the error value,
+ * this is optimized for the most common adjustments of -1,0,1,
+ * for other values we can do a bit more work.
+ */
+static void clocksource_adjust(struct clocksource *clock, s64 offset)
+{
+	s64 error, interval = clock->cycle_interval;
+	int adj;
+
+	error = clock->error >> (TICK_LENGTH_SHIFT - clock->shift - 1);
+	if (error > interval) {
+		adj = clocksource_bigadjust(1, error, &interval, &offset);
+	} else if (error < -interval) {
+		interval = -interval;
+		offset = -offset;
+		adj = clocksource_bigadjust(-1, error, &interval, &offset);
+	} else
+		return;
+
+	clock->mult += adj;
+	clock->xtime_interval += interval;
+	clock->xtime_nsec -= offset;
+	clock->error -= (interval - offset) << (TICK_LENGTH_SHIFT - clock->shift);
+}
+
+/*
  * update_wall_time - Uses the current clocksource to increment the wall time
  *
  * Called from the timer interrupt, must hold a write on xtime_lock.
  */
 static void update_wall_time(void)
 {
-	static s64 remainder_snsecs, error;
-	s64 snsecs_per_sec;
-	cycle_t now, offset;
+	cycle_t offset;
 
-	snsecs_per_sec = (s64)NSEC_PER_SEC << clock->shift;
-	remainder_snsecs += (s64)xtime.tv_nsec << clock->shift;
+	clock->xtime_nsec += (s64)xtime.tv_nsec << clock->shift;
 
-	now = clocksource_read(clock);
-	offset = (now - last_clock_cycle)&clock->mask;
+#ifdef CONFIG_GENERIC_TIME
+	offset = (clocksource_read(clock) - clock->cycle_last) & clock->mask;
+#else
+	offset = clock->cycle_interval;
+#endif
 
 	/* normally this loop will run just once, however in the
 	 * case of lost or late ticks, it will accumulate correctly.
 	 */
-	while (offset > clock->interval_cycles) {
-		/* get the ntp interval in clock shifted nanoseconds */
-		s64 ntp_snsecs = current_tick_length(clock->shift);
-
+	while (offset >= clock->cycle_interval) {
 		/* accumulate one interval */
-		remainder_snsecs += clock->interval_snsecs;
-		last_clock_cycle += clock->interval_cycles;
-		offset -= clock->interval_cycles;
+		clock->xtime_nsec += clock->xtime_interval;
+		clock->cycle_last += clock->cycle_interval;
+		offset -= clock->cycle_interval;
+
+		if (clock->xtime_nsec >= (u64)NSEC_PER_SEC << clock->shift) {
+			clock->xtime_nsec -= (u64)NSEC_PER_SEC << clock->shift;
+			xtime.tv_sec++;
+			second_overflow();
+		}
 
 		/* interpolator bits */
-		time_interpolator_update(clock->interval_snsecs
+		time_interpolator_update(clock->xtime_interval
 						>> clock->shift);
 		/* increment the NTP state machine */
 		update_ntp_one_tick();
 
 		/* accumulate error between NTP and clock interval */
-		error += (ntp_snsecs - (s64)clock->interval_snsecs);
+		clock->error += current_tick_length();
+		clock->error -= clock->xtime_interval << (TICK_LENGTH_SHIFT - clock->shift);
+	}
 
-		/* correct the clock when NTP error is too big */
-		remainder_snsecs += make_ntp_adj(clock, offset, &error);
+	/* correct the clock when NTP error is too big */
+	clocksource_adjust(clock, offset);
 
-		if (remainder_snsecs >= snsecs_per_sec) {
-			remainder_snsecs -= snsecs_per_sec;
-			xtime.tv_sec++;
-			second_overflow();
-		}
-	}
 	/* store full nanoseconds into xtime */
-	xtime.tv_nsec = remainder_snsecs >> clock->shift;
-	remainder_snsecs -= (s64)xtime.tv_nsec << clock->shift;
+	xtime.tv_nsec = clock->xtime_nsec >> clock->shift;
+	clock->xtime_nsec -= (s64)xtime.tv_nsec << clock->shift;
 
 	/* check to see if there is a new clocksource to use */
 	if (change_clocksource()) {
-		error = 0;
-		remainder_snsecs = 0;
+		clock->error = 0;
+		clock->xtime_nsec = 0;
 		clocksource_calculate_interval(clock, tick_nsec);
 	}
 }
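As a rough standalone illustration (not code from this patch) of how clocksource_adjust() behaves in its common case: whenever the scaled error exceeds one cycle_interval, the multiplier is nudged by +/-1 and the error is paid back by one interval, so a small constant frequency offset is worked off over a handful of ticks. All names and values below are hypothetical.

    #include <stdio.h>

    int main(void)
    {
    	long long error = 5;     /* error expressed in cycle_interval units */
    	long long interval = 1;  /* one cycle_interval, same units */
    	unsigned int mult = 1000;

    	for (int tick = 0; tick < 8; tick++) {
    		if (error > interval) {         /* clock runs slow: speed it up */
    			mult += 1;
    			error -= interval;
    		} else if (error < -interval) { /* clock runs fast: slow it down */
    			mult -= 1;
    			error += interval;
    		}
    		printf("tick %d: mult=%u error=%lld\n", tick, mult, error);
    	}
    	return 0;
    }

Larger or persistent errors take the clocksource_bigadjust() path above, which picks a power-of-two step instead of +/-1 and looks one tick ahead to avoid oscillation.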