author	Roman Zippel <zippel@linux-m68k.org>	2006-06-26 03:25:18 -0400
committer	Linus Torvalds <torvalds@g5.osdl.org>	2006-06-26 12:58:21 -0400
commit	19923c190e0932bf0ac1e1d06a48f5c3678dd0de (patch)
tree	2a32f5f16b3bbebd74c0f4910493c7f28a70fd84
parent	6415ce9a922a1446e7ee0ac9b016082232ebe373 (diff)
[PATCH] fix and optimize clock source update
This fixes the clock source updates in update_wall_time() to correctly
track the time coming in via current_tick_length().  Optimize the fast
paths to be as short as possible to keep the overhead low.

Signed-off-by: Roman Zippel <zippel@linux-m68k.org>
Acked-by: John Stultz <johnstul@us.ibm.com>
Signed-off-by: Andrew Morton <akpm@osdl.org>
Signed-off-by: Linus Torvalds <torvalds@osdl.org>
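For readers skimming the diff below: the heart of the change is that current_tick_length() now returns the NTP tick length as nanoseconds scaled by 2^TICK_LENGTH_SHIFT, and update_wall_time() accumulates the difference between that value and what the clocksource actually advanced into clock->error. The following user-space sketch of that bookkeeping is illustrative only; struct clock_sim and accumulate_one_tick() are simplified stand-ins, not kernel names.

    #include <stdio.h>
    #include <stdint.h>
    #include <inttypes.h>

    #define TICK_LENGTH_SHIFT 32

    /* Simplified stand-ins; not the kernel's struct clocksource. */
    struct clock_sim {
    	uint32_t shift;           /* cycle-to-nanosecond shift of the clocksource */
    	uint64_t xtime_interval;  /* nanoseconds per tick, scaled by 2^shift */
    	int64_t  error;           /* error in nanoseconds, scaled by 2^TICK_LENGTH_SHIFT */
    };

    /* One tick: add what NTP asked for, subtract what the clocksource advanced. */
    void accumulate_one_tick(struct clock_sim *c, uint64_t tick_length)
    {
    	c->error += (int64_t)tick_length;
    	c->error -= (int64_t)(c->xtime_interval << (TICK_LENGTH_SHIFT - c->shift));
    }

    int main(void)
    {
    	/* 1 ms tick; the clocksource interval is 10 ppm short of it */
    	struct clock_sim c = { .shift = 10, .xtime_interval = 999990ULL << 10, .error = 0 };
    	uint64_t tick_length = 1000000ULL << TICK_LENGTH_SHIFT;

    	for (int i = 0; i < 3; i++)
    		accumulate_one_tick(&c, tick_length);
    	/* positive error: the clocksource runs slow, so mult would be nudged up */
    	printf("error = %" PRId64 " (ns << %d)\n", c.error, TICK_LENGTH_SHIFT);
    	return 0;
    }

Both terms live in the same fixed-point unit, which is what lets the new code compare them with plain integer arithmetic on the fast path.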
-rw-r--r--	arch/powerpc/kernel/time.c	4
-rw-r--r--	include/linux/clocksource.h	113
-rw-r--r--	include/linux/timex.h	4
-rw-r--r--	kernel/timer.c	151
4 files changed, 123 insertions, 149 deletions
diff --git a/arch/powerpc/kernel/time.c b/arch/powerpc/kernel/time.c
index 742f07a63161..7dd5dab789a1 100644
--- a/arch/powerpc/kernel/time.c
+++ b/arch/powerpc/kernel/time.c
@@ -102,7 +102,7 @@ EXPORT_SYMBOL(tb_ticks_per_sec); /* for cputime_t conversions */
 u64 tb_to_xs;
 unsigned tb_to_us;
 
-#define TICKLEN_SCALE	(SHIFT_SCALE - 10)
+#define TICKLEN_SCALE	TICK_LENGTH_SHIFT
 u64 last_tick_len;	/* units are ns / 2^TICKLEN_SCALE */
 u64 ticklen_to_xs;	/* 0.64 fraction */
 
@@ -534,7 +534,7 @@ static __inline__ void timer_recalc_offset(u64 cur_tb)
 
 	if (__USE_RTC())
 		return;
-	tlen = current_tick_length(SHIFT_SCALE - 10);
+	tlen = current_tick_length();
 	offset = cur_tb - do_gtod.varp->tb_orig_stamp;
 	if (tlen == last_tick_len && offset < 0x80000000u)
 		return;
diff --git a/include/linux/clocksource.h b/include/linux/clocksource.h
index 4bc94282c364..d852024ed095 100644
--- a/include/linux/clocksource.h
+++ b/include/linux/clocksource.h
@@ -46,8 +46,8 @@ typedef u64 cycle_t;
  * @shift:		cycle to nanosecond divisor (power of two)
  * @update_callback:	called when safe to alter clocksource values
  * @is_continuous:	defines if clocksource is free-running.
- * @interval_cycles:	Used internally by timekeeping core, please ignore.
- * @interval_snsecs:	Used internally by timekeeping core, please ignore.
+ * @cycle_interval:	Used internally by timekeeping core, please ignore.
+ * @xtime_interval:	Used internally by timekeeping core, please ignore.
  */
 struct clocksource {
 	char *name;
@@ -61,8 +61,9 @@ struct clocksource {
 	int is_continuous;
 
 	/* timekeeping specific data, ignore */
-	cycle_t interval_cycles;
-	u64 interval_snsecs;
+	cycle_t cycle_last, cycle_interval;
+	u64 xtime_nsec, xtime_interval;
+	s64 error;
 };
 
 /* simplify initialization of mask field */
@@ -168,107 +169,11 @@ static inline void clocksource_calculate_interval(struct clocksource *c,
 	tmp += c->mult/2;
 	do_div(tmp, c->mult);
 
-	c->interval_cycles = (cycle_t)tmp;
-	if(c->interval_cycles == 0)
-		c->interval_cycles = 1;
+	c->cycle_interval = (cycle_t)tmp;
+	if (c->cycle_interval == 0)
+		c->cycle_interval = 1;
 
-	c->interval_snsecs = (u64)c->interval_cycles * c->mult;
-}
-
-
-/**
- * error_aproximation - calculates an error adjustment for a given error
- *
- * @error:	Error value (unsigned)
- * @unit:	Adjustment unit
- *
- * For a given error value, this function takes the adjustment unit
- * and uses binary approximation to return a power of two adjustment value.
- *
- * This function is only for use by the the make_ntp_adj() function
- * and you must hold a write on the xtime_lock when calling.
- */
-static inline int error_aproximation(u64 error, u64 unit)
-{
-	static int saved_adj = 0;
-	u64 adjusted_unit = unit << saved_adj;
-
-	if (error > (adjusted_unit * 2)) {
-		/* large error, so increment the adjustment factor */
-		saved_adj++;
-	} else if (error > adjusted_unit) {
-		/* just right, don't touch it */
-	} else if (saved_adj) {
-		/* small error, so drop the adjustment factor */
-		saved_adj--;
-		return 0;
-	}
-
-	return saved_adj;
-}
-
-
-/**
- * make_ntp_adj - Adjusts the specified clocksource for a given error
- *
- * @clock:		Pointer to clock to be adjusted
- * @cycles_delta:	Current unacounted cycle delta
- * @error:		Pointer to current error value
- *
- * Returns clock shifted nanosecond adjustment to be applied against
- * the accumulated time value (ie: xtime).
- *
- * If the error value is large enough, this function calulates the
- * (power of two) adjustment value, and adjusts the clock's mult and
- * interval_snsecs values accordingly.
- *
- * However, since there may be some unaccumulated cycles, to avoid
- * time inconsistencies we must adjust the accumulation value
- * accordingly.
- *
- * This is not very intuitive, so the following proof should help:
- * The basic timeofday algorithm:  base + cycle * mult
- * Thus:
- *	new_base + cycle * new_mult = old_base + cycle * old_mult
- *	new_base = old_base + cycle * old_mult - cycle * new_mult
- *	new_base = old_base + cycle * (old_mult - new_mult)
- *	new_base - old_base = cycle * (old_mult - new_mult)
- *	base_delta = cycle * (old_mult - new_mult)
- *	base_delta = cycle * (mult_delta)
- *
- * Where mult_delta is the adjustment value made to mult
- *
- */
-static inline s64 make_ntp_adj(struct clocksource *clock,
-				cycles_t cycles_delta, s64* error)
-{
-	s64 ret = 0;
-	if (*error > ((s64)clock->interval_cycles+1)/2) {
-		/* calculate adjustment value */
-		int adjustment = error_aproximation(*error,
-						clock->interval_cycles);
-		/* adjust clock */
-		clock->mult += 1 << adjustment;
-		clock->interval_snsecs += clock->interval_cycles << adjustment;
-
-		/* adjust the base and error for the adjustment */
-		ret = -(cycles_delta << adjustment);
-		*error -= clock->interval_cycles << adjustment;
-		/* XXX adj error for cycle_delta offset? */
-	} else if ((-(*error)) > ((s64)clock->interval_cycles+1)/2) {
-		/* calculate adjustment value */
-		int adjustment = error_aproximation(-(*error),
-						clock->interval_cycles);
-		/* adjust clock */
-		clock->mult -= 1 << adjustment;
-		clock->interval_snsecs -= clock->interval_cycles << adjustment;
-
-		/* adjust the base and error for the adjustment */
-		ret = cycles_delta << adjustment;
-		*error += clock->interval_cycles << adjustment;
-		/* XXX adj error for cycle_delta offset? */
-	}
-	return ret;
-}
+	c->xtime_interval = (u64)c->cycle_interval * c->mult;
 }
 
 
diff --git a/include/linux/timex.h b/include/linux/timex.h
index 1ba3071fcb82..19bb6538b49e 100644
--- a/include/linux/timex.h
+++ b/include/linux/timex.h
@@ -303,8 +303,10 @@ time_interpolator_reset(void)
 
 #endif /* !CONFIG_TIME_INTERPOLATION */
 
+#define TICK_LENGTH_SHIFT	32
+
 /* Returns how long ticks are at present, in ns / 2^(SHIFT_SCALE-10). */
-extern u64 current_tick_length(long);
+extern u64 current_tick_length(void);
 
 extern int do_adjtimex(struct timex *);
 
diff --git a/kernel/timer.c b/kernel/timer.c
index 890a56937cfa..5bb6b7976eec 100644
--- a/kernel/timer.c
+++ b/kernel/timer.c
@@ -770,7 +770,7 @@ static void update_ntp_one_tick(void)
  * specified number of bits to the right of the binary point.
  * This function has no side-effects.
  */
-u64 current_tick_length(long shift)
+u64 current_tick_length(void)
 {
 	long delta_nsec;
 	u64 ret;
@@ -779,14 +779,8 @@ u64 current_tick_length(long shift)
 	 * ie: nanosecond value shifted by (SHIFT_SCALE - 10)
 	 */
 	delta_nsec = tick_nsec + adjtime_adjustment() * 1000;
-	ret = ((u64) delta_nsec << (SHIFT_SCALE - 10)) + time_adj;
-
-	/* convert from (SHIFT_SCALE - 10) to specified shift scale: */
-	shift = shift - (SHIFT_SCALE - 10);
-	if (shift < 0)
-		ret >>= -shift;
-	else
-		ret <<= shift;
+	ret = (u64)delta_nsec << TICK_LENGTH_SHIFT;
+	ret += (s64)time_adj << (TICK_LENGTH_SHIFT - (SHIFT_SCALE - 10));
 
 	return ret;
 }
@@ -794,7 +788,6 @@ u64 current_tick_length(long shift)
 /* XXX - all of this timekeeping code should be later moved to time.c */
 #include <linux/clocksource.h>
 static struct clocksource *clock; /* pointer to current clocksource */
-static cycle_t last_clock_cycle;  /* cycle value at last update_wall_time */
 
 #ifdef CONFIG_GENERIC_TIME
 /**
@@ -813,7 +806,7 @@ static inline s64 __get_nsec_offset(void)
 	cycle_now = clocksource_read(clock);
 
 	/* calculate the delta since the last update_wall_time: */
-	cycle_delta = (cycle_now - last_clock_cycle) & clock->mask;
+	cycle_delta = (cycle_now - clock->cycle_last) & clock->mask;
 
 	/* convert to nanoseconds: */
 	ns_offset = cyc2ns(clock, cycle_delta);
@@ -927,7 +920,7 @@ static int change_clocksource(void)
 	timespec_add_ns(&xtime, nsec);
 
 	clock = new;
-	last_clock_cycle = now;
+	clock->cycle_last = now;
 	printk(KERN_INFO "Time: %s clocksource has been installed.\n",
 	       clock->name);
 	return 1;
@@ -968,7 +961,7 @@ void __init timekeeping_init(void)
 	write_seqlock_irqsave(&xtime_lock, flags);
 	clock = clocksource_get_next();
 	clocksource_calculate_interval(clock, tick_nsec);
-	last_clock_cycle = clocksource_read(clock);
+	clock->cycle_last = clocksource_read(clock);
 	ntp_clear();
 	write_sequnlock_irqrestore(&xtime_lock, flags);
 }
@@ -988,7 +981,7 @@ static int timekeeping_resume(struct sys_device *dev)
 
 	write_seqlock_irqsave(&xtime_lock, flags);
 	/* restart the last cycle value */
-	last_clock_cycle = clocksource_read(clock);
+	clock->cycle_last = clocksource_read(clock);
 	write_sequnlock_irqrestore(&xtime_lock, flags);
 	return 0;
 }
@@ -1015,60 +1008,134 @@ static int __init timekeeping_init_device(void)
 device_initcall(timekeeping_init_device);
 
 /*
+ * If the error is already larger, we look ahead another tick,
+ * to compensate for late or lost adjustments.
+ */
+static __always_inline int clocksource_bigadjust(int sign, s64 error, s64 *interval, s64 *offset)
+{
+	int adj;
+
+	/*
+	 * As soon as the machine is synchronized to the external time
+	 * source this should be the common case.
+	 */
+	error >>= 2;
+	if (likely(sign > 0 ? error <= *interval : error >= *interval))
+		return sign;
+
+	/*
+	 * An extra look ahead dampens the effect of the current error,
+	 * which can grow quite large with continously late updates, as
+	 * it would dominate the adjustment value and can lead to
+	 * oscillation.
+	 */
+	error += current_tick_length() >> (TICK_LENGTH_SHIFT - clock->shift + 1);
+	error -= clock->xtime_interval >> 1;
+
+	adj = 0;
+	while (1) {
+		error >>= 1;
+		if (sign > 0 ? error <= *interval : error >= *interval)
+			break;
+		adj++;
+	}
+
+	/*
+	 * Add the current adjustments to the error and take the offset
+	 * into account, the latter can cause the error to be hardly
+	 * reduced at the next tick. Check the error again if there's
+	 * room for another adjustment, thus further reducing the error
+	 * which otherwise had to be corrected at the next update.
+	 */
+	error = (error << 1) - *interval + *offset;
+	if (sign > 0 ? error > *interval : error < *interval)
+		adj++;
+
+	*interval <<= adj;
+	*offset <<= adj;
+	return sign << adj;
+}
+
+/*
+ * Adjust the multiplier to reduce the error value,
+ * this is optimized for the most common adjustments of -1,0,1,
+ * for other values we can do a bit more work.
+ */
+static void clocksource_adjust(struct clocksource *clock, s64 offset)
+{
+	s64 error, interval = clock->cycle_interval;
+	int adj;
+
+	error = clock->error >> (TICK_LENGTH_SHIFT - clock->shift - 1);
+	if (error > interval) {
+		adj = clocksource_bigadjust(1, error, &interval, &offset);
+	} else if (error < -interval) {
+		interval = -interval;
+		offset = -offset;
+		adj = clocksource_bigadjust(-1, error, &interval, &offset);
+	} else
+		return;
+
+	clock->mult += adj;
+	clock->xtime_interval += interval;
+	clock->xtime_nsec -= offset;
+	clock->error -= (interval - offset) << (TICK_LENGTH_SHIFT - clock->shift);
+}
+
+/*
  * update_wall_time - Uses the current clocksource to increment the wall time
  *
  * Called from the timer interrupt, must hold a write on xtime_lock.
  */
 static void update_wall_time(void)
 {
-	static s64 remainder_snsecs, error;
-	s64 snsecs_per_sec;
-	cycle_t now, offset;
+	cycle_t offset;
 
-	snsecs_per_sec = (s64)NSEC_PER_SEC << clock->shift;
-	remainder_snsecs += (s64)xtime.tv_nsec << clock->shift;
+	clock->xtime_nsec += (s64)xtime.tv_nsec << clock->shift;
 
-	now = clocksource_read(clock);
-	offset = (now - last_clock_cycle)&clock->mask;
+#ifdef CONFIG_GENERIC_TIME
+	offset = (clocksource_read(clock) - clock->cycle_last) & clock->mask;
+#else
+	offset = clock->cycle_interval;
+#endif
 
 	/* normally this loop will run just once, however in the
 	 * case of lost or late ticks, it will accumulate correctly.
 	 */
-	while (offset > clock->interval_cycles) {
-		/* get the ntp interval in clock shifted nanoseconds */
-		s64 ntp_snsecs = current_tick_length(clock->shift);
-
+	while (offset >= clock->cycle_interval) {
 		/* accumulate one interval */
-		remainder_snsecs += clock->interval_snsecs;
-		last_clock_cycle += clock->interval_cycles;
-		offset -= clock->interval_cycles;
+		clock->xtime_nsec += clock->xtime_interval;
+		clock->cycle_last += clock->cycle_interval;
+		offset -= clock->cycle_interval;
+
+		if (clock->xtime_nsec >= (u64)NSEC_PER_SEC << clock->shift) {
+			clock->xtime_nsec -= (u64)NSEC_PER_SEC << clock->shift;
+			xtime.tv_sec++;
+			second_overflow();
+		}
 
 		/* interpolator bits */
-		time_interpolator_update(clock->interval_snsecs
+		time_interpolator_update(clock->xtime_interval
 						>> clock->shift);
 		/* increment the NTP state machine */
 		update_ntp_one_tick();
 
 		/* accumulate error between NTP and clock interval */
-		error += (ntp_snsecs - (s64)clock->interval_snsecs);
+		clock->error += current_tick_length();
+		clock->error -= clock->xtime_interval << (TICK_LENGTH_SHIFT - clock->shift);
+	}
 
-		/* correct the clock when NTP error is too big */
-		remainder_snsecs += make_ntp_adj(clock, offset, &error);
+	/* correct the clock when NTP error is too big */
+	clocksource_adjust(clock, offset);
 
-		if (remainder_snsecs >= snsecs_per_sec) {
-			remainder_snsecs -= snsecs_per_sec;
-			xtime.tv_sec++;
-			second_overflow();
-		}
-	}
 	/* store full nanoseconds into xtime */
-	xtime.tv_nsec = remainder_snsecs >> clock->shift;
-	remainder_snsecs -= (s64)xtime.tv_nsec << clock->shift;
+	xtime.tv_nsec = clock->xtime_nsec >> clock->shift;
+	clock->xtime_nsec -= (s64)xtime.tv_nsec << clock->shift;
 
 	/* check to see if there is a new clocksource to use */
 	if (change_clocksource()) {
-		error = 0;
-		remainder_snsecs = 0;
+		clock->error = 0;
+		clock->xtime_nsec = 0;
 		clocksource_calculate_interval(clock, tick_nsec);
 	}
 }
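As a rough standalone illustration (not code from this patch) of how clocksource_adjust() behaves in its common case: whenever the scaled error exceeds one cycle_interval, the multiplier is nudged by +/-1 and the error is paid back by one interval, so a small constant frequency offset is worked off over a handful of ticks. All names and values below are hypothetical.

    #include <stdio.h>

    int main(void)
    {
    	long long error = 5;     /* error expressed in cycle_interval units */
    	long long interval = 1;  /* one cycle_interval, same units */
    	unsigned int mult = 1000;

    	for (int tick = 0; tick < 8; tick++) {
    		if (error > interval) {         /* clock runs slow: speed it up */
    			mult += 1;
    			error -= interval;
    		} else if (error < -interval) { /* clock runs fast: slow it down */
    			mult -= 1;
    			error += interval;
    		}
    		printf("tick %d: mult=%u error=%lld\n", tick, mult, error);
    	}
    	return 0;
    }

Larger or persistent errors take the clocksource_bigadjust() path above, which picks a power-of-two step instead of +/-1 and looks one tick ahead to avoid oscillation.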