diff options
author | Eric Dumazet <edumazet@google.com> | 2013-06-06 16:56:19 -0400 |
---|---|---|
committer | David S. Miller <davem@davemloft.net> | 2013-06-12 01:39:47 -0400 |
commit | 130d3d68b52097c7ae081109f700b02776adcb9c (patch) | |
tree | 08b3ab56be1de543a9c3e7cd1d9ff532221bda14 /net/sched | |
parent | 45203a3b380cee28f570475c0d28c169f908c209 (diff) |
net_sched: psched_ratecfg_precompute() improvements
Before allowing 64bits bytes rates, refactor
psched_ratecfg_precompute() to get better comments
and increased accuracy.
rate_bps field is renamed to rate_bytes_ps, as we only
have to worry about bytes per second.
Signed-off-by: Eric Dumazet <edumazet@google.com>
Cc: Ben Greear <greearb@candelatech.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
Diffstat (limited to 'net/sched')
-rw-r--r-- | net/sched/sch_generic.c | 44 |
1 files changed, 20 insertions, 24 deletions
diff --git a/net/sched/sch_generic.c b/net/sched/sch_generic.c index 20224086cc28..4626cef4b76e 100644 --- a/net/sched/sch_generic.c +++ b/net/sched/sch_generic.c | |||
@@ -901,37 +901,33 @@ void dev_shutdown(struct net_device *dev) | |||
901 | void psched_ratecfg_precompute(struct psched_ratecfg *r, | 901 | void psched_ratecfg_precompute(struct psched_ratecfg *r, |
902 | const struct tc_ratespec *conf) | 902 | const struct tc_ratespec *conf) |
903 | { | 903 | { |
904 | u64 factor; | ||
905 | u64 mult; | ||
906 | int shift; | ||
907 | |||
908 | memset(r, 0, sizeof(*r)); | 904 | memset(r, 0, sizeof(*r)); |
909 | r->overhead = conf->overhead; | 905 | r->overhead = conf->overhead; |
910 | r->rate_bps = (u64)conf->rate << 3; | 906 | r->rate_bytes_ps = conf->rate; |
911 | r->mult = 1; | 907 | r->mult = 1; |
912 | /* | 908 | /* |
913 | * Calibrate mult, shift so that token counting is accurate | 909 | * The deal here is to replace a divide by a reciprocal one |
914 | * for smallest packet size (64 bytes). Token (time in ns) is | 910 | * in fast path (a reciprocal divide is a multiply and a shift) |
915 | * computed as (bytes * 8) * NSEC_PER_SEC / rate_bps. It will | 911 | * |
916 | * work as long as the smallest packet transfer time can be | 912 | * Normal formula would be : |
917 | * accurately represented in nanosec. | 913 | * time_in_ns = (NSEC_PER_SEC * len) / rate_bps |
914 | * | ||
915 | * We compute mult/shift to use instead : | ||
916 | * time_in_ns = (len * mult) >> shift; | ||
917 | * | ||
918 | * We try to get the highest possible mult value for accuracy, | ||
919 | * but have to make sure no overflows will ever happen. | ||
918 | */ | 920 | */ |
919 | if (r->rate_bps > 0) { | 921 | if (r->rate_bytes_ps > 0) { |
920 | /* | 922 | u64 factor = NSEC_PER_SEC; |
921 | * Higher shift gives better accuracy. Find the largest | 923 | |
922 | * shift such that mult fits in 32 bits. | 924 | for (;;) { |
923 | */ | 925 | r->mult = div64_u64(factor, r->rate_bytes_ps); |
924 | for (shift = 0; shift < 16; shift++) { | 926 | if (r->mult & (1U << 31) || factor & (1ULL << 63)) |
925 | r->shift = shift; | ||
926 | factor = 8LLU * NSEC_PER_SEC * (1 << r->shift); | ||
927 | mult = div64_u64(factor, r->rate_bps); | ||
928 | if (mult > UINT_MAX) | ||
929 | break; | 927 | break; |
928 | factor <<= 1; | ||
929 | r->shift++; | ||
930 | } | 930 | } |
931 | |||
932 | r->shift = shift - 1; | ||
933 | factor = 8LLU * NSEC_PER_SEC * (1 << r->shift); | ||
934 | r->mult = div64_u64(factor, r->rate_bps); | ||
935 | } | 931 | } |
936 | } | 932 | } |
937 | EXPORT_SYMBOL(psched_ratecfg_precompute); | 933 | EXPORT_SYMBOL(psched_ratecfg_precompute); |