diff options
author | Eric Dumazet <eric.dumazet@gmail.com> | 2011-02-23 05:56:17 -0500 |
---|---|---|
committer | David S. Miller <davem@davemloft.net> | 2011-02-23 17:05:11 -0500 |
commit | e13e02a3c68d899169c78d9a18689bd73491d59a (patch) | |
tree | 6e6b40ef37261df391cd445ec0f1b3d538b23a47 /include/linux/pkt_sched.h | |
parent | dee9f4bceb5fd9dbfcc1567148fccdbf16d6a38a (diff) |
net_sched: SFB flow scheduler
This is the Stochastic Fair Blue scheduler, based on work from :
W. Feng, D. Kandlur, D. Saha, K. Shin. Blue: A New Class of Active Queue
Management Algorithms. U. Michigan CSE-TR-387-99, April 1999.
http://www.thefengs.com/wuchang/blue/CSE-TR-387-99.pdf
This implementation is based on work done by Juliusz Chroboczek
General SFB algorithm can be found in figure 14, page 15:
B[l][n] : L x N array of bins (L levels, N bins per level)
enqueue()
Calculate hash function values h{0}, h{1}, .. h{L-1}
Update bins at each level
for i = 0 to L - 1
if (B[i][h{i}].qlen > bin_size)
B[i][h{i}].p_mark += p_increment;
else if (B[i][h{i}].qlen == 0)
B[i][h{i}].p_mark -= p_decrement;
p_min = min(B[0][h{0}].p_mark ... B[L-1][h{L-1}].p_mark);
if (p_min == 1.0)
ratelimit();
else
mark/drop with probabilty p_min;
I did the adaptation of Juliusz code to meet current kernel standards,
and various changes to address previous comments :
http://thread.gmane.org/gmane.linux.network/90225
http://thread.gmane.org/gmane.linux.network/90375
Default flow classifier is the rxhash introduced by RPS in 2.6.35, but
we can use an external flow classifier if wanted.
tc qdisc add dev $DEV parent 1:11 handle 11: \
est 0.5sec 2sec sfb limit 128
tc filter add dev $DEV protocol ip parent 11: handle 3 \
flow hash keys dst divisor 1024
Notes:
1) SFB default child qdisc is pfifo_fast. It can be changed by another
qdisc but a child qdisc MUST not drop a packet previously queued. This
is because SFB needs to handle a dequeued packet in order to maintain
its virtual queue states. pfifo_head_drop or CHOKe should not be used.
2) ECN is enabled by default, unlike RED/CHOKe/GRED
With help from Patrick McHardy & Andi Kleen
Signed-off-by: Eric Dumazet <eric.dumazet@gmail.com>
CC: Juliusz Chroboczek <Juliusz.Chroboczek@pps.jussieu.fr>
CC: Stephen Hemminger <shemminger@vyatta.com>
CC: Patrick McHardy <kaber@trash.net>
CC: Andi Kleen <andi@firstfloor.org>
CC: John W. Linville <linville@tuxdriver.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
Diffstat (limited to 'include/linux/pkt_sched.h')
-rw-r--r-- | include/linux/pkt_sched.h | 39 |
1 files changed, 39 insertions, 0 deletions
diff --git a/include/linux/pkt_sched.h b/include/linux/pkt_sched.h index d4bb6f58c90c..5afee2b238bd 100644 --- a/include/linux/pkt_sched.h +++ b/include/linux/pkt_sched.h | |||
@@ -522,4 +522,43 @@ struct tc_mqprio_qopt { | |||
522 | __u16 offset[TC_QOPT_MAX_QUEUE]; | 522 | __u16 offset[TC_QOPT_MAX_QUEUE]; |
523 | }; | 523 | }; |
524 | 524 | ||
525 | /* SFB */ | ||
526 | |||
527 | enum { | ||
528 | TCA_SFB_UNSPEC, | ||
529 | TCA_SFB_PARMS, | ||
530 | __TCA_SFB_MAX, | ||
531 | }; | ||
532 | |||
533 | #define TCA_SFB_MAX (__TCA_SFB_MAX - 1) | ||
534 | |||
535 | /* | ||
536 | * Note: increment, decrement are Q0.16 fixed-point values. | ||
537 | */ | ||
538 | struct tc_sfb_qopt { | ||
539 | __u32 rehash_interval; /* delay between hash move, in ms */ | ||
540 | __u32 warmup_time; /* double buffering warmup time in ms (warmup_time < rehash_interval) */ | ||
541 | __u32 max; /* max len of qlen_min */ | ||
542 | __u32 bin_size; /* maximum queue length per bin */ | ||
543 | __u32 increment; /* probability increment, (d1 in Blue) */ | ||
544 | __u32 decrement; /* probability decrement, (d2 in Blue) */ | ||
545 | __u32 limit; /* max SFB queue length */ | ||
546 | __u32 penalty_rate; /* inelastic flows are rate limited to 'rate' pps */ | ||
547 | __u32 penalty_burst; | ||
548 | }; | ||
549 | |||
550 | struct tc_sfb_xstats { | ||
551 | __u32 earlydrop; | ||
552 | __u32 penaltydrop; | ||
553 | __u32 bucketdrop; | ||
554 | __u32 queuedrop; | ||
555 | __u32 childdrop; /* drops in child qdisc */ | ||
556 | __u32 marked; | ||
557 | __u32 maxqlen; | ||
558 | __u32 maxprob; | ||
559 | __u32 avgprob; | ||
560 | }; | ||
561 | |||
562 | #define SFB_MAX_PROB 0xFFFF | ||
563 | |||
525 | #endif | 564 | #endif |