diff options
author | Alexander Duyck <alexander.h.duyck@intel.com> | 2008-09-12 19:30:20 -0400 |
---|---|---|
committer | David S. Miller <davem@davemloft.net> | 2008-09-12 19:30:20 -0400 |
commit | ca9b0e27e072be4cef2f5f0cbc0b0fd94eae3520 (patch) | |
tree | c236e31759299193e688cf7fe78809c24449ede1 | |
parent | 92651940ab00dbe64722e908f70d816713d677b7 (diff) |
pkt_action: add new action skbedit
This new action will have the ability to change the priority and/or
queue_mapping fields on an sk_buff.
Signed-off-by: Alexander Duyck <alexander.h.duyck@intel.com>
Signed-off-by: Jeff Kirsher <jeffrey.t.kirsher@intel.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
-rw-r--r-- | Documentation/networking/multiqueue.txt | 9 | ||||
-rw-r--r-- | include/linux/tc_act/Kbuild | 1 | ||||
-rw-r--r-- | include/linux/tc_act/tc_skbedit.h | 44 | ||||
-rw-r--r-- | include/net/tc_act/tc_skbedit.h | 34 | ||||
-rw-r--r-- | net/sched/Kconfig | 11 | ||||
-rw-r--r-- | net/sched/Makefile | 1 | ||||
-rw-r--r-- | net/sched/act_skbedit.c | 203 |
7 files changed, 302 insertions, 1 deletions
diff --git a/Documentation/networking/multiqueue.txt b/Documentation/networking/multiqueue.txt index 5787ee6eca4f..10113ffa8072 100644 --- a/Documentation/networking/multiqueue.txt +++ b/Documentation/networking/multiqueue.txt | |||
@@ -66,7 +66,14 @@ band 3 => queue 3 | |||
66 | Traffic will begin flowing through each queue if your base device has either | 66 | Traffic will begin flowing through each queue if your base device has either |
67 | the default simple_tx_hash or a custom netdev->select_queue() defined. | 67 | the default simple_tx_hash or a custom netdev->select_queue() defined. |
68 | 68 | ||
69 | The behavior of tc filters remains the same. | 69 | The behavior of tc filters remains the same. However, a new tc action, |
70 | skbedit, has been added. Assuming you wanted to route all traffic to a | ||
71 | specific host, for example 192.168.0.3, through a specific queue, you could use | ||
72 | this action and establish a filter such as: | ||
73 | |||
74 | tc filter add dev eth0 parent 1: protocol ip prio 1 u32 \ | ||
75 | match ip dst 192.168.0.3 \ | ||
76 | action skbedit queue_mapping 3 | ||
70 | 77 | ||
71 | Author: Alexander Duyck <alexander.h.duyck@intel.com> | 78 | Author: Alexander Duyck <alexander.h.duyck@intel.com> |
72 | Original Author: Peter P. Waskiewicz Jr. <peter.p.waskiewicz.jr@intel.com> | 79 | Original Author: Peter P. Waskiewicz Jr. <peter.p.waskiewicz.jr@intel.com> |
diff --git a/include/linux/tc_act/Kbuild b/include/linux/tc_act/Kbuild index 6dac0d7365cc..76990937f4c9 100644 --- a/include/linux/tc_act/Kbuild +++ b/include/linux/tc_act/Kbuild | |||
@@ -3,3 +3,4 @@ header-y += tc_ipt.h | |||
3 | header-y += tc_mirred.h | 3 | header-y += tc_mirred.h |
4 | header-y += tc_pedit.h | 4 | header-y += tc_pedit.h |
5 | header-y += tc_nat.h | 5 | header-y += tc_nat.h |
6 | header-y += tc_skbedit.h | ||
diff --git a/include/linux/tc_act/tc_skbedit.h b/include/linux/tc_act/tc_skbedit.h new file mode 100644 index 000000000000..a14e461a7af7 --- /dev/null +++ b/include/linux/tc_act/tc_skbedit.h | |||
@@ -0,0 +1,44 @@ | |||
1 | /* | ||
2 | * Copyright (c) 2008, Intel Corporation. | ||
3 | * | ||
4 | * This program is free software; you can redistribute it and/or modify it | ||
5 | * under the terms and conditions of the GNU General Public License, | ||
6 | * version 2, as published by the Free Software Foundation. | ||
7 | * | ||
8 | * This program is distributed in the hope it will be useful, but WITHOUT | ||
9 | * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or | ||
10 | * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for | ||
11 | * more details. | ||
12 | * | ||
13 | * You should have received a copy of the GNU General Public License along with | ||
14 | * this program; if not, write to the Free Software Foundation, Inc., 59 Temple | ||
15 | * Place - Suite 330, Boston, MA 02111-1307 USA. | ||
16 | * | ||
17 | * Author: Alexander Duyck <alexander.h.duyck@intel.com> | ||
18 | */ | ||
19 | |||
20 | #ifndef __LINUX_TC_SKBEDIT_H | ||
21 | #define __LINUX_TC_SKBEDIT_H | ||
22 | |||
23 | #include <linux/pkt_cls.h> | ||
24 | |||
25 | #define TCA_ACT_SKBEDIT 11 | ||
26 | |||
27 | #define SKBEDIT_F_PRIORITY 0x1 | ||
28 | #define SKBEDIT_F_QUEUE_MAPPING 0x2 | ||
29 | |||
30 | struct tc_skbedit { | ||
31 | tc_gen; | ||
32 | }; | ||
33 | |||
34 | enum { | ||
35 | TCA_SKBEDIT_UNSPEC, | ||
36 | TCA_SKBEDIT_TM, | ||
37 | TCA_SKBEDIT_PARMS, | ||
38 | TCA_SKBEDIT_PRIORITY, | ||
39 | TCA_SKBEDIT_QUEUE_MAPPING, | ||
40 | __TCA_SKBEDIT_MAX | ||
41 | }; | ||
42 | #define TCA_SKBEDIT_MAX (__TCA_SKBEDIT_MAX - 1) | ||
43 | |||
44 | #endif | ||
diff --git a/include/net/tc_act/tc_skbedit.h b/include/net/tc_act/tc_skbedit.h new file mode 100644 index 000000000000..6abb3ed3ebf7 --- /dev/null +++ b/include/net/tc_act/tc_skbedit.h | |||
@@ -0,0 +1,34 @@ | |||
1 | /* | ||
2 | * Copyright (c) 2008, Intel Corporation. | ||
3 | * | ||
4 | * This program is free software; you can redistribute it and/or modify it | ||
5 | * under the terms and conditions of the GNU General Public License, | ||
6 | * version 2, as published by the Free Software Foundation. | ||
7 | * | ||
8 | * This program is distributed in the hope it will be useful, but WITHOUT | ||
9 | * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or | ||
10 | * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for | ||
11 | * more details. | ||
12 | * | ||
13 | * You should have received a copy of the GNU General Public License along with | ||
14 | * this program; if not, write to the Free Software Foundation, Inc., 59 Temple | ||
15 | * Place - Suite 330, Boston, MA 02111-1307 USA. | ||
16 | * | ||
17 | * Author: Alexander Duyck <alexander.h.duyck@intel.com> | ||
18 | */ | ||
19 | |||
20 | #ifndef __NET_TC_SKBEDIT_H | ||
21 | #define __NET_TC_SKBEDIT_H | ||
22 | |||
23 | #include <net/act_api.h> | ||
24 | |||
25 | struct tcf_skbedit { | ||
26 | struct tcf_common common; | ||
27 | u32 flags; | ||
28 | u32 priority; | ||
29 | u16 queue_mapping; | ||
30 | }; | ||
31 | #define to_skbedit(pc) \ | ||
32 | container_of(pc, struct tcf_skbedit, common) | ||
33 | |||
34 | #endif /* __NET_TC_SKBEDIT_H */ | ||
diff --git a/net/sched/Kconfig b/net/sched/Kconfig index efaa7a75e7f3..6767e54155db 100644 --- a/net/sched/Kconfig +++ b/net/sched/Kconfig | |||
@@ -485,6 +485,17 @@ config NET_ACT_SIMP | |||
485 | To compile this code as a module, choose M here: the | 485 | To compile this code as a module, choose M here: the |
486 | module will be called simple. | 486 | module will be called simple. |
487 | 487 | ||
488 | config NET_ACT_SKBEDIT | ||
489 | tristate "SKB Editing" | ||
490 | depends on NET_CLS_ACT | ||
491 | ---help--- | ||
492 | Say Y here to change skb priority or queue_mapping settings. | ||
493 | |||
494 | If unsure, say N. | ||
495 | |||
496 | To compile this code as a module, choose M here: the | ||
497 | module will be called act_skbedit. | ||
498 | |||
488 | config NET_CLS_IND | 499 | config NET_CLS_IND |
489 | bool "Incoming device classification" | 500 | bool "Incoming device classification" |
490 | depends on NET_CLS_U32 || NET_CLS_FW | 501 | depends on NET_CLS_U32 || NET_CLS_FW |
diff --git a/net/sched/Makefile b/net/sched/Makefile index 3d9b953f7f62..e60c9925b269 100644 --- a/net/sched/Makefile +++ b/net/sched/Makefile | |||
@@ -14,6 +14,7 @@ obj-$(CONFIG_NET_ACT_IPT) += act_ipt.o | |||
14 | obj-$(CONFIG_NET_ACT_NAT) += act_nat.o | 14 | obj-$(CONFIG_NET_ACT_NAT) += act_nat.o |
15 | obj-$(CONFIG_NET_ACT_PEDIT) += act_pedit.o | 15 | obj-$(CONFIG_NET_ACT_PEDIT) += act_pedit.o |
16 | obj-$(CONFIG_NET_ACT_SIMP) += act_simple.o | 16 | obj-$(CONFIG_NET_ACT_SIMP) += act_simple.o |
17 | obj-$(CONFIG_NET_ACT_SKBEDIT) += act_skbedit.o | ||
17 | obj-$(CONFIG_NET_SCH_FIFO) += sch_fifo.o | 18 | obj-$(CONFIG_NET_SCH_FIFO) += sch_fifo.o |
18 | obj-$(CONFIG_NET_SCH_CBQ) += sch_cbq.o | 19 | obj-$(CONFIG_NET_SCH_CBQ) += sch_cbq.o |
19 | obj-$(CONFIG_NET_SCH_HTB) += sch_htb.o | 20 | obj-$(CONFIG_NET_SCH_HTB) += sch_htb.o |
diff --git a/net/sched/act_skbedit.c b/net/sched/act_skbedit.c new file mode 100644 index 000000000000..fe9777e77f35 --- /dev/null +++ b/net/sched/act_skbedit.c | |||
@@ -0,0 +1,203 @@ | |||
1 | /* | ||
2 | * Copyright (c) 2008, Intel Corporation. | ||
3 | * | ||
4 | * This program is free software; you can redistribute it and/or modify it | ||
5 | * under the terms and conditions of the GNU General Public License, | ||
6 | * version 2, as published by the Free Software Foundation. | ||
7 | * | ||
8 | * This program is distributed in the hope it will be useful, but WITHOUT | ||
9 | * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or | ||
10 | * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for | ||
11 | * more details. | ||
12 | * | ||
13 | * You should have received a copy of the GNU General Public License along with | ||
14 | * this program; if not, write to the Free Software Foundation, Inc., 59 Temple | ||
15 | * Place - Suite 330, Boston, MA 02111-1307 USA. | ||
16 | * | ||
17 | * Author: Alexander Duyck <alexander.h.duyck@intel.com> | ||
18 | */ | ||
19 | |||
20 | #include <linux/module.h> | ||
21 | #include <linux/init.h> | ||
22 | #include <linux/kernel.h> | ||
23 | #include <linux/skbuff.h> | ||
24 | #include <linux/rtnetlink.h> | ||
25 | #include <net/netlink.h> | ||
26 | #include <net/pkt_sched.h> | ||
27 | |||
28 | #include <linux/tc_act/tc_skbedit.h> | ||
29 | #include <net/tc_act/tc_skbedit.h> | ||
30 | |||
31 | #define SKBEDIT_TAB_MASK 15 | ||
32 | static struct tcf_common *tcf_skbedit_ht[SKBEDIT_TAB_MASK + 1]; | ||
33 | static u32 skbedit_idx_gen; | ||
34 | static DEFINE_RWLOCK(skbedit_lock); | ||
35 | |||
36 | static struct tcf_hashinfo skbedit_hash_info = { | ||
37 | .htab = tcf_skbedit_ht, | ||
38 | .hmask = SKBEDIT_TAB_MASK, | ||
39 | .lock = &skbedit_lock, | ||
40 | }; | ||
41 | |||
42 | static int tcf_skbedit(struct sk_buff *skb, struct tc_action *a, | ||
43 | struct tcf_result *res) | ||
44 | { | ||
45 | struct tcf_skbedit *d = a->priv; | ||
46 | |||
47 | spin_lock(&d->tcf_lock); | ||
48 | d->tcf_tm.lastuse = jiffies; | ||
49 | d->tcf_bstats.bytes += qdisc_pkt_len(skb); | ||
50 | d->tcf_bstats.packets++; | ||
51 | |||
52 | if (d->flags & SKBEDIT_F_PRIORITY) | ||
53 | skb->priority = d->priority; | ||
54 | if (d->flags & SKBEDIT_F_QUEUE_MAPPING && | ||
55 | skb->dev->real_num_tx_queues > d->queue_mapping) | ||
56 | skb_set_queue_mapping(skb, d->queue_mapping); | ||
57 | |||
58 | spin_unlock(&d->tcf_lock); | ||
59 | return d->tcf_action; | ||
60 | } | ||
61 | |||
62 | static const struct nla_policy skbedit_policy[TCA_SKBEDIT_MAX + 1] = { | ||
63 | [TCA_SKBEDIT_PARMS] = { .len = sizeof(struct tc_skbedit) }, | ||
64 | [TCA_SKBEDIT_PRIORITY] = { .len = sizeof(u32) }, | ||
65 | [TCA_SKBEDIT_QUEUE_MAPPING] = { .len = sizeof(u16) }, | ||
66 | }; | ||
67 | |||
68 | static int tcf_skbedit_init(struct nlattr *nla, struct nlattr *est, | ||
69 | struct tc_action *a, int ovr, int bind) | ||
70 | { | ||
71 | struct nlattr *tb[TCA_SKBEDIT_MAX + 1]; | ||
72 | struct tc_skbedit *parm; | ||
73 | struct tcf_skbedit *d; | ||
74 | struct tcf_common *pc; | ||
75 | u32 flags = 0, *priority = NULL; | ||
76 | u16 *queue_mapping = NULL; | ||
77 | int ret = 0, err; | ||
78 | |||
79 | if (nla == NULL) | ||
80 | return -EINVAL; | ||
81 | |||
82 | err = nla_parse_nested(tb, TCA_SKBEDIT_MAX, nla, skbedit_policy); | ||
83 | if (err < 0) | ||
84 | return err; | ||
85 | |||
86 | if (tb[TCA_SKBEDIT_PARMS] == NULL) | ||
87 | return -EINVAL; | ||
88 | |||
89 | if (tb[TCA_SKBEDIT_PRIORITY] != NULL) { | ||
90 | flags |= SKBEDIT_F_PRIORITY; | ||
91 | priority = nla_data(tb[TCA_SKBEDIT_PRIORITY]); | ||
92 | } | ||
93 | |||
94 | if (tb[TCA_SKBEDIT_QUEUE_MAPPING] != NULL) { | ||
95 | flags |= SKBEDIT_F_QUEUE_MAPPING; | ||
96 | queue_mapping = nla_data(tb[TCA_SKBEDIT_QUEUE_MAPPING]); | ||
97 | } | ||
98 | if (!flags) | ||
99 | return -EINVAL; | ||
100 | |||
101 | parm = nla_data(tb[TCA_SKBEDIT_PARMS]); | ||
102 | |||
103 | pc = tcf_hash_check(parm->index, a, bind, &skbedit_hash_info); | ||
104 | if (!pc) { | ||
105 | pc = tcf_hash_create(parm->index, est, a, sizeof(*d), bind, | ||
106 | &skbedit_idx_gen, &skbedit_hash_info); | ||
107 | if (unlikely(!pc)) | ||
108 | return -ENOMEM; | ||
109 | |||
110 | d = to_skbedit(pc); | ||
111 | ret = ACT_P_CREATED; | ||
112 | } else { | ||
113 | d = to_skbedit(pc); | ||
114 | if (!ovr) { | ||
115 | tcf_hash_release(pc, bind, &skbedit_hash_info); | ||
116 | return -EEXIST; | ||
117 | } | ||
118 | } | ||
119 | |||
120 | spin_lock_bh(&d->tcf_lock); | ||
121 | |||
122 | d->flags = flags; | ||
123 | if (flags & SKBEDIT_F_PRIORITY) | ||
124 | d->priority = *priority; | ||
125 | if (flags & SKBEDIT_F_QUEUE_MAPPING) | ||
126 | d->queue_mapping = *queue_mapping; | ||
127 | d->tcf_action = parm->action; | ||
128 | |||
129 | spin_unlock_bh(&d->tcf_lock); | ||
130 | |||
131 | if (ret == ACT_P_CREATED) | ||
132 | tcf_hash_insert(pc, &skbedit_hash_info); | ||
133 | return ret; | ||
134 | } | ||
135 | |||
136 | static inline int tcf_skbedit_cleanup(struct tc_action *a, int bind) | ||
137 | { | ||
138 | struct tcf_skbedit *d = a->priv; | ||
139 | |||
140 | if (d) | ||
141 | return tcf_hash_release(&d->common, bind, &skbedit_hash_info); | ||
142 | return 0; | ||
143 | } | ||
144 | |||
145 | static inline int tcf_skbedit_dump(struct sk_buff *skb, struct tc_action *a, | ||
146 | int bind, int ref) | ||
147 | { | ||
148 | unsigned char *b = skb_tail_pointer(skb); | ||
149 | struct tcf_skbedit *d = a->priv; | ||
150 | struct tc_skbedit opt; | ||
151 | struct tcf_t t; | ||
152 | |||
153 | opt.index = d->tcf_index; | ||
154 | opt.refcnt = d->tcf_refcnt - ref; | ||
155 | opt.bindcnt = d->tcf_bindcnt - bind; | ||
156 | opt.action = d->tcf_action; | ||
157 | NLA_PUT(skb, TCA_SKBEDIT_PARMS, sizeof(opt), &opt); | ||
158 | if (d->flags & SKBEDIT_F_PRIORITY) | ||
159 | NLA_PUT(skb, TCA_SKBEDIT_PRIORITY, sizeof(d->priority), | ||
160 | &d->priority); | ||
161 | if (d->flags & SKBEDIT_F_QUEUE_MAPPING) | ||
162 | NLA_PUT(skb, TCA_SKBEDIT_QUEUE_MAPPING, | ||
163 | sizeof(d->queue_mapping), &d->queue_mapping); | ||
164 | t.install = jiffies_to_clock_t(jiffies - d->tcf_tm.install); | ||
165 | t.lastuse = jiffies_to_clock_t(jiffies - d->tcf_tm.lastuse); | ||
166 | t.expires = jiffies_to_clock_t(d->tcf_tm.expires); | ||
167 | NLA_PUT(skb, TCA_SKBEDIT_TM, sizeof(t), &t); | ||
168 | return skb->len; | ||
169 | |||
170 | nla_put_failure: | ||
171 | nlmsg_trim(skb, b); | ||
172 | return -1; | ||
173 | } | ||
174 | |||
175 | static struct tc_action_ops act_skbedit_ops = { | ||
176 | .kind = "skbedit", | ||
177 | .hinfo = &skbedit_hash_info, | ||
178 | .type = TCA_ACT_SKBEDIT, | ||
179 | .capab = TCA_CAP_NONE, | ||
180 | .owner = THIS_MODULE, | ||
181 | .act = tcf_skbedit, | ||
182 | .dump = tcf_skbedit_dump, | ||
183 | .cleanup = tcf_skbedit_cleanup, | ||
184 | .init = tcf_skbedit_init, | ||
185 | .walk = tcf_generic_walker, | ||
186 | }; | ||
187 | |||
188 | MODULE_AUTHOR("Alexander Duyck, <alexander.h.duyck@intel.com>"); | ||
189 | MODULE_DESCRIPTION("SKB Editing"); | ||
190 | MODULE_LICENSE("GPL"); | ||
191 | |||
192 | static int __init skbedit_init_module(void) | ||
193 | { | ||
194 | return tcf_register_action(&act_skbedit_ops); | ||
195 | } | ||
196 | |||
197 | static void __exit skbedit_cleanup_module(void) | ||
198 | { | ||
199 | tcf_unregister_action(&act_skbedit_ops); | ||
200 | } | ||
201 | |||
202 | module_init(skbedit_init_module); | ||
203 | module_exit(skbedit_cleanup_module); | ||