diff options
author | Pravin B Shelar <pshelar@nicira.com> | 2013-03-25 10:49:35 -0400 |
---|---|---|
committer | David S. Miller <davem@davemloft.net> | 2013-03-26 12:27:18 -0400 |
commit | c54419321455631079c7d6e60bc732dd0c5914c5 (patch) | |
tree | a0ad703b72313b98e70f4166bcea9a328d09e937 /include | |
parent | eaac5f3d3ad33547b299935e6db0cfc7be9a576a (diff) |
GRE: Refactor GRE tunneling code.
The following patch refactors the GRE code into generic IP tunneling code and
GRE-specific code. The common tunneling code is moved to the ip_tunnel module.
The ip_tunnel module is written as a generic library which can be used
by different tunneling implementations.
The ip_tunnel module contains the following components:
- packet xmit and rcv generic code. xmit flow looks like
(gre_xmit/ipip_xmit)->ip_tunnel_xmit->ip_local_out.
- hash table of all devices.
- lookup for tunnel devices.
- control plane operations like device create, destroy, ioctl, netlink
operations code.
- registration for tunneling modules, like gre, ipip etc.
- define single pcpu_tstats dev->tstats.
- struct tnl_ptk_info is added to pass parsed tunnel packet parameters.
The ipip.h header is renamed to ip_tunnels.h.
Signed-off-by: Pravin B Shelar <pshelar@nicira.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
Diffstat (limited to 'include')
-rw-r--r-- | include/net/gre.h | 51 | ||||
-rw-r--r-- | include/net/ip6_tunnel.h | 1 | ||||
-rw-r--r-- | include/net/ip_tunnels.h | 177 | ||||
-rw-r--r-- | include/net/ipip.h | 84 |
4 files changed, 229 insertions, 84 deletions
diff --git a/include/net/gre.h b/include/net/gre.h index 82665474bcb7..9f03a390c826 100644 --- a/include/net/gre.h +++ b/include/net/gre.h | |||
@@ -2,6 +2,7 @@ | |||
2 | #define __LINUX_GRE_H | 2 | #define __LINUX_GRE_H |
3 | 3 | ||
4 | #include <linux/skbuff.h> | 4 | #include <linux/skbuff.h> |
5 | #include <net/ip_tunnels.h> | ||
5 | 6 | ||
6 | #define GREPROTO_CISCO 0 | 7 | #define GREPROTO_CISCO 0 |
7 | #define GREPROTO_PPTP 1 | 8 | #define GREPROTO_PPTP 1 |
@@ -12,7 +13,57 @@ struct gre_protocol { | |||
12 | void (*err_handler)(struct sk_buff *skb, u32 info); | 13 | void (*err_handler)(struct sk_buff *skb, u32 info); |
13 | }; | 14 | }; |
14 | 15 | ||
16 | struct gre_base_hdr { | ||
17 | __be16 flags; | ||
18 | __be16 protocol; | ||
19 | }; | ||
20 | #define GRE_HEADER_SECTION 4 | ||
21 | |||
15 | int gre_add_protocol(const struct gre_protocol *proto, u8 version); | 22 | int gre_add_protocol(const struct gre_protocol *proto, u8 version); |
16 | int gre_del_protocol(const struct gre_protocol *proto, u8 version); | 23 | int gre_del_protocol(const struct gre_protocol *proto, u8 version); |
17 | 24 | ||
25 | static inline __be16 gre_flags_to_tnl_flags(__be16 flags) | ||
26 | { | ||
27 | __be16 tflags = 0; | ||
28 | |||
29 | if (flags & GRE_CSUM) | ||
30 | tflags |= TUNNEL_CSUM; | ||
31 | if (flags & GRE_ROUTING) | ||
32 | tflags |= TUNNEL_ROUTING; | ||
33 | if (flags & GRE_KEY) | ||
34 | tflags |= TUNNEL_KEY; | ||
35 | if (flags & GRE_SEQ) | ||
36 | tflags |= TUNNEL_SEQ; | ||
37 | if (flags & GRE_STRICT) | ||
38 | tflags |= TUNNEL_STRICT; | ||
39 | if (flags & GRE_REC) | ||
40 | tflags |= TUNNEL_REC; | ||
41 | if (flags & GRE_VERSION) | ||
42 | tflags |= TUNNEL_VERSION; | ||
43 | |||
44 | return tflags; | ||
45 | } | ||
46 | |||
47 | static inline __be16 tnl_flags_to_gre_flags(__be16 tflags) | ||
48 | { | ||
49 | __be16 flags = 0; | ||
50 | |||
51 | if (tflags & TUNNEL_CSUM) | ||
52 | flags |= GRE_CSUM; | ||
53 | if (tflags & TUNNEL_ROUTING) | ||
54 | flags |= GRE_ROUTING; | ||
55 | if (tflags & TUNNEL_KEY) | ||
56 | flags |= GRE_KEY; | ||
57 | if (tflags & TUNNEL_SEQ) | ||
58 | flags |= GRE_SEQ; | ||
59 | if (tflags & TUNNEL_STRICT) | ||
60 | flags |= GRE_STRICT; | ||
61 | if (tflags & TUNNEL_REC) | ||
62 | flags |= GRE_REC; | ||
63 | if (tflags & TUNNEL_VERSION) | ||
64 | flags |= GRE_VERSION; | ||
65 | |||
66 | return flags; | ||
67 | } | ||
68 | |||
18 | #endif | 69 | #endif |
diff --git a/include/net/ip6_tunnel.h b/include/net/ip6_tunnel.h index ebdef7f60862..4da5de10d1d4 100644 --- a/include/net/ip6_tunnel.h +++ b/include/net/ip6_tunnel.h | |||
@@ -3,6 +3,7 @@ | |||
3 | 3 | ||
4 | #include <linux/ipv6.h> | 4 | #include <linux/ipv6.h> |
5 | #include <linux/netdevice.h> | 5 | #include <linux/netdevice.h> |
6 | #include <linux/if_tunnel.h> | ||
6 | #include <linux/ip6_tunnel.h> | 7 | #include <linux/ip6_tunnel.h> |
7 | 8 | ||
8 | #define IP6TUNNEL_ERR_TIMEO (30*HZ) | 9 | #define IP6TUNNEL_ERR_TIMEO (30*HZ) |
diff --git a/include/net/ip_tunnels.h b/include/net/ip_tunnels.h new file mode 100644 index 000000000000..4b6f0b28f41f --- /dev/null +++ b/include/net/ip_tunnels.h | |||
@@ -0,0 +1,177 @@ | |||
1 | #ifndef __NET_IP_TUNNELS_H | ||
2 | #define __NET_IP_TUNNELS_H 1 | ||
3 | |||
4 | #include <linux/if_tunnel.h> | ||
5 | #include <linux/netdevice.h> | ||
6 | #include <linux/skbuff.h> | ||
7 | #include <linux/types.h> | ||
8 | #include <linux/u64_stats_sync.h> | ||
9 | #include <net/dsfield.h> | ||
10 | #include <net/gro_cells.h> | ||
11 | #include <net/inet_ecn.h> | ||
12 | #include <net/ip.h> | ||
13 | #include <net/rtnetlink.h> | ||
14 | |||
15 | #if IS_ENABLED(CONFIG_IPV6) | ||
16 | #include <net/ipv6.h> | ||
17 | #include <net/ip6_fib.h> | ||
18 | #include <net/ip6_route.h> | ||
19 | #endif | ||
20 | |||
21 | /* Keep error state on tunnel for 30 sec */ | ||
22 | #define IPTUNNEL_ERR_TIMEO (30*HZ) | ||
23 | |||
24 | /* 6rd prefix/relay information */ | ||
25 | #ifdef CONFIG_IPV6_SIT_6RD | ||
26 | struct ip_tunnel_6rd_parm { | ||
27 | struct in6_addr prefix; | ||
28 | __be32 relay_prefix; | ||
29 | u16 prefixlen; | ||
30 | u16 relay_prefixlen; | ||
31 | }; | ||
32 | #endif | ||
33 | |||
34 | struct ip_tunnel_prl_entry { | ||
35 | struct ip_tunnel_prl_entry __rcu *next; | ||
36 | __be32 addr; | ||
37 | u16 flags; | ||
38 | struct rcu_head rcu_head; | ||
39 | }; | ||
40 | |||
41 | struct ip_tunnel { | ||
42 | struct ip_tunnel __rcu *next; | ||
43 | struct hlist_node hash_node; | ||
44 | struct net_device *dev; | ||
45 | |||
46 | int err_count; /* Number of arrived ICMP errors */ | ||
47 | unsigned long err_time; /* Time when the last ICMP error | ||
48 | * arrived */ | ||
49 | |||
50 | /* These four fields used only by GRE */ | ||
51 | __u32 i_seqno; /* The last seen seqno */ | ||
52 | __u32 o_seqno; /* The last output seqno */ | ||
53 | int hlen; /* Precalculated header length */ | ||
54 | int mlink; | ||
55 | |||
56 | struct ip_tunnel_parm parms; | ||
57 | |||
58 | /* for SIT */ | ||
59 | #ifdef CONFIG_IPV6_SIT_6RD | ||
60 | struct ip_tunnel_6rd_parm ip6rd; | ||
61 | #endif | ||
62 | struct ip_tunnel_prl_entry __rcu *prl; /* potential router list */ | ||
63 | unsigned int prl_count; /* # of entries in PRL */ | ||
64 | int ip_tnl_net_id; | ||
65 | struct gro_cells gro_cells; | ||
66 | }; | ||
67 | |||
68 | #define TUNNEL_CSUM __cpu_to_be16(0x01) | ||
69 | #define TUNNEL_ROUTING __cpu_to_be16(0x02) | ||
70 | #define TUNNEL_KEY __cpu_to_be16(0x04) | ||
71 | #define TUNNEL_SEQ __cpu_to_be16(0x08) | ||
72 | #define TUNNEL_STRICT __cpu_to_be16(0x10) | ||
73 | #define TUNNEL_REC __cpu_to_be16(0x20) | ||
74 | #define TUNNEL_VERSION __cpu_to_be16(0x40) | ||
75 | #define TUNNEL_NO_KEY __cpu_to_be16(0x80) | ||
76 | |||
77 | struct tnl_ptk_info { | ||
78 | __be16 flags; | ||
79 | __be16 proto; | ||
80 | __be32 key; | ||
81 | __be32 seq; | ||
82 | }; | ||
83 | |||
84 | #define PACKET_RCVD 0 | ||
85 | #define PACKET_REJECT 1 | ||
86 | |||
87 | #define IP_TNL_HASH_BITS 10 | ||
88 | #define IP_TNL_HASH_SIZE (1 << IP_TNL_HASH_BITS) | ||
89 | |||
90 | struct ip_tunnel_net { | ||
91 | struct hlist_head *tunnels; | ||
92 | struct net_device *fb_tunnel_dev; | ||
93 | }; | ||
94 | |||
95 | int ip_tunnel_init(struct net_device *dev); | ||
96 | void ip_tunnel_uninit(struct net_device *dev); | ||
97 | void ip_tunnel_dellink(struct net_device *dev, struct list_head *head); | ||
98 | int __net_init ip_tunnel_init_net(struct net *net, int ip_tnl_net_id, | ||
99 | struct rtnl_link_ops *ops, char *devname); | ||
100 | |||
101 | void __net_exit ip_tunnel_delete_net(struct ip_tunnel_net *itn); | ||
102 | |||
103 | void ip_tunnel_xmit(struct sk_buff *skb, struct net_device *dev, | ||
104 | const struct iphdr *tnl_params); | ||
105 | int ip_tunnel_ioctl(struct net_device *dev, struct ip_tunnel_parm *p, int cmd); | ||
106 | int ip_tunnel_change_mtu(struct net_device *dev, int new_mtu); | ||
107 | |||
108 | struct rtnl_link_stats64 *ip_tunnel_get_stats64(struct net_device *dev, | ||
109 | struct rtnl_link_stats64 *tot); | ||
110 | struct ip_tunnel *ip_tunnel_lookup(struct ip_tunnel_net *itn, | ||
111 | int link, __be16 flags, | ||
112 | __be32 remote, __be32 local, | ||
113 | __be32 key); | ||
114 | |||
115 | int ip_tunnel_rcv(struct ip_tunnel *tunnel, struct sk_buff *skb, | ||
116 | const struct tnl_ptk_info *tpi, bool log_ecn_error); | ||
117 | int ip_tunnel_changelink(struct net_device *dev, struct nlattr *tb[], | ||
118 | struct ip_tunnel_parm *p); | ||
119 | int ip_tunnel_newlink(struct net_device *dev, struct nlattr *tb[], | ||
120 | struct ip_tunnel_parm *p); | ||
121 | void ip_tunnel_setup(struct net_device *dev, int net_id); | ||
122 | |||
123 | /* Extract dsfield from inner protocol */ | ||
124 | static inline u8 ip_tunnel_get_dsfield(const struct iphdr *iph, | ||
125 | const struct sk_buff *skb) | ||
126 | { | ||
127 | if (skb->protocol == htons(ETH_P_IP)) | ||
128 | return iph->tos; | ||
129 | else if (skb->protocol == htons(ETH_P_IPV6)) | ||
130 | return ipv6_get_dsfield((const struct ipv6hdr *)iph); | ||
131 | else | ||
132 | return 0; | ||
133 | } | ||
134 | |||
135 | /* Propogate ECN bits out */ | ||
136 | static inline u8 ip_tunnel_ecn_encap(u8 tos, const struct iphdr *iph, | ||
137 | const struct sk_buff *skb) | ||
138 | { | ||
139 | u8 inner = ip_tunnel_get_dsfield(iph, skb); | ||
140 | |||
141 | return INET_ECN_encapsulate(tos, inner); | ||
142 | } | ||
143 | |||
144 | static inline void tunnel_ip_select_ident(struct sk_buff *skb, | ||
145 | const struct iphdr *old_iph, | ||
146 | struct dst_entry *dst) | ||
147 | { | ||
148 | struct iphdr *iph = ip_hdr(skb); | ||
149 | |||
150 | /* Use inner packet iph-id if possible. */ | ||
151 | if (skb->protocol == htons(ETH_P_IP) && old_iph->id) | ||
152 | iph->id = old_iph->id; | ||
153 | else | ||
154 | __ip_select_ident(iph, dst, | ||
155 | (skb_shinfo(skb)->gso_segs ?: 1) - 1); | ||
156 | } | ||
157 | |||
158 | static inline void iptunnel_xmit(struct sk_buff *skb, struct net_device *dev) | ||
159 | { | ||
160 | int err; | ||
161 | int pkt_len = skb->len - skb_transport_offset(skb); | ||
162 | struct pcpu_tstats *tstats = this_cpu_ptr(dev->tstats); | ||
163 | |||
164 | nf_reset(skb); | ||
165 | |||
166 | err = ip_local_out(skb); | ||
167 | if (likely(net_xmit_eval(err) == 0)) { | ||
168 | u64_stats_update_begin(&tstats->syncp); | ||
169 | tstats->tx_bytes += pkt_len; | ||
170 | tstats->tx_packets++; | ||
171 | u64_stats_update_end(&tstats->syncp); | ||
172 | } else { | ||
173 | dev->stats.tx_errors++; | ||
174 | dev->stats.tx_aborted_errors++; | ||
175 | } | ||
176 | } | ||
177 | #endif /* __NET_IP_TUNNELS_H */ | ||
diff --git a/include/net/ipip.h b/include/net/ipip.h deleted file mode 100644 index 483b91a10bb2..000000000000 --- a/include/net/ipip.h +++ /dev/null | |||
@@ -1,84 +0,0 @@ | |||
1 | #ifndef __NET_IPIP_H | ||
2 | #define __NET_IPIP_H 1 | ||
3 | |||
4 | #include <linux/if_tunnel.h> | ||
5 | #include <net/gro_cells.h> | ||
6 | #include <net/ip.h> | ||
7 | |||
8 | /* Keep error state on tunnel for 30 sec */ | ||
9 | #define IPTUNNEL_ERR_TIMEO (30*HZ) | ||
10 | |||
11 | /* 6rd prefix/relay information */ | ||
12 | struct ip_tunnel_6rd_parm { | ||
13 | struct in6_addr prefix; | ||
14 | __be32 relay_prefix; | ||
15 | u16 prefixlen; | ||
16 | u16 relay_prefixlen; | ||
17 | }; | ||
18 | |||
19 | struct ip_tunnel { | ||
20 | struct ip_tunnel __rcu *next; | ||
21 | struct net_device *dev; | ||
22 | |||
23 | int err_count; /* Number of arrived ICMP errors */ | ||
24 | unsigned long err_time; /* Time when the last ICMP error arrived */ | ||
25 | |||
26 | /* These four fields used only by GRE */ | ||
27 | __u32 i_seqno; /* The last seen seqno */ | ||
28 | __u32 o_seqno; /* The last output seqno */ | ||
29 | int hlen; /* Precalculated GRE header length */ | ||
30 | int mlink; | ||
31 | |||
32 | struct ip_tunnel_parm parms; | ||
33 | |||
34 | /* for SIT */ | ||
35 | #ifdef CONFIG_IPV6_SIT_6RD | ||
36 | struct ip_tunnel_6rd_parm ip6rd; | ||
37 | #endif | ||
38 | struct ip_tunnel_prl_entry __rcu *prl; /* potential router list */ | ||
39 | unsigned int prl_count; /* # of entries in PRL */ | ||
40 | |||
41 | struct gro_cells gro_cells; | ||
42 | }; | ||
43 | |||
44 | struct ip_tunnel_prl_entry { | ||
45 | struct ip_tunnel_prl_entry __rcu *next; | ||
46 | __be32 addr; | ||
47 | u16 flags; | ||
48 | struct rcu_head rcu_head; | ||
49 | }; | ||
50 | |||
51 | static inline void iptunnel_xmit(struct sk_buff *skb, struct net_device *dev) | ||
52 | { | ||
53 | int err; | ||
54 | int pkt_len = skb->len - skb_transport_offset(skb); | ||
55 | struct pcpu_tstats *tstats = this_cpu_ptr(dev->tstats); | ||
56 | |||
57 | nf_reset(skb); | ||
58 | |||
59 | err = ip_local_out(skb); | ||
60 | if (likely(net_xmit_eval(err) == 0)) { | ||
61 | u64_stats_update_begin(&tstats->syncp); | ||
62 | tstats->tx_bytes += pkt_len; | ||
63 | tstats->tx_packets++; | ||
64 | u64_stats_update_end(&tstats->syncp); | ||
65 | } else { | ||
66 | dev->stats.tx_errors++; | ||
67 | dev->stats.tx_aborted_errors++; | ||
68 | } | ||
69 | } | ||
70 | |||
71 | static inline void tunnel_ip_select_ident(struct sk_buff *skb, | ||
72 | const struct iphdr *old_iph, | ||
73 | struct dst_entry *dst) | ||
74 | { | ||
75 | struct iphdr *iph = ip_hdr(skb); | ||
76 | |||
77 | /* Use inner packet iph-id if possible. */ | ||
78 | if (skb->protocol == htons(ETH_P_IP) && old_iph->id) | ||
79 | iph->id = old_iph->id; | ||
80 | else | ||
81 | __ip_select_ident(iph, dst, | ||
82 | (skb_shinfo(skb)->gso_segs ?: 1) - 1); | ||
83 | } | ||
84 | #endif | ||