diff options
Diffstat (limited to 'net/ipv4/ip_gre.c')
-rw-r--r-- | net/ipv4/ip_gre.c | 237 |
1 files changed, 154 insertions, 83 deletions
diff --git a/net/ipv4/ip_gre.c b/net/ipv4/ip_gre.c index 35c93e8b6a46..d0ffcbe369b7 100644 --- a/net/ipv4/ip_gre.c +++ b/net/ipv4/ip_gre.c | |||
@@ -44,6 +44,7 @@ | |||
44 | #include <net/net_namespace.h> | 44 | #include <net/net_namespace.h> |
45 | #include <net/netns/generic.h> | 45 | #include <net/netns/generic.h> |
46 | #include <net/rtnetlink.h> | 46 | #include <net/rtnetlink.h> |
47 | #include <net/gre.h> | ||
47 | 48 | ||
48 | #if defined(CONFIG_IPV6) || defined(CONFIG_IPV6_MODULE) | 49 | #if defined(CONFIG_IPV6) || defined(CONFIG_IPV6_MODULE) |
49 | #include <net/ipv6.h> | 50 | #include <net/ipv6.h> |
@@ -63,13 +64,13 @@ | |||
63 | We cannot track such dead loops during route installation, | 64 | We cannot track such dead loops during route installation, |
64 | it is infeasible task. The most general solutions would be | 65 | it is infeasible task. The most general solutions would be |
65 | to keep skb->encapsulation counter (sort of local ttl), | 66 | to keep skb->encapsulation counter (sort of local ttl), |
66 | and silently drop packet when it expires. It is the best | 67 | and silently drop packet when it expires. It is a good |
67 | solution, but it supposes maintaing new variable in ALL | 68 | solution, but it supposes maintaing new variable in ALL |
68 | skb, even if no tunneling is used. | 69 | skb, even if no tunneling is used. |
69 | 70 | ||
70 | Current solution: HARD_TX_LOCK lock breaks dead loops. | 71 | Current solution: xmit_recursion breaks dead loops. This is a percpu |
71 | 72 | counter, since when we enter the first ndo_xmit(), cpu migration is | |
72 | 73 | forbidden. We force an exit if this counter reaches RECURSION_LIMIT | |
73 | 74 | ||
74 | 2. Networking dead loops would not kill routers, but would really | 75 | 2. Networking dead loops would not kill routers, but would really |
75 | kill network. IP hop limit plays role of "t->recursion" in this case, | 76 | kill network. IP hop limit plays role of "t->recursion" in this case, |
@@ -128,7 +129,7 @@ static int ipgre_tunnel_bind_dev(struct net_device *dev); | |||
128 | 129 | ||
129 | static int ipgre_net_id __read_mostly; | 130 | static int ipgre_net_id __read_mostly; |
130 | struct ipgre_net { | 131 | struct ipgre_net { |
131 | struct ip_tunnel *tunnels[4][HASH_SIZE]; | 132 | struct ip_tunnel __rcu *tunnels[4][HASH_SIZE]; |
132 | 133 | ||
133 | struct net_device *fb_tunnel_dev; | 134 | struct net_device *fb_tunnel_dev; |
134 | }; | 135 | }; |
@@ -158,13 +159,40 @@ struct ipgre_net { | |||
158 | #define tunnels_l tunnels[1] | 159 | #define tunnels_l tunnels[1] |
159 | #define tunnels_wc tunnels[0] | 160 | #define tunnels_wc tunnels[0] |
160 | /* | 161 | /* |
161 | * Locking : hash tables are protected by RCU and a spinlock | 162 | * Locking : hash tables are protected by RCU and RTNL |
162 | */ | 163 | */ |
163 | static DEFINE_SPINLOCK(ipgre_lock); | ||
164 | 164 | ||
165 | #define for_each_ip_tunnel_rcu(start) \ | 165 | #define for_each_ip_tunnel_rcu(start) \ |
166 | for (t = rcu_dereference(start); t; t = rcu_dereference(t->next)) | 166 | for (t = rcu_dereference(start); t; t = rcu_dereference(t->next)) |
167 | 167 | ||
168 | /* often modified stats are per cpu, other are shared (netdev->stats) */ | ||
169 | struct pcpu_tstats { | ||
170 | unsigned long rx_packets; | ||
171 | unsigned long rx_bytes; | ||
172 | unsigned long tx_packets; | ||
173 | unsigned long tx_bytes; | ||
174 | }; | ||
175 | |||
176 | static struct net_device_stats *ipgre_get_stats(struct net_device *dev) | ||
177 | { | ||
178 | struct pcpu_tstats sum = { 0 }; | ||
179 | int i; | ||
180 | |||
181 | for_each_possible_cpu(i) { | ||
182 | const struct pcpu_tstats *tstats = per_cpu_ptr(dev->tstats, i); | ||
183 | |||
184 | sum.rx_packets += tstats->rx_packets; | ||
185 | sum.rx_bytes += tstats->rx_bytes; | ||
186 | sum.tx_packets += tstats->tx_packets; | ||
187 | sum.tx_bytes += tstats->tx_bytes; | ||
188 | } | ||
189 | dev->stats.rx_packets = sum.rx_packets; | ||
190 | dev->stats.rx_bytes = sum.rx_bytes; | ||
191 | dev->stats.tx_packets = sum.tx_packets; | ||
192 | dev->stats.tx_bytes = sum.tx_bytes; | ||
193 | return &dev->stats; | ||
194 | } | ||
195 | |||
168 | /* Given src, dst and key, find appropriate for input tunnel. */ | 196 | /* Given src, dst and key, find appropriate for input tunnel. */ |
169 | 197 | ||
170 | static struct ip_tunnel * ipgre_tunnel_lookup(struct net_device *dev, | 198 | static struct ip_tunnel * ipgre_tunnel_lookup(struct net_device *dev, |
@@ -173,8 +201,8 @@ static struct ip_tunnel * ipgre_tunnel_lookup(struct net_device *dev, | |||
173 | { | 201 | { |
174 | struct net *net = dev_net(dev); | 202 | struct net *net = dev_net(dev); |
175 | int link = dev->ifindex; | 203 | int link = dev->ifindex; |
176 | unsigned h0 = HASH(remote); | 204 | unsigned int h0 = HASH(remote); |
177 | unsigned h1 = HASH(key); | 205 | unsigned int h1 = HASH(key); |
178 | struct ip_tunnel *t, *cand = NULL; | 206 | struct ip_tunnel *t, *cand = NULL; |
179 | struct ipgre_net *ign = net_generic(net, ipgre_net_id); | 207 | struct ipgre_net *ign = net_generic(net, ipgre_net_id); |
180 | int dev_type = (gre_proto == htons(ETH_P_TEB)) ? | 208 | int dev_type = (gre_proto == htons(ETH_P_TEB)) ? |
@@ -289,13 +317,13 @@ static struct ip_tunnel * ipgre_tunnel_lookup(struct net_device *dev, | |||
289 | return NULL; | 317 | return NULL; |
290 | } | 318 | } |
291 | 319 | ||
292 | static struct ip_tunnel **__ipgre_bucket(struct ipgre_net *ign, | 320 | static struct ip_tunnel __rcu **__ipgre_bucket(struct ipgre_net *ign, |
293 | struct ip_tunnel_parm *parms) | 321 | struct ip_tunnel_parm *parms) |
294 | { | 322 | { |
295 | __be32 remote = parms->iph.daddr; | 323 | __be32 remote = parms->iph.daddr; |
296 | __be32 local = parms->iph.saddr; | 324 | __be32 local = parms->iph.saddr; |
297 | __be32 key = parms->i_key; | 325 | __be32 key = parms->i_key; |
298 | unsigned h = HASH(key); | 326 | unsigned int h = HASH(key); |
299 | int prio = 0; | 327 | int prio = 0; |
300 | 328 | ||
301 | if (local) | 329 | if (local) |
@@ -308,7 +336,7 @@ static struct ip_tunnel **__ipgre_bucket(struct ipgre_net *ign, | |||
308 | return &ign->tunnels[prio][h]; | 336 | return &ign->tunnels[prio][h]; |
309 | } | 337 | } |
310 | 338 | ||
311 | static inline struct ip_tunnel **ipgre_bucket(struct ipgre_net *ign, | 339 | static inline struct ip_tunnel __rcu **ipgre_bucket(struct ipgre_net *ign, |
312 | struct ip_tunnel *t) | 340 | struct ip_tunnel *t) |
313 | { | 341 | { |
314 | return __ipgre_bucket(ign, &t->parms); | 342 | return __ipgre_bucket(ign, &t->parms); |
@@ -316,23 +344,22 @@ static inline struct ip_tunnel **ipgre_bucket(struct ipgre_net *ign, | |||
316 | 344 | ||
317 | static void ipgre_tunnel_link(struct ipgre_net *ign, struct ip_tunnel *t) | 345 | static void ipgre_tunnel_link(struct ipgre_net *ign, struct ip_tunnel *t) |
318 | { | 346 | { |
319 | struct ip_tunnel **tp = ipgre_bucket(ign, t); | 347 | struct ip_tunnel __rcu **tp = ipgre_bucket(ign, t); |
320 | 348 | ||
321 | spin_lock_bh(&ipgre_lock); | 349 | rcu_assign_pointer(t->next, rtnl_dereference(*tp)); |
322 | t->next = *tp; | ||
323 | rcu_assign_pointer(*tp, t); | 350 | rcu_assign_pointer(*tp, t); |
324 | spin_unlock_bh(&ipgre_lock); | ||
325 | } | 351 | } |
326 | 352 | ||
327 | static void ipgre_tunnel_unlink(struct ipgre_net *ign, struct ip_tunnel *t) | 353 | static void ipgre_tunnel_unlink(struct ipgre_net *ign, struct ip_tunnel *t) |
328 | { | 354 | { |
329 | struct ip_tunnel **tp; | 355 | struct ip_tunnel __rcu **tp; |
330 | 356 | struct ip_tunnel *iter; | |
331 | for (tp = ipgre_bucket(ign, t); *tp; tp = &(*tp)->next) { | 357 | |
332 | if (t == *tp) { | 358 | for (tp = ipgre_bucket(ign, t); |
333 | spin_lock_bh(&ipgre_lock); | 359 | (iter = rtnl_dereference(*tp)) != NULL; |
334 | *tp = t->next; | 360 | tp = &iter->next) { |
335 | spin_unlock_bh(&ipgre_lock); | 361 | if (t == iter) { |
362 | rcu_assign_pointer(*tp, t->next); | ||
336 | break; | 363 | break; |
337 | } | 364 | } |
338 | } | 365 | } |
@@ -346,10 +373,13 @@ static struct ip_tunnel *ipgre_tunnel_find(struct net *net, | |||
346 | __be32 local = parms->iph.saddr; | 373 | __be32 local = parms->iph.saddr; |
347 | __be32 key = parms->i_key; | 374 | __be32 key = parms->i_key; |
348 | int link = parms->link; | 375 | int link = parms->link; |
349 | struct ip_tunnel *t, **tp; | 376 | struct ip_tunnel *t; |
377 | struct ip_tunnel __rcu **tp; | ||
350 | struct ipgre_net *ign = net_generic(net, ipgre_net_id); | 378 | struct ipgre_net *ign = net_generic(net, ipgre_net_id); |
351 | 379 | ||
352 | for (tp = __ipgre_bucket(ign, parms); (t = *tp) != NULL; tp = &t->next) | 380 | for (tp = __ipgre_bucket(ign, parms); |
381 | (t = rtnl_dereference(*tp)) != NULL; | ||
382 | tp = &t->next) | ||
353 | if (local == t->parms.iph.saddr && | 383 | if (local == t->parms.iph.saddr && |
354 | remote == t->parms.iph.daddr && | 384 | remote == t->parms.iph.daddr && |
355 | key == t->parms.i_key && | 385 | key == t->parms.i_key && |
@@ -360,7 +390,7 @@ static struct ip_tunnel *ipgre_tunnel_find(struct net *net, | |||
360 | return t; | 390 | return t; |
361 | } | 391 | } |
362 | 392 | ||
363 | static struct ip_tunnel * ipgre_tunnel_locate(struct net *net, | 393 | static struct ip_tunnel *ipgre_tunnel_locate(struct net *net, |
364 | struct ip_tunnel_parm *parms, int create) | 394 | struct ip_tunnel_parm *parms, int create) |
365 | { | 395 | { |
366 | struct ip_tunnel *t, *nt; | 396 | struct ip_tunnel *t, *nt; |
@@ -582,7 +612,7 @@ static int ipgre_rcv(struct sk_buff *skb) | |||
582 | if ((tunnel = ipgre_tunnel_lookup(skb->dev, | 612 | if ((tunnel = ipgre_tunnel_lookup(skb->dev, |
583 | iph->saddr, iph->daddr, key, | 613 | iph->saddr, iph->daddr, key, |
584 | gre_proto))) { | 614 | gre_proto))) { |
585 | struct net_device_stats *stats = &tunnel->dev->stats; | 615 | struct pcpu_tstats *tstats; |
586 | 616 | ||
587 | secpath_reset(skb); | 617 | secpath_reset(skb); |
588 | 618 | ||
@@ -606,22 +636,22 @@ static int ipgre_rcv(struct sk_buff *skb) | |||
606 | /* Looped back packet, drop it! */ | 636 | /* Looped back packet, drop it! */ |
607 | if (skb_rtable(skb)->fl.iif == 0) | 637 | if (skb_rtable(skb)->fl.iif == 0) |
608 | goto drop; | 638 | goto drop; |
609 | stats->multicast++; | 639 | tunnel->dev->stats.multicast++; |
610 | skb->pkt_type = PACKET_BROADCAST; | 640 | skb->pkt_type = PACKET_BROADCAST; |
611 | } | 641 | } |
612 | #endif | 642 | #endif |
613 | 643 | ||
614 | if (((flags&GRE_CSUM) && csum) || | 644 | if (((flags&GRE_CSUM) && csum) || |
615 | (!(flags&GRE_CSUM) && tunnel->parms.i_flags&GRE_CSUM)) { | 645 | (!(flags&GRE_CSUM) && tunnel->parms.i_flags&GRE_CSUM)) { |
616 | stats->rx_crc_errors++; | 646 | tunnel->dev->stats.rx_crc_errors++; |
617 | stats->rx_errors++; | 647 | tunnel->dev->stats.rx_errors++; |
618 | goto drop; | 648 | goto drop; |
619 | } | 649 | } |
620 | if (tunnel->parms.i_flags&GRE_SEQ) { | 650 | if (tunnel->parms.i_flags&GRE_SEQ) { |
621 | if (!(flags&GRE_SEQ) || | 651 | if (!(flags&GRE_SEQ) || |
622 | (tunnel->i_seqno && (s32)(seqno - tunnel->i_seqno) < 0)) { | 652 | (tunnel->i_seqno && (s32)(seqno - tunnel->i_seqno) < 0)) { |
623 | stats->rx_fifo_errors++; | 653 | tunnel->dev->stats.rx_fifo_errors++; |
624 | stats->rx_errors++; | 654 | tunnel->dev->stats.rx_errors++; |
625 | goto drop; | 655 | goto drop; |
626 | } | 656 | } |
627 | tunnel->i_seqno = seqno + 1; | 657 | tunnel->i_seqno = seqno + 1; |
@@ -630,8 +660,8 @@ static int ipgre_rcv(struct sk_buff *skb) | |||
630 | /* Warning: All skb pointers will be invalidated! */ | 660 | /* Warning: All skb pointers will be invalidated! */ |
631 | if (tunnel->dev->type == ARPHRD_ETHER) { | 661 | if (tunnel->dev->type == ARPHRD_ETHER) { |
632 | if (!pskb_may_pull(skb, ETH_HLEN)) { | 662 | if (!pskb_may_pull(skb, ETH_HLEN)) { |
633 | stats->rx_length_errors++; | 663 | tunnel->dev->stats.rx_length_errors++; |
634 | stats->rx_errors++; | 664 | tunnel->dev->stats.rx_errors++; |
635 | goto drop; | 665 | goto drop; |
636 | } | 666 | } |
637 | 667 | ||
@@ -640,14 +670,19 @@ static int ipgre_rcv(struct sk_buff *skb) | |||
640 | skb_postpull_rcsum(skb, eth_hdr(skb), ETH_HLEN); | 670 | skb_postpull_rcsum(skb, eth_hdr(skb), ETH_HLEN); |
641 | } | 671 | } |
642 | 672 | ||
643 | skb_tunnel_rx(skb, tunnel->dev); | 673 | tstats = this_cpu_ptr(tunnel->dev->tstats); |
674 | tstats->rx_packets++; | ||
675 | tstats->rx_bytes += skb->len; | ||
676 | |||
677 | __skb_tunnel_rx(skb, tunnel->dev); | ||
644 | 678 | ||
645 | skb_reset_network_header(skb); | 679 | skb_reset_network_header(skb); |
646 | ipgre_ecn_decapsulate(iph, skb); | 680 | ipgre_ecn_decapsulate(iph, skb); |
647 | 681 | ||
648 | netif_rx(skb); | 682 | netif_rx(skb); |
683 | |||
649 | rcu_read_unlock(); | 684 | rcu_read_unlock(); |
650 | return(0); | 685 | return 0; |
651 | } | 686 | } |
652 | icmp_send(skb, ICMP_DEST_UNREACH, ICMP_PORT_UNREACH, 0); | 687 | icmp_send(skb, ICMP_DEST_UNREACH, ICMP_PORT_UNREACH, 0); |
653 | 688 | ||
@@ -655,20 +690,19 @@ drop: | |||
655 | rcu_read_unlock(); | 690 | rcu_read_unlock(); |
656 | drop_nolock: | 691 | drop_nolock: |
657 | kfree_skb(skb); | 692 | kfree_skb(skb); |
658 | return(0); | 693 | return 0; |
659 | } | 694 | } |
660 | 695 | ||
661 | static netdev_tx_t ipgre_tunnel_xmit(struct sk_buff *skb, struct net_device *dev) | 696 | static netdev_tx_t ipgre_tunnel_xmit(struct sk_buff *skb, struct net_device *dev) |
662 | { | 697 | { |
663 | struct ip_tunnel *tunnel = netdev_priv(dev); | 698 | struct ip_tunnel *tunnel = netdev_priv(dev); |
664 | struct net_device_stats *stats = &dev->stats; | 699 | struct pcpu_tstats *tstats; |
665 | struct netdev_queue *txq = netdev_get_tx_queue(dev, 0); | ||
666 | struct iphdr *old_iph = ip_hdr(skb); | 700 | struct iphdr *old_iph = ip_hdr(skb); |
667 | struct iphdr *tiph; | 701 | struct iphdr *tiph; |
668 | u8 tos; | 702 | u8 tos; |
669 | __be16 df; | 703 | __be16 df; |
670 | struct rtable *rt; /* Route to the other host */ | 704 | struct rtable *rt; /* Route to the other host */ |
671 | struct net_device *tdev; /* Device to other host */ | 705 | struct net_device *tdev; /* Device to other host */ |
672 | struct iphdr *iph; /* Our new IP header */ | 706 | struct iphdr *iph; /* Our new IP header */ |
673 | unsigned int max_headroom; /* The extra header space needed */ | 707 | unsigned int max_headroom; /* The extra header space needed */ |
674 | int gre_hlen; | 708 | int gre_hlen; |
@@ -690,7 +724,7 @@ static netdev_tx_t ipgre_tunnel_xmit(struct sk_buff *skb, struct net_device *dev | |||
690 | /* NBMA tunnel */ | 724 | /* NBMA tunnel */ |
691 | 725 | ||
692 | if (skb_dst(skb) == NULL) { | 726 | if (skb_dst(skb) == NULL) { |
693 | stats->tx_fifo_errors++; | 727 | dev->stats.tx_fifo_errors++; |
694 | goto tx_error; | 728 | goto tx_error; |
695 | } | 729 | } |
696 | 730 | ||
@@ -736,14 +770,20 @@ static netdev_tx_t ipgre_tunnel_xmit(struct sk_buff *skb, struct net_device *dev | |||
736 | } | 770 | } |
737 | 771 | ||
738 | { | 772 | { |
739 | struct flowi fl = { .oif = tunnel->parms.link, | 773 | struct flowi fl = { |
740 | .nl_u = { .ip4_u = | 774 | .oif = tunnel->parms.link, |
741 | { .daddr = dst, | 775 | .nl_u = { |
742 | .saddr = tiph->saddr, | 776 | .ip4_u = { |
743 | .tos = RT_TOS(tos) } }, | 777 | .daddr = dst, |
744 | .proto = IPPROTO_GRE }; | 778 | .saddr = tiph->saddr, |
779 | .tos = RT_TOS(tos) | ||
780 | } | ||
781 | }, | ||
782 | .proto = IPPROTO_GRE | ||
783 | } | ||
784 | ; | ||
745 | if (ip_route_output_key(dev_net(dev), &rt, &fl)) { | 785 | if (ip_route_output_key(dev_net(dev), &rt, &fl)) { |
746 | stats->tx_carrier_errors++; | 786 | dev->stats.tx_carrier_errors++; |
747 | goto tx_error; | 787 | goto tx_error; |
748 | } | 788 | } |
749 | } | 789 | } |
@@ -751,7 +791,7 @@ static netdev_tx_t ipgre_tunnel_xmit(struct sk_buff *skb, struct net_device *dev | |||
751 | 791 | ||
752 | if (tdev == dev) { | 792 | if (tdev == dev) { |
753 | ip_rt_put(rt); | 793 | ip_rt_put(rt); |
754 | stats->collisions++; | 794 | dev->stats.collisions++; |
755 | goto tx_error; | 795 | goto tx_error; |
756 | } | 796 | } |
757 | 797 | ||
@@ -814,7 +854,7 @@ static netdev_tx_t ipgre_tunnel_xmit(struct sk_buff *skb, struct net_device *dev | |||
814 | dev->needed_headroom = max_headroom; | 854 | dev->needed_headroom = max_headroom; |
815 | if (!new_skb) { | 855 | if (!new_skb) { |
816 | ip_rt_put(rt); | 856 | ip_rt_put(rt); |
817 | txq->tx_dropped++; | 857 | dev->stats.tx_dropped++; |
818 | dev_kfree_skb(skb); | 858 | dev_kfree_skb(skb); |
819 | return NETDEV_TX_OK; | 859 | return NETDEV_TX_OK; |
820 | } | 860 | } |
@@ -881,15 +921,15 @@ static netdev_tx_t ipgre_tunnel_xmit(struct sk_buff *skb, struct net_device *dev | |||
881 | } | 921 | } |
882 | 922 | ||
883 | nf_reset(skb); | 923 | nf_reset(skb); |
884 | 924 | tstats = this_cpu_ptr(dev->tstats); | |
885 | IPTUNNEL_XMIT(); | 925 | __IPTUNNEL_XMIT(tstats, &dev->stats); |
886 | return NETDEV_TX_OK; | 926 | return NETDEV_TX_OK; |
887 | 927 | ||
888 | tx_error_icmp: | 928 | tx_error_icmp: |
889 | dst_link_failure(skb); | 929 | dst_link_failure(skb); |
890 | 930 | ||
891 | tx_error: | 931 | tx_error: |
892 | stats->tx_errors++; | 932 | dev->stats.tx_errors++; |
893 | dev_kfree_skb(skb); | 933 | dev_kfree_skb(skb); |
894 | return NETDEV_TX_OK; | 934 | return NETDEV_TX_OK; |
895 | } | 935 | } |
@@ -909,13 +949,19 @@ static int ipgre_tunnel_bind_dev(struct net_device *dev) | |||
909 | /* Guess output device to choose reasonable mtu and needed_headroom */ | 949 | /* Guess output device to choose reasonable mtu and needed_headroom */ |
910 | 950 | ||
911 | if (iph->daddr) { | 951 | if (iph->daddr) { |
912 | struct flowi fl = { .oif = tunnel->parms.link, | 952 | struct flowi fl = { |
913 | .nl_u = { .ip4_u = | 953 | .oif = tunnel->parms.link, |
914 | { .daddr = iph->daddr, | 954 | .nl_u = { |
915 | .saddr = iph->saddr, | 955 | .ip4_u = { |
916 | .tos = RT_TOS(iph->tos) } }, | 956 | .daddr = iph->daddr, |
917 | .proto = IPPROTO_GRE }; | 957 | .saddr = iph->saddr, |
958 | .tos = RT_TOS(iph->tos) | ||
959 | } | ||
960 | }, | ||
961 | .proto = IPPROTO_GRE | ||
962 | }; | ||
918 | struct rtable *rt; | 963 | struct rtable *rt; |
964 | |||
919 | if (!ip_route_output_key(dev_net(dev), &rt, &fl)) { | 965 | if (!ip_route_output_key(dev_net(dev), &rt, &fl)) { |
920 | tdev = rt->dst.dev; | 966 | tdev = rt->dst.dev; |
921 | ip_rt_put(rt); | 967 | ip_rt_put(rt); |
@@ -1012,7 +1058,7 @@ ipgre_tunnel_ioctl (struct net_device *dev, struct ifreq *ifr, int cmd) | |||
1012 | break; | 1058 | break; |
1013 | } | 1059 | } |
1014 | } else { | 1060 | } else { |
1015 | unsigned nflags = 0; | 1061 | unsigned int nflags = 0; |
1016 | 1062 | ||
1017 | t = netdev_priv(dev); | 1063 | t = netdev_priv(dev); |
1018 | 1064 | ||
@@ -1125,7 +1171,7 @@ static int ipgre_tunnel_change_mtu(struct net_device *dev, int new_mtu) | |||
1125 | 1171 | ||
1126 | static int ipgre_header(struct sk_buff *skb, struct net_device *dev, | 1172 | static int ipgre_header(struct sk_buff *skb, struct net_device *dev, |
1127 | unsigned short type, | 1173 | unsigned short type, |
1128 | const void *daddr, const void *saddr, unsigned len) | 1174 | const void *daddr, const void *saddr, unsigned int len) |
1129 | { | 1175 | { |
1130 | struct ip_tunnel *t = netdev_priv(dev); | 1176 | struct ip_tunnel *t = netdev_priv(dev); |
1131 | struct iphdr *iph = (struct iphdr *)skb_push(skb, t->hlen); | 1177 | struct iphdr *iph = (struct iphdr *)skb_push(skb, t->hlen); |
@@ -1167,13 +1213,19 @@ static int ipgre_open(struct net_device *dev) | |||
1167 | struct ip_tunnel *t = netdev_priv(dev); | 1213 | struct ip_tunnel *t = netdev_priv(dev); |
1168 | 1214 | ||
1169 | if (ipv4_is_multicast(t->parms.iph.daddr)) { | 1215 | if (ipv4_is_multicast(t->parms.iph.daddr)) { |
1170 | struct flowi fl = { .oif = t->parms.link, | 1216 | struct flowi fl = { |
1171 | .nl_u = { .ip4_u = | 1217 | .oif = t->parms.link, |
1172 | { .daddr = t->parms.iph.daddr, | 1218 | .nl_u = { |
1173 | .saddr = t->parms.iph.saddr, | 1219 | .ip4_u = { |
1174 | .tos = RT_TOS(t->parms.iph.tos) } }, | 1220 | .daddr = t->parms.iph.daddr, |
1175 | .proto = IPPROTO_GRE }; | 1221 | .saddr = t->parms.iph.saddr, |
1222 | .tos = RT_TOS(t->parms.iph.tos) | ||
1223 | } | ||
1224 | }, | ||
1225 | .proto = IPPROTO_GRE | ||
1226 | }; | ||
1176 | struct rtable *rt; | 1227 | struct rtable *rt; |
1228 | |||
1177 | if (ip_route_output_key(dev_net(dev), &rt, &fl)) | 1229 | if (ip_route_output_key(dev_net(dev), &rt, &fl)) |
1178 | return -EADDRNOTAVAIL; | 1230 | return -EADDRNOTAVAIL; |
1179 | dev = rt->dst.dev; | 1231 | dev = rt->dst.dev; |
@@ -1193,10 +1245,8 @@ static int ipgre_close(struct net_device *dev) | |||
1193 | if (ipv4_is_multicast(t->parms.iph.daddr) && t->mlink) { | 1245 | if (ipv4_is_multicast(t->parms.iph.daddr) && t->mlink) { |
1194 | struct in_device *in_dev; | 1246 | struct in_device *in_dev; |
1195 | in_dev = inetdev_by_index(dev_net(dev), t->mlink); | 1247 | in_dev = inetdev_by_index(dev_net(dev), t->mlink); |
1196 | if (in_dev) { | 1248 | if (in_dev) |
1197 | ip_mc_dec_group(in_dev, t->parms.iph.daddr); | 1249 | ip_mc_dec_group(in_dev, t->parms.iph.daddr); |
1198 | in_dev_put(in_dev); | ||
1199 | } | ||
1200 | } | 1250 | } |
1201 | return 0; | 1251 | return 0; |
1202 | } | 1252 | } |
@@ -1213,12 +1263,19 @@ static const struct net_device_ops ipgre_netdev_ops = { | |||
1213 | .ndo_start_xmit = ipgre_tunnel_xmit, | 1263 | .ndo_start_xmit = ipgre_tunnel_xmit, |
1214 | .ndo_do_ioctl = ipgre_tunnel_ioctl, | 1264 | .ndo_do_ioctl = ipgre_tunnel_ioctl, |
1215 | .ndo_change_mtu = ipgre_tunnel_change_mtu, | 1265 | .ndo_change_mtu = ipgre_tunnel_change_mtu, |
1266 | .ndo_get_stats = ipgre_get_stats, | ||
1216 | }; | 1267 | }; |
1217 | 1268 | ||
1269 | static void ipgre_dev_free(struct net_device *dev) | ||
1270 | { | ||
1271 | free_percpu(dev->tstats); | ||
1272 | free_netdev(dev); | ||
1273 | } | ||
1274 | |||
1218 | static void ipgre_tunnel_setup(struct net_device *dev) | 1275 | static void ipgre_tunnel_setup(struct net_device *dev) |
1219 | { | 1276 | { |
1220 | dev->netdev_ops = &ipgre_netdev_ops; | 1277 | dev->netdev_ops = &ipgre_netdev_ops; |
1221 | dev->destructor = free_netdev; | 1278 | dev->destructor = ipgre_dev_free; |
1222 | 1279 | ||
1223 | dev->type = ARPHRD_IPGRE; | 1280 | dev->type = ARPHRD_IPGRE; |
1224 | dev->needed_headroom = LL_MAX_HEADER + sizeof(struct iphdr) + 4; | 1281 | dev->needed_headroom = LL_MAX_HEADER + sizeof(struct iphdr) + 4; |
@@ -1256,6 +1313,10 @@ static int ipgre_tunnel_init(struct net_device *dev) | |||
1256 | } else | 1313 | } else |
1257 | dev->header_ops = &ipgre_header_ops; | 1314 | dev->header_ops = &ipgre_header_ops; |
1258 | 1315 | ||
1316 | dev->tstats = alloc_percpu(struct pcpu_tstats); | ||
1317 | if (!dev->tstats) | ||
1318 | return -ENOMEM; | ||
1319 | |||
1259 | return 0; | 1320 | return 0; |
1260 | } | 1321 | } |
1261 | 1322 | ||
@@ -1274,14 +1335,13 @@ static void ipgre_fb_tunnel_init(struct net_device *dev) | |||
1274 | tunnel->hlen = sizeof(struct iphdr) + 4; | 1335 | tunnel->hlen = sizeof(struct iphdr) + 4; |
1275 | 1336 | ||
1276 | dev_hold(dev); | 1337 | dev_hold(dev); |
1277 | ign->tunnels_wc[0] = tunnel; | 1338 | rcu_assign_pointer(ign->tunnels_wc[0], tunnel); |
1278 | } | 1339 | } |
1279 | 1340 | ||
1280 | 1341 | ||
1281 | static const struct net_protocol ipgre_protocol = { | 1342 | static const struct gre_protocol ipgre_protocol = { |
1282 | .handler = ipgre_rcv, | 1343 | .handler = ipgre_rcv, |
1283 | .err_handler = ipgre_err, | 1344 | .err_handler = ipgre_err, |
1284 | .netns_ok = 1, | ||
1285 | }; | 1345 | }; |
1286 | 1346 | ||
1287 | static void ipgre_destroy_tunnels(struct ipgre_net *ign, struct list_head *head) | 1347 | static void ipgre_destroy_tunnels(struct ipgre_net *ign, struct list_head *head) |
@@ -1291,11 +1351,13 @@ static void ipgre_destroy_tunnels(struct ipgre_net *ign, struct list_head *head) | |||
1291 | for (prio = 0; prio < 4; prio++) { | 1351 | for (prio = 0; prio < 4; prio++) { |
1292 | int h; | 1352 | int h; |
1293 | for (h = 0; h < HASH_SIZE; h++) { | 1353 | for (h = 0; h < HASH_SIZE; h++) { |
1294 | struct ip_tunnel *t = ign->tunnels[prio][h]; | 1354 | struct ip_tunnel *t; |
1355 | |||
1356 | t = rtnl_dereference(ign->tunnels[prio][h]); | ||
1295 | 1357 | ||
1296 | while (t != NULL) { | 1358 | while (t != NULL) { |
1297 | unregister_netdevice_queue(t->dev, head); | 1359 | unregister_netdevice_queue(t->dev, head); |
1298 | t = t->next; | 1360 | t = rtnl_dereference(t->next); |
1299 | } | 1361 | } |
1300 | } | 1362 | } |
1301 | } | 1363 | } |
@@ -1441,6 +1503,10 @@ static int ipgre_tap_init(struct net_device *dev) | |||
1441 | 1503 | ||
1442 | ipgre_tunnel_bind_dev(dev); | 1504 | ipgre_tunnel_bind_dev(dev); |
1443 | 1505 | ||
1506 | dev->tstats = alloc_percpu(struct pcpu_tstats); | ||
1507 | if (!dev->tstats) | ||
1508 | return -ENOMEM; | ||
1509 | |||
1444 | return 0; | 1510 | return 0; |
1445 | } | 1511 | } |
1446 | 1512 | ||
@@ -1451,6 +1517,7 @@ static const struct net_device_ops ipgre_tap_netdev_ops = { | |||
1451 | .ndo_set_mac_address = eth_mac_addr, | 1517 | .ndo_set_mac_address = eth_mac_addr, |
1452 | .ndo_validate_addr = eth_validate_addr, | 1518 | .ndo_validate_addr = eth_validate_addr, |
1453 | .ndo_change_mtu = ipgre_tunnel_change_mtu, | 1519 | .ndo_change_mtu = ipgre_tunnel_change_mtu, |
1520 | .ndo_get_stats = ipgre_get_stats, | ||
1454 | }; | 1521 | }; |
1455 | 1522 | ||
1456 | static void ipgre_tap_setup(struct net_device *dev) | 1523 | static void ipgre_tap_setup(struct net_device *dev) |
@@ -1459,7 +1526,7 @@ static void ipgre_tap_setup(struct net_device *dev) | |||
1459 | ether_setup(dev); | 1526 | ether_setup(dev); |
1460 | 1527 | ||
1461 | dev->netdev_ops = &ipgre_tap_netdev_ops; | 1528 | dev->netdev_ops = &ipgre_tap_netdev_ops; |
1462 | dev->destructor = free_netdev; | 1529 | dev->destructor = ipgre_dev_free; |
1463 | 1530 | ||
1464 | dev->iflink = 0; | 1531 | dev->iflink = 0; |
1465 | dev->features |= NETIF_F_NETNS_LOCAL; | 1532 | dev->features |= NETIF_F_NETNS_LOCAL; |
@@ -1487,6 +1554,10 @@ static int ipgre_newlink(struct net *src_net, struct net_device *dev, struct nla | |||
1487 | if (!tb[IFLA_MTU]) | 1554 | if (!tb[IFLA_MTU]) |
1488 | dev->mtu = mtu; | 1555 | dev->mtu = mtu; |
1489 | 1556 | ||
1557 | /* Can use a lockless transmit, unless we generate output sequences */ | ||
1558 | if (!(nt->parms.o_flags & GRE_SEQ)) | ||
1559 | dev->features |= NETIF_F_LLTX; | ||
1560 | |||
1490 | err = register_netdevice(dev); | 1561 | err = register_netdevice(dev); |
1491 | if (err) | 1562 | if (err) |
1492 | goto out; | 1563 | goto out; |
@@ -1522,7 +1593,7 @@ static int ipgre_changelink(struct net_device *dev, struct nlattr *tb[], | |||
1522 | t = nt; | 1593 | t = nt; |
1523 | 1594 | ||
1524 | if (dev->type != ARPHRD_ETHER) { | 1595 | if (dev->type != ARPHRD_ETHER) { |
1525 | unsigned nflags = 0; | 1596 | unsigned int nflags = 0; |
1526 | 1597 | ||
1527 | if (ipv4_is_multicast(p.iph.daddr)) | 1598 | if (ipv4_is_multicast(p.iph.daddr)) |
1528 | nflags = IFF_BROADCAST; | 1599 | nflags = IFF_BROADCAST; |
@@ -1663,7 +1734,7 @@ static int __init ipgre_init(void) | |||
1663 | if (err < 0) | 1734 | if (err < 0) |
1664 | return err; | 1735 | return err; |
1665 | 1736 | ||
1666 | err = inet_add_protocol(&ipgre_protocol, IPPROTO_GRE); | 1737 | err = gre_add_protocol(&ipgre_protocol, GREPROTO_CISCO); |
1667 | if (err < 0) { | 1738 | if (err < 0) { |
1668 | printk(KERN_INFO "ipgre init: can't add protocol\n"); | 1739 | printk(KERN_INFO "ipgre init: can't add protocol\n"); |
1669 | goto add_proto_failed; | 1740 | goto add_proto_failed; |
@@ -1683,7 +1754,7 @@ out: | |||
1683 | tap_ops_failed: | 1754 | tap_ops_failed: |
1684 | rtnl_link_unregister(&ipgre_link_ops); | 1755 | rtnl_link_unregister(&ipgre_link_ops); |
1685 | rtnl_link_failed: | 1756 | rtnl_link_failed: |
1686 | inet_del_protocol(&ipgre_protocol, IPPROTO_GRE); | 1757 | gre_del_protocol(&ipgre_protocol, GREPROTO_CISCO); |
1687 | add_proto_failed: | 1758 | add_proto_failed: |
1688 | unregister_pernet_device(&ipgre_net_ops); | 1759 | unregister_pernet_device(&ipgre_net_ops); |
1689 | goto out; | 1760 | goto out; |
@@ -1693,7 +1764,7 @@ static void __exit ipgre_fini(void) | |||
1693 | { | 1764 | { |
1694 | rtnl_link_unregister(&ipgre_tap_ops); | 1765 | rtnl_link_unregister(&ipgre_tap_ops); |
1695 | rtnl_link_unregister(&ipgre_link_ops); | 1766 | rtnl_link_unregister(&ipgre_link_ops); |
1696 | if (inet_del_protocol(&ipgre_protocol, IPPROTO_GRE) < 0) | 1767 | if (gre_del_protocol(&ipgre_protocol, GREPROTO_CISCO) < 0) |
1697 | printk(KERN_INFO "ipgre close: can't remove protocol\n"); | 1768 | printk(KERN_INFO "ipgre close: can't remove protocol\n"); |
1698 | unregister_pernet_device(&ipgre_net_ops); | 1769 | unregister_pernet_device(&ipgre_net_ops); |
1699 | } | 1770 | } |