about | summary | refs | log | tree | commit | diff | stats
path: root/net/ipv4
diff options
context:
space:
mode:
author: David S. Miller <davem@davemloft.net> 2010-12-13 15:52:14 -0500
committer: David S. Miller <davem@davemloft.net> 2010-12-13 15:52:14 -0500
commit: 0dbaee3b37e118a96bb7b8eb0d9bbaeeb46264be (patch)
tree: 37000c5d7e663e4ae9800a7bcde9934984b8bae9 /net/ipv4
parent: cc6f02dd490dac4ad821d5077b934c9b37037cd0 (diff)
net: Abstract default ADVMSS behind an accessor.
Make all RTAX_ADVMSS metric accesses go through a new helper function, dst_metric_advmss().

Leave the actual default metric as "zero" in the real metric slot, and compute the actual default value dynamically via a new dst_ops AF-specific callback.

For stacked IPsec routes, we use the advmss of the path, which preserves existing behavior.

Unlike ipv4/ipv6, DECnet ties the advmss to the mtu and thus updates advmss on pmtu updates. This inconsistency in advmss handling results in more raw metric accesses than I wish we ended up with.

Signed-off-by: David S. Miller <davem@davemloft.net>
Diffstat (limited to 'net/ipv4')
-rw-r--r-- net/ipv4/route.c 24
-rw-r--r-- net/ipv4/tcp_ipv4.c 2
-rw-r--r-- net/ipv4/tcp_output.c 14
3 files changed, 27 insertions, 13 deletions
diff --git a/net/ipv4/route.c b/net/ipv4/route.c
index 770f70427f0b..80997333db0c 100644
--- a/net/ipv4/route.c
+++ b/net/ipv4/route.c
@@ -139,6 +139,7 @@ static unsigned long expires_ljiffies;
139 */ 139 */
140 140
141static struct dst_entry *ipv4_dst_check(struct dst_entry *dst, u32 cookie); 141static struct dst_entry *ipv4_dst_check(struct dst_entry *dst, u32 cookie);
142static unsigned int ipv4_default_advmss(const struct dst_entry *dst);
142static void ipv4_dst_destroy(struct dst_entry *dst); 143static void ipv4_dst_destroy(struct dst_entry *dst);
143static struct dst_entry *ipv4_negative_advice(struct dst_entry *dst); 144static struct dst_entry *ipv4_negative_advice(struct dst_entry *dst);
144static void ipv4_link_failure(struct sk_buff *skb); 145static void ipv4_link_failure(struct sk_buff *skb);
@@ -155,6 +156,7 @@ static struct dst_ops ipv4_dst_ops = {
155 .protocol = cpu_to_be16(ETH_P_IP), 156 .protocol = cpu_to_be16(ETH_P_IP),
156 .gc = rt_garbage_collect, 157 .gc = rt_garbage_collect,
157 .check = ipv4_dst_check, 158 .check = ipv4_dst_check,
159 .default_advmss = ipv4_default_advmss,
158 .destroy = ipv4_dst_destroy, 160 .destroy = ipv4_dst_destroy,
159 .ifdown = ipv4_dst_ifdown, 161 .ifdown = ipv4_dst_ifdown,
160 .negative_advice = ipv4_negative_advice, 162 .negative_advice = ipv4_negative_advice,
@@ -383,8 +385,7 @@ static int rt_cache_seq_show(struct seq_file *seq, void *v)
383 (__force u32)r->rt_gateway, 385 (__force u32)r->rt_gateway,
384 r->rt_flags, atomic_read(&r->dst.__refcnt), 386 r->rt_flags, atomic_read(&r->dst.__refcnt),
385 r->dst.__use, 0, (__force u32)r->rt_src, 387 r->dst.__use, 0, (__force u32)r->rt_src,
386 (dst_metric(&r->dst, RTAX_ADVMSS) ? 388 dst_metric_advmss(&r->dst) + 40,
387 (int)dst_metric(&r->dst, RTAX_ADVMSS) + 40 : 0),
388 dst_metric(&r->dst, RTAX_WINDOW), 389 dst_metric(&r->dst, RTAX_WINDOW),
389 (int)((dst_metric(&r->dst, RTAX_RTT) >> 3) + 390 (int)((dst_metric(&r->dst, RTAX_RTT) >> 3) +
390 dst_metric(&r->dst, RTAX_RTTVAR)), 391 dst_metric(&r->dst, RTAX_RTTVAR)),
@@ -1798,6 +1799,19 @@ static void set_class_tag(struct rtable *rt, u32 tag)
1798} 1799}
1799#endif 1800#endif
1800 1801
1802static unsigned int ipv4_default_advmss(const struct dst_entry *dst)
1803{
1804 unsigned int advmss = dst_metric_raw(dst, RTAX_ADVMSS);
1805
1806 if (advmss == 0) {
1807 advmss = max_t(unsigned int, dst->dev->mtu - 40,
1808 ip_rt_min_advmss);
1809 if (advmss > 65535 - 40)
1810 advmss = 65535 - 40;
1811 }
1812 return advmss;
1813}
1814
1801static void rt_set_nexthop(struct rtable *rt, struct fib_result *res, u32 itag) 1815static void rt_set_nexthop(struct rtable *rt, struct fib_result *res, u32 itag)
1802{ 1816{
1803 struct dst_entry *dst = &rt->dst; 1817 struct dst_entry *dst = &rt->dst;
@@ -1823,11 +1837,7 @@ static void rt_set_nexthop(struct rtable *rt, struct fib_result *res, u32 itag)
1823 1837
1824 if (dst_mtu(dst) > IP_MAX_MTU) 1838 if (dst_mtu(dst) > IP_MAX_MTU)
1825 dst_metric_set(dst, RTAX_MTU, IP_MAX_MTU); 1839 dst_metric_set(dst, RTAX_MTU, IP_MAX_MTU);
1826 if (dst_metric(dst, RTAX_ADVMSS) == 0) 1840 if (dst_metric_raw(dst, RTAX_ADVMSS) > 65535 - 40)
1827 dst_metric_set(dst, RTAX_ADVMSS,
1828 max_t(unsigned int, dst->dev->mtu - 40,
1829 ip_rt_min_advmss));
1830 if (dst_metric(dst, RTAX_ADVMSS) > 65535 - 40)
1831 dst_metric_set(dst, RTAX_ADVMSS, 65535 - 40); 1841 dst_metric_set(dst, RTAX_ADVMSS, 65535 - 40);
1832 1842
1833#ifdef CONFIG_NET_CLS_ROUTE 1843#ifdef CONFIG_NET_CLS_ROUTE
diff --git a/net/ipv4/tcp_ipv4.c b/net/ipv4/tcp_ipv4.c
index 4fc3387aa994..f4011027543d 100644
--- a/net/ipv4/tcp_ipv4.c
+++ b/net/ipv4/tcp_ipv4.c
@@ -1436,7 +1436,7 @@ struct sock *tcp_v4_syn_recv_sock(struct sock *sk, struct sk_buff *skb,
1436 1436
1437 tcp_mtup_init(newsk); 1437 tcp_mtup_init(newsk);
1438 tcp_sync_mss(newsk, dst_mtu(dst)); 1438 tcp_sync_mss(newsk, dst_mtu(dst));
1439 newtp->advmss = dst_metric(dst, RTAX_ADVMSS); 1439 newtp->advmss = dst_metric_advmss(dst);
1440 if (tcp_sk(sk)->rx_opt.user_mss && 1440 if (tcp_sk(sk)->rx_opt.user_mss &&
1441 tcp_sk(sk)->rx_opt.user_mss < newtp->advmss) 1441 tcp_sk(sk)->rx_opt.user_mss < newtp->advmss)
1442 newtp->advmss = tcp_sk(sk)->rx_opt.user_mss; 1442 newtp->advmss = tcp_sk(sk)->rx_opt.user_mss;
diff --git a/net/ipv4/tcp_output.c b/net/ipv4/tcp_output.c
index 97041f24cd27..2d390669d406 100644
--- a/net/ipv4/tcp_output.c
+++ b/net/ipv4/tcp_output.c
@@ -119,9 +119,13 @@ static __u16 tcp_advertise_mss(struct sock *sk)
119 struct dst_entry *dst = __sk_dst_get(sk); 119 struct dst_entry *dst = __sk_dst_get(sk);
120 int mss = tp->advmss; 120 int mss = tp->advmss;
121 121
122 if (dst && dst_metric(dst, RTAX_ADVMSS) < mss) { 122 if (dst) {
123 mss = dst_metric(dst, RTAX_ADVMSS); 123 unsigned int metric = dst_metric_advmss(dst);
124 tp->advmss = mss; 124
125 if (metric < mss) {
126 mss = metric;
127 tp->advmss = mss;
128 }
125 } 129 }
126 130
127 return (__u16)mss; 131 return (__u16)mss;
@@ -2422,7 +2426,7 @@ struct sk_buff *tcp_make_synack(struct sock *sk, struct dst_entry *dst,
2422 2426
2423 skb_dst_set(skb, dst_clone(dst)); 2427 skb_dst_set(skb, dst_clone(dst));
2424 2428
2425 mss = dst_metric(dst, RTAX_ADVMSS); 2429 mss = dst_metric_advmss(dst);
2426 if (tp->rx_opt.user_mss && tp->rx_opt.user_mss < mss) 2430 if (tp->rx_opt.user_mss && tp->rx_opt.user_mss < mss)
2427 mss = tp->rx_opt.user_mss; 2431 mss = tp->rx_opt.user_mss;
2428 2432
@@ -2556,7 +2560,7 @@ static void tcp_connect_init(struct sock *sk)
2556 2560
2557 if (!tp->window_clamp) 2561 if (!tp->window_clamp)
2558 tp->window_clamp = dst_metric(dst, RTAX_WINDOW); 2562 tp->window_clamp = dst_metric(dst, RTAX_WINDOW);
2559 tp->advmss = dst_metric(dst, RTAX_ADVMSS); 2563 tp->advmss = dst_metric_advmss(dst);
2560 if (tp->rx_opt.user_mss && tp->rx_opt.user_mss < tp->advmss) 2564 if (tp->rx_opt.user_mss && tp->rx_opt.user_mss < tp->advmss)
2561 tp->advmss = tp->rx_opt.user_mss; 2565 tp->advmss = tp->rx_opt.user_mss;
2562 2566