diff options
author | Eric Dumazet <eric.dumazet@gmail.com> | 2009-12-03 19:06:13 -0500 |
---|---|---|
committer | David S. Miller <davem@davemloft.net> | 2009-12-03 19:06:13 -0500 |
commit | 49d09007879ce7bee36ab453c73e97c00adce884 (patch) | |
tree | 6b6a28e0fd8befd4bad5fb1474ce4e0dea9ed6dd | |
parent | 3320eae51d6e4c65b4733bf4d87de3b833973a1f (diff) |
tcp: diag: Don't report negative values for rx queue
Both netlink and /proc/net/tcp interfaces can report transient
negative values for rx queue.
ss ->
State Recv-Q Send-Q Local Address:Port Peer Address:Port
ESTAB -6 6 127.0.0.1:45956 127.0.0.1:3333
netstat ->
tcp 4294967290 6 127.0.0.1:37784 127.0.0.1:3333 ESTABLISHED
This is because we don't lock the socket while computing
tp->rcv_nxt - tp->copied_seq,
and another CPU can update copied_seq before rcv_nxt in the RX path.
Signed-off-by: Eric Dumazet <eric.dumazet@gmail.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
-rw-r--r-- | net/ipv4/tcp_diag.c | 2 | ||||
-rw-r--r-- | net/ipv4/tcp_ipv4.c | 12 |
2 files changed, 11 insertions, 3 deletions
diff --git a/net/ipv4/tcp_diag.c b/net/ipv4/tcp_diag.c index fcbcd4ff6c5f..939edb3b8e4d 100644 --- a/net/ipv4/tcp_diag.c +++ b/net/ipv4/tcp_diag.c | |||
@@ -27,7 +27,7 @@ static void tcp_diag_get_info(struct sock *sk, struct inet_diag_msg *r, | |||
27 | r->idiag_rqueue = sk->sk_ack_backlog; | 27 | r->idiag_rqueue = sk->sk_ack_backlog; |
28 | r->idiag_wqueue = sk->sk_max_ack_backlog; | 28 | r->idiag_wqueue = sk->sk_max_ack_backlog; |
29 | } else { | 29 | } else { |
30 | r->idiag_rqueue = tp->rcv_nxt - tp->copied_seq; | 30 | r->idiag_rqueue = max_t(int, tp->rcv_nxt - tp->copied_seq, 0); |
31 | r->idiag_wqueue = tp->write_seq - tp->snd_una; | 31 | r->idiag_wqueue = tp->write_seq - tp->snd_una; |
32 | } | 32 | } |
33 | if (info != NULL) | 33 | if (info != NULL) |
diff --git a/net/ipv4/tcp_ipv4.c b/net/ipv4/tcp_ipv4.c index fee9aabd5aa1..29002ab26e0d 100644 --- a/net/ipv4/tcp_ipv4.c +++ b/net/ipv4/tcp_ipv4.c | |||
@@ -2318,6 +2318,7 @@ static void get_tcp4_sock(struct sock *sk, struct seq_file *f, int i, int *len) | |||
2318 | __be32 src = inet->inet_rcv_saddr; | 2318 | __be32 src = inet->inet_rcv_saddr; |
2319 | __u16 destp = ntohs(inet->inet_dport); | 2319 | __u16 destp = ntohs(inet->inet_dport); |
2320 | __u16 srcp = ntohs(inet->inet_sport); | 2320 | __u16 srcp = ntohs(inet->inet_sport); |
2321 | int rx_queue; | ||
2321 | 2322 | ||
2322 | if (icsk->icsk_pending == ICSK_TIME_RETRANS) { | 2323 | if (icsk->icsk_pending == ICSK_TIME_RETRANS) { |
2323 | timer_active = 1; | 2324 | timer_active = 1; |
@@ -2333,12 +2334,19 @@ static void get_tcp4_sock(struct sock *sk, struct seq_file *f, int i, int *len) | |||
2333 | timer_expires = jiffies; | 2334 | timer_expires = jiffies; |
2334 | } | 2335 | } |
2335 | 2336 | ||
2337 | if (sk->sk_state == TCP_LISTEN) | ||
2338 | rx_queue = sk->sk_ack_backlog; | ||
2339 | else | ||
2340 | /* | ||
2341 | * because we dont lock socket, we might find a transient negative value | ||
2342 | */ | ||
2343 | rx_queue = max_t(int, tp->rcv_nxt - tp->copied_seq, 0); | ||
2344 | |||
2336 | seq_printf(f, "%4d: %08X:%04X %08X:%04X %02X %08X:%08X %02X:%08lX " | 2345 | seq_printf(f, "%4d: %08X:%04X %08X:%04X %02X %08X:%08X %02X:%08lX " |
2337 | "%08X %5d %8d %lu %d %p %lu %lu %u %u %d%n", | 2346 | "%08X %5d %8d %lu %d %p %lu %lu %u %u %d%n", |
2338 | i, src, srcp, dest, destp, sk->sk_state, | 2347 | i, src, srcp, dest, destp, sk->sk_state, |
2339 | tp->write_seq - tp->snd_una, | 2348 | tp->write_seq - tp->snd_una, |
2340 | sk->sk_state == TCP_LISTEN ? sk->sk_ack_backlog : | 2349 | rx_queue, |
2341 | (tp->rcv_nxt - tp->copied_seq), | ||
2342 | timer_active, | 2350 | timer_active, |
2343 | jiffies_to_clock_t(timer_expires - jiffies), | 2351 | jiffies_to_clock_t(timer_expires - jiffies), |
2344 | icsk->icsk_retransmits, | 2352 | icsk->icsk_retransmits, |