diff options
author | Marcelo Ricardo Leitner <marcelo.leitner@gmail.com> | 2015-06-12 09:16:41 -0400 |
---|---|---|
committer | David S. Miller <davem@davemloft.net> | 2015-06-14 15:55:49 -0400 |
commit | 2d45a02d0166caf2627fe91897c6ffc3b19514c4 (patch) | |
tree | 89469e59272cf6fd8efd2878801a1e2c2d8f5fe6 | |
parent | c8d17b451aa18b07b60e771addf17a5fdd4138c7 (diff) |
sctp: fix ASCONF list handling
->auto_asconf_splist is per namespace and mangled by functions like
sctp_setsockopt_auto_asconf() which doesn't guarantee any serialization.
Also, the call to inet_sk_copy_descendant() was backuping
->auto_asconf_list through the copy but was not honoring
->do_auto_asconf, which could lead to list corruption if it was
different between both sockets.
This commit thus fixes the list handling by using ->addr_wq_lock
spinlock to protect the list. A special handling is done upon socket
creation and destruction for that. Error handlig on sctp_init_sock()
will never return an error after having initialized asconf, so
sctp_destroy_sock() can be called without addrq_wq_lock. The lock now
will be take on sctp_close_sock(), before locking the socket, so we
don't do it in inverse order compared to sctp_addr_wq_timeout_handler().
Instead of taking the lock on sctp_sock_migrate() for copying and
restoring the list values, it's preferred to avoid rewritting it by
implementing sctp_copy_descendant().
Issue was found with a test application that kept flipping sysctl
default_auto_asconf on and off, but one could trigger it by issuing
simultaneous setsockopt() calls on multiple sockets or by
creating/destroying sockets fast enough. This is only triggerable
locally.
Fixes: 9f7d653b67ae ("sctp: Add Auto-ASCONF support (core).")
Reported-by: Ji Jianwen <jiji@redhat.com>
Suggested-by: Neil Horman <nhorman@tuxdriver.com>
Suggested-by: Hannes Frederic Sowa <hannes@stressinduktion.org>
Acked-by: Hannes Frederic Sowa <hannes@stressinduktion.org>
Signed-off-by: Marcelo Ricardo Leitner <marcelo.leitner@gmail.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
-rw-r--r-- | include/net/netns/sctp.h | 1 | ||||
-rw-r--r-- | include/net/sctp/structs.h | 4 | ||||
-rw-r--r-- | net/sctp/socket.c | 43 |
3 files changed, 37 insertions, 11 deletions
diff --git a/include/net/netns/sctp.h b/include/net/netns/sctp.h index 3573a81815ad..8ba379f9e467 100644 --- a/include/net/netns/sctp.h +++ b/include/net/netns/sctp.h | |||
@@ -31,6 +31,7 @@ struct netns_sctp { | |||
31 | struct list_head addr_waitq; | 31 | struct list_head addr_waitq; |
32 | struct timer_list addr_wq_timer; | 32 | struct timer_list addr_wq_timer; |
33 | struct list_head auto_asconf_splist; | 33 | struct list_head auto_asconf_splist; |
34 | /* Lock that protects both addr_waitq and auto_asconf_splist */ | ||
34 | spinlock_t addr_wq_lock; | 35 | spinlock_t addr_wq_lock; |
35 | 36 | ||
36 | /* Lock that protects the local_addr_list writers */ | 37 | /* Lock that protects the local_addr_list writers */ |
diff --git a/include/net/sctp/structs.h b/include/net/sctp/structs.h index 2bb2fcf5b11f..495c87e367b3 100644 --- a/include/net/sctp/structs.h +++ b/include/net/sctp/structs.h | |||
@@ -223,6 +223,10 @@ struct sctp_sock { | |||
223 | atomic_t pd_mode; | 223 | atomic_t pd_mode; |
224 | /* Receive to here while partial delivery is in effect. */ | 224 | /* Receive to here while partial delivery is in effect. */ |
225 | struct sk_buff_head pd_lobby; | 225 | struct sk_buff_head pd_lobby; |
226 | |||
227 | /* These must be the last fields, as they will skipped on copies, | ||
228 | * like on accept and peeloff operations | ||
229 | */ | ||
226 | struct list_head auto_asconf_list; | 230 | struct list_head auto_asconf_list; |
227 | int do_auto_asconf; | 231 | int do_auto_asconf; |
228 | }; | 232 | }; |
diff --git a/net/sctp/socket.c b/net/sctp/socket.c index f09de7fac2e6..5f6c4e61325b 100644 --- a/net/sctp/socket.c +++ b/net/sctp/socket.c | |||
@@ -1528,8 +1528,10 @@ static void sctp_close(struct sock *sk, long timeout) | |||
1528 | 1528 | ||
1529 | /* Supposedly, no process has access to the socket, but | 1529 | /* Supposedly, no process has access to the socket, but |
1530 | * the net layers still may. | 1530 | * the net layers still may. |
1531 | * Also, sctp_destroy_sock() needs to be called with addr_wq_lock | ||
1532 | * held and that should be grabbed before socket lock. | ||
1531 | */ | 1533 | */ |
1532 | local_bh_disable(); | 1534 | spin_lock_bh(&net->sctp.addr_wq_lock); |
1533 | bh_lock_sock(sk); | 1535 | bh_lock_sock(sk); |
1534 | 1536 | ||
1535 | /* Hold the sock, since sk_common_release() will put sock_put() | 1537 | /* Hold the sock, since sk_common_release() will put sock_put() |
@@ -1539,7 +1541,7 @@ static void sctp_close(struct sock *sk, long timeout) | |||
1539 | sk_common_release(sk); | 1541 | sk_common_release(sk); |
1540 | 1542 | ||
1541 | bh_unlock_sock(sk); | 1543 | bh_unlock_sock(sk); |
1542 | local_bh_enable(); | 1544 | spin_unlock_bh(&net->sctp.addr_wq_lock); |
1543 | 1545 | ||
1544 | sock_put(sk); | 1546 | sock_put(sk); |
1545 | 1547 | ||
@@ -3580,6 +3582,7 @@ static int sctp_setsockopt_auto_asconf(struct sock *sk, char __user *optval, | |||
3580 | if ((val && sp->do_auto_asconf) || (!val && !sp->do_auto_asconf)) | 3582 | if ((val && sp->do_auto_asconf) || (!val && !sp->do_auto_asconf)) |
3581 | return 0; | 3583 | return 0; |
3582 | 3584 | ||
3585 | spin_lock_bh(&sock_net(sk)->sctp.addr_wq_lock); | ||
3583 | if (val == 0 && sp->do_auto_asconf) { | 3586 | if (val == 0 && sp->do_auto_asconf) { |
3584 | list_del(&sp->auto_asconf_list); | 3587 | list_del(&sp->auto_asconf_list); |
3585 | sp->do_auto_asconf = 0; | 3588 | sp->do_auto_asconf = 0; |
@@ -3588,6 +3591,7 @@ static int sctp_setsockopt_auto_asconf(struct sock *sk, char __user *optval, | |||
3588 | &sock_net(sk)->sctp.auto_asconf_splist); | 3591 | &sock_net(sk)->sctp.auto_asconf_splist); |
3589 | sp->do_auto_asconf = 1; | 3592 | sp->do_auto_asconf = 1; |
3590 | } | 3593 | } |
3594 | spin_unlock_bh(&sock_net(sk)->sctp.addr_wq_lock); | ||
3591 | return 0; | 3595 | return 0; |
3592 | } | 3596 | } |
3593 | 3597 | ||
@@ -4121,18 +4125,28 @@ static int sctp_init_sock(struct sock *sk) | |||
4121 | local_bh_disable(); | 4125 | local_bh_disable(); |
4122 | percpu_counter_inc(&sctp_sockets_allocated); | 4126 | percpu_counter_inc(&sctp_sockets_allocated); |
4123 | sock_prot_inuse_add(net, sk->sk_prot, 1); | 4127 | sock_prot_inuse_add(net, sk->sk_prot, 1); |
4128 | |||
4129 | /* Nothing can fail after this block, otherwise | ||
4130 | * sctp_destroy_sock() will be called without addr_wq_lock held | ||
4131 | */ | ||
4124 | if (net->sctp.default_auto_asconf) { | 4132 | if (net->sctp.default_auto_asconf) { |
4133 | spin_lock(&sock_net(sk)->sctp.addr_wq_lock); | ||
4125 | list_add_tail(&sp->auto_asconf_list, | 4134 | list_add_tail(&sp->auto_asconf_list, |
4126 | &net->sctp.auto_asconf_splist); | 4135 | &net->sctp.auto_asconf_splist); |
4127 | sp->do_auto_asconf = 1; | 4136 | sp->do_auto_asconf = 1; |
4128 | } else | 4137 | spin_unlock(&sock_net(sk)->sctp.addr_wq_lock); |
4138 | } else { | ||
4129 | sp->do_auto_asconf = 0; | 4139 | sp->do_auto_asconf = 0; |
4140 | } | ||
4141 | |||
4130 | local_bh_enable(); | 4142 | local_bh_enable(); |
4131 | 4143 | ||
4132 | return 0; | 4144 | return 0; |
4133 | } | 4145 | } |
4134 | 4146 | ||
4135 | /* Cleanup any SCTP per socket resources. */ | 4147 | /* Cleanup any SCTP per socket resources. Must be called with |
4148 | * sock_net(sk)->sctp.addr_wq_lock held if sp->do_auto_asconf is true | ||
4149 | */ | ||
4136 | static void sctp_destroy_sock(struct sock *sk) | 4150 | static void sctp_destroy_sock(struct sock *sk) |
4137 | { | 4151 | { |
4138 | struct sctp_sock *sp; | 4152 | struct sctp_sock *sp; |
@@ -7195,6 +7209,19 @@ void sctp_copy_sock(struct sock *newsk, struct sock *sk, | |||
7195 | newinet->mc_list = NULL; | 7209 | newinet->mc_list = NULL; |
7196 | } | 7210 | } |
7197 | 7211 | ||
7212 | static inline void sctp_copy_descendant(struct sock *sk_to, | ||
7213 | const struct sock *sk_from) | ||
7214 | { | ||
7215 | int ancestor_size = sizeof(struct inet_sock) + | ||
7216 | sizeof(struct sctp_sock) - | ||
7217 | offsetof(struct sctp_sock, auto_asconf_list); | ||
7218 | |||
7219 | if (sk_from->sk_family == PF_INET6) | ||
7220 | ancestor_size += sizeof(struct ipv6_pinfo); | ||
7221 | |||
7222 | __inet_sk_copy_descendant(sk_to, sk_from, ancestor_size); | ||
7223 | } | ||
7224 | |||
7198 | /* Populate the fields of the newsk from the oldsk and migrate the assoc | 7225 | /* Populate the fields of the newsk from the oldsk and migrate the assoc |
7199 | * and its messages to the newsk. | 7226 | * and its messages to the newsk. |
7200 | */ | 7227 | */ |
@@ -7209,7 +7236,6 @@ static void sctp_sock_migrate(struct sock *oldsk, struct sock *newsk, | |||
7209 | struct sk_buff *skb, *tmp; | 7236 | struct sk_buff *skb, *tmp; |
7210 | struct sctp_ulpevent *event; | 7237 | struct sctp_ulpevent *event; |
7211 | struct sctp_bind_hashbucket *head; | 7238 | struct sctp_bind_hashbucket *head; |
7212 | struct list_head tmplist; | ||
7213 | 7239 | ||
7214 | /* Migrate socket buffer sizes and all the socket level options to the | 7240 | /* Migrate socket buffer sizes and all the socket level options to the |
7215 | * new socket. | 7241 | * new socket. |
@@ -7217,12 +7243,7 @@ static void sctp_sock_migrate(struct sock *oldsk, struct sock *newsk, | |||
7217 | newsk->sk_sndbuf = oldsk->sk_sndbuf; | 7243 | newsk->sk_sndbuf = oldsk->sk_sndbuf; |
7218 | newsk->sk_rcvbuf = oldsk->sk_rcvbuf; | 7244 | newsk->sk_rcvbuf = oldsk->sk_rcvbuf; |
7219 | /* Brute force copy old sctp opt. */ | 7245 | /* Brute force copy old sctp opt. */ |
7220 | if (oldsp->do_auto_asconf) { | 7246 | sctp_copy_descendant(newsk, oldsk); |
7221 | memcpy(&tmplist, &newsp->auto_asconf_list, sizeof(tmplist)); | ||
7222 | inet_sk_copy_descendant(newsk, oldsk); | ||
7223 | memcpy(&newsp->auto_asconf_list, &tmplist, sizeof(tmplist)); | ||
7224 | } else | ||
7225 | inet_sk_copy_descendant(newsk, oldsk); | ||
7226 | 7247 | ||
7227 | /* Restore the ep value that was overwritten with the above structure | 7248 | /* Restore the ep value that was overwritten with the above structure |
7228 | * copy. | 7249 | * copy. |