diff options
author | Ka-Cheong Poon <ka-cheong.poon@oracle.com> | 2018-07-23 23:51:22 -0400 |
---|---|---|
committer | David S. Miller <davem@davemloft.net> | 2018-07-24 00:17:44 -0400 |
commit | 1e2b44e78eead7bcadfbf96f70d95773191541c9 (patch) | |
tree | e7944339dd957ae23cfd690cb0ad6962d98c053c /net/rds/tcp_connect.c | |
parent | eee2fa6ab3225192d6d894c54a6fb02ac9efdff6 (diff) |
rds: Enable RDS IPv6 support
This patch enables RDS to use IPv6 addresses. For RDS/TCP, the
listener is now an IPv6 endpoint which accepts both IPv4 and IPv6
connection requests. RDS/RDMA/IB uses a private data (struct
rds_ib_connect_private) exchange between endpoints at RDS connection
establishment time to support RDMA. This private data exchange uses a
32 bit integer to represent an IP address. This needs to be changed in
order to support IPv6. A new private data struct
rds6_ib_connect_private is introduced to handle this. To ensure
backward compatibility, an IPv6 capable RDS stack uses another RDMA
listener port (RDS_CM_PORT) to accept IPv6 connection. And it
continues to use the original RDS_PORT for IPv4 RDS connections. When
it needs to communicate with an IPv6 peer, it uses the RDS_CM_PORT to
send the connection set up request.
v5: Fixed syntax problem (David Miller).
v4: Changed port history comments in rds.h (Sowmini Varadhan).
v3: Added support to set up IPv4 connection using mapped address
(David Miller).
Added support to set up connection between link local and non-link
addresses.
Various review comments from Santosh Shilimkar and Sowmini Varadhan.
v2: Fixed bound and peer address scope mismatched issue.
Added back rds_connect() IPv6 changes.
Signed-off-by: Ka-Cheong Poon <ka-cheong.poon@oracle.com>
Acked-by: Santosh Shilimkar <santosh.shilimkar@oracle.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
Diffstat (limited to 'net/rds/tcp_connect.c')
-rw-r--r-- | net/rds/tcp_connect.c | 54 |
1 files changed, 42 insertions, 12 deletions
diff --git a/net/rds/tcp_connect.c b/net/rds/tcp_connect.c index 231ae927858e..008f50fb25dd 100644 --- a/net/rds/tcp_connect.c +++ b/net/rds/tcp_connect.c | |||
@@ -89,9 +89,11 @@ out: | |||
89 | int rds_tcp_conn_path_connect(struct rds_conn_path *cp) | 89 | int rds_tcp_conn_path_connect(struct rds_conn_path *cp) |
90 | { | 90 | { |
91 | struct socket *sock = NULL; | 91 | struct socket *sock = NULL; |
92 | struct sockaddr_in6 sin6; | ||
92 | struct sockaddr_in sin; | 93 | struct sockaddr_in sin; |
93 | struct sockaddr *addr; | 94 | struct sockaddr *addr; |
94 | int addrlen; | 95 | int addrlen; |
96 | bool isv6; | ||
95 | int ret; | 97 | int ret; |
96 | struct rds_connection *conn = cp->cp_conn; | 98 | struct rds_connection *conn = cp->cp_conn; |
97 | struct rds_tcp_connection *tc = cp->cp_transport_data; | 99 | struct rds_tcp_connection *tc = cp->cp_transport_data; |
@@ -108,18 +110,36 @@ int rds_tcp_conn_path_connect(struct rds_conn_path *cp) | |||
108 | mutex_unlock(&tc->t_conn_path_lock); | 110 | mutex_unlock(&tc->t_conn_path_lock); |
109 | return 0; | 111 | return 0; |
110 | } | 112 | } |
111 | ret = sock_create_kern(rds_conn_net(conn), PF_INET, | 113 | if (ipv6_addr_v4mapped(&conn->c_laddr)) { |
112 | SOCK_STREAM, IPPROTO_TCP, &sock); | 114 | ret = sock_create_kern(rds_conn_net(conn), PF_INET, |
115 | SOCK_STREAM, IPPROTO_TCP, &sock); | ||
116 | isv6 = false; | ||
117 | } else { | ||
118 | ret = sock_create_kern(rds_conn_net(conn), PF_INET6, | ||
119 | SOCK_STREAM, IPPROTO_TCP, &sock); | ||
120 | isv6 = true; | ||
121 | } | ||
122 | |||
113 | if (ret < 0) | 123 | if (ret < 0) |
114 | goto out; | 124 | goto out; |
115 | 125 | ||
116 | rds_tcp_tune(sock); | 126 | rds_tcp_tune(sock); |
117 | 127 | ||
118 | sin.sin_family = AF_INET; | 128 | if (isv6) { |
119 | sin.sin_addr.s_addr = conn->c_laddr.s6_addr32[3]; | 129 | sin6.sin6_family = AF_INET6; |
120 | sin.sin_port = 0; | 130 | sin6.sin6_addr = conn->c_laddr; |
121 | addr = (struct sockaddr *)&sin; | 131 | sin6.sin6_port = 0; |
122 | addrlen = sizeof(sin); | 132 | sin6.sin6_flowinfo = 0; |
133 | sin6.sin6_scope_id = conn->c_dev_if; | ||
134 | addr = (struct sockaddr *)&sin6; | ||
135 | addrlen = sizeof(sin6); | ||
136 | } else { | ||
137 | sin.sin_family = AF_INET; | ||
138 | sin.sin_addr.s_addr = conn->c_laddr.s6_addr32[3]; | ||
139 | sin.sin_port = 0; | ||
140 | addr = (struct sockaddr *)&sin; | ||
141 | addrlen = sizeof(sin); | ||
142 | } | ||
123 | 143 | ||
124 | ret = sock->ops->bind(sock, addr, addrlen); | 144 | ret = sock->ops->bind(sock, addr, addrlen); |
125 | if (ret) { | 145 | if (ret) { |
@@ -128,11 +148,21 @@ int rds_tcp_conn_path_connect(struct rds_conn_path *cp) | |||
128 | goto out; | 148 | goto out; |
129 | } | 149 | } |
130 | 150 | ||
131 | sin.sin_family = AF_INET; | 151 | if (isv6) { |
132 | sin.sin_addr.s_addr = conn->c_faddr.s6_addr32[3]; | 152 | sin6.sin6_family = AF_INET6; |
133 | sin.sin_port = htons(RDS_TCP_PORT); | 153 | sin6.sin6_addr = conn->c_faddr; |
134 | addr = (struct sockaddr *)&sin; | 154 | sin6.sin6_port = htons(RDS_TCP_PORT); |
135 | addrlen = sizeof(sin); | 155 | sin6.sin6_flowinfo = 0; |
156 | sin6.sin6_scope_id = conn->c_dev_if; | ||
157 | addr = (struct sockaddr *)&sin6; | ||
158 | addrlen = sizeof(sin6); | ||
159 | } else { | ||
160 | sin.sin_family = AF_INET; | ||
161 | sin.sin_addr.s_addr = conn->c_faddr.s6_addr32[3]; | ||
162 | sin.sin_port = htons(RDS_TCP_PORT); | ||
163 | addr = (struct sockaddr *)&sin; | ||
164 | addrlen = sizeof(sin); | ||
165 | } | ||
136 | 166 | ||
137 | /* | 167 | /* |
138 | * once we call connect() we can start getting callbacks and they | 168 | * once we call connect() we can start getting callbacks and they |