diff options
author | Andrea Bastoni <bastoni@cs.unc.edu> | 2010-05-30 19:16:45 -0400 |
---|---|---|
committer | Andrea Bastoni <bastoni@cs.unc.edu> | 2010-05-30 19:16:45 -0400 |
commit | ada47b5fe13d89735805b566185f4885f5a3f750 (patch) | |
tree | 644b88f8a71896307d71438e9b3af49126ffb22b /net/rds | |
parent | 43e98717ad40a4ae64545b5ba047c7b86aa44f4f (diff) | |
parent | 3280f21d43ee541f97f8cda5792150d2dbec20d5 (diff) |
Merge branch 'wip-2.6.34' into old-private-masterarchived-private-master
Diffstat (limited to 'net/rds')
-rw-r--r-- | net/rds/af_rds.c | 17 | ||||
-rw-r--r-- | net/rds/cong.c | 3 | ||||
-rw-r--r-- | net/rds/connection.c | 7 | ||||
-rw-r--r-- | net/rds/ib.c | 5 | ||||
-rw-r--r-- | net/rds/ib.h | 2 | ||||
-rw-r--r-- | net/rds/ib_cm.c | 7 | ||||
-rw-r--r-- | net/rds/ib_rdma.c | 10 | ||||
-rw-r--r-- | net/rds/ib_recv.c | 48 | ||||
-rw-r--r-- | net/rds/ib_send.c | 4 | ||||
-rw-r--r-- | net/rds/ib_sysctl.c | 26 | ||||
-rw-r--r-- | net/rds/info.c | 1 | ||||
-rw-r--r-- | net/rds/iw.c | 5 | ||||
-rw-r--r-- | net/rds/iw.h | 2 | ||||
-rw-r--r-- | net/rds/iw_cm.c | 3 | ||||
-rw-r--r-- | net/rds/iw_rdma.c | 10 | ||||
-rw-r--r-- | net/rds/iw_recv.c | 48 | ||||
-rw-r--r-- | net/rds/iw_send.c | 7 | ||||
-rw-r--r-- | net/rds/iw_sysctl.c | 26 | ||||
-rw-r--r-- | net/rds/loop.c | 1 | ||||
-rw-r--r-- | net/rds/message.c | 4 | ||||
-rw-r--r-- | net/rds/page.c | 1 | ||||
-rw-r--r-- | net/rds/rdma.c | 37 | ||||
-rw-r--r-- | net/rds/rdma.h | 1 | ||||
-rw-r--r-- | net/rds/rdma_transport.c | 2 | ||||
-rw-r--r-- | net/rds/recv.c | 12 | ||||
-rw-r--r-- | net/rds/send.c | 28 | ||||
-rw-r--r-- | net/rds/sysctl.c | 21 | ||||
-rw-r--r-- | net/rds/tcp.c | 1 | ||||
-rw-r--r-- | net/rds/tcp_connect.c | 7 | ||||
-rw-r--r-- | net/rds/tcp_listen.c | 11 | ||||
-rw-r--r-- | net/rds/tcp_recv.c | 1 | ||||
-rw-r--r-- | net/rds/tcp_send.c | 4 | ||||
-rw-r--r-- | net/rds/threads.c | 4 |
33 files changed, 215 insertions, 151 deletions
diff --git a/net/rds/af_rds.c b/net/rds/af_rds.c index 98e05382fd3c..f81862baf4d0 100644 --- a/net/rds/af_rds.c +++ b/net/rds/af_rds.c | |||
@@ -33,6 +33,7 @@ | |||
33 | #include <linux/module.h> | 33 | #include <linux/module.h> |
34 | #include <linux/errno.h> | 34 | #include <linux/errno.h> |
35 | #include <linux/kernel.h> | 35 | #include <linux/kernel.h> |
36 | #include <linux/gfp.h> | ||
36 | #include <linux/in.h> | 37 | #include <linux/in.h> |
37 | #include <linux/poll.h> | 38 | #include <linux/poll.h> |
38 | #include <net/sock.h> | 39 | #include <net/sock.h> |
@@ -174,8 +175,8 @@ static unsigned int rds_poll(struct file *file, struct socket *sock, | |||
174 | mask |= (POLLIN | POLLRDNORM); | 175 | mask |= (POLLIN | POLLRDNORM); |
175 | spin_unlock(&rs->rs_lock); | 176 | spin_unlock(&rs->rs_lock); |
176 | } | 177 | } |
177 | if (!list_empty(&rs->rs_recv_queue) | 178 | if (!list_empty(&rs->rs_recv_queue) || |
178 | || !list_empty(&rs->rs_notify_queue)) | 179 | !list_empty(&rs->rs_notify_queue)) |
179 | mask |= (POLLIN | POLLRDNORM); | 180 | mask |= (POLLIN | POLLRDNORM); |
180 | if (rs->rs_snd_bytes < rds_sk_sndbuf(rs)) | 181 | if (rs->rs_snd_bytes < rds_sk_sndbuf(rs)) |
181 | mask |= (POLLOUT | POLLWRNORM); | 182 | mask |= (POLLOUT | POLLWRNORM); |
@@ -265,6 +266,9 @@ static int rds_setsockopt(struct socket *sock, int level, int optname, | |||
265 | case RDS_GET_MR: | 266 | case RDS_GET_MR: |
266 | ret = rds_get_mr(rs, optval, optlen); | 267 | ret = rds_get_mr(rs, optval, optlen); |
267 | break; | 268 | break; |
269 | case RDS_GET_MR_FOR_DEST: | ||
270 | ret = rds_get_mr_for_dest(rs, optval, optlen); | ||
271 | break; | ||
268 | case RDS_FREE_MR: | 272 | case RDS_FREE_MR: |
269 | ret = rds_free_mr(rs, optval, optlen); | 273 | ret = rds_free_mr(rs, optval, optlen); |
270 | break; | 274 | break; |
@@ -305,8 +309,8 @@ static int rds_getsockopt(struct socket *sock, int level, int optname, | |||
305 | if (len < sizeof(int)) | 309 | if (len < sizeof(int)) |
306 | ret = -EINVAL; | 310 | ret = -EINVAL; |
307 | else | 311 | else |
308 | if (put_user(rs->rs_recverr, (int __user *) optval) | 312 | if (put_user(rs->rs_recverr, (int __user *) optval) || |
309 | || put_user(sizeof(int), optlen)) | 313 | put_user(sizeof(int), optlen)) |
310 | ret = -EFAULT; | 314 | ret = -EFAULT; |
311 | else | 315 | else |
312 | ret = 0; | 316 | ret = 0; |
@@ -407,7 +411,8 @@ static int __rds_create(struct socket *sock, struct sock *sk, int protocol) | |||
407 | return 0; | 411 | return 0; |
408 | } | 412 | } |
409 | 413 | ||
410 | static int rds_create(struct net *net, struct socket *sock, int protocol) | 414 | static int rds_create(struct net *net, struct socket *sock, int protocol, |
415 | int kern) | ||
411 | { | 416 | { |
412 | struct sock *sk; | 417 | struct sock *sk; |
413 | 418 | ||
@@ -431,7 +436,7 @@ void rds_sock_put(struct rds_sock *rs) | |||
431 | sock_put(rds_rs_to_sk(rs)); | 436 | sock_put(rds_rs_to_sk(rs)); |
432 | } | 437 | } |
433 | 438 | ||
434 | static struct net_proto_family rds_family_ops = { | 439 | static const struct net_proto_family rds_family_ops = { |
435 | .family = AF_RDS, | 440 | .family = AF_RDS, |
436 | .create = rds_create, | 441 | .create = rds_create, |
437 | .owner = THIS_MODULE, | 442 | .owner = THIS_MODULE, |
diff --git a/net/rds/cong.c b/net/rds/cong.c index dd2711df640b..f1da27ceb064 100644 --- a/net/rds/cong.c +++ b/net/rds/cong.c | |||
@@ -30,6 +30,7 @@ | |||
30 | * SOFTWARE. | 30 | * SOFTWARE. |
31 | * | 31 | * |
32 | */ | 32 | */ |
33 | #include <linux/slab.h> | ||
33 | #include <linux/types.h> | 34 | #include <linux/types.h> |
34 | #include <linux/rbtree.h> | 35 | #include <linux/rbtree.h> |
35 | 36 | ||
@@ -218,6 +219,8 @@ void rds_cong_queue_updates(struct rds_cong_map *map) | |||
218 | spin_lock_irqsave(&rds_cong_lock, flags); | 219 | spin_lock_irqsave(&rds_cong_lock, flags); |
219 | 220 | ||
220 | list_for_each_entry(conn, &map->m_conn_list, c_map_item) { | 221 | list_for_each_entry(conn, &map->m_conn_list, c_map_item) { |
222 | if (conn->c_loopback) | ||
223 | continue; | ||
221 | if (!test_and_set_bit(0, &conn->c_map_queued)) { | 224 | if (!test_and_set_bit(0, &conn->c_map_queued)) { |
222 | rds_stats_inc(s_cong_update_queued); | 225 | rds_stats_inc(s_cong_update_queued); |
223 | queue_delayed_work(rds_wq, &conn->c_send_w, 0); | 226 | queue_delayed_work(rds_wq, &conn->c_send_w, 0); |
diff --git a/net/rds/connection.c b/net/rds/connection.c index cc8b568c0c84..7619b671ca28 100644 --- a/net/rds/connection.c +++ b/net/rds/connection.c | |||
@@ -32,6 +32,7 @@ | |||
32 | */ | 32 | */ |
33 | #include <linux/kernel.h> | 33 | #include <linux/kernel.h> |
34 | #include <linux/list.h> | 34 | #include <linux/list.h> |
35 | #include <linux/slab.h> | ||
35 | #include <net/inet_hashtables.h> | 36 | #include <net/inet_hashtables.h> |
36 | 37 | ||
37 | #include "rds.h" | 38 | #include "rds.h" |
@@ -133,10 +134,8 @@ static struct rds_connection *__rds_conn_create(__be32 laddr, __be32 faddr, | |||
133 | 134 | ||
134 | spin_lock_irqsave(&rds_conn_lock, flags); | 135 | spin_lock_irqsave(&rds_conn_lock, flags); |
135 | conn = rds_conn_lookup(head, laddr, faddr, trans); | 136 | conn = rds_conn_lookup(head, laddr, faddr, trans); |
136 | if (conn | 137 | if (conn && conn->c_loopback && conn->c_trans != &rds_loop_transport && |
137 | && conn->c_loopback | 138 | !is_outgoing) { |
138 | && conn->c_trans != &rds_loop_transport | ||
139 | && !is_outgoing) { | ||
140 | /* This is a looped back IB connection, and we're | 139 | /* This is a looped back IB connection, and we're |
141 | * called by the code handling the incoming connect. | 140 | * called by the code handling the incoming connect. |
142 | * We need a second connection object into which we | 141 | * We need a second connection object into which we |
diff --git a/net/rds/ib.c b/net/rds/ib.c index 536ebe5d3f6b..8f2d6dd7700a 100644 --- a/net/rds/ib.c +++ b/net/rds/ib.c | |||
@@ -37,6 +37,7 @@ | |||
37 | #include <linux/inetdevice.h> | 37 | #include <linux/inetdevice.h> |
38 | #include <linux/if_arp.h> | 38 | #include <linux/if_arp.h> |
39 | #include <linux/delay.h> | 39 | #include <linux/delay.h> |
40 | #include <linux/slab.h> | ||
40 | 41 | ||
41 | #include "rds.h" | 42 | #include "rds.h" |
42 | #include "ib.h" | 43 | #include "ib.h" |
@@ -182,8 +183,8 @@ static int rds_ib_conn_info_visitor(struct rds_connection *conn, | |||
182 | ic = conn->c_transport_data; | 183 | ic = conn->c_transport_data; |
183 | dev_addr = &ic->i_cm_id->route.addr.dev_addr; | 184 | dev_addr = &ic->i_cm_id->route.addr.dev_addr; |
184 | 185 | ||
185 | ib_addr_get_sgid(dev_addr, (union ib_gid *) &iinfo->src_gid); | 186 | rdma_addr_get_sgid(dev_addr, (union ib_gid *) &iinfo->src_gid); |
186 | ib_addr_get_dgid(dev_addr, (union ib_gid *) &iinfo->dst_gid); | 187 | rdma_addr_get_dgid(dev_addr, (union ib_gid *) &iinfo->dst_gid); |
187 | 188 | ||
188 | rds_ibdev = ib_get_client_data(ic->i_cm_id->device, &rds_ib_client); | 189 | rds_ibdev = ib_get_client_data(ic->i_cm_id->device, &rds_ib_client); |
189 | iinfo->max_send_wr = ic->i_send_ring.w_nr; | 190 | iinfo->max_send_wr = ic->i_send_ring.w_nr; |
diff --git a/net/rds/ib.h b/net/rds/ib.h index 1378b854cac0..64df4e79b29f 100644 --- a/net/rds/ib.h +++ b/net/rds/ib.h | |||
@@ -98,6 +98,7 @@ struct rds_ib_connection { | |||
98 | struct rds_ib_send_work *i_sends; | 98 | struct rds_ib_send_work *i_sends; |
99 | 99 | ||
100 | /* rx */ | 100 | /* rx */ |
101 | struct tasklet_struct i_recv_tasklet; | ||
101 | struct mutex i_recv_mutex; | 102 | struct mutex i_recv_mutex; |
102 | struct rds_ib_work_ring i_recv_ring; | 103 | struct rds_ib_work_ring i_recv_ring; |
103 | struct rds_ib_incoming *i_ibinc; | 104 | struct rds_ib_incoming *i_ibinc; |
@@ -303,6 +304,7 @@ void rds_ib_inc_free(struct rds_incoming *inc); | |||
303 | int rds_ib_inc_copy_to_user(struct rds_incoming *inc, struct iovec *iov, | 304 | int rds_ib_inc_copy_to_user(struct rds_incoming *inc, struct iovec *iov, |
304 | size_t size); | 305 | size_t size); |
305 | void rds_ib_recv_cq_comp_handler(struct ib_cq *cq, void *context); | 306 | void rds_ib_recv_cq_comp_handler(struct ib_cq *cq, void *context); |
307 | void rds_ib_recv_tasklet_fn(unsigned long data); | ||
306 | void rds_ib_recv_init_ring(struct rds_ib_connection *ic); | 308 | void rds_ib_recv_init_ring(struct rds_ib_connection *ic); |
307 | void rds_ib_recv_clear_ring(struct rds_ib_connection *ic); | 309 | void rds_ib_recv_clear_ring(struct rds_ib_connection *ic); |
308 | void rds_ib_recv_init_ack(struct rds_ib_connection *ic); | 310 | void rds_ib_recv_init_ack(struct rds_ib_connection *ic); |
diff --git a/net/rds/ib_cm.c b/net/rds/ib_cm.c index c2d372f13dbb..88d0856cb797 100644 --- a/net/rds/ib_cm.c +++ b/net/rds/ib_cm.c | |||
@@ -32,6 +32,7 @@ | |||
32 | */ | 32 | */ |
33 | #include <linux/kernel.h> | 33 | #include <linux/kernel.h> |
34 | #include <linux/in.h> | 34 | #include <linux/in.h> |
35 | #include <linux/slab.h> | ||
35 | #include <linux/vmalloc.h> | 36 | #include <linux/vmalloc.h> |
36 | 37 | ||
37 | #include "rds.h" | 38 | #include "rds.h" |
@@ -377,8 +378,8 @@ static u32 rds_ib_protocol_compatible(struct rdma_cm_event *event) | |||
377 | } | 378 | } |
378 | 379 | ||
379 | /* Even if len is crap *now* I still want to check it. -ASG */ | 380 | /* Even if len is crap *now* I still want to check it. -ASG */ |
380 | if (event->param.conn.private_data_len < sizeof (*dp) | 381 | if (event->param.conn.private_data_len < sizeof (*dp) || |
381 | || dp->dp_protocol_major == 0) | 382 | dp->dp_protocol_major == 0) |
382 | return RDS_PROTOCOL_3_0; | 383 | return RDS_PROTOCOL_3_0; |
383 | 384 | ||
384 | common = be16_to_cpu(dp->dp_protocol_minor_mask) & RDS_IB_SUPPORTED_PROTOCOLS; | 385 | common = be16_to_cpu(dp->dp_protocol_minor_mask) & RDS_IB_SUPPORTED_PROTOCOLS; |
@@ -694,6 +695,8 @@ int rds_ib_conn_alloc(struct rds_connection *conn, gfp_t gfp) | |||
694 | return -ENOMEM; | 695 | return -ENOMEM; |
695 | 696 | ||
696 | INIT_LIST_HEAD(&ic->ib_node); | 697 | INIT_LIST_HEAD(&ic->ib_node); |
698 | tasklet_init(&ic->i_recv_tasklet, rds_ib_recv_tasklet_fn, | ||
699 | (unsigned long) ic); | ||
697 | mutex_init(&ic->i_recv_mutex); | 700 | mutex_init(&ic->i_recv_mutex); |
698 | #ifndef KERNEL_HAS_ATOMIC64 | 701 | #ifndef KERNEL_HAS_ATOMIC64 |
699 | spin_lock_init(&ic->i_ack_lock); | 702 | spin_lock_init(&ic->i_ack_lock); |
diff --git a/net/rds/ib_rdma.c b/net/rds/ib_rdma.c index ef3ab5b7283e..059989fdb7d7 100644 --- a/net/rds/ib_rdma.c +++ b/net/rds/ib_rdma.c | |||
@@ -31,6 +31,7 @@ | |||
31 | * | 31 | * |
32 | */ | 32 | */ |
33 | #include <linux/kernel.h> | 33 | #include <linux/kernel.h> |
34 | #include <linux/slab.h> | ||
34 | 35 | ||
35 | #include "rds.h" | 36 | #include "rds.h" |
36 | #include "rdma.h" | 37 | #include "rdma.h" |
@@ -187,11 +188,8 @@ void __rds_ib_destroy_conns(struct list_head *list, spinlock_t *list_lock) | |||
187 | INIT_LIST_HEAD(list); | 188 | INIT_LIST_HEAD(list); |
188 | spin_unlock_irq(list_lock); | 189 | spin_unlock_irq(list_lock); |
189 | 190 | ||
190 | list_for_each_entry_safe(ic, _ic, &tmp_list, ib_node) { | 191 | list_for_each_entry_safe(ic, _ic, &tmp_list, ib_node) |
191 | if (ic->conn->c_passive) | ||
192 | rds_conn_destroy(ic->conn->c_passive); | ||
193 | rds_conn_destroy(ic->conn); | 192 | rds_conn_destroy(ic->conn); |
194 | } | ||
195 | } | 193 | } |
196 | 194 | ||
197 | struct rds_ib_mr_pool *rds_ib_create_mr_pool(struct rds_ib_device *rds_ibdev) | 195 | struct rds_ib_mr_pool *rds_ib_create_mr_pool(struct rds_ib_device *rds_ibdev) |
@@ -573,8 +571,8 @@ void rds_ib_free_mr(void *trans_private, int invalidate) | |||
573 | spin_unlock_irqrestore(&pool->list_lock, flags); | 571 | spin_unlock_irqrestore(&pool->list_lock, flags); |
574 | 572 | ||
575 | /* If we've pinned too many pages, request a flush */ | 573 | /* If we've pinned too many pages, request a flush */ |
576 | if (atomic_read(&pool->free_pinned) >= pool->max_free_pinned | 574 | if (atomic_read(&pool->free_pinned) >= pool->max_free_pinned || |
577 | || atomic_read(&pool->dirty_count) >= pool->max_items / 10) | 575 | atomic_read(&pool->dirty_count) >= pool->max_items / 10) |
578 | queue_work(rds_wq, &pool->flush_worker); | 576 | queue_work(rds_wq, &pool->flush_worker); |
579 | 577 | ||
580 | if (invalidate) { | 578 | if (invalidate) { |
diff --git a/net/rds/ib_recv.c b/net/rds/ib_recv.c index cd7a6cfcab03..c7dd11b835f0 100644 --- a/net/rds/ib_recv.c +++ b/net/rds/ib_recv.c | |||
@@ -31,6 +31,7 @@ | |||
31 | * | 31 | * |
32 | */ | 32 | */ |
33 | #include <linux/kernel.h> | 33 | #include <linux/kernel.h> |
34 | #include <linux/slab.h> | ||
34 | #include <linux/pci.h> | 35 | #include <linux/pci.h> |
35 | #include <linux/dma-mapping.h> | 36 | #include <linux/dma-mapping.h> |
36 | #include <rdma/rdma_cm.h> | 37 | #include <rdma/rdma_cm.h> |
@@ -143,15 +144,16 @@ static int rds_ib_recv_refill_one(struct rds_connection *conn, | |||
143 | int ret = -ENOMEM; | 144 | int ret = -ENOMEM; |
144 | 145 | ||
145 | if (recv->r_ibinc == NULL) { | 146 | if (recv->r_ibinc == NULL) { |
146 | if (atomic_read(&rds_ib_allocation) >= rds_ib_sysctl_max_recv_allocation) { | 147 | if (!atomic_add_unless(&rds_ib_allocation, 1, rds_ib_sysctl_max_recv_allocation)) { |
147 | rds_ib_stats_inc(s_ib_rx_alloc_limit); | 148 | rds_ib_stats_inc(s_ib_rx_alloc_limit); |
148 | goto out; | 149 | goto out; |
149 | } | 150 | } |
150 | recv->r_ibinc = kmem_cache_alloc(rds_ib_incoming_slab, | 151 | recv->r_ibinc = kmem_cache_alloc(rds_ib_incoming_slab, |
151 | kptr_gfp); | 152 | kptr_gfp); |
152 | if (recv->r_ibinc == NULL) | 153 | if (recv->r_ibinc == NULL) { |
154 | atomic_dec(&rds_ib_allocation); | ||
153 | goto out; | 155 | goto out; |
154 | atomic_inc(&rds_ib_allocation); | 156 | } |
155 | INIT_LIST_HEAD(&recv->r_ibinc->ii_frags); | 157 | INIT_LIST_HEAD(&recv->r_ibinc->ii_frags); |
156 | rds_inc_init(&recv->r_ibinc->ii_inc, conn, conn->c_faddr); | 158 | rds_inc_init(&recv->r_ibinc->ii_inc, conn, conn->c_faddr); |
157 | } | 159 | } |
@@ -229,8 +231,8 @@ int rds_ib_recv_refill(struct rds_connection *conn, gfp_t kptr_gfp, | |||
229 | int ret = 0; | 231 | int ret = 0; |
230 | u32 pos; | 232 | u32 pos; |
231 | 233 | ||
232 | while ((prefill || rds_conn_up(conn)) | 234 | while ((prefill || rds_conn_up(conn)) && |
233 | && rds_ib_ring_alloc(&ic->i_recv_ring, 1, &pos)) { | 235 | rds_ib_ring_alloc(&ic->i_recv_ring, 1, &pos)) { |
234 | if (pos >= ic->i_recv_ring.w_nr) { | 236 | if (pos >= ic->i_recv_ring.w_nr) { |
235 | printk(KERN_NOTICE "Argh - ring alloc returned pos=%u\n", | 237 | printk(KERN_NOTICE "Argh - ring alloc returned pos=%u\n", |
236 | pos); | 238 | pos); |
@@ -770,10 +772,10 @@ static void rds_ib_process_recv(struct rds_connection *conn, | |||
770 | hdr = &ibinc->ii_inc.i_hdr; | 772 | hdr = &ibinc->ii_inc.i_hdr; |
771 | /* We can't just use memcmp here; fragments of a | 773 | /* We can't just use memcmp here; fragments of a |
772 | * single message may carry different ACKs */ | 774 | * single message may carry different ACKs */ |
773 | if (hdr->h_sequence != ihdr->h_sequence | 775 | if (hdr->h_sequence != ihdr->h_sequence || |
774 | || hdr->h_len != ihdr->h_len | 776 | hdr->h_len != ihdr->h_len || |
775 | || hdr->h_sport != ihdr->h_sport | 777 | hdr->h_sport != ihdr->h_sport || |
776 | || hdr->h_dport != ihdr->h_dport) { | 778 | hdr->h_dport != ihdr->h_dport) { |
777 | rds_ib_conn_error(conn, | 779 | rds_ib_conn_error(conn, |
778 | "fragment header mismatch; forcing reconnect\n"); | 780 | "fragment header mismatch; forcing reconnect\n"); |
779 | return; | 781 | return; |
@@ -824,17 +826,22 @@ void rds_ib_recv_cq_comp_handler(struct ib_cq *cq, void *context) | |||
824 | { | 826 | { |
825 | struct rds_connection *conn = context; | 827 | struct rds_connection *conn = context; |
826 | struct rds_ib_connection *ic = conn->c_transport_data; | 828 | struct rds_ib_connection *ic = conn->c_transport_data; |
827 | struct ib_wc wc; | ||
828 | struct rds_ib_ack_state state = { 0, }; | ||
829 | struct rds_ib_recv_work *recv; | ||
830 | 829 | ||
831 | rdsdebug("conn %p cq %p\n", conn, cq); | 830 | rdsdebug("conn %p cq %p\n", conn, cq); |
832 | 831 | ||
833 | rds_ib_stats_inc(s_ib_rx_cq_call); | 832 | rds_ib_stats_inc(s_ib_rx_cq_call); |
834 | 833 | ||
835 | ib_req_notify_cq(cq, IB_CQ_SOLICITED); | 834 | tasklet_schedule(&ic->i_recv_tasklet); |
835 | } | ||
836 | |||
837 | static inline void rds_poll_cq(struct rds_ib_connection *ic, | ||
838 | struct rds_ib_ack_state *state) | ||
839 | { | ||
840 | struct rds_connection *conn = ic->conn; | ||
841 | struct ib_wc wc; | ||
842 | struct rds_ib_recv_work *recv; | ||
836 | 843 | ||
837 | while (ib_poll_cq(cq, 1, &wc) > 0) { | 844 | while (ib_poll_cq(ic->i_recv_cq, 1, &wc) > 0) { |
838 | rdsdebug("wc wr_id 0x%llx status %u byte_len %u imm_data %u\n", | 845 | rdsdebug("wc wr_id 0x%llx status %u byte_len %u imm_data %u\n", |
839 | (unsigned long long)wc.wr_id, wc.status, wc.byte_len, | 846 | (unsigned long long)wc.wr_id, wc.status, wc.byte_len, |
840 | be32_to_cpu(wc.ex.imm_data)); | 847 | be32_to_cpu(wc.ex.imm_data)); |
@@ -852,7 +859,7 @@ void rds_ib_recv_cq_comp_handler(struct ib_cq *cq, void *context) | |||
852 | if (rds_conn_up(conn) || rds_conn_connecting(conn)) { | 859 | if (rds_conn_up(conn) || rds_conn_connecting(conn)) { |
853 | /* We expect errors as the qp is drained during shutdown */ | 860 | /* We expect errors as the qp is drained during shutdown */ |
854 | if (wc.status == IB_WC_SUCCESS) { | 861 | if (wc.status == IB_WC_SUCCESS) { |
855 | rds_ib_process_recv(conn, recv, wc.byte_len, &state); | 862 | rds_ib_process_recv(conn, recv, wc.byte_len, state); |
856 | } else { | 863 | } else { |
857 | rds_ib_conn_error(conn, "recv completion on " | 864 | rds_ib_conn_error(conn, "recv completion on " |
858 | "%pI4 had status %u, disconnecting and " | 865 | "%pI4 had status %u, disconnecting and " |
@@ -863,6 +870,17 @@ void rds_ib_recv_cq_comp_handler(struct ib_cq *cq, void *context) | |||
863 | 870 | ||
864 | rds_ib_ring_free(&ic->i_recv_ring, 1); | 871 | rds_ib_ring_free(&ic->i_recv_ring, 1); |
865 | } | 872 | } |
873 | } | ||
874 | |||
875 | void rds_ib_recv_tasklet_fn(unsigned long data) | ||
876 | { | ||
877 | struct rds_ib_connection *ic = (struct rds_ib_connection *) data; | ||
878 | struct rds_connection *conn = ic->conn; | ||
879 | struct rds_ib_ack_state state = { 0, }; | ||
880 | |||
881 | rds_poll_cq(ic, &state); | ||
882 | ib_req_notify_cq(ic->i_recv_cq, IB_CQ_SOLICITED); | ||
883 | rds_poll_cq(ic, &state); | ||
866 | 884 | ||
867 | if (state.ack_next_valid) | 885 | if (state.ack_next_valid) |
868 | rds_ib_set_ack(ic, state.ack_next, state.ack_required); | 886 | rds_ib_set_ack(ic, state.ack_next, state.ack_required); |
diff --git a/net/rds/ib_send.c b/net/rds/ib_send.c index 23bf830db2d5..a10fab6886d1 100644 --- a/net/rds/ib_send.c +++ b/net/rds/ib_send.c | |||
@@ -252,8 +252,8 @@ void rds_ib_send_cq_comp_handler(struct ib_cq *cq, void *context) | |||
252 | 252 | ||
253 | rds_ib_ring_free(&ic->i_send_ring, completed); | 253 | rds_ib_ring_free(&ic->i_send_ring, completed); |
254 | 254 | ||
255 | if (test_and_clear_bit(RDS_LL_SEND_FULL, &conn->c_flags) | 255 | if (test_and_clear_bit(RDS_LL_SEND_FULL, &conn->c_flags) || |
256 | || test_bit(0, &conn->c_map_queued)) | 256 | test_bit(0, &conn->c_map_queued)) |
257 | queue_delayed_work(rds_wq, &conn->c_send_w, 0); | 257 | queue_delayed_work(rds_wq, &conn->c_send_w, 0); |
258 | 258 | ||
259 | /* We expect errors as the qp is drained during shutdown */ | 259 | /* We expect errors as the qp is drained during shutdown */ |
diff --git a/net/rds/ib_sysctl.c b/net/rds/ib_sysctl.c index 84b5ffcb280f..03f01cb4e0fe 100644 --- a/net/rds/ib_sysctl.c +++ b/net/rds/ib_sysctl.c | |||
@@ -67,68 +67,62 @@ unsigned int rds_ib_sysctl_flow_control = 0; | |||
67 | 67 | ||
68 | ctl_table rds_ib_sysctl_table[] = { | 68 | ctl_table rds_ib_sysctl_table[] = { |
69 | { | 69 | { |
70 | .ctl_name = CTL_UNNUMBERED, | ||
71 | .procname = "max_send_wr", | 70 | .procname = "max_send_wr", |
72 | .data = &rds_ib_sysctl_max_send_wr, | 71 | .data = &rds_ib_sysctl_max_send_wr, |
73 | .maxlen = sizeof(unsigned long), | 72 | .maxlen = sizeof(unsigned long), |
74 | .mode = 0644, | 73 | .mode = 0644, |
75 | .proc_handler = &proc_doulongvec_minmax, | 74 | .proc_handler = proc_doulongvec_minmax, |
76 | .extra1 = &rds_ib_sysctl_max_wr_min, | 75 | .extra1 = &rds_ib_sysctl_max_wr_min, |
77 | .extra2 = &rds_ib_sysctl_max_wr_max, | 76 | .extra2 = &rds_ib_sysctl_max_wr_max, |
78 | }, | 77 | }, |
79 | { | 78 | { |
80 | .ctl_name = CTL_UNNUMBERED, | ||
81 | .procname = "max_recv_wr", | 79 | .procname = "max_recv_wr", |
82 | .data = &rds_ib_sysctl_max_recv_wr, | 80 | .data = &rds_ib_sysctl_max_recv_wr, |
83 | .maxlen = sizeof(unsigned long), | 81 | .maxlen = sizeof(unsigned long), |
84 | .mode = 0644, | 82 | .mode = 0644, |
85 | .proc_handler = &proc_doulongvec_minmax, | 83 | .proc_handler = proc_doulongvec_minmax, |
86 | .extra1 = &rds_ib_sysctl_max_wr_min, | 84 | .extra1 = &rds_ib_sysctl_max_wr_min, |
87 | .extra2 = &rds_ib_sysctl_max_wr_max, | 85 | .extra2 = &rds_ib_sysctl_max_wr_max, |
88 | }, | 86 | }, |
89 | { | 87 | { |
90 | .ctl_name = CTL_UNNUMBERED, | ||
91 | .procname = "max_unsignaled_wr", | 88 | .procname = "max_unsignaled_wr", |
92 | .data = &rds_ib_sysctl_max_unsig_wrs, | 89 | .data = &rds_ib_sysctl_max_unsig_wrs, |
93 | .maxlen = sizeof(unsigned long), | 90 | .maxlen = sizeof(unsigned long), |
94 | .mode = 0644, | 91 | .mode = 0644, |
95 | .proc_handler = &proc_doulongvec_minmax, | 92 | .proc_handler = proc_doulongvec_minmax, |
96 | .extra1 = &rds_ib_sysctl_max_unsig_wr_min, | 93 | .extra1 = &rds_ib_sysctl_max_unsig_wr_min, |
97 | .extra2 = &rds_ib_sysctl_max_unsig_wr_max, | 94 | .extra2 = &rds_ib_sysctl_max_unsig_wr_max, |
98 | }, | 95 | }, |
99 | { | 96 | { |
100 | .ctl_name = CTL_UNNUMBERED, | ||
101 | .procname = "max_unsignaled_bytes", | 97 | .procname = "max_unsignaled_bytes", |
102 | .data = &rds_ib_sysctl_max_unsig_bytes, | 98 | .data = &rds_ib_sysctl_max_unsig_bytes, |
103 | .maxlen = sizeof(unsigned long), | 99 | .maxlen = sizeof(unsigned long), |
104 | .mode = 0644, | 100 | .mode = 0644, |
105 | .proc_handler = &proc_doulongvec_minmax, | 101 | .proc_handler = proc_doulongvec_minmax, |
106 | .extra1 = &rds_ib_sysctl_max_unsig_bytes_min, | 102 | .extra1 = &rds_ib_sysctl_max_unsig_bytes_min, |
107 | .extra2 = &rds_ib_sysctl_max_unsig_bytes_max, | 103 | .extra2 = &rds_ib_sysctl_max_unsig_bytes_max, |
108 | }, | 104 | }, |
109 | { | 105 | { |
110 | .ctl_name = CTL_UNNUMBERED, | ||
111 | .procname = "max_recv_allocation", | 106 | .procname = "max_recv_allocation", |
112 | .data = &rds_ib_sysctl_max_recv_allocation, | 107 | .data = &rds_ib_sysctl_max_recv_allocation, |
113 | .maxlen = sizeof(unsigned long), | 108 | .maxlen = sizeof(unsigned long), |
114 | .mode = 0644, | 109 | .mode = 0644, |
115 | .proc_handler = &proc_doulongvec_minmax, | 110 | .proc_handler = proc_doulongvec_minmax, |
116 | }, | 111 | }, |
117 | { | 112 | { |
118 | .ctl_name = CTL_UNNUMBERED, | ||
119 | .procname = "flow_control", | 113 | .procname = "flow_control", |
120 | .data = &rds_ib_sysctl_flow_control, | 114 | .data = &rds_ib_sysctl_flow_control, |
121 | .maxlen = sizeof(rds_ib_sysctl_flow_control), | 115 | .maxlen = sizeof(rds_ib_sysctl_flow_control), |
122 | .mode = 0644, | 116 | .mode = 0644, |
123 | .proc_handler = &proc_dointvec, | 117 | .proc_handler = proc_dointvec, |
124 | }, | 118 | }, |
125 | { .ctl_name = 0} | 119 | { } |
126 | }; | 120 | }; |
127 | 121 | ||
128 | static struct ctl_path rds_ib_sysctl_path[] = { | 122 | static struct ctl_path rds_ib_sysctl_path[] = { |
129 | { .procname = "net", .ctl_name = CTL_NET, }, | 123 | { .procname = "net", }, |
130 | { .procname = "rds", .ctl_name = CTL_UNNUMBERED, }, | 124 | { .procname = "rds", }, |
131 | { .procname = "ib", .ctl_name = CTL_UNNUMBERED, }, | 125 | { .procname = "ib", }, |
132 | { } | 126 | { } |
133 | }; | 127 | }; |
134 | 128 | ||
diff --git a/net/rds/info.c b/net/rds/info.c index 814a91a6f4a7..c45c4173a44d 100644 --- a/net/rds/info.c +++ b/net/rds/info.c | |||
@@ -32,6 +32,7 @@ | |||
32 | */ | 32 | */ |
33 | #include <linux/percpu.h> | 33 | #include <linux/percpu.h> |
34 | #include <linux/seq_file.h> | 34 | #include <linux/seq_file.h> |
35 | #include <linux/slab.h> | ||
35 | #include <linux/proc_fs.h> | 36 | #include <linux/proc_fs.h> |
36 | 37 | ||
37 | #include "rds.h" | 38 | #include "rds.h" |
diff --git a/net/rds/iw.c b/net/rds/iw.c index db224f7c2937..c8f3d3525cb9 100644 --- a/net/rds/iw.c +++ b/net/rds/iw.c | |||
@@ -37,6 +37,7 @@ | |||
37 | #include <linux/inetdevice.h> | 37 | #include <linux/inetdevice.h> |
38 | #include <linux/if_arp.h> | 38 | #include <linux/if_arp.h> |
39 | #include <linux/delay.h> | 39 | #include <linux/delay.h> |
40 | #include <linux/slab.h> | ||
40 | 41 | ||
41 | #include "rds.h" | 42 | #include "rds.h" |
42 | #include "iw.h" | 43 | #include "iw.h" |
@@ -184,8 +185,8 @@ static int rds_iw_conn_info_visitor(struct rds_connection *conn, | |||
184 | ic = conn->c_transport_data; | 185 | ic = conn->c_transport_data; |
185 | dev_addr = &ic->i_cm_id->route.addr.dev_addr; | 186 | dev_addr = &ic->i_cm_id->route.addr.dev_addr; |
186 | 187 | ||
187 | ib_addr_get_sgid(dev_addr, (union ib_gid *) &iinfo->src_gid); | 188 | rdma_addr_get_sgid(dev_addr, (union ib_gid *) &iinfo->src_gid); |
188 | ib_addr_get_dgid(dev_addr, (union ib_gid *) &iinfo->dst_gid); | 189 | rdma_addr_get_dgid(dev_addr, (union ib_gid *) &iinfo->dst_gid); |
189 | 190 | ||
190 | rds_iwdev = ib_get_client_data(ic->i_cm_id->device, &rds_iw_client); | 191 | rds_iwdev = ib_get_client_data(ic->i_cm_id->device, &rds_iw_client); |
191 | iinfo->max_send_wr = ic->i_send_ring.w_nr; | 192 | iinfo->max_send_wr = ic->i_send_ring.w_nr; |
diff --git a/net/rds/iw.h b/net/rds/iw.h index dd72b62bd506..eef2f0c28476 100644 --- a/net/rds/iw.h +++ b/net/rds/iw.h | |||
@@ -119,6 +119,7 @@ struct rds_iw_connection { | |||
119 | struct rds_iw_send_work *i_sends; | 119 | struct rds_iw_send_work *i_sends; |
120 | 120 | ||
121 | /* rx */ | 121 | /* rx */ |
122 | struct tasklet_struct i_recv_tasklet; | ||
122 | struct mutex i_recv_mutex; | 123 | struct mutex i_recv_mutex; |
123 | struct rds_iw_work_ring i_recv_ring; | 124 | struct rds_iw_work_ring i_recv_ring; |
124 | struct rds_iw_incoming *i_iwinc; | 125 | struct rds_iw_incoming *i_iwinc; |
@@ -330,6 +331,7 @@ void rds_iw_inc_free(struct rds_incoming *inc); | |||
330 | int rds_iw_inc_copy_to_user(struct rds_incoming *inc, struct iovec *iov, | 331 | int rds_iw_inc_copy_to_user(struct rds_incoming *inc, struct iovec *iov, |
331 | size_t size); | 332 | size_t size); |
332 | void rds_iw_recv_cq_comp_handler(struct ib_cq *cq, void *context); | 333 | void rds_iw_recv_cq_comp_handler(struct ib_cq *cq, void *context); |
334 | void rds_iw_recv_tasklet_fn(unsigned long data); | ||
333 | void rds_iw_recv_init_ring(struct rds_iw_connection *ic); | 335 | void rds_iw_recv_init_ring(struct rds_iw_connection *ic); |
334 | void rds_iw_recv_clear_ring(struct rds_iw_connection *ic); | 336 | void rds_iw_recv_clear_ring(struct rds_iw_connection *ic); |
335 | void rds_iw_recv_init_ack(struct rds_iw_connection *ic); | 337 | void rds_iw_recv_init_ack(struct rds_iw_connection *ic); |
diff --git a/net/rds/iw_cm.c b/net/rds/iw_cm.c index a416b0d492b1..3e9460f935d8 100644 --- a/net/rds/iw_cm.c +++ b/net/rds/iw_cm.c | |||
@@ -32,6 +32,7 @@ | |||
32 | */ | 32 | */ |
33 | #include <linux/kernel.h> | 33 | #include <linux/kernel.h> |
34 | #include <linux/in.h> | 34 | #include <linux/in.h> |
35 | #include <linux/slab.h> | ||
35 | #include <linux/vmalloc.h> | 36 | #include <linux/vmalloc.h> |
36 | 37 | ||
37 | #include "rds.h" | 38 | #include "rds.h" |
@@ -696,6 +697,8 @@ int rds_iw_conn_alloc(struct rds_connection *conn, gfp_t gfp) | |||
696 | return -ENOMEM; | 697 | return -ENOMEM; |
697 | 698 | ||
698 | INIT_LIST_HEAD(&ic->iw_node); | 699 | INIT_LIST_HEAD(&ic->iw_node); |
700 | tasklet_init(&ic->i_recv_tasklet, rds_iw_recv_tasklet_fn, | ||
701 | (unsigned long) ic); | ||
699 | mutex_init(&ic->i_recv_mutex); | 702 | mutex_init(&ic->i_recv_mutex); |
700 | #ifndef KERNEL_HAS_ATOMIC64 | 703 | #ifndef KERNEL_HAS_ATOMIC64 |
701 | spin_lock_init(&ic->i_ack_lock); | 704 | spin_lock_init(&ic->i_ack_lock); |
diff --git a/net/rds/iw_rdma.c b/net/rds/iw_rdma.c index de4a1b16bf7b..13dc1862d862 100644 --- a/net/rds/iw_rdma.c +++ b/net/rds/iw_rdma.c | |||
@@ -31,6 +31,7 @@ | |||
31 | * | 31 | * |
32 | */ | 32 | */ |
33 | #include <linux/kernel.h> | 33 | #include <linux/kernel.h> |
34 | #include <linux/slab.h> | ||
34 | 35 | ||
35 | #include "rds.h" | 36 | #include "rds.h" |
36 | #include "rdma.h" | 37 | #include "rdma.h" |
@@ -245,11 +246,8 @@ void __rds_iw_destroy_conns(struct list_head *list, spinlock_t *list_lock) | |||
245 | INIT_LIST_HEAD(list); | 246 | INIT_LIST_HEAD(list); |
246 | spin_unlock_irq(list_lock); | 247 | spin_unlock_irq(list_lock); |
247 | 248 | ||
248 | list_for_each_entry_safe(ic, _ic, &tmp_list, iw_node) { | 249 | list_for_each_entry_safe(ic, _ic, &tmp_list, iw_node) |
249 | if (ic->conn->c_passive) | ||
250 | rds_conn_destroy(ic->conn->c_passive); | ||
251 | rds_conn_destroy(ic->conn); | 250 | rds_conn_destroy(ic->conn); |
252 | } | ||
253 | } | 251 | } |
254 | 252 | ||
255 | static void rds_iw_set_scatterlist(struct rds_iw_scatterlist *sg, | 253 | static void rds_iw_set_scatterlist(struct rds_iw_scatterlist *sg, |
@@ -576,8 +574,8 @@ void rds_iw_free_mr(void *trans_private, int invalidate) | |||
576 | rds_iw_free_fastreg(pool, ibmr); | 574 | rds_iw_free_fastreg(pool, ibmr); |
577 | 575 | ||
578 | /* If we've pinned too many pages, request a flush */ | 576 | /* If we've pinned too many pages, request a flush */ |
579 | if (atomic_read(&pool->free_pinned) >= pool->max_free_pinned | 577 | if (atomic_read(&pool->free_pinned) >= pool->max_free_pinned || |
580 | || atomic_read(&pool->dirty_count) >= pool->max_items / 10) | 578 | atomic_read(&pool->dirty_count) >= pool->max_items / 10) |
581 | queue_work(rds_wq, &pool->flush_worker); | 579 | queue_work(rds_wq, &pool->flush_worker); |
582 | 580 | ||
583 | if (invalidate) { | 581 | if (invalidate) { |
diff --git a/net/rds/iw_recv.c b/net/rds/iw_recv.c index 8683f5f66c4b..da43ee840ca3 100644 --- a/net/rds/iw_recv.c +++ b/net/rds/iw_recv.c | |||
@@ -31,6 +31,7 @@ | |||
31 | * | 31 | * |
32 | */ | 32 | */ |
33 | #include <linux/kernel.h> | 33 | #include <linux/kernel.h> |
34 | #include <linux/slab.h> | ||
34 | #include <linux/pci.h> | 35 | #include <linux/pci.h> |
35 | #include <linux/dma-mapping.h> | 36 | #include <linux/dma-mapping.h> |
36 | #include <rdma/rdma_cm.h> | 37 | #include <rdma/rdma_cm.h> |
@@ -143,15 +144,16 @@ static int rds_iw_recv_refill_one(struct rds_connection *conn, | |||
143 | int ret = -ENOMEM; | 144 | int ret = -ENOMEM; |
144 | 145 | ||
145 | if (recv->r_iwinc == NULL) { | 146 | if (recv->r_iwinc == NULL) { |
146 | if (atomic_read(&rds_iw_allocation) >= rds_iw_sysctl_max_recv_allocation) { | 147 | if (!atomic_add_unless(&rds_iw_allocation, 1, rds_iw_sysctl_max_recv_allocation)) { |
147 | rds_iw_stats_inc(s_iw_rx_alloc_limit); | 148 | rds_iw_stats_inc(s_iw_rx_alloc_limit); |
148 | goto out; | 149 | goto out; |
149 | } | 150 | } |
150 | recv->r_iwinc = kmem_cache_alloc(rds_iw_incoming_slab, | 151 | recv->r_iwinc = kmem_cache_alloc(rds_iw_incoming_slab, |
151 | kptr_gfp); | 152 | kptr_gfp); |
152 | if (recv->r_iwinc == NULL) | 153 | if (recv->r_iwinc == NULL) { |
154 | atomic_dec(&rds_iw_allocation); | ||
153 | goto out; | 155 | goto out; |
154 | atomic_inc(&rds_iw_allocation); | 156 | } |
155 | INIT_LIST_HEAD(&recv->r_iwinc->ii_frags); | 157 | INIT_LIST_HEAD(&recv->r_iwinc->ii_frags); |
156 | rds_inc_init(&recv->r_iwinc->ii_inc, conn, conn->c_faddr); | 158 | rds_inc_init(&recv->r_iwinc->ii_inc, conn, conn->c_faddr); |
157 | } | 159 | } |
@@ -229,8 +231,8 @@ int rds_iw_recv_refill(struct rds_connection *conn, gfp_t kptr_gfp, | |||
229 | int ret = 0; | 231 | int ret = 0; |
230 | u32 pos; | 232 | u32 pos; |
231 | 233 | ||
232 | while ((prefill || rds_conn_up(conn)) | 234 | while ((prefill || rds_conn_up(conn)) && |
233 | && rds_iw_ring_alloc(&ic->i_recv_ring, 1, &pos)) { | 235 | rds_iw_ring_alloc(&ic->i_recv_ring, 1, &pos)) { |
234 | if (pos >= ic->i_recv_ring.w_nr) { | 236 | if (pos >= ic->i_recv_ring.w_nr) { |
235 | printk(KERN_NOTICE "Argh - ring alloc returned pos=%u\n", | 237 | printk(KERN_NOTICE "Argh - ring alloc returned pos=%u\n", |
236 | pos); | 238 | pos); |
@@ -729,10 +731,10 @@ static void rds_iw_process_recv(struct rds_connection *conn, | |||
729 | hdr = &iwinc->ii_inc.i_hdr; | 731 | hdr = &iwinc->ii_inc.i_hdr; |
730 | /* We can't just use memcmp here; fragments of a | 732 | /* We can't just use memcmp here; fragments of a |
731 | * single message may carry different ACKs */ | 733 | * single message may carry different ACKs */ |
732 | if (hdr->h_sequence != ihdr->h_sequence | 734 | if (hdr->h_sequence != ihdr->h_sequence || |
733 | || hdr->h_len != ihdr->h_len | 735 | hdr->h_len != ihdr->h_len || |
734 | || hdr->h_sport != ihdr->h_sport | 736 | hdr->h_sport != ihdr->h_sport || |
735 | || hdr->h_dport != ihdr->h_dport) { | 737 | hdr->h_dport != ihdr->h_dport) { |
736 | rds_iw_conn_error(conn, | 738 | rds_iw_conn_error(conn, |
737 | "fragment header mismatch; forcing reconnect\n"); | 739 | "fragment header mismatch; forcing reconnect\n"); |
738 | return; | 740 | return; |
@@ -783,17 +785,22 @@ void rds_iw_recv_cq_comp_handler(struct ib_cq *cq, void *context) | |||
783 | { | 785 | { |
784 | struct rds_connection *conn = context; | 786 | struct rds_connection *conn = context; |
785 | struct rds_iw_connection *ic = conn->c_transport_data; | 787 | struct rds_iw_connection *ic = conn->c_transport_data; |
786 | struct ib_wc wc; | ||
787 | struct rds_iw_ack_state state = { 0, }; | ||
788 | struct rds_iw_recv_work *recv; | ||
789 | 788 | ||
790 | rdsdebug("conn %p cq %p\n", conn, cq); | 789 | rdsdebug("conn %p cq %p\n", conn, cq); |
791 | 790 | ||
792 | rds_iw_stats_inc(s_iw_rx_cq_call); | 791 | rds_iw_stats_inc(s_iw_rx_cq_call); |
793 | 792 | ||
794 | ib_req_notify_cq(cq, IB_CQ_SOLICITED); | 793 | tasklet_schedule(&ic->i_recv_tasklet); |
794 | } | ||
795 | |||
796 | static inline void rds_poll_cq(struct rds_iw_connection *ic, | ||
797 | struct rds_iw_ack_state *state) | ||
798 | { | ||
799 | struct rds_connection *conn = ic->conn; | ||
800 | struct ib_wc wc; | ||
801 | struct rds_iw_recv_work *recv; | ||
795 | 802 | ||
796 | while (ib_poll_cq(cq, 1, &wc) > 0) { | 803 | while (ib_poll_cq(ic->i_recv_cq, 1, &wc) > 0) { |
797 | rdsdebug("wc wr_id 0x%llx status %u byte_len %u imm_data %u\n", | 804 | rdsdebug("wc wr_id 0x%llx status %u byte_len %u imm_data %u\n", |
798 | (unsigned long long)wc.wr_id, wc.status, wc.byte_len, | 805 | (unsigned long long)wc.wr_id, wc.status, wc.byte_len, |
799 | be32_to_cpu(wc.ex.imm_data)); | 806 | be32_to_cpu(wc.ex.imm_data)); |
@@ -811,7 +818,7 @@ void rds_iw_recv_cq_comp_handler(struct ib_cq *cq, void *context) | |||
811 | if (rds_conn_up(conn) || rds_conn_connecting(conn)) { | 818 | if (rds_conn_up(conn) || rds_conn_connecting(conn)) { |
812 | /* We expect errors as the qp is drained during shutdown */ | 819 | /* We expect errors as the qp is drained during shutdown */ |
813 | if (wc.status == IB_WC_SUCCESS) { | 820 | if (wc.status == IB_WC_SUCCESS) { |
814 | rds_iw_process_recv(conn, recv, wc.byte_len, &state); | 821 | rds_iw_process_recv(conn, recv, wc.byte_len, state); |
815 | } else { | 822 | } else { |
816 | rds_iw_conn_error(conn, "recv completion on " | 823 | rds_iw_conn_error(conn, "recv completion on " |
817 | "%pI4 had status %u, disconnecting and " | 824 | "%pI4 had status %u, disconnecting and " |
@@ -822,6 +829,17 @@ void rds_iw_recv_cq_comp_handler(struct ib_cq *cq, void *context) | |||
822 | 829 | ||
823 | rds_iw_ring_free(&ic->i_recv_ring, 1); | 830 | rds_iw_ring_free(&ic->i_recv_ring, 1); |
824 | } | 831 | } |
832 | } | ||
833 | |||
834 | void rds_iw_recv_tasklet_fn(unsigned long data) | ||
835 | { | ||
836 | struct rds_iw_connection *ic = (struct rds_iw_connection *) data; | ||
837 | struct rds_connection *conn = ic->conn; | ||
838 | struct rds_iw_ack_state state = { 0, }; | ||
839 | |||
840 | rds_poll_cq(ic, &state); | ||
841 | ib_req_notify_cq(ic->i_recv_cq, IB_CQ_SOLICITED); | ||
842 | rds_poll_cq(ic, &state); | ||
825 | 843 | ||
826 | if (state.ack_next_valid) | 844 | if (state.ack_next_valid) |
827 | rds_iw_set_ack(ic, state.ack_next, state.ack_required); | 845 | rds_iw_set_ack(ic, state.ack_next, state.ack_required); |
diff --git a/net/rds/iw_send.c b/net/rds/iw_send.c index 1f5abe3cf2b4..1379e9d66a78 100644 --- a/net/rds/iw_send.c +++ b/net/rds/iw_send.c | |||
@@ -288,8 +288,8 @@ void rds_iw_send_cq_comp_handler(struct ib_cq *cq, void *context) | |||
288 | 288 | ||
289 | rds_iw_ring_free(&ic->i_send_ring, completed); | 289 | rds_iw_ring_free(&ic->i_send_ring, completed); |
290 | 290 | ||
291 | if (test_and_clear_bit(RDS_LL_SEND_FULL, &conn->c_flags) | 291 | if (test_and_clear_bit(RDS_LL_SEND_FULL, &conn->c_flags) || |
292 | || test_bit(0, &conn->c_map_queued)) | 292 | test_bit(0, &conn->c_map_queued)) |
293 | queue_delayed_work(rds_wq, &conn->c_send_w, 0); | 293 | queue_delayed_work(rds_wq, &conn->c_send_w, 0); |
294 | 294 | ||
295 | /* We expect errors as the qp is drained during shutdown */ | 295 | /* We expect errors as the qp is drained during shutdown */ |
@@ -519,8 +519,7 @@ int rds_iw_xmit(struct rds_connection *conn, struct rds_message *rm, | |||
519 | BUG_ON(hdr_off != 0 && hdr_off != sizeof(struct rds_header)); | 519 | BUG_ON(hdr_off != 0 && hdr_off != sizeof(struct rds_header)); |
520 | 520 | ||
521 | /* Fastreg support */ | 521 | /* Fastreg support */ |
522 | if (rds_rdma_cookie_key(rm->m_rdma_cookie) | 522 | if (rds_rdma_cookie_key(rm->m_rdma_cookie) && !ic->i_fastreg_posted) { |
523 | && !ic->i_fastreg_posted) { | ||
524 | ret = -EAGAIN; | 523 | ret = -EAGAIN; |
525 | goto out; | 524 | goto out; |
526 | } | 525 | } |
diff --git a/net/rds/iw_sysctl.c b/net/rds/iw_sysctl.c index 9590678cd616..1c4428a61a02 100644 --- a/net/rds/iw_sysctl.c +++ b/net/rds/iw_sysctl.c | |||
@@ -57,68 +57,62 @@ unsigned int rds_iw_sysctl_flow_control = 1; | |||
57 | 57 | ||
58 | ctl_table rds_iw_sysctl_table[] = { | 58 | ctl_table rds_iw_sysctl_table[] = { |
59 | { | 59 | { |
60 | .ctl_name = CTL_UNNUMBERED, | ||
61 | .procname = "max_send_wr", | 60 | .procname = "max_send_wr", |
62 | .data = &rds_iw_sysctl_max_send_wr, | 61 | .data = &rds_iw_sysctl_max_send_wr, |
63 | .maxlen = sizeof(unsigned long), | 62 | .maxlen = sizeof(unsigned long), |
64 | .mode = 0644, | 63 | .mode = 0644, |
65 | .proc_handler = &proc_doulongvec_minmax, | 64 | .proc_handler = proc_doulongvec_minmax, |
66 | .extra1 = &rds_iw_sysctl_max_wr_min, | 65 | .extra1 = &rds_iw_sysctl_max_wr_min, |
67 | .extra2 = &rds_iw_sysctl_max_wr_max, | 66 | .extra2 = &rds_iw_sysctl_max_wr_max, |
68 | }, | 67 | }, |
69 | { | 68 | { |
70 | .ctl_name = CTL_UNNUMBERED, | ||
71 | .procname = "max_recv_wr", | 69 | .procname = "max_recv_wr", |
72 | .data = &rds_iw_sysctl_max_recv_wr, | 70 | .data = &rds_iw_sysctl_max_recv_wr, |
73 | .maxlen = sizeof(unsigned long), | 71 | .maxlen = sizeof(unsigned long), |
74 | .mode = 0644, | 72 | .mode = 0644, |
75 | .proc_handler = &proc_doulongvec_minmax, | 73 | .proc_handler = proc_doulongvec_minmax, |
76 | .extra1 = &rds_iw_sysctl_max_wr_min, | 74 | .extra1 = &rds_iw_sysctl_max_wr_min, |
77 | .extra2 = &rds_iw_sysctl_max_wr_max, | 75 | .extra2 = &rds_iw_sysctl_max_wr_max, |
78 | }, | 76 | }, |
79 | { | 77 | { |
80 | .ctl_name = CTL_UNNUMBERED, | ||
81 | .procname = "max_unsignaled_wr", | 78 | .procname = "max_unsignaled_wr", |
82 | .data = &rds_iw_sysctl_max_unsig_wrs, | 79 | .data = &rds_iw_sysctl_max_unsig_wrs, |
83 | .maxlen = sizeof(unsigned long), | 80 | .maxlen = sizeof(unsigned long), |
84 | .mode = 0644, | 81 | .mode = 0644, |
85 | .proc_handler = &proc_doulongvec_minmax, | 82 | .proc_handler = proc_doulongvec_minmax, |
86 | .extra1 = &rds_iw_sysctl_max_unsig_wr_min, | 83 | .extra1 = &rds_iw_sysctl_max_unsig_wr_min, |
87 | .extra2 = &rds_iw_sysctl_max_unsig_wr_max, | 84 | .extra2 = &rds_iw_sysctl_max_unsig_wr_max, |
88 | }, | 85 | }, |
89 | { | 86 | { |
90 | .ctl_name = CTL_UNNUMBERED, | ||
91 | .procname = "max_unsignaled_bytes", | 87 | .procname = "max_unsignaled_bytes", |
92 | .data = &rds_iw_sysctl_max_unsig_bytes, | 88 | .data = &rds_iw_sysctl_max_unsig_bytes, |
93 | .maxlen = sizeof(unsigned long), | 89 | .maxlen = sizeof(unsigned long), |
94 | .mode = 0644, | 90 | .mode = 0644, |
95 | .proc_handler = &proc_doulongvec_minmax, | 91 | .proc_handler = proc_doulongvec_minmax, |
96 | .extra1 = &rds_iw_sysctl_max_unsig_bytes_min, | 92 | .extra1 = &rds_iw_sysctl_max_unsig_bytes_min, |
97 | .extra2 = &rds_iw_sysctl_max_unsig_bytes_max, | 93 | .extra2 = &rds_iw_sysctl_max_unsig_bytes_max, |
98 | }, | 94 | }, |
99 | { | 95 | { |
100 | .ctl_name = CTL_UNNUMBERED, | ||
101 | .procname = "max_recv_allocation", | 96 | .procname = "max_recv_allocation", |
102 | .data = &rds_iw_sysctl_max_recv_allocation, | 97 | .data = &rds_iw_sysctl_max_recv_allocation, |
103 | .maxlen = sizeof(unsigned long), | 98 | .maxlen = sizeof(unsigned long), |
104 | .mode = 0644, | 99 | .mode = 0644, |
105 | .proc_handler = &proc_doulongvec_minmax, | 100 | .proc_handler = proc_doulongvec_minmax, |
106 | }, | 101 | }, |
107 | { | 102 | { |
108 | .ctl_name = CTL_UNNUMBERED, | ||
109 | .procname = "flow_control", | 103 | .procname = "flow_control", |
110 | .data = &rds_iw_sysctl_flow_control, | 104 | .data = &rds_iw_sysctl_flow_control, |
111 | .maxlen = sizeof(rds_iw_sysctl_flow_control), | 105 | .maxlen = sizeof(rds_iw_sysctl_flow_control), |
112 | .mode = 0644, | 106 | .mode = 0644, |
113 | .proc_handler = &proc_dointvec, | 107 | .proc_handler = proc_dointvec, |
114 | }, | 108 | }, |
115 | { .ctl_name = 0} | 109 | { } |
116 | }; | 110 | }; |
117 | 111 | ||
118 | static struct ctl_path rds_iw_sysctl_path[] = { | 112 | static struct ctl_path rds_iw_sysctl_path[] = { |
119 | { .procname = "net", .ctl_name = CTL_NET, }, | 113 | { .procname = "net", }, |
120 | { .procname = "rds", .ctl_name = CTL_UNNUMBERED, }, | 114 | { .procname = "rds", }, |
121 | { .procname = "iw", .ctl_name = CTL_UNNUMBERED, }, | 115 | { .procname = "iw", }, |
122 | { } | 116 | { } |
123 | }; | 117 | }; |
124 | 118 | ||
diff --git a/net/rds/loop.c b/net/rds/loop.c index 4a61997f554d..0d7a159158b8 100644 --- a/net/rds/loop.c +++ b/net/rds/loop.c | |||
@@ -31,6 +31,7 @@ | |||
31 | * | 31 | * |
32 | */ | 32 | */ |
33 | #include <linux/kernel.h> | 33 | #include <linux/kernel.h> |
34 | #include <linux/slab.h> | ||
34 | #include <linux/in.h> | 35 | #include <linux/in.h> |
35 | 36 | ||
36 | #include "rds.h" | 37 | #include "rds.h" |
diff --git a/net/rds/message.c b/net/rds/message.c index ca50a8ec9742..9a1d67e001ba 100644 --- a/net/rds/message.c +++ b/net/rds/message.c | |||
@@ -31,6 +31,7 @@ | |||
31 | * | 31 | * |
32 | */ | 32 | */ |
33 | #include <linux/kernel.h> | 33 | #include <linux/kernel.h> |
34 | #include <linux/slab.h> | ||
34 | 35 | ||
35 | #include "rds.h" | 36 | #include "rds.h" |
36 | #include "rdma.h" | 37 | #include "rdma.h" |
@@ -122,8 +123,7 @@ int rds_message_add_extension(struct rds_header *hdr, | |||
122 | if (hdr->h_exthdr[0] != RDS_EXTHDR_NONE) | 123 | if (hdr->h_exthdr[0] != RDS_EXTHDR_NONE) |
123 | return 0; | 124 | return 0; |
124 | 125 | ||
125 | if (type >= __RDS_EXTHDR_MAX | 126 | if (type >= __RDS_EXTHDR_MAX || len != rds_exthdr_size[type]) |
126 | || len != rds_exthdr_size[type]) | ||
127 | return 0; | 127 | return 0; |
128 | 128 | ||
129 | if (ext_len >= RDS_HEADER_EXT_SPACE) | 129 | if (ext_len >= RDS_HEADER_EXT_SPACE) |
diff --git a/net/rds/page.c b/net/rds/page.c index 36790122dfd4..595a952d4b17 100644 --- a/net/rds/page.c +++ b/net/rds/page.c | |||
@@ -31,6 +31,7 @@ | |||
31 | * | 31 | * |
32 | */ | 32 | */ |
33 | #include <linux/highmem.h> | 33 | #include <linux/highmem.h> |
34 | #include <linux/gfp.h> | ||
34 | 35 | ||
35 | #include "rds.h" | 36 | #include "rds.h" |
36 | 37 | ||
diff --git a/net/rds/rdma.c b/net/rds/rdma.c index 8dc83d2caa58..5ce9437cad67 100644 --- a/net/rds/rdma.c +++ b/net/rds/rdma.c | |||
@@ -31,6 +31,7 @@ | |||
31 | * | 31 | * |
32 | */ | 32 | */ |
33 | #include <linux/pagemap.h> | 33 | #include <linux/pagemap.h> |
34 | #include <linux/slab.h> | ||
34 | #include <linux/rbtree.h> | 35 | #include <linux/rbtree.h> |
35 | #include <linux/dma-mapping.h> /* for DMA_*_DEVICE */ | 36 | #include <linux/dma-mapping.h> /* for DMA_*_DEVICE */ |
36 | 37 | ||
@@ -317,6 +318,30 @@ int rds_get_mr(struct rds_sock *rs, char __user *optval, int optlen) | |||
317 | return __rds_rdma_map(rs, &args, NULL, NULL); | 318 | return __rds_rdma_map(rs, &args, NULL, NULL); |
318 | } | 319 | } |
319 | 320 | ||
321 | int rds_get_mr_for_dest(struct rds_sock *rs, char __user *optval, int optlen) | ||
322 | { | ||
323 | struct rds_get_mr_for_dest_args args; | ||
324 | struct rds_get_mr_args new_args; | ||
325 | |||
326 | if (optlen != sizeof(struct rds_get_mr_for_dest_args)) | ||
327 | return -EINVAL; | ||
328 | |||
329 | if (copy_from_user(&args, (struct rds_get_mr_for_dest_args __user *)optval, | ||
330 | sizeof(struct rds_get_mr_for_dest_args))) | ||
331 | return -EFAULT; | ||
332 | |||
333 | /* | ||
334 | * Initially, just behave like get_mr(). | ||
335 | * TODO: Implement get_mr as wrapper around this | ||
336 | * and deprecate it. | ||
337 | */ | ||
338 | new_args.vec = args.vec; | ||
339 | new_args.cookie_addr = args.cookie_addr; | ||
340 | new_args.flags = args.flags; | ||
341 | |||
342 | return __rds_rdma_map(rs, &new_args, NULL, NULL); | ||
343 | } | ||
344 | |||
320 | /* | 345 | /* |
321 | * Free the MR indicated by the given R_Key | 346 | * Free the MR indicated by the given R_Key |
322 | */ | 347 | */ |
@@ -607,8 +632,8 @@ int rds_cmsg_rdma_args(struct rds_sock *rs, struct rds_message *rm, | |||
607 | { | 632 | { |
608 | struct rds_rdma_op *op; | 633 | struct rds_rdma_op *op; |
609 | 634 | ||
610 | if (cmsg->cmsg_len < CMSG_LEN(sizeof(struct rds_rdma_args)) | 635 | if (cmsg->cmsg_len < CMSG_LEN(sizeof(struct rds_rdma_args)) || |
611 | || rm->m_rdma_op != NULL) | 636 | rm->m_rdma_op != NULL) |
612 | return -EINVAL; | 637 | return -EINVAL; |
613 | 638 | ||
614 | op = rds_rdma_prepare(rs, CMSG_DATA(cmsg)); | 639 | op = rds_rdma_prepare(rs, CMSG_DATA(cmsg)); |
@@ -631,8 +656,8 @@ int rds_cmsg_rdma_dest(struct rds_sock *rs, struct rds_message *rm, | |||
631 | u32 r_key; | 656 | u32 r_key; |
632 | int err = 0; | 657 | int err = 0; |
633 | 658 | ||
634 | if (cmsg->cmsg_len < CMSG_LEN(sizeof(rds_rdma_cookie_t)) | 659 | if (cmsg->cmsg_len < CMSG_LEN(sizeof(rds_rdma_cookie_t)) || |
635 | || rm->m_rdma_cookie != 0) | 660 | rm->m_rdma_cookie != 0) |
636 | return -EINVAL; | 661 | return -EINVAL; |
637 | 662 | ||
638 | memcpy(&rm->m_rdma_cookie, CMSG_DATA(cmsg), sizeof(rm->m_rdma_cookie)); | 663 | memcpy(&rm->m_rdma_cookie, CMSG_DATA(cmsg), sizeof(rm->m_rdma_cookie)); |
@@ -668,8 +693,8 @@ int rds_cmsg_rdma_dest(struct rds_sock *rs, struct rds_message *rm, | |||
668 | int rds_cmsg_rdma_map(struct rds_sock *rs, struct rds_message *rm, | 693 | int rds_cmsg_rdma_map(struct rds_sock *rs, struct rds_message *rm, |
669 | struct cmsghdr *cmsg) | 694 | struct cmsghdr *cmsg) |
670 | { | 695 | { |
671 | if (cmsg->cmsg_len < CMSG_LEN(sizeof(struct rds_get_mr_args)) | 696 | if (cmsg->cmsg_len < CMSG_LEN(sizeof(struct rds_get_mr_args)) || |
672 | || rm->m_rdma_cookie != 0) | 697 | rm->m_rdma_cookie != 0) |
673 | return -EINVAL; | 698 | return -EINVAL; |
674 | 699 | ||
675 | return __rds_rdma_map(rs, CMSG_DATA(cmsg), &rm->m_rdma_cookie, &rm->m_rdma_mr); | 700 | return __rds_rdma_map(rs, CMSG_DATA(cmsg), &rm->m_rdma_cookie, &rm->m_rdma_mr); |
diff --git a/net/rds/rdma.h b/net/rds/rdma.h index 425512098b0b..909c39835a5d 100644 --- a/net/rds/rdma.h +++ b/net/rds/rdma.h | |||
@@ -61,6 +61,7 @@ static inline u32 rds_rdma_cookie_offset(rds_rdma_cookie_t cookie) | |||
61 | } | 61 | } |
62 | 62 | ||
63 | int rds_get_mr(struct rds_sock *rs, char __user *optval, int optlen); | 63 | int rds_get_mr(struct rds_sock *rs, char __user *optval, int optlen); |
64 | int rds_get_mr_for_dest(struct rds_sock *rs, char __user *optval, int optlen); | ||
64 | int rds_free_mr(struct rds_sock *rs, char __user *optval, int optlen); | 65 | int rds_free_mr(struct rds_sock *rs, char __user *optval, int optlen); |
65 | void rds_rdma_drop_keys(struct rds_sock *rs); | 66 | void rds_rdma_drop_keys(struct rds_sock *rs); |
66 | int rds_cmsg_rdma_args(struct rds_sock *rs, struct rds_message *rm, | 67 | int rds_cmsg_rdma_args(struct rds_sock *rs, struct rds_message *rm, |
diff --git a/net/rds/rdma_transport.c b/net/rds/rdma_transport.c index 9ece910ea394..7b155081b4dc 100644 --- a/net/rds/rdma_transport.c +++ b/net/rds/rdma_transport.c | |||
@@ -134,7 +134,7 @@ static int __init rds_rdma_listen_init(void) | |||
134 | ret = PTR_ERR(cm_id); | 134 | ret = PTR_ERR(cm_id); |
135 | printk(KERN_ERR "RDS/RDMA: failed to setup listener, " | 135 | printk(KERN_ERR "RDS/RDMA: failed to setup listener, " |
136 | "rdma_create_id() returned %d\n", ret); | 136 | "rdma_create_id() returned %d\n", ret); |
137 | goto out; | 137 | return ret; |
138 | } | 138 | } |
139 | 139 | ||
140 | sin.sin_family = AF_INET, | 140 | sin.sin_family = AF_INET, |
diff --git a/net/rds/recv.c b/net/rds/recv.c index fdff33c7b432..e2a2b9344f7b 100644 --- a/net/rds/recv.c +++ b/net/rds/recv.c | |||
@@ -31,6 +31,7 @@ | |||
31 | * | 31 | * |
32 | */ | 32 | */ |
33 | #include <linux/kernel.h> | 33 | #include <linux/kernel.h> |
34 | #include <linux/slab.h> | ||
34 | #include <net/sock.h> | 35 | #include <net/sock.h> |
35 | #include <linux/in.h> | 36 | #include <linux/in.h> |
36 | 37 | ||
@@ -195,8 +196,8 @@ void rds_recv_incoming(struct rds_connection *conn, __be32 saddr, __be32 daddr, | |||
195 | * XXX we could spend more on the wire to get more robust failure | 196 | * XXX we could spend more on the wire to get more robust failure |
196 | * detection, arguably worth it to avoid data corruption. | 197 | * detection, arguably worth it to avoid data corruption. |
197 | */ | 198 | */ |
198 | if (be64_to_cpu(inc->i_hdr.h_sequence) < conn->c_next_rx_seq | 199 | if (be64_to_cpu(inc->i_hdr.h_sequence) < conn->c_next_rx_seq && |
199 | && (inc->i_hdr.h_flags & RDS_FLAG_RETRANSMITTED)) { | 200 | (inc->i_hdr.h_flags & RDS_FLAG_RETRANSMITTED)) { |
200 | rds_stats_inc(s_recv_drop_old_seq); | 201 | rds_stats_inc(s_recv_drop_old_seq); |
201 | goto out; | 202 | goto out; |
202 | } | 203 | } |
@@ -432,10 +433,9 @@ int rds_recvmsg(struct kiocb *iocb, struct socket *sock, struct msghdr *msg, | |||
432 | } | 433 | } |
433 | 434 | ||
434 | timeo = wait_event_interruptible_timeout(*sk->sk_sleep, | 435 | timeo = wait_event_interruptible_timeout(*sk->sk_sleep, |
435 | (!list_empty(&rs->rs_notify_queue) | 436 | (!list_empty(&rs->rs_notify_queue) || |
436 | || rs->rs_cong_notify | 437 | rs->rs_cong_notify || |
437 | || rds_next_incoming(rs, &inc)), | 438 | rds_next_incoming(rs, &inc)), timeo); |
438 | timeo); | ||
439 | rdsdebug("recvmsg woke inc %p timeo %ld\n", inc, | 439 | rdsdebug("recvmsg woke inc %p timeo %ld\n", inc, |
440 | timeo); | 440 | timeo); |
441 | if (timeo > 0 || timeo == MAX_SCHEDULE_TIMEOUT) | 441 | if (timeo > 0 || timeo == MAX_SCHEDULE_TIMEOUT) |
diff --git a/net/rds/send.c b/net/rds/send.c index 28c88ff3d038..f04b929ded92 100644 --- a/net/rds/send.c +++ b/net/rds/send.c | |||
@@ -31,6 +31,7 @@ | |||
31 | * | 31 | * |
32 | */ | 32 | */ |
33 | #include <linux/kernel.h> | 33 | #include <linux/kernel.h> |
34 | #include <linux/gfp.h> | ||
34 | #include <net/sock.h> | 35 | #include <net/sock.h> |
35 | #include <linux/in.h> | 36 | #include <linux/in.h> |
36 | #include <linux/list.h> | 37 | #include <linux/list.h> |
@@ -235,8 +236,8 @@ int rds_send_xmit(struct rds_connection *conn) | |||
235 | * connection. | 236 | * connection. |
236 | * Therefore, we never retransmit messages with RDMA ops. | 237 | * Therefore, we never retransmit messages with RDMA ops. |
237 | */ | 238 | */ |
238 | if (rm->m_rdma_op | 239 | if (rm->m_rdma_op && |
239 | && test_bit(RDS_MSG_RETRANSMITTED, &rm->m_flags)) { | 240 | test_bit(RDS_MSG_RETRANSMITTED, &rm->m_flags)) { |
240 | spin_lock_irqsave(&conn->c_lock, flags); | 241 | spin_lock_irqsave(&conn->c_lock, flags); |
241 | if (test_and_clear_bit(RDS_MSG_ON_CONN, &rm->m_flags)) | 242 | if (test_and_clear_bit(RDS_MSG_ON_CONN, &rm->m_flags)) |
242 | list_move(&rm->m_conn_item, &to_be_dropped); | 243 | list_move(&rm->m_conn_item, &to_be_dropped); |
@@ -247,8 +248,8 @@ int rds_send_xmit(struct rds_connection *conn) | |||
247 | 248 | ||
248 | /* Require an ACK every once in a while */ | 249 | /* Require an ACK every once in a while */ |
249 | len = ntohl(rm->m_inc.i_hdr.h_len); | 250 | len = ntohl(rm->m_inc.i_hdr.h_len); |
250 | if (conn->c_unacked_packets == 0 | 251 | if (conn->c_unacked_packets == 0 || |
251 | || conn->c_unacked_bytes < len) { | 252 | conn->c_unacked_bytes < len) { |
252 | __set_bit(RDS_MSG_ACK_REQUIRED, &rm->m_flags); | 253 | __set_bit(RDS_MSG_ACK_REQUIRED, &rm->m_flags); |
253 | 254 | ||
254 | conn->c_unacked_packets = rds_sysctl_max_unacked_packets; | 255 | conn->c_unacked_packets = rds_sysctl_max_unacked_packets; |
@@ -418,8 +419,8 @@ void rds_rdma_send_complete(struct rds_message *rm, int status) | |||
418 | spin_lock(&rm->m_rs_lock); | 419 | spin_lock(&rm->m_rs_lock); |
419 | 420 | ||
420 | ro = rm->m_rdma_op; | 421 | ro = rm->m_rdma_op; |
421 | if (test_bit(RDS_MSG_ON_SOCK, &rm->m_flags) | 422 | if (test_bit(RDS_MSG_ON_SOCK, &rm->m_flags) && |
422 | && ro && ro->r_notify && ro->r_notifier) { | 423 | ro && ro->r_notify && ro->r_notifier) { |
423 | notifier = ro->r_notifier; | 424 | notifier = ro->r_notifier; |
424 | rs = rm->m_rs; | 425 | rs = rm->m_rs; |
425 | sock_hold(rds_rs_to_sk(rs)); | 426 | sock_hold(rds_rs_to_sk(rs)); |
@@ -549,8 +550,7 @@ void rds_send_remove_from_sock(struct list_head *messages, int status) | |||
549 | list_del_init(&rm->m_sock_item); | 550 | list_del_init(&rm->m_sock_item); |
550 | rds_send_sndbuf_remove(rs, rm); | 551 | rds_send_sndbuf_remove(rs, rm); |
551 | 552 | ||
552 | if (ro && ro->r_notifier | 553 | if (ro && ro->r_notifier && (status || ro->r_notify)) { |
553 | && (status || ro->r_notify)) { | ||
554 | notifier = ro->r_notifier; | 554 | notifier = ro->r_notifier; |
555 | list_add_tail(¬ifier->n_list, | 555 | list_add_tail(¬ifier->n_list, |
556 | &rs->rs_notify_queue); | 556 | &rs->rs_notify_queue); |
@@ -877,8 +877,8 @@ int rds_sendmsg(struct kiocb *iocb, struct socket *sock, struct msghdr *msg, | |||
877 | if (ret) | 877 | if (ret) |
878 | goto out; | 878 | goto out; |
879 | 879 | ||
880 | if ((rm->m_rdma_cookie || rm->m_rdma_op) | 880 | if ((rm->m_rdma_cookie || rm->m_rdma_op) && |
881 | && conn->c_trans->xmit_rdma == NULL) { | 881 | conn->c_trans->xmit_rdma == NULL) { |
882 | if (printk_ratelimit()) | 882 | if (printk_ratelimit()) |
883 | printk(KERN_NOTICE "rdma_op %p conn xmit_rdma %p\n", | 883 | printk(KERN_NOTICE "rdma_op %p conn xmit_rdma %p\n", |
884 | rm->m_rdma_op, conn->c_trans->xmit_rdma); | 884 | rm->m_rdma_op, conn->c_trans->xmit_rdma); |
@@ -890,8 +890,8 @@ int rds_sendmsg(struct kiocb *iocb, struct socket *sock, struct msghdr *msg, | |||
890 | * have scheduled a delayed reconnect however - in this case | 890 | * have scheduled a delayed reconnect however - in this case |
891 | * we should not interfere. | 891 | * we should not interfere. |
892 | */ | 892 | */ |
893 | if (rds_conn_state(conn) == RDS_CONN_DOWN | 893 | if (rds_conn_state(conn) == RDS_CONN_DOWN && |
894 | && !test_and_set_bit(RDS_RECONNECT_PENDING, &conn->c_flags)) | 894 | !test_and_set_bit(RDS_RECONNECT_PENDING, &conn->c_flags)) |
895 | queue_delayed_work(rds_wq, &conn->c_conn_w, 0); | 895 | queue_delayed_work(rds_wq, &conn->c_conn_w, 0); |
896 | 896 | ||
897 | ret = rds_cong_wait(conn->c_fcong, dport, nonblock, rs); | 897 | ret = rds_cong_wait(conn->c_fcong, dport, nonblock, rs); |
@@ -973,8 +973,8 @@ rds_send_pong(struct rds_connection *conn, __be16 dport) | |||
973 | * have scheduled a delayed reconnect however - in this case | 973 | * have scheduled a delayed reconnect however - in this case |
974 | * we should not interfere. | 974 | * we should not interfere. |
975 | */ | 975 | */ |
976 | if (rds_conn_state(conn) == RDS_CONN_DOWN | 976 | if (rds_conn_state(conn) == RDS_CONN_DOWN && |
977 | && !test_and_set_bit(RDS_RECONNECT_PENDING, &conn->c_flags)) | 977 | !test_and_set_bit(RDS_RECONNECT_PENDING, &conn->c_flags)) |
978 | queue_delayed_work(rds_wq, &conn->c_conn_w, 0); | 978 | queue_delayed_work(rds_wq, &conn->c_conn_w, 0); |
979 | 979 | ||
980 | ret = rds_cong_wait(conn->c_fcong, dport, 1, NULL); | 980 | ret = rds_cong_wait(conn->c_fcong, dport, 1, NULL); |
diff --git a/net/rds/sysctl.c b/net/rds/sysctl.c index 307dc5c1be15..7829a20325d3 100644 --- a/net/rds/sysctl.c +++ b/net/rds/sysctl.c | |||
@@ -51,55 +51,50 @@ unsigned int rds_sysctl_ping_enable = 1; | |||
51 | 51 | ||
52 | static ctl_table rds_sysctl_rds_table[] = { | 52 | static ctl_table rds_sysctl_rds_table[] = { |
53 | { | 53 | { |
54 | .ctl_name = CTL_UNNUMBERED, | ||
55 | .procname = "reconnect_min_delay_ms", | 54 | .procname = "reconnect_min_delay_ms", |
56 | .data = &rds_sysctl_reconnect_min_jiffies, | 55 | .data = &rds_sysctl_reconnect_min_jiffies, |
57 | .maxlen = sizeof(unsigned long), | 56 | .maxlen = sizeof(unsigned long), |
58 | .mode = 0644, | 57 | .mode = 0644, |
59 | .proc_handler = &proc_doulongvec_ms_jiffies_minmax, | 58 | .proc_handler = proc_doulongvec_ms_jiffies_minmax, |
60 | .extra1 = &rds_sysctl_reconnect_min, | 59 | .extra1 = &rds_sysctl_reconnect_min, |
61 | .extra2 = &rds_sysctl_reconnect_max_jiffies, | 60 | .extra2 = &rds_sysctl_reconnect_max_jiffies, |
62 | }, | 61 | }, |
63 | { | 62 | { |
64 | .ctl_name = CTL_UNNUMBERED, | ||
65 | .procname = "reconnect_max_delay_ms", | 63 | .procname = "reconnect_max_delay_ms", |
66 | .data = &rds_sysctl_reconnect_max_jiffies, | 64 | .data = &rds_sysctl_reconnect_max_jiffies, |
67 | .maxlen = sizeof(unsigned long), | 65 | .maxlen = sizeof(unsigned long), |
68 | .mode = 0644, | 66 | .mode = 0644, |
69 | .proc_handler = &proc_doulongvec_ms_jiffies_minmax, | 67 | .proc_handler = proc_doulongvec_ms_jiffies_minmax, |
70 | .extra1 = &rds_sysctl_reconnect_min_jiffies, | 68 | .extra1 = &rds_sysctl_reconnect_min_jiffies, |
71 | .extra2 = &rds_sysctl_reconnect_max, | 69 | .extra2 = &rds_sysctl_reconnect_max, |
72 | }, | 70 | }, |
73 | { | 71 | { |
74 | .ctl_name = CTL_UNNUMBERED, | ||
75 | .procname = "max_unacked_packets", | 72 | .procname = "max_unacked_packets", |
76 | .data = &rds_sysctl_max_unacked_packets, | 73 | .data = &rds_sysctl_max_unacked_packets, |
77 | .maxlen = sizeof(unsigned long), | 74 | .maxlen = sizeof(unsigned long), |
78 | .mode = 0644, | 75 | .mode = 0644, |
79 | .proc_handler = &proc_dointvec, | 76 | .proc_handler = proc_dointvec, |
80 | }, | 77 | }, |
81 | { | 78 | { |
82 | .ctl_name = CTL_UNNUMBERED, | ||
83 | .procname = "max_unacked_bytes", | 79 | .procname = "max_unacked_bytes", |
84 | .data = &rds_sysctl_max_unacked_bytes, | 80 | .data = &rds_sysctl_max_unacked_bytes, |
85 | .maxlen = sizeof(unsigned long), | 81 | .maxlen = sizeof(unsigned long), |
86 | .mode = 0644, | 82 | .mode = 0644, |
87 | .proc_handler = &proc_dointvec, | 83 | .proc_handler = proc_dointvec, |
88 | }, | 84 | }, |
89 | { | 85 | { |
90 | .ctl_name = CTL_UNNUMBERED, | ||
91 | .procname = "ping_enable", | 86 | .procname = "ping_enable", |
92 | .data = &rds_sysctl_ping_enable, | 87 | .data = &rds_sysctl_ping_enable, |
93 | .maxlen = sizeof(int), | 88 | .maxlen = sizeof(int), |
94 | .mode = 0644, | 89 | .mode = 0644, |
95 | .proc_handler = &proc_dointvec, | 90 | .proc_handler = proc_dointvec, |
96 | }, | 91 | }, |
97 | { .ctl_name = 0} | 92 | { } |
98 | }; | 93 | }; |
99 | 94 | ||
100 | static struct ctl_path rds_sysctl_path[] = { | 95 | static struct ctl_path rds_sysctl_path[] = { |
101 | { .procname = "net", .ctl_name = CTL_NET, }, | 96 | { .procname = "net", }, |
102 | { .procname = "rds", .ctl_name = CTL_UNNUMBERED, }, | 97 | { .procname = "rds", }, |
103 | { } | 98 | { } |
104 | }; | 99 | }; |
105 | 100 | ||
diff --git a/net/rds/tcp.c b/net/rds/tcp.c index b5198aee45d3..babf4577ff7d 100644 --- a/net/rds/tcp.c +++ b/net/rds/tcp.c | |||
@@ -31,6 +31,7 @@ | |||
31 | * | 31 | * |
32 | */ | 32 | */ |
33 | #include <linux/kernel.h> | 33 | #include <linux/kernel.h> |
34 | #include <linux/slab.h> | ||
34 | #include <linux/in.h> | 35 | #include <linux/in.h> |
35 | #include <net/tcp.h> | 36 | #include <net/tcp.h> |
36 | 37 | ||
diff --git a/net/rds/tcp_connect.c b/net/rds/tcp_connect.c index 211522f9a9a2..056256285987 100644 --- a/net/rds/tcp_connect.c +++ b/net/rds/tcp_connect.c | |||
@@ -90,8 +90,8 @@ int rds_tcp_conn_connect(struct rds_connection *conn) | |||
90 | 90 | ||
91 | ret = sock->ops->bind(sock, (struct sockaddr *)&src, sizeof(src)); | 91 | ret = sock->ops->bind(sock, (struct sockaddr *)&src, sizeof(src)); |
92 | if (ret) { | 92 | if (ret) { |
93 | rdsdebug("bind failed with %d at address %u.%u.%u.%u\n", | 93 | rdsdebug("bind failed with %d at address %pI4\n", |
94 | ret, NIPQUAD(conn->c_laddr)); | 94 | ret, &conn->c_laddr); |
95 | goto out; | 95 | goto out; |
96 | } | 96 | } |
97 | 97 | ||
@@ -108,8 +108,7 @@ int rds_tcp_conn_connect(struct rds_connection *conn) | |||
108 | O_NONBLOCK); | 108 | O_NONBLOCK); |
109 | sock = NULL; | 109 | sock = NULL; |
110 | 110 | ||
111 | rdsdebug("connect to address %u.%u.%u.%u returned %d\n", | 111 | rdsdebug("connect to address %pI4 returned %d\n", &conn->c_faddr, ret); |
112 | NIPQUAD(conn->c_faddr), ret); | ||
113 | if (ret == -EINPROGRESS) | 112 | if (ret == -EINPROGRESS) |
114 | ret = 0; | 113 | ret = 0; |
115 | 114 | ||
diff --git a/net/rds/tcp_listen.c b/net/rds/tcp_listen.c index 24b743eb0b1b..975183fe6950 100644 --- a/net/rds/tcp_listen.c +++ b/net/rds/tcp_listen.c | |||
@@ -31,6 +31,7 @@ | |||
31 | * | 31 | * |
32 | */ | 32 | */ |
33 | #include <linux/kernel.h> | 33 | #include <linux/kernel.h> |
34 | #include <linux/gfp.h> | ||
34 | #include <linux/in.h> | 35 | #include <linux/in.h> |
35 | #include <net/tcp.h> | 36 | #include <net/tcp.h> |
36 | 37 | ||
@@ -66,12 +67,12 @@ static int rds_tcp_accept_one(struct socket *sock) | |||
66 | 67 | ||
67 | inet = inet_sk(new_sock->sk); | 68 | inet = inet_sk(new_sock->sk); |
68 | 69 | ||
69 | rdsdebug("accepted tcp %u.%u.%u.%u:%u -> %u.%u.%u.%u:%u\n", | 70 | rdsdebug("accepted tcp %pI4:%u -> %pI4:%u\n", |
70 | NIPQUAD(inet->saddr), ntohs(inet->sport), | 71 | &inet->inet_saddr, ntohs(inet->inet_sport), |
71 | NIPQUAD(inet->daddr), ntohs(inet->dport)); | 72 | &inet->inet_daddr, ntohs(inet->inet_dport)); |
72 | 73 | ||
73 | conn = rds_conn_create(inet->saddr, inet->daddr, &rds_tcp_transport, | 74 | conn = rds_conn_create(inet->inet_saddr, inet->inet_daddr, |
74 | GFP_KERNEL); | 75 | &rds_tcp_transport, GFP_KERNEL); |
75 | if (IS_ERR(conn)) { | 76 | if (IS_ERR(conn)) { |
76 | ret = PTR_ERR(conn); | 77 | ret = PTR_ERR(conn); |
77 | goto out; | 78 | goto out; |
diff --git a/net/rds/tcp_recv.c b/net/rds/tcp_recv.c index c00dafffbb5a..e08ec912d8b0 100644 --- a/net/rds/tcp_recv.c +++ b/net/rds/tcp_recv.c | |||
@@ -31,6 +31,7 @@ | |||
31 | * | 31 | * |
32 | */ | 32 | */ |
33 | #include <linux/kernel.h> | 33 | #include <linux/kernel.h> |
34 | #include <linux/slab.h> | ||
34 | #include <net/tcp.h> | 35 | #include <net/tcp.h> |
35 | 36 | ||
36 | #include "rds.h" | 37 | #include "rds.h" |
diff --git a/net/rds/tcp_send.c b/net/rds/tcp_send.c index ab545e0cd5d6..34fdcc059e54 100644 --- a/net/rds/tcp_send.c +++ b/net/rds/tcp_send.c | |||
@@ -193,9 +193,9 @@ out: | |||
193 | rds_tcp_stats_inc(s_tcp_sndbuf_full); | 193 | rds_tcp_stats_inc(s_tcp_sndbuf_full); |
194 | ret = 0; | 194 | ret = 0; |
195 | } else { | 195 | } else { |
196 | printk(KERN_WARNING "RDS/tcp: send to %u.%u.%u.%u " | 196 | printk(KERN_WARNING "RDS/tcp: send to %pI4 " |
197 | "returned %d, disconnecting and reconnecting\n", | 197 | "returned %d, disconnecting and reconnecting\n", |
198 | NIPQUAD(conn->c_faddr), ret); | 198 | &conn->c_faddr, ret); |
199 | rds_conn_drop(conn); | 199 | rds_conn_drop(conn); |
200 | } | 200 | } |
201 | } | 201 | } |
diff --git a/net/rds/threads.c b/net/rds/threads.c index dd7e0cad1e7c..00fa10e59af8 100644 --- a/net/rds/threads.c +++ b/net/rds/threads.c | |||
@@ -170,8 +170,8 @@ void rds_shutdown_worker(struct work_struct *work) | |||
170 | * handler is supposed to check for state DISCONNECTING | 170 | * handler is supposed to check for state DISCONNECTING |
171 | */ | 171 | */ |
172 | mutex_lock(&conn->c_cm_lock); | 172 | mutex_lock(&conn->c_cm_lock); |
173 | if (!rds_conn_transition(conn, RDS_CONN_UP, RDS_CONN_DISCONNECTING) | 173 | if (!rds_conn_transition(conn, RDS_CONN_UP, RDS_CONN_DISCONNECTING) && |
174 | && !rds_conn_transition(conn, RDS_CONN_ERROR, RDS_CONN_DISCONNECTING)) { | 174 | !rds_conn_transition(conn, RDS_CONN_ERROR, RDS_CONN_DISCONNECTING)) { |
175 | rds_conn_error(conn, "shutdown called in state %d\n", | 175 | rds_conn_error(conn, "shutdown called in state %d\n", |
176 | atomic_read(&conn->c_state)); | 176 | atomic_read(&conn->c_state)); |
177 | mutex_unlock(&conn->c_cm_lock); | 177 | mutex_unlock(&conn->c_cm_lock); |