diff options
author | Linus Torvalds <torvalds@linux-foundation.org> | 2011-01-10 10:46:26 -0500 |
---|---|---|
committer | Linus Torvalds <torvalds@linux-foundation.org> | 2011-01-10 10:46:26 -0500 |
commit | f9f265f35578c5fb2266d0e2a1aa5b57f6fdb36a (patch) | |
tree | 8fee08f3ea63633c2cc3e93778ad9c8eb15193c8 /fs | |
parent | 7d44b0440147d83a65270205b22e7d365de28948 (diff) | |
parent | b9d41052794385f9d47ebb7acf4a772f3ad02398 (diff) |
Merge branch 'for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/teigland/dlm
* 'for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/teigland/dlm:
dlm: sanitize work_start() in lowcomms.c
dlm: reduce cond_resched during send
dlm: use TCP_NODELAY
dlm: Use cmwq for send and receive workqueues
dlm: Handle application limited situations properly.
Diffstat (limited to 'fs')
-rw-r--r-- | fs/dlm/lowcomms.c | 63 |
1 files changed, 50 insertions, 13 deletions
diff --git a/fs/dlm/lowcomms.c b/fs/dlm/lowcomms.c index 37a34c2c622a..9c64ae9e4c1a 100644 --- a/fs/dlm/lowcomms.c +++ b/fs/dlm/lowcomms.c | |||
@@ -63,6 +63,9 @@ | |||
63 | #define NEEDED_RMEM (4*1024*1024) | 63 | #define NEEDED_RMEM (4*1024*1024) |
64 | #define CONN_HASH_SIZE 32 | 64 | #define CONN_HASH_SIZE 32 |
65 | 65 | ||
66 | /* Number of messages to send before rescheduling */ | ||
67 | #define MAX_SEND_MSG_COUNT 25 | ||
68 | |||
66 | struct cbuf { | 69 | struct cbuf { |
67 | unsigned int base; | 70 | unsigned int base; |
68 | unsigned int len; | 71 | unsigned int len; |
@@ -108,6 +111,7 @@ struct connection { | |||
108 | #define CF_INIT_PENDING 4 | 111 | #define CF_INIT_PENDING 4 |
109 | #define CF_IS_OTHERCON 5 | 112 | #define CF_IS_OTHERCON 5 |
110 | #define CF_CLOSE 6 | 113 | #define CF_CLOSE 6 |
114 | #define CF_APP_LIMITED 7 | ||
111 | struct list_head writequeue; /* List of outgoing writequeue_entries */ | 115 | struct list_head writequeue; /* List of outgoing writequeue_entries */ |
112 | spinlock_t writequeue_lock; | 116 | spinlock_t writequeue_lock; |
113 | int (*rx_action) (struct connection *); /* What to do when active */ | 117 | int (*rx_action) (struct connection *); /* What to do when active */ |
@@ -295,7 +299,17 @@ static void lowcomms_write_space(struct sock *sk) | |||
295 | { | 299 | { |
296 | struct connection *con = sock2con(sk); | 300 | struct connection *con = sock2con(sk); |
297 | 301 | ||
298 | if (con && !test_and_set_bit(CF_WRITE_PENDING, &con->flags)) | 302 | if (!con) |
303 | return; | ||
304 | |||
305 | clear_bit(SOCK_NOSPACE, &con->sock->flags); | ||
306 | |||
307 | if (test_and_clear_bit(CF_APP_LIMITED, &con->flags)) { | ||
308 | con->sock->sk->sk_write_pending--; | ||
309 | clear_bit(SOCK_ASYNC_NOSPACE, &con->sock->flags); | ||
310 | } | ||
311 | |||
312 | if (!test_and_set_bit(CF_WRITE_PENDING, &con->flags)) | ||
299 | queue_work(send_workqueue, &con->swork); | 313 | queue_work(send_workqueue, &con->swork); |
300 | } | 314 | } |
301 | 315 | ||
@@ -915,6 +929,7 @@ static void tcp_connect_to_sock(struct connection *con) | |||
915 | struct sockaddr_storage saddr, src_addr; | 929 | struct sockaddr_storage saddr, src_addr; |
916 | int addr_len; | 930 | int addr_len; |
917 | struct socket *sock = NULL; | 931 | struct socket *sock = NULL; |
932 | int one = 1; | ||
918 | 933 | ||
919 | if (con->nodeid == 0) { | 934 | if (con->nodeid == 0) { |
920 | log_print("attempt to connect sock 0 foiled"); | 935 | log_print("attempt to connect sock 0 foiled"); |
@@ -960,6 +975,11 @@ static void tcp_connect_to_sock(struct connection *con) | |||
960 | make_sockaddr(&saddr, dlm_config.ci_tcp_port, &addr_len); | 975 | make_sockaddr(&saddr, dlm_config.ci_tcp_port, &addr_len); |
961 | 976 | ||
962 | log_print("connecting to %d", con->nodeid); | 977 | log_print("connecting to %d", con->nodeid); |
978 | |||
979 | /* Turn off Nagle's algorithm */ | ||
980 | kernel_setsockopt(sock, SOL_TCP, TCP_NODELAY, (char *)&one, | ||
981 | sizeof(one)); | ||
982 | |||
963 | result = | 983 | result = |
964 | sock->ops->connect(sock, (struct sockaddr *)&saddr, addr_len, | 984 | sock->ops->connect(sock, (struct sockaddr *)&saddr, addr_len, |
965 | O_NONBLOCK); | 985 | O_NONBLOCK); |
@@ -1011,6 +1031,10 @@ static struct socket *tcp_create_listen_sock(struct connection *con, | |||
1011 | goto create_out; | 1031 | goto create_out; |
1012 | } | 1032 | } |
1013 | 1033 | ||
1034 | /* Turn off Nagle's algorithm */ | ||
1035 | kernel_setsockopt(sock, SOL_TCP, TCP_NODELAY, (char *)&one, | ||
1036 | sizeof(one)); | ||
1037 | |||
1014 | result = kernel_setsockopt(sock, SOL_SOCKET, SO_REUSEADDR, | 1038 | result = kernel_setsockopt(sock, SOL_SOCKET, SO_REUSEADDR, |
1015 | (char *)&one, sizeof(one)); | 1039 | (char *)&one, sizeof(one)); |
1016 | 1040 | ||
@@ -1297,6 +1321,7 @@ static void send_to_sock(struct connection *con) | |||
1297 | const int msg_flags = MSG_DONTWAIT | MSG_NOSIGNAL; | 1321 | const int msg_flags = MSG_DONTWAIT | MSG_NOSIGNAL; |
1298 | struct writequeue_entry *e; | 1322 | struct writequeue_entry *e; |
1299 | int len, offset; | 1323 | int len, offset; |
1324 | int count = 0; | ||
1300 | 1325 | ||
1301 | mutex_lock(&con->sock_mutex); | 1326 | mutex_lock(&con->sock_mutex); |
1302 | if (con->sock == NULL) | 1327 | if (con->sock == NULL) |
@@ -1319,14 +1344,27 @@ static void send_to_sock(struct connection *con) | |||
1319 | ret = kernel_sendpage(con->sock, e->page, offset, len, | 1344 | ret = kernel_sendpage(con->sock, e->page, offset, len, |
1320 | msg_flags); | 1345 | msg_flags); |
1321 | if (ret == -EAGAIN || ret == 0) { | 1346 | if (ret == -EAGAIN || ret == 0) { |
1347 | if (ret == -EAGAIN && | ||
1348 | test_bit(SOCK_ASYNC_NOSPACE, &con->sock->flags) && | ||
1349 | !test_and_set_bit(CF_APP_LIMITED, &con->flags)) { | ||
1350 | /* Notify TCP that we're limited by the | ||
1351 | * application window size. | ||
1352 | */ | ||
1353 | set_bit(SOCK_NOSPACE, &con->sock->flags); | ||
1354 | con->sock->sk->sk_write_pending++; | ||
1355 | } | ||
1322 | cond_resched(); | 1356 | cond_resched(); |
1323 | goto out; | 1357 | goto out; |
1324 | } | 1358 | } |
1325 | if (ret <= 0) | 1359 | if (ret <= 0) |
1326 | goto send_error; | 1360 | goto send_error; |
1327 | } | 1361 | } |
1328 | /* Don't starve people filling buffers */ | 1362 | |
1363 | /* Don't starve people filling buffers */ | ||
1364 | if (++count >= MAX_SEND_MSG_COUNT) { | ||
1329 | cond_resched(); | 1365 | cond_resched(); |
1366 | count = 0; | ||
1367 | } | ||
1330 | 1368 | ||
1331 | spin_lock(&con->writequeue_lock); | 1369 | spin_lock(&con->writequeue_lock); |
1332 | e->offset += ret; | 1370 | e->offset += ret; |
@@ -1430,20 +1468,19 @@ static void work_stop(void) | |||
1430 | 1468 | ||
1431 | static int work_start(void) | 1469 | static int work_start(void) |
1432 | { | 1470 | { |
1433 | int error; | 1471 | recv_workqueue = alloc_workqueue("dlm_recv", WQ_MEM_RECLAIM | |
1434 | recv_workqueue = create_workqueue("dlm_recv"); | 1472 | WQ_HIGHPRI | WQ_FREEZEABLE, 0); |
1435 | error = IS_ERR(recv_workqueue); | 1473 | if (!recv_workqueue) { |
1436 | if (error) { | 1474 | log_print("can't start dlm_recv"); |
1437 | log_print("can't start dlm_recv %d", error); | 1475 | return -ENOMEM; |
1438 | return error; | ||
1439 | } | 1476 | } |
1440 | 1477 | ||
1441 | send_workqueue = create_singlethread_workqueue("dlm_send"); | 1478 | send_workqueue = alloc_workqueue("dlm_send", WQ_MEM_RECLAIM | |
1442 | error = IS_ERR(send_workqueue); | 1479 | WQ_HIGHPRI | WQ_FREEZEABLE, 0); |
1443 | if (error) { | 1480 | if (!send_workqueue) { |
1444 | log_print("can't start dlm_send %d", error); | 1481 | log_print("can't start dlm_send"); |
1445 | destroy_workqueue(recv_workqueue); | 1482 | destroy_workqueue(recv_workqueue); |
1446 | return error; | 1483 | return -ENOMEM; |
1447 | } | 1484 | } |
1448 | 1485 | ||
1449 | return 0; | 1486 | return 0; |