aboutsummaryrefslogtreecommitdiffstats
path: root/include/linux/ceph
diff options
context:
space:
mode:
authorSage Weil <sage@inktank.com>2012-07-10 14:53:34 -0400
committerSage Weil <sage@inktank.com>2012-07-30 12:29:52 -0400
commita16cb1f70799c851410d9dca0a24122e258df06c (patch)
tree0290805d3594d770da3937da7fa68841c1e294ac /include/linux/ceph
parentcd43045c2de60f40a0aea49bfb252a2eafe58f8c (diff)
libceph: fix messenger retry
In ancient times, the messenger could both initiate and accept connections. An artifact if that was data structures to store/process an incoming ceph_msg_connect request and send an outgoing ceph_msg_connect_reply. Sadly, the negotiation code was referencing those structures and ignoring important information (like the peer's connect_seq) from the correct ones. Among other things, this fixes tight reconnect loops where the server sends RETRY_SESSION and we (the client) retries with the same connect_seq as last time. This bug pretty easily triggered by injecting socket failures on the MDS and running some fs workload like workunits/direct_io/test_sync_io. Signed-off-by: Sage Weil <sage@inktank.com>
Diffstat (limited to 'include/linux/ceph')
-rw-r--r--include/linux/ceph/messenger.h12
1 files changed, 2 insertions, 10 deletions
diff --git a/include/linux/ceph/messenger.h b/include/linux/ceph/messenger.h
index 478f814f210..cfb1bbdac62 100644
--- a/include/linux/ceph/messenger.h
+++ b/include/linux/ceph/messenger.h
@@ -172,16 +172,8 @@ struct ceph_connection {
172 172
173 /* connection negotiation temps */ 173 /* connection negotiation temps */
174 char in_banner[CEPH_BANNER_MAX_LEN]; 174 char in_banner[CEPH_BANNER_MAX_LEN];
175 union { 175 struct ceph_msg_connect out_connect;
176 struct { /* outgoing connection */ 176 struct ceph_msg_connect_reply in_reply;
177 struct ceph_msg_connect out_connect;
178 struct ceph_msg_connect_reply in_reply;
179 };
180 struct { /* incoming */
181 struct ceph_msg_connect in_connect;
182 struct ceph_msg_connect_reply out_reply;
183 };
184 };
185 struct ceph_entity_addr actual_peer_addr; 177 struct ceph_entity_addr actual_peer_addr;
186 178
187 /* message out temps */ 179 /* message out temps */