diff options
author | Sage Weil <sage@inktank.com> | 2012-07-10 14:53:34 -0400 |
---|---|---|
committer | Sage Weil <sage@inktank.com> | 2012-07-17 22:35:59 -0400 |
commit | 5bdca4e0768d3e0f4efa43d9a2cc8210aeb91ab9 (patch) | |
tree | de2a46ca2bc95e84737f3fe65e715d602b3b9356 /include | |
parent | a018540141a931f5299a866907b27886916b4374 (diff) |
libceph: fix messenger retry
In ancient times, the messenger could both initiate and accept connections.
An artifact of that was data structures to store/process an incoming
ceph_msg_connect request and send an outgoing ceph_msg_connect_reply.
Sadly, the negotiation code was referencing those structures and ignoring
important information (like the peer's connect_seq) from the correct ones.
Among other things, this fixes tight reconnect loops where the server sends
RETRY_SESSION and we (the client) retry with the same connect_seq as last
time. This bug is pretty easily triggered by injecting socket failures on the
MDS and running some fs workload like workunits/direct_io/test_sync_io.
Signed-off-by: Sage Weil <sage@inktank.com>
Diffstat (limited to 'include')
-rw-r--r-- | include/linux/ceph/messenger.h | 12 |
1 files changed, 2 insertions, 10 deletions
diff --git a/include/linux/ceph/messenger.h b/include/linux/ceph/messenger.h index 2521a95fa6d9..44c87e731e9d 100644 --- a/include/linux/ceph/messenger.h +++ b/include/linux/ceph/messenger.h | |||
@@ -163,16 +163,8 @@ struct ceph_connection { | |||
163 | 163 | ||
164 | /* connection negotiation temps */ | 164 | /* connection negotiation temps */ |
165 | char in_banner[CEPH_BANNER_MAX_LEN]; | 165 | char in_banner[CEPH_BANNER_MAX_LEN]; |
166 | union { | 166 | struct ceph_msg_connect out_connect; |
167 | struct { /* outgoing connection */ | 167 | struct ceph_msg_connect_reply in_reply; |
168 | struct ceph_msg_connect out_connect; | ||
169 | struct ceph_msg_connect_reply in_reply; | ||
170 | }; | ||
171 | struct { /* incoming */ | ||
172 | struct ceph_msg_connect in_connect; | ||
173 | struct ceph_msg_connect_reply out_reply; | ||
174 | }; | ||
175 | }; | ||
176 | struct ceph_entity_addr actual_peer_addr; | 168 | struct ceph_entity_addr actual_peer_addr; |
177 | 169 | ||
178 | /* message out temps */ | 170 | /* message out temps */ |