diff options
| author | Sage Weil <sage@inktank.com> | 2012-07-10 14:53:34 -0400 |
|---|---|---|
| committer | Sage Weil <sage@inktank.com> | 2012-07-30 12:29:52 -0400 |
| commit | a16cb1f70799c851410d9dca0a24122e258df06c (patch) | |
| tree | 0290805d3594d770da3937da7fa68841c1e294ac /include/linux/ceph | |
| parent | cd43045c2de60f40a0aea49bfb252a2eafe58f8c (diff) | |
libceph: fix messenger retry
In ancient times, the messenger could both initiate and accept connections.
An artifact if that was data structures to store/process an incoming
ceph_msg_connect request and send an outgoing ceph_msg_connect_reply.
Sadly, the negotiation code was referencing those structures and ignoring
important information (like the peer's connect_seq) from the correct ones.
Among other things, this fixes tight reconnect loops where the server sends
RETRY_SESSION and we (the client) retries with the same connect_seq as last
time. This bug pretty easily triggered by injecting socket failures on the
MDS and running some fs workload like workunits/direct_io/test_sync_io.
Signed-off-by: Sage Weil <sage@inktank.com>
Diffstat (limited to 'include/linux/ceph')
| -rw-r--r-- | include/linux/ceph/messenger.h | 12 |
1 files changed, 2 insertions, 10 deletions
diff --git a/include/linux/ceph/messenger.h b/include/linux/ceph/messenger.h index 478f814f210..cfb1bbdac62 100644 --- a/include/linux/ceph/messenger.h +++ b/include/linux/ceph/messenger.h | |||
| @@ -172,16 +172,8 @@ struct ceph_connection { | |||
| 172 | 172 | ||
| 173 | /* connection negotiation temps */ | 173 | /* connection negotiation temps */ |
| 174 | char in_banner[CEPH_BANNER_MAX_LEN]; | 174 | char in_banner[CEPH_BANNER_MAX_LEN]; |
| 175 | union { | 175 | struct ceph_msg_connect out_connect; |
| 176 | struct { /* outgoing connection */ | 176 | struct ceph_msg_connect_reply in_reply; |
| 177 | struct ceph_msg_connect out_connect; | ||
| 178 | struct ceph_msg_connect_reply in_reply; | ||
| 179 | }; | ||
| 180 | struct { /* incoming */ | ||
| 181 | struct ceph_msg_connect in_connect; | ||
| 182 | struct ceph_msg_connect_reply out_reply; | ||
| 183 | }; | ||
| 184 | }; | ||
| 185 | struct ceph_entity_addr actual_peer_addr; | 177 | struct ceph_entity_addr actual_peer_addr; |
| 186 | 178 | ||
| 187 | /* message out temps */ | 179 | /* message out temps */ |
