diff options
author | Sage Weil <sage@newdream.net> | 2009-10-06 14:31:10 -0400 |
---|---|---|
committer | Sage Weil <sage@newdream.net> | 2009-10-06 14:31:10 -0400 |
commit | f24e9980eb860d8600cbe5ef3d2fd9295320d229 (patch) | |
tree | 10f43450ad2cd4d799dd02d33c02d4ed8bef39d6 /fs/ceph/osd_client.h | |
parent | 2f2dc053404febedc9c273452d9d518fb31fde72 (diff) |
ceph: OSD client
The OSD client is responsible for reading and writing data from/to the
object storage pool. This includes determining where objects are
stored in the cluster, and ensuring that requests are retried or
redirected in the event of a node failure or data migration.
If an OSD does not respond before a timeout expires, keepalive
messages are sent across the lossless, ordered communications channel
to ensure that any break in the TCP connection is discovered. If the session
does reset, a reconnection is attempted and affected requests are
resent (by the message transport layer).
Signed-off-by: Sage Weil <sage@newdream.net>
Diffstat (limited to 'fs/ceph/osd_client.h')
-rw-r--r-- | fs/ceph/osd_client.h | 144 |
1 files changed, 144 insertions, 0 deletions
diff --git a/fs/ceph/osd_client.h b/fs/ceph/osd_client.h new file mode 100644 index 000000000000..9a4addf7d651 --- /dev/null +++ b/fs/ceph/osd_client.h | |||
@@ -0,0 +1,144 @@ | |||
1 | #ifndef _FS_CEPH_OSD_CLIENT_H | ||
2 | #define _FS_CEPH_OSD_CLIENT_H | ||
3 | |||
4 | #include <linux/completion.h> | ||
5 | #include <linux/mempool.h> | ||
6 | #include <linux/rbtree.h> | ||
7 | |||
8 | #include "types.h" | ||
9 | #include "osdmap.h" | ||
10 | #include "messenger.h" | ||
11 | |||
12 | struct ceph_msg; | ||
13 | struct ceph_snap_context; | ||
14 | struct ceph_osd_request; | ||
15 | struct ceph_osd_client; | ||
16 | |||
17 | /* | |
18 | * completion callback for async writepages | |
19 | */ | |
20 | typedef void (*ceph_osdc_callback_t)(struct ceph_osd_request *, | |
21 | struct ceph_msg *); /* type of r_callback and r_safe_callback in struct ceph_osd_request; the msg argument is presumably the reply -- confirm */ | |
22 | |||
23 | /* a given osd we're communicating with */ | |
24 | struct ceph_osd { | |
25 | atomic_t o_ref; /* presumably a reference count -- confirm */ | |
26 | struct ceph_osd_client *o_osdc; /* osd client pointer (presumably the owner) */ | |
27 | int o_osd; /* presumably the osd's numeric id -- confirm */ | |
28 | int o_incarnation; | |
29 | struct rb_node o_node; /* rbtree linkage; presumably into ceph_osd_client.osds */ | |
30 | struct ceph_connection o_con; /* connection, embedded by value (not a pointer) */ | |
31 | struct list_head o_requests; /* presumably requests linked via r_osd_item -- confirm */ | |
32 | }; | |
33 | |||
34 | /* an in-flight request */ | |
35 | struct ceph_osd_request { | |
36 | u64 r_tid; /* unique for this client */ | |
37 | struct rb_node r_node; /* rbtree linkage; presumably into ceph_osd_client.requests -- confirm */ | |
38 | struct list_head r_osd_item; /* list linkage; presumably on r_osd->o_requests -- confirm */ | |
39 | struct ceph_osd *r_osd; /* osd associated with this request */ | |
40 | |||
41 | struct ceph_msg *r_request, *r_reply; /* request message and reply message */ | |
42 | int r_result; | |
43 | int r_flags; /* any additional flags for the osd */ | |
44 | u32 r_sent; /* >0 if r_request is sending/sent */ | |
45 | int r_prepared_pages, r_got_reply; | |
46 | |||
47 | struct ceph_osd_client *r_osdc; /* osd client pointer (presumably the owner) */ | |
48 | atomic_t r_ref; /* incremented by ceph_osdc_get_request() */ | |
49 | bool r_mempool; /* presumably set when allocated from req_mempool -- confirm */ | |
50 | struct completion r_completion, r_safe_completion; | |
51 | ceph_osdc_callback_t r_callback, r_safe_callback; /* optional callbacks; see ceph_osdc_callback_t */ | |
52 | struct ceph_eversion r_reassert_version; | |
53 | struct list_head r_unsafe_item; | |
54 | |||
55 | struct inode *r_inode; /* for use by callbacks */ | |
56 | struct writeback_control *r_wbc; /* ditto */ | |
57 | |||
58 | char r_oid[40]; /* object name */ | |
59 | int r_oid_len; /* presumably the used length of r_oid -- confirm */ | |
60 | unsigned long r_timeout_stamp; | |
61 | bool r_resend; /* msg send failed, needs retry */ | |
62 | |||
63 | struct ceph_file_layout r_file_layout; /* layout, stored by value */ | |
64 | struct ceph_snap_context *r_snapc; /* snap context for writes */ | |
65 | unsigned r_num_pages; /* size of page array (follows) */ | |
66 | struct page **r_pages; /* pages for data payload */ | |
67 | int r_pages_from_pool; | |
68 | int r_own_pages; /* if true, i own page list */ | |
69 | }; | |
70 | |||
71 | struct ceph_osd_client { /* osd client state: current map, known osds, pending requests */ | |
72 | struct ceph_client *client; | |
73 | |||
74 | struct ceph_osdmap *osdmap; /* current map */ | |
75 | struct rw_semaphore map_sem; /* presumably guards osdmap -- confirm */ | |
76 | struct completion map_waiters; | |
77 | u64 last_requested_map; | |
78 | |||
79 | struct mutex request_mutex; /* presumably guards the osds/requests trees -- confirm */ | |
80 | struct rb_root osds; /* osds (rbtree root; cf. o_node in struct ceph_osd) */ | |
81 | u64 timeout_tid; /* tid of timeout triggering rq */ | |
82 | u64 last_tid; /* tid of last request */ | |
83 | struct rb_root requests; /* pending requests (rbtree root; cf. r_node in struct ceph_osd_request) */ | |
84 | int num_requests; /* presumably the number of entries in requests -- confirm */ | |
85 | struct delayed_work timeout_work; | |
86 | struct dentry *debugfs_file; | |
87 | |||
88 | mempool_t *req_mempool; /* presumably backs requests created with use_mempool -- confirm */ | |
89 | |||
90 | struct ceph_msgpool msgpool_op; | |
91 | struct ceph_msgpool msgpool_op_reply; | |
92 | }; | |
93 | |||
94 | extern int ceph_osdc_init(struct ceph_osd_client *osdc, | |
95 | struct ceph_client *client); /* returns int; presumably 0 or a negative errno -- confirm */ | |
96 | extern void ceph_osdc_stop(struct ceph_osd_client *osdc); /* presumably the teardown counterpart of ceph_osdc_init -- confirm */ | |
97 | |||
98 | extern void ceph_osdc_handle_reply(struct ceph_osd_client *osdc, | |
99 | struct ceph_msg *msg); /* takes an incoming message; no status is returned */ | |
100 | extern void ceph_osdc_handle_map(struct ceph_osd_client *osdc, | |
101 | struct ceph_msg *msg); /* takes an incoming message; no status is returned */ | |
102 | |||
103 | extern struct ceph_osd_request *ceph_osdc_new_request(struct ceph_osd_client *, | |
104 | struct ceph_file_layout *layout, | |
105 | struct ceph_vino vino, | |
106 | u64 offset, u64 *len, int op, int flags, /* len is passed by pointer, so the callee may adjust it -- confirm how */ | |
107 | struct ceph_snap_context *snapc, | |
108 | int do_sync, u32 truncate_seq, | |
109 | u64 truncate_size, | |
110 | struct timespec *mtime, | |
111 | bool use_mempool, int num_reply); /* returns a request pointer; failure convention (NULL vs ERR_PTR) is not visible here */ | |
112 | |||
113 | static inline void ceph_osdc_get_request(struct ceph_osd_request *req) | |
114 | { | |
115 | atomic_inc(&req->r_ref); /* atomically bump r_ref; req must be non-NULL (dereferenced unconditionally) */ | |
116 | } | |
117 | extern void ceph_osdc_put_request(struct ceph_osd_request *req); /* presumably drops what ceph_osdc_get_request() took -- confirm */ | |
118 | |||
119 | extern int ceph_osdc_start_request(struct ceph_osd_client *osdc, | |
120 | struct ceph_osd_request *req, | |
121 | bool nofail); /* returns int; presumably 0 or a negative errno -- confirm */ | |
122 | extern int ceph_osdc_wait_request(struct ceph_osd_client *osdc, | |
123 | struct ceph_osd_request *req); /* returns int; presumably the request's result -- confirm */ | |
124 | extern void ceph_osdc_sync(struct ceph_osd_client *osdc); | |
125 | |||
126 | extern int ceph_osdc_readpages(struct ceph_osd_client *osdc, | |
127 | struct ceph_vino vino, | |
128 | struct ceph_file_layout *layout, | |
129 | u64 off, u64 *plen, /* plen is passed by pointer, so the callee may adjust it -- confirm how */ | |
130 | u32 truncate_seq, u64 truncate_size, | |
131 | struct page **pages, int nr_pages); /* pages: array of page pointers, nr_pages: its count (presumably) */ | |
132 | |||
133 | extern int ceph_osdc_writepages(struct ceph_osd_client *osdc, | |
134 | struct ceph_vino vino, | |
135 | struct ceph_file_layout *layout, | |
136 | struct ceph_snap_context *sc, | |
137 | u64 off, u64 len, /* unlike ceph_osdc_readpages, len is passed by value here */ | |
138 | u32 truncate_seq, u64 truncate_size, | |
139 | struct timespec *mtime, | |
140 | struct page **pages, int nr_pages, | |
141 | int flags, int do_sync, bool nofail); /* returns int; success/failure convention is not visible in this header */ | |
142 | |||
143 | #endif | ||
144 | |||