]>
Commit | Line | Data |
---|---|---|
f24e9980 SW |
1 | #ifndef _FS_CEPH_OSD_CLIENT_H |
2 | #define _FS_CEPH_OSD_CLIENT_H | |
3 | ||
4 | #include <linux/completion.h> | |
415e49a9 | 5 | #include <linux/kref.h> |
f24e9980 SW |
6 | #include <linux/mempool.h> |
7 | #include <linux/rbtree.h> | |
02113a0f | 8 | #include <linux/refcount.h> |
f24e9980 | 9 | |
6c4a1915 AE |
10 | #include <linux/ceph/types.h> |
11 | #include <linux/ceph/osdmap.h> | |
12 | #include <linux/ceph/messenger.h> | |
b2aa5d0b | 13 | #include <linux/ceph/msgpool.h> |
6c4a1915 | 14 | #include <linux/ceph/auth.h> |
c885837f | 15 | #include <linux/ceph/pagelist.h> |
f24e9980 SW |
16 | |
17 | struct ceph_msg; | |
18 | struct ceph_snap_context; | |
19 | struct ceph_osd_request; | |
20 | struct ceph_osd_client; | |
21 | ||
22 | /* | |
23 | * completion callback for async writepages; takes a pointer to a ceph_osd_request and is the type of ceph_osd_request.r_callback | |
24 | */ | |
85e084fe | 25 | typedef void (*ceph_osdc_callback_t)(struct ceph_osd_request *); |
f24e9980 | 26 | |
63244fa1 ID |
27 | #define CEPH_HOMELESS_OSD -1 /* NOTE(review): presumably the osd number used when there is no real target osd (cf. ceph_osd_client.homeless_osd) - confirm */ |
28 | ||
f24e9980 SW |
29 | /* a given osd we're communicating with */ |
30 | struct ceph_osd { | |
02113a0f | 31 | refcount_t o_ref; /* reference count */ |
f24e9980 SW |
32 | struct ceph_osd_client *o_osdc; /* the osd client associated with this osd */ |
33 | int o_osd; /* NOTE(review): presumably the osd number, CEPH_HOMELESS_OSD for the homeless osd - confirm */ | |
34 | int o_incarnation; | |
35 | struct rb_node o_node; /* rbtree linkage - NOTE(review): presumably in ceph_osd_client.osds, confirm */ | |
36 | struct ceph_connection o_con; /* connection object, embedded by value */ | |
5aea3dcd | 37 | struct rb_root o_requests; /* rbtree root - NOTE(review): presumably of ceph_osd_request via r_node, confirm */ |
922dab61 | 38 | struct rb_root o_linger_requests; /* rbtree root - NOTE(review): presumably of ceph_osd_linger_request via node, confirm */ |
f5a2041b | 39 | struct list_head o_osd_lru; /* list linkage - NOTE(review): presumably on ceph_osd_client.osd_lru, confirm */ |
6c4a1915 | 40 | struct ceph_auth_handshake o_auth; |
f5a2041b | 41 | unsigned long lru_ttl; |
422d2cb8 | 42 | struct list_head o_keepalive_item; |
5aea3dcd | 43 | struct mutex lock; |
f24e9980 SW |
44 | }; |
45 | ||
3f1af42a ID |
46 | #define CEPH_OSD_SLAB_OPS 2 |
47 | #define CEPH_OSD_MAX_OPS 16 /* NOTE(review): presumably the upper bound on ceph_osd_request.r_num_ops - confirm */ | |
1b83bef2 | 48 | |
2ac2b7a6 | 49 | enum ceph_osd_data_type { /* type tag stored in ceph_osd_data.type */ |
ec9123c5 | 50 | CEPH_OSD_DATA_TYPE_NONE = 0, /* explicitly zero, so a zeroed ceph_osd_data has this type */ |
2ac2b7a6 | 51 | CEPH_OSD_DATA_TYPE_PAGES, |
9a5e6d09 | 52 | CEPH_OSD_DATA_TYPE_PAGELIST, |
2ac2b7a6 AE |
53 | #ifdef CONFIG_BLOCK |
54 | CEPH_OSD_DATA_TYPE_BIO, /* only defined when CONFIG_BLOCK is set */ | |
55 | #endif /* CONFIG_BLOCK */ | |
56 | }; | |
57 | ||
2794a82a | 58 | struct ceph_osd_data { /* a type tag plus an anonymous union of payload descriptions; NOTE(review): tag-to-member mapping is inferred from the names - confirm */ |
2ac2b7a6 AE |
59 | enum ceph_osd_data_type type; |
60 | union { | |
2794a82a AE |
61 | struct { /* page-vector form - NOTE(review): presumably CEPH_OSD_DATA_TYPE_PAGES */ |
62 | struct page **pages; | |
e0c59487 | 63 | u64 length; |
2794a82a AE |
64 | u32 alignment; |
65 | bool pages_from_pool; | |
66 | bool own_pages; | |
67 | }; | |
9a5e6d09 | 68 | struct ceph_pagelist *pagelist; /* pagelist form - NOTE(review): presumably CEPH_OSD_DATA_TYPE_PAGELIST */ |
2794a82a | 69 | #ifdef CONFIG_BLOCK |
fdce58cc AE |
70 | struct { /* bio form, only with CONFIG_BLOCK - NOTE(review): presumably CEPH_OSD_DATA_TYPE_BIO */ |
71 | struct bio *bio; /* list of bios */ | |
72 | size_t bio_length; /* total in list */ | |
73 | }; | |
2794a82a AE |
74 | #endif /* CONFIG_BLOCK */ |
75 | }; | |
76 | }; | |
77 | ||
79528734 AE |
78 | struct ceph_osd_req_op { /* element type of ceph_osd_request.r_ops[] */ |
79 | u16 op; /* CEPH_OSD_OP_* */ | |
7b25bf5f | 80 | u32 flags; /* CEPH_OSD_OP_FLAG_* */ |
de2aa102 | 81 | u32 indata_len; /* request */ |
7665d85b YZ |
82 | u32 outdata_len; /* reply */ |
83 | s32 rval; | |
84 | ||
79528734 | 85 | union { /* per-operation parameters; NOTE(review): the member in use is presumably selected by op - confirm */ |
49719778 | 86 | struct ceph_osd_data raw_data_in; |
79528734 AE |
87 | struct { |
88 | u64 offset, length; | |
89 | u64 truncate_size; | |
90 | u32 truncate_seq; | |
5476492f | 91 | struct ceph_osd_data osd_data; |
79528734 | 92 | } extent; |
d74b50be | 93 | struct { |
d7d5a007 ID |
94 | u32 name_len; |
95 | u32 value_len; | |
d74b50be YZ |
96 | __u8 cmp_op; /* CEPH_OSD_CMPXATTR_OP_* */ |
97 | __u8 cmp_mode; /* CEPH_OSD_CMPXATTR_MODE_* */ | |
98 | struct ceph_osd_data osd_data; | |
99 | } xattr; | |
79528734 AE |
100 | struct { |
101 | const char *class_name; | |
102 | const char *method_name; | |
5476492f | 103 | struct ceph_osd_data request_info; |
04017e29 | 104 | struct ceph_osd_data request_data; |
5476492f | 105 | struct ceph_osd_data response_data; |
79528734 AE |
106 | __u8 class_len; |
107 | __u8 method_len; | |
bb873b53 | 108 | u32 indata_len; /* separate field from the outer indata_len above; NOTE(review): confirm how the two relate */ |
79528734 AE |
109 | } cls; |
110 | struct { | |
111 | u64 cookie; | |
922dab61 ID |
112 | __u8 op; /* CEPH_OSD_WATCH_OP_* */ |
113 | u32 gen; | |
79528734 | 114 | } watch; |
922dab61 ID |
115 | struct { |
116 | struct ceph_osd_data request_data; | |
117 | } notify_ack; | |
19079203 ID |
118 | struct { |
119 | u64 cookie; | |
120 | struct ceph_osd_data request_data; | |
121 | struct ceph_osd_data response_data; | |
122 | } notify; | |
a4ed38d7 DF |
123 | struct { |
124 | struct ceph_osd_data response_data; | |
125 | } list_watchers; | |
c647b8a8 ID |
126 | struct { |
127 | u64 expected_object_size; | |
128 | u64 expected_write_size; | |
129 | } alloc_hint; | |
79528734 AE |
130 | }; |
131 | }; | |
132 | ||
63244fa1 ID |
133 | struct ceph_osd_request_target { /* embedded in ceph_osd_request (as r_t) and in ceph_osd_linger_request (as t) */ |
134 | struct ceph_object_id base_oid; /* reachable as r_base_oid on a ceph_osd_request */ | |
135 | struct ceph_object_locator base_oloc; /* reachable as r_base_oloc on a ceph_osd_request */ | |
136 | struct ceph_object_id target_oid; | |
137 | struct ceph_object_locator target_oloc; | |
138 | ||
139 | struct ceph_pg pgid; | |
140 | u32 pg_num; | |
141 | u32 pg_num_mask; | |
142 | struct ceph_osds acting; | |
143 | struct ceph_osds up; | |
144 | int size; | |
145 | int min_size; | |
146 | bool sort_bitwise; | |
147 | ||
148 | unsigned int flags; /* CEPH_OSD_FLAG_*; reachable as r_flags on a ceph_osd_request */ | |
149 | bool paused; | |
150 | ||
dc93e0e2 ID |
151 | u32 last_force_resend; |
152 | ||
63244fa1 ID |
153 | int osd; /* NOTE(review): presumably the selected osd number, or CEPH_HOMELESS_OSD - confirm */ |
154 | }; | |
155 | ||
f24e9980 SW |
156 | /* an in-flight request */ |
157 | struct ceph_osd_request { | |
158 | u64 r_tid; /* unique for this client */ | |
159 | struct rb_node r_node; | |
4609245e | 160 | struct rb_node r_mc_node; /* map check */ |
f24e9980 | 161 | struct ceph_osd *r_osd; |
a66dd383 ID |
162 | |
163 | struct ceph_osd_request_target r_t; /* r_base_oid, r_base_oloc and r_flags below are macro aliases for members of r_t */ | |
164 | #define r_base_oid r_t.base_oid | |
165 | #define r_base_oloc r_t.base_oloc | |
166 | #define r_flags r_t.flags | |
f24e9980 SW |
167 | |
168 | struct ceph_msg *r_request, *r_reply; | |
f24e9980 | 169 | u32 r_sent; /* >0 if r_request is sending/sent */ |
1b83bef2 | 170 | |
79528734 AE |
171 | /* request osd ops array */ |
172 | unsigned int r_num_ops; | |
79528734 | 173 | |
1b83bef2 | 174 | int r_result; |
f24e9980 SW |
175 | |
176 | struct ceph_osd_client *r_osdc; | |
415e49a9 | 177 | struct kref r_kref; /* reference count - NOTE(review): presumably managed via ceph_osdc_get_request() and ceph_osdc_put_request(), confirm */ |
f24e9980 | 178 | bool r_mempool; |
b18b9550 | 179 | struct completion r_completion; /* private to osd_client.c */ |
26be8808 | 180 | ceph_osdc_callback_t r_callback; |
f24e9980 SW |
181 | struct list_head r_unsafe_item; |
182 | ||
183 | struct inode *r_inode; /* for use by callbacks */ | |
3d14c5d2 | 184 | void *r_priv; /* for use by callbacks */ |
f24e9980 | 185 | |
bb873b53 ID |
186 | /* set by submitter */ |
187 | u64 r_snapid; /* for reads, CEPH_NOSNAP otherwise */ | |
188 | struct ceph_snap_context *r_snapc; /* for writes */ | |
189 | struct timespec r_mtime; /* for writes */ | |
190 | u64 r_data_offset; /* for writes */ | |
922dab61 | 191 | bool r_linger; /* don't resend on failure */ |
a1f4020a | 192 | bool r_abort_on_full; /* return ENOSPC when full */ |
f24e9980 | 193 | |
bb873b53 ID |
194 | /* internal */ |
195 | unsigned long r_stamp; /* jiffies, send or check time */ | |
7cc5e38f | 196 | unsigned long r_start_stamp; /* jiffies */ |
bb873b53 | 197 | int r_attempts; |
4609245e | 198 | u32 r_map_dne_bound; |
3f1af42a ID |
199 | |
200 | struct ceph_osd_req_op r_ops[]; /* flexible array member, must stay last; NOTE(review): presumably r_num_ops entries - confirm */ | |
f24e9980 SW |
201 | }; |
202 | ||
205ee118 ID |
203 | struct ceph_request_redirect { /* currently wraps a single object locator */ |
204 | struct ceph_object_locator oloc; | |
205 | }; | |
206 | ||
922dab61 ID |
207 | typedef void (*rados_watchcb2_t)(void *arg, u64 notify_id, u64 cookie, |
208 | u64 notifier_id, void *data, size_t data_len); /* type of ceph_osd_linger_request.wcb and of the wcb argument of ceph_osdc_watch() */ | |
209 | typedef void (*rados_watcherrcb_t)(void *arg, u64 cookie, int err); /* type of ceph_osd_linger_request.errcb and of the errcb argument of ceph_osdc_watch() */ | |
210 | ||
211 | struct ceph_osd_linger_request { /* state for a watch or a notify (see is_watch); ceph_osdc_watch() returns a pointer to one */ | |
a40c4f10 | 212 | struct ceph_osd_client *osdc; |
922dab61 ID |
213 | u64 linger_id; |
214 | bool committed; | |
19079203 | 215 | bool is_watch; /* watch or notify */ |
922dab61 ID |
216 | |
217 | struct ceph_osd *osd; | |
218 | struct ceph_osd_request *reg_req; | |
219 | struct ceph_osd_request *ping_req; | |
220 | unsigned long ping_sent; | |
b07d3c4b ID |
221 | unsigned long watch_valid_thru; |
222 | struct list_head pending_lworks; | |
922dab61 ID |
223 | |
224 | struct ceph_osd_request_target t; /* same target type that ceph_osd_request embeds as r_t */ | |
4609245e | 225 | u32 map_dne_bound; |
922dab61 ID |
226 | |
227 | struct timespec mtime; | |
228 | ||
a40c4f10 | 229 | struct kref kref; /* reference count */ |
922dab61 ID |
230 | struct mutex lock; |
231 | struct rb_node node; /* osd */ | |
232 | struct rb_node osdc_node; /* osdc */ | |
4609245e | 233 | struct rb_node mc_node; /* map check */ |
922dab61 ID |
234 | struct list_head scan_item; |
235 | ||
236 | struct completion reg_commit_wait; | |
19079203 | 237 | struct completion notify_finish_wait; |
922dab61 | 238 | int reg_commit_error; |
19079203 | 239 | int notify_finish_error; |
922dab61 ID |
240 | int last_error; |
241 | ||
242 | u32 register_gen; | |
19079203 | 243 | u64 notify_id; |
a40c4f10 | 244 | |
922dab61 ID |
245 | rados_watchcb2_t wcb; /* wcb, errcb and data share their names with the ceph_osdc_watch() parameters */ |
246 | rados_watcherrcb_t errcb; | |
247 | void *data; | |
19079203 ID |
248 | |
249 | struct page ***preply_pages; /* preply_pages and preply_len share their names with the ceph_osdc_notify() parameters */ | |
250 | size_t *preply_len; | |
a40c4f10 YS |
251 | }; |
252 | ||
a4ed38d7 DF |
253 | struct ceph_watch_item { /* result type handed back through the watchers argument of ceph_osdc_list_watchers() */ |
254 | struct ceph_entity_name name; | |
255 | u64 cookie; | |
256 | struct ceph_entity_addr addr; | |
257 | }; | |
258 | ||
264048af ID |
259 | #define CEPH_LINGER_ID_START 0xffff000000000000ULL /* NOTE(review): presumably the starting value for ceph_osd_client.last_linger_id - confirm */ |
260 | ||
f24e9980 SW |
261 | struct ceph_osd_client { /* osd client state; passed as osdc to the ceph_osdc_* functions declared in this header */ |
262 | struct ceph_client *client; | |
263 | ||
264 | struct ceph_osdmap *osdmap; /* current map; its flags are read by ceph_osdmap_flag() */ | |
5aea3dcd | 265 | struct rw_semaphore lock; |
f24e9980 | 266 | |
f24e9980 | 267 | struct rb_root osds; /* osds */ |
f5a2041b | 268 | struct list_head osd_lru; /* idle osds */ |
9dd2845c | 269 | spinlock_t osd_lru_lock; /* NOTE(review): presumably protects osd_lru - confirm */ |
58eb7932 | 270 | u32 epoch_barrier; |
5aea3dcd ID |
271 | struct ceph_osd homeless_osd; /* a struct ceph_osd embedded by value */ |
272 | atomic64_t last_tid; /* tid of last request */ | |
922dab61 ID |
273 | u64 last_linger_id; |
274 | struct rb_root linger_requests; /* lingering requests */ | |
4609245e ID |
275 | struct rb_root map_checks; |
276 | struct rb_root linger_map_checks; | |
5aea3dcd ID |
277 | atomic_t num_requests; |
278 | atomic_t num_homeless; | |
f24e9980 | 279 | struct delayed_work timeout_work; |
f5a2041b | 280 | struct delayed_work osds_timeout_work; |
039934b8 | 281 | #ifdef CONFIG_DEBUG_FS |
f24e9980 | 282 | struct dentry *debugfs_file; /* only present when CONFIG_DEBUG_FS is set */ |
039934b8 | 283 | #endif |
f24e9980 SW |
284 | |
285 | mempool_t *req_mempool; | |
286 | ||
0d59ab81 | 287 | struct ceph_msgpool msgpool_op; |
c16e7869 | 288 | struct ceph_msgpool msgpool_op_reply; |
a40c4f10 | 289 | |
a40c4f10 | 290 | struct workqueue_struct *notify_wq; |
f24e9980 SW |
291 | }; |
292 | ||
b7ec35b3 ID |
293 | static inline bool ceph_osdmap_flag(struct ceph_osd_client *osdc, int flag) /* tests flag against the flags of the client's current osdmap */ |
294 | { | |
295 | return osdc->osdmap->flags & flag; /* true when any bit of flag is set; osdc and osdc->osdmap are dereferenced without a NULL check */ | |
296 | } | |
297 | ||
5522ae0b AE |
298 | extern int ceph_osdc_setup(void); /* takes no osdc - NOTE(review): presumably module-wide setup paired with ceph_osdc_cleanup(), confirm */ |
299 | extern void ceph_osdc_cleanup(void); | |
300 | ||
f24e9980 SW |
301 | extern int ceph_osdc_init(struct ceph_osd_client *osdc, |
302 | struct ceph_client *client); /* NOTE(review): presumably initialises *osdc for client and is undone by ceph_osdc_stop() - confirm */ | |
303 | extern void ceph_osdc_stop(struct ceph_osd_client *osdc); | |
304 | ||
305 | extern void ceph_osdc_handle_reply(struct ceph_osd_client *osdc, | |
306 | struct ceph_msg *msg); | |
307 | extern void ceph_osdc_handle_map(struct ceph_osd_client *osdc, | |
308 | struct ceph_msg *msg); | |
58eb7932 | 309 | void ceph_osdc_update_epoch_barrier(struct ceph_osd_client *osdc, u32 eb); /* eb: NOTE(review): presumably relates to ceph_osd_client.epoch_barrier - confirm */ |
f24e9980 | 310 | |
49719778 | 311 | extern void osd_req_op_init(struct ceph_osd_request *osd_req, |
144cba14 | 312 | unsigned int which, u16 opcode, u32 flags); /* which: NOTE(review): presumably an index into osd_req->r_ops[], here and in every osd_req_op_* declaration below - confirm */ |
49719778 AE |
313 | |
314 | extern void osd_req_op_raw_data_in_pages(struct ceph_osd_request *, | |
315 | unsigned int which, | |
316 | struct page **pages, u64 length, | |
317 | u32 alignment, bool pages_from_pool, | |
318 | bool own_pages); /* the page arguments have the same names and types as the page members of struct ceph_osd_data */ | |
319 | ||
c99d2d4a AE |
320 | extern void osd_req_op_extent_init(struct ceph_osd_request *osd_req, |
321 | unsigned int which, u16 opcode, | |
33803f33 AE |
322 | u64 offset, u64 length, |
323 | u64 truncate_size, u32 truncate_seq); /* arguments share names with the members of ceph_osd_req_op.extent */ | |
c99d2d4a AE |
324 | extern void osd_req_op_extent_update(struct ceph_osd_request *osd_req, |
325 | unsigned int which, u64 length); | |
2c63f49a YZ |
326 | extern void osd_req_op_extent_dup_last(struct ceph_osd_request *osd_req, |
327 | unsigned int which, u64 offset_inc); | |
a4ce40a9 AE |
328 | |
329 | extern struct ceph_osd_data *osd_req_op_extent_osd_data( | |
330 | struct ceph_osd_request *osd_req, | |
406e2c9f | 331 | unsigned int which); |
a4ce40a9 AE |
332 | |
333 | extern void osd_req_op_extent_osd_data_pages(struct ceph_osd_request *, | |
406e2c9f | 334 | unsigned int which, |
a4ce40a9 AE |
335 | struct page **pages, u64 length, |
336 | u32 alignment, bool pages_from_pool, | |
337 | bool own_pages); | |
338 | extern void osd_req_op_extent_osd_data_pagelist(struct ceph_osd_request *, | |
406e2c9f | 339 | unsigned int which, |
a4ce40a9 AE |
340 | struct ceph_pagelist *pagelist); |
341 | #ifdef CONFIG_BLOCK | |
342 | extern void osd_req_op_extent_osd_data_bio(struct ceph_osd_request *, | |
406e2c9f | 343 | unsigned int which, |
a4ce40a9 AE |
344 | struct bio *bio, size_t bio_length); /* declared only when CONFIG_BLOCK is set */ |
345 | #endif /* CONFIG_BLOCK */ | |
346 | ||
04017e29 AE |
347 | extern void osd_req_op_cls_request_data_pagelist(struct ceph_osd_request *, |
348 | unsigned int which, | |
349 | struct ceph_pagelist *pagelist); | |
6c57b554 AE |
350 | extern void osd_req_op_cls_request_data_pages(struct ceph_osd_request *, |
351 | unsigned int which, | |
352 | struct page **pages, u64 length, | |
353 | u32 alignment, bool pages_from_pool, | |
354 | bool own_pages); | |
a4ce40a9 | 355 | extern void osd_req_op_cls_response_data_pages(struct ceph_osd_request *, |
c99d2d4a | 356 | unsigned int which, |
a4ce40a9 AE |
357 | struct page **pages, u64 length, |
358 | u32 alignment, bool pages_from_pool, | |
359 | bool own_pages); | |
c99d2d4a AE |
360 | extern void osd_req_op_cls_init(struct ceph_osd_request *osd_req, |
361 | unsigned int which, u16 opcode, | |
04017e29 | 362 | const char *class, const char *method); |
d74b50be YZ |
363 | extern int osd_req_op_xattr_init(struct ceph_osd_request *osd_req, unsigned int which, |
364 | u16 opcode, const char *name, const void *value, | |
365 | size_t size, u8 cmp_op, u8 cmp_mode); /* returns int, unlike the other *_init declarations in this group, which return void */ | |
c647b8a8 ID |
366 | extern void osd_req_op_alloc_hint_init(struct ceph_osd_request *osd_req, |
367 | unsigned int which, | |
368 | u64 expected_object_size, | |
369 | u64 expected_write_size); /* arguments share names with the members of ceph_osd_req_op.alloc_hint */ | |
33803f33 | 370 | |
3499e8a5 | 371 | extern struct ceph_osd_request *ceph_osdc_alloc_request(struct ceph_osd_client *osdc, |
3499e8a5 | 372 | struct ceph_snap_context *snapc, |
acead002 | 373 | unsigned int num_ops, /* NOTE(review): presumably the number of r_ops[] entries to allocate - confirm */ |
3499e8a5 | 374 | bool use_mempool, |
54a54007 | 375 | gfp_t gfp_flags); |
13d1ad16 | 376 | int ceph_osdc_alloc_messages(struct ceph_osd_request *req, gfp_t gfp); |
3499e8a5 | 377 | |
f24e9980 SW |
378 | extern struct ceph_osd_request *ceph_osdc_new_request(struct ceph_osd_client *, |
379 | struct ceph_file_layout *layout, | |
380 | struct ceph_vino vino, | |
acead002 | 381 | u64 offset, u64 *len, /* len is passed by pointer - NOTE(review): presumably may be updated by the callee, confirm */ |
715e4cd4 YZ |
382 | unsigned int which, int num_ops, /* num_ops is int here but unsigned int in ceph_osdc_alloc_request() and in ceph_osd_request.r_num_ops */ |
383 | int opcode, int flags, | |
f24e9980 | 384 | struct ceph_snap_context *snapc, |
acead002 | 385 | u32 truncate_seq, u64 truncate_size, |
153e5167 | 386 | bool use_mempool); |
f24e9980 | 387 | |
9e94af20 ID |
388 | extern void ceph_osdc_get_request(struct ceph_osd_request *req); /* NOTE(review): get and put presumably take and drop a reference on req->r_kref - confirm */ |
389 | extern void ceph_osdc_put_request(struct ceph_osd_request *req); | |
f24e9980 SW |
390 | |
391 | extern int ceph_osdc_start_request(struct ceph_osd_client *osdc, | |
392 | struct ceph_osd_request *req, | |
393 | bool nofail); | |
c9f9b93d | 394 | extern void ceph_osdc_cancel_request(struct ceph_osd_request *req); |
f24e9980 SW |
395 | extern int ceph_osdc_wait_request(struct ceph_osd_client *osdc, |
396 | struct ceph_osd_request *req); | |
397 | extern void ceph_osdc_sync(struct ceph_osd_client *osdc); | |
398 | ||
dd935f44 | 399 | extern void ceph_osdc_flush_notifies(struct ceph_osd_client *osdc); |
7cca78c9 | 400 | void ceph_osdc_maybe_request_map(struct ceph_osd_client *osdc); |
dd935f44 | 401 | |
428a7158 DF |
402 | int ceph_osdc_call(struct ceph_osd_client *osdc, |
403 | struct ceph_object_id *oid, | |
404 | struct ceph_object_locator *oloc, | |
405 | const char *class, const char *method, | |
406 | unsigned int flags, | |
407 | struct page *req_page, size_t req_len, | |
408 | struct page *resp_page, size_t *resp_len); /* one request page and one response page; resp_len is a pointer - NOTE(review): presumably in/out, confirm */ | |
409 | ||
f24e9980 SW |
410 | extern int ceph_osdc_readpages(struct ceph_osd_client *osdc, |
411 | struct ceph_vino vino, | |
412 | struct ceph_file_layout *layout, | |
413 | u64 off, u64 *plen, /* length is passed by pointer here, whereas ceph_osdc_writepages() takes len by value */ | |
414 | u32 truncate_seq, u64 truncate_size, | |
b7495fc2 SW |
415 | struct page **pages, int nr_pages, |
416 | int page_align); | |
f24e9980 SW |
417 | |
418 | extern int ceph_osdc_writepages(struct ceph_osd_client *osdc, | |
419 | struct ceph_vino vino, | |
420 | struct ceph_file_layout *layout, | |
421 | struct ceph_snap_context *sc, | |
422 | u64 off, u64 len, | |
423 | u32 truncate_seq, u64 truncate_size, | |
424 | struct timespec *mtime, | |
24808826 | 425 | struct page **pages, int nr_pages); |
f24e9980 | 426 | |
922dab61 ID |
427 | /* watch/notify declarations; wcb, errcb and data below share their names with fields of struct ceph_osd_linger_request */ |
428 | struct ceph_osd_linger_request * | |
429 | ceph_osdc_watch(struct ceph_osd_client *osdc, | |
430 | struct ceph_object_id *oid, | |
431 | struct ceph_object_locator *oloc, | |
432 | rados_watchcb2_t wcb, | |
433 | rados_watcherrcb_t errcb, | |
434 | void *data); | |
435 | int ceph_osdc_unwatch(struct ceph_osd_client *osdc, | |
436 | struct ceph_osd_linger_request *lreq); /* lreq: NOTE(review): presumably a linger request returned by ceph_osdc_watch() - confirm */ | |
437 | ||
438 | int ceph_osdc_notify_ack(struct ceph_osd_client *osdc, | |
439 | struct ceph_object_id *oid, | |
440 | struct ceph_object_locator *oloc, | |
441 | u64 notify_id, | |
442 | u64 cookie, | |
443 | void *payload, | |
444 | size_t payload_len); | |
19079203 ID |
445 | int ceph_osdc_notify(struct ceph_osd_client *osdc, |
446 | struct ceph_object_id *oid, | |
447 | struct ceph_object_locator *oloc, | |
448 | void *payload, | |
449 | size_t payload_len, | |
450 | u32 timeout, /* NOTE(review): the unit of timeout is not visible in this header - confirm */ | |
451 | struct page ***preply_pages, /* preply_pages and preply_len share names and types with fields of struct ceph_osd_linger_request */ | |
452 | size_t *preply_len); | |
b07d3c4b ID |
453 | int ceph_osdc_watch_check(struct ceph_osd_client *osdc, |
454 | struct ceph_osd_linger_request *lreq); | |
a4ed38d7 DF |
455 | int ceph_osdc_list_watchers(struct ceph_osd_client *osdc, |
456 | struct ceph_object_id *oid, | |
457 | struct ceph_object_locator *oloc, | |
458 | struct ceph_watch_item **watchers, /* watchers and num_watchers are passed by pointer; NOTE(review): ownership of the returned items is not visible here - confirm */ | |
459 | u32 *num_watchers); | |
f24e9980 SW |
460 | #endif |
461 |