]>
Commit | Line | Data |
---|---|---|
f24e9980 SW |
1 | #ifndef _FS_CEPH_OSD_CLIENT_H |
2 | #define _FS_CEPH_OSD_CLIENT_H | |
3 | ||
4 | #include <linux/completion.h> | |
415e49a9 | 5 | #include <linux/kref.h> |
f24e9980 SW |
6 | #include <linux/mempool.h> |
7 | #include <linux/rbtree.h> | |
8 | ||
6c4a1915 AE |
9 | #include <linux/ceph/types.h> |
10 | #include <linux/ceph/osdmap.h> | |
11 | #include <linux/ceph/messenger.h> | |
12 | #include <linux/ceph/auth.h> | |
c885837f | 13 | #include <linux/ceph/pagelist.h> |
f24e9980 SW |
14 | |
15 | struct ceph_msg; | |
16 | struct ceph_snap_context; | |
17 | struct ceph_osd_request; | |
18 | struct ceph_osd_client; | |
4e7a5dcd | 19 | struct ceph_authorizer; |
f24e9980 SW |
20 | |
21 | /* | |
22 | * Callback types stored in struct ceph_osd_request (r_callback and r_unsafe_callback). ceph_osdc_callback_t is the completion callback for async writepages and receives the request plus a ceph_msg (presumably the reply; confirm). ceph_osdc_unsafe_callback_t receives the request plus a bool whose meaning is not visible in this header. | |
23 | */ | |
24 | typedef void (*ceph_osdc_callback_t)(struct ceph_osd_request *, | |
25 | struct ceph_msg *); | |
26be8808 | 26 | typedef void (*ceph_osdc_unsafe_callback_t)(struct ceph_osd_request *, bool); |
f24e9980 SW |
27 | |
28 | /* a given osd we're communicating with: embeds the connection (o_con) and auth handshake state (o_auth) and carries the list/tree linkage for this osd */ | |
29 | struct ceph_osd { | |
30 | atomic_t o_ref; /* NOTE(review): presumably a reference count; confirm */ | |
31 | struct ceph_osd_client *o_osdc; /* osd client this osd is associated with */ | |
32 | int o_osd; /* NOTE(review): presumably the osd id; confirm */ | |
33 | int o_incarnation; | |
34 | struct rb_node o_node; /* NOTE(review): presumably links into ceph_osd_client.osds; confirm */ | |
35 | struct ceph_connection o_con; /* embedded by value, not a pointer */ | |
36 | struct list_head o_requests; | |
a40c4f10 | 37 | struct list_head o_linger_requests; |
f5a2041b | 38 | struct list_head o_osd_lru; /* NOTE(review): presumably entry on ceph_osd_client.osd_lru (idle osds); confirm */ |
6c4a1915 | 39 | struct ceph_auth_handshake o_auth; |
f5a2041b | 40 | unsigned long lru_ttl; /* NOTE(review): units not visible here, presumably jiffies; confirm */ |
422d2cb8 YS |
41 | int o_marked_for_keepalive; /* int used as a flag; semantics are defined by the implementation, not this header */ |
42 | struct list_head o_keepalive_item; | |
f24e9980 SW |
43 | }; |
44 | ||
1b83bef2 | 45 | |
3f1af42a ID |
46 | #define CEPH_OSD_SLAB_OPS 2 /* NOTE(review): presumably the op count covered by the slab-allocated request size; confirm against the allocator */ |
47 | #define CEPH_OSD_MAX_OPS 16 /* NOTE(review): presumably the upper bound on ops per request (r_num_ops); confirm */ | |
1b83bef2 | 48 | |
2ac2b7a6 | 49 | enum ceph_osd_data_type { /* type tag held in ceph_osd_data.type; each non-NONE value has a same-named member in that struct's union */ |
ec9123c5 | 50 | CEPH_OSD_DATA_TYPE_NONE = 0, /* explicitly zero, so zero-filled data reads as NONE */ |
2ac2b7a6 | 51 | CEPH_OSD_DATA_TYPE_PAGES, /* page vector (pages/length/alignment members) */ |
9a5e6d09 | 52 | CEPH_OSD_DATA_TYPE_PAGELIST, /* struct ceph_pagelist pointer */ |
2ac2b7a6 AE |
53 | #ifdef CONFIG_BLOCK |
54 | CEPH_OSD_DATA_TYPE_BIO, /* only defined when CONFIG_BLOCK is set */ | |
55 | #endif /* CONFIG_BLOCK */ | |
56 | }; | |
57 | ||
2794a82a | 58 | struct ceph_osd_data { /* tagged union describing one data payload: a page vector, a pagelist, or (with CONFIG_BLOCK) a bio list */ |
2ac2b7a6 AE |
59 | enum ceph_osd_data_type type; /* NOTE(review): presumably selects which union member below is valid; confirm */ |
60 | union { | |
2794a82a AE |
61 | struct { /* page-vector form (anonymous struct) */ |
62 | struct page **pages; | |
e0c59487 | 63 | u64 length; |
2794a82a AE |
64 | u32 alignment; /* NOTE(review): presumably the byte offset of the data within the first page; confirm */ |
65 | bool pages_from_pool; | |
66 | bool own_pages; /* NOTE(review): presumably means the request owns and releases the pages; confirm */ |
67 | }; | |
9a5e6d09 | 68 | struct ceph_pagelist *pagelist; /* pagelist form */ |
2794a82a | 69 | #ifdef CONFIG_BLOCK |
fdce58cc AE |
70 | struct { /* bio form, compiled in only with CONFIG_BLOCK */ |
71 | struct bio *bio; /* list of bios */ | |
72 | size_t bio_length; /* total in list */ | |
73 | }; | |
2794a82a AE |
74 | #endif /* CONFIG_BLOCK */ |
75 | }; | |
76 | }; | |
77 | ||
79528734 AE |
78 | struct ceph_osd_req_op { /* one op of a request; struct ceph_osd_request holds an array of these in r_ops[] */ |
79 | u16 op; /* CEPH_OSD_OP_* */ | |
7b25bf5f | 80 | u32 flags; /* CEPH_OSD_OP_FLAG_* */ |
de2aa102 | 81 | u32 indata_len; /* request */ |
7665d85b YZ |
82 | u32 outdata_len; /* reply */ |
83 | s32 rval; /* NOTE(review): presumably the per-op result taken from the reply; confirm */ | |
84 | ||
79528734 | 85 | union { /* anonymous union of per-op-kind arguments; NOTE(review): presumably the valid member is implied by op; confirm */ |
49719778 | 86 | struct ceph_osd_data raw_data_in; |
79528734 AE |
87 | struct { /* extent arguments, see osd_req_op_extent_init() */ |
88 | u64 offset, length; | |
89 | u64 truncate_size; | |
90 | u32 truncate_seq; | |
5476492f | 91 | struct ceph_osd_data osd_data; |
79528734 | 92 | } extent; |
d74b50be | 93 | struct { /* xattr arguments, see osd_req_op_xattr_init() */ |
d7d5a007 ID |
94 | u32 name_len; |
95 | u32 value_len; | |
d74b50be YZ |
96 | __u8 cmp_op; /* CEPH_OSD_CMPXATTR_OP_* */ |
97 | __u8 cmp_mode; /* CEPH_OSD_CMPXATTR_MODE_* */ | |
98 | struct ceph_osd_data osd_data; | |
99 | } xattr; | |
79528734 AE |
100 | struct { /* class-method call arguments, see osd_req_op_cls_init() */ |
101 | const char *class_name; | |
102 | const char *method_name; | |
5476492f | 103 | struct ceph_osd_data request_info; |
04017e29 | 104 | struct ceph_osd_data request_data; |
5476492f | 105 | struct ceph_osd_data response_data; |
79528734 AE |
106 | __u8 class_len; /* 8-bit, so a stored length cannot exceed 255 */ |
107 | __u8 method_len; /* 8-bit, so a stored length cannot exceed 255 */ | |
108 | __u8 argc; | |
109 | } cls; | |
110 | struct { /* watch arguments, see osd_req_op_watch_init() */ | |
111 | u64 cookie; | |
112 | u64 ver; | |
113 | u32 prot_ver; | |
114 | u32 timeout; | |
115 | __u8 flag; | |
116 | } watch; | |
c647b8a8 ID |
117 | struct { /* allocation hint arguments, see osd_req_op_alloc_hint_init() */ |
118 | u64 expected_object_size; | |
119 | u64 expected_write_size; | |
120 | } alloc_hint; | |
79528734 AE |
121 | }; |
122 | }; | |
123 | ||
f24e9980 SW |
124 | /* an in-flight request; allocated with a trailing variable-length array of ops (r_ops[]) */ |
125 | struct ceph_osd_request { | |
126 | u64 r_tid; /* unique for this client */ | |
127 | struct rb_node r_node; /* NOTE(review): presumably links into ceph_osd_client.requests; confirm */ | |
422d2cb8 | 128 | struct list_head r_req_lru_item; |
f24e9980 | 129 | struct list_head r_osd_item; |
a40c4f10 | 130 | struct list_head r_linger_item; |
1d0326b1 | 131 | struct list_head r_linger_osd_item; |
f24e9980 | 132 | struct ceph_osd *r_osd; |
5b191d99 | 133 | struct ceph_pg r_pgid; |
d85b7056 SW |
134 | int r_pg_osds[CEPH_PG_MAX_SIZE]; |
135 | int r_num_pg_osds; /* NOTE(review): presumably the number of valid entries in r_pg_osds[]; confirm */ | |
f24e9980 SW |
136 | |
137 | struct ceph_msg *r_request, *r_reply; | |
f24e9980 SW |
138 | int r_flags; /* any additional flags for the osd */ |
139 | u32 r_sent; /* >0 if r_request is sending/sent */ | |
1b83bef2 | 140 | |
79528734 AE |
141 | /* request osd ops array */ |
142 | unsigned int r_num_ops; /* NOTE(review): presumably the number of entries in r_ops[]; confirm */ | |
79528734 | 143 | |
1b83bef2 SW |
144 | /* these are updated on each send */ |
145 | __le32 *r_request_osdmap_epoch; | |
146 | __le32 *r_request_flags; | |
147 | __le64 *r_request_pool; | |
148 | void *r_request_pgid; | |
149 | __le32 *r_request_attempts; | |
d29adb34 | 150 | bool r_paused; |
1b83bef2 SW |
151 | struct ceph_eversion *r_request_reassert_version; |
152 | ||
153 | int r_result; | |
350b1c32 | 154 | int r_got_reply; |
a40c4f10 | 155 | int r_linger; |
f24e9980 SW |
156 | |
157 | struct ceph_osd_client *r_osdc; | |
415e49a9 | 158 | struct kref r_kref; /* NOTE(review): presumably taken and dropped via ceph_osdc_get_request() and ceph_osdc_put_request(); confirm */ |
f24e9980 SW |
159 | bool r_mempool; /* NOTE(review): presumably records the use_mempool choice made at allocation; confirm */ |
160 | struct completion r_completion, r_safe_completion; | |
26be8808 AE |
161 | ceph_osdc_callback_t r_callback; |
162 | ceph_osdc_unsafe_callback_t r_unsafe_callback; | |
f24e9980 SW |
163 | struct ceph_eversion r_reassert_version; |
164 | struct list_head r_unsafe_item; | |
165 | ||
166 | struct inode *r_inode; /* for use by callbacks */ | |
3d14c5d2 | 167 | void *r_priv; /* ditto */ |
f24e9980 | 168 | |
3c972c95 ID |
169 | struct ceph_object_locator r_base_oloc; |
170 | struct ceph_object_id r_base_oid; | |
205ee118 ID |
171 | struct ceph_object_locator r_target_oloc; |
172 | struct ceph_object_id r_target_oid; | |
22116525 | 173 | |
2169aea6 | 174 | u64 r_snapid; |
3dd72fc0 | 175 | unsigned long r_stamp; /* send OR check time */ |
f24e9980 | 176 | |
f24e9980 | 177 | struct ceph_snap_context *r_snapc; /* snap context for writes */ |
3f1af42a ID |
178 | |
179 | struct ceph_osd_req_op r_ops[]; /* flexible array member: must stay the last field */ | |
f24e9980 SW |
180 | }; |
181 | ||
205ee118 ID |
182 | struct ceph_request_redirect { /* wraps a single object locator; NOTE(review): presumably the locator a request is redirected to; confirm */ |
183 | struct ceph_object_locator oloc; | |
184 | }; | |
185 | ||
a40c4f10 YS |
186 | struct ceph_osd_event { /* watch/notify event record, created by ceph_osdc_create_event() */ |
187 | u64 cookie; | |
188 | int one_shot; | |
189 | struct ceph_osd_client *osdc; | |
190 | void (*cb)(u64, u64, u8, void *); /* same signature as the event_cb argument of ceph_osdc_create_event() */ | |
191 | void *data; /* NOTE(review): presumably handed to cb as its void * argument; confirm */ | |
192 | struct rb_node node; /* NOTE(review): presumably links into ceph_osd_client.event_tree; confirm */ | |
193 | struct list_head osd_node; | |
194 | struct kref kref; /* NOTE(review): presumably dropped via ceph_osdc_put_event(); confirm */ | |
a40c4f10 YS |
195 | }; |
196 | ||
197 | struct ceph_osd_event_work { /* work item that carries one event plus three scalar values */ | |
198 | struct work_struct work; /* NOTE(review): presumably queued on ceph_osd_client.notify_wq; confirm */ | |
199 | struct ceph_osd_event *event; | |
200 | u64 ver; | |
201 | u64 notify_id; | |
202 | u8 opcode; /* NOTE(review): ver, notify_id and opcode have the same types as the (u64, u64, u8) arguments of ceph_osd_event.cb; confirm they are passed through */ | |
203 | }; | |
204 | ||
f24e9980 SW |
205 | struct ceph_osd_client { /* per-client osd state: current map, osd and request trees and lists, timers, pools, and watch/notify event bookkeeping */ |
206 | struct ceph_client *client; | |
207 | ||
208 | struct ceph_osdmap *osdmap; /* current map */ | |
209 | struct rw_semaphore map_sem; /* NOTE(review): presumably guards osdmap; confirm */ | |
210 | struct completion map_waiters; | |
211 | u64 last_requested_map; | |
212 | ||
213 | struct mutex request_mutex; /* NOTE(review): presumably guards the osd and request collections below; confirm */ | |
214 | struct rb_root osds; /* osds */ | |
f5a2041b | 215 | struct list_head osd_lru; /* idle osds */ |
f24e9980 SW |
216 | u64 timeout_tid; /* tid of timeout triggering rq */ |
217 | u64 last_tid; /* tid of last request */ | |
218 | struct rb_root requests; /* pending requests */ | |
6f6c7006 SW |
219 | struct list_head req_lru; /* in-flight lru */ |
220 | struct list_head req_unsent; /* unsent/need-resend queue */ | |
221 | struct list_head req_notarget; /* map to no osd */ | |
a40c4f10 | 222 | struct list_head req_linger; /* lingering requests */ |
f24e9980 SW |
223 | int num_requests; |
224 | struct delayed_work timeout_work; | |
f5a2041b | 225 | struct delayed_work osds_timeout_work; |
039934b8 | 226 | #ifdef CONFIG_DEBUG_FS |
f24e9980 | 227 | struct dentry *debugfs_file; /* field exists only when CONFIG_DEBUG_FS is set */ |
039934b8 | 228 | #endif |
f24e9980 SW |
229 | |
230 | mempool_t *req_mempool; | |
231 | ||
0d59ab81 | 232 | struct ceph_msgpool msgpool_op; |
c16e7869 | 233 | struct ceph_msgpool msgpool_op_reply; |
a40c4f10 YS |
234 | |
235 | spinlock_t event_lock; /* NOTE(review): presumably guards event_tree and event_count; confirm */ | |
236 | struct rb_root event_tree; | |
237 | u64 event_count; | |
238 | ||
239 | struct workqueue_struct *notify_wq; | |
f24e9980 SW |
240 | }; |
241 | ||
5522ae0b AE |
242 | extern int ceph_osdc_setup(void); /* takes no client; NOTE(review): presumably one-time global setup paired with ceph_osdc_cleanup(); confirm */ |
243 | extern void ceph_osdc_cleanup(void); | |
244 | ||
f24e9980 SW |
245 | extern int ceph_osdc_init(struct ceph_osd_client *osdc, |
246 | struct ceph_client *client); /* per-client counterpart; returns int, presumably 0 or a negative errno; confirm */ | |
247 | extern void ceph_osdc_stop(struct ceph_osd_client *osdc); | |
248 | ||
249 | extern void ceph_osdc_handle_reply(struct ceph_osd_client *osdc, | |
250 | struct ceph_msg *msg); /* both handlers take the client and one ceph_msg and return nothing */ | |
251 | extern void ceph_osdc_handle_map(struct ceph_osd_client *osdc, | |
252 | struct ceph_msg *msg); | |
253 | ||
49719778 | 254 | extern void osd_req_op_init(struct ceph_osd_request *osd_req, |
144cba14 | 255 | unsigned int which, u16 opcode, u32 flags); /* NOTE(review): which is presumably an index into osd_req->r_ops[]; confirm */ |
49719778 AE |
256 | |
257 | extern void osd_req_op_raw_data_in_pages(struct ceph_osd_request *, | |
258 | unsigned int which, | |
259 | struct page **pages, u64 length, | |
260 | u32 alignment, bool pages_from_pool, | |
261 | bool own_pages); /* the page arguments mirror the page-vector members of struct ceph_osd_data */ | |
262 | ||
c99d2d4a AE |
263 | extern void osd_req_op_extent_init(struct ceph_osd_request *osd_req, |
264 | unsigned int which, u16 opcode, | |
33803f33 AE |
265 | u64 offset, u64 length, |
266 | u64 truncate_size, u32 truncate_seq); /* arguments mirror the fields of ceph_osd_req_op.extent */ | |
c99d2d4a AE |
267 | extern void osd_req_op_extent_update(struct ceph_osd_request *osd_req, |
268 | unsigned int which, u64 length); | |
a4ce40a9 AE |
269 | |
270 | extern struct ceph_osd_data *osd_req_op_extent_osd_data( | |
271 | struct ceph_osd_request *osd_req, | |
406e2c9f | 272 | unsigned int which); /* NOTE(review): presumably returns the address of r_ops[which].extent.osd_data; confirm */ |
a4ce40a9 AE |
273 | extern struct ceph_osd_data *osd_req_op_cls_response_data( |
274 | struct ceph_osd_request *osd_req, | |
275 | unsigned int which); /* NOTE(review): presumably returns the address of r_ops[which].cls.response_data; confirm */ | |
276 | ||
277 | extern void osd_req_op_extent_osd_data_pages(struct ceph_osd_request *, | |
406e2c9f | 278 | unsigned int which, |
a4ce40a9 AE |
279 | struct page **pages, u64 length, |
280 | u32 alignment, bool pages_from_pool, | |
281 | bool own_pages); | |
282 | extern void osd_req_op_extent_osd_data_pagelist(struct ceph_osd_request *, | |
406e2c9f | 283 | unsigned int which, |
a4ce40a9 AE |
284 | struct ceph_pagelist *pagelist); |
285 | #ifdef CONFIG_BLOCK | |
286 | extern void osd_req_op_extent_osd_data_bio(struct ceph_osd_request *, | |
406e2c9f | 287 | unsigned int which, |
a4ce40a9 AE |
288 | struct bio *bio, size_t bio_length); /* declared only when CONFIG_BLOCK is set, like the bio member of struct ceph_osd_data */ |
289 | #endif /* CONFIG_BLOCK */ | |
290 | ||
04017e29 AE |
291 | extern void osd_req_op_cls_request_data_pagelist(struct ceph_osd_request *, |
292 | unsigned int which, | |
293 | struct ceph_pagelist *pagelist); /* NOTE(review): presumably fills r_ops[which].cls.request_data; confirm */ | |
6c57b554 AE |
294 | extern void osd_req_op_cls_request_data_pages(struct ceph_osd_request *, |
295 | unsigned int which, | |
296 | struct page **pages, u64 length, | |
297 | u32 alignment, bool pages_from_pool, | |
298 | bool own_pages); | |
a4ce40a9 | 299 | extern void osd_req_op_cls_response_data_pages(struct ceph_osd_request *, |
c99d2d4a | 300 | unsigned int which, |
a4ce40a9 AE |
301 | struct page **pages, u64 length, |
302 | u32 alignment, bool pages_from_pool, | |
303 | bool own_pages); /* NOTE(review): presumably fills r_ops[which].cls.response_data; confirm */ | |
304 | ||
c99d2d4a AE |
305 | extern void osd_req_op_cls_init(struct ceph_osd_request *osd_req, |
306 | unsigned int which, u16 opcode, | |
04017e29 | 307 | const char *class, const char *method); /* NOTE(review): ceph_osd_req_op.cls stores class_len and method_len as __u8, so name length is presumably limited to 255; confirm the implementation enforces it */ |
d74b50be YZ |
308 | extern int osd_req_op_xattr_init(struct ceph_osd_request *osd_req, unsigned int which, |
309 | u16 opcode, const char *name, const void *value, | |
310 | size_t size, u8 cmp_op, u8 cmp_mode); /* the only init helper here that returns int; NOTE(review): size is size_t while xattr.value_len is u32; confirm how larger sizes are handled */ | |
c99d2d4a AE |
311 | extern void osd_req_op_watch_init(struct ceph_osd_request *osd_req, |
312 | unsigned int which, u16 opcode, | |
33803f33 | 313 | u64 cookie, u64 version, int flag); /* NOTE(review): flag is int here but watch.flag is __u8; confirm only the low byte is meaningful */ |
c647b8a8 ID |
314 | extern void osd_req_op_alloc_hint_init(struct ceph_osd_request *osd_req, |
315 | unsigned int which, | |
316 | u64 expected_object_size, | |
317 | u64 expected_write_size); /* arguments mirror the fields of ceph_osd_req_op.alloc_hint */ | |
33803f33 | 318 | |
3499e8a5 | 319 | extern struct ceph_osd_request *ceph_osdc_alloc_request(struct ceph_osd_client *osdc, |
3499e8a5 | 320 | struct ceph_snap_context *snapc, |
acead002 | 321 | unsigned int num_ops, |
3499e8a5 | 322 | bool use_mempool, |
54a54007 | 323 | gfp_t gfp_flags); /* returns a request pointer; NOTE(review): failure convention (NULL or ERR_PTR) is not visible in this header; confirm */ |
3499e8a5 | 324 | |
175face2 | 325 | extern void ceph_osdc_build_request(struct ceph_osd_request *req, u64 off, |
68b4476b | 326 | struct ceph_snap_context *snapc, |
4d6b250b | 327 | u64 snap_id, |
af77f26c | 328 | struct timespec *mtime); |
3499e8a5 | 329 | |
f24e9980 SW |
330 | extern struct ceph_osd_request *ceph_osdc_new_request(struct ceph_osd_client *, |
331 | struct ceph_file_layout *layout, | |
332 | struct ceph_vino vino, | |
acead002 | 333 | u64 offset, u64 *len, |
715e4cd4 YZ |
334 | unsigned int which, int num_ops, |
335 | int opcode, int flags, | |
f24e9980 | 336 | struct ceph_snap_context *snapc, |
acead002 | 337 | u32 truncate_seq, u64 truncate_size, |
153e5167 | 338 | bool use_mempool); /* len is passed by pointer, so it may be written back; NOTE(review): num_ops is int here but unsigned int in ceph_osdc_alloc_request(), and opcode is int here but u16 in the osd_req_op_*_init() helpers */ |
f24e9980 | 339 | |
a40c4f10 YS |
340 | extern void ceph_osdc_set_request_linger(struct ceph_osd_client *osdc, |
341 | struct ceph_osd_request *req); /* NOTE(review): presumably relates to r_linger and the req_linger list; confirm */ | |
a40c4f10 | 342 | |
9e94af20 ID |
343 | extern void ceph_osdc_get_request(struct ceph_osd_request *req); /* get/put pair; NOTE(review): presumably operates on req->r_kref; confirm */ |
344 | extern void ceph_osdc_put_request(struct ceph_osd_request *req); | |
f24e9980 SW |
345 | |
346 | extern int ceph_osdc_start_request(struct ceph_osd_client *osdc, | |
347 | struct ceph_osd_request *req, | |
348 | bool nofail); /* returns int, presumably 0 or a negative errno; confirm */ | |
c9f9b93d | 349 | extern void ceph_osdc_cancel_request(struct ceph_osd_request *req); |
f24e9980 SW |
350 | extern int ceph_osdc_wait_request(struct ceph_osd_client *osdc, |
351 | struct ceph_osd_request *req); /* NOTE(review): presumably blocks on req->r_completion; confirm */ | |
352 | extern void ceph_osdc_sync(struct ceph_osd_client *osdc); | |
353 | ||
dd935f44 JD |
354 | extern void ceph_osdc_flush_notifies(struct ceph_osd_client *osdc); /* NOTE(review): presumably flushes osdc->notify_wq; confirm */ |
355 | ||
f24e9980 SW |
356 | extern int ceph_osdc_readpages(struct ceph_osd_client *osdc, |
357 | struct ceph_vino vino, | |
358 | struct ceph_file_layout *layout, | |
359 | u64 off, u64 *plen, | |
360 | u32 truncate_seq, u64 truncate_size, | |
b7495fc2 SW |
361 | struct page **pages, int nr_pages, |
362 | int page_align); /* length is passed by pointer (plen), unlike the by-value len of ceph_osdc_writepages(); NOTE(review): return value presumably bytes read or a negative errno; confirm */ | |
f24e9980 SW |
363 | |
364 | extern int ceph_osdc_writepages(struct ceph_osd_client *osdc, | |
365 | struct ceph_vino vino, | |
366 | struct ceph_file_layout *layout, | |
367 | struct ceph_snap_context *sc, | |
368 | u64 off, u64 len, | |
369 | u32 truncate_seq, u64 truncate_size, | |
370 | struct timespec *mtime, | |
24808826 | 371 | struct page **pages, int nr_pages); /* takes a snap context and mtime that the read variant does not; has no page_align parameter */ |
f24e9980 | 372 | |
a40c4f10 YS |
373 | /* watch/notify events: create, cancel, and drop a struct ceph_osd_event */ |
374 | extern int ceph_osdc_create_event(struct ceph_osd_client *osdc, | |
375 | void (*event_cb)(u64, u64, u8, void *), | |
3c663bbd | 376 | void *data, struct ceph_osd_event **pevent); /* the new event is handed back through pevent; event_cb has the same signature as ceph_osd_event.cb */ |
a40c4f10 | 377 | extern void ceph_osdc_cancel_event(struct ceph_osd_event *event); |
a40c4f10 | 378 | extern void ceph_osdc_put_event(struct ceph_osd_event *event); /* NOTE(review): presumably drops a reference on event->kref; confirm */ |
f24e9980 SW |
379 | #endif |
380 |