]>
Commit | Line | Data |
---|---|---|
1 | #include <linux/ceph/ceph_debug.h> | |
2 | #include <linux/in.h> | |
3 | ||
4 | #include "super.h" | |
5 | #include "mds_client.h" | |
6 | #include "ioctl.h" | |
7 | ||
8 | ||
9 | /* | |
10 | * ioctls | |
11 | */ | |
12 | ||
13 | /* | |
14 | * get and set the file layout | |
15 | */ | |
16 | static long ceph_ioctl_get_layout(struct file *file, void __user *arg) | |
17 | { | |
18 | struct ceph_inode_info *ci = ceph_inode(file_inode(file)); | |
19 | struct ceph_ioctl_layout l; | |
20 | int err; | |
21 | ||
22 | err = ceph_do_getattr(file_inode(file), CEPH_STAT_CAP_LAYOUT, false); | |
23 | if (!err) { | |
24 | l.stripe_unit = ci->i_layout.stripe_unit; | |
25 | l.stripe_count = ci->i_layout.stripe_count; | |
26 | l.object_size = ci->i_layout.object_size; | |
27 | l.data_pool = ci->i_layout.pool_id; | |
28 | l.preferred_osd = -1; | |
29 | if (copy_to_user(arg, &l, sizeof(l))) | |
30 | return -EFAULT; | |
31 | } | |
32 | ||
33 | return err; | |
34 | } | |
35 | ||
36 | static long __validate_layout(struct ceph_mds_client *mdsc, | |
37 | struct ceph_ioctl_layout *l) | |
38 | { | |
39 | int i, err; | |
40 | ||
41 | /* validate striping parameters */ | |
42 | if ((l->object_size & ~PAGE_MASK) || | |
43 | (l->stripe_unit & ~PAGE_MASK) || | |
44 | ((unsigned)l->stripe_unit != 0 && | |
45 | ((unsigned)l->object_size % (unsigned)l->stripe_unit))) | |
46 | return -EINVAL; | |
47 | ||
48 | /* make sure it's a valid data pool */ | |
49 | mutex_lock(&mdsc->mutex); | |
50 | err = -EINVAL; | |
51 | for (i = 0; i < mdsc->mdsmap->m_num_data_pg_pools; i++) | |
52 | if (mdsc->mdsmap->m_data_pg_pools[i] == l->data_pool) { | |
53 | err = 0; | |
54 | break; | |
55 | } | |
56 | mutex_unlock(&mdsc->mutex); | |
57 | if (err) | |
58 | return err; | |
59 | ||
60 | return 0; | |
61 | } | |
62 | ||
63 | static long ceph_ioctl_set_layout(struct file *file, void __user *arg) | |
64 | { | |
65 | struct inode *inode = file_inode(file); | |
66 | struct ceph_mds_client *mdsc = ceph_sb_to_client(inode->i_sb)->mdsc; | |
67 | struct ceph_mds_request *req; | |
68 | struct ceph_ioctl_layout l; | |
69 | struct ceph_inode_info *ci = ceph_inode(file_inode(file)); | |
70 | struct ceph_ioctl_layout nl; | |
71 | int err; | |
72 | ||
73 | if (copy_from_user(&l, arg, sizeof(l))) | |
74 | return -EFAULT; | |
75 | ||
76 | /* validate changed params against current layout */ | |
77 | err = ceph_do_getattr(file_inode(file), CEPH_STAT_CAP_LAYOUT, false); | |
78 | if (err) | |
79 | return err; | |
80 | ||
81 | memset(&nl, 0, sizeof(nl)); | |
82 | if (l.stripe_count) | |
83 | nl.stripe_count = l.stripe_count; | |
84 | else | |
85 | nl.stripe_count = ci->i_layout.stripe_count; | |
86 | if (l.stripe_unit) | |
87 | nl.stripe_unit = l.stripe_unit; | |
88 | else | |
89 | nl.stripe_unit = ci->i_layout.stripe_unit; | |
90 | if (l.object_size) | |
91 | nl.object_size = l.object_size; | |
92 | else | |
93 | nl.object_size = ci->i_layout.object_size; | |
94 | if (l.data_pool) | |
95 | nl.data_pool = l.data_pool; | |
96 | else | |
97 | nl.data_pool = ci->i_layout.pool_id; | |
98 | ||
99 | /* this is obsolete, and always -1 */ | |
100 | nl.preferred_osd = -1; | |
101 | ||
102 | err = __validate_layout(mdsc, &nl); | |
103 | if (err) | |
104 | return err; | |
105 | ||
106 | req = ceph_mdsc_create_request(mdsc, CEPH_MDS_OP_SETLAYOUT, | |
107 | USE_AUTH_MDS); | |
108 | if (IS_ERR(req)) | |
109 | return PTR_ERR(req); | |
110 | req->r_inode = inode; | |
111 | ihold(inode); | |
112 | req->r_num_caps = 1; | |
113 | ||
114 | req->r_inode_drop = CEPH_CAP_FILE_SHARED | CEPH_CAP_FILE_EXCL; | |
115 | ||
116 | req->r_args.setlayout.layout.fl_stripe_unit = | |
117 | cpu_to_le32(l.stripe_unit); | |
118 | req->r_args.setlayout.layout.fl_stripe_count = | |
119 | cpu_to_le32(l.stripe_count); | |
120 | req->r_args.setlayout.layout.fl_object_size = | |
121 | cpu_to_le32(l.object_size); | |
122 | req->r_args.setlayout.layout.fl_pg_pool = cpu_to_le32(l.data_pool); | |
123 | ||
124 | err = ceph_mdsc_do_request(mdsc, NULL, req); | |
125 | ceph_mdsc_put_request(req); | |
126 | return err; | |
127 | } | |
128 | ||
129 | /* | |
130 | * Set a layout policy on a directory inode. All items in the tree | |
131 | * rooted at this inode will inherit this layout on creation, | |
132 | * (It doesn't apply retroactively ) | |
133 | * unless a subdirectory has its own layout policy. | |
134 | */ | |
135 | static long ceph_ioctl_set_layout_policy (struct file *file, void __user *arg) | |
136 | { | |
137 | struct inode *inode = file_inode(file); | |
138 | struct ceph_mds_request *req; | |
139 | struct ceph_ioctl_layout l; | |
140 | int err; | |
141 | struct ceph_mds_client *mdsc = ceph_sb_to_client(inode->i_sb)->mdsc; | |
142 | ||
143 | /* copy and validate */ | |
144 | if (copy_from_user(&l, arg, sizeof(l))) | |
145 | return -EFAULT; | |
146 | ||
147 | err = __validate_layout(mdsc, &l); | |
148 | if (err) | |
149 | return err; | |
150 | ||
151 | req = ceph_mdsc_create_request(mdsc, CEPH_MDS_OP_SETDIRLAYOUT, | |
152 | USE_AUTH_MDS); | |
153 | ||
154 | if (IS_ERR(req)) | |
155 | return PTR_ERR(req); | |
156 | req->r_inode = inode; | |
157 | ihold(inode); | |
158 | req->r_num_caps = 1; | |
159 | ||
160 | req->r_args.setlayout.layout.fl_stripe_unit = | |
161 | cpu_to_le32(l.stripe_unit); | |
162 | req->r_args.setlayout.layout.fl_stripe_count = | |
163 | cpu_to_le32(l.stripe_count); | |
164 | req->r_args.setlayout.layout.fl_object_size = | |
165 | cpu_to_le32(l.object_size); | |
166 | req->r_args.setlayout.layout.fl_pg_pool = | |
167 | cpu_to_le32(l.data_pool); | |
168 | ||
169 | err = ceph_mdsc_do_request(mdsc, inode, req); | |
170 | ceph_mdsc_put_request(req); | |
171 | return err; | |
172 | } | |
173 | ||
174 | /* | |
175 | * Return object name, size/offset information, and location (OSD | |
176 | * number, network address) for a given file offset. | |
177 | */ | |
178 | static long ceph_ioctl_get_dataloc(struct file *file, void __user *arg) | |
179 | { | |
180 | struct ceph_ioctl_dataloc dl; | |
181 | struct inode *inode = file_inode(file); | |
182 | struct ceph_inode_info *ci = ceph_inode(inode); | |
183 | struct ceph_osd_client *osdc = | |
184 | &ceph_sb_to_client(inode->i_sb)->client->osdc; | |
185 | struct ceph_object_locator oloc; | |
186 | CEPH_DEFINE_OID_ONSTACK(oid); | |
187 | u64 len = 1, olen; | |
188 | u64 tmp; | |
189 | struct ceph_pg pgid; | |
190 | int r; | |
191 | ||
192 | /* copy and validate */ | |
193 | if (copy_from_user(&dl, arg, sizeof(dl))) | |
194 | return -EFAULT; | |
195 | ||
196 | down_read(&osdc->lock); | |
197 | r = ceph_calc_file_object_mapping(&ci->i_layout, dl.file_offset, len, | |
198 | &dl.object_no, &dl.object_offset, | |
199 | &olen); | |
200 | if (r < 0) { | |
201 | up_read(&osdc->lock); | |
202 | return -EIO; | |
203 | } | |
204 | dl.file_offset -= dl.object_offset; | |
205 | dl.object_size = ci->i_layout.object_size; | |
206 | dl.block_size = ci->i_layout.stripe_unit; | |
207 | ||
208 | /* block_offset = object_offset % block_size */ | |
209 | tmp = dl.object_offset; | |
210 | dl.block_offset = do_div(tmp, dl.block_size); | |
211 | ||
212 | snprintf(dl.object_name, sizeof(dl.object_name), "%llx.%08llx", | |
213 | ceph_ino(inode), dl.object_no); | |
214 | ||
215 | oloc.pool = ci->i_layout.pool_id; | |
216 | oloc.pool_ns = ceph_try_get_string(ci->i_layout.pool_ns); | |
217 | ceph_oid_printf(&oid, "%s", dl.object_name); | |
218 | ||
219 | r = ceph_object_locator_to_pg(osdc->osdmap, &oid, &oloc, &pgid); | |
220 | ||
221 | ceph_oloc_destroy(&oloc); | |
222 | if (r < 0) { | |
223 | up_read(&osdc->lock); | |
224 | return r; | |
225 | } | |
226 | ||
227 | dl.osd = ceph_pg_to_acting_primary(osdc->osdmap, &pgid); | |
228 | if (dl.osd >= 0) { | |
229 | struct ceph_entity_addr *a = | |
230 | ceph_osd_addr(osdc->osdmap, dl.osd); | |
231 | if (a) | |
232 | memcpy(&dl.osd_addr, &a->in_addr, sizeof(dl.osd_addr)); | |
233 | } else { | |
234 | memset(&dl.osd_addr, 0, sizeof(dl.osd_addr)); | |
235 | } | |
236 | up_read(&osdc->lock); | |
237 | ||
238 | /* send result back to user */ | |
239 | if (copy_to_user(arg, &dl, sizeof(dl))) | |
240 | return -EFAULT; | |
241 | ||
242 | return 0; | |
243 | } | |
244 | ||
245 | static long ceph_ioctl_lazyio(struct file *file) | |
246 | { | |
247 | struct ceph_file_info *fi = file->private_data; | |
248 | struct inode *inode = file_inode(file); | |
249 | struct ceph_inode_info *ci = ceph_inode(inode); | |
250 | ||
251 | if ((fi->fmode & CEPH_FILE_MODE_LAZY) == 0) { | |
252 | spin_lock(&ci->i_ceph_lock); | |
253 | fi->fmode |= CEPH_FILE_MODE_LAZY; | |
254 | ci->i_nr_by_mode[ffs(CEPH_FILE_MODE_LAZY)]++; | |
255 | spin_unlock(&ci->i_ceph_lock); | |
256 | dout("ioctl_layzio: file %p marked lazy\n", file); | |
257 | ||
258 | ceph_check_caps(ci, 0, NULL); | |
259 | } else { | |
260 | dout("ioctl_layzio: file %p already lazy\n", file); | |
261 | } | |
262 | return 0; | |
263 | } | |
264 | ||
265 | static long ceph_ioctl_syncio(struct file *file) | |
266 | { | |
267 | struct ceph_file_info *fi = file->private_data; | |
268 | ||
269 | fi->flags |= CEPH_F_SYNC; | |
270 | return 0; | |
271 | } | |
272 | ||
273 | long ceph_ioctl(struct file *file, unsigned int cmd, unsigned long arg) | |
274 | { | |
275 | dout("ioctl file %p cmd %u arg %lu\n", file, cmd, arg); | |
276 | switch (cmd) { | |
277 | case CEPH_IOC_GET_LAYOUT: | |
278 | return ceph_ioctl_get_layout(file, (void __user *)arg); | |
279 | ||
280 | case CEPH_IOC_SET_LAYOUT: | |
281 | return ceph_ioctl_set_layout(file, (void __user *)arg); | |
282 | ||
283 | case CEPH_IOC_SET_LAYOUT_POLICY: | |
284 | return ceph_ioctl_set_layout_policy(file, (void __user *)arg); | |
285 | ||
286 | case CEPH_IOC_GET_DATALOC: | |
287 | return ceph_ioctl_get_dataloc(file, (void __user *)arg); | |
288 | ||
289 | case CEPH_IOC_LAZYIO: | |
290 | return ceph_ioctl_lazyio(file); | |
291 | ||
292 | case CEPH_IOC_SYNCIO: | |
293 | return ceph_ioctl_syncio(file); | |
294 | } | |
295 | ||
296 | return -ENOTTY; | |
297 | } |