]> git.proxmox.com Git - mirror_ubuntu-bionic-kernel.git/blob - fs/afs/file.c
afs: Overhaul volume and server record caching and fileserver rotation
[mirror_ubuntu-bionic-kernel.git] / fs / afs / file.c
1 /* AFS filesystem file handling
2 *
3 * Copyright (C) 2002, 2007 Red Hat, Inc. All Rights Reserved.
4 * Written by David Howells (dhowells@redhat.com)
5 *
6 * This program is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU General Public License
8 * as published by the Free Software Foundation; either version
9 * 2 of the License, or (at your option) any later version.
10 */
11
12 #include <linux/kernel.h>
13 #include <linux/module.h>
14 #include <linux/init.h>
15 #include <linux/fs.h>
16 #include <linux/pagemap.h>
17 #include <linux/writeback.h>
18 #include <linux/gfp.h>
19 #include <linux/task_io_accounting_ops.h>
20 #include "internal.h"
21
22 static int afs_readpage(struct file *file, struct page *page);
23 static void afs_invalidatepage(struct page *page, unsigned int offset,
24 unsigned int length);
25 static int afs_releasepage(struct page *page, gfp_t gfp_flags);
26 static int afs_launder_page(struct page *page);
27
28 static int afs_readpages(struct file *filp, struct address_space *mapping,
29 struct list_head *pages, unsigned nr_pages);
30
31 const struct file_operations afs_file_operations = {
32 .open = afs_open,
33 .flush = afs_flush,
34 .release = afs_release,
35 .llseek = generic_file_llseek,
36 .read_iter = generic_file_read_iter,
37 .write_iter = afs_file_write,
38 .mmap = generic_file_readonly_mmap,
39 .splice_read = generic_file_splice_read,
40 .fsync = afs_fsync,
41 .lock = afs_lock,
42 .flock = afs_flock,
43 };
44
45 const struct inode_operations afs_file_inode_operations = {
46 .getattr = afs_getattr,
47 .setattr = afs_setattr,
48 .permission = afs_permission,
49 .listxattr = afs_listxattr,
50 };
51
52 const struct address_space_operations afs_fs_aops = {
53 .readpage = afs_readpage,
54 .readpages = afs_readpages,
55 .set_page_dirty = afs_set_page_dirty,
56 .launder_page = afs_launder_page,
57 .releasepage = afs_releasepage,
58 .invalidatepage = afs_invalidatepage,
59 .write_begin = afs_write_begin,
60 .write_end = afs_write_end,
61 .writepage = afs_writepage,
62 .writepages = afs_writepages,
63 };
64
65 /*
66 * open an AFS file or directory and attach a key to it
67 */
68 int afs_open(struct inode *inode, struct file *file)
69 {
70 struct afs_vnode *vnode = AFS_FS_I(inode);
71 struct key *key;
72 int ret;
73
74 _enter("{%x:%u},", vnode->fid.vid, vnode->fid.vnode);
75
76 key = afs_request_key(vnode->volume->cell);
77 if (IS_ERR(key)) {
78 _leave(" = %ld [key]", PTR_ERR(key));
79 return PTR_ERR(key);
80 }
81
82 ret = afs_validate(vnode, key);
83 if (ret < 0) {
84 _leave(" = %d [val]", ret);
85 return ret;
86 }
87
88 file->private_data = key;
89 _leave(" = 0");
90 return 0;
91 }
92
93 /*
94 * release an AFS file or directory and discard its key
95 */
96 int afs_release(struct inode *inode, struct file *file)
97 {
98 struct afs_vnode *vnode = AFS_FS_I(inode);
99
100 _enter("{%x:%u},", vnode->fid.vid, vnode->fid.vnode);
101
102 key_put(file->private_data);
103 _leave(" = 0");
104 return 0;
105 }
106
107 /*
108 * Dispose of a ref to a read record.
109 */
110 void afs_put_read(struct afs_read *req)
111 {
112 int i;
113
114 if (atomic_dec_and_test(&req->usage)) {
115 for (i = 0; i < req->nr_pages; i++)
116 if (req->pages[i])
117 put_page(req->pages[i]);
118 kfree(req);
119 }
120 }
121
#ifdef CONFIG_AFS_FSCACHE
/*
 * Completion handler invoked when a read of a page from the cache finishes.
 *
 * On success the page is marked up to date.  On error the page is left not
 * up to date so that the VM will reissue the readpage.  Either way the page
 * is unlocked.
 */
static void afs_file_readpage_read_complete(struct page *page,
					    void *data,
					    int error)
{
	_enter("%p,%p,%d", page, data, error);

	if (error == 0)
		SetPageUptodate(page);

	unlock_page(page);
}
#endif
139
140 /*
141 * Fetch file data from the volume.
142 */
143 int afs_fetch_data(struct afs_vnode *vnode, struct key *key, struct afs_read *desc)
144 {
145 struct afs_fs_cursor fc;
146 int ret;
147
148 _enter("%s{%x:%u.%u},%x,,,",
149 vnode->volume->name,
150 vnode->fid.vid,
151 vnode->fid.vnode,
152 vnode->fid.unique,
153 key_serial(key));
154
155 ret = -ERESTARTSYS;
156 if (afs_begin_vnode_operation(&fc, vnode, key)) {
157 while (afs_select_fileserver(&fc)) {
158 fc.cb_break = vnode->cb_break + vnode->cb_s_break;
159 afs_fs_fetch_data(&fc, desc);
160 }
161
162 afs_check_for_remote_deletion(&fc, fc.vnode);
163 afs_vnode_commit_status(&fc, vnode, fc.cb_break);
164 ret = afs_end_vnode_operation(&fc);
165 }
166
167 _leave(" = %d", ret);
168 return ret;
169 }
170
171 /*
172 * read page from file, directory or symlink, given a key to use
173 */
174 int afs_page_filler(void *data, struct page *page)
175 {
176 struct inode *inode = page->mapping->host;
177 struct afs_vnode *vnode = AFS_FS_I(inode);
178 struct afs_read *req;
179 struct key *key = data;
180 int ret;
181
182 _enter("{%x},{%lu},{%lu}", key_serial(key), inode->i_ino, page->index);
183
184 BUG_ON(!PageLocked(page));
185
186 ret = -ESTALE;
187 if (test_bit(AFS_VNODE_DELETED, &vnode->flags))
188 goto error;
189
190 /* is it cached? */
191 #ifdef CONFIG_AFS_FSCACHE
192 ret = fscache_read_or_alloc_page(vnode->cache,
193 page,
194 afs_file_readpage_read_complete,
195 NULL,
196 GFP_KERNEL);
197 #else
198 ret = -ENOBUFS;
199 #endif
200 switch (ret) {
201 /* read BIO submitted (page in cache) */
202 case 0:
203 break;
204
205 /* page not yet cached */
206 case -ENODATA:
207 _debug("cache said ENODATA");
208 goto go_on;
209
210 /* page will not be cached */
211 case -ENOBUFS:
212 _debug("cache said ENOBUFS");
213 default:
214 go_on:
215 req = kzalloc(sizeof(struct afs_read) + sizeof(struct page *),
216 GFP_KERNEL);
217 if (!req)
218 goto enomem;
219
220 /* We request a full page. If the page is a partial one at the
221 * end of the file, the server will return a short read and the
222 * unmarshalling code will clear the unfilled space.
223 */
224 atomic_set(&req->usage, 1);
225 req->pos = (loff_t)page->index << PAGE_SHIFT;
226 req->len = PAGE_SIZE;
227 req->nr_pages = 1;
228 req->pages[0] = page;
229 get_page(page);
230
231 /* read the contents of the file from the server into the
232 * page */
233 ret = afs_fetch_data(vnode, key, req);
234 afs_put_read(req);
235 if (ret < 0) {
236 if (ret == -ENOENT) {
237 _debug("got NOENT from server"
238 " - marking file deleted and stale");
239 set_bit(AFS_VNODE_DELETED, &vnode->flags);
240 ret = -ESTALE;
241 }
242
243 #ifdef CONFIG_AFS_FSCACHE
244 fscache_uncache_page(vnode->cache, page);
245 #endif
246 BUG_ON(PageFsCache(page));
247
248 if (ret == -EINTR ||
249 ret == -ENOMEM ||
250 ret == -ERESTARTSYS ||
251 ret == -EAGAIN)
252 goto error;
253 goto io_error;
254 }
255
256 SetPageUptodate(page);
257
258 /* send the page to the cache */
259 #ifdef CONFIG_AFS_FSCACHE
260 if (PageFsCache(page) &&
261 fscache_write_page(vnode->cache, page, GFP_KERNEL) != 0) {
262 fscache_uncache_page(vnode->cache, page);
263 BUG_ON(PageFsCache(page));
264 }
265 #endif
266 unlock_page(page);
267 }
268
269 _leave(" = 0");
270 return 0;
271
272 io_error:
273 SetPageError(page);
274 goto error;
275 enomem:
276 ret = -ENOMEM;
277 error:
278 unlock_page(page);
279 _leave(" = %d", ret);
280 return ret;
281 }
282
283 /*
284 * read page from file, directory or symlink, given a file to nominate the key
285 * to be used
286 */
287 static int afs_readpage(struct file *file, struct page *page)
288 {
289 struct key *key;
290 int ret;
291
292 if (file) {
293 key = file->private_data;
294 ASSERT(key != NULL);
295 ret = afs_page_filler(key, page);
296 } else {
297 struct inode *inode = page->mapping->host;
298 key = afs_request_key(AFS_FS_S(inode->i_sb)->cell);
299 if (IS_ERR(key)) {
300 ret = PTR_ERR(key);
301 } else {
302 ret = afs_page_filler(key, page);
303 key_put(key);
304 }
305 }
306 return ret;
307 }
308
309 /*
310 * Make pages available as they're filled.
311 */
312 static void afs_readpages_page_done(struct afs_call *call, struct afs_read *req)
313 {
314 #ifdef CONFIG_AFS_FSCACHE
315 struct afs_vnode *vnode = call->reply[0];
316 #endif
317 struct page *page = req->pages[req->index];
318
319 req->pages[req->index] = NULL;
320 SetPageUptodate(page);
321
322 /* send the page to the cache */
323 #ifdef CONFIG_AFS_FSCACHE
324 if (PageFsCache(page) &&
325 fscache_write_page(vnode->cache, page, GFP_KERNEL) != 0) {
326 fscache_uncache_page(vnode->cache, page);
327 BUG_ON(PageFsCache(page));
328 }
329 #endif
330 unlock_page(page);
331 put_page(page);
332 }
333
334 /*
335 * Read a contiguous set of pages.
336 */
337 static int afs_readpages_one(struct file *file, struct address_space *mapping,
338 struct list_head *pages)
339 {
340 struct afs_vnode *vnode = AFS_FS_I(mapping->host);
341 struct afs_read *req;
342 struct list_head *p;
343 struct page *first, *page;
344 struct key *key = file->private_data;
345 pgoff_t index;
346 int ret, n, i;
347
348 /* Count the number of contiguous pages at the front of the list. Note
349 * that the list goes prev-wards rather than next-wards.
350 */
351 first = list_entry(pages->prev, struct page, lru);
352 index = first->index + 1;
353 n = 1;
354 for (p = first->lru.prev; p != pages; p = p->prev) {
355 page = list_entry(p, struct page, lru);
356 if (page->index != index)
357 break;
358 index++;
359 n++;
360 }
361
362 req = kzalloc(sizeof(struct afs_read) + sizeof(struct page *) * n,
363 GFP_NOFS);
364 if (!req)
365 return -ENOMEM;
366
367 atomic_set(&req->usage, 1);
368 req->page_done = afs_readpages_page_done;
369 req->pos = first->index;
370 req->pos <<= PAGE_SHIFT;
371
372 /* Transfer the pages to the request. We add them in until one fails
373 * to add to the LRU and then we stop (as that'll make a hole in the
374 * contiguous run.
375 *
376 * Note that it's possible for the file size to change whilst we're
377 * doing this, but we rely on the server returning less than we asked
378 * for if the file shrank. We also rely on this to deal with a partial
379 * page at the end of the file.
380 */
381 do {
382 page = list_entry(pages->prev, struct page, lru);
383 list_del(&page->lru);
384 index = page->index;
385 if (add_to_page_cache_lru(page, mapping, index,
386 readahead_gfp_mask(mapping))) {
387 #ifdef CONFIG_AFS_FSCACHE
388 fscache_uncache_page(vnode->cache, page);
389 #endif
390 put_page(page);
391 break;
392 }
393
394 req->pages[req->nr_pages++] = page;
395 req->len += PAGE_SIZE;
396 } while (req->nr_pages < n);
397
398 if (req->nr_pages == 0) {
399 kfree(req);
400 return 0;
401 }
402
403 ret = afs_fetch_data(vnode, key, req);
404 if (ret < 0)
405 goto error;
406
407 task_io_account_read(PAGE_SIZE * req->nr_pages);
408 afs_put_read(req);
409 return 0;
410
411 error:
412 if (ret == -ENOENT) {
413 _debug("got NOENT from server"
414 " - marking file deleted and stale");
415 set_bit(AFS_VNODE_DELETED, &vnode->flags);
416 ret = -ESTALE;
417 }
418
419 for (i = 0; i < req->nr_pages; i++) {
420 page = req->pages[i];
421 if (page) {
422 #ifdef CONFIG_AFS_FSCACHE
423 fscache_uncache_page(vnode->cache, page);
424 #endif
425 SetPageError(page);
426 unlock_page(page);
427 }
428 }
429
430 afs_put_read(req);
431 return ret;
432 }
433
434 /*
435 * read a set of pages
436 */
437 static int afs_readpages(struct file *file, struct address_space *mapping,
438 struct list_head *pages, unsigned nr_pages)
439 {
440 struct key *key = file->private_data;
441 struct afs_vnode *vnode;
442 int ret = 0;
443
444 _enter("{%d},{%lu},,%d",
445 key_serial(key), mapping->host->i_ino, nr_pages);
446
447 ASSERT(key != NULL);
448
449 vnode = AFS_FS_I(mapping->host);
450 if (test_bit(AFS_VNODE_DELETED, &vnode->flags)) {
451 _leave(" = -ESTALE");
452 return -ESTALE;
453 }
454
455 /* attempt to read as many of the pages as possible */
456 #ifdef CONFIG_AFS_FSCACHE
457 ret = fscache_read_or_alloc_pages(vnode->cache,
458 mapping,
459 pages,
460 &nr_pages,
461 afs_file_readpage_read_complete,
462 NULL,
463 mapping_gfp_mask(mapping));
464 #else
465 ret = -ENOBUFS;
466 #endif
467
468 switch (ret) {
469 /* all pages are being read from the cache */
470 case 0:
471 BUG_ON(!list_empty(pages));
472 BUG_ON(nr_pages != 0);
473 _leave(" = 0 [reading all]");
474 return 0;
475
476 /* there were pages that couldn't be read from the cache */
477 case -ENODATA:
478 case -ENOBUFS:
479 break;
480
481 /* other error */
482 default:
483 _leave(" = %d", ret);
484 return ret;
485 }
486
487 while (!list_empty(pages)) {
488 ret = afs_readpages_one(file, mapping, pages);
489 if (ret < 0)
490 break;
491 }
492
493 _leave(" = %d [netting]", ret);
494 return ret;
495 }
496
497 /*
498 * write back a dirty page
499 */
500 static int afs_launder_page(struct page *page)
501 {
502 _enter("{%lu}", page->index);
503
504 return 0;
505 }
506
507 /*
508 * invalidate part or all of a page
509 * - release a page and clean up its private data if offset is 0 (indicating
510 * the entire page)
511 */
512 static void afs_invalidatepage(struct page *page, unsigned int offset,
513 unsigned int length)
514 {
515 struct afs_writeback *wb = (struct afs_writeback *) page_private(page);
516
517 _enter("{%lu},%u,%u", page->index, offset, length);
518
519 BUG_ON(!PageLocked(page));
520
521 /* we clean up only if the entire page is being invalidated */
522 if (offset == 0 && length == PAGE_SIZE) {
523 #ifdef CONFIG_AFS_FSCACHE
524 if (PageFsCache(page)) {
525 struct afs_vnode *vnode = AFS_FS_I(page->mapping->host);
526 fscache_wait_on_page_write(vnode->cache, page);
527 fscache_uncache_page(vnode->cache, page);
528 }
529 #endif
530
531 if (PagePrivate(page)) {
532 if (wb && !PageWriteback(page)) {
533 set_page_private(page, 0);
534 afs_put_writeback(wb);
535 }
536
537 if (!page_private(page))
538 ClearPagePrivate(page);
539 }
540 }
541
542 _leave("");
543 }
544
545 /*
546 * release a page and clean up its private state if it's not busy
547 * - return true if the page can now be released, false if not
548 */
549 static int afs_releasepage(struct page *page, gfp_t gfp_flags)
550 {
551 struct afs_writeback *wb = (struct afs_writeback *) page_private(page);
552 struct afs_vnode *vnode = AFS_FS_I(page->mapping->host);
553
554 _enter("{{%x:%u}[%lu],%lx},%x",
555 vnode->fid.vid, vnode->fid.vnode, page->index, page->flags,
556 gfp_flags);
557
558 /* deny if page is being written to the cache and the caller hasn't
559 * elected to wait */
560 #ifdef CONFIG_AFS_FSCACHE
561 if (!fscache_maybe_release_page(vnode->cache, page, gfp_flags)) {
562 _leave(" = F [cache busy]");
563 return 0;
564 }
565 #endif
566
567 if (PagePrivate(page)) {
568 if (wb) {
569 set_page_private(page, 0);
570 afs_put_writeback(wb);
571 }
572 ClearPagePrivate(page);
573 }
574
575 /* indicate that the page can be released */
576 _leave(" = T");
577 return 1;
578 }