1 /* AFS filesystem file handling
2 *
3 * Copyright (C) 2002, 2007 Red Hat, Inc. All Rights Reserved.
4 * Written by David Howells (dhowells@redhat.com)
5 *
6 * This program is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU General Public License
8 * as published by the Free Software Foundation; either version
9 * 2 of the License, or (at your option) any later version.
10 */
11
12 #include <linux/kernel.h>
13 #include <linux/module.h>
14 #include <linux/init.h>
15 #include <linux/fs.h>
16 #include <linux/pagemap.h>
17 #include <linux/writeback.h>
18 #include <linux/gfp.h>
19 #include <linux/task_io_accounting_ops.h>
20 #include "internal.h"
21
22 static int afs_file_mmap(struct file *file, struct vm_area_struct *vma);
23 static int afs_readpage(struct file *file, struct page *page);
24 static void afs_invalidatepage(struct page *page, unsigned int offset,
25 unsigned int length);
26 static int afs_releasepage(struct page *page, gfp_t gfp_flags);
27
28 static int afs_readpages(struct file *filp, struct address_space *mapping,
29 struct list_head *pages, unsigned nr_pages);
30
31 const struct file_operations afs_file_operations = {
32 .open = afs_open,
33 .release = afs_release,
34 .llseek = generic_file_llseek,
35 .read_iter = generic_file_read_iter,
36 .write_iter = afs_file_write,
37 .mmap = afs_file_mmap,
38 .splice_read = generic_file_splice_read,
39 .fsync = afs_fsync,
40 .lock = afs_lock,
41 .flock = afs_flock,
42 };
43
44 const struct inode_operations afs_file_inode_operations = {
45 .getattr = afs_getattr,
46 .setattr = afs_setattr,
47 .permission = afs_permission,
48 .listxattr = afs_listxattr,
49 };
50
51 const struct address_space_operations afs_fs_aops = {
52 .readpage = afs_readpage,
53 .readpages = afs_readpages,
54 .set_page_dirty = afs_set_page_dirty,
55 .launder_page = afs_launder_page,
56 .releasepage = afs_releasepage,
57 .invalidatepage = afs_invalidatepage,
58 .write_begin = afs_write_begin,
59 .write_end = afs_write_end,
60 .writepage = afs_writepage,
61 .writepages = afs_writepages,
62 };
63
64 static const struct vm_operations_struct afs_vm_ops = {
65 .fault = filemap_fault,
66 .map_pages = filemap_map_pages,
67 .page_mkwrite = afs_page_mkwrite,
68 };
69
70 /*
71 * Discard a pin on a writeback key.
72 */
afs_put_wb_key(struct afs_wb_key * wbk)73 void afs_put_wb_key(struct afs_wb_key *wbk)
74 {
75 if (refcount_dec_and_test(&wbk->usage)) {
76 key_put(wbk->key);
77 kfree(wbk);
78 }
79 }
80
81 /*
82 * Cache key for writeback.
83 */
afs_cache_wb_key(struct afs_vnode * vnode,struct afs_file * af)84 int afs_cache_wb_key(struct afs_vnode *vnode, struct afs_file *af)
85 {
86 struct afs_wb_key *wbk, *p;
87
88 wbk = kzalloc(sizeof(struct afs_wb_key), GFP_KERNEL);
89 if (!wbk)
90 return -ENOMEM;
91 refcount_set(&wbk->usage, 2);
92 wbk->key = af->key;
93
94 spin_lock(&vnode->wb_lock);
95 list_for_each_entry(p, &vnode->wb_keys, vnode_link) {
96 if (p->key == wbk->key)
97 goto found;
98 }
99
100 key_get(wbk->key);
101 list_add_tail(&wbk->vnode_link, &vnode->wb_keys);
102 spin_unlock(&vnode->wb_lock);
103 af->wb = wbk;
104 return 0;
105
106 found:
107 refcount_inc(&p->usage);
108 spin_unlock(&vnode->wb_lock);
109 af->wb = p;
110 kfree(wbk);
111 return 0;
112 }
113
114 /*
115 * open an AFS file or directory and attach a key to it
116 */
afs_open(struct inode * inode,struct file * file)117 int afs_open(struct inode *inode, struct file *file)
118 {
119 struct afs_vnode *vnode = AFS_FS_I(inode);
120 struct afs_file *af;
121 struct key *key;
122 int ret;
123
124 _enter("{%x:%u},", vnode->fid.vid, vnode->fid.vnode);
125
126 key = afs_request_key(vnode->volume->cell);
127 if (IS_ERR(key)) {
128 ret = PTR_ERR(key);
129 goto error;
130 }
131
132 af = kzalloc(sizeof(*af), GFP_KERNEL);
133 if (!af) {
134 ret = -ENOMEM;
135 goto error_key;
136 }
137 af->key = key;
138
139 ret = afs_validate(vnode, key);
140 if (ret < 0)
141 goto error_af;
142
143 if (file->f_mode & FMODE_WRITE) {
144 ret = afs_cache_wb_key(vnode, af);
145 if (ret < 0)
146 goto error_af;
147 }
148
149 if (file->f_flags & O_TRUNC)
150 set_bit(AFS_VNODE_NEW_CONTENT, &vnode->flags);
151
152 file->private_data = af;
153 _leave(" = 0");
154 return 0;
155
156 error_af:
157 kfree(af);
158 error_key:
159 key_put(key);
160 error:
161 _leave(" = %d", ret);
162 return ret;
163 }
164
165 /*
166 * release an AFS file or directory and discard its key
167 */
afs_release(struct inode * inode,struct file * file)168 int afs_release(struct inode *inode, struct file *file)
169 {
170 struct afs_vnode *vnode = AFS_FS_I(inode);
171 struct afs_file *af = file->private_data;
172
173 _enter("{%x:%u},", vnode->fid.vid, vnode->fid.vnode);
174
175 if ((file->f_mode & FMODE_WRITE))
176 return vfs_fsync(file, 0);
177
178 file->private_data = NULL;
179 if (af->wb)
180 afs_put_wb_key(af->wb);
181 key_put(af->key);
182 kfree(af);
183 afs_prune_wb_keys(vnode);
184 _leave(" = 0");
185 return 0;
186 }
187
188 /*
189 * Dispose of a ref to a read record.
190 */
afs_put_read(struct afs_read * req)191 void afs_put_read(struct afs_read *req)
192 {
193 int i;
194
195 if (refcount_dec_and_test(&req->usage)) {
196 for (i = 0; i < req->nr_pages; i++)
197 if (req->pages[i])
198 put_page(req->pages[i]);
199 if (req->pages != req->array)
200 kfree(req->pages);
201 kfree(req);
202 }
203 }
204
205 #ifdef CONFIG_AFS_FSCACHE
206 /*
207 * deal with notification that a page was read from the cache
208 */
afs_file_readpage_read_complete(struct page * page,void * data,int error)209 static void afs_file_readpage_read_complete(struct page *page,
210 void *data,
211 int error)
212 {
213 _enter("%p,%p,%d", page, data, error);
214
215 /* if the read completes with an error, we just unlock the page and let
216 * the VM reissue the readpage */
217 if (!error)
218 SetPageUptodate(page);
219 unlock_page(page);
220 }
221 #endif
222
223 /*
224 * Fetch file data from the volume.
225 */
afs_fetch_data(struct afs_vnode * vnode,struct key * key,struct afs_read * desc)226 int afs_fetch_data(struct afs_vnode *vnode, struct key *key, struct afs_read *desc)
227 {
228 struct afs_fs_cursor fc;
229 int ret;
230
231 _enter("%s{%x:%u.%u},%x,,,",
232 vnode->volume->name,
233 vnode->fid.vid,
234 vnode->fid.vnode,
235 vnode->fid.unique,
236 key_serial(key));
237
238 ret = -ERESTARTSYS;
239 if (afs_begin_vnode_operation(&fc, vnode, key)) {
240 while (afs_select_fileserver(&fc)) {
241 fc.cb_break = afs_calc_vnode_cb_break(vnode);
242 afs_fs_fetch_data(&fc, desc);
243 }
244
245 afs_check_for_remote_deletion(&fc, fc.vnode);
246 afs_vnode_commit_status(&fc, vnode, fc.cb_break);
247 ret = afs_end_vnode_operation(&fc);
248 }
249
250 if (ret == 0) {
251 afs_stat_v(vnode, n_fetches);
252 atomic_long_add(desc->actual_len,
253 &afs_v2net(vnode)->n_fetch_bytes);
254 }
255
256 _leave(" = %d", ret);
257 return ret;
258 }
259
260 /*
261 * read page from file, directory or symlink, given a key to use
262 */
afs_page_filler(void * data,struct page * page)263 int afs_page_filler(void *data, struct page *page)
264 {
265 struct inode *inode = page->mapping->host;
266 struct afs_vnode *vnode = AFS_FS_I(inode);
267 struct afs_read *req;
268 struct key *key = data;
269 int ret;
270
271 _enter("{%x},{%lu},{%lu}", key_serial(key), inode->i_ino, page->index);
272
273 BUG_ON(!PageLocked(page));
274
275 ret = -ESTALE;
276 if (test_bit(AFS_VNODE_DELETED, &vnode->flags))
277 goto error;
278
279 /* is it cached? */
280 #ifdef CONFIG_AFS_FSCACHE
281 ret = fscache_read_or_alloc_page(vnode->cache,
282 page,
283 afs_file_readpage_read_complete,
284 NULL,
285 GFP_KERNEL);
286 #else
287 ret = -ENOBUFS;
288 #endif
289 switch (ret) {
290 /* read BIO submitted (page in cache) */
291 case 0:
292 break;
293
294 /* page not yet cached */
295 case -ENODATA:
296 _debug("cache said ENODATA");
297 goto go_on;
298
299 /* page will not be cached */
300 case -ENOBUFS:
301 _debug("cache said ENOBUFS");
302 default:
303 go_on:
304 req = kzalloc(sizeof(struct afs_read) + sizeof(struct page *),
305 GFP_KERNEL);
306 if (!req)
307 goto enomem;
308
309 /* We request a full page. If the page is a partial one at the
310 * end of the file, the server will return a short read and the
311 * unmarshalling code will clear the unfilled space.
312 */
313 refcount_set(&req->usage, 1);
314 req->pos = (loff_t)page->index << PAGE_SHIFT;
315 req->len = PAGE_SIZE;
316 req->nr_pages = 1;
317 req->pages = req->array;
318 req->pages[0] = page;
319 get_page(page);
320
321 /* read the contents of the file from the server into the
322 * page */
323 ret = afs_fetch_data(vnode, key, req);
324 afs_put_read(req);
325
326 if (ret < 0) {
327 if (ret == -ENOENT) {
328 _debug("got NOENT from server"
329 " - marking file deleted and stale");
330 set_bit(AFS_VNODE_DELETED, &vnode->flags);
331 ret = -ESTALE;
332 }
333
334 #ifdef CONFIG_AFS_FSCACHE
335 fscache_uncache_page(vnode->cache, page);
336 #endif
337 BUG_ON(PageFsCache(page));
338
339 if (ret == -EINTR ||
340 ret == -ENOMEM ||
341 ret == -ERESTARTSYS ||
342 ret == -EAGAIN)
343 goto error;
344 goto io_error;
345 }
346
347 SetPageUptodate(page);
348
349 /* send the page to the cache */
350 #ifdef CONFIG_AFS_FSCACHE
351 if (PageFsCache(page) &&
352 fscache_write_page(vnode->cache, page, vnode->status.size,
353 GFP_KERNEL) != 0) {
354 fscache_uncache_page(vnode->cache, page);
355 BUG_ON(PageFsCache(page));
356 }
357 #endif
358 unlock_page(page);
359 }
360
361 _leave(" = 0");
362 return 0;
363
364 io_error:
365 SetPageError(page);
366 goto error;
367 enomem:
368 ret = -ENOMEM;
369 error:
370 unlock_page(page);
371 _leave(" = %d", ret);
372 return ret;
373 }
374
375 /*
376 * read page from file, directory or symlink, given a file to nominate the key
377 * to be used
378 */
afs_readpage(struct file * file,struct page * page)379 static int afs_readpage(struct file *file, struct page *page)
380 {
381 struct key *key;
382 int ret;
383
384 if (file) {
385 key = afs_file_key(file);
386 ASSERT(key != NULL);
387 ret = afs_page_filler(key, page);
388 } else {
389 struct inode *inode = page->mapping->host;
390 key = afs_request_key(AFS_FS_S(inode->i_sb)->cell);
391 if (IS_ERR(key)) {
392 ret = PTR_ERR(key);
393 } else {
394 ret = afs_page_filler(key, page);
395 key_put(key);
396 }
397 }
398 return ret;
399 }
400
401 /*
402 * Make pages available as they're filled.
403 */
afs_readpages_page_done(struct afs_call * call,struct afs_read * req)404 static void afs_readpages_page_done(struct afs_call *call, struct afs_read *req)
405 {
406 #ifdef CONFIG_AFS_FSCACHE
407 struct afs_vnode *vnode = call->reply[0];
408 #endif
409 struct page *page = req->pages[req->index];
410
411 req->pages[req->index] = NULL;
412 SetPageUptodate(page);
413
414 /* send the page to the cache */
415 #ifdef CONFIG_AFS_FSCACHE
416 if (PageFsCache(page) &&
417 fscache_write_page(vnode->cache, page, vnode->status.size,
418 GFP_KERNEL) != 0) {
419 fscache_uncache_page(vnode->cache, page);
420 BUG_ON(PageFsCache(page));
421 }
422 #endif
423 unlock_page(page);
424 put_page(page);
425 }
426
427 /*
428 * Read a contiguous set of pages.
429 */
afs_readpages_one(struct file * file,struct address_space * mapping,struct list_head * pages)430 static int afs_readpages_one(struct file *file, struct address_space *mapping,
431 struct list_head *pages)
432 {
433 struct afs_vnode *vnode = AFS_FS_I(mapping->host);
434 struct afs_read *req;
435 struct list_head *p;
436 struct page *first, *page;
437 struct key *key = afs_file_key(file);
438 pgoff_t index;
439 int ret, n, i;
440
441 /* Count the number of contiguous pages at the front of the list. Note
442 * that the list goes prev-wards rather than next-wards.
443 */
444 first = list_entry(pages->prev, struct page, lru);
445 index = first->index + 1;
446 n = 1;
447 for (p = first->lru.prev; p != pages; p = p->prev) {
448 page = list_entry(p, struct page, lru);
449 if (page->index != index)
450 break;
451 index++;
452 n++;
453 }
454
455 req = kzalloc(sizeof(struct afs_read) + sizeof(struct page *) * n,
456 GFP_NOFS);
457 if (!req)
458 return -ENOMEM;
459
460 refcount_set(&req->usage, 1);
461 req->page_done = afs_readpages_page_done;
462 req->pos = first->index;
463 req->pos <<= PAGE_SHIFT;
464 req->pages = req->array;
465
466 /* Transfer the pages to the request. We add them in until one fails
467 * to add to the LRU and then we stop (as that'll make a hole in the
468 * contiguous run.
469 *
470 * Note that it's possible for the file size to change whilst we're
471 * doing this, but we rely on the server returning less than we asked
472 * for if the file shrank. We also rely on this to deal with a partial
473 * page at the end of the file.
474 */
475 do {
476 page = list_entry(pages->prev, struct page, lru);
477 list_del(&page->lru);
478 index = page->index;
479 if (add_to_page_cache_lru(page, mapping, index,
480 readahead_gfp_mask(mapping))) {
481 #ifdef CONFIG_AFS_FSCACHE
482 fscache_uncache_page(vnode->cache, page);
483 #endif
484 put_page(page);
485 break;
486 }
487
488 req->pages[req->nr_pages++] = page;
489 req->len += PAGE_SIZE;
490 } while (req->nr_pages < n);
491
492 if (req->nr_pages == 0) {
493 kfree(req);
494 return 0;
495 }
496
497 ret = afs_fetch_data(vnode, key, req);
498 if (ret < 0)
499 goto error;
500
501 task_io_account_read(PAGE_SIZE * req->nr_pages);
502 afs_put_read(req);
503 return 0;
504
505 error:
506 if (ret == -ENOENT) {
507 _debug("got NOENT from server"
508 " - marking file deleted and stale");
509 set_bit(AFS_VNODE_DELETED, &vnode->flags);
510 ret = -ESTALE;
511 }
512
513 for (i = 0; i < req->nr_pages; i++) {
514 page = req->pages[i];
515 if (page) {
516 #ifdef CONFIG_AFS_FSCACHE
517 fscache_uncache_page(vnode->cache, page);
518 #endif
519 SetPageError(page);
520 unlock_page(page);
521 }
522 }
523
524 afs_put_read(req);
525 return ret;
526 }
527
528 /*
529 * read a set of pages
530 */
afs_readpages(struct file * file,struct address_space * mapping,struct list_head * pages,unsigned nr_pages)531 static int afs_readpages(struct file *file, struct address_space *mapping,
532 struct list_head *pages, unsigned nr_pages)
533 {
534 struct key *key = afs_file_key(file);
535 struct afs_vnode *vnode;
536 int ret = 0;
537
538 _enter("{%d},{%lu},,%d",
539 key_serial(key), mapping->host->i_ino, nr_pages);
540
541 ASSERT(key != NULL);
542
543 vnode = AFS_FS_I(mapping->host);
544 if (test_bit(AFS_VNODE_DELETED, &vnode->flags)) {
545 _leave(" = -ESTALE");
546 return -ESTALE;
547 }
548
549 /* attempt to read as many of the pages as possible */
550 #ifdef CONFIG_AFS_FSCACHE
551 ret = fscache_read_or_alloc_pages(vnode->cache,
552 mapping,
553 pages,
554 &nr_pages,
555 afs_file_readpage_read_complete,
556 NULL,
557 mapping_gfp_mask(mapping));
558 #else
559 ret = -ENOBUFS;
560 #endif
561
562 switch (ret) {
563 /* all pages are being read from the cache */
564 case 0:
565 BUG_ON(!list_empty(pages));
566 BUG_ON(nr_pages != 0);
567 _leave(" = 0 [reading all]");
568 return 0;
569
570 /* there were pages that couldn't be read from the cache */
571 case -ENODATA:
572 case -ENOBUFS:
573 break;
574
575 /* other error */
576 default:
577 _leave(" = %d", ret);
578 return ret;
579 }
580
581 while (!list_empty(pages)) {
582 ret = afs_readpages_one(file, mapping, pages);
583 if (ret < 0)
584 break;
585 }
586
587 _leave(" = %d [netting]", ret);
588 return ret;
589 }
590
591 /*
592 * invalidate part or all of a page
593 * - release a page and clean up its private data if offset is 0 (indicating
594 * the entire page)
595 */
afs_invalidatepage(struct page * page,unsigned int offset,unsigned int length)596 static void afs_invalidatepage(struct page *page, unsigned int offset,
597 unsigned int length)
598 {
599 struct afs_vnode *vnode = AFS_FS_I(page->mapping->host);
600 unsigned long priv;
601
602 _enter("{%lu},%u,%u", page->index, offset, length);
603
604 BUG_ON(!PageLocked(page));
605
606 /* we clean up only if the entire page is being invalidated */
607 if (offset == 0 && length == PAGE_SIZE) {
608 #ifdef CONFIG_AFS_FSCACHE
609 if (PageFsCache(page)) {
610 struct afs_vnode *vnode = AFS_FS_I(page->mapping->host);
611 fscache_wait_on_page_write(vnode->cache, page);
612 fscache_uncache_page(vnode->cache, page);
613 }
614 #endif
615
616 if (PagePrivate(page)) {
617 priv = page_private(page);
618 trace_afs_page_dirty(vnode, tracepoint_string("inval"),
619 page->index, priv);
620 set_page_private(page, 0);
621 ClearPagePrivate(page);
622 }
623 }
624
625 _leave("");
626 }
627
628 /*
629 * release a page and clean up its private state if it's not busy
630 * - return true if the page can now be released, false if not
631 */
afs_releasepage(struct page * page,gfp_t gfp_flags)632 static int afs_releasepage(struct page *page, gfp_t gfp_flags)
633 {
634 struct afs_vnode *vnode = AFS_FS_I(page->mapping->host);
635 unsigned long priv;
636
637 _enter("{{%x:%u}[%lu],%lx},%x",
638 vnode->fid.vid, vnode->fid.vnode, page->index, page->flags,
639 gfp_flags);
640
641 /* deny if page is being written to the cache and the caller hasn't
642 * elected to wait */
643 #ifdef CONFIG_AFS_FSCACHE
644 if (!fscache_maybe_release_page(vnode->cache, page, gfp_flags)) {
645 _leave(" = F [cache busy]");
646 return 0;
647 }
648 #endif
649
650 if (PagePrivate(page)) {
651 priv = page_private(page);
652 trace_afs_page_dirty(vnode, tracepoint_string("rel"),
653 page->index, priv);
654 set_page_private(page, 0);
655 ClearPagePrivate(page);
656 }
657
658 /* indicate that the page can be released */
659 _leave(" = T");
660 return 1;
661 }
662
663 /*
664 * Handle setting up a memory mapping on an AFS file.
665 */
afs_file_mmap(struct file * file,struct vm_area_struct * vma)666 static int afs_file_mmap(struct file *file, struct vm_area_struct *vma)
667 {
668 int ret;
669
670 ret = generic_file_mmap(file, vma);
671 if (ret == 0)
672 vma->vm_ops = &afs_vm_ops;
673 return ret;
674 }
675