blob: 843d3b970b845050701c02febcc585f00321fd95 [file] [log] [blame]
/* AFS filesystem file handling
 *
 * Copyright (C) 2002, 2007 Red Hat, Inc. All Rights Reserved.
 * Written by David Howells (dhowells@redhat.com)
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; either version
 * 2 of the License, or (at your option) any later version.
 */
11
12#include <linux/kernel.h>
13#include <linux/module.h>
14#include <linux/init.h>
15#include <linux/fs.h>
16#include <linux/pagemap.h>
17#include <linux/writeback.h>
18#include <linux/gfp.h>
19#include <linux/task_io_accounting_ops.h>
20#include "internal.h"
21
22static int afs_file_mmap(struct file *file, struct vm_area_struct *vma);
23static int afs_readpage(struct file *file, struct page *page);
24static void afs_invalidatepage(struct page *page, unsigned int offset,
25 unsigned int length);
26static int afs_releasepage(struct page *page, gfp_t gfp_flags);
27
28static int afs_readpages(struct file *filp, struct address_space *mapping,
29 struct list_head *pages, unsigned nr_pages);
30
31const struct file_operations afs_file_operations = {
32 .open = afs_open,
33 .release = afs_release,
34 .llseek = generic_file_llseek,
35 .read_iter = generic_file_read_iter,
36 .write_iter = afs_file_write,
37 .mmap = afs_file_mmap,
38 .splice_read = generic_file_splice_read,
39 .fsync = afs_fsync,
40 .lock = afs_lock,
41 .flock = afs_flock,
42};
43
44const struct inode_operations afs_file_inode_operations = {
45 .getattr = afs_getattr,
46 .setattr = afs_setattr,
47 .permission = afs_permission,
48 .listxattr = afs_listxattr,
49};
50
51const struct address_space_operations afs_fs_aops = {
52 .readpage = afs_readpage,
53 .readpages = afs_readpages,
54 .set_page_dirty = afs_set_page_dirty,
55 .launder_page = afs_launder_page,
56 .releasepage = afs_releasepage,
57 .invalidatepage = afs_invalidatepage,
58 .write_begin = afs_write_begin,
59 .write_end = afs_write_end,
60 .writepage = afs_writepage,
61 .writepages = afs_writepages,
62};
63
64static const struct vm_operations_struct afs_vm_ops = {
65 .fault = filemap_fault,
66 .map_pages = filemap_map_pages,
67 .page_mkwrite = afs_page_mkwrite,
68};
69
70/*
71 * Discard a pin on a writeback key.
72 */
73void afs_put_wb_key(struct afs_wb_key *wbk)
74{
75 if (refcount_dec_and_test(&wbk->usage)) {
76 key_put(wbk->key);
77 kfree(wbk);
78 }
79}
80
81/*
82 * Cache key for writeback.
83 */
84int afs_cache_wb_key(struct afs_vnode *vnode, struct afs_file *af)
85{
86 struct afs_wb_key *wbk, *p;
87
88 wbk = kzalloc(sizeof(struct afs_wb_key), GFP_KERNEL);
89 if (!wbk)
90 return -ENOMEM;
91 refcount_set(&wbk->usage, 2);
92 wbk->key = af->key;
93
94 spin_lock(&vnode->wb_lock);
95 list_for_each_entry(p, &vnode->wb_keys, vnode_link) {
96 if (p->key == wbk->key)
97 goto found;
98 }
99
100 key_get(wbk->key);
101 list_add_tail(&wbk->vnode_link, &vnode->wb_keys);
102 spin_unlock(&vnode->wb_lock);
103 af->wb = wbk;
104 return 0;
105
106found:
107 refcount_inc(&p->usage);
108 spin_unlock(&vnode->wb_lock);
109 af->wb = p;
110 kfree(wbk);
111 return 0;
112}
113
114/*
115 * open an AFS file or directory and attach a key to it
116 */
117int afs_open(struct inode *inode, struct file *file)
118{
119 struct afs_vnode *vnode = AFS_FS_I(inode);
120 struct afs_file *af;
121 struct key *key;
122 int ret;
123
124 _enter("{%x:%u},", vnode->fid.vid, vnode->fid.vnode);
125
126 key = afs_request_key(vnode->volume->cell);
127 if (IS_ERR(key)) {
128 ret = PTR_ERR(key);
129 goto error;
130 }
131
132 af = kzalloc(sizeof(*af), GFP_KERNEL);
133 if (!af) {
134 ret = -ENOMEM;
135 goto error_key;
136 }
137 af->key = key;
138
139 ret = afs_validate(vnode, key);
140 if (ret < 0)
141 goto error_af;
142
143 if (file->f_mode & FMODE_WRITE) {
144 ret = afs_cache_wb_key(vnode, af);
145 if (ret < 0)
146 goto error_af;
147 }
148
149 if (file->f_flags & O_TRUNC)
150 set_bit(AFS_VNODE_NEW_CONTENT, &vnode->flags);
151
152 file->private_data = af;
153 _leave(" = 0");
154 return 0;
155
156error_af:
157 kfree(af);
158error_key:
159 key_put(key);
160error:
161 _leave(" = %d", ret);
162 return ret;
163}
164
165/*
166 * release an AFS file or directory and discard its key
167 */
168int afs_release(struct inode *inode, struct file *file)
169{
170 struct afs_vnode *vnode = AFS_FS_I(inode);
171 struct afs_file *af = file->private_data;
172
173 _enter("{%x:%u},", vnode->fid.vid, vnode->fid.vnode);
174
175 if ((file->f_mode & FMODE_WRITE))
176 return vfs_fsync(file, 0);
177
178 file->private_data = NULL;
179 if (af->wb)
180 afs_put_wb_key(af->wb);
181 key_put(af->key);
182 kfree(af);
183 afs_prune_wb_keys(vnode);
184 _leave(" = 0");
185 return 0;
186}
187
188/*
189 * Dispose of a ref to a read record.
190 */
191void afs_put_read(struct afs_read *req)
192{
193 int i;
194
195 if (refcount_dec_and_test(&req->usage)) {
196 if (req->pages) {
197 for (i = 0; i < req->nr_pages; i++)
198 if (req->pages[i])
199 put_page(req->pages[i]);
200 if (req->pages != req->array)
201 kfree(req->pages);
202 }
203 kfree(req);
204 }
205}
206
#ifdef CONFIG_AFS_FSCACHE
/*
 * Completion callback passed to fscache for reads from the cache.
 *
 * A successful read marks the page up to date.  On error the page is simply
 * unlocked without being marked up to date, leaving it to the VM to reissue
 * the readpage.
 */
static void afs_file_readpage_read_complete(struct page *page,
					    void *data,
					    int error)
{
	_enter("%p,%p,%d", page, data, error);

	if (error == 0)
		SetPageUptodate(page);

	unlock_page(page);
}
#endif
224
225/*
226 * Fetch file data from the volume.
227 */
228int afs_fetch_data(struct afs_vnode *vnode, struct key *key, struct afs_read *desc)
229{
230 struct afs_fs_cursor fc;
231 int ret;
232
233 _enter("%s{%x:%u.%u},%x,,,",
234 vnode->volume->name,
235 vnode->fid.vid,
236 vnode->fid.vnode,
237 vnode->fid.unique,
238 key_serial(key));
239
240 ret = -ERESTARTSYS;
241 if (afs_begin_vnode_operation(&fc, vnode, key)) {
242 while (afs_select_fileserver(&fc)) {
243 fc.cb_break = afs_calc_vnode_cb_break(vnode);
244 afs_fs_fetch_data(&fc, desc);
245 }
246
247 afs_check_for_remote_deletion(&fc, fc.vnode);
248 afs_vnode_commit_status(&fc, vnode, fc.cb_break);
249 ret = afs_end_vnode_operation(&fc);
250 }
251
252 if (ret == 0) {
253 afs_stat_v(vnode, n_fetches);
254 atomic_long_add(desc->actual_len,
255 &afs_v2net(vnode)->n_fetch_bytes);
256 }
257
258 _leave(" = %d", ret);
259 return ret;
260}
261
262/*
263 * read page from file, directory or symlink, given a key to use
264 */
265int afs_page_filler(void *data, struct page *page)
266{
267 struct inode *inode = page->mapping->host;
268 struct afs_vnode *vnode = AFS_FS_I(inode);
269 struct afs_read *req;
270 struct key *key = data;
271 int ret;
272
273 _enter("{%x},{%lu},{%lu}", key_serial(key), inode->i_ino, page->index);
274
275 BUG_ON(!PageLocked(page));
276
277 ret = -ESTALE;
278 if (test_bit(AFS_VNODE_DELETED, &vnode->flags))
279 goto error;
280
281 /* is it cached? */
282#ifdef CONFIG_AFS_FSCACHE
283 ret = fscache_read_or_alloc_page(vnode->cache,
284 page,
285 afs_file_readpage_read_complete,
286 NULL,
287 GFP_KERNEL);
288#else
289 ret = -ENOBUFS;
290#endif
291 switch (ret) {
292 /* read BIO submitted (page in cache) */
293 case 0:
294 break;
295
296 /* page not yet cached */
297 case -ENODATA:
298 _debug("cache said ENODATA");
299 goto go_on;
300
301 /* page will not be cached */
302 case -ENOBUFS:
303 _debug("cache said ENOBUFS");
304 default:
305 go_on:
306 req = kzalloc(sizeof(struct afs_read) + sizeof(struct page *),
307 GFP_KERNEL);
308 if (!req)
309 goto enomem;
310
311 /* We request a full page. If the page is a partial one at the
312 * end of the file, the server will return a short read and the
313 * unmarshalling code will clear the unfilled space.
314 */
315 refcount_set(&req->usage, 1);
316 req->pos = (loff_t)page->index << PAGE_SHIFT;
317 req->len = PAGE_SIZE;
318 req->nr_pages = 1;
319 req->pages = req->array;
320 req->pages[0] = page;
321 get_page(page);
322
323 /* read the contents of the file from the server into the
324 * page */
325 ret = afs_fetch_data(vnode, key, req);
326 afs_put_read(req);
327
328 if (ret < 0) {
329 if (ret == -ENOENT) {
330 _debug("got NOENT from server"
331 " - marking file deleted and stale");
332 set_bit(AFS_VNODE_DELETED, &vnode->flags);
333 ret = -ESTALE;
334 }
335
336#ifdef CONFIG_AFS_FSCACHE
337 fscache_uncache_page(vnode->cache, page);
338#endif
339 BUG_ON(PageFsCache(page));
340
341 if (ret == -EINTR ||
342 ret == -ENOMEM ||
343 ret == -ERESTARTSYS ||
344 ret == -EAGAIN)
345 goto error;
346 goto io_error;
347 }
348
349 SetPageUptodate(page);
350
351 /* send the page to the cache */
352#ifdef CONFIG_AFS_FSCACHE
353 if (PageFsCache(page) &&
354 fscache_write_page(vnode->cache, page, vnode->status.size,
355 GFP_KERNEL) != 0) {
356 fscache_uncache_page(vnode->cache, page);
357 BUG_ON(PageFsCache(page));
358 }
359#endif
360 unlock_page(page);
361 }
362
363 _leave(" = 0");
364 return 0;
365
366io_error:
367 SetPageError(page);
368 goto error;
369enomem:
370 ret = -ENOMEM;
371error:
372 unlock_page(page);
373 _leave(" = %d", ret);
374 return ret;
375}
376
377/*
378 * read page from file, directory or symlink, given a file to nominate the key
379 * to be used
380 */
381static int afs_readpage(struct file *file, struct page *page)
382{
383 struct key *key;
384 int ret;
385
386 if (file) {
387 key = afs_file_key(file);
388 ASSERT(key != NULL);
389 ret = afs_page_filler(key, page);
390 } else {
391 struct inode *inode = page->mapping->host;
392 key = afs_request_key(AFS_FS_S(inode->i_sb)->cell);
393 if (IS_ERR(key)) {
394 ret = PTR_ERR(key);
395 } else {
396 ret = afs_page_filler(key, page);
397 key_put(key);
398 }
399 }
400 return ret;
401}
402
403/*
404 * Make pages available as they're filled.
405 */
406static void afs_readpages_page_done(struct afs_call *call, struct afs_read *req)
407{
408#ifdef CONFIG_AFS_FSCACHE
409 struct afs_vnode *vnode = call->reply[0];
410#endif
411 struct page *page = req->pages[req->index];
412
413 req->pages[req->index] = NULL;
414 SetPageUptodate(page);
415
416 /* send the page to the cache */
417#ifdef CONFIG_AFS_FSCACHE
418 if (PageFsCache(page) &&
419 fscache_write_page(vnode->cache, page, vnode->status.size,
420 GFP_KERNEL) != 0) {
421 fscache_uncache_page(vnode->cache, page);
422 BUG_ON(PageFsCache(page));
423 }
424#endif
425 unlock_page(page);
426 put_page(page);
427}
428
429/*
430 * Read a contiguous set of pages.
431 */
432static int afs_readpages_one(struct file *file, struct address_space *mapping,
433 struct list_head *pages)
434{
435 struct afs_vnode *vnode = AFS_FS_I(mapping->host);
436 struct afs_read *req;
437 struct list_head *p;
438 struct page *first, *page;
439 struct key *key = afs_file_key(file);
440 pgoff_t index;
441 int ret, n, i;
442
443 /* Count the number of contiguous pages at the front of the list. Note
444 * that the list goes prev-wards rather than next-wards.
445 */
446 first = list_entry(pages->prev, struct page, lru);
447 index = first->index + 1;
448 n = 1;
449 for (p = first->lru.prev; p != pages; p = p->prev) {
450 page = list_entry(p, struct page, lru);
451 if (page->index != index)
452 break;
453 index++;
454 n++;
455 }
456
457 req = kzalloc(sizeof(struct afs_read) + sizeof(struct page *) * n,
458 GFP_NOFS);
459 if (!req)
460 return -ENOMEM;
461
462 refcount_set(&req->usage, 1);
463 req->page_done = afs_readpages_page_done;
464 req->pos = first->index;
465 req->pos <<= PAGE_SHIFT;
466 req->pages = req->array;
467
468 /* Transfer the pages to the request. We add them in until one fails
469 * to add to the LRU and then we stop (as that'll make a hole in the
470 * contiguous run.
471 *
472 * Note that it's possible for the file size to change whilst we're
473 * doing this, but we rely on the server returning less than we asked
474 * for if the file shrank. We also rely on this to deal with a partial
475 * page at the end of the file.
476 */
477 do {
478 page = list_entry(pages->prev, struct page, lru);
479 list_del(&page->lru);
480 index = page->index;
481 if (add_to_page_cache_lru(page, mapping, index,
482 readahead_gfp_mask(mapping))) {
483#ifdef CONFIG_AFS_FSCACHE
484 fscache_uncache_page(vnode->cache, page);
485#endif
486 put_page(page);
487 break;
488 }
489
490 req->pages[req->nr_pages++] = page;
491 req->len += PAGE_SIZE;
492 } while (req->nr_pages < n);
493
494 if (req->nr_pages == 0) {
495 kfree(req);
496 return 0;
497 }
498
499 ret = afs_fetch_data(vnode, key, req);
500 if (ret < 0)
501 goto error;
502
503 task_io_account_read(PAGE_SIZE * req->nr_pages);
504 afs_put_read(req);
505 return 0;
506
507error:
508 if (ret == -ENOENT) {
509 _debug("got NOENT from server"
510 " - marking file deleted and stale");
511 set_bit(AFS_VNODE_DELETED, &vnode->flags);
512 ret = -ESTALE;
513 }
514
515 for (i = 0; i < req->nr_pages; i++) {
516 page = req->pages[i];
517 if (page) {
518#ifdef CONFIG_AFS_FSCACHE
519 fscache_uncache_page(vnode->cache, page);
520#endif
521 SetPageError(page);
522 unlock_page(page);
523 }
524 }
525
526 afs_put_read(req);
527 return ret;
528}
529
530/*
531 * read a set of pages
532 */
533static int afs_readpages(struct file *file, struct address_space *mapping,
534 struct list_head *pages, unsigned nr_pages)
535{
536 struct key *key = afs_file_key(file);
537 struct afs_vnode *vnode;
538 int ret = 0;
539
540 _enter("{%d},{%lu},,%d",
541 key_serial(key), mapping->host->i_ino, nr_pages);
542
543 ASSERT(key != NULL);
544
545 vnode = AFS_FS_I(mapping->host);
546 if (test_bit(AFS_VNODE_DELETED, &vnode->flags)) {
547 _leave(" = -ESTALE");
548 return -ESTALE;
549 }
550
551 /* attempt to read as many of the pages as possible */
552#ifdef CONFIG_AFS_FSCACHE
553 ret = fscache_read_or_alloc_pages(vnode->cache,
554 mapping,
555 pages,
556 &nr_pages,
557 afs_file_readpage_read_complete,
558 NULL,
559 mapping_gfp_mask(mapping));
560#else
561 ret = -ENOBUFS;
562#endif
563
564 switch (ret) {
565 /* all pages are being read from the cache */
566 case 0:
567 BUG_ON(!list_empty(pages));
568 BUG_ON(nr_pages != 0);
569 _leave(" = 0 [reading all]");
570 return 0;
571
572 /* there were pages that couldn't be read from the cache */
573 case -ENODATA:
574 case -ENOBUFS:
575 break;
576
577 /* other error */
578 default:
579 _leave(" = %d", ret);
580 return ret;
581 }
582
583 while (!list_empty(pages)) {
584 ret = afs_readpages_one(file, mapping, pages);
585 if (ret < 0)
586 break;
587 }
588
589 _leave(" = %d [netting]", ret);
590 return ret;
591}
592
593/*
594 * invalidate part or all of a page
595 * - release a page and clean up its private data if offset is 0 (indicating
596 * the entire page)
597 */
598static void afs_invalidatepage(struct page *page, unsigned int offset,
599 unsigned int length)
600{
601 struct afs_vnode *vnode = AFS_FS_I(page->mapping->host);
602 unsigned long priv;
603
604 _enter("{%lu},%u,%u", page->index, offset, length);
605
606 BUG_ON(!PageLocked(page));
607
608 /* we clean up only if the entire page is being invalidated */
609 if (offset == 0 && length == PAGE_SIZE) {
610#ifdef CONFIG_AFS_FSCACHE
611 if (PageFsCache(page)) {
612 struct afs_vnode *vnode = AFS_FS_I(page->mapping->host);
613 fscache_wait_on_page_write(vnode->cache, page);
614 fscache_uncache_page(vnode->cache, page);
615 }
616#endif
617
618 if (PagePrivate(page)) {
619 priv = page_private(page);
620 trace_afs_page_dirty(vnode, tracepoint_string("inval"),
621 page->index, priv);
622 set_page_private(page, 0);
623 ClearPagePrivate(page);
624 }
625 }
626
627 _leave("");
628}
629
630/*
631 * release a page and clean up its private state if it's not busy
632 * - return true if the page can now be released, false if not
633 */
634static int afs_releasepage(struct page *page, gfp_t gfp_flags)
635{
636 struct afs_vnode *vnode = AFS_FS_I(page->mapping->host);
637 unsigned long priv;
638
639 _enter("{{%x:%u}[%lu],%lx},%x",
640 vnode->fid.vid, vnode->fid.vnode, page->index, page->flags,
641 gfp_flags);
642
643 /* deny if page is being written to the cache and the caller hasn't
644 * elected to wait */
645#ifdef CONFIG_AFS_FSCACHE
646 if (!fscache_maybe_release_page(vnode->cache, page, gfp_flags)) {
647 _leave(" = F [cache busy]");
648 return 0;
649 }
650#endif
651
652 if (PagePrivate(page)) {
653 priv = page_private(page);
654 trace_afs_page_dirty(vnode, tracepoint_string("rel"),
655 page->index, priv);
656 set_page_private(page, 0);
657 ClearPagePrivate(page);
658 }
659
660 /* indicate that the page can be released */
661 _leave(" = T");
662 return 1;
663}
664
665/*
666 * Handle setting up a memory mapping on an AFS file.
667 */
668static int afs_file_mmap(struct file *file, struct vm_area_struct *vma)
669{
670 int ret;
671
672 ret = generic_file_mmap(file, vma);
673 if (ret == 0)
674 vma->vm_ops = &afs_vm_ops;
675 return ret;
676}