1 // SPDX-License-Identifier: GPL-2.0-or-later
2 /* AFS filesystem file handling
3 *
4 * Copyright (C) 2002, 2007 Red Hat, Inc. All Rights Reserved.
5 * Written by David Howells (dhowells@redhat.com)
6 */
7
8 #include <linux/kernel.h>
9 #include <linux/module.h>
10 #include <linux/init.h>
11 #include <linux/fs.h>
12 #include <linux/pagemap.h>
13 #include <linux/writeback.h>
14 #include <linux/gfp.h>
15 #include <linux/task_io_accounting_ops.h>
16 #include <linux/mm.h>
17 #include <linux/netfs.h>
18 #include "internal.h"
19
20 static int afs_file_mmap(struct file *file, struct vm_area_struct *vma);
21 static int afs_readpage(struct file *file, struct page *page);
22 static void afs_invalidatepage(struct page *page, unsigned int offset,
23 unsigned int length);
24 static int afs_releasepage(struct page *page, gfp_t gfp_flags);
25
26 static void afs_readahead(struct readahead_control *ractl);
27 static ssize_t afs_file_read_iter(struct kiocb *iocb, struct iov_iter *iter);
28 static void afs_vm_open(struct vm_area_struct *area);
29 static void afs_vm_close(struct vm_area_struct *area);
30 static vm_fault_t afs_vm_map_pages(struct vm_fault *vmf, pgoff_t start_pgoff, pgoff_t end_pgoff);
31
32 const struct file_operations afs_file_operations = {
33 .open = afs_open,
34 .release = afs_release,
35 .llseek = generic_file_llseek,
36 .read_iter = afs_file_read_iter,
37 .write_iter = afs_file_write,
38 .mmap = afs_file_mmap,
39 .splice_read = generic_file_splice_read,
40 .splice_write = iter_file_splice_write,
41 .fsync = afs_fsync,
42 .lock = afs_lock,
43 .flock = afs_flock,
44 };
45
46 const struct inode_operations afs_file_inode_operations = {
47 .getattr = afs_getattr,
48 .setattr = afs_setattr,
49 .permission = afs_permission,
50 };
51
52 const struct address_space_operations afs_fs_aops = {
53 .readpage = afs_readpage,
54 .readahead = afs_readahead,
55 .set_page_dirty = afs_set_page_dirty,
56 .launder_page = afs_launder_page,
57 .releasepage = afs_releasepage,
58 .invalidatepage = afs_invalidatepage,
59 .write_begin = afs_write_begin,
60 .write_end = afs_write_end,
61 .writepage = afs_writepage,
62 .writepages = afs_writepages,
63 };
64
65 static const struct vm_operations_struct afs_vm_ops = {
66 .open = afs_vm_open,
67 .close = afs_vm_close,
68 .fault = filemap_fault,
69 .map_pages = afs_vm_map_pages,
70 .page_mkwrite = afs_page_mkwrite,
71 };
72
73 /*
74 * Discard a pin on a writeback key.
75 */
afs_put_wb_key(struct afs_wb_key * wbk)76 void afs_put_wb_key(struct afs_wb_key *wbk)
77 {
78 if (wbk && refcount_dec_and_test(&wbk->usage)) {
79 key_put(wbk->key);
80 kfree(wbk);
81 }
82 }
83
84 /*
85 * Cache key for writeback.
86 */
afs_cache_wb_key(struct afs_vnode * vnode,struct afs_file * af)87 int afs_cache_wb_key(struct afs_vnode *vnode, struct afs_file *af)
88 {
89 struct afs_wb_key *wbk, *p;
90
91 wbk = kzalloc(sizeof(struct afs_wb_key), GFP_KERNEL);
92 if (!wbk)
93 return -ENOMEM;
94 refcount_set(&wbk->usage, 2);
95 wbk->key = af->key;
96
97 spin_lock(&vnode->wb_lock);
98 list_for_each_entry(p, &vnode->wb_keys, vnode_link) {
99 if (p->key == wbk->key)
100 goto found;
101 }
102
103 key_get(wbk->key);
104 list_add_tail(&wbk->vnode_link, &vnode->wb_keys);
105 spin_unlock(&vnode->wb_lock);
106 af->wb = wbk;
107 return 0;
108
109 found:
110 refcount_inc(&p->usage);
111 spin_unlock(&vnode->wb_lock);
112 af->wb = p;
113 kfree(wbk);
114 return 0;
115 }
116
117 /*
118 * open an AFS file or directory and attach a key to it
119 */
afs_open(struct inode * inode,struct file * file)120 int afs_open(struct inode *inode, struct file *file)
121 {
122 struct afs_vnode *vnode = AFS_FS_I(inode);
123 struct afs_file *af;
124 struct key *key;
125 int ret;
126
127 _enter("{%llx:%llu},", vnode->fid.vid, vnode->fid.vnode);
128
129 key = afs_request_key(vnode->volume->cell);
130 if (IS_ERR(key)) {
131 ret = PTR_ERR(key);
132 goto error;
133 }
134
135 af = kzalloc(sizeof(*af), GFP_KERNEL);
136 if (!af) {
137 ret = -ENOMEM;
138 goto error_key;
139 }
140 af->key = key;
141
142 ret = afs_validate(vnode, key);
143 if (ret < 0)
144 goto error_af;
145
146 if (file->f_mode & FMODE_WRITE) {
147 ret = afs_cache_wb_key(vnode, af);
148 if (ret < 0)
149 goto error_af;
150 }
151
152 if (file->f_flags & O_TRUNC)
153 set_bit(AFS_VNODE_NEW_CONTENT, &vnode->flags);
154
155 file->private_data = af;
156 _leave(" = 0");
157 return 0;
158
159 error_af:
160 kfree(af);
161 error_key:
162 key_put(key);
163 error:
164 _leave(" = %d", ret);
165 return ret;
166 }
167
168 /*
169 * release an AFS file or directory and discard its key
170 */
afs_release(struct inode * inode,struct file * file)171 int afs_release(struct inode *inode, struct file *file)
172 {
173 struct afs_vnode *vnode = AFS_FS_I(inode);
174 struct afs_file *af = file->private_data;
175 int ret = 0;
176
177 _enter("{%llx:%llu},", vnode->fid.vid, vnode->fid.vnode);
178
179 if ((file->f_mode & FMODE_WRITE))
180 ret = vfs_fsync(file, 0);
181
182 file->private_data = NULL;
183 if (af->wb)
184 afs_put_wb_key(af->wb);
185 key_put(af->key);
186 kfree(af);
187 afs_prune_wb_keys(vnode);
188 _leave(" = %d", ret);
189 return ret;
190 }
191
192 /*
193 * Allocate a new read record.
194 */
afs_alloc_read(gfp_t gfp)195 struct afs_read *afs_alloc_read(gfp_t gfp)
196 {
197 struct afs_read *req;
198
199 req = kzalloc(sizeof(struct afs_read), gfp);
200 if (req)
201 refcount_set(&req->usage, 1);
202
203 return req;
204 }
205
206 /*
207 * Dispose of a ref to a read record.
208 */
afs_put_read(struct afs_read * req)209 void afs_put_read(struct afs_read *req)
210 {
211 if (refcount_dec_and_test(&req->usage)) {
212 if (req->cleanup)
213 req->cleanup(req);
214 key_put(req->key);
215 kfree(req);
216 }
217 }
218
afs_fetch_data_notify(struct afs_operation * op)219 static void afs_fetch_data_notify(struct afs_operation *op)
220 {
221 struct afs_read *req = op->fetch.req;
222 struct netfs_read_subrequest *subreq = req->subreq;
223 int error = op->error;
224
225 if (error == -ECONNABORTED)
226 error = afs_abort_to_error(op->ac.abort_code);
227 req->error = error;
228
229 if (subreq) {
230 __set_bit(NETFS_SREQ_CLEAR_TAIL, &subreq->flags);
231 netfs_subreq_terminated(subreq, error ?: req->actual_len, false);
232 req->subreq = NULL;
233 } else if (req->done) {
234 req->done(req);
235 }
236 }
237
afs_fetch_data_success(struct afs_operation * op)238 static void afs_fetch_data_success(struct afs_operation *op)
239 {
240 struct afs_vnode *vnode = op->file[0].vnode;
241
242 _enter("op=%08x", op->debug_id);
243 afs_vnode_commit_status(op, &op->file[0]);
244 afs_stat_v(vnode, n_fetches);
245 atomic_long_add(op->fetch.req->actual_len, &op->net->n_fetch_bytes);
246 afs_fetch_data_notify(op);
247 }
248
afs_fetch_data_put(struct afs_operation * op)249 static void afs_fetch_data_put(struct afs_operation *op)
250 {
251 op->fetch.req->error = op->error;
252 afs_put_read(op->fetch.req);
253 }
254
255 static const struct afs_operation_ops afs_fetch_data_operation = {
256 .issue_afs_rpc = afs_fs_fetch_data,
257 .issue_yfs_rpc = yfs_fs_fetch_data,
258 .success = afs_fetch_data_success,
259 .aborted = afs_check_for_remote_deletion,
260 .failed = afs_fetch_data_notify,
261 .put = afs_fetch_data_put,
262 };
263
264 /*
265 * Fetch file data from the volume.
266 */
afs_fetch_data(struct afs_vnode * vnode,struct afs_read * req)267 int afs_fetch_data(struct afs_vnode *vnode, struct afs_read *req)
268 {
269 struct afs_operation *op;
270
271 _enter("%s{%llx:%llu.%u},%x,,,",
272 vnode->volume->name,
273 vnode->fid.vid,
274 vnode->fid.vnode,
275 vnode->fid.unique,
276 key_serial(req->key));
277
278 op = afs_alloc_operation(req->key, vnode->volume);
279 if (IS_ERR(op)) {
280 if (req->subreq)
281 netfs_subreq_terminated(req->subreq, PTR_ERR(op), false);
282 return PTR_ERR(op);
283 }
284
285 afs_op_set_vnode(op, 0, vnode);
286
287 op->fetch.req = afs_get_read(req);
288 op->ops = &afs_fetch_data_operation;
289 return afs_do_sync_operation(op);
290 }
291
afs_req_issue_op(struct netfs_read_subrequest * subreq)292 static void afs_req_issue_op(struct netfs_read_subrequest *subreq)
293 {
294 struct afs_vnode *vnode = AFS_FS_I(subreq->rreq->inode);
295 struct afs_read *fsreq;
296
297 fsreq = afs_alloc_read(GFP_NOFS);
298 if (!fsreq)
299 return netfs_subreq_terminated(subreq, -ENOMEM, false);
300
301 fsreq->subreq = subreq;
302 fsreq->pos = subreq->start + subreq->transferred;
303 fsreq->len = subreq->len - subreq->transferred;
304 fsreq->key = key_get(subreq->rreq->netfs_priv);
305 fsreq->vnode = vnode;
306 fsreq->iter = &fsreq->def_iter;
307
308 iov_iter_xarray(&fsreq->def_iter, READ,
309 &fsreq->vnode->vfs_inode.i_mapping->i_pages,
310 fsreq->pos, fsreq->len);
311
312 afs_fetch_data(fsreq->vnode, fsreq);
313 afs_put_read(fsreq);
314 }
315
afs_symlink_readpage(struct page * page)316 static int afs_symlink_readpage(struct page *page)
317 {
318 struct afs_vnode *vnode = AFS_FS_I(page->mapping->host);
319 struct afs_read *fsreq;
320 int ret;
321
322 fsreq = afs_alloc_read(GFP_NOFS);
323 if (!fsreq)
324 return -ENOMEM;
325
326 fsreq->pos = page->index * PAGE_SIZE;
327 fsreq->len = PAGE_SIZE;
328 fsreq->vnode = vnode;
329 fsreq->iter = &fsreq->def_iter;
330 iov_iter_xarray(&fsreq->def_iter, READ, &page->mapping->i_pages,
331 fsreq->pos, fsreq->len);
332
333 ret = afs_fetch_data(fsreq->vnode, fsreq);
334 page_endio(page, false, ret);
335 return ret;
336 }
337
afs_init_rreq(struct netfs_read_request * rreq,struct file * file)338 static void afs_init_rreq(struct netfs_read_request *rreq, struct file *file)
339 {
340 rreq->netfs_priv = key_get(afs_file_key(file));
341 }
342
afs_is_cache_enabled(struct inode * inode)343 static bool afs_is_cache_enabled(struct inode *inode)
344 {
345 struct fscache_cookie *cookie = afs_vnode_cache(AFS_FS_I(inode));
346
347 return fscache_cookie_enabled(cookie) && !hlist_empty(&cookie->backing_objects);
348 }
349
afs_begin_cache_operation(struct netfs_read_request * rreq)350 static int afs_begin_cache_operation(struct netfs_read_request *rreq)
351 {
352 struct afs_vnode *vnode = AFS_FS_I(rreq->inode);
353
354 return fscache_begin_read_operation(rreq, afs_vnode_cache(vnode));
355 }
356
afs_check_write_begin(struct file * file,loff_t pos,unsigned len,struct page * page,void ** _fsdata)357 static int afs_check_write_begin(struct file *file, loff_t pos, unsigned len,
358 struct page *page, void **_fsdata)
359 {
360 struct afs_vnode *vnode = AFS_FS_I(file_inode(file));
361
362 return test_bit(AFS_VNODE_DELETED, &vnode->flags) ? -ESTALE : 0;
363 }
364
afs_priv_cleanup(struct address_space * mapping,void * netfs_priv)365 static void afs_priv_cleanup(struct address_space *mapping, void *netfs_priv)
366 {
367 key_put(netfs_priv);
368 }
369
370 const struct netfs_read_request_ops afs_req_ops = {
371 .init_rreq = afs_init_rreq,
372 .is_cache_enabled = afs_is_cache_enabled,
373 .begin_cache_operation = afs_begin_cache_operation,
374 .check_write_begin = afs_check_write_begin,
375 .issue_op = afs_req_issue_op,
376 .cleanup = afs_priv_cleanup,
377 };
378
afs_readpage(struct file * file,struct page * page)379 static int afs_readpage(struct file *file, struct page *page)
380 {
381 if (!file)
382 return afs_symlink_readpage(page);
383
384 return netfs_readpage(file, page, &afs_req_ops, NULL);
385 }
386
afs_readahead(struct readahead_control * ractl)387 static void afs_readahead(struct readahead_control *ractl)
388 {
389 netfs_readahead(ractl, &afs_req_ops, NULL);
390 }
391
392 /*
393 * Adjust the dirty region of the page on truncation or full invalidation,
394 * getting rid of the markers altogether if the region is entirely invalidated.
395 */
afs_invalidate_dirty(struct page * page,unsigned int offset,unsigned int length)396 static void afs_invalidate_dirty(struct page *page, unsigned int offset,
397 unsigned int length)
398 {
399 struct afs_vnode *vnode = AFS_FS_I(page->mapping->host);
400 unsigned long priv;
401 unsigned int f, t, end = offset + length;
402
403 priv = page_private(page);
404
405 /* we clean up only if the entire page is being invalidated */
406 if (offset == 0 && length == thp_size(page))
407 goto full_invalidate;
408
409 /* If the page was dirtied by page_mkwrite(), the PTE stays writable
410 * and we don't get another notification to tell us to expand it
411 * again.
412 */
413 if (afs_is_page_dirty_mmapped(priv))
414 return;
415
416 /* We may need to shorten the dirty region */
417 f = afs_page_dirty_from(page, priv);
418 t = afs_page_dirty_to(page, priv);
419
420 if (t <= offset || f >= end)
421 return; /* Doesn't overlap */
422
423 if (f < offset && t > end)
424 return; /* Splits the dirty region - just absorb it */
425
426 if (f >= offset && t <= end)
427 goto undirty;
428
429 if (f < offset)
430 t = offset;
431 else
432 f = end;
433 if (f == t)
434 goto undirty;
435
436 priv = afs_page_dirty(page, f, t);
437 set_page_private(page, priv);
438 trace_afs_page_dirty(vnode, tracepoint_string("trunc"), page);
439 return;
440
441 undirty:
442 trace_afs_page_dirty(vnode, tracepoint_string("undirty"), page);
443 clear_page_dirty_for_io(page);
444 full_invalidate:
445 trace_afs_page_dirty(vnode, tracepoint_string("inval"), page);
446 detach_page_private(page);
447 }
448
449 /*
450 * invalidate part or all of a page
451 * - release a page and clean up its private data if offset is 0 (indicating
452 * the entire page)
453 */
afs_invalidatepage(struct page * page,unsigned int offset,unsigned int length)454 static void afs_invalidatepage(struct page *page, unsigned int offset,
455 unsigned int length)
456 {
457 _enter("{%lu},%u,%u", page->index, offset, length);
458
459 BUG_ON(!PageLocked(page));
460
461 if (PagePrivate(page))
462 afs_invalidate_dirty(page, offset, length);
463
464 wait_on_page_fscache(page);
465 _leave("");
466 }
467
468 /*
469 * release a page and clean up its private state if it's not busy
470 * - return true if the page can now be released, false if not
471 */
afs_releasepage(struct page * page,gfp_t gfp_flags)472 static int afs_releasepage(struct page *page, gfp_t gfp_flags)
473 {
474 struct afs_vnode *vnode = AFS_FS_I(page->mapping->host);
475
476 _enter("{{%llx:%llu}[%lu],%lx},%x",
477 vnode->fid.vid, vnode->fid.vnode, page->index, page->flags,
478 gfp_flags);
479
480 /* deny if page is being written to the cache and the caller hasn't
481 * elected to wait */
482 #ifdef CONFIG_AFS_FSCACHE
483 if (PageFsCache(page)) {
484 if (!(gfp_flags & __GFP_DIRECT_RECLAIM) || !(gfp_flags & __GFP_FS))
485 return false;
486 wait_on_page_fscache(page);
487 }
488 #endif
489
490 if (PagePrivate(page)) {
491 trace_afs_page_dirty(vnode, tracepoint_string("rel"), page);
492 detach_page_private(page);
493 }
494
495 /* indicate that the page can be released */
496 _leave(" = T");
497 return 1;
498 }
499
afs_add_open_mmap(struct afs_vnode * vnode)500 static void afs_add_open_mmap(struct afs_vnode *vnode)
501 {
502 if (atomic_inc_return(&vnode->cb_nr_mmap) == 1) {
503 down_write(&vnode->volume->cell->fs_open_mmaps_lock);
504
505 if (list_empty(&vnode->cb_mmap_link))
506 list_add_tail(&vnode->cb_mmap_link,
507 &vnode->volume->cell->fs_open_mmaps);
508
509 up_write(&vnode->volume->cell->fs_open_mmaps_lock);
510 }
511 }
512
afs_drop_open_mmap(struct afs_vnode * vnode)513 static void afs_drop_open_mmap(struct afs_vnode *vnode)
514 {
515 if (!atomic_dec_and_test(&vnode->cb_nr_mmap))
516 return;
517
518 down_write(&vnode->volume->cell->fs_open_mmaps_lock);
519
520 if (atomic_read(&vnode->cb_nr_mmap) == 0)
521 list_del_init(&vnode->cb_mmap_link);
522
523 up_write(&vnode->volume->cell->fs_open_mmaps_lock);
524 flush_work(&vnode->cb_work);
525 }
526
527 /*
528 * Handle setting up a memory mapping on an AFS file.
529 */
afs_file_mmap(struct file * file,struct vm_area_struct * vma)530 static int afs_file_mmap(struct file *file, struct vm_area_struct *vma)
531 {
532 struct afs_vnode *vnode = AFS_FS_I(file_inode(file));
533 int ret;
534
535 afs_add_open_mmap(vnode);
536
537 ret = generic_file_mmap(file, vma);
538 if (ret == 0)
539 vma->vm_ops = &afs_vm_ops;
540 else
541 afs_drop_open_mmap(vnode);
542 return ret;
543 }
544
afs_vm_open(struct vm_area_struct * vma)545 static void afs_vm_open(struct vm_area_struct *vma)
546 {
547 afs_add_open_mmap(AFS_FS_I(file_inode(vma->vm_file)));
548 }
549
afs_vm_close(struct vm_area_struct * vma)550 static void afs_vm_close(struct vm_area_struct *vma)
551 {
552 afs_drop_open_mmap(AFS_FS_I(file_inode(vma->vm_file)));
553 }
554
afs_vm_map_pages(struct vm_fault * vmf,pgoff_t start_pgoff,pgoff_t end_pgoff)555 static vm_fault_t afs_vm_map_pages(struct vm_fault *vmf, pgoff_t start_pgoff, pgoff_t end_pgoff)
556 {
557 struct afs_vnode *vnode = AFS_FS_I(file_inode(vmf->vma->vm_file));
558 struct afs_file *af = vmf->vma->vm_file->private_data;
559
560 switch (afs_validate(vnode, af->key)) {
561 case 0:
562 return filemap_map_pages(vmf, start_pgoff, end_pgoff);
563 case -ENOMEM:
564 return VM_FAULT_OOM;
565 case -EINTR:
566 case -ERESTARTSYS:
567 return VM_FAULT_RETRY;
568 case -ESTALE:
569 default:
570 return VM_FAULT_SIGBUS;
571 }
572 }
573
afs_file_read_iter(struct kiocb * iocb,struct iov_iter * iter)574 static ssize_t afs_file_read_iter(struct kiocb *iocb, struct iov_iter *iter)
575 {
576 struct afs_vnode *vnode = AFS_FS_I(file_inode(iocb->ki_filp));
577 struct afs_file *af = iocb->ki_filp->private_data;
578 int ret;
579
580 ret = afs_validate(vnode, af->key);
581 if (ret < 0)
582 return ret;
583
584 return generic_file_read_iter(iocb, iter);
585 }
586