1 // SPDX-License-Identifier: GPL-2.0-or-later
2 /* AFS filesystem file handling
3 *
4 * Copyright (C) 2002, 2007 Red Hat, Inc. All Rights Reserved.
5 * Written by David Howells (dhowells@redhat.com)
6 */
7
8 #include <linux/kernel.h>
9 #include <linux/module.h>
10 #include <linux/init.h>
11 #include <linux/fs.h>
12 #include <linux/pagemap.h>
13 #include <linux/writeback.h>
14 #include <linux/gfp.h>
15 #include <linux/task_io_accounting_ops.h>
16 #include <linux/mm.h>
17 #include <linux/swap.h>
18 #include <linux/netfs.h>
19 #include "internal.h"
20
21 static int afs_file_mmap(struct file *file, struct vm_area_struct *vma);
22 static int afs_symlink_read_folio(struct file *file, struct folio *folio);
23 static void afs_invalidate_folio(struct folio *folio, size_t offset,
24 size_t length);
25 static bool afs_release_folio(struct folio *folio, gfp_t gfp_flags);
26
27 static ssize_t afs_file_read_iter(struct kiocb *iocb, struct iov_iter *iter);
28 static ssize_t afs_file_splice_read(struct file *in, loff_t *ppos,
29 struct pipe_inode_info *pipe,
30 size_t len, unsigned int flags);
31 static void afs_vm_open(struct vm_area_struct *area);
32 static void afs_vm_close(struct vm_area_struct *area);
33 static vm_fault_t afs_vm_map_pages(struct vm_fault *vmf, pgoff_t start_pgoff, pgoff_t end_pgoff);
34
35 const struct file_operations afs_file_operations = {
36 .open = afs_open,
37 .release = afs_release,
38 .llseek = generic_file_llseek,
39 .read_iter = afs_file_read_iter,
40 .write_iter = afs_file_write,
41 .mmap = afs_file_mmap,
42 .splice_read = afs_file_splice_read,
43 .splice_write = iter_file_splice_write,
44 .fsync = afs_fsync,
45 .lock = afs_lock,
46 .flock = afs_flock,
47 };
48
49 const struct inode_operations afs_file_inode_operations = {
50 .getattr = afs_getattr,
51 .setattr = afs_setattr,
52 .permission = afs_permission,
53 };
54
55 const struct address_space_operations afs_file_aops = {
56 .read_folio = netfs_read_folio,
57 .readahead = netfs_readahead,
58 .dirty_folio = afs_dirty_folio,
59 .launder_folio = afs_launder_folio,
60 .release_folio = afs_release_folio,
61 .invalidate_folio = afs_invalidate_folio,
62 .write_begin = afs_write_begin,
63 .write_end = afs_write_end,
64 .writepages = afs_writepages,
65 .migrate_folio = filemap_migrate_folio,
66 };
67
68 const struct address_space_operations afs_symlink_aops = {
69 .read_folio = afs_symlink_read_folio,
70 .release_folio = afs_release_folio,
71 .invalidate_folio = afs_invalidate_folio,
72 .migrate_folio = filemap_migrate_folio,
73 };
74
75 static const struct vm_operations_struct afs_vm_ops = {
76 .open = afs_vm_open,
77 .close = afs_vm_close,
78 .fault = filemap_fault,
79 .map_pages = afs_vm_map_pages,
80 .page_mkwrite = afs_page_mkwrite,
81 };
82
83 /*
84 * Discard a pin on a writeback key.
85 */
afs_put_wb_key(struct afs_wb_key * wbk)86 void afs_put_wb_key(struct afs_wb_key *wbk)
87 {
88 if (wbk && refcount_dec_and_test(&wbk->usage)) {
89 key_put(wbk->key);
90 kfree(wbk);
91 }
92 }
93
94 /*
95 * Cache key for writeback.
96 */
afs_cache_wb_key(struct afs_vnode * vnode,struct afs_file * af)97 int afs_cache_wb_key(struct afs_vnode *vnode, struct afs_file *af)
98 {
99 struct afs_wb_key *wbk, *p;
100
101 wbk = kzalloc(sizeof(struct afs_wb_key), GFP_KERNEL);
102 if (!wbk)
103 return -ENOMEM;
104 refcount_set(&wbk->usage, 2);
105 wbk->key = af->key;
106
107 spin_lock(&vnode->wb_lock);
108 list_for_each_entry(p, &vnode->wb_keys, vnode_link) {
109 if (p->key == wbk->key)
110 goto found;
111 }
112
113 key_get(wbk->key);
114 list_add_tail(&wbk->vnode_link, &vnode->wb_keys);
115 spin_unlock(&vnode->wb_lock);
116 af->wb = wbk;
117 return 0;
118
119 found:
120 refcount_inc(&p->usage);
121 spin_unlock(&vnode->wb_lock);
122 af->wb = p;
123 kfree(wbk);
124 return 0;
125 }
126
127 /*
128 * open an AFS file or directory and attach a key to it
129 */
afs_open(struct inode * inode,struct file * file)130 int afs_open(struct inode *inode, struct file *file)
131 {
132 struct afs_vnode *vnode = AFS_FS_I(inode);
133 struct afs_file *af;
134 struct key *key;
135 int ret;
136
137 _enter("{%llx:%llu},", vnode->fid.vid, vnode->fid.vnode);
138
139 key = afs_request_key(vnode->volume->cell);
140 if (IS_ERR(key)) {
141 ret = PTR_ERR(key);
142 goto error;
143 }
144
145 af = kzalloc(sizeof(*af), GFP_KERNEL);
146 if (!af) {
147 ret = -ENOMEM;
148 goto error_key;
149 }
150 af->key = key;
151
152 ret = afs_validate(vnode, key);
153 if (ret < 0)
154 goto error_af;
155
156 if (file->f_mode & FMODE_WRITE) {
157 ret = afs_cache_wb_key(vnode, af);
158 if (ret < 0)
159 goto error_af;
160 }
161
162 if (file->f_flags & O_TRUNC)
163 set_bit(AFS_VNODE_NEW_CONTENT, &vnode->flags);
164
165 fscache_use_cookie(afs_vnode_cache(vnode), file->f_mode & FMODE_WRITE);
166
167 file->private_data = af;
168 _leave(" = 0");
169 return 0;
170
171 error_af:
172 kfree(af);
173 error_key:
174 key_put(key);
175 error:
176 _leave(" = %d", ret);
177 return ret;
178 }
179
180 /*
181 * release an AFS file or directory and discard its key
182 */
afs_release(struct inode * inode,struct file * file)183 int afs_release(struct inode *inode, struct file *file)
184 {
185 struct afs_vnode_cache_aux aux;
186 struct afs_vnode *vnode = AFS_FS_I(inode);
187 struct afs_file *af = file->private_data;
188 loff_t i_size;
189 int ret = 0;
190
191 _enter("{%llx:%llu},", vnode->fid.vid, vnode->fid.vnode);
192
193 if ((file->f_mode & FMODE_WRITE))
194 ret = vfs_fsync(file, 0);
195
196 file->private_data = NULL;
197 if (af->wb)
198 afs_put_wb_key(af->wb);
199
200 if ((file->f_mode & FMODE_WRITE)) {
201 i_size = i_size_read(&vnode->netfs.inode);
202 afs_set_cache_aux(vnode, &aux);
203 fscache_unuse_cookie(afs_vnode_cache(vnode), &aux, &i_size);
204 } else {
205 fscache_unuse_cookie(afs_vnode_cache(vnode), NULL, NULL);
206 }
207
208 key_put(af->key);
209 kfree(af);
210 afs_prune_wb_keys(vnode);
211 _leave(" = %d", ret);
212 return ret;
213 }
214
215 /*
216 * Allocate a new read record.
217 */
afs_alloc_read(gfp_t gfp)218 struct afs_read *afs_alloc_read(gfp_t gfp)
219 {
220 struct afs_read *req;
221
222 req = kzalloc(sizeof(struct afs_read), gfp);
223 if (req)
224 refcount_set(&req->usage, 1);
225
226 return req;
227 }
228
229 /*
230 * Dispose of a ref to a read record.
231 */
afs_put_read(struct afs_read * req)232 void afs_put_read(struct afs_read *req)
233 {
234 if (refcount_dec_and_test(&req->usage)) {
235 if (req->cleanup)
236 req->cleanup(req);
237 key_put(req->key);
238 kfree(req);
239 }
240 }
241
afs_fetch_data_notify(struct afs_operation * op)242 static void afs_fetch_data_notify(struct afs_operation *op)
243 {
244 struct afs_read *req = op->fetch.req;
245 struct netfs_io_subrequest *subreq = req->subreq;
246 int error = op->error;
247
248 if (error == -ECONNABORTED)
249 error = afs_abort_to_error(op->ac.abort_code);
250 req->error = error;
251
252 if (subreq) {
253 __set_bit(NETFS_SREQ_CLEAR_TAIL, &subreq->flags);
254 netfs_subreq_terminated(subreq, error ?: req->actual_len, false);
255 req->subreq = NULL;
256 } else if (req->done) {
257 req->done(req);
258 }
259 }
260
afs_fetch_data_success(struct afs_operation * op)261 static void afs_fetch_data_success(struct afs_operation *op)
262 {
263 struct afs_vnode *vnode = op->file[0].vnode;
264
265 _enter("op=%08x", op->debug_id);
266 afs_vnode_commit_status(op, &op->file[0]);
267 afs_stat_v(vnode, n_fetches);
268 atomic_long_add(op->fetch.req->actual_len, &op->net->n_fetch_bytes);
269 afs_fetch_data_notify(op);
270 }
271
afs_fetch_data_put(struct afs_operation * op)272 static void afs_fetch_data_put(struct afs_operation *op)
273 {
274 op->fetch.req->error = op->error;
275 afs_put_read(op->fetch.req);
276 }
277
278 static const struct afs_operation_ops afs_fetch_data_operation = {
279 .issue_afs_rpc = afs_fs_fetch_data,
280 .issue_yfs_rpc = yfs_fs_fetch_data,
281 .success = afs_fetch_data_success,
282 .aborted = afs_check_for_remote_deletion,
283 .failed = afs_fetch_data_notify,
284 .put = afs_fetch_data_put,
285 };
286
287 /*
288 * Fetch file data from the volume.
289 */
afs_fetch_data(struct afs_vnode * vnode,struct afs_read * req)290 int afs_fetch_data(struct afs_vnode *vnode, struct afs_read *req)
291 {
292 struct afs_operation *op;
293
294 _enter("%s{%llx:%llu.%u},%x,,,",
295 vnode->volume->name,
296 vnode->fid.vid,
297 vnode->fid.vnode,
298 vnode->fid.unique,
299 key_serial(req->key));
300
301 op = afs_alloc_operation(req->key, vnode->volume);
302 if (IS_ERR(op)) {
303 if (req->subreq)
304 netfs_subreq_terminated(req->subreq, PTR_ERR(op), false);
305 return PTR_ERR(op);
306 }
307
308 afs_op_set_vnode(op, 0, vnode);
309
310 op->fetch.req = afs_get_read(req);
311 op->ops = &afs_fetch_data_operation;
312 return afs_do_sync_operation(op);
313 }
314
afs_issue_read(struct netfs_io_subrequest * subreq)315 static void afs_issue_read(struct netfs_io_subrequest *subreq)
316 {
317 struct afs_vnode *vnode = AFS_FS_I(subreq->rreq->inode);
318 struct afs_read *fsreq;
319
320 fsreq = afs_alloc_read(GFP_NOFS);
321 if (!fsreq)
322 return netfs_subreq_terminated(subreq, -ENOMEM, false);
323
324 fsreq->subreq = subreq;
325 fsreq->pos = subreq->start + subreq->transferred;
326 fsreq->len = subreq->len - subreq->transferred;
327 fsreq->key = key_get(subreq->rreq->netfs_priv);
328 fsreq->vnode = vnode;
329 fsreq->iter = &fsreq->def_iter;
330
331 iov_iter_xarray(&fsreq->def_iter, ITER_DEST,
332 &fsreq->vnode->netfs.inode.i_mapping->i_pages,
333 fsreq->pos, fsreq->len);
334
335 afs_fetch_data(fsreq->vnode, fsreq);
336 afs_put_read(fsreq);
337 }
338
afs_symlink_read_folio(struct file * file,struct folio * folio)339 static int afs_symlink_read_folio(struct file *file, struct folio *folio)
340 {
341 struct afs_vnode *vnode = AFS_FS_I(folio->mapping->host);
342 struct afs_read *fsreq;
343 int ret;
344
345 fsreq = afs_alloc_read(GFP_NOFS);
346 if (!fsreq)
347 return -ENOMEM;
348
349 fsreq->pos = folio_pos(folio);
350 fsreq->len = folio_size(folio);
351 fsreq->vnode = vnode;
352 fsreq->iter = &fsreq->def_iter;
353 iov_iter_xarray(&fsreq->def_iter, ITER_DEST, &folio->mapping->i_pages,
354 fsreq->pos, fsreq->len);
355
356 ret = afs_fetch_data(fsreq->vnode, fsreq);
357 if (ret == 0)
358 folio_mark_uptodate(folio);
359 folio_unlock(folio);
360 return ret;
361 }
362
afs_init_request(struct netfs_io_request * rreq,struct file * file)363 static int afs_init_request(struct netfs_io_request *rreq, struct file *file)
364 {
365 rreq->netfs_priv = key_get(afs_file_key(file));
366 return 0;
367 }
368
afs_begin_cache_operation(struct netfs_io_request * rreq)369 static int afs_begin_cache_operation(struct netfs_io_request *rreq)
370 {
371 #ifdef CONFIG_AFS_FSCACHE
372 struct afs_vnode *vnode = AFS_FS_I(rreq->inode);
373
374 return fscache_begin_read_operation(&rreq->cache_resources,
375 afs_vnode_cache(vnode));
376 #else
377 return -ENOBUFS;
378 #endif
379 }
380
/*
 * netfs ->check_write_begin() hook: refuse the write with -ESTALE if the
 * vnode has been flagged as deleted, otherwise return 0.  Only @file is
 * examined.
 */
static int afs_check_write_begin(struct file *file, loff_t pos, unsigned len,
				 struct folio **foliop, void **_fsdata)
{
	struct afs_vnode *vnode = AFS_FS_I(file_inode(file));

	if (test_bit(AFS_VNODE_DELETED, &vnode->flags))
		return -ESTALE;

	return 0;
}
388
afs_free_request(struct netfs_io_request * rreq)389 static void afs_free_request(struct netfs_io_request *rreq)
390 {
391 key_put(rreq->netfs_priv);
392 }
393
394 const struct netfs_request_ops afs_req_ops = {
395 .init_request = afs_init_request,
396 .free_request = afs_free_request,
397 .begin_cache_operation = afs_begin_cache_operation,
398 .check_write_begin = afs_check_write_begin,
399 .issue_read = afs_issue_read,
400 };
401
/*
 * Inode writeback hook: passes the writeback control and the vnode's cache
 * cookie to fscache_unpin_writeback().  Always returns 0.
 */
int afs_write_inode(struct inode *inode, struct writeback_control *wbc)
{
	struct afs_vnode *vnode = AFS_FS_I(inode);

	fscache_unpin_writeback(wbc, afs_vnode_cache(vnode));
	return 0;
}
407
408 /*
409 * Adjust the dirty region of the page on truncation or full invalidation,
410 * getting rid of the markers altogether if the region is entirely invalidated.
411 */
afs_invalidate_dirty(struct folio * folio,size_t offset,size_t length)412 static void afs_invalidate_dirty(struct folio *folio, size_t offset,
413 size_t length)
414 {
415 struct afs_vnode *vnode = AFS_FS_I(folio_inode(folio));
416 unsigned long priv;
417 unsigned int f, t, end = offset + length;
418
419 priv = (unsigned long)folio_get_private(folio);
420
421 /* we clean up only if the entire page is being invalidated */
422 if (offset == 0 && length == folio_size(folio))
423 goto full_invalidate;
424
425 /* If the page was dirtied by page_mkwrite(), the PTE stays writable
426 * and we don't get another notification to tell us to expand it
427 * again.
428 */
429 if (afs_is_folio_dirty_mmapped(priv))
430 return;
431
432 /* We may need to shorten the dirty region */
433 f = afs_folio_dirty_from(folio, priv);
434 t = afs_folio_dirty_to(folio, priv);
435
436 if (t <= offset || f >= end)
437 return; /* Doesn't overlap */
438
439 if (f < offset && t > end)
440 return; /* Splits the dirty region - just absorb it */
441
442 if (f >= offset && t <= end)
443 goto undirty;
444
445 if (f < offset)
446 t = offset;
447 else
448 f = end;
449 if (f == t)
450 goto undirty;
451
452 priv = afs_folio_dirty(folio, f, t);
453 folio_change_private(folio, (void *)priv);
454 trace_afs_folio_dirty(vnode, tracepoint_string("trunc"), folio);
455 return;
456
457 undirty:
458 trace_afs_folio_dirty(vnode, tracepoint_string("undirty"), folio);
459 folio_clear_dirty_for_io(folio);
460 full_invalidate:
461 trace_afs_folio_dirty(vnode, tracepoint_string("inval"), folio);
462 folio_detach_private(folio);
463 }
464
465 /*
466 * invalidate part or all of a page
467 * - release a page and clean up its private data if offset is 0 (indicating
468 * the entire page)
469 */
afs_invalidate_folio(struct folio * folio,size_t offset,size_t length)470 static void afs_invalidate_folio(struct folio *folio, size_t offset,
471 size_t length)
472 {
473 _enter("{%lu},%zu,%zu", folio->index, offset, length);
474
475 BUG_ON(!folio_test_locked(folio));
476
477 if (folio_get_private(folio))
478 afs_invalidate_dirty(folio, offset, length);
479
480 folio_wait_fscache(folio);
481 _leave("");
482 }
483
484 /*
485 * release a page and clean up its private state if it's not busy
486 * - return true if the page can now be released, false if not
487 */
afs_release_folio(struct folio * folio,gfp_t gfp)488 static bool afs_release_folio(struct folio *folio, gfp_t gfp)
489 {
490 struct afs_vnode *vnode = AFS_FS_I(folio_inode(folio));
491
492 _enter("{{%llx:%llu}[%lu],%lx},%x",
493 vnode->fid.vid, vnode->fid.vnode, folio_index(folio), folio->flags,
494 gfp);
495
496 /* deny if folio is being written to the cache and the caller hasn't
497 * elected to wait */
498 #ifdef CONFIG_AFS_FSCACHE
499 if (folio_test_fscache(folio)) {
500 if (current_is_kswapd() || !(gfp & __GFP_FS))
501 return false;
502 folio_wait_fscache(folio);
503 }
504 fscache_note_page_release(afs_vnode_cache(vnode));
505 #endif
506
507 if (folio_test_private(folio)) {
508 trace_afs_folio_dirty(vnode, tracepoint_string("rel"), folio);
509 folio_detach_private(folio);
510 }
511
512 /* Indicate that the folio can be released */
513 _leave(" = T");
514 return true;
515 }
516
afs_add_open_mmap(struct afs_vnode * vnode)517 static void afs_add_open_mmap(struct afs_vnode *vnode)
518 {
519 if (atomic_inc_return(&vnode->cb_nr_mmap) == 1) {
520 down_write(&vnode->volume->cell->fs_open_mmaps_lock);
521
522 if (list_empty(&vnode->cb_mmap_link))
523 list_add_tail(&vnode->cb_mmap_link,
524 &vnode->volume->cell->fs_open_mmaps);
525
526 up_write(&vnode->volume->cell->fs_open_mmaps_lock);
527 }
528 }
529
afs_drop_open_mmap(struct afs_vnode * vnode)530 static void afs_drop_open_mmap(struct afs_vnode *vnode)
531 {
532 if (atomic_add_unless(&vnode->cb_nr_mmap, -1, 1))
533 return;
534
535 down_write(&vnode->volume->cell->fs_open_mmaps_lock);
536
537 read_seqlock_excl(&vnode->cb_lock);
538 // the only place where ->cb_nr_mmap may hit 0
539 // see __afs_break_callback() for the other side...
540 if (atomic_dec_and_test(&vnode->cb_nr_mmap))
541 list_del_init(&vnode->cb_mmap_link);
542 read_sequnlock_excl(&vnode->cb_lock);
543
544 up_write(&vnode->volume->cell->fs_open_mmaps_lock);
545 flush_work(&vnode->cb_work);
546 }
547
548 /*
549 * Handle setting up a memory mapping on an AFS file.
550 */
afs_file_mmap(struct file * file,struct vm_area_struct * vma)551 static int afs_file_mmap(struct file *file, struct vm_area_struct *vma)
552 {
553 struct afs_vnode *vnode = AFS_FS_I(file_inode(file));
554 int ret;
555
556 afs_add_open_mmap(vnode);
557
558 ret = generic_file_mmap(file, vma);
559 if (ret == 0)
560 vma->vm_ops = &afs_vm_ops;
561 else
562 afs_drop_open_mmap(vnode);
563 return ret;
564 }
565
afs_vm_open(struct vm_area_struct * vma)566 static void afs_vm_open(struct vm_area_struct *vma)
567 {
568 afs_add_open_mmap(AFS_FS_I(file_inode(vma->vm_file)));
569 }
570
afs_vm_close(struct vm_area_struct * vma)571 static void afs_vm_close(struct vm_area_struct *vma)
572 {
573 afs_drop_open_mmap(AFS_FS_I(file_inode(vma->vm_file)));
574 }
575
afs_vm_map_pages(struct vm_fault * vmf,pgoff_t start_pgoff,pgoff_t end_pgoff)576 static vm_fault_t afs_vm_map_pages(struct vm_fault *vmf, pgoff_t start_pgoff, pgoff_t end_pgoff)
577 {
578 struct afs_vnode *vnode = AFS_FS_I(file_inode(vmf->vma->vm_file));
579
580 if (afs_pagecache_valid(vnode))
581 return filemap_map_pages(vmf, start_pgoff, end_pgoff);
582 return 0;
583 }
584
afs_file_read_iter(struct kiocb * iocb,struct iov_iter * iter)585 static ssize_t afs_file_read_iter(struct kiocb *iocb, struct iov_iter *iter)
586 {
587 struct afs_vnode *vnode = AFS_FS_I(file_inode(iocb->ki_filp));
588 struct afs_file *af = iocb->ki_filp->private_data;
589 int ret;
590
591 ret = afs_validate(vnode, af->key);
592 if (ret < 0)
593 return ret;
594
595 return generic_file_read_iter(iocb, iter);
596 }
597
afs_file_splice_read(struct file * in,loff_t * ppos,struct pipe_inode_info * pipe,size_t len,unsigned int flags)598 static ssize_t afs_file_splice_read(struct file *in, loff_t *ppos,
599 struct pipe_inode_info *pipe,
600 size_t len, unsigned int flags)
601 {
602 struct afs_vnode *vnode = AFS_FS_I(file_inode(in));
603 struct afs_file *af = in->private_data;
604 int ret;
605
606 ret = afs_validate(vnode, af->key);
607 if (ret < 0)
608 return ret;
609
610 return filemap_splice_read(in, ppos, pipe, len, flags);
611 }
612