1 // SPDX-License-Identifier: GPL-2.0-or-later 2 /* AFS filesystem file handling 3 * 4 * Copyright (C) 2002, 2007 Red Hat, Inc. All Rights Reserved. 5 * Written by David Howells (dhowells@redhat.com) 6 */ 7 8 #include <linux/kernel.h> 9 #include <linux/module.h> 10 #include <linux/init.h> 11 #include <linux/fs.h> 12 #include <linux/pagemap.h> 13 #include <linux/writeback.h> 14 #include <linux/gfp.h> 15 #include <linux/task_io_accounting_ops.h> 16 #include <linux/mm.h> 17 #include <linux/swap.h> 18 #include <linux/netfs.h> 19 #include "internal.h" 20 21 static int afs_file_mmap(struct file *file, struct vm_area_struct *vma); 22 static int afs_readpage(struct file *file, struct page *page); 23 static int afs_symlink_readpage(struct file *file, struct page *page); 24 static void afs_invalidate_folio(struct folio *folio, size_t offset, 25 size_t length); 26 static int afs_releasepage(struct page *page, gfp_t gfp_flags); 27 28 static void afs_readahead(struct readahead_control *ractl); 29 static ssize_t afs_file_read_iter(struct kiocb *iocb, struct iov_iter *iter); 30 static void afs_vm_open(struct vm_area_struct *area); 31 static void afs_vm_close(struct vm_area_struct *area); 32 static vm_fault_t afs_vm_map_pages(struct vm_fault *vmf, pgoff_t start_pgoff, pgoff_t end_pgoff); 33 34 const struct file_operations afs_file_operations = { 35 .open = afs_open, 36 .release = afs_release, 37 .llseek = generic_file_llseek, 38 .read_iter = afs_file_read_iter, 39 .write_iter = afs_file_write, 40 .mmap = afs_file_mmap, 41 .splice_read = generic_file_splice_read, 42 .splice_write = iter_file_splice_write, 43 .fsync = afs_fsync, 44 .lock = afs_lock, 45 .flock = afs_flock, 46 }; 47 48 const struct inode_operations afs_file_inode_operations = { 49 .getattr = afs_getattr, 50 .setattr = afs_setattr, 51 .permission = afs_permission, 52 }; 53 54 const struct address_space_operations afs_file_aops = { 55 .readpage = afs_readpage, 56 .readahead = afs_readahead, 57 .dirty_folio = afs_dirty_folio, 58 .launder_folio = afs_launder_folio, 59 .releasepage = afs_releasepage, 60 .invalidate_folio = afs_invalidate_folio, 61 .write_begin = afs_write_begin, 62 .write_end = afs_write_end, 63 .writepage = afs_writepage, 64 .writepages = afs_writepages, 65 }; 66 67 const struct address_space_operations afs_symlink_aops = { 68 .readpage = afs_symlink_readpage, 69 .releasepage = afs_releasepage, 70 .invalidate_folio = afs_invalidate_folio, 71 }; 72 73 static const struct vm_operations_struct afs_vm_ops = { 74 .open = afs_vm_open, 75 .close = afs_vm_close, 76 .fault = filemap_fault, 77 .map_pages = afs_vm_map_pages, 78 .page_mkwrite = afs_page_mkwrite, 79 }; 80 81 /* 82 * Discard a pin on a writeback key. 83 */ 84 void afs_put_wb_key(struct afs_wb_key *wbk) 85 { 86 if (wbk && refcount_dec_and_test(&wbk->usage)) { 87 key_put(wbk->key); 88 kfree(wbk); 89 } 90 } 91 92 /* 93 * Cache key for writeback. 94 */ 95 int afs_cache_wb_key(struct afs_vnode *vnode, struct afs_file *af) 96 { 97 struct afs_wb_key *wbk, *p; 98 99 wbk = kzalloc(sizeof(struct afs_wb_key), GFP_KERNEL); 100 if (!wbk) 101 return -ENOMEM; 102 refcount_set(&wbk->usage, 2); 103 wbk->key = af->key; 104 105 spin_lock(&vnode->wb_lock); 106 list_for_each_entry(p, &vnode->wb_keys, vnode_link) { 107 if (p->key == wbk->key) 108 goto found; 109 } 110 111 key_get(wbk->key); 112 list_add_tail(&wbk->vnode_link, &vnode->wb_keys); 113 spin_unlock(&vnode->wb_lock); 114 af->wb = wbk; 115 return 0; 116 117 found: 118 refcount_inc(&p->usage); 119 spin_unlock(&vnode->wb_lock); 120 af->wb = p; 121 kfree(wbk); 122 return 0; 123 } 124 125 /* 126 * open an AFS file or directory and attach a key to it 127 */ 128 int afs_open(struct inode *inode, struct file *file) 129 { 130 struct afs_vnode *vnode = AFS_FS_I(inode); 131 struct afs_file *af; 132 struct key *key; 133 int ret; 134 135 _enter("{%llx:%llu},", vnode->fid.vid, vnode->fid.vnode); 136 137 key = afs_request_key(vnode->volume->cell); 138 if (IS_ERR(key)) { 139 ret = PTR_ERR(key); 140 goto error; 141 } 142 143 af = kzalloc(sizeof(*af), GFP_KERNEL); 144 if (!af) { 145 ret = -ENOMEM; 146 goto error_key; 147 } 148 af->key = key; 149 150 ret = afs_validate(vnode, key); 151 if (ret < 0) 152 goto error_af; 153 154 if (file->f_mode & FMODE_WRITE) { 155 ret = afs_cache_wb_key(vnode, af); 156 if (ret < 0) 157 goto error_af; 158 } 159 160 if (file->f_flags & O_TRUNC) 161 set_bit(AFS_VNODE_NEW_CONTENT, &vnode->flags); 162 163 fscache_use_cookie(afs_vnode_cache(vnode), file->f_mode & FMODE_WRITE); 164 165 file->private_data = af; 166 _leave(" = 0"); 167 return 0; 168 169 error_af: 170 kfree(af); 171 error_key: 172 key_put(key); 173 error: 174 _leave(" = %d", ret); 175 return ret; 176 } 177 178 /* 179 * release an AFS file or directory and discard its key 180 */ 181 int afs_release(struct inode *inode, struct file *file) 182 { 183 struct afs_vnode_cache_aux aux; 184 struct afs_vnode *vnode = AFS_FS_I(inode); 185 struct afs_file *af = file->private_data; 186 loff_t i_size; 187 int ret = 0; 188 189 _enter("{%llx:%llu},", vnode->fid.vid, vnode->fid.vnode); 190 191 if ((file->f_mode & FMODE_WRITE)) 192 ret = vfs_fsync(file, 0); 193 194 file->private_data = NULL; 195 if (af->wb) 196 afs_put_wb_key(af->wb); 197 198 if ((file->f_mode & FMODE_WRITE)) { 199 i_size = i_size_read(&vnode->vfs_inode); 200 afs_set_cache_aux(vnode, &aux); 201 fscache_unuse_cookie(afs_vnode_cache(vnode), &aux, &i_size); 202 } else { 203 fscache_unuse_cookie(afs_vnode_cache(vnode), NULL, NULL); 204 } 205 206 key_put(af->key); 207 kfree(af); 208 afs_prune_wb_keys(vnode); 209 _leave(" = %d", ret); 210 return ret; 211 } 212 213 /* 214 * Allocate a new read record. 215 */ 216 struct afs_read *afs_alloc_read(gfp_t gfp) 217 { 218 struct afs_read *req; 219 220 req = kzalloc(sizeof(struct afs_read), gfp); 221 if (req) 222 refcount_set(&req->usage, 1); 223 224 return req; 225 } 226 227 /* 228 * Dispose of a ref to a read record. 229 */ 230 void afs_put_read(struct afs_read *req) 231 { 232 if (refcount_dec_and_test(&req->usage)) { 233 if (req->cleanup) 234 req->cleanup(req); 235 key_put(req->key); 236 kfree(req); 237 } 238 } 239 240 static void afs_fetch_data_notify(struct afs_operation *op) 241 { 242 struct afs_read *req = op->fetch.req; 243 struct netfs_read_subrequest *subreq = req->subreq; 244 int error = op->error; 245 246 if (error == -ECONNABORTED) 247 error = afs_abort_to_error(op->ac.abort_code); 248 req->error = error; 249 250 if (subreq) { 251 __set_bit(NETFS_SREQ_CLEAR_TAIL, &subreq->flags); 252 netfs_subreq_terminated(subreq, error ?: req->actual_len, false); 253 req->subreq = NULL; 254 } else if (req->done) { 255 req->done(req); 256 } 257 } 258 259 static void afs_fetch_data_success(struct afs_operation *op) 260 { 261 struct afs_vnode *vnode = op->file[0].vnode; 262 263 _enter("op=%08x", op->debug_id); 264 afs_vnode_commit_status(op, &op->file[0]); 265 afs_stat_v(vnode, n_fetches); 266 atomic_long_add(op->fetch.req->actual_len, &op->net->n_fetch_bytes); 267 afs_fetch_data_notify(op); 268 } 269 270 static void afs_fetch_data_put(struct afs_operation *op) 271 { 272 op->fetch.req->error = op->error; 273 afs_put_read(op->fetch.req); 274 } 275 276 static const struct afs_operation_ops afs_fetch_data_operation = { 277 .issue_afs_rpc = afs_fs_fetch_data, 278 .issue_yfs_rpc = yfs_fs_fetch_data, 279 .success = afs_fetch_data_success, 280 .aborted = afs_check_for_remote_deletion, 281 .failed = afs_fetch_data_notify, 282 .put = afs_fetch_data_put, 283 }; 284 285 /* 286 * Fetch file data from the volume. 287 */ 288 int afs_fetch_data(struct afs_vnode *vnode, struct afs_read *req) 289 { 290 struct afs_operation *op; 291 292 _enter("%s{%llx:%llu.%u},%x,,,", 293 vnode->volume->name, 294 vnode->fid.vid, 295 vnode->fid.vnode, 296 vnode->fid.unique, 297 key_serial(req->key)); 298 299 op = afs_alloc_operation(req->key, vnode->volume); 300 if (IS_ERR(op)) { 301 if (req->subreq) 302 netfs_subreq_terminated(req->subreq, PTR_ERR(op), false); 303 return PTR_ERR(op); 304 } 305 306 afs_op_set_vnode(op, 0, vnode); 307 308 op->fetch.req = afs_get_read(req); 309 op->ops = &afs_fetch_data_operation; 310 return afs_do_sync_operation(op); 311 } 312 313 static void afs_req_issue_op(struct netfs_read_subrequest *subreq) 314 { 315 struct afs_vnode *vnode = AFS_FS_I(subreq->rreq->inode); 316 struct afs_read *fsreq; 317 318 fsreq = afs_alloc_read(GFP_NOFS); 319 if (!fsreq) 320 return netfs_subreq_terminated(subreq, -ENOMEM, false); 321 322 fsreq->subreq = subreq; 323 fsreq->pos = subreq->start + subreq->transferred; 324 fsreq->len = subreq->len - subreq->transferred; 325 fsreq->key = key_get(subreq->rreq->netfs_priv); 326 fsreq->vnode = vnode; 327 fsreq->iter = &fsreq->def_iter; 328 329 iov_iter_xarray(&fsreq->def_iter, READ, 330 &fsreq->vnode->vfs_inode.i_mapping->i_pages, 331 fsreq->pos, fsreq->len); 332 333 afs_fetch_data(fsreq->vnode, fsreq); 334 afs_put_read(fsreq); 335 } 336 337 static int afs_symlink_readpage(struct file *file, struct page *page) 338 { 339 struct afs_vnode *vnode = AFS_FS_I(page->mapping->host); 340 struct afs_read *fsreq; 341 struct folio *folio = page_folio(page); 342 int ret; 343 344 fsreq = afs_alloc_read(GFP_NOFS); 345 if (!fsreq) 346 return -ENOMEM; 347 348 fsreq->pos = folio_pos(folio); 349 fsreq->len = folio_size(folio); 350 fsreq->vnode = vnode; 351 fsreq->iter = &fsreq->def_iter; 352 iov_iter_xarray(&fsreq->def_iter, READ, &page->mapping->i_pages, 353 fsreq->pos, fsreq->len); 354 355 ret = afs_fetch_data(fsreq->vnode, fsreq); 356 if (ret == 0) 357 SetPageUptodate(page); 358 unlock_page(page); 359 return ret; 360 } 361 362 static void afs_init_rreq(struct netfs_read_request *rreq, struct file *file) 363 { 364 rreq->netfs_priv = key_get(afs_file_key(file)); 365 } 366 367 static bool afs_is_cache_enabled(struct inode *inode) 368 { 369 struct fscache_cookie *cookie = afs_vnode_cache(AFS_FS_I(inode)); 370 371 return fscache_cookie_enabled(cookie) && cookie->cache_priv; 372 } 373 374 static int afs_begin_cache_operation(struct netfs_read_request *rreq) 375 { 376 #ifdef CONFIG_AFS_FSCACHE 377 struct afs_vnode *vnode = AFS_FS_I(rreq->inode); 378 379 return fscache_begin_read_operation(&rreq->cache_resources, 380 afs_vnode_cache(vnode)); 381 #else 382 return -ENOBUFS; 383 #endif 384 } 385 386 static int afs_check_write_begin(struct file *file, loff_t pos, unsigned len, 387 struct folio *folio, void **_fsdata) 388 { 389 struct afs_vnode *vnode = AFS_FS_I(file_inode(file)); 390 391 return test_bit(AFS_VNODE_DELETED, &vnode->flags) ? -ESTALE : 0; 392 } 393 394 static void afs_priv_cleanup(struct address_space *mapping, void *netfs_priv) 395 { 396 key_put(netfs_priv); 397 } 398 399 const struct netfs_read_request_ops afs_req_ops = { 400 .init_rreq = afs_init_rreq, 401 .is_cache_enabled = afs_is_cache_enabled, 402 .begin_cache_operation = afs_begin_cache_operation, 403 .check_write_begin = afs_check_write_begin, 404 .issue_op = afs_req_issue_op, 405 .cleanup = afs_priv_cleanup, 406 }; 407 408 static int afs_readpage(struct file *file, struct page *page) 409 { 410 struct folio *folio = page_folio(page); 411 412 return netfs_readpage(file, folio, &afs_req_ops, NULL); 413 } 414 415 static void afs_readahead(struct readahead_control *ractl) 416 { 417 netfs_readahead(ractl, &afs_req_ops, NULL); 418 } 419 420 int afs_write_inode(struct inode *inode, struct writeback_control *wbc) 421 { 422 fscache_unpin_writeback(wbc, afs_vnode_cache(AFS_FS_I(inode))); 423 return 0; 424 } 425 426 /* 427 * Adjust the dirty region of the page on truncation or full invalidation, 428 * getting rid of the markers altogether if the region is entirely invalidated. 429 */ 430 static void afs_invalidate_dirty(struct folio *folio, size_t offset, 431 size_t length) 432 { 433 struct afs_vnode *vnode = AFS_FS_I(folio_inode(folio)); 434 unsigned long priv; 435 unsigned int f, t, end = offset + length; 436 437 priv = (unsigned long)folio_get_private(folio); 438 439 /* we clean up only if the entire page is being invalidated */ 440 if (offset == 0 && length == folio_size(folio)) 441 goto full_invalidate; 442 443 /* If the page was dirtied by page_mkwrite(), the PTE stays writable 444 * and we don't get another notification to tell us to expand it 445 * again. 446 */ 447 if (afs_is_folio_dirty_mmapped(priv)) 448 return; 449 450 /* We may need to shorten the dirty region */ 451 f = afs_folio_dirty_from(folio, priv); 452 t = afs_folio_dirty_to(folio, priv); 453 454 if (t <= offset || f >= end) 455 return; /* Doesn't overlap */ 456 457 if (f < offset && t > end) 458 return; /* Splits the dirty region - just absorb it */ 459 460 if (f >= offset && t <= end) 461 goto undirty; 462 463 if (f < offset) 464 t = offset; 465 else 466 f = end; 467 if (f == t) 468 goto undirty; 469 470 priv = afs_folio_dirty(folio, f, t); 471 folio_change_private(folio, (void *)priv); 472 trace_afs_folio_dirty(vnode, tracepoint_string("trunc"), folio); 473 return; 474 475 undirty: 476 trace_afs_folio_dirty(vnode, tracepoint_string("undirty"), folio); 477 folio_clear_dirty_for_io(folio); 478 full_invalidate: 479 trace_afs_folio_dirty(vnode, tracepoint_string("inval"), folio); 480 folio_detach_private(folio); 481 } 482 483 /* 484 * invalidate part or all of a page 485 * - release a page and clean up its private data if offset is 0 (indicating 486 * the entire page) 487 */ 488 static void afs_invalidate_folio(struct folio *folio, size_t offset, 489 size_t length) 490 { 491 _enter("{%lu},%zu,%zu", folio->index, offset, length); 492 493 BUG_ON(!folio_test_locked(folio)); 494 495 if (folio_get_private(folio)) 496 afs_invalidate_dirty(folio, offset, length); 497 498 folio_wait_fscache(folio); 499 _leave(""); 500 } 501 502 /* 503 * release a page and clean up its private state if it's not busy 504 * - return true if the page can now be released, false if not 505 */ 506 static int afs_releasepage(struct page *page, gfp_t gfp) 507 { 508 struct folio *folio = page_folio(page); 509 struct afs_vnode *vnode = AFS_FS_I(folio_inode(folio)); 510 511 _enter("{{%llx:%llu}[%lu],%lx},%x", 512 vnode->fid.vid, vnode->fid.vnode, folio_index(folio), folio->flags, 513 gfp); 514 515 /* deny if page is being written to the cache and the caller hasn't 516 * elected to wait */ 517 #ifdef CONFIG_AFS_FSCACHE 518 if (folio_test_fscache(folio)) { 519 if (current_is_kswapd() || !(gfp & __GFP_FS)) 520 return false; 521 folio_wait_fscache(folio); 522 } 523 fscache_note_page_release(afs_vnode_cache(vnode)); 524 #endif 525 526 if (folio_test_private(folio)) { 527 trace_afs_folio_dirty(vnode, tracepoint_string("rel"), folio); 528 folio_detach_private(folio); 529 } 530 531 /* Indicate that the folio can be released */ 532 _leave(" = T"); 533 return true; 534 } 535 536 static void afs_add_open_mmap(struct afs_vnode *vnode) 537 { 538 if (atomic_inc_return(&vnode->cb_nr_mmap) == 1) { 539 down_write(&vnode->volume->cell->fs_open_mmaps_lock); 540 541 if (list_empty(&vnode->cb_mmap_link)) 542 list_add_tail(&vnode->cb_mmap_link, 543 &vnode->volume->cell->fs_open_mmaps); 544 545 up_write(&vnode->volume->cell->fs_open_mmaps_lock); 546 } 547 } 548 549 static void afs_drop_open_mmap(struct afs_vnode *vnode) 550 { 551 if (!atomic_dec_and_test(&vnode->cb_nr_mmap)) 552 return; 553 554 down_write(&vnode->volume->cell->fs_open_mmaps_lock); 555 556 if (atomic_read(&vnode->cb_nr_mmap) == 0) 557 list_del_init(&vnode->cb_mmap_link); 558 559 up_write(&vnode->volume->cell->fs_open_mmaps_lock); 560 flush_work(&vnode->cb_work); 561 } 562 563 /* 564 * Handle setting up a memory mapping on an AFS file. 565 */ 566 static int afs_file_mmap(struct file *file, struct vm_area_struct *vma) 567 { 568 struct afs_vnode *vnode = AFS_FS_I(file_inode(file)); 569 int ret; 570 571 afs_add_open_mmap(vnode); 572 573 ret = generic_file_mmap(file, vma); 574 if (ret == 0) 575 vma->vm_ops = &afs_vm_ops; 576 else 577 afs_drop_open_mmap(vnode); 578 return ret; 579 } 580 581 static void afs_vm_open(struct vm_area_struct *vma) 582 { 583 afs_add_open_mmap(AFS_FS_I(file_inode(vma->vm_file))); 584 } 585 586 static void afs_vm_close(struct vm_area_struct *vma) 587 { 588 afs_drop_open_mmap(AFS_FS_I(file_inode(vma->vm_file))); 589 } 590 591 static vm_fault_t afs_vm_map_pages(struct vm_fault *vmf, pgoff_t start_pgoff, pgoff_t end_pgoff) 592 { 593 struct afs_vnode *vnode = AFS_FS_I(file_inode(vmf->vma->vm_file)); 594 struct afs_file *af = vmf->vma->vm_file->private_data; 595 596 switch (afs_validate(vnode, af->key)) { 597 case 0: 598 return filemap_map_pages(vmf, start_pgoff, end_pgoff); 599 case -ENOMEM: 600 return VM_FAULT_OOM; 601 case -EINTR: 602 case -ERESTARTSYS: 603 return VM_FAULT_RETRY; 604 case -ESTALE: 605 default: 606 return VM_FAULT_SIGBUS; 607 } 608 } 609 610 static ssize_t afs_file_read_iter(struct kiocb *iocb, struct iov_iter *iter) 611 { 612 struct afs_vnode *vnode = AFS_FS_I(file_inode(iocb->ki_filp)); 613 struct afs_file *af = iocb->ki_filp->private_data; 614 int ret; 615 616 ret = afs_validate(vnode, af->key); 617 if (ret < 0) 618 return ret; 619 620 return generic_file_read_iter(iocb, iter); 621 } 622