// SPDX-License-Identifier: GPL-2.0-or-later
/* AFS filesystem file handling
 *
 * Copyright (C) 2002, 2007 Red Hat, Inc. All Rights Reserved.
 * Written by David Howells (dhowells@redhat.com)
 */

#include <linux/kernel.h>
#include <linux/module.h>
#include <linux/init.h>
#include <linux/fs.h>
#include <linux/pagemap.h>
#include <linux/writeback.h>
#include <linux/gfp.h>
#include <linux/task_io_accounting_ops.h>
#include <linux/mm.h>
#include <linux/swap.h>
#include <linux/netfs.h>
#include "internal.h"

static int afs_file_mmap(struct file *file, struct vm_area_struct *vma);
static int afs_symlink_read_folio(struct file *file, struct folio *folio);
static void afs_invalidate_folio(struct folio *folio, size_t offset,
				 size_t length);
static bool afs_release_folio(struct folio *folio, gfp_t gfp_flags);

static ssize_t afs_file_read_iter(struct kiocb *iocb, struct iov_iter *iter);
static void afs_vm_open(struct vm_area_struct *area);
static void afs_vm_close(struct vm_area_struct *area);
static vm_fault_t afs_vm_map_pages(struct vm_fault *vmf, pgoff_t start_pgoff, pgoff_t end_pgoff);

const struct file_operations afs_file_operations = {
	.open		= afs_open,
	.release	= afs_release,
	.llseek		= generic_file_llseek,
	.read_iter	= afs_file_read_iter,
	.write_iter	= afs_file_write,
	.mmap		= afs_file_mmap,
	.splice_read	= generic_file_splice_read,
	.splice_write	= iter_file_splice_write,
	.fsync		= afs_fsync,
	.lock		= afs_lock,
	.flock		= afs_flock,
};

const struct inode_operations afs_file_inode_operations = {
	.getattr	= afs_getattr,
	.setattr	= afs_setattr,
	.permission	= afs_permission,
};

const struct address_space_operations afs_file_aops = {
	.read_folio	= netfs_read_folio,
	.readahead	= netfs_readahead,
	.dirty_folio	= afs_dirty_folio,
	.launder_folio	= afs_launder_folio,
	.release_folio	= afs_release_folio,
	.invalidate_folio = afs_invalidate_folio,
	.write_begin	= afs_write_begin,
	.write_end	= afs_write_end,
	.writepages	= afs_writepages,
	.migrate_folio	= filemap_migrate_folio,
};

const struct address_space_operations afs_symlink_aops = {
	.read_folio	= afs_symlink_read_folio,
	.release_folio	= afs_release_folio,
	.invalidate_folio = afs_invalidate_folio,
	.migrate_folio	= filemap_migrate_folio,
};

static const struct vm_operations_struct afs_vm_ops = {
	.open		= afs_vm_open,
	.close		= afs_vm_close,
	.fault		= filemap_fault,
	.map_pages	= afs_vm_map_pages,
	.page_mkwrite	= afs_page_mkwrite,
};

/*
 * Discard a pin on a writeback key.
 */
void afs_put_wb_key(struct afs_wb_key *wbk)
{
	if (wbk && refcount_dec_and_test(&wbk->usage)) {
		key_put(wbk->key);
		kfree(wbk);
	}
}
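/*
 * A minimal sketch of how the writeback key pin above is paired over a file's
 * lifetime, pieced together from the open/release paths further down (an
 * illustration, not an exact call trace).  Note that a freshly allocated
 * afs_wb_key starts with a usage count of 2: one reference held by
 * vnode->wb_keys and one by af->wb.
 *
 *	afs_open()
 *	    af->key = afs_request_key(...);
 *	    afs_cache_wb_key(vnode, af);	// FMODE_WRITE: pin af->key on
 *						// vnode->wb_keys as af->wb
 *	...
 *	afs_release()
 *	    afs_put_wb_key(af->wb);		// drop the pin taken at open
 *	    afs_prune_wb_keys(vnode);		// then prune the vnode's key list
 */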
/*
 * Cache key for writeback.
 */
int afs_cache_wb_key(struct afs_vnode *vnode, struct afs_file *af)
{
	struct afs_wb_key *wbk, *p;

	wbk = kzalloc(sizeof(struct afs_wb_key), GFP_KERNEL);
	if (!wbk)
		return -ENOMEM;
	refcount_set(&wbk->usage, 2);
	wbk->key = af->key;

	spin_lock(&vnode->wb_lock);
	list_for_each_entry(p, &vnode->wb_keys, vnode_link) {
		if (p->key == wbk->key)
			goto found;
	}

	key_get(wbk->key);
	list_add_tail(&wbk->vnode_link, &vnode->wb_keys);
	spin_unlock(&vnode->wb_lock);
	af->wb = wbk;
	return 0;

found:
	refcount_inc(&p->usage);
	spin_unlock(&vnode->wb_lock);
	af->wb = p;
	kfree(wbk);
	return 0;
}

/*
 * open an AFS file or directory and attach a key to it
 */
int afs_open(struct inode *inode, struct file *file)
{
	struct afs_vnode *vnode = AFS_FS_I(inode);
	struct afs_file *af;
	struct key *key;
	int ret;

	_enter("{%llx:%llu},", vnode->fid.vid, vnode->fid.vnode);

	key = afs_request_key(vnode->volume->cell);
	if (IS_ERR(key)) {
		ret = PTR_ERR(key);
		goto error;
	}

	af = kzalloc(sizeof(*af), GFP_KERNEL);
	if (!af) {
		ret = -ENOMEM;
		goto error_key;
	}
	af->key = key;

	ret = afs_validate(vnode, key);
	if (ret < 0)
		goto error_af;

	if (file->f_mode & FMODE_WRITE) {
		ret = afs_cache_wb_key(vnode, af);
		if (ret < 0)
			goto error_af;
	}

	if (file->f_flags & O_TRUNC)
		set_bit(AFS_VNODE_NEW_CONTENT, &vnode->flags);

	fscache_use_cookie(afs_vnode_cache(vnode), file->f_mode & FMODE_WRITE);

	file->private_data = af;
	_leave(" = 0");
	return 0;

error_af:
	kfree(af);
error_key:
	key_put(key);
error:
	_leave(" = %d", ret);
	return ret;
}

/*
 * release an AFS file or directory and discard its key
 */
int afs_release(struct inode *inode, struct file *file)
{
	struct afs_vnode_cache_aux aux;
	struct afs_vnode *vnode = AFS_FS_I(inode);
	struct afs_file *af = file->private_data;
	loff_t i_size;
	int ret = 0;

	_enter("{%llx:%llu},", vnode->fid.vid, vnode->fid.vnode);

	if ((file->f_mode & FMODE_WRITE))
		ret = vfs_fsync(file, 0);

	file->private_data = NULL;
	if (af->wb)
		afs_put_wb_key(af->wb);

	if ((file->f_mode & FMODE_WRITE)) {
		i_size = i_size_read(&vnode->netfs.inode);
		afs_set_cache_aux(vnode, &aux);
		fscache_unuse_cookie(afs_vnode_cache(vnode), &aux, &i_size);
	} else {
		fscache_unuse_cookie(afs_vnode_cache(vnode), NULL, NULL);
	}

	key_put(af->key);
	kfree(af);
	afs_prune_wb_keys(vnode);
	_leave(" = %d", ret);
	return ret;
}

/*
 * Allocate a new read record.
 */
struct afs_read *afs_alloc_read(gfp_t gfp)
{
	struct afs_read *req;

	req = kzalloc(sizeof(struct afs_read), gfp);
	if (req)
		refcount_set(&req->usage, 1);

	return req;
}
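/*
 * Sketch of the afs_read refcounting implemented by afs_alloc_read() above
 * and afs_put_read() below (illustrative only; the calls referenced are the
 * ones defined later in this file):
 *
 *	req = afs_alloc_read(GFP_NOFS);		// usage = 1, caller's ref
 *	afs_fetch_data(vnode, req);		// the operation takes its own
 *						// ref via afs_get_read() and
 *						// drops it in afs_fetch_data_put()
 *	afs_put_read(req);			// caller drops its ref; the
 *						// final put runs req->cleanup(),
 *						// key_put()s req->key and kfree()s
 */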
/*
 * Dispose of a ref to a read record.
 */
void afs_put_read(struct afs_read *req)
{
	if (refcount_dec_and_test(&req->usage)) {
		if (req->cleanup)
			req->cleanup(req);
		key_put(req->key);
		kfree(req);
	}
}

static void afs_fetch_data_notify(struct afs_operation *op)
{
	struct afs_read *req = op->fetch.req;
	struct netfs_io_subrequest *subreq = req->subreq;
	int error = op->error;

	if (error == -ECONNABORTED)
		error = afs_abort_to_error(op->ac.abort_code);
	req->error = error;

	if (subreq) {
		__set_bit(NETFS_SREQ_CLEAR_TAIL, &subreq->flags);
		netfs_subreq_terminated(subreq, error ?: req->actual_len, false);
		req->subreq = NULL;
	} else if (req->done) {
		req->done(req);
	}
}

static void afs_fetch_data_success(struct afs_operation *op)
{
	struct afs_vnode *vnode = op->file[0].vnode;

	_enter("op=%08x", op->debug_id);
	afs_vnode_commit_status(op, &op->file[0]);
	afs_stat_v(vnode, n_fetches);
	atomic_long_add(op->fetch.req->actual_len, &op->net->n_fetch_bytes);
	afs_fetch_data_notify(op);
}

static void afs_fetch_data_put(struct afs_operation *op)
{
	op->fetch.req->error = op->error;
	afs_put_read(op->fetch.req);
}

static const struct afs_operation_ops afs_fetch_data_operation = {
	.issue_afs_rpc	= afs_fs_fetch_data,
	.issue_yfs_rpc	= yfs_fs_fetch_data,
	.success	= afs_fetch_data_success,
	.aborted	= afs_check_for_remote_deletion,
	.failed		= afs_fetch_data_notify,
	.put		= afs_fetch_data_put,
};

/*
 * Fetch file data from the volume.
 */
int afs_fetch_data(struct afs_vnode *vnode, struct afs_read *req)
{
	struct afs_operation *op;

	_enter("%s{%llx:%llu.%u},%x,,,",
	       vnode->volume->name,
	       vnode->fid.vid,
	       vnode->fid.vnode,
	       vnode->fid.unique,
	       key_serial(req->key));

	op = afs_alloc_operation(req->key, vnode->volume);
	if (IS_ERR(op)) {
		if (req->subreq)
			netfs_subreq_terminated(req->subreq, PTR_ERR(op), false);
		return PTR_ERR(op);
	}

	afs_op_set_vnode(op, 0, vnode);

	op->fetch.req	= afs_get_read(req);
	op->ops		= &afs_fetch_data_operation;
	return afs_do_sync_operation(op);
}

static void afs_issue_read(struct netfs_io_subrequest *subreq)
{
	struct afs_vnode *vnode = AFS_FS_I(subreq->rreq->inode);
	struct afs_read *fsreq;

	fsreq = afs_alloc_read(GFP_NOFS);
	if (!fsreq)
		return netfs_subreq_terminated(subreq, -ENOMEM, false);

	fsreq->subreq	= subreq;
	fsreq->pos	= subreq->start + subreq->transferred;
	fsreq->len	= subreq->len - subreq->transferred;
	fsreq->key	= key_get(subreq->rreq->netfs_priv);
	fsreq->vnode	= vnode;
	fsreq->iter	= &fsreq->def_iter;

	iov_iter_xarray(&fsreq->def_iter, ITER_DEST,
			&fsreq->vnode->netfs.inode.i_mapping->i_pages,
			fsreq->pos, fsreq->len);

	afs_fetch_data(fsreq->vnode, fsreq);
	afs_put_read(fsreq);
}

static int afs_symlink_read_folio(struct file *file, struct folio *folio)
{
	struct afs_vnode *vnode = AFS_FS_I(folio->mapping->host);
	struct afs_read *fsreq;
	int ret;

	fsreq = afs_alloc_read(GFP_NOFS);
	if (!fsreq)
		return -ENOMEM;

	fsreq->pos	= folio_pos(folio);
	fsreq->len	= folio_size(folio);
	fsreq->vnode	= vnode;
	fsreq->iter	= &fsreq->def_iter;
	iov_iter_xarray(&fsreq->def_iter, ITER_DEST, &folio->mapping->i_pages,
			fsreq->pos, fsreq->len);

	ret = afs_fetch_data(fsreq->vnode, fsreq);
	if (ret == 0)
		folio_mark_uptodate(folio);
	folio_unlock(folio);
	return ret;
}

static int afs_init_request(struct netfs_io_request *rreq, struct file *file)
{
	rreq->netfs_priv = key_get(afs_file_key(file));
	return 0;
}

static int afs_begin_cache_operation(struct netfs_io_request *rreq)
{
#ifdef CONFIG_AFS_FSCACHE
	struct afs_vnode *vnode = AFS_FS_I(rreq->inode);

	return fscache_begin_read_operation(&rreq->cache_resources,
					    afs_vnode_cache(vnode));
#else
	return -ENOBUFS;
#endif
}

static int afs_check_write_begin(struct file *file, loff_t pos, unsigned len,
				 struct folio **foliop, void **_fsdata)
{
	struct afs_vnode *vnode = AFS_FS_I(file_inode(file));

	return test_bit(AFS_VNODE_DELETED, &vnode->flags) ? -ESTALE : 0;
}

static void afs_free_request(struct netfs_io_request *rreq)
{
	key_put(rreq->netfs_priv);
}

const struct netfs_request_ops afs_req_ops = {
	.init_request		= afs_init_request,
	.free_request		= afs_free_request,
	.begin_cache_operation	= afs_begin_cache_operation,
	.check_write_begin	= afs_check_write_begin,
	.issue_read		= afs_issue_read,
};

int afs_write_inode(struct inode *inode, struct writeback_control *wbc)
{
	fscache_unpin_writeback(wbc, afs_vnode_cache(AFS_FS_I(inode)));
	return 0;
}
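/*
 * Rough shape of the buffered read path as wired up by afs_req_ops below
 * (illustrative only; netfs drives the actual sequencing, and afs_init_request()
 * runs once per request while afs_issue_read() runs once per subrequest):
 *
 *	netfs_read_folio() / netfs_readahead()
 *	    afs_init_request()		// stash the file's key in the request
 *	    afs_issue_read()		// build an afs_read for the subrequest
 *	        afs_fetch_data()	// FetchData RPC via the afs/yfs ops
 *	            afs_fetch_data_notify()
 *	                netfs_subreq_terminated()	// report bytes or error
 */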
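/*
 * Worked example for the dirty-region trimming done by afs_invalidate_dirty()
 * below (hypothetical numbers, assuming a 4096-byte folio):
 *
 *	dirty region	f = 1024, t = 3072
 *	invalidation	offset = 2048, length = 2048  =>  end = 4096
 *
 *	t(3072) > offset(2048) and f(1024) < end(4096)	-> overlaps
 *	not (f < offset && t > end)			-> not a split
 *	not (f >= offset && t <= end)			-> not fully covered
 *	f(1024) < offset(2048)				-> clamp t to offset
 *
 * leaving a dirty region of [1024, 2048) recorded via afs_folio_dirty().
 */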
/*
 * Adjust the dirty region of the page on truncation or full invalidation,
 * getting rid of the markers altogether if the region is entirely invalidated.
 */
static void afs_invalidate_dirty(struct folio *folio, size_t offset,
				 size_t length)
{
	struct afs_vnode *vnode = AFS_FS_I(folio_inode(folio));
	unsigned long priv;
	unsigned int f, t, end = offset + length;

	priv = (unsigned long)folio_get_private(folio);

	/* we clean up only if the entire page is being invalidated */
	if (offset == 0 && length == folio_size(folio))
		goto full_invalidate;

	/* If the page was dirtied by page_mkwrite(), the PTE stays writable
	 * and we don't get another notification to tell us to expand it
	 * again.
	 */
	if (afs_is_folio_dirty_mmapped(priv))
		return;

	/* We may need to shorten the dirty region */
	f = afs_folio_dirty_from(folio, priv);
	t = afs_folio_dirty_to(folio, priv);

	if (t <= offset || f >= end)
		return; /* Doesn't overlap */

	if (f < offset && t > end)
		return; /* Splits the dirty region - just absorb it */

	if (f >= offset && t <= end)
		goto undirty;

	if (f < offset)
		t = offset;
	else
		f = end;
	if (f == t)
		goto undirty;

	priv = afs_folio_dirty(folio, f, t);
	folio_change_private(folio, (void *)priv);
	trace_afs_folio_dirty(vnode, tracepoint_string("trunc"), folio);
	return;

undirty:
	trace_afs_folio_dirty(vnode, tracepoint_string("undirty"), folio);
	folio_clear_dirty_for_io(folio);
full_invalidate:
	trace_afs_folio_dirty(vnode, tracepoint_string("inval"), folio);
	folio_detach_private(folio);
}

/*
 * invalidate part or all of a page
 * - release a page and clean up its private data if offset is 0 (indicating
 *   the entire page)
 */
static void afs_invalidate_folio(struct folio *folio, size_t offset,
				 size_t length)
{
	_enter("{%lu},%zu,%zu", folio->index, offset, length);

	BUG_ON(!folio_test_locked(folio));

	if (folio_get_private(folio))
		afs_invalidate_dirty(folio, offset, length);

	folio_wait_fscache(folio);
	_leave("");
}

/*
 * release a page and clean up its private state if it's not busy
 * - return true if the page can now be released, false if not
 */
static bool afs_release_folio(struct folio *folio, gfp_t gfp)
{
	struct afs_vnode *vnode = AFS_FS_I(folio_inode(folio));

	_enter("{{%llx:%llu}[%lu],%lx},%x",
	       vnode->fid.vid, vnode->fid.vnode, folio_index(folio), folio->flags,
	       gfp);

	/* deny if folio is being written to the cache and the caller hasn't
	 * elected to wait */
#ifdef CONFIG_AFS_FSCACHE
	if (folio_test_fscache(folio)) {
		if (current_is_kswapd() || !(gfp & __GFP_FS))
			return false;
		folio_wait_fscache(folio);
	}
	fscache_note_page_release(afs_vnode_cache(vnode));
#endif

	if (folio_test_private(folio)) {
		trace_afs_folio_dirty(vnode, tracepoint_string("rel"), folio);
		folio_detach_private(folio);
	}

	/* Indicate that the folio can be released */
	_leave(" = T");
	return true;
}

static void afs_add_open_mmap(struct afs_vnode *vnode)
{
	if (atomic_inc_return(&vnode->cb_nr_mmap) == 1) {
		down_write(&vnode->volume->cell->fs_open_mmaps_lock);

		if (list_empty(&vnode->cb_mmap_link))
			list_add_tail(&vnode->cb_mmap_link,
				      &vnode->volume->cell->fs_open_mmaps);

		up_write(&vnode->volume->cell->fs_open_mmaps_lock);
	}
}

static void afs_drop_open_mmap(struct afs_vnode *vnode)
{
	if (!atomic_dec_and_test(&vnode->cb_nr_mmap))
		return;

	down_write(&vnode->volume->cell->fs_open_mmaps_lock);

	if (atomic_read(&vnode->cb_nr_mmap) == 0)
		list_del_init(&vnode->cb_mmap_link);

	up_write(&vnode->volume->cell->fs_open_mmaps_lock);
	flush_work(&vnode->cb_work);
}
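/*
 * The cb_nr_mmap counter above keeps vnode->cb_mmap_link on the cell's
 * fs_open_mmaps list for as long as at least one mapping exists: the first
 * afs_add_open_mmap() adds the vnode, the last afs_drop_open_mmap() removes
 * it again and flushes cb_work.  The mmap and VM operations below keep the
 * counter balanced across mmap(), VMA duplication (->open) and unmap
 * (->close).  (Presumably the list lets the callback-handling code find
 * vnodes with live mappings; that code lives outside this file.)
 */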
/*
 * Handle setting up a memory mapping on an AFS file.
 */
static int afs_file_mmap(struct file *file, struct vm_area_struct *vma)
{
	struct afs_vnode *vnode = AFS_FS_I(file_inode(file));
	int ret;

	afs_add_open_mmap(vnode);

	ret = generic_file_mmap(file, vma);
	if (ret == 0)
		vma->vm_ops = &afs_vm_ops;
	else
		afs_drop_open_mmap(vnode);
	return ret;
}

static void afs_vm_open(struct vm_area_struct *vma)
{
	afs_add_open_mmap(AFS_FS_I(file_inode(vma->vm_file)));
}

static void afs_vm_close(struct vm_area_struct *vma)
{
	afs_drop_open_mmap(AFS_FS_I(file_inode(vma->vm_file)));
}

static vm_fault_t afs_vm_map_pages(struct vm_fault *vmf, pgoff_t start_pgoff, pgoff_t end_pgoff)
{
	struct afs_vnode *vnode = AFS_FS_I(file_inode(vmf->vma->vm_file));
	struct afs_file *af = vmf->vma->vm_file->private_data;

	switch (afs_validate(vnode, af->key)) {
	case 0:
		return filemap_map_pages(vmf, start_pgoff, end_pgoff);
	case -ENOMEM:
		return VM_FAULT_OOM;
	case -EINTR:
	case -ERESTARTSYS:
		return VM_FAULT_RETRY;
	case -ESTALE:
	default:
		return VM_FAULT_SIGBUS;
	}
}

static ssize_t afs_file_read_iter(struct kiocb *iocb, struct iov_iter *iter)
{
	struct afs_vnode *vnode = AFS_FS_I(file_inode(iocb->ki_filp));
	struct afs_file *af = iocb->ki_filp->private_data;
	int ret;

	ret = afs_validate(vnode, af->key);
	if (ret < 0)
		return ret;

	return generic_file_read_iter(iocb, iter);
}
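/*
 * Summary of how afs_validate() results are consumed at the three entry
 * points in this file that revalidate the vnode (an illustrative mapping
 * taken from the functions above):
 *
 *	afs_open()		-> error returned straight to open(2)
 *	afs_vm_map_pages()	-> 0: filemap_map_pages()
 *				   -ENOMEM: VM_FAULT_OOM
 *				   -EINTR / -ERESTARTSYS: VM_FAULT_RETRY
 *				   -ESTALE and anything else: VM_FAULT_SIGBUS
 *	afs_file_read_iter()	-> error returned before generic_file_read_iter()
 */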