1 /* 2 * linux/fs/nfs/inode.c 3 * 4 * Copyright (C) 1992 Rick Sladkey 5 * 6 * nfs inode and superblock handling functions 7 * 8 * Modularised by Alan Cox <alan@lxorguk.ukuu.org.uk>, while hacking some 9 * experimental NFS changes. Modularisation taken straight from SYS5 fs. 10 * 11 * Change to nfs_read_super() to permit NFS mounts to multi-homed hosts. 12 * J.S.Peatfield@damtp.cam.ac.uk 13 * 14 */ 15 16 #include <linux/module.h> 17 #include <linux/init.h> 18 #include <linux/sched.h> 19 #include <linux/time.h> 20 #include <linux/kernel.h> 21 #include <linux/mm.h> 22 #include <linux/string.h> 23 #include <linux/stat.h> 24 #include <linux/errno.h> 25 #include <linux/unistd.h> 26 #include <linux/sunrpc/clnt.h> 27 #include <linux/sunrpc/stats.h> 28 #include <linux/sunrpc/metrics.h> 29 #include <linux/nfs_fs.h> 30 #include <linux/nfs_mount.h> 31 #include <linux/nfs4_mount.h> 32 #include <linux/lockd/bind.h> 33 #include <linux/seq_file.h> 34 #include <linux/mount.h> 35 #include <linux/nfs_idmap.h> 36 #include <linux/vfs.h> 37 #include <linux/inet.h> 38 #include <linux/nfs_xdr.h> 39 #include <linux/slab.h> 40 #include <linux/compat.h> 41 42 #include <asm/system.h> 43 #include <asm/uaccess.h> 44 45 #include "nfs4_fs.h" 46 #include "callback.h" 47 #include "delegation.h" 48 #include "iostat.h" 49 #include "internal.h" 50 #include "fscache.h" 51 #include "dns_resolve.h" 52 #include "pnfs.h" 53 54 #define NFSDBG_FACILITY NFSDBG_VFS 55 56 #define NFS_64_BIT_INODE_NUMBERS_ENABLED 1 57 58 /* Default is to see 64-bit inode numbers */ 59 static int enable_ino64 = NFS_64_BIT_INODE_NUMBERS_ENABLED; 60 61 static void nfs_invalidate_inode(struct inode *); 62 static int nfs_update_inode(struct inode *, struct nfs_fattr *); 63 64 static struct kmem_cache * nfs_inode_cachep; 65 66 static inline unsigned long 67 nfs_fattr_to_ino_t(struct nfs_fattr *fattr) 68 { 69 return nfs_fileid_to_ino_t(fattr->fileid); 70 } 71 72 /** 73 * nfs_wait_bit_killable - helper for functions that are sleeping on bit locks 74 * @word: long word containing the bit lock 75 */ 76 int nfs_wait_bit_killable(void *word) 77 { 78 if (fatal_signal_pending(current)) 79 return -ERESTARTSYS; 80 schedule(); 81 return 0; 82 } 83 84 /** 85 * nfs_compat_user_ino64 - returns the user-visible inode number 86 * @fileid: 64-bit fileid 87 * 88 * This function returns a 32-bit inode number if the boot parameter 89 * nfs.enable_ino64 is zero. 90 */ 91 u64 nfs_compat_user_ino64(u64 fileid) 92 { 93 #ifdef CONFIG_COMPAT 94 compat_ulong_t ino; 95 #else 96 unsigned long ino; 97 #endif 98 99 if (enable_ino64) 100 return fileid; 101 ino = fileid; 102 if (sizeof(ino) < sizeof(fileid)) 103 ino ^= fileid >> (sizeof(fileid)-sizeof(ino)) * 8; 104 return ino; 105 } 106 107 static void nfs_clear_inode(struct inode *inode) 108 { 109 /* 110 * The following should never happen... 111 */ 112 BUG_ON(nfs_have_writebacks(inode)); 113 BUG_ON(!list_empty(&NFS_I(inode)->open_files)); 114 nfs_zap_acl_cache(inode); 115 nfs_access_zap_cache(inode); 116 nfs_fscache_release_inode_cookie(inode); 117 } 118 119 void nfs_evict_inode(struct inode *inode) 120 { 121 truncate_inode_pages(&inode->i_data, 0); 122 end_writeback(inode); 123 nfs_clear_inode(inode); 124 } 125 126 /** 127 * nfs_sync_mapping - helper to flush all mmapped dirty data to disk 128 */ 129 int nfs_sync_mapping(struct address_space *mapping) 130 { 131 int ret = 0; 132 133 if (mapping->nrpages != 0) { 134 unmap_mapping_range(mapping, 0, 0, 0); 135 ret = nfs_wb_all(mapping->host); 136 } 137 return ret; 138 } 139 140 /* 141 * Invalidate the local caches 142 */ 143 static void nfs_zap_caches_locked(struct inode *inode) 144 { 145 struct nfs_inode *nfsi = NFS_I(inode); 146 int mode = inode->i_mode; 147 148 nfs_inc_stats(inode, NFSIOS_ATTRINVALIDATE); 149 150 nfsi->attrtimeo = NFS_MINATTRTIMEO(inode); 151 nfsi->attrtimeo_timestamp = jiffies; 152 153 memset(NFS_COOKIEVERF(inode), 0, sizeof(NFS_COOKIEVERF(inode))); 154 if (S_ISREG(mode) || S_ISDIR(mode) || S_ISLNK(mode)) 155 nfsi->cache_validity |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_DATA|NFS_INO_INVALID_ACCESS|NFS_INO_INVALID_ACL|NFS_INO_REVAL_PAGECACHE; 156 else 157 nfsi->cache_validity |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_ACCESS|NFS_INO_INVALID_ACL|NFS_INO_REVAL_PAGECACHE; 158 } 159 160 void nfs_zap_caches(struct inode *inode) 161 { 162 spin_lock(&inode->i_lock); 163 nfs_zap_caches_locked(inode); 164 spin_unlock(&inode->i_lock); 165 } 166 167 void nfs_zap_mapping(struct inode *inode, struct address_space *mapping) 168 { 169 if (mapping->nrpages != 0) { 170 spin_lock(&inode->i_lock); 171 NFS_I(inode)->cache_validity |= NFS_INO_INVALID_DATA; 172 spin_unlock(&inode->i_lock); 173 } 174 } 175 176 void nfs_zap_acl_cache(struct inode *inode) 177 { 178 void (*clear_acl_cache)(struct inode *); 179 180 clear_acl_cache = NFS_PROTO(inode)->clear_acl_cache; 181 if (clear_acl_cache != NULL) 182 clear_acl_cache(inode); 183 spin_lock(&inode->i_lock); 184 NFS_I(inode)->cache_validity &= ~NFS_INO_INVALID_ACL; 185 spin_unlock(&inode->i_lock); 186 } 187 188 void nfs_invalidate_atime(struct inode *inode) 189 { 190 spin_lock(&inode->i_lock); 191 NFS_I(inode)->cache_validity |= NFS_INO_INVALID_ATIME; 192 spin_unlock(&inode->i_lock); 193 } 194 195 /* 196 * Invalidate, but do not unhash, the inode. 197 * NB: must be called with inode->i_lock held! 198 */ 199 static void nfs_invalidate_inode(struct inode *inode) 200 { 201 set_bit(NFS_INO_STALE, &NFS_I(inode)->flags); 202 nfs_zap_caches_locked(inode); 203 } 204 205 struct nfs_find_desc { 206 struct nfs_fh *fh; 207 struct nfs_fattr *fattr; 208 }; 209 210 /* 211 * In NFSv3 we can have 64bit inode numbers. In order to support 212 * this, and re-exported directories (also seen in NFSv2) 213 * we are forced to allow 2 different inodes to have the same 214 * i_ino. 215 */ 216 static int 217 nfs_find_actor(struct inode *inode, void *opaque) 218 { 219 struct nfs_find_desc *desc = (struct nfs_find_desc *)opaque; 220 struct nfs_fh *fh = desc->fh; 221 struct nfs_fattr *fattr = desc->fattr; 222 223 if (NFS_FILEID(inode) != fattr->fileid) 224 return 0; 225 if (nfs_compare_fh(NFS_FH(inode), fh)) 226 return 0; 227 if (is_bad_inode(inode) || NFS_STALE(inode)) 228 return 0; 229 return 1; 230 } 231 232 static int 233 nfs_init_locked(struct inode *inode, void *opaque) 234 { 235 struct nfs_find_desc *desc = (struct nfs_find_desc *)opaque; 236 struct nfs_fattr *fattr = desc->fattr; 237 238 set_nfs_fileid(inode, fattr->fileid); 239 nfs_copy_fh(NFS_FH(inode), desc->fh); 240 return 0; 241 } 242 243 /* 244 * This is our front-end to iget that looks up inodes by file handle 245 * instead of inode number. 246 */ 247 struct inode * 248 nfs_fhget(struct super_block *sb, struct nfs_fh *fh, struct nfs_fattr *fattr) 249 { 250 struct nfs_find_desc desc = { 251 .fh = fh, 252 .fattr = fattr 253 }; 254 struct inode *inode = ERR_PTR(-ENOENT); 255 unsigned long hash; 256 257 nfs_attr_check_mountpoint(sb, fattr); 258 259 if ((fattr->valid & NFS_ATTR_FATTR_FILEID) == 0 && (fattr->valid & NFS_ATTR_FATTR_MOUNTPOINT) == 0) 260 goto out_no_inode; 261 if ((fattr->valid & NFS_ATTR_FATTR_TYPE) == 0) 262 goto out_no_inode; 263 264 hash = nfs_fattr_to_ino_t(fattr); 265 266 inode = iget5_locked(sb, hash, nfs_find_actor, nfs_init_locked, &desc); 267 if (inode == NULL) { 268 inode = ERR_PTR(-ENOMEM); 269 goto out_no_inode; 270 } 271 272 if (inode->i_state & I_NEW) { 273 struct nfs_inode *nfsi = NFS_I(inode); 274 unsigned long now = jiffies; 275 276 /* We set i_ino for the few things that still rely on it, 277 * such as stat(2) */ 278 inode->i_ino = hash; 279 280 /* We can't support update_atime(), since the server will reset it */ 281 inode->i_flags |= S_NOATIME|S_NOCMTIME; 282 inode->i_mode = fattr->mode; 283 if ((fattr->valid & NFS_ATTR_FATTR_MODE) == 0 284 && nfs_server_capable(inode, NFS_CAP_MODE)) 285 nfsi->cache_validity |= NFS_INO_INVALID_ATTR 286 | NFS_INO_INVALID_ACCESS 287 | NFS_INO_INVALID_ACL; 288 /* Why so? Because we want revalidate for devices/FIFOs, and 289 * that's precisely what we have in nfs_file_inode_operations. 290 */ 291 inode->i_op = NFS_SB(sb)->nfs_client->rpc_ops->file_inode_ops; 292 if (S_ISREG(inode->i_mode)) { 293 inode->i_fop = &nfs_file_operations; 294 inode->i_data.a_ops = &nfs_file_aops; 295 inode->i_data.backing_dev_info = &NFS_SB(sb)->backing_dev_info; 296 } else if (S_ISDIR(inode->i_mode)) { 297 inode->i_op = NFS_SB(sb)->nfs_client->rpc_ops->dir_inode_ops; 298 inode->i_fop = &nfs_dir_operations; 299 inode->i_data.a_ops = &nfs_dir_aops; 300 if (nfs_server_capable(inode, NFS_CAP_READDIRPLUS)) 301 set_bit(NFS_INO_ADVISE_RDPLUS, &NFS_I(inode)->flags); 302 /* Deal with crossing mountpoints */ 303 if (fattr->valid & NFS_ATTR_FATTR_MOUNTPOINT || 304 fattr->valid & NFS_ATTR_FATTR_V4_REFERRAL) { 305 if (fattr->valid & NFS_ATTR_FATTR_V4_REFERRAL) 306 inode->i_op = &nfs_referral_inode_operations; 307 else 308 inode->i_op = &nfs_mountpoint_inode_operations; 309 inode->i_fop = NULL; 310 inode->i_flags |= S_AUTOMOUNT; 311 } 312 } else if (S_ISLNK(inode->i_mode)) 313 inode->i_op = &nfs_symlink_inode_operations; 314 else 315 init_special_inode(inode, inode->i_mode, fattr->rdev); 316 317 memset(&inode->i_atime, 0, sizeof(inode->i_atime)); 318 memset(&inode->i_mtime, 0, sizeof(inode->i_mtime)); 319 memset(&inode->i_ctime, 0, sizeof(inode->i_ctime)); 320 nfsi->change_attr = 0; 321 inode->i_size = 0; 322 inode->i_nlink = 0; 323 inode->i_uid = -2; 324 inode->i_gid = -2; 325 inode->i_blocks = 0; 326 memset(nfsi->cookieverf, 0, sizeof(nfsi->cookieverf)); 327 328 nfsi->read_cache_jiffies = fattr->time_start; 329 nfsi->attr_gencount = fattr->gencount; 330 if (fattr->valid & NFS_ATTR_FATTR_ATIME) 331 inode->i_atime = fattr->atime; 332 else if (nfs_server_capable(inode, NFS_CAP_ATIME)) 333 nfsi->cache_validity |= NFS_INO_INVALID_ATTR; 334 if (fattr->valid & NFS_ATTR_FATTR_MTIME) 335 inode->i_mtime = fattr->mtime; 336 else if (nfs_server_capable(inode, NFS_CAP_MTIME)) 337 nfsi->cache_validity |= NFS_INO_INVALID_ATTR 338 | NFS_INO_INVALID_DATA; 339 if (fattr->valid & NFS_ATTR_FATTR_CTIME) 340 inode->i_ctime = fattr->ctime; 341 else if (nfs_server_capable(inode, NFS_CAP_CTIME)) 342 nfsi->cache_validity |= NFS_INO_INVALID_ATTR 343 | NFS_INO_INVALID_ACCESS 344 | NFS_INO_INVALID_ACL; 345 if (fattr->valid & NFS_ATTR_FATTR_CHANGE) 346 nfsi->change_attr = fattr->change_attr; 347 else if (nfs_server_capable(inode, NFS_CAP_CHANGE_ATTR)) 348 nfsi->cache_validity |= NFS_INO_INVALID_ATTR 349 | NFS_INO_INVALID_DATA; 350 if (fattr->valid & NFS_ATTR_FATTR_SIZE) 351 inode->i_size = nfs_size_to_loff_t(fattr->size); 352 else 353 nfsi->cache_validity |= NFS_INO_INVALID_ATTR 354 | NFS_INO_INVALID_DATA 355 | NFS_INO_REVAL_PAGECACHE; 356 if (fattr->valid & NFS_ATTR_FATTR_NLINK) 357 inode->i_nlink = fattr->nlink; 358 else if (nfs_server_capable(inode, NFS_CAP_NLINK)) 359 nfsi->cache_validity |= NFS_INO_INVALID_ATTR; 360 if (fattr->valid & NFS_ATTR_FATTR_OWNER) 361 inode->i_uid = fattr->uid; 362 else if (nfs_server_capable(inode, NFS_CAP_OWNER)) 363 nfsi->cache_validity |= NFS_INO_INVALID_ATTR 364 | NFS_INO_INVALID_ACCESS 365 | NFS_INO_INVALID_ACL; 366 if (fattr->valid & NFS_ATTR_FATTR_GROUP) 367 inode->i_gid = fattr->gid; 368 else if (nfs_server_capable(inode, NFS_CAP_OWNER_GROUP)) 369 nfsi->cache_validity |= NFS_INO_INVALID_ATTR 370 | NFS_INO_INVALID_ACCESS 371 | NFS_INO_INVALID_ACL; 372 if (fattr->valid & NFS_ATTR_FATTR_BLOCKS_USED) 373 inode->i_blocks = fattr->du.nfs2.blocks; 374 if (fattr->valid & NFS_ATTR_FATTR_SPACE_USED) { 375 /* 376 * report the blocks in 512byte units 377 */ 378 inode->i_blocks = nfs_calc_block_size(fattr->du.nfs3.used); 379 } 380 nfsi->attrtimeo = NFS_MINATTRTIMEO(inode); 381 nfsi->attrtimeo_timestamp = now; 382 nfsi->access_cache = RB_ROOT; 383 384 nfs_fscache_init_inode_cookie(inode); 385 386 unlock_new_inode(inode); 387 } else 388 nfs_refresh_inode(inode, fattr); 389 dprintk("NFS: nfs_fhget(%s/%Ld ct=%d)\n", 390 inode->i_sb->s_id, 391 (long long)NFS_FILEID(inode), 392 atomic_read(&inode->i_count)); 393 394 out: 395 return inode; 396 397 out_no_inode: 398 dprintk("nfs_fhget: iget failed with error %ld\n", PTR_ERR(inode)); 399 goto out; 400 } 401 402 #define NFS_VALID_ATTRS (ATTR_MODE|ATTR_UID|ATTR_GID|ATTR_SIZE|ATTR_ATIME|ATTR_ATIME_SET|ATTR_MTIME|ATTR_MTIME_SET|ATTR_FILE) 403 404 int 405 nfs_setattr(struct dentry *dentry, struct iattr *attr) 406 { 407 struct inode *inode = dentry->d_inode; 408 struct nfs_fattr *fattr; 409 int error = -ENOMEM; 410 411 nfs_inc_stats(inode, NFSIOS_VFSSETATTR); 412 413 /* skip mode change if it's just for clearing setuid/setgid */ 414 if (attr->ia_valid & (ATTR_KILL_SUID | ATTR_KILL_SGID)) 415 attr->ia_valid &= ~ATTR_MODE; 416 417 if (attr->ia_valid & ATTR_SIZE) { 418 if (!S_ISREG(inode->i_mode) || attr->ia_size == i_size_read(inode)) 419 attr->ia_valid &= ~ATTR_SIZE; 420 } 421 422 /* Optimization: if the end result is no change, don't RPC */ 423 attr->ia_valid &= NFS_VALID_ATTRS; 424 if ((attr->ia_valid & ~ATTR_FILE) == 0) 425 return 0; 426 427 /* Write all dirty data */ 428 if (S_ISREG(inode->i_mode)) 429 nfs_wb_all(inode); 430 431 fattr = nfs_alloc_fattr(); 432 if (fattr == NULL) 433 goto out; 434 /* 435 * Return any delegations if we're going to change ACLs 436 */ 437 if ((attr->ia_valid & (ATTR_MODE|ATTR_UID|ATTR_GID)) != 0) 438 nfs_inode_return_delegation(inode); 439 error = NFS_PROTO(inode)->setattr(dentry, fattr, attr); 440 if (error == 0) 441 nfs_refresh_inode(inode, fattr); 442 nfs_free_fattr(fattr); 443 out: 444 return error; 445 } 446 447 /** 448 * nfs_vmtruncate - unmap mappings "freed" by truncate() syscall 449 * @inode: inode of the file used 450 * @offset: file offset to start truncating 451 * 452 * This is a copy of the common vmtruncate, but with the locking 453 * corrected to take into account the fact that NFS requires 454 * inode->i_size to be updated under the inode->i_lock. 455 */ 456 static int nfs_vmtruncate(struct inode * inode, loff_t offset) 457 { 458 loff_t oldsize; 459 int err; 460 461 err = inode_newsize_ok(inode, offset); 462 if (err) 463 goto out; 464 465 spin_lock(&inode->i_lock); 466 oldsize = inode->i_size; 467 i_size_write(inode, offset); 468 spin_unlock(&inode->i_lock); 469 470 truncate_pagecache(inode, oldsize, offset); 471 out: 472 return err; 473 } 474 475 /** 476 * nfs_setattr_update_inode - Update inode metadata after a setattr call. 477 * @inode: pointer to struct inode 478 * @attr: pointer to struct iattr 479 * 480 * Note: we do this in the *proc.c in order to ensure that 481 * it works for things like exclusive creates too. 482 */ 483 void nfs_setattr_update_inode(struct inode *inode, struct iattr *attr) 484 { 485 if ((attr->ia_valid & (ATTR_MODE|ATTR_UID|ATTR_GID)) != 0) { 486 spin_lock(&inode->i_lock); 487 if ((attr->ia_valid & ATTR_MODE) != 0) { 488 int mode = attr->ia_mode & S_IALLUGO; 489 mode |= inode->i_mode & ~S_IALLUGO; 490 inode->i_mode = mode; 491 } 492 if ((attr->ia_valid & ATTR_UID) != 0) 493 inode->i_uid = attr->ia_uid; 494 if ((attr->ia_valid & ATTR_GID) != 0) 495 inode->i_gid = attr->ia_gid; 496 NFS_I(inode)->cache_validity |= NFS_INO_INVALID_ACCESS|NFS_INO_INVALID_ACL; 497 spin_unlock(&inode->i_lock); 498 } 499 if ((attr->ia_valid & ATTR_SIZE) != 0) { 500 nfs_inc_stats(inode, NFSIOS_SETATTRTRUNC); 501 nfs_vmtruncate(inode, attr->ia_size); 502 } 503 } 504 505 int nfs_getattr(struct vfsmount *mnt, struct dentry *dentry, struct kstat *stat) 506 { 507 struct inode *inode = dentry->d_inode; 508 int need_atime = NFS_I(inode)->cache_validity & NFS_INO_INVALID_ATIME; 509 int err; 510 511 /* Flush out writes to the server in order to update c/mtime. */ 512 if (S_ISREG(inode->i_mode)) { 513 err = filemap_write_and_wait(inode->i_mapping); 514 if (err) 515 goto out; 516 } 517 518 /* 519 * We may force a getattr if the user cares about atime. 520 * 521 * Note that we only have to check the vfsmount flags here: 522 * - NFS always sets S_NOATIME by so checking it would give a 523 * bogus result 524 * - NFS never sets MS_NOATIME or MS_NODIRATIME so there is 525 * no point in checking those. 526 */ 527 if ((mnt->mnt_flags & MNT_NOATIME) || 528 ((mnt->mnt_flags & MNT_NODIRATIME) && S_ISDIR(inode->i_mode))) 529 need_atime = 0; 530 531 if (need_atime) 532 err = __nfs_revalidate_inode(NFS_SERVER(inode), inode); 533 else 534 err = nfs_revalidate_inode(NFS_SERVER(inode), inode); 535 if (!err) { 536 generic_fillattr(inode, stat); 537 stat->ino = nfs_compat_user_ino64(NFS_FILEID(inode)); 538 } 539 out: 540 return err; 541 } 542 543 static void nfs_init_lock_context(struct nfs_lock_context *l_ctx) 544 { 545 atomic_set(&l_ctx->count, 1); 546 l_ctx->lockowner = current->files; 547 l_ctx->pid = current->tgid; 548 INIT_LIST_HEAD(&l_ctx->list); 549 } 550 551 static struct nfs_lock_context *__nfs_find_lock_context(struct nfs_open_context *ctx) 552 { 553 struct nfs_lock_context *pos; 554 555 list_for_each_entry(pos, &ctx->lock_context.list, list) { 556 if (pos->lockowner != current->files) 557 continue; 558 if (pos->pid != current->tgid) 559 continue; 560 atomic_inc(&pos->count); 561 return pos; 562 } 563 return NULL; 564 } 565 566 struct nfs_lock_context *nfs_get_lock_context(struct nfs_open_context *ctx) 567 { 568 struct nfs_lock_context *res, *new = NULL; 569 struct inode *inode = ctx->path.dentry->d_inode; 570 571 spin_lock(&inode->i_lock); 572 res = __nfs_find_lock_context(ctx); 573 if (res == NULL) { 574 spin_unlock(&inode->i_lock); 575 new = kmalloc(sizeof(*new), GFP_KERNEL); 576 if (new == NULL) 577 return NULL; 578 nfs_init_lock_context(new); 579 spin_lock(&inode->i_lock); 580 res = __nfs_find_lock_context(ctx); 581 if (res == NULL) { 582 list_add_tail(&new->list, &ctx->lock_context.list); 583 new->open_context = ctx; 584 res = new; 585 new = NULL; 586 } 587 } 588 spin_unlock(&inode->i_lock); 589 kfree(new); 590 return res; 591 } 592 593 void nfs_put_lock_context(struct nfs_lock_context *l_ctx) 594 { 595 struct nfs_open_context *ctx = l_ctx->open_context; 596 struct inode *inode = ctx->path.dentry->d_inode; 597 598 if (!atomic_dec_and_lock(&l_ctx->count, &inode->i_lock)) 599 return; 600 list_del(&l_ctx->list); 601 spin_unlock(&inode->i_lock); 602 kfree(l_ctx); 603 } 604 605 /** 606 * nfs_close_context - Common close_context() routine NFSv2/v3 607 * @ctx: pointer to context 608 * @is_sync: is this a synchronous close 609 * 610 * always ensure that the attributes are up to date if we're mounted 611 * with close-to-open semantics 612 */ 613 void nfs_close_context(struct nfs_open_context *ctx, int is_sync) 614 { 615 struct inode *inode; 616 struct nfs_server *server; 617 618 if (!(ctx->mode & FMODE_WRITE)) 619 return; 620 if (!is_sync) 621 return; 622 inode = ctx->path.dentry->d_inode; 623 if (!list_empty(&NFS_I(inode)->open_files)) 624 return; 625 server = NFS_SERVER(inode); 626 if (server->flags & NFS_MOUNT_NOCTO) 627 return; 628 nfs_revalidate_inode(server, inode); 629 } 630 631 struct nfs_open_context *alloc_nfs_open_context(struct path *path, struct rpc_cred *cred, fmode_t f_mode) 632 { 633 struct nfs_open_context *ctx; 634 635 ctx = kmalloc(sizeof(*ctx), GFP_KERNEL); 636 if (ctx != NULL) { 637 ctx->path = *path; 638 path_get(&ctx->path); 639 ctx->cred = get_rpccred(cred); 640 ctx->state = NULL; 641 ctx->mode = f_mode; 642 ctx->flags = 0; 643 ctx->error = 0; 644 nfs_init_lock_context(&ctx->lock_context); 645 ctx->lock_context.open_context = ctx; 646 INIT_LIST_HEAD(&ctx->list); 647 } 648 return ctx; 649 } 650 651 struct nfs_open_context *get_nfs_open_context(struct nfs_open_context *ctx) 652 { 653 if (ctx != NULL) 654 atomic_inc(&ctx->lock_context.count); 655 return ctx; 656 } 657 658 static void __put_nfs_open_context(struct nfs_open_context *ctx, int is_sync) 659 { 660 struct inode *inode = ctx->path.dentry->d_inode; 661 662 if (!list_empty(&ctx->list)) { 663 if (!atomic_dec_and_lock(&ctx->lock_context.count, &inode->i_lock)) 664 return; 665 list_del(&ctx->list); 666 spin_unlock(&inode->i_lock); 667 } else if (!atomic_dec_and_test(&ctx->lock_context.count)) 668 return; 669 if (inode != NULL) 670 NFS_PROTO(inode)->close_context(ctx, is_sync); 671 if (ctx->cred != NULL) 672 put_rpccred(ctx->cred); 673 path_put(&ctx->path); 674 kfree(ctx); 675 } 676 677 void put_nfs_open_context(struct nfs_open_context *ctx) 678 { 679 __put_nfs_open_context(ctx, 0); 680 } 681 682 /* 683 * Ensure that mmap has a recent RPC credential for use when writing out 684 * shared pages 685 */ 686 void nfs_file_set_open_context(struct file *filp, struct nfs_open_context *ctx) 687 { 688 struct inode *inode = filp->f_path.dentry->d_inode; 689 struct nfs_inode *nfsi = NFS_I(inode); 690 691 filp->private_data = get_nfs_open_context(ctx); 692 spin_lock(&inode->i_lock); 693 list_add(&ctx->list, &nfsi->open_files); 694 spin_unlock(&inode->i_lock); 695 } 696 697 /* 698 * Given an inode, search for an open context with the desired characteristics 699 */ 700 struct nfs_open_context *nfs_find_open_context(struct inode *inode, struct rpc_cred *cred, fmode_t mode) 701 { 702 struct nfs_inode *nfsi = NFS_I(inode); 703 struct nfs_open_context *pos, *ctx = NULL; 704 705 spin_lock(&inode->i_lock); 706 list_for_each_entry(pos, &nfsi->open_files, list) { 707 if (cred != NULL && pos->cred != cred) 708 continue; 709 if ((pos->mode & (FMODE_READ|FMODE_WRITE)) != mode) 710 continue; 711 ctx = get_nfs_open_context(pos); 712 break; 713 } 714 spin_unlock(&inode->i_lock); 715 return ctx; 716 } 717 718 static void nfs_file_clear_open_context(struct file *filp) 719 { 720 struct inode *inode = filp->f_path.dentry->d_inode; 721 struct nfs_open_context *ctx = nfs_file_open_context(filp); 722 723 if (ctx) { 724 filp->private_data = NULL; 725 spin_lock(&inode->i_lock); 726 list_move_tail(&ctx->list, &NFS_I(inode)->open_files); 727 spin_unlock(&inode->i_lock); 728 __put_nfs_open_context(ctx, filp->f_flags & O_DIRECT ? 0 : 1); 729 } 730 } 731 732 /* 733 * These allocate and release file read/write context information. 734 */ 735 int nfs_open(struct inode *inode, struct file *filp) 736 { 737 struct nfs_open_context *ctx; 738 struct rpc_cred *cred; 739 740 cred = rpc_lookup_cred(); 741 if (IS_ERR(cred)) 742 return PTR_ERR(cred); 743 ctx = alloc_nfs_open_context(&filp->f_path, cred, filp->f_mode); 744 put_rpccred(cred); 745 if (ctx == NULL) 746 return -ENOMEM; 747 nfs_file_set_open_context(filp, ctx); 748 put_nfs_open_context(ctx); 749 nfs_fscache_set_inode_cookie(inode, filp); 750 return 0; 751 } 752 753 int nfs_release(struct inode *inode, struct file *filp) 754 { 755 nfs_file_clear_open_context(filp); 756 return 0; 757 } 758 759 /* 760 * This function is called whenever some part of NFS notices that 761 * the cached attributes have to be refreshed. 762 */ 763 int 764 __nfs_revalidate_inode(struct nfs_server *server, struct inode *inode) 765 { 766 int status = -ESTALE; 767 struct nfs_fattr *fattr = NULL; 768 struct nfs_inode *nfsi = NFS_I(inode); 769 770 dfprintk(PAGECACHE, "NFS: revalidating (%s/%Ld)\n", 771 inode->i_sb->s_id, (long long)NFS_FILEID(inode)); 772 773 if (is_bad_inode(inode)) 774 goto out; 775 if (NFS_STALE(inode)) 776 goto out; 777 778 status = -ENOMEM; 779 fattr = nfs_alloc_fattr(); 780 if (fattr == NULL) 781 goto out; 782 783 nfs_inc_stats(inode, NFSIOS_INODEREVALIDATE); 784 status = NFS_PROTO(inode)->getattr(server, NFS_FH(inode), fattr); 785 if (status != 0) { 786 dfprintk(PAGECACHE, "nfs_revalidate_inode: (%s/%Ld) getattr failed, error=%d\n", 787 inode->i_sb->s_id, 788 (long long)NFS_FILEID(inode), status); 789 if (status == -ESTALE) { 790 nfs_zap_caches(inode); 791 if (!S_ISDIR(inode->i_mode)) 792 set_bit(NFS_INO_STALE, &NFS_I(inode)->flags); 793 } 794 goto out; 795 } 796 797 status = nfs_refresh_inode(inode, fattr); 798 if (status) { 799 dfprintk(PAGECACHE, "nfs_revalidate_inode: (%s/%Ld) refresh failed, error=%d\n", 800 inode->i_sb->s_id, 801 (long long)NFS_FILEID(inode), status); 802 goto out; 803 } 804 805 if (nfsi->cache_validity & NFS_INO_INVALID_ACL) 806 nfs_zap_acl_cache(inode); 807 808 dfprintk(PAGECACHE, "NFS: (%s/%Ld) revalidation complete\n", 809 inode->i_sb->s_id, 810 (long long)NFS_FILEID(inode)); 811 812 out: 813 nfs_free_fattr(fattr); 814 return status; 815 } 816 817 int nfs_attribute_timeout(struct inode *inode) 818 { 819 struct nfs_inode *nfsi = NFS_I(inode); 820 821 return !time_in_range_open(jiffies, nfsi->read_cache_jiffies, nfsi->read_cache_jiffies + nfsi->attrtimeo); 822 } 823 824 static int nfs_attribute_cache_expired(struct inode *inode) 825 { 826 if (nfs_have_delegated_attributes(inode)) 827 return 0; 828 return nfs_attribute_timeout(inode); 829 } 830 831 /** 832 * nfs_revalidate_inode - Revalidate the inode attributes 833 * @server - pointer to nfs_server struct 834 * @inode - pointer to inode struct 835 * 836 * Updates inode attribute information by retrieving the data from the server. 837 */ 838 int nfs_revalidate_inode(struct nfs_server *server, struct inode *inode) 839 { 840 if (!(NFS_I(inode)->cache_validity & NFS_INO_INVALID_ATTR) 841 && !nfs_attribute_cache_expired(inode)) 842 return NFS_STALE(inode) ? -ESTALE : 0; 843 return __nfs_revalidate_inode(server, inode); 844 } 845 846 static int nfs_invalidate_mapping(struct inode *inode, struct address_space *mapping) 847 { 848 struct nfs_inode *nfsi = NFS_I(inode); 849 850 if (mapping->nrpages != 0) { 851 int ret = invalidate_inode_pages2(mapping); 852 if (ret < 0) 853 return ret; 854 } 855 spin_lock(&inode->i_lock); 856 nfsi->cache_validity &= ~NFS_INO_INVALID_DATA; 857 if (S_ISDIR(inode->i_mode)) 858 memset(nfsi->cookieverf, 0, sizeof(nfsi->cookieverf)); 859 spin_unlock(&inode->i_lock); 860 nfs_inc_stats(inode, NFSIOS_DATAINVALIDATE); 861 nfs_fscache_reset_inode_cookie(inode); 862 dfprintk(PAGECACHE, "NFS: (%s/%Ld) data cache invalidated\n", 863 inode->i_sb->s_id, (long long)NFS_FILEID(inode)); 864 return 0; 865 } 866 867 /** 868 * nfs_revalidate_mapping - Revalidate the pagecache 869 * @inode - pointer to host inode 870 * @mapping - pointer to mapping 871 */ 872 int nfs_revalidate_mapping(struct inode *inode, struct address_space *mapping) 873 { 874 struct nfs_inode *nfsi = NFS_I(inode); 875 int ret = 0; 876 877 if ((nfsi->cache_validity & NFS_INO_REVAL_PAGECACHE) 878 || nfs_attribute_cache_expired(inode) 879 || NFS_STALE(inode)) { 880 ret = __nfs_revalidate_inode(NFS_SERVER(inode), inode); 881 if (ret < 0) 882 goto out; 883 } 884 if (nfsi->cache_validity & NFS_INO_INVALID_DATA) 885 ret = nfs_invalidate_mapping(inode, mapping); 886 out: 887 return ret; 888 } 889 890 static unsigned long nfs_wcc_update_inode(struct inode *inode, struct nfs_fattr *fattr) 891 { 892 struct nfs_inode *nfsi = NFS_I(inode); 893 unsigned long ret = 0; 894 895 if ((fattr->valid & NFS_ATTR_FATTR_PRECHANGE) 896 && (fattr->valid & NFS_ATTR_FATTR_CHANGE) 897 && nfsi->change_attr == fattr->pre_change_attr) { 898 nfsi->change_attr = fattr->change_attr; 899 if (S_ISDIR(inode->i_mode)) 900 nfsi->cache_validity |= NFS_INO_INVALID_DATA; 901 ret |= NFS_INO_INVALID_ATTR; 902 } 903 /* If we have atomic WCC data, we may update some attributes */ 904 if ((fattr->valid & NFS_ATTR_FATTR_PRECTIME) 905 && (fattr->valid & NFS_ATTR_FATTR_CTIME) 906 && timespec_equal(&inode->i_ctime, &fattr->pre_ctime)) { 907 memcpy(&inode->i_ctime, &fattr->ctime, sizeof(inode->i_ctime)); 908 ret |= NFS_INO_INVALID_ATTR; 909 } 910 911 if ((fattr->valid & NFS_ATTR_FATTR_PREMTIME) 912 && (fattr->valid & NFS_ATTR_FATTR_MTIME) 913 && timespec_equal(&inode->i_mtime, &fattr->pre_mtime)) { 914 memcpy(&inode->i_mtime, &fattr->mtime, sizeof(inode->i_mtime)); 915 if (S_ISDIR(inode->i_mode)) 916 nfsi->cache_validity |= NFS_INO_INVALID_DATA; 917 ret |= NFS_INO_INVALID_ATTR; 918 } 919 if ((fattr->valid & NFS_ATTR_FATTR_PRESIZE) 920 && (fattr->valid & NFS_ATTR_FATTR_SIZE) 921 && i_size_read(inode) == nfs_size_to_loff_t(fattr->pre_size) 922 && nfsi->npages == 0) { 923 i_size_write(inode, nfs_size_to_loff_t(fattr->size)); 924 ret |= NFS_INO_INVALID_ATTR; 925 } 926 return ret; 927 } 928 929 /** 930 * nfs_check_inode_attributes - verify consistency of the inode attribute cache 931 * @inode - pointer to inode 932 * @fattr - updated attributes 933 * 934 * Verifies the attribute cache. If we have just changed the attributes, 935 * so that fattr carries weak cache consistency data, then it may 936 * also update the ctime/mtime/change_attribute. 937 */ 938 static int nfs_check_inode_attributes(struct inode *inode, struct nfs_fattr *fattr) 939 { 940 struct nfs_inode *nfsi = NFS_I(inode); 941 loff_t cur_size, new_isize; 942 unsigned long invalid = 0; 943 944 945 /* Has the inode gone and changed behind our back? */ 946 if ((fattr->valid & NFS_ATTR_FATTR_FILEID) && nfsi->fileid != fattr->fileid) 947 return -EIO; 948 if ((fattr->valid & NFS_ATTR_FATTR_TYPE) && (inode->i_mode & S_IFMT) != (fattr->mode & S_IFMT)) 949 return -EIO; 950 951 if ((fattr->valid & NFS_ATTR_FATTR_CHANGE) != 0 && 952 nfsi->change_attr != fattr->change_attr) 953 invalid |= NFS_INO_INVALID_ATTR|NFS_INO_REVAL_PAGECACHE; 954 955 /* Verify a few of the more important attributes */ 956 if ((fattr->valid & NFS_ATTR_FATTR_MTIME) && !timespec_equal(&inode->i_mtime, &fattr->mtime)) 957 invalid |= NFS_INO_INVALID_ATTR|NFS_INO_REVAL_PAGECACHE; 958 959 if (fattr->valid & NFS_ATTR_FATTR_SIZE) { 960 cur_size = i_size_read(inode); 961 new_isize = nfs_size_to_loff_t(fattr->size); 962 if (cur_size != new_isize && nfsi->npages == 0) 963 invalid |= NFS_INO_INVALID_ATTR|NFS_INO_REVAL_PAGECACHE; 964 } 965 966 /* Have any file permissions changed? */ 967 if ((fattr->valid & NFS_ATTR_FATTR_MODE) && (inode->i_mode & S_IALLUGO) != (fattr->mode & S_IALLUGO)) 968 invalid |= NFS_INO_INVALID_ATTR | NFS_INO_INVALID_ACCESS | NFS_INO_INVALID_ACL; 969 if ((fattr->valid & NFS_ATTR_FATTR_OWNER) && inode->i_uid != fattr->uid) 970 invalid |= NFS_INO_INVALID_ATTR | NFS_INO_INVALID_ACCESS | NFS_INO_INVALID_ACL; 971 if ((fattr->valid & NFS_ATTR_FATTR_GROUP) && inode->i_gid != fattr->gid) 972 invalid |= NFS_INO_INVALID_ATTR | NFS_INO_INVALID_ACCESS | NFS_INO_INVALID_ACL; 973 974 /* Has the link count changed? */ 975 if ((fattr->valid & NFS_ATTR_FATTR_NLINK) && inode->i_nlink != fattr->nlink) 976 invalid |= NFS_INO_INVALID_ATTR; 977 978 if ((fattr->valid & NFS_ATTR_FATTR_ATIME) && !timespec_equal(&inode->i_atime, &fattr->atime)) 979 invalid |= NFS_INO_INVALID_ATIME; 980 981 if (invalid != 0) 982 nfsi->cache_validity |= invalid; 983 984 nfsi->read_cache_jiffies = fattr->time_start; 985 return 0; 986 } 987 988 static int nfs_ctime_need_update(const struct inode *inode, const struct nfs_fattr *fattr) 989 { 990 if (!(fattr->valid & NFS_ATTR_FATTR_CTIME)) 991 return 0; 992 return timespec_compare(&fattr->ctime, &inode->i_ctime) > 0; 993 } 994 995 static int nfs_size_need_update(const struct inode *inode, const struct nfs_fattr *fattr) 996 { 997 if (!(fattr->valid & NFS_ATTR_FATTR_SIZE)) 998 return 0; 999 return nfs_size_to_loff_t(fattr->size) > i_size_read(inode); 1000 } 1001 1002 static atomic_long_t nfs_attr_generation_counter; 1003 1004 static unsigned long nfs_read_attr_generation_counter(void) 1005 { 1006 return atomic_long_read(&nfs_attr_generation_counter); 1007 } 1008 1009 unsigned long nfs_inc_attr_generation_counter(void) 1010 { 1011 return atomic_long_inc_return(&nfs_attr_generation_counter); 1012 } 1013 1014 void nfs_fattr_init(struct nfs_fattr *fattr) 1015 { 1016 fattr->valid = 0; 1017 fattr->time_start = jiffies; 1018 fattr->gencount = nfs_inc_attr_generation_counter(); 1019 } 1020 1021 struct nfs_fattr *nfs_alloc_fattr(void) 1022 { 1023 struct nfs_fattr *fattr; 1024 1025 fattr = kmalloc(sizeof(*fattr), GFP_NOFS); 1026 if (fattr != NULL) 1027 nfs_fattr_init(fattr); 1028 return fattr; 1029 } 1030 1031 struct nfs_fh *nfs_alloc_fhandle(void) 1032 { 1033 struct nfs_fh *fh; 1034 1035 fh = kmalloc(sizeof(struct nfs_fh), GFP_NOFS); 1036 if (fh != NULL) 1037 fh->size = 0; 1038 return fh; 1039 } 1040 1041 /** 1042 * nfs_inode_attrs_need_update - check if the inode attributes need updating 1043 * @inode - pointer to inode 1044 * @fattr - attributes 1045 * 1046 * Attempt to divine whether or not an RPC call reply carrying stale 1047 * attributes got scheduled after another call carrying updated ones. 1048 * 1049 * To do so, the function first assumes that a more recent ctime means 1050 * that the attributes in fattr are newer, however it also attempt to 1051 * catch the case where ctime either didn't change, or went backwards 1052 * (if someone reset the clock on the server) by looking at whether 1053 * or not this RPC call was started after the inode was last updated. 1054 * Note also the check for wraparound of 'attr_gencount' 1055 * 1056 * The function returns 'true' if it thinks the attributes in 'fattr' are 1057 * more recent than the ones cached in the inode. 1058 * 1059 */ 1060 static int nfs_inode_attrs_need_update(const struct inode *inode, const struct nfs_fattr *fattr) 1061 { 1062 const struct nfs_inode *nfsi = NFS_I(inode); 1063 1064 return ((long)fattr->gencount - (long)nfsi->attr_gencount) > 0 || 1065 nfs_ctime_need_update(inode, fattr) || 1066 nfs_size_need_update(inode, fattr) || 1067 ((long)nfsi->attr_gencount - (long)nfs_read_attr_generation_counter() > 0); 1068 } 1069 1070 static int nfs_refresh_inode_locked(struct inode *inode, struct nfs_fattr *fattr) 1071 { 1072 if (nfs_inode_attrs_need_update(inode, fattr)) 1073 return nfs_update_inode(inode, fattr); 1074 return nfs_check_inode_attributes(inode, fattr); 1075 } 1076 1077 /** 1078 * nfs_refresh_inode - try to update the inode attribute cache 1079 * @inode - pointer to inode 1080 * @fattr - updated attributes 1081 * 1082 * Check that an RPC call that returned attributes has not overlapped with 1083 * other recent updates of the inode metadata, then decide whether it is 1084 * safe to do a full update of the inode attributes, or whether just to 1085 * call nfs_check_inode_attributes. 1086 */ 1087 int nfs_refresh_inode(struct inode *inode, struct nfs_fattr *fattr) 1088 { 1089 int status; 1090 1091 if ((fattr->valid & NFS_ATTR_FATTR) == 0) 1092 return 0; 1093 spin_lock(&inode->i_lock); 1094 status = nfs_refresh_inode_locked(inode, fattr); 1095 spin_unlock(&inode->i_lock); 1096 1097 return status; 1098 } 1099 1100 static int nfs_post_op_update_inode_locked(struct inode *inode, struct nfs_fattr *fattr) 1101 { 1102 struct nfs_inode *nfsi = NFS_I(inode); 1103 1104 nfsi->cache_validity |= NFS_INO_INVALID_ATTR|NFS_INO_REVAL_PAGECACHE; 1105 if (S_ISDIR(inode->i_mode)) 1106 nfsi->cache_validity |= NFS_INO_INVALID_DATA; 1107 if ((fattr->valid & NFS_ATTR_FATTR) == 0) 1108 return 0; 1109 return nfs_refresh_inode_locked(inode, fattr); 1110 } 1111 1112 /** 1113 * nfs_post_op_update_inode - try to update the inode attribute cache 1114 * @inode - pointer to inode 1115 * @fattr - updated attributes 1116 * 1117 * After an operation that has changed the inode metadata, mark the 1118 * attribute cache as being invalid, then try to update it. 1119 * 1120 * NB: if the server didn't return any post op attributes, this 1121 * function will force the retrieval of attributes before the next 1122 * NFS request. Thus it should be used only for operations that 1123 * are expected to change one or more attributes, to avoid 1124 * unnecessary NFS requests and trips through nfs_update_inode(). 1125 */ 1126 int nfs_post_op_update_inode(struct inode *inode, struct nfs_fattr *fattr) 1127 { 1128 int status; 1129 1130 spin_lock(&inode->i_lock); 1131 status = nfs_post_op_update_inode_locked(inode, fattr); 1132 spin_unlock(&inode->i_lock); 1133 return status; 1134 } 1135 1136 /** 1137 * nfs_post_op_update_inode_force_wcc - try to update the inode attribute cache 1138 * @inode - pointer to inode 1139 * @fattr - updated attributes 1140 * 1141 * After an operation that has changed the inode metadata, mark the 1142 * attribute cache as being invalid, then try to update it. Fake up 1143 * weak cache consistency data, if none exist. 1144 * 1145 * This function is mainly designed to be used by the ->write_done() functions. 1146 */ 1147 int nfs_post_op_update_inode_force_wcc(struct inode *inode, struct nfs_fattr *fattr) 1148 { 1149 int status; 1150 1151 spin_lock(&inode->i_lock); 1152 /* Don't do a WCC update if these attributes are already stale */ 1153 if ((fattr->valid & NFS_ATTR_FATTR) == 0 || 1154 !nfs_inode_attrs_need_update(inode, fattr)) { 1155 fattr->valid &= ~(NFS_ATTR_FATTR_PRECHANGE 1156 | NFS_ATTR_FATTR_PRESIZE 1157 | NFS_ATTR_FATTR_PREMTIME 1158 | NFS_ATTR_FATTR_PRECTIME); 1159 goto out_noforce; 1160 } 1161 if ((fattr->valid & NFS_ATTR_FATTR_CHANGE) != 0 && 1162 (fattr->valid & NFS_ATTR_FATTR_PRECHANGE) == 0) { 1163 fattr->pre_change_attr = NFS_I(inode)->change_attr; 1164 fattr->valid |= NFS_ATTR_FATTR_PRECHANGE; 1165 } 1166 if ((fattr->valid & NFS_ATTR_FATTR_CTIME) != 0 && 1167 (fattr->valid & NFS_ATTR_FATTR_PRECTIME) == 0) { 1168 memcpy(&fattr->pre_ctime, &inode->i_ctime, sizeof(fattr->pre_ctime)); 1169 fattr->valid |= NFS_ATTR_FATTR_PRECTIME; 1170 } 1171 if ((fattr->valid & NFS_ATTR_FATTR_MTIME) != 0 && 1172 (fattr->valid & NFS_ATTR_FATTR_PREMTIME) == 0) { 1173 memcpy(&fattr->pre_mtime, &inode->i_mtime, sizeof(fattr->pre_mtime)); 1174 fattr->valid |= NFS_ATTR_FATTR_PREMTIME; 1175 } 1176 if ((fattr->valid & NFS_ATTR_FATTR_SIZE) != 0 && 1177 (fattr->valid & NFS_ATTR_FATTR_PRESIZE) == 0) { 1178 fattr->pre_size = i_size_read(inode); 1179 fattr->valid |= NFS_ATTR_FATTR_PRESIZE; 1180 } 1181 out_noforce: 1182 status = nfs_post_op_update_inode_locked(inode, fattr); 1183 spin_unlock(&inode->i_lock); 1184 return status; 1185 } 1186 1187 /* 1188 * Many nfs protocol calls return the new file attributes after 1189 * an operation. Here we update the inode to reflect the state 1190 * of the server's inode. 1191 * 1192 * This is a bit tricky because we have to make sure all dirty pages 1193 * have been sent off to the server before calling invalidate_inode_pages. 1194 * To make sure no other process adds more write requests while we try 1195 * our best to flush them, we make them sleep during the attribute refresh. 1196 * 1197 * A very similar scenario holds for the dir cache. 1198 */ 1199 static int nfs_update_inode(struct inode *inode, struct nfs_fattr *fattr) 1200 { 1201 struct nfs_server *server; 1202 struct nfs_inode *nfsi = NFS_I(inode); 1203 loff_t cur_isize, new_isize; 1204 unsigned long invalid = 0; 1205 unsigned long now = jiffies; 1206 unsigned long save_cache_validity; 1207 1208 dfprintk(VFS, "NFS: %s(%s/%ld ct=%d info=0x%x)\n", 1209 __func__, inode->i_sb->s_id, inode->i_ino, 1210 atomic_read(&inode->i_count), fattr->valid); 1211 1212 if ((fattr->valid & NFS_ATTR_FATTR_FILEID) && nfsi->fileid != fattr->fileid) 1213 goto out_fileid; 1214 1215 /* 1216 * Make sure the inode's type hasn't changed. 1217 */ 1218 if ((fattr->valid & NFS_ATTR_FATTR_TYPE) && (inode->i_mode & S_IFMT) != (fattr->mode & S_IFMT)) 1219 goto out_changed; 1220 1221 server = NFS_SERVER(inode); 1222 /* Update the fsid? */ 1223 if (S_ISDIR(inode->i_mode) && (fattr->valid & NFS_ATTR_FATTR_FSID) && 1224 !nfs_fsid_equal(&server->fsid, &fattr->fsid) && 1225 !IS_AUTOMOUNT(inode)) 1226 server->fsid = fattr->fsid; 1227 1228 /* 1229 * Update the read time so we don't revalidate too often. 1230 */ 1231 nfsi->read_cache_jiffies = fattr->time_start; 1232 1233 save_cache_validity = nfsi->cache_validity; 1234 nfsi->cache_validity &= ~(NFS_INO_INVALID_ATTR 1235 | NFS_INO_INVALID_ATIME 1236 | NFS_INO_REVAL_FORCED 1237 | NFS_INO_REVAL_PAGECACHE); 1238 1239 /* Do atomic weak cache consistency updates */ 1240 invalid |= nfs_wcc_update_inode(inode, fattr); 1241 1242 /* More cache consistency checks */ 1243 if (fattr->valid & NFS_ATTR_FATTR_CHANGE) { 1244 if (nfsi->change_attr != fattr->change_attr) { 1245 dprintk("NFS: change_attr change on server for file %s/%ld\n", 1246 inode->i_sb->s_id, inode->i_ino); 1247 invalid |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_DATA|NFS_INO_INVALID_ACCESS|NFS_INO_INVALID_ACL; 1248 if (S_ISDIR(inode->i_mode)) 1249 nfs_force_lookup_revalidate(inode); 1250 nfsi->change_attr = fattr->change_attr; 1251 } 1252 } else if (server->caps & NFS_CAP_CHANGE_ATTR) 1253 invalid |= save_cache_validity; 1254 1255 if (fattr->valid & NFS_ATTR_FATTR_MTIME) { 1256 /* NFSv2/v3: Check if the mtime agrees */ 1257 if (!timespec_equal(&inode->i_mtime, &fattr->mtime)) { 1258 dprintk("NFS: mtime change on server for file %s/%ld\n", 1259 inode->i_sb->s_id, inode->i_ino); 1260 invalid |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_DATA; 1261 if (S_ISDIR(inode->i_mode)) 1262 nfs_force_lookup_revalidate(inode); 1263 memcpy(&inode->i_mtime, &fattr->mtime, sizeof(inode->i_mtime)); 1264 } 1265 } else if (server->caps & NFS_CAP_MTIME) 1266 invalid |= save_cache_validity & (NFS_INO_INVALID_ATTR 1267 | NFS_INO_INVALID_DATA 1268 | NFS_INO_REVAL_PAGECACHE 1269 | NFS_INO_REVAL_FORCED); 1270 1271 if (fattr->valid & NFS_ATTR_FATTR_CTIME) { 1272 /* If ctime has changed we should definitely clear access+acl caches */ 1273 if (!timespec_equal(&inode->i_ctime, &fattr->ctime)) { 1274 invalid |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_ACCESS|NFS_INO_INVALID_ACL; 1275 /* and probably clear data for a directory too as utimes can cause 1276 * havoc with our cache. 1277 */ 1278 if (S_ISDIR(inode->i_mode)) { 1279 invalid |= NFS_INO_INVALID_DATA; 1280 nfs_force_lookup_revalidate(inode); 1281 } 1282 memcpy(&inode->i_ctime, &fattr->ctime, sizeof(inode->i_ctime)); 1283 } 1284 } else if (server->caps & NFS_CAP_CTIME) 1285 invalid |= save_cache_validity & (NFS_INO_INVALID_ATTR 1286 | NFS_INO_INVALID_ACCESS 1287 | NFS_INO_INVALID_ACL 1288 | NFS_INO_REVAL_FORCED); 1289 1290 /* Check if our cached file size is stale */ 1291 if (fattr->valid & NFS_ATTR_FATTR_SIZE) { 1292 new_isize = nfs_size_to_loff_t(fattr->size); 1293 cur_isize = i_size_read(inode); 1294 if (new_isize != cur_isize) { 1295 /* Do we perhaps have any outstanding writes, or has 1296 * the file grown beyond our last write? */ 1297 if (nfsi->npages == 0 || new_isize > cur_isize) { 1298 i_size_write(inode, new_isize); 1299 invalid |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_DATA; 1300 } 1301 dprintk("NFS: isize change on server for file %s/%ld " 1302 "(%Ld to %Ld)\n", 1303 inode->i_sb->s_id, 1304 inode->i_ino, 1305 (long long)cur_isize, 1306 (long long)new_isize); 1307 } 1308 } else 1309 invalid |= save_cache_validity & (NFS_INO_INVALID_ATTR 1310 | NFS_INO_REVAL_PAGECACHE 1311 | NFS_INO_REVAL_FORCED); 1312 1313 1314 if (fattr->valid & NFS_ATTR_FATTR_ATIME) 1315 memcpy(&inode->i_atime, &fattr->atime, sizeof(inode->i_atime)); 1316 else if (server->caps & NFS_CAP_ATIME) 1317 invalid |= save_cache_validity & (NFS_INO_INVALID_ATIME 1318 | NFS_INO_REVAL_FORCED); 1319 1320 if (fattr->valid & NFS_ATTR_FATTR_MODE) { 1321 if ((inode->i_mode & S_IALLUGO) != (fattr->mode & S_IALLUGO)) { 1322 umode_t newmode = inode->i_mode & S_IFMT; 1323 newmode |= fattr->mode & S_IALLUGO; 1324 inode->i_mode = newmode; 1325 invalid |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_ACCESS|NFS_INO_INVALID_ACL; 1326 } 1327 } else if (server->caps & NFS_CAP_MODE) 1328 invalid |= save_cache_validity & (NFS_INO_INVALID_ATTR 1329 | NFS_INO_INVALID_ACCESS 1330 | NFS_INO_INVALID_ACL 1331 | NFS_INO_REVAL_FORCED); 1332 1333 if (fattr->valid & NFS_ATTR_FATTR_OWNER) { 1334 if (inode->i_uid != fattr->uid) { 1335 invalid |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_ACCESS|NFS_INO_INVALID_ACL; 1336 inode->i_uid = fattr->uid; 1337 } 1338 } else if (server->caps & NFS_CAP_OWNER) 1339 invalid |= save_cache_validity & (NFS_INO_INVALID_ATTR 1340 | NFS_INO_INVALID_ACCESS 1341 | NFS_INO_INVALID_ACL 1342 | NFS_INO_REVAL_FORCED); 1343 1344 if (fattr->valid & NFS_ATTR_FATTR_GROUP) { 1345 if (inode->i_gid != fattr->gid) { 1346 invalid |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_ACCESS|NFS_INO_INVALID_ACL; 1347 inode->i_gid = fattr->gid; 1348 } 1349 } else if (server->caps & NFS_CAP_OWNER_GROUP) 1350 invalid |= save_cache_validity & (NFS_INO_INVALID_ATTR 1351 | NFS_INO_INVALID_ACCESS 1352 | NFS_INO_INVALID_ACL 1353 | NFS_INO_REVAL_FORCED); 1354 1355 if (fattr->valid & NFS_ATTR_FATTR_NLINK) { 1356 if (inode->i_nlink != fattr->nlink) { 1357 invalid |= NFS_INO_INVALID_ATTR; 1358 if (S_ISDIR(inode->i_mode)) 1359 invalid |= NFS_INO_INVALID_DATA; 1360 inode->i_nlink = fattr->nlink; 1361 } 1362 } else if (server->caps & NFS_CAP_NLINK) 1363 invalid |= save_cache_validity & (NFS_INO_INVALID_ATTR 1364 | NFS_INO_REVAL_FORCED); 1365 1366 if (fattr->valid & NFS_ATTR_FATTR_SPACE_USED) { 1367 /* 1368 * report the blocks in 512byte units 1369 */ 1370 inode->i_blocks = nfs_calc_block_size(fattr->du.nfs3.used); 1371 } 1372 if (fattr->valid & NFS_ATTR_FATTR_BLOCKS_USED) 1373 inode->i_blocks = fattr->du.nfs2.blocks; 1374 1375 /* Update attrtimeo value if we're out of the unstable period */ 1376 if (invalid & NFS_INO_INVALID_ATTR) { 1377 nfs_inc_stats(inode, NFSIOS_ATTRINVALIDATE); 1378 nfsi->attrtimeo = NFS_MINATTRTIMEO(inode); 1379 nfsi->attrtimeo_timestamp = now; 1380 nfsi->attr_gencount = nfs_inc_attr_generation_counter(); 1381 } else { 1382 if (!time_in_range_open(now, nfsi->attrtimeo_timestamp, nfsi->attrtimeo_timestamp + nfsi->attrtimeo)) { 1383 if ((nfsi->attrtimeo <<= 1) > NFS_MAXATTRTIMEO(inode)) 1384 nfsi->attrtimeo = NFS_MAXATTRTIMEO(inode); 1385 nfsi->attrtimeo_timestamp = now; 1386 } 1387 } 1388 invalid &= ~NFS_INO_INVALID_ATTR; 1389 /* Don't invalidate the data if we were to blame */ 1390 if (!(S_ISREG(inode->i_mode) || S_ISDIR(inode->i_mode) 1391 || S_ISLNK(inode->i_mode))) 1392 invalid &= ~NFS_INO_INVALID_DATA; 1393 if (!nfs_have_delegation(inode, FMODE_READ) || 1394 (save_cache_validity & NFS_INO_REVAL_FORCED)) 1395 nfsi->cache_validity |= invalid; 1396 1397 return 0; 1398 out_changed: 1399 /* 1400 * Big trouble! The inode has become a different object. 1401 */ 1402 printk(KERN_DEBUG "%s: inode %ld mode changed, %07o to %07o\n", 1403 __func__, inode->i_ino, inode->i_mode, fattr->mode); 1404 out_err: 1405 /* 1406 * No need to worry about unhashing the dentry, as the 1407 * lookup validation will know that the inode is bad. 1408 * (But we fall through to invalidate the caches.) 1409 */ 1410 nfs_invalidate_inode(inode); 1411 return -ESTALE; 1412 1413 out_fileid: 1414 printk(KERN_ERR "NFS: server %s error: fileid changed\n" 1415 "fsid %s: expected fileid 0x%Lx, got 0x%Lx\n", 1416 NFS_SERVER(inode)->nfs_client->cl_hostname, inode->i_sb->s_id, 1417 (long long)nfsi->fileid, (long long)fattr->fileid); 1418 goto out_err; 1419 } 1420 1421 1422 #ifdef CONFIG_NFS_V4 1423 1424 /* 1425 * Clean out any remaining NFSv4 state that might be left over due 1426 * to open() calls that passed nfs_atomic_lookup, but failed to call 1427 * nfs_open(). 1428 */ 1429 void nfs4_evict_inode(struct inode *inode) 1430 { 1431 truncate_inode_pages(&inode->i_data, 0); 1432 end_writeback(inode); 1433 pnfs_return_layout(inode); 1434 pnfs_destroy_layout(NFS_I(inode)); 1435 /* If we are holding a delegation, return it! */ 1436 nfs_inode_return_delegation_noreclaim(inode); 1437 /* First call standard NFS clear_inode() code */ 1438 nfs_clear_inode(inode); 1439 } 1440 #endif 1441 1442 struct inode *nfs_alloc_inode(struct super_block *sb) 1443 { 1444 struct nfs_inode *nfsi; 1445 nfsi = (struct nfs_inode *)kmem_cache_alloc(nfs_inode_cachep, GFP_KERNEL); 1446 if (!nfsi) 1447 return NULL; 1448 nfsi->flags = 0UL; 1449 nfsi->cache_validity = 0UL; 1450 #ifdef CONFIG_NFS_V3_ACL 1451 nfsi->acl_access = ERR_PTR(-EAGAIN); 1452 nfsi->acl_default = ERR_PTR(-EAGAIN); 1453 #endif 1454 #ifdef CONFIG_NFS_V4 1455 nfsi->nfs4_acl = NULL; 1456 #endif /* CONFIG_NFS_V4 */ 1457 return &nfsi->vfs_inode; 1458 } 1459 1460 static void nfs_i_callback(struct rcu_head *head) 1461 { 1462 struct inode *inode = container_of(head, struct inode, i_rcu); 1463 INIT_LIST_HEAD(&inode->i_dentry); 1464 kmem_cache_free(nfs_inode_cachep, NFS_I(inode)); 1465 } 1466 1467 void nfs_destroy_inode(struct inode *inode) 1468 { 1469 call_rcu(&inode->i_rcu, nfs_i_callback); 1470 } 1471 1472 static inline void nfs4_init_once(struct nfs_inode *nfsi) 1473 { 1474 #ifdef CONFIG_NFS_V4 1475 INIT_LIST_HEAD(&nfsi->open_states); 1476 nfsi->delegation = NULL; 1477 nfsi->delegation_state = 0; 1478 init_rwsem(&nfsi->rwsem); 1479 nfsi->layout = NULL; 1480 atomic_set(&nfsi->commits_outstanding, 0); 1481 #endif 1482 } 1483 1484 static void init_once(void *foo) 1485 { 1486 struct nfs_inode *nfsi = (struct nfs_inode *) foo; 1487 1488 inode_init_once(&nfsi->vfs_inode); 1489 INIT_LIST_HEAD(&nfsi->open_files); 1490 INIT_LIST_HEAD(&nfsi->access_cache_entry_lru); 1491 INIT_LIST_HEAD(&nfsi->access_cache_inode_lru); 1492 INIT_RADIX_TREE(&nfsi->nfs_page_tree, GFP_ATOMIC); 1493 nfsi->npages = 0; 1494 nfsi->ncommit = 0; 1495 atomic_set(&nfsi->silly_count, 1); 1496 INIT_HLIST_HEAD(&nfsi->silly_list); 1497 init_waitqueue_head(&nfsi->waitqueue); 1498 nfs4_init_once(nfsi); 1499 } 1500 1501 static int __init nfs_init_inodecache(void) 1502 { 1503 nfs_inode_cachep = kmem_cache_create("nfs_inode_cache", 1504 sizeof(struct nfs_inode), 1505 0, (SLAB_RECLAIM_ACCOUNT| 1506 SLAB_MEM_SPREAD), 1507 init_once); 1508 if (nfs_inode_cachep == NULL) 1509 return -ENOMEM; 1510 1511 return 0; 1512 } 1513 1514 static void nfs_destroy_inodecache(void) 1515 { 1516 kmem_cache_destroy(nfs_inode_cachep); 1517 } 1518 1519 struct workqueue_struct *nfsiod_workqueue; 1520 1521 /* 1522 * start up the nfsiod workqueue 1523 */ 1524 static int nfsiod_start(void) 1525 { 1526 struct workqueue_struct *wq; 1527 dprintk("RPC: creating workqueue nfsiod\n"); 1528 wq = alloc_workqueue("nfsiod", WQ_MEM_RECLAIM, 0); 1529 if (wq == NULL) 1530 return -ENOMEM; 1531 nfsiod_workqueue = wq; 1532 return 0; 1533 } 1534 1535 /* 1536 * Destroy the nfsiod workqueue 1537 */ 1538 static void nfsiod_stop(void) 1539 { 1540 struct workqueue_struct *wq; 1541 1542 wq = nfsiod_workqueue; 1543 if (wq == NULL) 1544 return; 1545 nfsiod_workqueue = NULL; 1546 destroy_workqueue(wq); 1547 } 1548 1549 /* 1550 * Initialize NFS 1551 */ 1552 static int __init init_nfs_fs(void) 1553 { 1554 int err; 1555 1556 err = nfs_idmap_init(); 1557 if (err < 0) 1558 goto out9; 1559 1560 err = nfs_dns_resolver_init(); 1561 if (err < 0) 1562 goto out8; 1563 1564 err = nfs_fscache_register(); 1565 if (err < 0) 1566 goto out7; 1567 1568 err = nfsiod_start(); 1569 if (err) 1570 goto out6; 1571 1572 err = nfs_fs_proc_init(); 1573 if (err) 1574 goto out5; 1575 1576 err = nfs_init_nfspagecache(); 1577 if (err) 1578 goto out4; 1579 1580 err = nfs_init_inodecache(); 1581 if (err) 1582 goto out3; 1583 1584 err = nfs_init_readpagecache(); 1585 if (err) 1586 goto out2; 1587 1588 err = nfs_init_writepagecache(); 1589 if (err) 1590 goto out1; 1591 1592 err = nfs_init_directcache(); 1593 if (err) 1594 goto out0; 1595 1596 #ifdef CONFIG_PROC_FS 1597 rpc_proc_register(&nfs_rpcstat); 1598 #endif 1599 if ((err = register_nfs_fs()) != 0) 1600 goto out; 1601 return 0; 1602 out: 1603 #ifdef CONFIG_PROC_FS 1604 rpc_proc_unregister("nfs"); 1605 #endif 1606 nfs_destroy_directcache(); 1607 out0: 1608 nfs_destroy_writepagecache(); 1609 out1: 1610 nfs_destroy_readpagecache(); 1611 out2: 1612 nfs_destroy_inodecache(); 1613 out3: 1614 nfs_destroy_nfspagecache(); 1615 out4: 1616 nfs_fs_proc_exit(); 1617 out5: 1618 nfsiod_stop(); 1619 out6: 1620 nfs_fscache_unregister(); 1621 out7: 1622 nfs_dns_resolver_destroy(); 1623 out8: 1624 nfs_idmap_quit(); 1625 out9: 1626 return err; 1627 } 1628 1629 static void __exit exit_nfs_fs(void) 1630 { 1631 nfs_destroy_directcache(); 1632 nfs_destroy_writepagecache(); 1633 nfs_destroy_readpagecache(); 1634 nfs_destroy_inodecache(); 1635 nfs_destroy_nfspagecache(); 1636 nfs_fscache_unregister(); 1637 nfs_dns_resolver_destroy(); 1638 nfs_idmap_quit(); 1639 #ifdef CONFIG_PROC_FS 1640 rpc_proc_unregister("nfs"); 1641 #endif 1642 nfs_cleanup_cb_ident_idr(); 1643 unregister_nfs_fs(); 1644 nfs_fs_proc_exit(); 1645 nfsiod_stop(); 1646 } 1647 1648 /* Not quite true; I just maintain it */ 1649 MODULE_AUTHOR("Olaf Kirch <okir@monad.swb.de>"); 1650 MODULE_LICENSE("GPL"); 1651 module_param(enable_ino64, bool, 0644); 1652 1653 module_init(init_nfs_fs) 1654 module_exit(exit_nfs_fs) 1655