1 /* 2 * linux/fs/nfs/inode.c 3 * 4 * Copyright (C) 1992 Rick Sladkey 5 * 6 * nfs inode and superblock handling functions 7 * 8 * Modularised by Alan Cox <alan@lxorguk.ukuu.org.uk>, while hacking some 9 * experimental NFS changes. Modularisation taken straight from SYS5 fs. 10 * 11 * Change to nfs_read_super() to permit NFS mounts to multi-homed hosts. 12 * J.S.Peatfield@damtp.cam.ac.uk 13 * 14 */ 15 16 #include <linux/module.h> 17 #include <linux/init.h> 18 #include <linux/sched.h> 19 #include <linux/time.h> 20 #include <linux/kernel.h> 21 #include <linux/mm.h> 22 #include <linux/string.h> 23 #include <linux/stat.h> 24 #include <linux/errno.h> 25 #include <linux/unistd.h> 26 #include <linux/sunrpc/clnt.h> 27 #include <linux/sunrpc/stats.h> 28 #include <linux/sunrpc/metrics.h> 29 #include <linux/nfs_fs.h> 30 #include <linux/nfs_mount.h> 31 #include <linux/nfs4_mount.h> 32 #include <linux/lockd/bind.h> 33 #include <linux/seq_file.h> 34 #include <linux/mount.h> 35 #include <linux/nfs_idmap.h> 36 #include <linux/vfs.h> 37 #include <linux/inet.h> 38 #include <linux/nfs_xdr.h> 39 #include <linux/slab.h> 40 #include <linux/compat.h> 41 42 #include <asm/system.h> 43 #include <asm/uaccess.h> 44 45 #include "nfs4_fs.h" 46 #include "callback.h" 47 #include "delegation.h" 48 #include "iostat.h" 49 #include "internal.h" 50 #include "fscache.h" 51 #include "dns_resolve.h" 52 #include "pnfs.h" 53 54 #define NFSDBG_FACILITY NFSDBG_VFS 55 56 #define NFS_64_BIT_INODE_NUMBERS_ENABLED 1 57 58 /* Default is to see 64-bit inode numbers */ 59 static int enable_ino64 = NFS_64_BIT_INODE_NUMBERS_ENABLED; 60 61 static void nfs_invalidate_inode(struct inode *); 62 static int nfs_update_inode(struct inode *, struct nfs_fattr *); 63 64 static struct kmem_cache * nfs_inode_cachep; 65 66 static inline unsigned long 67 nfs_fattr_to_ino_t(struct nfs_fattr *fattr) 68 { 69 return nfs_fileid_to_ino_t(fattr->fileid); 70 } 71 72 /** 73 * nfs_wait_bit_killable - helper for functions that are sleeping on bit locks 74 * @word: long word containing the bit lock 75 */ 76 int nfs_wait_bit_killable(void *word) 77 { 78 if (fatal_signal_pending(current)) 79 return -ERESTARTSYS; 80 schedule(); 81 return 0; 82 } 83 84 /** 85 * nfs_compat_user_ino64 - returns the user-visible inode number 86 * @fileid: 64-bit fileid 87 * 88 * This function returns a 32-bit inode number if the boot parameter 89 * nfs.enable_ino64 is zero. 90 */ 91 u64 nfs_compat_user_ino64(u64 fileid) 92 { 93 #ifdef CONFIG_COMPAT 94 compat_ulong_t ino; 95 #else 96 unsigned long ino; 97 #endif 98 99 if (enable_ino64) 100 return fileid; 101 ino = fileid; 102 if (sizeof(ino) < sizeof(fileid)) 103 ino ^= fileid >> (sizeof(fileid)-sizeof(ino)) * 8; 104 return ino; 105 } 106 107 static void nfs_clear_inode(struct inode *inode) 108 { 109 /* 110 * The following should never happen... 111 */ 112 BUG_ON(nfs_have_writebacks(inode)); 113 BUG_ON(!list_empty(&NFS_I(inode)->open_files)); 114 nfs_zap_acl_cache(inode); 115 nfs_access_zap_cache(inode); 116 nfs_fscache_release_inode_cookie(inode); 117 } 118 119 void nfs_evict_inode(struct inode *inode) 120 { 121 truncate_inode_pages(&inode->i_data, 0); 122 end_writeback(inode); 123 nfs_clear_inode(inode); 124 } 125 126 /** 127 * nfs_sync_mapping - helper to flush all mmapped dirty data to disk 128 */ 129 int nfs_sync_mapping(struct address_space *mapping) 130 { 131 int ret = 0; 132 133 if (mapping->nrpages != 0) { 134 unmap_mapping_range(mapping, 0, 0, 0); 135 ret = nfs_wb_all(mapping->host); 136 } 137 return ret; 138 } 139 140 /* 141 * Invalidate the local caches 142 */ 143 static void nfs_zap_caches_locked(struct inode *inode) 144 { 145 struct nfs_inode *nfsi = NFS_I(inode); 146 int mode = inode->i_mode; 147 148 nfs_inc_stats(inode, NFSIOS_ATTRINVALIDATE); 149 150 nfsi->attrtimeo = NFS_MINATTRTIMEO(inode); 151 nfsi->attrtimeo_timestamp = jiffies; 152 153 memset(NFS_COOKIEVERF(inode), 0, sizeof(NFS_COOKIEVERF(inode))); 154 if (S_ISREG(mode) || S_ISDIR(mode) || S_ISLNK(mode)) 155 nfsi->cache_validity |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_DATA|NFS_INO_INVALID_ACCESS|NFS_INO_INVALID_ACL|NFS_INO_REVAL_PAGECACHE; 156 else 157 nfsi->cache_validity |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_ACCESS|NFS_INO_INVALID_ACL|NFS_INO_REVAL_PAGECACHE; 158 } 159 160 void nfs_zap_caches(struct inode *inode) 161 { 162 spin_lock(&inode->i_lock); 163 nfs_zap_caches_locked(inode); 164 spin_unlock(&inode->i_lock); 165 } 166 167 void nfs_zap_mapping(struct inode *inode, struct address_space *mapping) 168 { 169 if (mapping->nrpages != 0) { 170 spin_lock(&inode->i_lock); 171 NFS_I(inode)->cache_validity |= NFS_INO_INVALID_DATA; 172 spin_unlock(&inode->i_lock); 173 } 174 } 175 176 void nfs_zap_acl_cache(struct inode *inode) 177 { 178 void (*clear_acl_cache)(struct inode *); 179 180 clear_acl_cache = NFS_PROTO(inode)->clear_acl_cache; 181 if (clear_acl_cache != NULL) 182 clear_acl_cache(inode); 183 spin_lock(&inode->i_lock); 184 NFS_I(inode)->cache_validity &= ~NFS_INO_INVALID_ACL; 185 spin_unlock(&inode->i_lock); 186 } 187 188 void nfs_invalidate_atime(struct inode *inode) 189 { 190 spin_lock(&inode->i_lock); 191 NFS_I(inode)->cache_validity |= NFS_INO_INVALID_ATIME; 192 spin_unlock(&inode->i_lock); 193 } 194 195 /* 196 * Invalidate, but do not unhash, the inode. 197 * NB: must be called with inode->i_lock held! 198 */ 199 static void nfs_invalidate_inode(struct inode *inode) 200 { 201 set_bit(NFS_INO_STALE, &NFS_I(inode)->flags); 202 nfs_zap_caches_locked(inode); 203 } 204 205 struct nfs_find_desc { 206 struct nfs_fh *fh; 207 struct nfs_fattr *fattr; 208 }; 209 210 /* 211 * In NFSv3 we can have 64bit inode numbers. In order to support 212 * this, and re-exported directories (also seen in NFSv2) 213 * we are forced to allow 2 different inodes to have the same 214 * i_ino. 215 */ 216 static int 217 nfs_find_actor(struct inode *inode, void *opaque) 218 { 219 struct nfs_find_desc *desc = (struct nfs_find_desc *)opaque; 220 struct nfs_fh *fh = desc->fh; 221 struct nfs_fattr *fattr = desc->fattr; 222 223 if (NFS_FILEID(inode) != fattr->fileid) 224 return 0; 225 if (nfs_compare_fh(NFS_FH(inode), fh)) 226 return 0; 227 if (is_bad_inode(inode) || NFS_STALE(inode)) 228 return 0; 229 return 1; 230 } 231 232 static int 233 nfs_init_locked(struct inode *inode, void *opaque) 234 { 235 struct nfs_find_desc *desc = (struct nfs_find_desc *)opaque; 236 struct nfs_fattr *fattr = desc->fattr; 237 238 set_nfs_fileid(inode, fattr->fileid); 239 nfs_copy_fh(NFS_FH(inode), desc->fh); 240 return 0; 241 } 242 243 /* 244 * This is our front-end to iget that looks up inodes by file handle 245 * instead of inode number. 246 */ 247 struct inode * 248 nfs_fhget(struct super_block *sb, struct nfs_fh *fh, struct nfs_fattr *fattr) 249 { 250 struct nfs_find_desc desc = { 251 .fh = fh, 252 .fattr = fattr 253 }; 254 struct inode *inode = ERR_PTR(-ENOENT); 255 unsigned long hash; 256 257 nfs_attr_check_mountpoint(sb, fattr); 258 259 if ((fattr->valid & NFS_ATTR_FATTR_FILEID) == 0 && (fattr->valid & NFS_ATTR_FATTR_MOUNTPOINT) == 0) 260 goto out_no_inode; 261 if ((fattr->valid & NFS_ATTR_FATTR_TYPE) == 0) 262 goto out_no_inode; 263 264 hash = nfs_fattr_to_ino_t(fattr); 265 266 inode = iget5_locked(sb, hash, nfs_find_actor, nfs_init_locked, &desc); 267 if (inode == NULL) { 268 inode = ERR_PTR(-ENOMEM); 269 goto out_no_inode; 270 } 271 272 if (inode->i_state & I_NEW) { 273 struct nfs_inode *nfsi = NFS_I(inode); 274 unsigned long now = jiffies; 275 276 /* We set i_ino for the few things that still rely on it, 277 * such as stat(2) */ 278 inode->i_ino = hash; 279 280 /* We can't support update_atime(), since the server will reset it */ 281 inode->i_flags |= S_NOATIME|S_NOCMTIME; 282 inode->i_mode = fattr->mode; 283 if ((fattr->valid & NFS_ATTR_FATTR_MODE) == 0 284 && nfs_server_capable(inode, NFS_CAP_MODE)) 285 nfsi->cache_validity |= NFS_INO_INVALID_ATTR 286 | NFS_INO_INVALID_ACCESS 287 | NFS_INO_INVALID_ACL; 288 /* Why so? Because we want revalidate for devices/FIFOs, and 289 * that's precisely what we have in nfs_file_inode_operations. 290 */ 291 inode->i_op = NFS_SB(sb)->nfs_client->rpc_ops->file_inode_ops; 292 if (S_ISREG(inode->i_mode)) { 293 inode->i_fop = &nfs_file_operations; 294 inode->i_data.a_ops = &nfs_file_aops; 295 inode->i_data.backing_dev_info = &NFS_SB(sb)->backing_dev_info; 296 } else if (S_ISDIR(inode->i_mode)) { 297 inode->i_op = NFS_SB(sb)->nfs_client->rpc_ops->dir_inode_ops; 298 inode->i_fop = &nfs_dir_operations; 299 inode->i_data.a_ops = &nfs_dir_aops; 300 if (nfs_server_capable(inode, NFS_CAP_READDIRPLUS)) 301 set_bit(NFS_INO_ADVISE_RDPLUS, &NFS_I(inode)->flags); 302 /* Deal with crossing mountpoints */ 303 if (fattr->valid & NFS_ATTR_FATTR_MOUNTPOINT || 304 fattr->valid & NFS_ATTR_FATTR_V4_REFERRAL) { 305 if (fattr->valid & NFS_ATTR_FATTR_V4_REFERRAL) 306 inode->i_op = &nfs_referral_inode_operations; 307 else 308 inode->i_op = &nfs_mountpoint_inode_operations; 309 inode->i_fop = NULL; 310 inode->i_flags |= S_AUTOMOUNT; 311 } 312 } else if (S_ISLNK(inode->i_mode)) 313 inode->i_op = &nfs_symlink_inode_operations; 314 else 315 init_special_inode(inode, inode->i_mode, fattr->rdev); 316 317 memset(&inode->i_atime, 0, sizeof(inode->i_atime)); 318 memset(&inode->i_mtime, 0, sizeof(inode->i_mtime)); 319 memset(&inode->i_ctime, 0, sizeof(inode->i_ctime)); 320 nfsi->change_attr = 0; 321 inode->i_size = 0; 322 inode->i_nlink = 0; 323 inode->i_uid = -2; 324 inode->i_gid = -2; 325 inode->i_blocks = 0; 326 memset(nfsi->cookieverf, 0, sizeof(nfsi->cookieverf)); 327 328 nfsi->read_cache_jiffies = fattr->time_start; 329 nfsi->attr_gencount = fattr->gencount; 330 if (fattr->valid & NFS_ATTR_FATTR_ATIME) 331 inode->i_atime = fattr->atime; 332 else if (nfs_server_capable(inode, NFS_CAP_ATIME)) 333 nfsi->cache_validity |= NFS_INO_INVALID_ATTR; 334 if (fattr->valid & NFS_ATTR_FATTR_MTIME) 335 inode->i_mtime = fattr->mtime; 336 else if (nfs_server_capable(inode, NFS_CAP_MTIME)) 337 nfsi->cache_validity |= NFS_INO_INVALID_ATTR 338 | NFS_INO_INVALID_DATA; 339 if (fattr->valid & NFS_ATTR_FATTR_CTIME) 340 inode->i_ctime = fattr->ctime; 341 else if (nfs_server_capable(inode, NFS_CAP_CTIME)) 342 nfsi->cache_validity |= NFS_INO_INVALID_ATTR 343 | NFS_INO_INVALID_ACCESS 344 | NFS_INO_INVALID_ACL; 345 if (fattr->valid & NFS_ATTR_FATTR_CHANGE) 346 nfsi->change_attr = fattr->change_attr; 347 else if (nfs_server_capable(inode, NFS_CAP_CHANGE_ATTR)) 348 nfsi->cache_validity |= NFS_INO_INVALID_ATTR 349 | NFS_INO_INVALID_DATA; 350 if (fattr->valid & NFS_ATTR_FATTR_SIZE) 351 inode->i_size = nfs_size_to_loff_t(fattr->size); 352 else 353 nfsi->cache_validity |= NFS_INO_INVALID_ATTR 354 | NFS_INO_INVALID_DATA 355 | NFS_INO_REVAL_PAGECACHE; 356 if (fattr->valid & NFS_ATTR_FATTR_NLINK) 357 inode->i_nlink = fattr->nlink; 358 else if (nfs_server_capable(inode, NFS_CAP_NLINK)) 359 nfsi->cache_validity |= NFS_INO_INVALID_ATTR; 360 if (fattr->valid & NFS_ATTR_FATTR_OWNER) 361 inode->i_uid = fattr->uid; 362 else if (nfs_server_capable(inode, NFS_CAP_OWNER)) 363 nfsi->cache_validity |= NFS_INO_INVALID_ATTR 364 | NFS_INO_INVALID_ACCESS 365 | NFS_INO_INVALID_ACL; 366 if (fattr->valid & NFS_ATTR_FATTR_GROUP) 367 inode->i_gid = fattr->gid; 368 else if (nfs_server_capable(inode, NFS_CAP_OWNER_GROUP)) 369 nfsi->cache_validity |= NFS_INO_INVALID_ATTR 370 | NFS_INO_INVALID_ACCESS 371 | NFS_INO_INVALID_ACL; 372 if (fattr->valid & NFS_ATTR_FATTR_BLOCKS_USED) 373 inode->i_blocks = fattr->du.nfs2.blocks; 374 if (fattr->valid & NFS_ATTR_FATTR_SPACE_USED) { 375 /* 376 * report the blocks in 512byte units 377 */ 378 inode->i_blocks = nfs_calc_block_size(fattr->du.nfs3.used); 379 } 380 nfsi->attrtimeo = NFS_MINATTRTIMEO(inode); 381 nfsi->attrtimeo_timestamp = now; 382 nfsi->access_cache = RB_ROOT; 383 384 nfs_fscache_init_inode_cookie(inode); 385 386 unlock_new_inode(inode); 387 } else 388 nfs_refresh_inode(inode, fattr); 389 dprintk("NFS: nfs_fhget(%s/%Ld ct=%d)\n", 390 inode->i_sb->s_id, 391 (long long)NFS_FILEID(inode), 392 atomic_read(&inode->i_count)); 393 394 out: 395 return inode; 396 397 out_no_inode: 398 dprintk("nfs_fhget: iget failed with error %ld\n", PTR_ERR(inode)); 399 goto out; 400 } 401 402 #define NFS_VALID_ATTRS (ATTR_MODE|ATTR_UID|ATTR_GID|ATTR_SIZE|ATTR_ATIME|ATTR_ATIME_SET|ATTR_MTIME|ATTR_MTIME_SET|ATTR_FILE) 403 404 int 405 nfs_setattr(struct dentry *dentry, struct iattr *attr) 406 { 407 struct inode *inode = dentry->d_inode; 408 struct nfs_fattr *fattr; 409 int error = -ENOMEM; 410 411 nfs_inc_stats(inode, NFSIOS_VFSSETATTR); 412 413 /* skip mode change if it's just for clearing setuid/setgid */ 414 if (attr->ia_valid & (ATTR_KILL_SUID | ATTR_KILL_SGID)) 415 attr->ia_valid &= ~ATTR_MODE; 416 417 if (attr->ia_valid & ATTR_SIZE) { 418 if (!S_ISREG(inode->i_mode) || attr->ia_size == i_size_read(inode)) 419 attr->ia_valid &= ~ATTR_SIZE; 420 } 421 422 /* Optimization: if the end result is no change, don't RPC */ 423 attr->ia_valid &= NFS_VALID_ATTRS; 424 if ((attr->ia_valid & ~ATTR_FILE) == 0) 425 return 0; 426 427 /* Write all dirty data */ 428 if (S_ISREG(inode->i_mode)) 429 nfs_wb_all(inode); 430 431 fattr = nfs_alloc_fattr(); 432 if (fattr == NULL) 433 goto out; 434 /* 435 * Return any delegations if we're going to change ACLs 436 */ 437 if ((attr->ia_valid & (ATTR_MODE|ATTR_UID|ATTR_GID)) != 0) 438 nfs_inode_return_delegation(inode); 439 error = NFS_PROTO(inode)->setattr(dentry, fattr, attr); 440 if (error == 0) 441 nfs_refresh_inode(inode, fattr); 442 nfs_free_fattr(fattr); 443 out: 444 return error; 445 } 446 447 /** 448 * nfs_vmtruncate - unmap mappings "freed" by truncate() syscall 449 * @inode: inode of the file used 450 * @offset: file offset to start truncating 451 * 452 * This is a copy of the common vmtruncate, but with the locking 453 * corrected to take into account the fact that NFS requires 454 * inode->i_size to be updated under the inode->i_lock. 455 */ 456 static int nfs_vmtruncate(struct inode * inode, loff_t offset) 457 { 458 loff_t oldsize; 459 int err; 460 461 err = inode_newsize_ok(inode, offset); 462 if (err) 463 goto out; 464 465 spin_lock(&inode->i_lock); 466 oldsize = inode->i_size; 467 i_size_write(inode, offset); 468 spin_unlock(&inode->i_lock); 469 470 truncate_pagecache(inode, oldsize, offset); 471 out: 472 return err; 473 } 474 475 /** 476 * nfs_setattr_update_inode - Update inode metadata after a setattr call. 477 * @inode: pointer to struct inode 478 * @attr: pointer to struct iattr 479 * 480 * Note: we do this in the *proc.c in order to ensure that 481 * it works for things like exclusive creates too. 482 */ 483 void nfs_setattr_update_inode(struct inode *inode, struct iattr *attr) 484 { 485 if ((attr->ia_valid & (ATTR_MODE|ATTR_UID|ATTR_GID)) != 0) { 486 spin_lock(&inode->i_lock); 487 if ((attr->ia_valid & ATTR_MODE) != 0) { 488 int mode = attr->ia_mode & S_IALLUGO; 489 mode |= inode->i_mode & ~S_IALLUGO; 490 inode->i_mode = mode; 491 } 492 if ((attr->ia_valid & ATTR_UID) != 0) 493 inode->i_uid = attr->ia_uid; 494 if ((attr->ia_valid & ATTR_GID) != 0) 495 inode->i_gid = attr->ia_gid; 496 NFS_I(inode)->cache_validity |= NFS_INO_INVALID_ACCESS|NFS_INO_INVALID_ACL; 497 spin_unlock(&inode->i_lock); 498 } 499 if ((attr->ia_valid & ATTR_SIZE) != 0) { 500 nfs_inc_stats(inode, NFSIOS_SETATTRTRUNC); 501 nfs_vmtruncate(inode, attr->ia_size); 502 } 503 } 504 505 int nfs_getattr(struct vfsmount *mnt, struct dentry *dentry, struct kstat *stat) 506 { 507 struct inode *inode = dentry->d_inode; 508 int need_atime = NFS_I(inode)->cache_validity & NFS_INO_INVALID_ATIME; 509 int err; 510 511 /* Flush out writes to the server in order to update c/mtime. */ 512 if (S_ISREG(inode->i_mode)) { 513 err = filemap_write_and_wait(inode->i_mapping); 514 if (err) 515 goto out; 516 } 517 518 /* 519 * We may force a getattr if the user cares about atime. 520 * 521 * Note that we only have to check the vfsmount flags here: 522 * - NFS always sets S_NOATIME by so checking it would give a 523 * bogus result 524 * - NFS never sets MS_NOATIME or MS_NODIRATIME so there is 525 * no point in checking those. 526 */ 527 if ((mnt->mnt_flags & MNT_NOATIME) || 528 ((mnt->mnt_flags & MNT_NODIRATIME) && S_ISDIR(inode->i_mode))) 529 need_atime = 0; 530 531 if (need_atime) 532 err = __nfs_revalidate_inode(NFS_SERVER(inode), inode); 533 else 534 err = nfs_revalidate_inode(NFS_SERVER(inode), inode); 535 if (!err) { 536 generic_fillattr(inode, stat); 537 stat->ino = nfs_compat_user_ino64(NFS_FILEID(inode)); 538 } 539 out: 540 return err; 541 } 542 543 static void nfs_init_lock_context(struct nfs_lock_context *l_ctx) 544 { 545 atomic_set(&l_ctx->count, 1); 546 l_ctx->lockowner = current->files; 547 l_ctx->pid = current->tgid; 548 INIT_LIST_HEAD(&l_ctx->list); 549 } 550 551 static struct nfs_lock_context *__nfs_find_lock_context(struct nfs_open_context *ctx) 552 { 553 struct nfs_lock_context *pos; 554 555 list_for_each_entry(pos, &ctx->lock_context.list, list) { 556 if (pos->lockowner != current->files) 557 continue; 558 if (pos->pid != current->tgid) 559 continue; 560 atomic_inc(&pos->count); 561 return pos; 562 } 563 return NULL; 564 } 565 566 struct nfs_lock_context *nfs_get_lock_context(struct nfs_open_context *ctx) 567 { 568 struct nfs_lock_context *res, *new = NULL; 569 struct inode *inode = ctx->path.dentry->d_inode; 570 571 spin_lock(&inode->i_lock); 572 res = __nfs_find_lock_context(ctx); 573 if (res == NULL) { 574 spin_unlock(&inode->i_lock); 575 new = kmalloc(sizeof(*new), GFP_KERNEL); 576 if (new == NULL) 577 return NULL; 578 nfs_init_lock_context(new); 579 spin_lock(&inode->i_lock); 580 res = __nfs_find_lock_context(ctx); 581 if (res == NULL) { 582 list_add_tail(&new->list, &ctx->lock_context.list); 583 new->open_context = ctx; 584 res = new; 585 new = NULL; 586 } 587 } 588 spin_unlock(&inode->i_lock); 589 kfree(new); 590 return res; 591 } 592 593 void nfs_put_lock_context(struct nfs_lock_context *l_ctx) 594 { 595 struct nfs_open_context *ctx = l_ctx->open_context; 596 struct inode *inode = ctx->path.dentry->d_inode; 597 598 if (!atomic_dec_and_lock(&l_ctx->count, &inode->i_lock)) 599 return; 600 list_del(&l_ctx->list); 601 spin_unlock(&inode->i_lock); 602 kfree(l_ctx); 603 } 604 605 /** 606 * nfs_close_context - Common close_context() routine NFSv2/v3 607 * @ctx: pointer to context 608 * @is_sync: is this a synchronous close 609 * 610 * always ensure that the attributes are up to date if we're mounted 611 * with close-to-open semantics 612 */ 613 void nfs_close_context(struct nfs_open_context *ctx, int is_sync) 614 { 615 struct inode *inode; 616 struct nfs_server *server; 617 618 if (!(ctx->mode & FMODE_WRITE)) 619 return; 620 if (!is_sync) 621 return; 622 inode = ctx->path.dentry->d_inode; 623 if (!list_empty(&NFS_I(inode)->open_files)) 624 return; 625 server = NFS_SERVER(inode); 626 if (server->flags & NFS_MOUNT_NOCTO) 627 return; 628 nfs_revalidate_inode(server, inode); 629 } 630 631 struct nfs_open_context *alloc_nfs_open_context(struct path *path, struct rpc_cred *cred, fmode_t f_mode) 632 { 633 struct nfs_open_context *ctx; 634 635 ctx = kmalloc(sizeof(*ctx), GFP_KERNEL); 636 if (ctx != NULL) { 637 ctx->path = *path; 638 path_get(&ctx->path); 639 ctx->cred = get_rpccred(cred); 640 ctx->state = NULL; 641 ctx->mode = f_mode; 642 ctx->flags = 0; 643 ctx->error = 0; 644 nfs_init_lock_context(&ctx->lock_context); 645 ctx->lock_context.open_context = ctx; 646 INIT_LIST_HEAD(&ctx->list); 647 } 648 return ctx; 649 } 650 651 struct nfs_open_context *get_nfs_open_context(struct nfs_open_context *ctx) 652 { 653 if (ctx != NULL) 654 atomic_inc(&ctx->lock_context.count); 655 return ctx; 656 } 657 658 static void __put_nfs_open_context(struct nfs_open_context *ctx, int is_sync) 659 { 660 struct inode *inode = ctx->path.dentry->d_inode; 661 662 if (!list_empty(&ctx->list)) { 663 if (!atomic_dec_and_lock(&ctx->lock_context.count, &inode->i_lock)) 664 return; 665 list_del(&ctx->list); 666 spin_unlock(&inode->i_lock); 667 } else if (!atomic_dec_and_test(&ctx->lock_context.count)) 668 return; 669 if (inode != NULL) 670 NFS_PROTO(inode)->close_context(ctx, is_sync); 671 if (ctx->cred != NULL) 672 put_rpccred(ctx->cred); 673 path_put(&ctx->path); 674 kfree(ctx); 675 } 676 677 void put_nfs_open_context(struct nfs_open_context *ctx) 678 { 679 __put_nfs_open_context(ctx, 0); 680 } 681 682 /* 683 * Ensure that mmap has a recent RPC credential for use when writing out 684 * shared pages 685 */ 686 void nfs_file_set_open_context(struct file *filp, struct nfs_open_context *ctx) 687 { 688 struct inode *inode = filp->f_path.dentry->d_inode; 689 struct nfs_inode *nfsi = NFS_I(inode); 690 691 filp->private_data = get_nfs_open_context(ctx); 692 spin_lock(&inode->i_lock); 693 list_add(&ctx->list, &nfsi->open_files); 694 spin_unlock(&inode->i_lock); 695 } 696 697 /* 698 * Given an inode, search for an open context with the desired characteristics 699 */ 700 struct nfs_open_context *nfs_find_open_context(struct inode *inode, struct rpc_cred *cred, fmode_t mode) 701 { 702 struct nfs_inode *nfsi = NFS_I(inode); 703 struct nfs_open_context *pos, *ctx = NULL; 704 705 spin_lock(&inode->i_lock); 706 list_for_each_entry(pos, &nfsi->open_files, list) { 707 if (cred != NULL && pos->cred != cred) 708 continue; 709 if ((pos->mode & (FMODE_READ|FMODE_WRITE)) != mode) 710 continue; 711 ctx = get_nfs_open_context(pos); 712 break; 713 } 714 spin_unlock(&inode->i_lock); 715 return ctx; 716 } 717 718 static void nfs_file_clear_open_context(struct file *filp) 719 { 720 struct inode *inode = filp->f_path.dentry->d_inode; 721 struct nfs_open_context *ctx = nfs_file_open_context(filp); 722 723 if (ctx) { 724 filp->private_data = NULL; 725 spin_lock(&inode->i_lock); 726 list_move_tail(&ctx->list, &NFS_I(inode)->open_files); 727 spin_unlock(&inode->i_lock); 728 __put_nfs_open_context(ctx, filp->f_flags & O_DIRECT ? 0 : 1); 729 } 730 } 731 732 /* 733 * These allocate and release file read/write context information. 734 */ 735 int nfs_open(struct inode *inode, struct file *filp) 736 { 737 struct nfs_open_context *ctx; 738 struct rpc_cred *cred; 739 740 cred = rpc_lookup_cred(); 741 if (IS_ERR(cred)) 742 return PTR_ERR(cred); 743 ctx = alloc_nfs_open_context(&filp->f_path, cred, filp->f_mode); 744 put_rpccred(cred); 745 if (ctx == NULL) 746 return -ENOMEM; 747 nfs_file_set_open_context(filp, ctx); 748 put_nfs_open_context(ctx); 749 nfs_fscache_set_inode_cookie(inode, filp); 750 return 0; 751 } 752 753 int nfs_release(struct inode *inode, struct file *filp) 754 { 755 nfs_file_clear_open_context(filp); 756 return 0; 757 } 758 759 /* 760 * This function is called whenever some part of NFS notices that 761 * the cached attributes have to be refreshed. 762 */ 763 int 764 __nfs_revalidate_inode(struct nfs_server *server, struct inode *inode) 765 { 766 int status = -ESTALE; 767 struct nfs_fattr *fattr = NULL; 768 struct nfs_inode *nfsi = NFS_I(inode); 769 770 dfprintk(PAGECACHE, "NFS: revalidating (%s/%Ld)\n", 771 inode->i_sb->s_id, (long long)NFS_FILEID(inode)); 772 773 if (is_bad_inode(inode)) 774 goto out; 775 if (NFS_STALE(inode)) 776 goto out; 777 778 status = -ENOMEM; 779 fattr = nfs_alloc_fattr(); 780 if (fattr == NULL) 781 goto out; 782 783 nfs_inc_stats(inode, NFSIOS_INODEREVALIDATE); 784 status = NFS_PROTO(inode)->getattr(server, NFS_FH(inode), fattr); 785 if (status != 0) { 786 dfprintk(PAGECACHE, "nfs_revalidate_inode: (%s/%Ld) getattr failed, error=%d\n", 787 inode->i_sb->s_id, 788 (long long)NFS_FILEID(inode), status); 789 if (status == -ESTALE) { 790 nfs_zap_caches(inode); 791 if (!S_ISDIR(inode->i_mode)) 792 set_bit(NFS_INO_STALE, &NFS_I(inode)->flags); 793 } 794 goto out; 795 } 796 797 status = nfs_refresh_inode(inode, fattr); 798 if (status) { 799 dfprintk(PAGECACHE, "nfs_revalidate_inode: (%s/%Ld) refresh failed, error=%d\n", 800 inode->i_sb->s_id, 801 (long long)NFS_FILEID(inode), status); 802 goto out; 803 } 804 805 if (nfsi->cache_validity & NFS_INO_INVALID_ACL) 806 nfs_zap_acl_cache(inode); 807 808 dfprintk(PAGECACHE, "NFS: (%s/%Ld) revalidation complete\n", 809 inode->i_sb->s_id, 810 (long long)NFS_FILEID(inode)); 811 812 out: 813 nfs_free_fattr(fattr); 814 return status; 815 } 816 817 int nfs_attribute_timeout(struct inode *inode) 818 { 819 struct nfs_inode *nfsi = NFS_I(inode); 820 821 return !time_in_range_open(jiffies, nfsi->read_cache_jiffies, nfsi->read_cache_jiffies + nfsi->attrtimeo); 822 } 823 824 static int nfs_attribute_cache_expired(struct inode *inode) 825 { 826 if (nfs_have_delegated_attributes(inode)) 827 return 0; 828 return nfs_attribute_timeout(inode); 829 } 830 831 /** 832 * nfs_revalidate_inode - Revalidate the inode attributes 833 * @server - pointer to nfs_server struct 834 * @inode - pointer to inode struct 835 * 836 * Updates inode attribute information by retrieving the data from the server. 837 */ 838 int nfs_revalidate_inode(struct nfs_server *server, struct inode *inode) 839 { 840 if (!(NFS_I(inode)->cache_validity & NFS_INO_INVALID_ATTR) 841 && !nfs_attribute_cache_expired(inode)) 842 return NFS_STALE(inode) ? -ESTALE : 0; 843 return __nfs_revalidate_inode(server, inode); 844 } 845 846 static int nfs_invalidate_mapping(struct inode *inode, struct address_space *mapping) 847 { 848 struct nfs_inode *nfsi = NFS_I(inode); 849 850 if (mapping->nrpages != 0) { 851 int ret = invalidate_inode_pages2(mapping); 852 if (ret < 0) 853 return ret; 854 } 855 spin_lock(&inode->i_lock); 856 nfsi->cache_validity &= ~NFS_INO_INVALID_DATA; 857 if (S_ISDIR(inode->i_mode)) 858 memset(nfsi->cookieverf, 0, sizeof(nfsi->cookieverf)); 859 spin_unlock(&inode->i_lock); 860 nfs_inc_stats(inode, NFSIOS_DATAINVALIDATE); 861 nfs_fscache_reset_inode_cookie(inode); 862 dfprintk(PAGECACHE, "NFS: (%s/%Ld) data cache invalidated\n", 863 inode->i_sb->s_id, (long long)NFS_FILEID(inode)); 864 return 0; 865 } 866 867 /** 868 * nfs_revalidate_mapping - Revalidate the pagecache 869 * @inode - pointer to host inode 870 * @mapping - pointer to mapping 871 */ 872 int nfs_revalidate_mapping(struct inode *inode, struct address_space *mapping) 873 { 874 struct nfs_inode *nfsi = NFS_I(inode); 875 int ret = 0; 876 877 if ((nfsi->cache_validity & NFS_INO_REVAL_PAGECACHE) 878 || nfs_attribute_cache_expired(inode) 879 || NFS_STALE(inode)) { 880 ret = __nfs_revalidate_inode(NFS_SERVER(inode), inode); 881 if (ret < 0) 882 goto out; 883 } 884 if (nfsi->cache_validity & NFS_INO_INVALID_DATA) 885 ret = nfs_invalidate_mapping(inode, mapping); 886 out: 887 return ret; 888 } 889 890 static unsigned long nfs_wcc_update_inode(struct inode *inode, struct nfs_fattr *fattr) 891 { 892 struct nfs_inode *nfsi = NFS_I(inode); 893 unsigned long ret = 0; 894 895 if ((fattr->valid & NFS_ATTR_FATTR_PRECHANGE) 896 && (fattr->valid & NFS_ATTR_FATTR_CHANGE) 897 && nfsi->change_attr == fattr->pre_change_attr) { 898 nfsi->change_attr = fattr->change_attr; 899 if (S_ISDIR(inode->i_mode)) 900 nfsi->cache_validity |= NFS_INO_INVALID_DATA; 901 ret |= NFS_INO_INVALID_ATTR; 902 } 903 /* If we have atomic WCC data, we may update some attributes */ 904 if ((fattr->valid & NFS_ATTR_FATTR_PRECTIME) 905 && (fattr->valid & NFS_ATTR_FATTR_CTIME) 906 && timespec_equal(&inode->i_ctime, &fattr->pre_ctime)) { 907 memcpy(&inode->i_ctime, &fattr->ctime, sizeof(inode->i_ctime)); 908 ret |= NFS_INO_INVALID_ATTR; 909 } 910 911 if ((fattr->valid & NFS_ATTR_FATTR_PREMTIME) 912 && (fattr->valid & NFS_ATTR_FATTR_MTIME) 913 && timespec_equal(&inode->i_mtime, &fattr->pre_mtime)) { 914 memcpy(&inode->i_mtime, &fattr->mtime, sizeof(inode->i_mtime)); 915 if (S_ISDIR(inode->i_mode)) 916 nfsi->cache_validity |= NFS_INO_INVALID_DATA; 917 ret |= NFS_INO_INVALID_ATTR; 918 } 919 if ((fattr->valid & NFS_ATTR_FATTR_PRESIZE) 920 && (fattr->valid & NFS_ATTR_FATTR_SIZE) 921 && i_size_read(inode) == nfs_size_to_loff_t(fattr->pre_size) 922 && nfsi->npages == 0) { 923 i_size_write(inode, nfs_size_to_loff_t(fattr->size)); 924 ret |= NFS_INO_INVALID_ATTR; 925 } 926 return ret; 927 } 928 929 /** 930 * nfs_check_inode_attributes - verify consistency of the inode attribute cache 931 * @inode - pointer to inode 932 * @fattr - updated attributes 933 * 934 * Verifies the attribute cache. If we have just changed the attributes, 935 * so that fattr carries weak cache consistency data, then it may 936 * also update the ctime/mtime/change_attribute. 937 */ 938 static int nfs_check_inode_attributes(struct inode *inode, struct nfs_fattr *fattr) 939 { 940 struct nfs_inode *nfsi = NFS_I(inode); 941 loff_t cur_size, new_isize; 942 unsigned long invalid = 0; 943 944 945 /* Has the inode gone and changed behind our back? */ 946 if ((fattr->valid & NFS_ATTR_FATTR_FILEID) && nfsi->fileid != fattr->fileid) 947 return -EIO; 948 if ((fattr->valid & NFS_ATTR_FATTR_TYPE) && (inode->i_mode & S_IFMT) != (fattr->mode & S_IFMT)) 949 return -EIO; 950 951 if ((fattr->valid & NFS_ATTR_FATTR_CHANGE) != 0 && 952 nfsi->change_attr != fattr->change_attr) 953 invalid |= NFS_INO_INVALID_ATTR|NFS_INO_REVAL_PAGECACHE; 954 955 /* Verify a few of the more important attributes */ 956 if ((fattr->valid & NFS_ATTR_FATTR_MTIME) && !timespec_equal(&inode->i_mtime, &fattr->mtime)) 957 invalid |= NFS_INO_INVALID_ATTR|NFS_INO_REVAL_PAGECACHE; 958 959 if (fattr->valid & NFS_ATTR_FATTR_SIZE) { 960 cur_size = i_size_read(inode); 961 new_isize = nfs_size_to_loff_t(fattr->size); 962 if (cur_size != new_isize && nfsi->npages == 0) 963 invalid |= NFS_INO_INVALID_ATTR|NFS_INO_REVAL_PAGECACHE; 964 } 965 966 /* Have any file permissions changed? */ 967 if ((fattr->valid & NFS_ATTR_FATTR_MODE) && (inode->i_mode & S_IALLUGO) != (fattr->mode & S_IALLUGO)) 968 invalid |= NFS_INO_INVALID_ATTR | NFS_INO_INVALID_ACCESS | NFS_INO_INVALID_ACL; 969 if ((fattr->valid & NFS_ATTR_FATTR_OWNER) && inode->i_uid != fattr->uid) 970 invalid |= NFS_INO_INVALID_ATTR | NFS_INO_INVALID_ACCESS | NFS_INO_INVALID_ACL; 971 if ((fattr->valid & NFS_ATTR_FATTR_GROUP) && inode->i_gid != fattr->gid) 972 invalid |= NFS_INO_INVALID_ATTR | NFS_INO_INVALID_ACCESS | NFS_INO_INVALID_ACL; 973 974 /* Has the link count changed? */ 975 if ((fattr->valid & NFS_ATTR_FATTR_NLINK) && inode->i_nlink != fattr->nlink) 976 invalid |= NFS_INO_INVALID_ATTR; 977 978 if ((fattr->valid & NFS_ATTR_FATTR_ATIME) && !timespec_equal(&inode->i_atime, &fattr->atime)) 979 invalid |= NFS_INO_INVALID_ATIME; 980 981 if (invalid != 0) 982 nfsi->cache_validity |= invalid; 983 984 nfsi->read_cache_jiffies = fattr->time_start; 985 return 0; 986 } 987 988 static int nfs_ctime_need_update(const struct inode *inode, const struct nfs_fattr *fattr) 989 { 990 if (!(fattr->valid & NFS_ATTR_FATTR_CTIME)) 991 return 0; 992 return timespec_compare(&fattr->ctime, &inode->i_ctime) > 0; 993 } 994 995 static int nfs_size_need_update(const struct inode *inode, const struct nfs_fattr *fattr) 996 { 997 if (!(fattr->valid & NFS_ATTR_FATTR_SIZE)) 998 return 0; 999 return nfs_size_to_loff_t(fattr->size) > i_size_read(inode); 1000 } 1001 1002 static atomic_long_t nfs_attr_generation_counter; 1003 1004 static unsigned long nfs_read_attr_generation_counter(void) 1005 { 1006 return atomic_long_read(&nfs_attr_generation_counter); 1007 } 1008 1009 unsigned long nfs_inc_attr_generation_counter(void) 1010 { 1011 return atomic_long_inc_return(&nfs_attr_generation_counter); 1012 } 1013 1014 void nfs_fattr_init(struct nfs_fattr *fattr) 1015 { 1016 fattr->valid = 0; 1017 fattr->time_start = jiffies; 1018 fattr->gencount = nfs_inc_attr_generation_counter(); 1019 } 1020 1021 struct nfs_fattr *nfs_alloc_fattr(void) 1022 { 1023 struct nfs_fattr *fattr; 1024 1025 fattr = kmalloc(sizeof(*fattr), GFP_NOFS); 1026 if (fattr != NULL) 1027 nfs_fattr_init(fattr); 1028 return fattr; 1029 } 1030 1031 struct nfs_fh *nfs_alloc_fhandle(void) 1032 { 1033 struct nfs_fh *fh; 1034 1035 fh = kmalloc(sizeof(struct nfs_fh), GFP_NOFS); 1036 if (fh != NULL) 1037 fh->size = 0; 1038 return fh; 1039 } 1040 1041 /** 1042 * nfs_inode_attrs_need_update - check if the inode attributes need updating 1043 * @inode - pointer to inode 1044 * @fattr - attributes 1045 * 1046 * Attempt to divine whether or not an RPC call reply carrying stale 1047 * attributes got scheduled after another call carrying updated ones. 1048 * 1049 * To do so, the function first assumes that a more recent ctime means 1050 * that the attributes in fattr are newer, however it also attempt to 1051 * catch the case where ctime either didn't change, or went backwards 1052 * (if someone reset the clock on the server) by looking at whether 1053 * or not this RPC call was started after the inode was last updated. 1054 * Note also the check for wraparound of 'attr_gencount' 1055 * 1056 * The function returns 'true' if it thinks the attributes in 'fattr' are 1057 * more recent than the ones cached in the inode. 1058 * 1059 */ 1060 static int nfs_inode_attrs_need_update(const struct inode *inode, const struct nfs_fattr *fattr) 1061 { 1062 const struct nfs_inode *nfsi = NFS_I(inode); 1063 1064 return ((long)fattr->gencount - (long)nfsi->attr_gencount) > 0 || 1065 nfs_ctime_need_update(inode, fattr) || 1066 nfs_size_need_update(inode, fattr) || 1067 ((long)nfsi->attr_gencount - (long)nfs_read_attr_generation_counter() > 0); 1068 } 1069 1070 static int nfs_refresh_inode_locked(struct inode *inode, struct nfs_fattr *fattr) 1071 { 1072 if (nfs_inode_attrs_need_update(inode, fattr)) 1073 return nfs_update_inode(inode, fattr); 1074 return nfs_check_inode_attributes(inode, fattr); 1075 } 1076 1077 /** 1078 * nfs_refresh_inode - try to update the inode attribute cache 1079 * @inode - pointer to inode 1080 * @fattr - updated attributes 1081 * 1082 * Check that an RPC call that returned attributes has not overlapped with 1083 * other recent updates of the inode metadata, then decide whether it is 1084 * safe to do a full update of the inode attributes, or whether just to 1085 * call nfs_check_inode_attributes. 1086 */ 1087 int nfs_refresh_inode(struct inode *inode, struct nfs_fattr *fattr) 1088 { 1089 int status; 1090 1091 if ((fattr->valid & NFS_ATTR_FATTR) == 0) 1092 return 0; 1093 spin_lock(&inode->i_lock); 1094 status = nfs_refresh_inode_locked(inode, fattr); 1095 spin_unlock(&inode->i_lock); 1096 1097 return status; 1098 } 1099 1100 static int nfs_post_op_update_inode_locked(struct inode *inode, struct nfs_fattr *fattr) 1101 { 1102 struct nfs_inode *nfsi = NFS_I(inode); 1103 1104 nfsi->cache_validity |= NFS_INO_INVALID_ATTR|NFS_INO_REVAL_PAGECACHE; 1105 if (S_ISDIR(inode->i_mode)) 1106 nfsi->cache_validity |= NFS_INO_INVALID_DATA; 1107 if ((fattr->valid & NFS_ATTR_FATTR) == 0) 1108 return 0; 1109 return nfs_refresh_inode_locked(inode, fattr); 1110 } 1111 1112 /** 1113 * nfs_post_op_update_inode - try to update the inode attribute cache 1114 * @inode - pointer to inode 1115 * @fattr - updated attributes 1116 * 1117 * After an operation that has changed the inode metadata, mark the 1118 * attribute cache as being invalid, then try to update it. 1119 * 1120 * NB: if the server didn't return any post op attributes, this 1121 * function will force the retrieval of attributes before the next 1122 * NFS request. Thus it should be used only for operations that 1123 * are expected to change one or more attributes, to avoid 1124 * unnecessary NFS requests and trips through nfs_update_inode(). 1125 */ 1126 int nfs_post_op_update_inode(struct inode *inode, struct nfs_fattr *fattr) 1127 { 1128 int status; 1129 1130 spin_lock(&inode->i_lock); 1131 status = nfs_post_op_update_inode_locked(inode, fattr); 1132 spin_unlock(&inode->i_lock); 1133 return status; 1134 } 1135 1136 /** 1137 * nfs_post_op_update_inode_force_wcc - try to update the inode attribute cache 1138 * @inode - pointer to inode 1139 * @fattr - updated attributes 1140 * 1141 * After an operation that has changed the inode metadata, mark the 1142 * attribute cache as being invalid, then try to update it. Fake up 1143 * weak cache consistency data, if none exist. 1144 * 1145 * This function is mainly designed to be used by the ->write_done() functions. 1146 */ 1147 int nfs_post_op_update_inode_force_wcc(struct inode *inode, struct nfs_fattr *fattr) 1148 { 1149 int status; 1150 1151 spin_lock(&inode->i_lock); 1152 /* Don't do a WCC update if these attributes are already stale */ 1153 if ((fattr->valid & NFS_ATTR_FATTR) == 0 || 1154 !nfs_inode_attrs_need_update(inode, fattr)) { 1155 fattr->valid &= ~(NFS_ATTR_FATTR_PRECHANGE 1156 | NFS_ATTR_FATTR_PRESIZE 1157 | NFS_ATTR_FATTR_PREMTIME 1158 | NFS_ATTR_FATTR_PRECTIME); 1159 goto out_noforce; 1160 } 1161 if ((fattr->valid & NFS_ATTR_FATTR_CHANGE) != 0 && 1162 (fattr->valid & NFS_ATTR_FATTR_PRECHANGE) == 0) { 1163 fattr->pre_change_attr = NFS_I(inode)->change_attr; 1164 fattr->valid |= NFS_ATTR_FATTR_PRECHANGE; 1165 } 1166 if ((fattr->valid & NFS_ATTR_FATTR_CTIME) != 0 && 1167 (fattr->valid & NFS_ATTR_FATTR_PRECTIME) == 0) { 1168 memcpy(&fattr->pre_ctime, &inode->i_ctime, sizeof(fattr->pre_ctime)); 1169 fattr->valid |= NFS_ATTR_FATTR_PRECTIME; 1170 } 1171 if ((fattr->valid & NFS_ATTR_FATTR_MTIME) != 0 && 1172 (fattr->valid & NFS_ATTR_FATTR_PREMTIME) == 0) { 1173 memcpy(&fattr->pre_mtime, &inode->i_mtime, sizeof(fattr->pre_mtime)); 1174 fattr->valid |= NFS_ATTR_FATTR_PREMTIME; 1175 } 1176 if ((fattr->valid & NFS_ATTR_FATTR_SIZE) != 0 && 1177 (fattr->valid & NFS_ATTR_FATTR_PRESIZE) == 0) { 1178 fattr->pre_size = i_size_read(inode); 1179 fattr->valid |= NFS_ATTR_FATTR_PRESIZE; 1180 } 1181 out_noforce: 1182 status = nfs_post_op_update_inode_locked(inode, fattr); 1183 spin_unlock(&inode->i_lock); 1184 return status; 1185 } 1186 1187 /* 1188 * Many nfs protocol calls return the new file attributes after 1189 * an operation. Here we update the inode to reflect the state 1190 * of the server's inode. 1191 * 1192 * This is a bit tricky because we have to make sure all dirty pages 1193 * have been sent off to the server before calling invalidate_inode_pages. 1194 * To make sure no other process adds more write requests while we try 1195 * our best to flush them, we make them sleep during the attribute refresh. 1196 * 1197 * A very similar scenario holds for the dir cache. 1198 */ 1199 static int nfs_update_inode(struct inode *inode, struct nfs_fattr *fattr) 1200 { 1201 struct nfs_server *server; 1202 struct nfs_inode *nfsi = NFS_I(inode); 1203 loff_t cur_isize, new_isize; 1204 unsigned long invalid = 0; 1205 unsigned long now = jiffies; 1206 unsigned long save_cache_validity; 1207 1208 dfprintk(VFS, "NFS: %s(%s/%ld ct=%d info=0x%x)\n", 1209 __func__, inode->i_sb->s_id, inode->i_ino, 1210 atomic_read(&inode->i_count), fattr->valid); 1211 1212 if ((fattr->valid & NFS_ATTR_FATTR_FILEID) && nfsi->fileid != fattr->fileid) 1213 goto out_fileid; 1214 1215 /* 1216 * Make sure the inode's type hasn't changed. 1217 */ 1218 if ((fattr->valid & NFS_ATTR_FATTR_TYPE) && (inode->i_mode & S_IFMT) != (fattr->mode & S_IFMT)) 1219 goto out_changed; 1220 1221 server = NFS_SERVER(inode); 1222 /* Update the fsid? */ 1223 if (S_ISDIR(inode->i_mode) && (fattr->valid & NFS_ATTR_FATTR_FSID) && 1224 !nfs_fsid_equal(&server->fsid, &fattr->fsid) && 1225 !IS_AUTOMOUNT(inode)) 1226 server->fsid = fattr->fsid; 1227 1228 /* 1229 * Update the read time so we don't revalidate too often. 1230 */ 1231 nfsi->read_cache_jiffies = fattr->time_start; 1232 1233 save_cache_validity = nfsi->cache_validity; 1234 nfsi->cache_validity &= ~(NFS_INO_INVALID_ATTR 1235 | NFS_INO_INVALID_ATIME 1236 | NFS_INO_REVAL_FORCED 1237 | NFS_INO_REVAL_PAGECACHE); 1238 1239 /* Do atomic weak cache consistency updates */ 1240 invalid |= nfs_wcc_update_inode(inode, fattr); 1241 1242 /* More cache consistency checks */ 1243 if (fattr->valid & NFS_ATTR_FATTR_CHANGE) { 1244 if (nfsi->change_attr != fattr->change_attr) { 1245 dprintk("NFS: change_attr change on server for file %s/%ld\n", 1246 inode->i_sb->s_id, inode->i_ino); 1247 invalid |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_DATA|NFS_INO_INVALID_ACCESS|NFS_INO_INVALID_ACL; 1248 if (S_ISDIR(inode->i_mode)) 1249 nfs_force_lookup_revalidate(inode); 1250 nfsi->change_attr = fattr->change_attr; 1251 } 1252 } else if (server->caps & NFS_CAP_CHANGE_ATTR) 1253 invalid |= save_cache_validity; 1254 1255 if (fattr->valid & NFS_ATTR_FATTR_MTIME) { 1256 /* NFSv2/v3: Check if the mtime agrees */ 1257 if (!timespec_equal(&inode->i_mtime, &fattr->mtime)) { 1258 dprintk("NFS: mtime change on server for file %s/%ld\n", 1259 inode->i_sb->s_id, inode->i_ino); 1260 invalid |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_DATA; 1261 if (S_ISDIR(inode->i_mode)) 1262 nfs_force_lookup_revalidate(inode); 1263 memcpy(&inode->i_mtime, &fattr->mtime, sizeof(inode->i_mtime)); 1264 } 1265 } else if (server->caps & NFS_CAP_MTIME) 1266 invalid |= save_cache_validity & (NFS_INO_INVALID_ATTR 1267 | NFS_INO_INVALID_DATA 1268 | NFS_INO_REVAL_PAGECACHE 1269 | NFS_INO_REVAL_FORCED); 1270 1271 if (fattr->valid & NFS_ATTR_FATTR_CTIME) { 1272 /* If ctime has changed we should definitely clear access+acl caches */ 1273 if (!timespec_equal(&inode->i_ctime, &fattr->ctime)) { 1274 invalid |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_ACCESS|NFS_INO_INVALID_ACL; 1275 /* and probably clear data for a directory too as utimes can cause 1276 * havoc with our cache. 1277 */ 1278 if (S_ISDIR(inode->i_mode)) { 1279 invalid |= NFS_INO_INVALID_DATA; 1280 nfs_force_lookup_revalidate(inode); 1281 } 1282 memcpy(&inode->i_ctime, &fattr->ctime, sizeof(inode->i_ctime)); 1283 } 1284 } else if (server->caps & NFS_CAP_CTIME) 1285 invalid |= save_cache_validity & (NFS_INO_INVALID_ATTR 1286 | NFS_INO_INVALID_ACCESS 1287 | NFS_INO_INVALID_ACL 1288 | NFS_INO_REVAL_FORCED); 1289 1290 /* Check if our cached file size is stale */ 1291 if (fattr->valid & NFS_ATTR_FATTR_SIZE) { 1292 new_isize = nfs_size_to_loff_t(fattr->size); 1293 cur_isize = i_size_read(inode); 1294 if (new_isize != cur_isize) { 1295 /* Do we perhaps have any outstanding writes, or has 1296 * the file grown beyond our last write? */ 1297 if (nfsi->npages == 0 || new_isize > cur_isize) { 1298 i_size_write(inode, new_isize); 1299 invalid |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_DATA; 1300 } 1301 dprintk("NFS: isize change on server for file %s/%ld\n", 1302 inode->i_sb->s_id, inode->i_ino); 1303 } 1304 } else 1305 invalid |= save_cache_validity & (NFS_INO_INVALID_ATTR 1306 | NFS_INO_REVAL_PAGECACHE 1307 | NFS_INO_REVAL_FORCED); 1308 1309 1310 if (fattr->valid & NFS_ATTR_FATTR_ATIME) 1311 memcpy(&inode->i_atime, &fattr->atime, sizeof(inode->i_atime)); 1312 else if (server->caps & NFS_CAP_ATIME) 1313 invalid |= save_cache_validity & (NFS_INO_INVALID_ATIME 1314 | NFS_INO_REVAL_FORCED); 1315 1316 if (fattr->valid & NFS_ATTR_FATTR_MODE) { 1317 if ((inode->i_mode & S_IALLUGO) != (fattr->mode & S_IALLUGO)) { 1318 umode_t newmode = inode->i_mode & S_IFMT; 1319 newmode |= fattr->mode & S_IALLUGO; 1320 inode->i_mode = newmode; 1321 invalid |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_ACCESS|NFS_INO_INVALID_ACL; 1322 } 1323 } else if (server->caps & NFS_CAP_MODE) 1324 invalid |= save_cache_validity & (NFS_INO_INVALID_ATTR 1325 | NFS_INO_INVALID_ACCESS 1326 | NFS_INO_INVALID_ACL 1327 | NFS_INO_REVAL_FORCED); 1328 1329 if (fattr->valid & NFS_ATTR_FATTR_OWNER) { 1330 if (inode->i_uid != fattr->uid) { 1331 invalid |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_ACCESS|NFS_INO_INVALID_ACL; 1332 inode->i_uid = fattr->uid; 1333 } 1334 } else if (server->caps & NFS_CAP_OWNER) 1335 invalid |= save_cache_validity & (NFS_INO_INVALID_ATTR 1336 | NFS_INO_INVALID_ACCESS 1337 | NFS_INO_INVALID_ACL 1338 | NFS_INO_REVAL_FORCED); 1339 1340 if (fattr->valid & NFS_ATTR_FATTR_GROUP) { 1341 if (inode->i_gid != fattr->gid) { 1342 invalid |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_ACCESS|NFS_INO_INVALID_ACL; 1343 inode->i_gid = fattr->gid; 1344 } 1345 } else if (server->caps & NFS_CAP_OWNER_GROUP) 1346 invalid |= save_cache_validity & (NFS_INO_INVALID_ATTR 1347 | NFS_INO_INVALID_ACCESS 1348 | NFS_INO_INVALID_ACL 1349 | NFS_INO_REVAL_FORCED); 1350 1351 if (fattr->valid & NFS_ATTR_FATTR_NLINK) { 1352 if (inode->i_nlink != fattr->nlink) { 1353 invalid |= NFS_INO_INVALID_ATTR; 1354 if (S_ISDIR(inode->i_mode)) 1355 invalid |= NFS_INO_INVALID_DATA; 1356 inode->i_nlink = fattr->nlink; 1357 } 1358 } else if (server->caps & NFS_CAP_NLINK) 1359 invalid |= save_cache_validity & (NFS_INO_INVALID_ATTR 1360 | NFS_INO_REVAL_FORCED); 1361 1362 if (fattr->valid & NFS_ATTR_FATTR_SPACE_USED) { 1363 /* 1364 * report the blocks in 512byte units 1365 */ 1366 inode->i_blocks = nfs_calc_block_size(fattr->du.nfs3.used); 1367 } 1368 if (fattr->valid & NFS_ATTR_FATTR_BLOCKS_USED) 1369 inode->i_blocks = fattr->du.nfs2.blocks; 1370 1371 /* Update attrtimeo value if we're out of the unstable period */ 1372 if (invalid & NFS_INO_INVALID_ATTR) { 1373 nfs_inc_stats(inode, NFSIOS_ATTRINVALIDATE); 1374 nfsi->attrtimeo = NFS_MINATTRTIMEO(inode); 1375 nfsi->attrtimeo_timestamp = now; 1376 nfsi->attr_gencount = nfs_inc_attr_generation_counter(); 1377 } else { 1378 if (!time_in_range_open(now, nfsi->attrtimeo_timestamp, nfsi->attrtimeo_timestamp + nfsi->attrtimeo)) { 1379 if ((nfsi->attrtimeo <<= 1) > NFS_MAXATTRTIMEO(inode)) 1380 nfsi->attrtimeo = NFS_MAXATTRTIMEO(inode); 1381 nfsi->attrtimeo_timestamp = now; 1382 } 1383 } 1384 invalid &= ~NFS_INO_INVALID_ATTR; 1385 /* Don't invalidate the data if we were to blame */ 1386 if (!(S_ISREG(inode->i_mode) || S_ISDIR(inode->i_mode) 1387 || S_ISLNK(inode->i_mode))) 1388 invalid &= ~NFS_INO_INVALID_DATA; 1389 if (!nfs_have_delegation(inode, FMODE_READ) || 1390 (save_cache_validity & NFS_INO_REVAL_FORCED)) 1391 nfsi->cache_validity |= invalid; 1392 1393 return 0; 1394 out_changed: 1395 /* 1396 * Big trouble! The inode has become a different object. 1397 */ 1398 printk(KERN_DEBUG "%s: inode %ld mode changed, %07o to %07o\n", 1399 __func__, inode->i_ino, inode->i_mode, fattr->mode); 1400 out_err: 1401 /* 1402 * No need to worry about unhashing the dentry, as the 1403 * lookup validation will know that the inode is bad. 1404 * (But we fall through to invalidate the caches.) 1405 */ 1406 nfs_invalidate_inode(inode); 1407 return -ESTALE; 1408 1409 out_fileid: 1410 printk(KERN_ERR "NFS: server %s error: fileid changed\n" 1411 "fsid %s: expected fileid 0x%Lx, got 0x%Lx\n", 1412 NFS_SERVER(inode)->nfs_client->cl_hostname, inode->i_sb->s_id, 1413 (long long)nfsi->fileid, (long long)fattr->fileid); 1414 goto out_err; 1415 } 1416 1417 1418 #ifdef CONFIG_NFS_V4 1419 1420 /* 1421 * Clean out any remaining NFSv4 state that might be left over due 1422 * to open() calls that passed nfs_atomic_lookup, but failed to call 1423 * nfs_open(). 1424 */ 1425 void nfs4_evict_inode(struct inode *inode) 1426 { 1427 pnfs_destroy_layout(NFS_I(inode)); 1428 truncate_inode_pages(&inode->i_data, 0); 1429 end_writeback(inode); 1430 /* If we are holding a delegation, return it! */ 1431 nfs_inode_return_delegation_noreclaim(inode); 1432 /* First call standard NFS clear_inode() code */ 1433 nfs_clear_inode(inode); 1434 } 1435 #endif 1436 1437 struct inode *nfs_alloc_inode(struct super_block *sb) 1438 { 1439 struct nfs_inode *nfsi; 1440 nfsi = (struct nfs_inode *)kmem_cache_alloc(nfs_inode_cachep, GFP_KERNEL); 1441 if (!nfsi) 1442 return NULL; 1443 nfsi->flags = 0UL; 1444 nfsi->cache_validity = 0UL; 1445 #ifdef CONFIG_NFS_V3_ACL 1446 nfsi->acl_access = ERR_PTR(-EAGAIN); 1447 nfsi->acl_default = ERR_PTR(-EAGAIN); 1448 #endif 1449 #ifdef CONFIG_NFS_V4 1450 nfsi->nfs4_acl = NULL; 1451 #endif /* CONFIG_NFS_V4 */ 1452 return &nfsi->vfs_inode; 1453 } 1454 1455 static void nfs_i_callback(struct rcu_head *head) 1456 { 1457 struct inode *inode = container_of(head, struct inode, i_rcu); 1458 INIT_LIST_HEAD(&inode->i_dentry); 1459 kmem_cache_free(nfs_inode_cachep, NFS_I(inode)); 1460 } 1461 1462 void nfs_destroy_inode(struct inode *inode) 1463 { 1464 call_rcu(&inode->i_rcu, nfs_i_callback); 1465 } 1466 1467 static inline void nfs4_init_once(struct nfs_inode *nfsi) 1468 { 1469 #ifdef CONFIG_NFS_V4 1470 INIT_LIST_HEAD(&nfsi->open_states); 1471 nfsi->delegation = NULL; 1472 nfsi->delegation_state = 0; 1473 init_rwsem(&nfsi->rwsem); 1474 nfsi->layout = NULL; 1475 atomic_set(&nfsi->commits_outstanding, 0); 1476 #endif 1477 } 1478 1479 static void init_once(void *foo) 1480 { 1481 struct nfs_inode *nfsi = (struct nfs_inode *) foo; 1482 1483 inode_init_once(&nfsi->vfs_inode); 1484 INIT_LIST_HEAD(&nfsi->open_files); 1485 INIT_LIST_HEAD(&nfsi->access_cache_entry_lru); 1486 INIT_LIST_HEAD(&nfsi->access_cache_inode_lru); 1487 INIT_RADIX_TREE(&nfsi->nfs_page_tree, GFP_ATOMIC); 1488 nfsi->npages = 0; 1489 nfsi->ncommit = 0; 1490 atomic_set(&nfsi->silly_count, 1); 1491 INIT_HLIST_HEAD(&nfsi->silly_list); 1492 init_waitqueue_head(&nfsi->waitqueue); 1493 nfs4_init_once(nfsi); 1494 } 1495 1496 static int __init nfs_init_inodecache(void) 1497 { 1498 nfs_inode_cachep = kmem_cache_create("nfs_inode_cache", 1499 sizeof(struct nfs_inode), 1500 0, (SLAB_RECLAIM_ACCOUNT| 1501 SLAB_MEM_SPREAD), 1502 init_once); 1503 if (nfs_inode_cachep == NULL) 1504 return -ENOMEM; 1505 1506 return 0; 1507 } 1508 1509 static void nfs_destroy_inodecache(void) 1510 { 1511 kmem_cache_destroy(nfs_inode_cachep); 1512 } 1513 1514 struct workqueue_struct *nfsiod_workqueue; 1515 1516 /* 1517 * start up the nfsiod workqueue 1518 */ 1519 static int nfsiod_start(void) 1520 { 1521 struct workqueue_struct *wq; 1522 dprintk("RPC: creating workqueue nfsiod\n"); 1523 wq = alloc_workqueue("nfsiod", WQ_MEM_RECLAIM, 0); 1524 if (wq == NULL) 1525 return -ENOMEM; 1526 nfsiod_workqueue = wq; 1527 return 0; 1528 } 1529 1530 /* 1531 * Destroy the nfsiod workqueue 1532 */ 1533 static void nfsiod_stop(void) 1534 { 1535 struct workqueue_struct *wq; 1536 1537 wq = nfsiod_workqueue; 1538 if (wq == NULL) 1539 return; 1540 nfsiod_workqueue = NULL; 1541 destroy_workqueue(wq); 1542 } 1543 1544 /* 1545 * Initialize NFS 1546 */ 1547 static int __init init_nfs_fs(void) 1548 { 1549 int err; 1550 1551 err = nfs_idmap_init(); 1552 if (err < 0) 1553 goto out9; 1554 1555 err = nfs_dns_resolver_init(); 1556 if (err < 0) 1557 goto out8; 1558 1559 err = nfs_fscache_register(); 1560 if (err < 0) 1561 goto out7; 1562 1563 err = nfsiod_start(); 1564 if (err) 1565 goto out6; 1566 1567 err = nfs_fs_proc_init(); 1568 if (err) 1569 goto out5; 1570 1571 err = nfs_init_nfspagecache(); 1572 if (err) 1573 goto out4; 1574 1575 err = nfs_init_inodecache(); 1576 if (err) 1577 goto out3; 1578 1579 err = nfs_init_readpagecache(); 1580 if (err) 1581 goto out2; 1582 1583 err = nfs_init_writepagecache(); 1584 if (err) 1585 goto out1; 1586 1587 err = nfs_init_directcache(); 1588 if (err) 1589 goto out0; 1590 1591 #ifdef CONFIG_PROC_FS 1592 rpc_proc_register(&nfs_rpcstat); 1593 #endif 1594 if ((err = register_nfs_fs()) != 0) 1595 goto out; 1596 return 0; 1597 out: 1598 #ifdef CONFIG_PROC_FS 1599 rpc_proc_unregister("nfs"); 1600 #endif 1601 nfs_destroy_directcache(); 1602 out0: 1603 nfs_destroy_writepagecache(); 1604 out1: 1605 nfs_destroy_readpagecache(); 1606 out2: 1607 nfs_destroy_inodecache(); 1608 out3: 1609 nfs_destroy_nfspagecache(); 1610 out4: 1611 nfs_fs_proc_exit(); 1612 out5: 1613 nfsiod_stop(); 1614 out6: 1615 nfs_fscache_unregister(); 1616 out7: 1617 nfs_dns_resolver_destroy(); 1618 out8: 1619 nfs_idmap_quit(); 1620 out9: 1621 return err; 1622 } 1623 1624 static void __exit exit_nfs_fs(void) 1625 { 1626 nfs_destroy_directcache(); 1627 nfs_destroy_writepagecache(); 1628 nfs_destroy_readpagecache(); 1629 nfs_destroy_inodecache(); 1630 nfs_destroy_nfspagecache(); 1631 nfs_fscache_unregister(); 1632 nfs_dns_resolver_destroy(); 1633 nfs_idmap_quit(); 1634 #ifdef CONFIG_PROC_FS 1635 rpc_proc_unregister("nfs"); 1636 #endif 1637 nfs_cleanup_cb_ident_idr(); 1638 unregister_nfs_fs(); 1639 nfs_fs_proc_exit(); 1640 nfsiod_stop(); 1641 } 1642 1643 /* Not quite true; I just maintain it */ 1644 MODULE_AUTHOR("Olaf Kirch <okir@monad.swb.de>"); 1645 MODULE_LICENSE("GPL"); 1646 module_param(enable_ino64, bool, 0644); 1647 1648 module_init(init_nfs_fs) 1649 module_exit(exit_nfs_fs) 1650