1 /* 2 * linux/fs/nfs/inode.c 3 * 4 * Copyright (C) 1992 Rick Sladkey 5 * 6 * nfs inode and superblock handling functions 7 * 8 * Modularised by Alan Cox <Alan.Cox@linux.org>, while hacking some 9 * experimental NFS changes. Modularisation taken straight from SYS5 fs. 10 * 11 * Change to nfs_read_super() to permit NFS mounts to multi-homed hosts. 12 * J.S.Peatfield@damtp.cam.ac.uk 13 * 14 */ 15 16 #include <linux/config.h> 17 #include <linux/module.h> 18 #include <linux/init.h> 19 20 #include <linux/time.h> 21 #include <linux/kernel.h> 22 #include <linux/mm.h> 23 #include <linux/string.h> 24 #include <linux/stat.h> 25 #include <linux/errno.h> 26 #include <linux/unistd.h> 27 #include <linux/sunrpc/clnt.h> 28 #include <linux/sunrpc/stats.h> 29 #include <linux/nfs_fs.h> 30 #include <linux/nfs_mount.h> 31 #include <linux/nfs4_mount.h> 32 #include <linux/lockd/bind.h> 33 #include <linux/smp_lock.h> 34 #include <linux/seq_file.h> 35 #include <linux/mount.h> 36 #include <linux/nfs_idmap.h> 37 #include <linux/vfs.h> 38 39 #include <asm/system.h> 40 #include <asm/uaccess.h> 41 42 #include "nfs4_fs.h" 43 #include "delegation.h" 44 45 #define NFSDBG_FACILITY NFSDBG_VFS 46 #define NFS_PARANOIA 1 47 48 /* Maximum number of readahead requests 49 * FIXME: this should really be a sysctl so that users may tune it to suit 50 * their needs. People that do NFS over a slow network, might for 51 * instance want to reduce it to something closer to 1 for improved 52 * interactive response. 53 */ 54 #define NFS_MAX_READAHEAD (RPC_DEF_SLOT_TABLE - 1) 55 56 static void nfs_invalidate_inode(struct inode *); 57 static int nfs_update_inode(struct inode *, struct nfs_fattr *); 58 59 static struct inode *nfs_alloc_inode(struct super_block *sb); 60 static void nfs_destroy_inode(struct inode *); 61 static int nfs_write_inode(struct inode *,int); 62 static void nfs_delete_inode(struct inode *); 63 static void nfs_clear_inode(struct inode *); 64 static void nfs_umount_begin(struct super_block *); 65 static int nfs_statfs(struct super_block *, struct kstatfs *); 66 static int nfs_show_options(struct seq_file *, struct vfsmount *); 67 static void nfs_zap_acl_cache(struct inode *); 68 69 static struct rpc_program nfs_program; 70 71 static struct super_operations nfs_sops = { 72 .alloc_inode = nfs_alloc_inode, 73 .destroy_inode = nfs_destroy_inode, 74 .write_inode = nfs_write_inode, 75 .delete_inode = nfs_delete_inode, 76 .statfs = nfs_statfs, 77 .clear_inode = nfs_clear_inode, 78 .umount_begin = nfs_umount_begin, 79 .show_options = nfs_show_options, 80 }; 81 82 /* 83 * RPC cruft for NFS 84 */ 85 static struct rpc_stat nfs_rpcstat = { 86 .program = &nfs_program 87 }; 88 static struct rpc_version * nfs_version[] = { 89 NULL, 90 NULL, 91 &nfs_version2, 92 #if defined(CONFIG_NFS_V3) 93 &nfs_version3, 94 #elif defined(CONFIG_NFS_V4) 95 NULL, 96 #endif 97 #if defined(CONFIG_NFS_V4) 98 &nfs_version4, 99 #endif 100 }; 101 102 static struct rpc_program nfs_program = { 103 .name = "nfs", 104 .number = NFS_PROGRAM, 105 .nrvers = sizeof(nfs_version) / sizeof(nfs_version[0]), 106 .version = nfs_version, 107 .stats = &nfs_rpcstat, 108 .pipe_dir_name = "/nfs", 109 }; 110 111 #ifdef CONFIG_NFS_V3_ACL 112 static struct rpc_stat nfsacl_rpcstat = { &nfsacl_program }; 113 static struct rpc_version * nfsacl_version[] = { 114 [3] = &nfsacl_version3, 115 }; 116 117 struct rpc_program nfsacl_program = { 118 .name = "nfsacl", 119 .number = NFS_ACL_PROGRAM, 120 .nrvers = sizeof(nfsacl_version) / sizeof(nfsacl_version[0]), 121 .version = nfsacl_version, 122 .stats = &nfsacl_rpcstat, 123 }; 124 #endif /* CONFIG_NFS_V3_ACL */ 125 126 static inline unsigned long 127 nfs_fattr_to_ino_t(struct nfs_fattr *fattr) 128 { 129 return nfs_fileid_to_ino_t(fattr->fileid); 130 } 131 132 static int 133 nfs_write_inode(struct inode *inode, int sync) 134 { 135 int flags = sync ? FLUSH_WAIT : 0; 136 int ret; 137 138 ret = nfs_commit_inode(inode, flags); 139 if (ret < 0) 140 return ret; 141 return 0; 142 } 143 144 static void 145 nfs_delete_inode(struct inode * inode) 146 { 147 dprintk("NFS: delete_inode(%s/%ld)\n", inode->i_sb->s_id, inode->i_ino); 148 149 truncate_inode_pages(&inode->i_data, 0); 150 151 nfs_wb_all(inode); 152 /* 153 * The following should never happen... 154 */ 155 if (nfs_have_writebacks(inode)) { 156 printk(KERN_ERR "nfs_delete_inode: inode %ld has pending RPC requests\n", inode->i_ino); 157 } 158 159 clear_inode(inode); 160 } 161 162 static void 163 nfs_clear_inode(struct inode *inode) 164 { 165 struct nfs_inode *nfsi = NFS_I(inode); 166 struct rpc_cred *cred; 167 168 nfs_wb_all(inode); 169 BUG_ON (!list_empty(&nfsi->open_files)); 170 nfs_zap_acl_cache(inode); 171 cred = nfsi->cache_access.cred; 172 if (cred) 173 put_rpccred(cred); 174 BUG_ON(atomic_read(&nfsi->data_updates) != 0); 175 } 176 177 void 178 nfs_umount_begin(struct super_block *sb) 179 { 180 struct rpc_clnt *rpc = NFS_SB(sb)->client; 181 182 /* -EIO all pending I/O */ 183 if (!IS_ERR(rpc)) 184 rpc_killall_tasks(rpc); 185 rpc = NFS_SB(sb)->client_acl; 186 if (!IS_ERR(rpc)) 187 rpc_killall_tasks(rpc); 188 } 189 190 191 static inline unsigned long 192 nfs_block_bits(unsigned long bsize, unsigned char *nrbitsp) 193 { 194 /* make sure blocksize is a power of two */ 195 if ((bsize & (bsize - 1)) || nrbitsp) { 196 unsigned char nrbits; 197 198 for (nrbits = 31; nrbits && !(bsize & (1 << nrbits)); nrbits--) 199 ; 200 bsize = 1 << nrbits; 201 if (nrbitsp) 202 *nrbitsp = nrbits; 203 } 204 205 return bsize; 206 } 207 208 /* 209 * Calculate the number of 512byte blocks used. 210 */ 211 static inline unsigned long 212 nfs_calc_block_size(u64 tsize) 213 { 214 loff_t used = (tsize + 511) >> 9; 215 return (used > ULONG_MAX) ? ULONG_MAX : used; 216 } 217 218 /* 219 * Compute and set NFS server blocksize 220 */ 221 static inline unsigned long 222 nfs_block_size(unsigned long bsize, unsigned char *nrbitsp) 223 { 224 if (bsize < 1024) 225 bsize = NFS_DEF_FILE_IO_BUFFER_SIZE; 226 else if (bsize >= NFS_MAX_FILE_IO_BUFFER_SIZE) 227 bsize = NFS_MAX_FILE_IO_BUFFER_SIZE; 228 229 return nfs_block_bits(bsize, nrbitsp); 230 } 231 232 /* 233 * Obtain the root inode of the file system. 234 */ 235 static struct inode * 236 nfs_get_root(struct super_block *sb, struct nfs_fh *rootfh, struct nfs_fsinfo *fsinfo) 237 { 238 struct nfs_server *server = NFS_SB(sb); 239 struct inode *rooti; 240 int error; 241 242 error = server->rpc_ops->getroot(server, rootfh, fsinfo); 243 if (error < 0) { 244 dprintk("nfs_get_root: getattr error = %d\n", -error); 245 return ERR_PTR(error); 246 } 247 248 rooti = nfs_fhget(sb, rootfh, fsinfo->fattr); 249 if (!rooti) 250 return ERR_PTR(-ENOMEM); 251 return rooti; 252 } 253 254 /* 255 * Do NFS version-independent mount processing, and sanity checking 256 */ 257 static int 258 nfs_sb_init(struct super_block *sb, rpc_authflavor_t authflavor) 259 { 260 struct nfs_server *server; 261 struct inode *root_inode; 262 struct nfs_fattr fattr; 263 struct nfs_fsinfo fsinfo = { 264 .fattr = &fattr, 265 }; 266 struct nfs_pathconf pathinfo = { 267 .fattr = &fattr, 268 }; 269 int no_root_error = 0; 270 unsigned long max_rpc_payload; 271 272 /* We probably want something more informative here */ 273 snprintf(sb->s_id, sizeof(sb->s_id), "%x:%x", MAJOR(sb->s_dev), MINOR(sb->s_dev)); 274 275 server = NFS_SB(sb); 276 277 sb->s_magic = NFS_SUPER_MAGIC; 278 279 root_inode = nfs_get_root(sb, &server->fh, &fsinfo); 280 /* Did getting the root inode fail? */ 281 if (IS_ERR(root_inode)) { 282 no_root_error = PTR_ERR(root_inode); 283 goto out_no_root; 284 } 285 sb->s_root = d_alloc_root(root_inode); 286 if (!sb->s_root) { 287 no_root_error = -ENOMEM; 288 goto out_no_root; 289 } 290 sb->s_root->d_op = server->rpc_ops->dentry_ops; 291 292 /* Get some general file system info */ 293 if (server->namelen == 0 && 294 server->rpc_ops->pathconf(server, &server->fh, &pathinfo) >= 0) 295 server->namelen = pathinfo.max_namelen; 296 /* Work out a lot of parameters */ 297 if (server->rsize == 0) 298 server->rsize = nfs_block_size(fsinfo.rtpref, NULL); 299 if (server->wsize == 0) 300 server->wsize = nfs_block_size(fsinfo.wtpref, NULL); 301 302 if (fsinfo.rtmax >= 512 && server->rsize > fsinfo.rtmax) 303 server->rsize = nfs_block_size(fsinfo.rtmax, NULL); 304 if (fsinfo.wtmax >= 512 && server->wsize > fsinfo.wtmax) 305 server->wsize = nfs_block_size(fsinfo.wtmax, NULL); 306 307 max_rpc_payload = nfs_block_size(rpc_max_payload(server->client), NULL); 308 if (server->rsize > max_rpc_payload) 309 server->rsize = max_rpc_payload; 310 if (server->wsize > max_rpc_payload) 311 server->wsize = max_rpc_payload; 312 313 server->rpages = (server->rsize + PAGE_CACHE_SIZE - 1) >> PAGE_CACHE_SHIFT; 314 if (server->rpages > NFS_READ_MAXIOV) { 315 server->rpages = NFS_READ_MAXIOV; 316 server->rsize = server->rpages << PAGE_CACHE_SHIFT; 317 } 318 319 server->wpages = (server->wsize + PAGE_CACHE_SIZE - 1) >> PAGE_CACHE_SHIFT; 320 if (server->wpages > NFS_WRITE_MAXIOV) { 321 server->wpages = NFS_WRITE_MAXIOV; 322 server->wsize = server->wpages << PAGE_CACHE_SHIFT; 323 } 324 325 if (sb->s_blocksize == 0) 326 sb->s_blocksize = nfs_block_bits(server->wsize, 327 &sb->s_blocksize_bits); 328 server->wtmult = nfs_block_bits(fsinfo.wtmult, NULL); 329 330 server->dtsize = nfs_block_size(fsinfo.dtpref, NULL); 331 if (server->dtsize > PAGE_CACHE_SIZE) 332 server->dtsize = PAGE_CACHE_SIZE; 333 if (server->dtsize > server->rsize) 334 server->dtsize = server->rsize; 335 336 if (server->flags & NFS_MOUNT_NOAC) { 337 server->acregmin = server->acregmax = 0; 338 server->acdirmin = server->acdirmax = 0; 339 sb->s_flags |= MS_SYNCHRONOUS; 340 } 341 server->backing_dev_info.ra_pages = server->rpages * NFS_MAX_READAHEAD; 342 343 sb->s_maxbytes = fsinfo.maxfilesize; 344 if (sb->s_maxbytes > MAX_LFS_FILESIZE) 345 sb->s_maxbytes = MAX_LFS_FILESIZE; 346 347 server->client->cl_intr = (server->flags & NFS_MOUNT_INTR) ? 1 : 0; 348 server->client->cl_softrtry = (server->flags & NFS_MOUNT_SOFT) ? 1 : 0; 349 350 /* We're airborne Set socket buffersize */ 351 rpc_setbufsize(server->client, server->wsize + 100, server->rsize + 100); 352 return 0; 353 /* Yargs. It didn't work out. */ 354 out_no_root: 355 dprintk("nfs_sb_init: get root inode failed: errno %d\n", -no_root_error); 356 if (!IS_ERR(root_inode)) 357 iput(root_inode); 358 return no_root_error; 359 } 360 361 static void nfs_init_timeout_values(struct rpc_timeout *to, int proto, unsigned int timeo, unsigned int retrans) 362 { 363 to->to_initval = timeo * HZ / 10; 364 to->to_retries = retrans; 365 if (!to->to_retries) 366 to->to_retries = 2; 367 368 switch (proto) { 369 case IPPROTO_TCP: 370 if (!to->to_initval) 371 to->to_initval = 60 * HZ; 372 if (to->to_initval > NFS_MAX_TCP_TIMEOUT) 373 to->to_initval = NFS_MAX_TCP_TIMEOUT; 374 to->to_increment = to->to_initval; 375 to->to_maxval = to->to_initval + (to->to_increment * to->to_retries); 376 to->to_exponential = 0; 377 break; 378 case IPPROTO_UDP: 379 default: 380 if (!to->to_initval) 381 to->to_initval = 11 * HZ / 10; 382 if (to->to_initval > NFS_MAX_UDP_TIMEOUT) 383 to->to_initval = NFS_MAX_UDP_TIMEOUT; 384 to->to_maxval = NFS_MAX_UDP_TIMEOUT; 385 to->to_exponential = 1; 386 break; 387 } 388 } 389 390 /* 391 * Create an RPC client handle. 392 */ 393 static struct rpc_clnt * 394 nfs_create_client(struct nfs_server *server, const struct nfs_mount_data *data) 395 { 396 struct rpc_timeout timeparms; 397 struct rpc_xprt *xprt = NULL; 398 struct rpc_clnt *clnt = NULL; 399 int proto = (data->flags & NFS_MOUNT_TCP) ? IPPROTO_TCP : IPPROTO_UDP; 400 401 nfs_init_timeout_values(&timeparms, proto, data->timeo, data->retrans); 402 403 /* create transport and client */ 404 xprt = xprt_create_proto(proto, &server->addr, &timeparms); 405 if (IS_ERR(xprt)) { 406 dprintk("%s: cannot create RPC transport. Error = %ld\n", 407 __FUNCTION__, PTR_ERR(xprt)); 408 return (struct rpc_clnt *)xprt; 409 } 410 clnt = rpc_create_client(xprt, server->hostname, &nfs_program, 411 server->rpc_ops->version, data->pseudoflavor); 412 if (IS_ERR(clnt)) { 413 dprintk("%s: cannot create RPC client. Error = %ld\n", 414 __FUNCTION__, PTR_ERR(xprt)); 415 goto out_fail; 416 } 417 418 clnt->cl_intr = 1; 419 clnt->cl_softrtry = 1; 420 clnt->cl_chatty = 1; 421 422 return clnt; 423 424 out_fail: 425 return clnt; 426 } 427 428 /* 429 * The way this works is that the mount process passes a structure 430 * in the data argument which contains the server's IP address 431 * and the root file handle obtained from the server's mount 432 * daemon. We stash these away in the private superblock fields. 433 */ 434 static int 435 nfs_fill_super(struct super_block *sb, struct nfs_mount_data *data, int silent) 436 { 437 struct nfs_server *server; 438 rpc_authflavor_t authflavor; 439 440 server = NFS_SB(sb); 441 sb->s_blocksize_bits = 0; 442 sb->s_blocksize = 0; 443 if (data->bsize) 444 sb->s_blocksize = nfs_block_size(data->bsize, &sb->s_blocksize_bits); 445 if (data->rsize) 446 server->rsize = nfs_block_size(data->rsize, NULL); 447 if (data->wsize) 448 server->wsize = nfs_block_size(data->wsize, NULL); 449 server->flags = data->flags & NFS_MOUNT_FLAGMASK; 450 451 server->acregmin = data->acregmin*HZ; 452 server->acregmax = data->acregmax*HZ; 453 server->acdirmin = data->acdirmin*HZ; 454 server->acdirmax = data->acdirmax*HZ; 455 456 /* Start lockd here, before we might error out */ 457 if (!(server->flags & NFS_MOUNT_NONLM)) 458 lockd_up(); 459 460 server->namelen = data->namlen; 461 server->hostname = kmalloc(strlen(data->hostname) + 1, GFP_KERNEL); 462 if (!server->hostname) 463 return -ENOMEM; 464 strcpy(server->hostname, data->hostname); 465 466 /* Check NFS protocol revision and initialize RPC op vector 467 * and file handle pool. */ 468 #ifdef CONFIG_NFS_V3 469 if (server->flags & NFS_MOUNT_VER3) { 470 server->rpc_ops = &nfs_v3_clientops; 471 server->caps |= NFS_CAP_READDIRPLUS; 472 } else { 473 server->rpc_ops = &nfs_v2_clientops; 474 } 475 #else 476 server->rpc_ops = &nfs_v2_clientops; 477 #endif 478 479 /* Fill in pseudoflavor for mount version < 5 */ 480 if (!(data->flags & NFS_MOUNT_SECFLAVOUR)) 481 data->pseudoflavor = RPC_AUTH_UNIX; 482 authflavor = data->pseudoflavor; /* save for sb_init() */ 483 /* XXX maybe we want to add a server->pseudoflavor field */ 484 485 /* Create RPC client handles */ 486 server->client = nfs_create_client(server, data); 487 if (IS_ERR(server->client)) 488 return PTR_ERR(server->client); 489 /* RFC 2623, sec 2.3.2 */ 490 if (authflavor != RPC_AUTH_UNIX) { 491 struct rpc_auth *auth; 492 493 server->client_sys = rpc_clone_client(server->client); 494 if (IS_ERR(server->client_sys)) 495 return PTR_ERR(server->client_sys); 496 auth = rpcauth_create(RPC_AUTH_UNIX, server->client_sys); 497 if (IS_ERR(auth)) 498 return PTR_ERR(auth); 499 } else { 500 atomic_inc(&server->client->cl_count); 501 server->client_sys = server->client; 502 } 503 if (server->flags & NFS_MOUNT_VER3) { 504 #ifdef CONFIG_NFS_V3_ACL 505 if (!(server->flags & NFS_MOUNT_NOACL)) { 506 server->client_acl = rpc_bind_new_program(server->client, &nfsacl_program, 3); 507 /* No errors! Assume that Sun nfsacls are supported */ 508 if (!IS_ERR(server->client_acl)) 509 server->caps |= NFS_CAP_ACLS; 510 } 511 #else 512 server->flags &= ~NFS_MOUNT_NOACL; 513 #endif /* CONFIG_NFS_V3_ACL */ 514 /* 515 * The VFS shouldn't apply the umask to mode bits. We will 516 * do so ourselves when necessary. 517 */ 518 sb->s_flags |= MS_POSIXACL; 519 if (server->namelen == 0 || server->namelen > NFS3_MAXNAMLEN) 520 server->namelen = NFS3_MAXNAMLEN; 521 sb->s_time_gran = 1; 522 } else { 523 if (server->namelen == 0 || server->namelen > NFS2_MAXNAMLEN) 524 server->namelen = NFS2_MAXNAMLEN; 525 } 526 527 sb->s_op = &nfs_sops; 528 return nfs_sb_init(sb, authflavor); 529 } 530 531 static int 532 nfs_statfs(struct super_block *sb, struct kstatfs *buf) 533 { 534 struct nfs_server *server = NFS_SB(sb); 535 unsigned char blockbits; 536 unsigned long blockres; 537 struct nfs_fh *rootfh = NFS_FH(sb->s_root->d_inode); 538 struct nfs_fattr fattr; 539 struct nfs_fsstat res = { 540 .fattr = &fattr, 541 }; 542 int error; 543 544 lock_kernel(); 545 546 error = server->rpc_ops->statfs(server, rootfh, &res); 547 buf->f_type = NFS_SUPER_MAGIC; 548 if (error < 0) 549 goto out_err; 550 551 /* 552 * Current versions of glibc do not correctly handle the 553 * case where f_frsize != f_bsize. Eventually we want to 554 * report the value of wtmult in this field. 555 */ 556 buf->f_frsize = sb->s_blocksize; 557 558 /* 559 * On most *nix systems, f_blocks, f_bfree, and f_bavail 560 * are reported in units of f_frsize. Linux hasn't had 561 * an f_frsize field in its statfs struct until recently, 562 * thus historically Linux's sys_statfs reports these 563 * fields in units of f_bsize. 564 */ 565 buf->f_bsize = sb->s_blocksize; 566 blockbits = sb->s_blocksize_bits; 567 blockres = (1 << blockbits) - 1; 568 buf->f_blocks = (res.tbytes + blockres) >> blockbits; 569 buf->f_bfree = (res.fbytes + blockres) >> blockbits; 570 buf->f_bavail = (res.abytes + blockres) >> blockbits; 571 572 buf->f_files = res.tfiles; 573 buf->f_ffree = res.afiles; 574 575 buf->f_namelen = server->namelen; 576 out: 577 unlock_kernel(); 578 579 return 0; 580 581 out_err: 582 printk(KERN_WARNING "nfs_statfs: statfs error = %d\n", -error); 583 buf->f_bsize = buf->f_blocks = buf->f_bfree = buf->f_bavail = -1; 584 goto out; 585 586 } 587 588 static int nfs_show_options(struct seq_file *m, struct vfsmount *mnt) 589 { 590 static struct proc_nfs_info { 591 int flag; 592 char *str; 593 char *nostr; 594 } nfs_info[] = { 595 { NFS_MOUNT_SOFT, ",soft", ",hard" }, 596 { NFS_MOUNT_INTR, ",intr", "" }, 597 { NFS_MOUNT_POSIX, ",posix", "" }, 598 { NFS_MOUNT_NOCTO, ",nocto", "" }, 599 { NFS_MOUNT_NOAC, ",noac", "" }, 600 { NFS_MOUNT_NONLM, ",nolock", ",lock" }, 601 { NFS_MOUNT_NOACL, ",noacl", "" }, 602 { 0, NULL, NULL } 603 }; 604 struct proc_nfs_info *nfs_infop; 605 struct nfs_server *nfss = NFS_SB(mnt->mnt_sb); 606 char buf[12]; 607 char *proto; 608 609 seq_printf(m, ",v%d", nfss->rpc_ops->version); 610 seq_printf(m, ",rsize=%d", nfss->rsize); 611 seq_printf(m, ",wsize=%d", nfss->wsize); 612 if (nfss->acregmin != 3*HZ) 613 seq_printf(m, ",acregmin=%d", nfss->acregmin/HZ); 614 if (nfss->acregmax != 60*HZ) 615 seq_printf(m, ",acregmax=%d", nfss->acregmax/HZ); 616 if (nfss->acdirmin != 30*HZ) 617 seq_printf(m, ",acdirmin=%d", nfss->acdirmin/HZ); 618 if (nfss->acdirmax != 60*HZ) 619 seq_printf(m, ",acdirmax=%d", nfss->acdirmax/HZ); 620 for (nfs_infop = nfs_info; nfs_infop->flag; nfs_infop++) { 621 if (nfss->flags & nfs_infop->flag) 622 seq_puts(m, nfs_infop->str); 623 else 624 seq_puts(m, nfs_infop->nostr); 625 } 626 switch (nfss->client->cl_xprt->prot) { 627 case IPPROTO_TCP: 628 proto = "tcp"; 629 break; 630 case IPPROTO_UDP: 631 proto = "udp"; 632 break; 633 default: 634 snprintf(buf, sizeof(buf), "%u", nfss->client->cl_xprt->prot); 635 proto = buf; 636 } 637 seq_printf(m, ",proto=%s", proto); 638 seq_puts(m, ",addr="); 639 seq_escape(m, nfss->hostname, " \t\n\\"); 640 return 0; 641 } 642 643 /* 644 * Invalidate the local caches 645 */ 646 static void nfs_zap_caches_locked(struct inode *inode) 647 { 648 struct nfs_inode *nfsi = NFS_I(inode); 649 int mode = inode->i_mode; 650 651 NFS_ATTRTIMEO(inode) = NFS_MINATTRTIMEO(inode); 652 NFS_ATTRTIMEO_UPDATE(inode) = jiffies; 653 654 memset(NFS_COOKIEVERF(inode), 0, sizeof(NFS_COOKIEVERF(inode))); 655 if (S_ISREG(mode) || S_ISDIR(mode) || S_ISLNK(mode)) 656 nfsi->cache_validity |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_DATA|NFS_INO_INVALID_ACCESS|NFS_INO_INVALID_ACL|NFS_INO_REVAL_PAGECACHE; 657 else 658 nfsi->cache_validity |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_ACCESS|NFS_INO_INVALID_ACL|NFS_INO_REVAL_PAGECACHE; 659 } 660 661 void nfs_zap_caches(struct inode *inode) 662 { 663 spin_lock(&inode->i_lock); 664 nfs_zap_caches_locked(inode); 665 spin_unlock(&inode->i_lock); 666 } 667 668 static void nfs_zap_acl_cache(struct inode *inode) 669 { 670 void (*clear_acl_cache)(struct inode *); 671 672 clear_acl_cache = NFS_PROTO(inode)->clear_acl_cache; 673 if (clear_acl_cache != NULL) 674 clear_acl_cache(inode); 675 spin_lock(&inode->i_lock); 676 NFS_I(inode)->cache_validity &= ~NFS_INO_INVALID_ACL; 677 spin_unlock(&inode->i_lock); 678 } 679 680 /* 681 * Invalidate, but do not unhash, the inode. 682 * NB: must be called with inode->i_lock held! 683 */ 684 static void nfs_invalidate_inode(struct inode *inode) 685 { 686 set_bit(NFS_INO_STALE, &NFS_FLAGS(inode)); 687 nfs_zap_caches_locked(inode); 688 } 689 690 struct nfs_find_desc { 691 struct nfs_fh *fh; 692 struct nfs_fattr *fattr; 693 }; 694 695 /* 696 * In NFSv3 we can have 64bit inode numbers. In order to support 697 * this, and re-exported directories (also seen in NFSv2) 698 * we are forced to allow 2 different inodes to have the same 699 * i_ino. 700 */ 701 static int 702 nfs_find_actor(struct inode *inode, void *opaque) 703 { 704 struct nfs_find_desc *desc = (struct nfs_find_desc *)opaque; 705 struct nfs_fh *fh = desc->fh; 706 struct nfs_fattr *fattr = desc->fattr; 707 708 if (NFS_FILEID(inode) != fattr->fileid) 709 return 0; 710 if (nfs_compare_fh(NFS_FH(inode), fh)) 711 return 0; 712 if (is_bad_inode(inode) || NFS_STALE(inode)) 713 return 0; 714 return 1; 715 } 716 717 static int 718 nfs_init_locked(struct inode *inode, void *opaque) 719 { 720 struct nfs_find_desc *desc = (struct nfs_find_desc *)opaque; 721 struct nfs_fattr *fattr = desc->fattr; 722 723 NFS_FILEID(inode) = fattr->fileid; 724 nfs_copy_fh(NFS_FH(inode), desc->fh); 725 return 0; 726 } 727 728 /* Don't use READDIRPLUS on directories that we believe are too large */ 729 #define NFS_LIMIT_READDIRPLUS (8*PAGE_SIZE) 730 731 /* 732 * This is our front-end to iget that looks up inodes by file handle 733 * instead of inode number. 734 */ 735 struct inode * 736 nfs_fhget(struct super_block *sb, struct nfs_fh *fh, struct nfs_fattr *fattr) 737 { 738 struct nfs_find_desc desc = { 739 .fh = fh, 740 .fattr = fattr 741 }; 742 struct inode *inode = NULL; 743 unsigned long hash; 744 745 if ((fattr->valid & NFS_ATTR_FATTR) == 0) 746 goto out_no_inode; 747 748 if (!fattr->nlink) { 749 printk("NFS: Buggy server - nlink == 0!\n"); 750 goto out_no_inode; 751 } 752 753 hash = nfs_fattr_to_ino_t(fattr); 754 755 if (!(inode = iget5_locked(sb, hash, nfs_find_actor, nfs_init_locked, &desc))) 756 goto out_no_inode; 757 758 if (inode->i_state & I_NEW) { 759 struct nfs_inode *nfsi = NFS_I(inode); 760 761 /* We set i_ino for the few things that still rely on it, 762 * such as stat(2) */ 763 inode->i_ino = hash; 764 765 /* We can't support update_atime(), since the server will reset it */ 766 inode->i_flags |= S_NOATIME|S_NOCMTIME; 767 inode->i_mode = fattr->mode; 768 /* Why so? Because we want revalidate for devices/FIFOs, and 769 * that's precisely what we have in nfs_file_inode_operations. 770 */ 771 inode->i_op = NFS_SB(sb)->rpc_ops->file_inode_ops; 772 if (S_ISREG(inode->i_mode)) { 773 inode->i_fop = &nfs_file_operations; 774 inode->i_data.a_ops = &nfs_file_aops; 775 inode->i_data.backing_dev_info = &NFS_SB(sb)->backing_dev_info; 776 } else if (S_ISDIR(inode->i_mode)) { 777 inode->i_op = NFS_SB(sb)->rpc_ops->dir_inode_ops; 778 inode->i_fop = &nfs_dir_operations; 779 if (nfs_server_capable(inode, NFS_CAP_READDIRPLUS) 780 && fattr->size <= NFS_LIMIT_READDIRPLUS) 781 set_bit(NFS_INO_ADVISE_RDPLUS, &NFS_FLAGS(inode)); 782 } else if (S_ISLNK(inode->i_mode)) 783 inode->i_op = &nfs_symlink_inode_operations; 784 else 785 init_special_inode(inode, inode->i_mode, fattr->rdev); 786 787 nfsi->read_cache_jiffies = fattr->time_start; 788 nfsi->last_updated = jiffies; 789 inode->i_atime = fattr->atime; 790 inode->i_mtime = fattr->mtime; 791 inode->i_ctime = fattr->ctime; 792 if (fattr->valid & NFS_ATTR_FATTR_V4) 793 nfsi->change_attr = fattr->change_attr; 794 inode->i_size = nfs_size_to_loff_t(fattr->size); 795 inode->i_nlink = fattr->nlink; 796 inode->i_uid = fattr->uid; 797 inode->i_gid = fattr->gid; 798 if (fattr->valid & (NFS_ATTR_FATTR_V3 | NFS_ATTR_FATTR_V4)) { 799 /* 800 * report the blocks in 512byte units 801 */ 802 inode->i_blocks = nfs_calc_block_size(fattr->du.nfs3.used); 803 inode->i_blksize = inode->i_sb->s_blocksize; 804 } else { 805 inode->i_blocks = fattr->du.nfs2.blocks; 806 inode->i_blksize = fattr->du.nfs2.blocksize; 807 } 808 nfsi->attrtimeo = NFS_MINATTRTIMEO(inode); 809 nfsi->attrtimeo_timestamp = jiffies; 810 memset(nfsi->cookieverf, 0, sizeof(nfsi->cookieverf)); 811 nfsi->cache_access.cred = NULL; 812 813 unlock_new_inode(inode); 814 } else 815 nfs_refresh_inode(inode, fattr); 816 dprintk("NFS: nfs_fhget(%s/%Ld ct=%d)\n", 817 inode->i_sb->s_id, 818 (long long)NFS_FILEID(inode), 819 atomic_read(&inode->i_count)); 820 821 out: 822 return inode; 823 824 out_no_inode: 825 printk("nfs_fhget: iget failed\n"); 826 goto out; 827 } 828 829 #define NFS_VALID_ATTRS (ATTR_MODE|ATTR_UID|ATTR_GID|ATTR_SIZE|ATTR_ATIME|ATTR_ATIME_SET|ATTR_MTIME|ATTR_MTIME_SET) 830 831 int 832 nfs_setattr(struct dentry *dentry, struct iattr *attr) 833 { 834 struct inode *inode = dentry->d_inode; 835 struct nfs_fattr fattr; 836 int error; 837 838 if (attr->ia_valid & ATTR_SIZE) { 839 if (!S_ISREG(inode->i_mode) || attr->ia_size == i_size_read(inode)) 840 attr->ia_valid &= ~ATTR_SIZE; 841 } 842 843 /* Optimization: if the end result is no change, don't RPC */ 844 attr->ia_valid &= NFS_VALID_ATTRS; 845 if (attr->ia_valid == 0) 846 return 0; 847 848 lock_kernel(); 849 nfs_begin_data_update(inode); 850 /* Write all dirty data if we're changing file permissions or size */ 851 if ((attr->ia_valid & (ATTR_MODE|ATTR_UID|ATTR_GID|ATTR_SIZE)) != 0) { 852 if (filemap_fdatawrite(inode->i_mapping) == 0) 853 filemap_fdatawait(inode->i_mapping); 854 nfs_wb_all(inode); 855 } 856 /* 857 * Return any delegations if we're going to change ACLs 858 */ 859 if ((attr->ia_valid & (ATTR_MODE|ATTR_UID|ATTR_GID)) != 0) 860 nfs_inode_return_delegation(inode); 861 error = NFS_PROTO(inode)->setattr(dentry, &fattr, attr); 862 if (error == 0) 863 nfs_refresh_inode(inode, &fattr); 864 nfs_end_data_update(inode); 865 unlock_kernel(); 866 return error; 867 } 868 869 /** 870 * nfs_setattr_update_inode - Update inode metadata after a setattr call. 871 * @inode: pointer to struct inode 872 * @attr: pointer to struct iattr 873 * 874 * Note: we do this in the *proc.c in order to ensure that 875 * it works for things like exclusive creates too. 876 */ 877 void nfs_setattr_update_inode(struct inode *inode, struct iattr *attr) 878 { 879 if ((attr->ia_valid & (ATTR_MODE|ATTR_UID|ATTR_GID)) != 0) { 880 if ((attr->ia_valid & ATTR_MODE) != 0) { 881 int mode = attr->ia_mode & S_IALLUGO; 882 mode |= inode->i_mode & ~S_IALLUGO; 883 inode->i_mode = mode; 884 } 885 if ((attr->ia_valid & ATTR_UID) != 0) 886 inode->i_uid = attr->ia_uid; 887 if ((attr->ia_valid & ATTR_GID) != 0) 888 inode->i_gid = attr->ia_gid; 889 spin_lock(&inode->i_lock); 890 NFS_I(inode)->cache_validity |= NFS_INO_INVALID_ACCESS|NFS_INO_INVALID_ACL; 891 spin_unlock(&inode->i_lock); 892 } 893 if ((attr->ia_valid & ATTR_SIZE) != 0) { 894 inode->i_size = attr->ia_size; 895 vmtruncate(inode, attr->ia_size); 896 } 897 } 898 899 static int nfs_wait_schedule(void *word) 900 { 901 if (signal_pending(current)) 902 return -ERESTARTSYS; 903 schedule(); 904 return 0; 905 } 906 907 /* 908 * Wait for the inode to get unlocked. 909 */ 910 static int nfs_wait_on_inode(struct inode *inode) 911 { 912 struct rpc_clnt *clnt = NFS_CLIENT(inode); 913 struct nfs_inode *nfsi = NFS_I(inode); 914 sigset_t oldmask; 915 int error; 916 917 rpc_clnt_sigmask(clnt, &oldmask); 918 error = wait_on_bit_lock(&nfsi->flags, NFS_INO_REVALIDATING, 919 nfs_wait_schedule, TASK_INTERRUPTIBLE); 920 rpc_clnt_sigunmask(clnt, &oldmask); 921 922 return error; 923 } 924 925 static void nfs_wake_up_inode(struct inode *inode) 926 { 927 struct nfs_inode *nfsi = NFS_I(inode); 928 929 clear_bit(NFS_INO_REVALIDATING, &nfsi->flags); 930 smp_mb__after_clear_bit(); 931 wake_up_bit(&nfsi->flags, NFS_INO_REVALIDATING); 932 } 933 934 int nfs_getattr(struct vfsmount *mnt, struct dentry *dentry, struct kstat *stat) 935 { 936 struct inode *inode = dentry->d_inode; 937 int need_atime = NFS_I(inode)->cache_validity & NFS_INO_INVALID_ATIME; 938 int err; 939 940 if (__IS_FLG(inode, MS_NOATIME)) 941 need_atime = 0; 942 else if (__IS_FLG(inode, MS_NODIRATIME) && S_ISDIR(inode->i_mode)) 943 need_atime = 0; 944 /* We may force a getattr if the user cares about atime */ 945 if (need_atime) 946 err = __nfs_revalidate_inode(NFS_SERVER(inode), inode); 947 else 948 err = nfs_revalidate_inode(NFS_SERVER(inode), inode); 949 if (!err) 950 generic_fillattr(inode, stat); 951 return err; 952 } 953 954 struct nfs_open_context *alloc_nfs_open_context(struct dentry *dentry, struct rpc_cred *cred) 955 { 956 struct nfs_open_context *ctx; 957 958 ctx = (struct nfs_open_context *)kmalloc(sizeof(*ctx), GFP_KERNEL); 959 if (ctx != NULL) { 960 atomic_set(&ctx->count, 1); 961 ctx->dentry = dget(dentry); 962 ctx->cred = get_rpccred(cred); 963 ctx->state = NULL; 964 ctx->lockowner = current->files; 965 ctx->error = 0; 966 ctx->dir_cookie = 0; 967 } 968 return ctx; 969 } 970 971 struct nfs_open_context *get_nfs_open_context(struct nfs_open_context *ctx) 972 { 973 if (ctx != NULL) 974 atomic_inc(&ctx->count); 975 return ctx; 976 } 977 978 void put_nfs_open_context(struct nfs_open_context *ctx) 979 { 980 if (atomic_dec_and_test(&ctx->count)) { 981 if (!list_empty(&ctx->list)) { 982 struct inode *inode = ctx->dentry->d_inode; 983 spin_lock(&inode->i_lock); 984 list_del(&ctx->list); 985 spin_unlock(&inode->i_lock); 986 } 987 if (ctx->state != NULL) 988 nfs4_close_state(ctx->state, ctx->mode); 989 if (ctx->cred != NULL) 990 put_rpccred(ctx->cred); 991 dput(ctx->dentry); 992 kfree(ctx); 993 } 994 } 995 996 /* 997 * Ensure that mmap has a recent RPC credential for use when writing out 998 * shared pages 999 */ 1000 void nfs_file_set_open_context(struct file *filp, struct nfs_open_context *ctx) 1001 { 1002 struct inode *inode = filp->f_dentry->d_inode; 1003 struct nfs_inode *nfsi = NFS_I(inode); 1004 1005 filp->private_data = get_nfs_open_context(ctx); 1006 spin_lock(&inode->i_lock); 1007 list_add(&ctx->list, &nfsi->open_files); 1008 spin_unlock(&inode->i_lock); 1009 } 1010 1011 /* 1012 * Given an inode, search for an open context with the desired characteristics 1013 */ 1014 struct nfs_open_context *nfs_find_open_context(struct inode *inode, struct rpc_cred *cred, int mode) 1015 { 1016 struct nfs_inode *nfsi = NFS_I(inode); 1017 struct nfs_open_context *pos, *ctx = NULL; 1018 1019 spin_lock(&inode->i_lock); 1020 list_for_each_entry(pos, &nfsi->open_files, list) { 1021 if (cred != NULL && pos->cred != cred) 1022 continue; 1023 if ((pos->mode & mode) == mode) { 1024 ctx = get_nfs_open_context(pos); 1025 break; 1026 } 1027 } 1028 spin_unlock(&inode->i_lock); 1029 return ctx; 1030 } 1031 1032 void nfs_file_clear_open_context(struct file *filp) 1033 { 1034 struct inode *inode = filp->f_dentry->d_inode; 1035 struct nfs_open_context *ctx = (struct nfs_open_context *)filp->private_data; 1036 1037 if (ctx) { 1038 filp->private_data = NULL; 1039 spin_lock(&inode->i_lock); 1040 list_move_tail(&ctx->list, &NFS_I(inode)->open_files); 1041 spin_unlock(&inode->i_lock); 1042 put_nfs_open_context(ctx); 1043 } 1044 } 1045 1046 /* 1047 * These allocate and release file read/write context information. 1048 */ 1049 int nfs_open(struct inode *inode, struct file *filp) 1050 { 1051 struct nfs_open_context *ctx; 1052 struct rpc_cred *cred; 1053 1054 cred = rpcauth_lookupcred(NFS_CLIENT(inode)->cl_auth, 0); 1055 if (IS_ERR(cred)) 1056 return PTR_ERR(cred); 1057 ctx = alloc_nfs_open_context(filp->f_dentry, cred); 1058 put_rpccred(cred); 1059 if (ctx == NULL) 1060 return -ENOMEM; 1061 ctx->mode = filp->f_mode; 1062 nfs_file_set_open_context(filp, ctx); 1063 put_nfs_open_context(ctx); 1064 return 0; 1065 } 1066 1067 int nfs_release(struct inode *inode, struct file *filp) 1068 { 1069 nfs_file_clear_open_context(filp); 1070 return 0; 1071 } 1072 1073 /* 1074 * This function is called whenever some part of NFS notices that 1075 * the cached attributes have to be refreshed. 1076 */ 1077 int 1078 __nfs_revalidate_inode(struct nfs_server *server, struct inode *inode) 1079 { 1080 int status = -ESTALE; 1081 struct nfs_fattr fattr; 1082 struct nfs_inode *nfsi = NFS_I(inode); 1083 1084 dfprintk(PAGECACHE, "NFS: revalidating (%s/%Ld)\n", 1085 inode->i_sb->s_id, (long long)NFS_FILEID(inode)); 1086 1087 lock_kernel(); 1088 if (!inode || is_bad_inode(inode)) 1089 goto out_nowait; 1090 if (NFS_STALE(inode)) 1091 goto out_nowait; 1092 1093 status = nfs_wait_on_inode(inode); 1094 if (status < 0) 1095 goto out; 1096 if (NFS_STALE(inode)) { 1097 status = -ESTALE; 1098 /* Do we trust the cached ESTALE? */ 1099 if (NFS_ATTRTIMEO(inode) != 0) { 1100 if (nfsi->cache_validity & (NFS_INO_INVALID_ATTR|NFS_INO_INVALID_DATA|NFS_INO_INVALID_ATIME)) { 1101 /* no */ 1102 } else 1103 goto out; 1104 } 1105 } 1106 1107 status = NFS_PROTO(inode)->getattr(server, NFS_FH(inode), &fattr); 1108 if (status != 0) { 1109 dfprintk(PAGECACHE, "nfs_revalidate_inode: (%s/%Ld) getattr failed, error=%d\n", 1110 inode->i_sb->s_id, 1111 (long long)NFS_FILEID(inode), status); 1112 if (status == -ESTALE) { 1113 nfs_zap_caches(inode); 1114 if (!S_ISDIR(inode->i_mode)) 1115 set_bit(NFS_INO_STALE, &NFS_FLAGS(inode)); 1116 } 1117 goto out; 1118 } 1119 1120 spin_lock(&inode->i_lock); 1121 status = nfs_update_inode(inode, &fattr); 1122 if (status) { 1123 spin_unlock(&inode->i_lock); 1124 dfprintk(PAGECACHE, "nfs_revalidate_inode: (%s/%Ld) refresh failed, error=%d\n", 1125 inode->i_sb->s_id, 1126 (long long)NFS_FILEID(inode), status); 1127 goto out; 1128 } 1129 spin_unlock(&inode->i_lock); 1130 1131 nfs_revalidate_mapping(inode, inode->i_mapping); 1132 1133 if (nfsi->cache_validity & NFS_INO_INVALID_ACL) 1134 nfs_zap_acl_cache(inode); 1135 1136 dfprintk(PAGECACHE, "NFS: (%s/%Ld) revalidation complete\n", 1137 inode->i_sb->s_id, 1138 (long long)NFS_FILEID(inode)); 1139 1140 out: 1141 nfs_wake_up_inode(inode); 1142 1143 out_nowait: 1144 unlock_kernel(); 1145 return status; 1146 } 1147 1148 int nfs_attribute_timeout(struct inode *inode) 1149 { 1150 struct nfs_inode *nfsi = NFS_I(inode); 1151 1152 if (nfs_have_delegation(inode, FMODE_READ)) 1153 return 0; 1154 return time_after(jiffies, nfsi->read_cache_jiffies+nfsi->attrtimeo); 1155 } 1156 1157 /** 1158 * nfs_revalidate_inode - Revalidate the inode attributes 1159 * @server - pointer to nfs_server struct 1160 * @inode - pointer to inode struct 1161 * 1162 * Updates inode attribute information by retrieving the data from the server. 1163 */ 1164 int nfs_revalidate_inode(struct nfs_server *server, struct inode *inode) 1165 { 1166 if (!(NFS_I(inode)->cache_validity & (NFS_INO_INVALID_ATTR|NFS_INO_INVALID_DATA)) 1167 && !nfs_attribute_timeout(inode)) 1168 return NFS_STALE(inode) ? -ESTALE : 0; 1169 return __nfs_revalidate_inode(server, inode); 1170 } 1171 1172 /** 1173 * nfs_revalidate_mapping - Revalidate the pagecache 1174 * @inode - pointer to host inode 1175 * @mapping - pointer to mapping 1176 */ 1177 void nfs_revalidate_mapping(struct inode *inode, struct address_space *mapping) 1178 { 1179 struct nfs_inode *nfsi = NFS_I(inode); 1180 1181 if (nfsi->cache_validity & NFS_INO_INVALID_DATA) { 1182 if (S_ISREG(inode->i_mode)) { 1183 if (filemap_fdatawrite(mapping) == 0) 1184 filemap_fdatawait(mapping); 1185 nfs_wb_all(inode); 1186 } 1187 invalidate_inode_pages2(mapping); 1188 1189 spin_lock(&inode->i_lock); 1190 nfsi->cache_validity &= ~NFS_INO_INVALID_DATA; 1191 if (S_ISDIR(inode->i_mode)) { 1192 memset(nfsi->cookieverf, 0, sizeof(nfsi->cookieverf)); 1193 /* This ensures we revalidate child dentries */ 1194 nfsi->cache_change_attribute = jiffies; 1195 } 1196 spin_unlock(&inode->i_lock); 1197 1198 dfprintk(PAGECACHE, "NFS: (%s/%Ld) data cache invalidated\n", 1199 inode->i_sb->s_id, 1200 (long long)NFS_FILEID(inode)); 1201 } 1202 } 1203 1204 /** 1205 * nfs_begin_data_update 1206 * @inode - pointer to inode 1207 * Declare that a set of operations will update file data on the server 1208 */ 1209 void nfs_begin_data_update(struct inode *inode) 1210 { 1211 atomic_inc(&NFS_I(inode)->data_updates); 1212 } 1213 1214 /** 1215 * nfs_end_data_update 1216 * @inode - pointer to inode 1217 * Declare end of the operations that will update file data 1218 * This will mark the inode as immediately needing revalidation 1219 * of its attribute cache. 1220 */ 1221 void nfs_end_data_update(struct inode *inode) 1222 { 1223 struct nfs_inode *nfsi = NFS_I(inode); 1224 1225 if (!nfs_have_delegation(inode, FMODE_READ)) { 1226 /* Directories and symlinks: invalidate page cache */ 1227 if (S_ISDIR(inode->i_mode) || S_ISLNK(inode->i_mode)) { 1228 spin_lock(&inode->i_lock); 1229 nfsi->cache_validity |= NFS_INO_INVALID_DATA; 1230 spin_unlock(&inode->i_lock); 1231 } 1232 } 1233 nfsi->cache_change_attribute = jiffies; 1234 atomic_dec(&nfsi->data_updates); 1235 } 1236 1237 /** 1238 * nfs_check_inode_attributes - verify consistency of the inode attribute cache 1239 * @inode - pointer to inode 1240 * @fattr - updated attributes 1241 * 1242 * Verifies the attribute cache. If we have just changed the attributes, 1243 * so that fattr carries weak cache consistency data, then it may 1244 * also update the ctime/mtime/change_attribute. 1245 */ 1246 static int nfs_check_inode_attributes(struct inode *inode, struct nfs_fattr *fattr) 1247 { 1248 struct nfs_inode *nfsi = NFS_I(inode); 1249 loff_t cur_size, new_isize; 1250 int data_unstable; 1251 1252 1253 /* Are we in the process of updating data on the server? */ 1254 data_unstable = nfs_caches_unstable(inode); 1255 1256 if (fattr->valid & NFS_ATTR_FATTR_V4) { 1257 if ((fattr->valid & NFS_ATTR_PRE_CHANGE) != 0 1258 && nfsi->change_attr == fattr->pre_change_attr) 1259 nfsi->change_attr = fattr->change_attr; 1260 if (nfsi->change_attr != fattr->change_attr) { 1261 nfsi->cache_validity |= NFS_INO_INVALID_ATTR; 1262 if (!data_unstable) 1263 nfsi->cache_validity |= NFS_INO_REVAL_PAGECACHE; 1264 } 1265 } 1266 1267 if ((fattr->valid & NFS_ATTR_FATTR) == 0) { 1268 return 0; 1269 } 1270 1271 /* Has the inode gone and changed behind our back? */ 1272 if (nfsi->fileid != fattr->fileid 1273 || (inode->i_mode & S_IFMT) != (fattr->mode & S_IFMT)) { 1274 return -EIO; 1275 } 1276 1277 cur_size = i_size_read(inode); 1278 new_isize = nfs_size_to_loff_t(fattr->size); 1279 1280 /* If we have atomic WCC data, we may update some attributes */ 1281 if ((fattr->valid & NFS_ATTR_WCC) != 0) { 1282 if (timespec_equal(&inode->i_ctime, &fattr->pre_ctime)) 1283 memcpy(&inode->i_ctime, &fattr->ctime, sizeof(inode->i_ctime)); 1284 if (timespec_equal(&inode->i_mtime, &fattr->pre_mtime)) 1285 memcpy(&inode->i_mtime, &fattr->mtime, sizeof(inode->i_mtime)); 1286 } 1287 1288 /* Verify a few of the more important attributes */ 1289 if (!timespec_equal(&inode->i_mtime, &fattr->mtime)) { 1290 nfsi->cache_validity |= NFS_INO_INVALID_ATTR; 1291 if (!data_unstable) 1292 nfsi->cache_validity |= NFS_INO_REVAL_PAGECACHE; 1293 } 1294 if (cur_size != new_isize) { 1295 nfsi->cache_validity |= NFS_INO_INVALID_ATTR; 1296 if (nfsi->npages == 0) 1297 nfsi->cache_validity |= NFS_INO_REVAL_PAGECACHE; 1298 } 1299 1300 /* Have any file permissions changed? */ 1301 if ((inode->i_mode & S_IALLUGO) != (fattr->mode & S_IALLUGO) 1302 || inode->i_uid != fattr->uid 1303 || inode->i_gid != fattr->gid) 1304 nfsi->cache_validity |= NFS_INO_INVALID_ATTR | NFS_INO_INVALID_ACCESS | NFS_INO_INVALID_ACL; 1305 1306 /* Has the link count changed? */ 1307 if (inode->i_nlink != fattr->nlink) 1308 nfsi->cache_validity |= NFS_INO_INVALID_ATTR; 1309 1310 if (!timespec_equal(&inode->i_atime, &fattr->atime)) 1311 nfsi->cache_validity |= NFS_INO_INVALID_ATIME; 1312 1313 nfsi->read_cache_jiffies = fattr->time_start; 1314 return 0; 1315 } 1316 1317 /** 1318 * nfs_refresh_inode - try to update the inode attribute cache 1319 * @inode - pointer to inode 1320 * @fattr - updated attributes 1321 * 1322 * Check that an RPC call that returned attributes has not overlapped with 1323 * other recent updates of the inode metadata, then decide whether it is 1324 * safe to do a full update of the inode attributes, or whether just to 1325 * call nfs_check_inode_attributes. 1326 */ 1327 int nfs_refresh_inode(struct inode *inode, struct nfs_fattr *fattr) 1328 { 1329 struct nfs_inode *nfsi = NFS_I(inode); 1330 int status; 1331 1332 if ((fattr->valid & NFS_ATTR_FATTR) == 0) 1333 return 0; 1334 spin_lock(&inode->i_lock); 1335 nfsi->cache_validity &= ~NFS_INO_REVAL_PAGECACHE; 1336 if (time_after(fattr->time_start, nfsi->last_updated)) 1337 status = nfs_update_inode(inode, fattr); 1338 else 1339 status = nfs_check_inode_attributes(inode, fattr); 1340 1341 spin_unlock(&inode->i_lock); 1342 return status; 1343 } 1344 1345 /** 1346 * nfs_post_op_update_inode - try to update the inode attribute cache 1347 * @inode - pointer to inode 1348 * @fattr - updated attributes 1349 * 1350 * After an operation that has changed the inode metadata, mark the 1351 * attribute cache as being invalid, then try to update it. 1352 */ 1353 int nfs_post_op_update_inode(struct inode *inode, struct nfs_fattr *fattr) 1354 { 1355 struct nfs_inode *nfsi = NFS_I(inode); 1356 int status = 0; 1357 1358 spin_lock(&inode->i_lock); 1359 if (unlikely((fattr->valid & NFS_ATTR_FATTR) == 0)) { 1360 nfsi->cache_validity |= NFS_INO_INVALID_ATTR | NFS_INO_INVALID_ACCESS; 1361 goto out; 1362 } 1363 status = nfs_update_inode(inode, fattr); 1364 out: 1365 spin_unlock(&inode->i_lock); 1366 return status; 1367 } 1368 1369 /* 1370 * Many nfs protocol calls return the new file attributes after 1371 * an operation. Here we update the inode to reflect the state 1372 * of the server's inode. 1373 * 1374 * This is a bit tricky because we have to make sure all dirty pages 1375 * have been sent off to the server before calling invalidate_inode_pages. 1376 * To make sure no other process adds more write requests while we try 1377 * our best to flush them, we make them sleep during the attribute refresh. 1378 * 1379 * A very similar scenario holds for the dir cache. 1380 */ 1381 static int nfs_update_inode(struct inode *inode, struct nfs_fattr *fattr) 1382 { 1383 struct nfs_inode *nfsi = NFS_I(inode); 1384 loff_t cur_isize, new_isize; 1385 unsigned int invalid = 0; 1386 int data_stable; 1387 1388 dfprintk(VFS, "NFS: %s(%s/%ld ct=%d info=0x%x)\n", 1389 __FUNCTION__, inode->i_sb->s_id, inode->i_ino, 1390 atomic_read(&inode->i_count), fattr->valid); 1391 1392 if ((fattr->valid & NFS_ATTR_FATTR) == 0) 1393 return 0; 1394 1395 if (nfsi->fileid != fattr->fileid) { 1396 printk(KERN_ERR "%s: inode number mismatch\n" 1397 "expected (%s/0x%Lx), got (%s/0x%Lx)\n", 1398 __FUNCTION__, 1399 inode->i_sb->s_id, (long long)nfsi->fileid, 1400 inode->i_sb->s_id, (long long)fattr->fileid); 1401 goto out_err; 1402 } 1403 1404 /* 1405 * Make sure the inode's type hasn't changed. 1406 */ 1407 if ((inode->i_mode & S_IFMT) != (fattr->mode & S_IFMT)) 1408 goto out_changed; 1409 1410 /* 1411 * Update the read time so we don't revalidate too often. 1412 */ 1413 nfsi->read_cache_jiffies = fattr->time_start; 1414 nfsi->last_updated = jiffies; 1415 1416 /* Are we racing with known updates of the metadata on the server? */ 1417 data_stable = nfs_verify_change_attribute(inode, fattr->time_start); 1418 if (data_stable) 1419 nfsi->cache_validity &= ~(NFS_INO_INVALID_ATTR|NFS_INO_INVALID_ATIME); 1420 1421 /* Check if our cached file size is stale */ 1422 new_isize = nfs_size_to_loff_t(fattr->size); 1423 cur_isize = i_size_read(inode); 1424 if (new_isize != cur_isize) { 1425 /* Do we perhaps have any outstanding writes? */ 1426 if (nfsi->npages == 0) { 1427 /* No, but did we race with nfs_end_data_update()? */ 1428 if (data_stable) { 1429 inode->i_size = new_isize; 1430 invalid |= NFS_INO_INVALID_DATA; 1431 } 1432 invalid |= NFS_INO_INVALID_ATTR; 1433 } else if (new_isize > cur_isize) { 1434 inode->i_size = new_isize; 1435 invalid |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_DATA; 1436 } 1437 nfsi->cache_change_attribute = jiffies; 1438 dprintk("NFS: isize change on server for file %s/%ld\n", 1439 inode->i_sb->s_id, inode->i_ino); 1440 } 1441 1442 /* Check if the mtime agrees */ 1443 if (!timespec_equal(&inode->i_mtime, &fattr->mtime)) { 1444 memcpy(&inode->i_mtime, &fattr->mtime, sizeof(inode->i_mtime)); 1445 dprintk("NFS: mtime change on server for file %s/%ld\n", 1446 inode->i_sb->s_id, inode->i_ino); 1447 invalid |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_DATA; 1448 nfsi->cache_change_attribute = jiffies; 1449 } 1450 1451 if ((fattr->valid & NFS_ATTR_FATTR_V4) 1452 && nfsi->change_attr != fattr->change_attr) { 1453 dprintk("NFS: change_attr change on server for file %s/%ld\n", 1454 inode->i_sb->s_id, inode->i_ino); 1455 nfsi->change_attr = fattr->change_attr; 1456 invalid |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_DATA|NFS_INO_INVALID_ACCESS|NFS_INO_INVALID_ACL; 1457 nfsi->cache_change_attribute = jiffies; 1458 } 1459 1460 /* If ctime has changed we should definitely clear access+acl caches */ 1461 if (!timespec_equal(&inode->i_ctime, &fattr->ctime)) { 1462 invalid |= NFS_INO_INVALID_ACCESS|NFS_INO_INVALID_ACL; 1463 memcpy(&inode->i_ctime, &fattr->ctime, sizeof(inode->i_ctime)); 1464 nfsi->cache_change_attribute = jiffies; 1465 } 1466 memcpy(&inode->i_atime, &fattr->atime, sizeof(inode->i_atime)); 1467 1468 if ((inode->i_mode & S_IALLUGO) != (fattr->mode & S_IALLUGO) || 1469 inode->i_uid != fattr->uid || 1470 inode->i_gid != fattr->gid) 1471 invalid |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_ACCESS|NFS_INO_INVALID_ACL; 1472 1473 inode->i_mode = fattr->mode; 1474 inode->i_nlink = fattr->nlink; 1475 inode->i_uid = fattr->uid; 1476 inode->i_gid = fattr->gid; 1477 1478 if (fattr->valid & (NFS_ATTR_FATTR_V3 | NFS_ATTR_FATTR_V4)) { 1479 /* 1480 * report the blocks in 512byte units 1481 */ 1482 inode->i_blocks = nfs_calc_block_size(fattr->du.nfs3.used); 1483 inode->i_blksize = inode->i_sb->s_blocksize; 1484 } else { 1485 inode->i_blocks = fattr->du.nfs2.blocks; 1486 inode->i_blksize = fattr->du.nfs2.blocksize; 1487 } 1488 1489 /* Update attrtimeo value if we're out of the unstable period */ 1490 if (invalid & NFS_INO_INVALID_ATTR) { 1491 nfsi->attrtimeo = NFS_MINATTRTIMEO(inode); 1492 nfsi->attrtimeo_timestamp = jiffies; 1493 } else if (time_after(jiffies, nfsi->attrtimeo_timestamp+nfsi->attrtimeo)) { 1494 if ((nfsi->attrtimeo <<= 1) > NFS_MAXATTRTIMEO(inode)) 1495 nfsi->attrtimeo = NFS_MAXATTRTIMEO(inode); 1496 nfsi->attrtimeo_timestamp = jiffies; 1497 } 1498 /* Don't invalidate the data if we were to blame */ 1499 if (!(S_ISREG(inode->i_mode) || S_ISDIR(inode->i_mode) 1500 || S_ISLNK(inode->i_mode))) 1501 invalid &= ~NFS_INO_INVALID_DATA; 1502 if (data_stable) 1503 invalid &= ~(NFS_INO_INVALID_ATTR|NFS_INO_INVALID_ATIME|NFS_INO_REVAL_PAGECACHE); 1504 if (!nfs_have_delegation(inode, FMODE_READ)) 1505 nfsi->cache_validity |= invalid; 1506 1507 return 0; 1508 out_changed: 1509 /* 1510 * Big trouble! The inode has become a different object. 1511 */ 1512 #ifdef NFS_PARANOIA 1513 printk(KERN_DEBUG "%s: inode %ld mode changed, %07o to %07o\n", 1514 __FUNCTION__, inode->i_ino, inode->i_mode, fattr->mode); 1515 #endif 1516 out_err: 1517 /* 1518 * No need to worry about unhashing the dentry, as the 1519 * lookup validation will know that the inode is bad. 1520 * (But we fall through to invalidate the caches.) 1521 */ 1522 nfs_invalidate_inode(inode); 1523 return -ESTALE; 1524 } 1525 1526 /* 1527 * File system information 1528 */ 1529 1530 static int nfs_set_super(struct super_block *s, void *data) 1531 { 1532 s->s_fs_info = data; 1533 return set_anon_super(s, data); 1534 } 1535 1536 static int nfs_compare_super(struct super_block *sb, void *data) 1537 { 1538 struct nfs_server *server = data; 1539 struct nfs_server *old = NFS_SB(sb); 1540 1541 if (old->addr.sin_addr.s_addr != server->addr.sin_addr.s_addr) 1542 return 0; 1543 if (old->addr.sin_port != server->addr.sin_port) 1544 return 0; 1545 return !nfs_compare_fh(&old->fh, &server->fh); 1546 } 1547 1548 static struct super_block *nfs_get_sb(struct file_system_type *fs_type, 1549 int flags, const char *dev_name, void *raw_data) 1550 { 1551 int error; 1552 struct nfs_server *server = NULL; 1553 struct super_block *s; 1554 struct nfs_fh *root; 1555 struct nfs_mount_data *data = raw_data; 1556 1557 s = ERR_PTR(-EINVAL); 1558 if (data == NULL) { 1559 dprintk("%s: missing data argument\n", __FUNCTION__); 1560 goto out_err; 1561 } 1562 if (data->version <= 0 || data->version > NFS_MOUNT_VERSION) { 1563 dprintk("%s: bad mount version\n", __FUNCTION__); 1564 goto out_err; 1565 } 1566 switch (data->version) { 1567 case 1: 1568 data->namlen = 0; 1569 case 2: 1570 data->bsize = 0; 1571 case 3: 1572 if (data->flags & NFS_MOUNT_VER3) { 1573 dprintk("%s: mount structure version %d does not support NFSv3\n", 1574 __FUNCTION__, 1575 data->version); 1576 goto out_err; 1577 } 1578 data->root.size = NFS2_FHSIZE; 1579 memcpy(data->root.data, data->old_root.data, NFS2_FHSIZE); 1580 case 4: 1581 if (data->flags & NFS_MOUNT_SECFLAVOUR) { 1582 dprintk("%s: mount structure version %d does not support strong security\n", 1583 __FUNCTION__, 1584 data->version); 1585 goto out_err; 1586 } 1587 case 5: 1588 memset(data->context, 0, sizeof(data->context)); 1589 } 1590 #ifndef CONFIG_NFS_V3 1591 /* If NFSv3 is not compiled in, return -EPROTONOSUPPORT */ 1592 s = ERR_PTR(-EPROTONOSUPPORT); 1593 if (data->flags & NFS_MOUNT_VER3) { 1594 dprintk("%s: NFSv3 not compiled into kernel\n", __FUNCTION__); 1595 goto out_err; 1596 } 1597 #endif /* CONFIG_NFS_V3 */ 1598 1599 s = ERR_PTR(-ENOMEM); 1600 server = kmalloc(sizeof(struct nfs_server), GFP_KERNEL); 1601 if (!server) 1602 goto out_err; 1603 memset(server, 0, sizeof(struct nfs_server)); 1604 /* Zero out the NFS state stuff */ 1605 init_nfsv4_state(server); 1606 server->client = server->client_sys = server->client_acl = ERR_PTR(-EINVAL); 1607 1608 root = &server->fh; 1609 if (data->flags & NFS_MOUNT_VER3) 1610 root->size = data->root.size; 1611 else 1612 root->size = NFS2_FHSIZE; 1613 s = ERR_PTR(-EINVAL); 1614 if (root->size > sizeof(root->data)) { 1615 dprintk("%s: invalid root filehandle\n", __FUNCTION__); 1616 goto out_err; 1617 } 1618 memcpy(root->data, data->root.data, root->size); 1619 1620 /* We now require that the mount process passes the remote address */ 1621 memcpy(&server->addr, &data->addr, sizeof(server->addr)); 1622 if (server->addr.sin_addr.s_addr == INADDR_ANY) { 1623 dprintk("%s: mount program didn't pass remote address!\n", 1624 __FUNCTION__); 1625 goto out_err; 1626 } 1627 1628 /* Fire up rpciod if not yet running */ 1629 s = ERR_PTR(rpciod_up()); 1630 if (IS_ERR(s)) { 1631 dprintk("%s: couldn't start rpciod! Error = %ld\n", 1632 __FUNCTION__, PTR_ERR(s)); 1633 goto out_err; 1634 } 1635 1636 s = sget(fs_type, nfs_compare_super, nfs_set_super, server); 1637 if (IS_ERR(s) || s->s_root) 1638 goto out_rpciod_down; 1639 1640 s->s_flags = flags; 1641 1642 error = nfs_fill_super(s, data, flags & MS_VERBOSE ? 1 : 0); 1643 if (error) { 1644 up_write(&s->s_umount); 1645 deactivate_super(s); 1646 return ERR_PTR(error); 1647 } 1648 s->s_flags |= MS_ACTIVE; 1649 return s; 1650 out_rpciod_down: 1651 rpciod_down(); 1652 out_err: 1653 kfree(server); 1654 return s; 1655 } 1656 1657 static void nfs_kill_super(struct super_block *s) 1658 { 1659 struct nfs_server *server = NFS_SB(s); 1660 1661 kill_anon_super(s); 1662 1663 if (!IS_ERR(server->client)) 1664 rpc_shutdown_client(server->client); 1665 if (!IS_ERR(server->client_sys)) 1666 rpc_shutdown_client(server->client_sys); 1667 if (!IS_ERR(server->client_acl)) 1668 rpc_shutdown_client(server->client_acl); 1669 1670 if (!(server->flags & NFS_MOUNT_NONLM)) 1671 lockd_down(); /* release rpc.lockd */ 1672 1673 rpciod_down(); /* release rpciod */ 1674 1675 kfree(server->hostname); 1676 kfree(server); 1677 } 1678 1679 static struct file_system_type nfs_fs_type = { 1680 .owner = THIS_MODULE, 1681 .name = "nfs", 1682 .get_sb = nfs_get_sb, 1683 .kill_sb = nfs_kill_super, 1684 .fs_flags = FS_ODD_RENAME|FS_REVAL_DOT|FS_BINARY_MOUNTDATA, 1685 }; 1686 1687 #ifdef CONFIG_NFS_V4 1688 1689 static void nfs4_clear_inode(struct inode *); 1690 1691 1692 static struct super_operations nfs4_sops = { 1693 .alloc_inode = nfs_alloc_inode, 1694 .destroy_inode = nfs_destroy_inode, 1695 .write_inode = nfs_write_inode, 1696 .delete_inode = nfs_delete_inode, 1697 .statfs = nfs_statfs, 1698 .clear_inode = nfs4_clear_inode, 1699 .umount_begin = nfs_umount_begin, 1700 .show_options = nfs_show_options, 1701 }; 1702 1703 /* 1704 * Clean out any remaining NFSv4 state that might be left over due 1705 * to open() calls that passed nfs_atomic_lookup, but failed to call 1706 * nfs_open(). 1707 */ 1708 static void nfs4_clear_inode(struct inode *inode) 1709 { 1710 struct nfs_inode *nfsi = NFS_I(inode); 1711 1712 /* If we are holding a delegation, return it! */ 1713 nfs_inode_return_delegation(inode); 1714 /* First call standard NFS clear_inode() code */ 1715 nfs_clear_inode(inode); 1716 /* Now clear out any remaining state */ 1717 while (!list_empty(&nfsi->open_states)) { 1718 struct nfs4_state *state; 1719 1720 state = list_entry(nfsi->open_states.next, 1721 struct nfs4_state, 1722 inode_states); 1723 dprintk("%s(%s/%Ld): found unclaimed NFSv4 state %p\n", 1724 __FUNCTION__, 1725 inode->i_sb->s_id, 1726 (long long)NFS_FILEID(inode), 1727 state); 1728 BUG_ON(atomic_read(&state->count) != 1); 1729 nfs4_close_state(state, state->state); 1730 } 1731 } 1732 1733 1734 static int nfs4_fill_super(struct super_block *sb, struct nfs4_mount_data *data, int silent) 1735 { 1736 struct nfs_server *server; 1737 struct nfs4_client *clp = NULL; 1738 struct rpc_xprt *xprt = NULL; 1739 struct rpc_clnt *clnt = NULL; 1740 struct rpc_timeout timeparms; 1741 rpc_authflavor_t authflavour; 1742 int err = -EIO; 1743 1744 sb->s_blocksize_bits = 0; 1745 sb->s_blocksize = 0; 1746 server = NFS_SB(sb); 1747 if (data->rsize != 0) 1748 server->rsize = nfs_block_size(data->rsize, NULL); 1749 if (data->wsize != 0) 1750 server->wsize = nfs_block_size(data->wsize, NULL); 1751 server->flags = data->flags & NFS_MOUNT_FLAGMASK; 1752 server->caps = NFS_CAP_ATOMIC_OPEN; 1753 1754 server->acregmin = data->acregmin*HZ; 1755 server->acregmax = data->acregmax*HZ; 1756 server->acdirmin = data->acdirmin*HZ; 1757 server->acdirmax = data->acdirmax*HZ; 1758 1759 server->rpc_ops = &nfs_v4_clientops; 1760 1761 nfs_init_timeout_values(&timeparms, data->proto, data->timeo, data->retrans); 1762 1763 clp = nfs4_get_client(&server->addr.sin_addr); 1764 if (!clp) { 1765 dprintk("%s: failed to create NFS4 client.\n", __FUNCTION__); 1766 return -EIO; 1767 } 1768 1769 /* Now create transport and client */ 1770 authflavour = RPC_AUTH_UNIX; 1771 if (data->auth_flavourlen != 0) { 1772 if (data->auth_flavourlen != 1) { 1773 dprintk("%s: Invalid number of RPC auth flavours %d.\n", 1774 __FUNCTION__, data->auth_flavourlen); 1775 err = -EINVAL; 1776 goto out_fail; 1777 } 1778 if (copy_from_user(&authflavour, data->auth_flavours, sizeof(authflavour))) { 1779 err = -EFAULT; 1780 goto out_fail; 1781 } 1782 } 1783 1784 down_write(&clp->cl_sem); 1785 if (IS_ERR(clp->cl_rpcclient)) { 1786 xprt = xprt_create_proto(data->proto, &server->addr, &timeparms); 1787 if (IS_ERR(xprt)) { 1788 up_write(&clp->cl_sem); 1789 err = PTR_ERR(xprt); 1790 dprintk("%s: cannot create RPC transport. Error = %d\n", 1791 __FUNCTION__, err); 1792 goto out_fail; 1793 } 1794 clnt = rpc_create_client(xprt, server->hostname, &nfs_program, 1795 server->rpc_ops->version, authflavour); 1796 if (IS_ERR(clnt)) { 1797 up_write(&clp->cl_sem); 1798 err = PTR_ERR(clnt); 1799 dprintk("%s: cannot create RPC client. Error = %d\n", 1800 __FUNCTION__, err); 1801 goto out_fail; 1802 } 1803 clnt->cl_intr = 1; 1804 clnt->cl_softrtry = 1; 1805 clnt->cl_chatty = 1; 1806 clp->cl_rpcclient = clnt; 1807 clp->cl_cred = rpcauth_lookupcred(clnt->cl_auth, 0); 1808 if (IS_ERR(clp->cl_cred)) { 1809 up_write(&clp->cl_sem); 1810 err = PTR_ERR(clp->cl_cred); 1811 clp->cl_cred = NULL; 1812 goto out_fail; 1813 } 1814 memcpy(clp->cl_ipaddr, server->ip_addr, sizeof(clp->cl_ipaddr)); 1815 nfs_idmap_new(clp); 1816 } 1817 if (list_empty(&clp->cl_superblocks)) { 1818 err = nfs4_init_client(clp); 1819 if (err != 0) { 1820 up_write(&clp->cl_sem); 1821 goto out_fail; 1822 } 1823 } 1824 list_add_tail(&server->nfs4_siblings, &clp->cl_superblocks); 1825 clnt = rpc_clone_client(clp->cl_rpcclient); 1826 if (!IS_ERR(clnt)) 1827 server->nfs4_state = clp; 1828 up_write(&clp->cl_sem); 1829 clp = NULL; 1830 1831 if (IS_ERR(clnt)) { 1832 err = PTR_ERR(clnt); 1833 dprintk("%s: cannot create RPC client. Error = %d\n", 1834 __FUNCTION__, err); 1835 return err; 1836 } 1837 1838 server->client = clnt; 1839 1840 if (server->nfs4_state->cl_idmap == NULL) { 1841 dprintk("%s: failed to create idmapper.\n", __FUNCTION__); 1842 return -ENOMEM; 1843 } 1844 1845 if (clnt->cl_auth->au_flavor != authflavour) { 1846 struct rpc_auth *auth; 1847 1848 auth = rpcauth_create(authflavour, clnt); 1849 if (IS_ERR(auth)) { 1850 dprintk("%s: couldn't create credcache!\n", __FUNCTION__); 1851 return PTR_ERR(auth); 1852 } 1853 } 1854 1855 sb->s_time_gran = 1; 1856 1857 sb->s_op = &nfs4_sops; 1858 err = nfs_sb_init(sb, authflavour); 1859 if (err == 0) 1860 return 0; 1861 out_fail: 1862 if (clp) 1863 nfs4_put_client(clp); 1864 return err; 1865 } 1866 1867 static int nfs4_compare_super(struct super_block *sb, void *data) 1868 { 1869 struct nfs_server *server = data; 1870 struct nfs_server *old = NFS_SB(sb); 1871 1872 if (strcmp(server->hostname, old->hostname) != 0) 1873 return 0; 1874 if (strcmp(server->mnt_path, old->mnt_path) != 0) 1875 return 0; 1876 return 1; 1877 } 1878 1879 static void * 1880 nfs_copy_user_string(char *dst, struct nfs_string *src, int maxlen) 1881 { 1882 void *p = NULL; 1883 1884 if (!src->len) 1885 return ERR_PTR(-EINVAL); 1886 if (src->len < maxlen) 1887 maxlen = src->len; 1888 if (dst == NULL) { 1889 p = dst = kmalloc(maxlen + 1, GFP_KERNEL); 1890 if (p == NULL) 1891 return ERR_PTR(-ENOMEM); 1892 } 1893 if (copy_from_user(dst, src->data, maxlen)) { 1894 kfree(p); 1895 return ERR_PTR(-EFAULT); 1896 } 1897 dst[maxlen] = '\0'; 1898 return dst; 1899 } 1900 1901 static struct super_block *nfs4_get_sb(struct file_system_type *fs_type, 1902 int flags, const char *dev_name, void *raw_data) 1903 { 1904 int error; 1905 struct nfs_server *server; 1906 struct super_block *s; 1907 struct nfs4_mount_data *data = raw_data; 1908 void *p; 1909 1910 if (data == NULL) { 1911 dprintk("%s: missing data argument\n", __FUNCTION__); 1912 return ERR_PTR(-EINVAL); 1913 } 1914 if (data->version <= 0 || data->version > NFS4_MOUNT_VERSION) { 1915 dprintk("%s: bad mount version\n", __FUNCTION__); 1916 return ERR_PTR(-EINVAL); 1917 } 1918 1919 server = kmalloc(sizeof(struct nfs_server), GFP_KERNEL); 1920 if (!server) 1921 return ERR_PTR(-ENOMEM); 1922 memset(server, 0, sizeof(struct nfs_server)); 1923 /* Zero out the NFS state stuff */ 1924 init_nfsv4_state(server); 1925 server->client = server->client_sys = server->client_acl = ERR_PTR(-EINVAL); 1926 1927 p = nfs_copy_user_string(NULL, &data->hostname, 256); 1928 if (IS_ERR(p)) 1929 goto out_err; 1930 server->hostname = p; 1931 1932 p = nfs_copy_user_string(NULL, &data->mnt_path, 1024); 1933 if (IS_ERR(p)) 1934 goto out_err; 1935 server->mnt_path = p; 1936 1937 p = nfs_copy_user_string(server->ip_addr, &data->client_addr, 1938 sizeof(server->ip_addr) - 1); 1939 if (IS_ERR(p)) 1940 goto out_err; 1941 1942 /* We now require that the mount process passes the remote address */ 1943 if (data->host_addrlen != sizeof(server->addr)) { 1944 s = ERR_PTR(-EINVAL); 1945 goto out_free; 1946 } 1947 if (copy_from_user(&server->addr, data->host_addr, sizeof(server->addr))) { 1948 s = ERR_PTR(-EFAULT); 1949 goto out_free; 1950 } 1951 if (server->addr.sin_family != AF_INET || 1952 server->addr.sin_addr.s_addr == INADDR_ANY) { 1953 dprintk("%s: mount program didn't pass remote IP address!\n", 1954 __FUNCTION__); 1955 s = ERR_PTR(-EINVAL); 1956 goto out_free; 1957 } 1958 1959 /* Fire up rpciod if not yet running */ 1960 s = ERR_PTR(rpciod_up()); 1961 if (IS_ERR(s)) { 1962 dprintk("%s: couldn't start rpciod! Error = %ld\n", 1963 __FUNCTION__, PTR_ERR(s)); 1964 goto out_free; 1965 } 1966 1967 s = sget(fs_type, nfs4_compare_super, nfs_set_super, server); 1968 1969 if (IS_ERR(s) || s->s_root) 1970 goto out_free; 1971 1972 s->s_flags = flags; 1973 1974 error = nfs4_fill_super(s, data, flags & MS_VERBOSE ? 1 : 0); 1975 if (error) { 1976 up_write(&s->s_umount); 1977 deactivate_super(s); 1978 return ERR_PTR(error); 1979 } 1980 s->s_flags |= MS_ACTIVE; 1981 return s; 1982 out_err: 1983 s = (struct super_block *)p; 1984 out_free: 1985 kfree(server->mnt_path); 1986 kfree(server->hostname); 1987 kfree(server); 1988 return s; 1989 } 1990 1991 static void nfs4_kill_super(struct super_block *sb) 1992 { 1993 struct nfs_server *server = NFS_SB(sb); 1994 1995 nfs_return_all_delegations(sb); 1996 kill_anon_super(sb); 1997 1998 nfs4_renewd_prepare_shutdown(server); 1999 2000 if (server->client != NULL && !IS_ERR(server->client)) 2001 rpc_shutdown_client(server->client); 2002 rpciod_down(); /* release rpciod */ 2003 2004 destroy_nfsv4_state(server); 2005 2006 kfree(server->hostname); 2007 kfree(server); 2008 } 2009 2010 static struct file_system_type nfs4_fs_type = { 2011 .owner = THIS_MODULE, 2012 .name = "nfs4", 2013 .get_sb = nfs4_get_sb, 2014 .kill_sb = nfs4_kill_super, 2015 .fs_flags = FS_ODD_RENAME|FS_REVAL_DOT|FS_BINARY_MOUNTDATA, 2016 }; 2017 2018 #define nfs4_init_once(nfsi) \ 2019 do { \ 2020 INIT_LIST_HEAD(&(nfsi)->open_states); \ 2021 nfsi->delegation = NULL; \ 2022 nfsi->delegation_state = 0; \ 2023 init_rwsem(&nfsi->rwsem); \ 2024 } while(0) 2025 #define register_nfs4fs() register_filesystem(&nfs4_fs_type) 2026 #define unregister_nfs4fs() unregister_filesystem(&nfs4_fs_type) 2027 #else 2028 #define nfs4_init_once(nfsi) \ 2029 do { } while (0) 2030 #define register_nfs4fs() (0) 2031 #define unregister_nfs4fs() 2032 #endif 2033 2034 extern int nfs_init_nfspagecache(void); 2035 extern void nfs_destroy_nfspagecache(void); 2036 extern int nfs_init_readpagecache(void); 2037 extern void nfs_destroy_readpagecache(void); 2038 extern int nfs_init_writepagecache(void); 2039 extern void nfs_destroy_writepagecache(void); 2040 #ifdef CONFIG_NFS_DIRECTIO 2041 extern int nfs_init_directcache(void); 2042 extern void nfs_destroy_directcache(void); 2043 #endif 2044 2045 static kmem_cache_t * nfs_inode_cachep; 2046 2047 static struct inode *nfs_alloc_inode(struct super_block *sb) 2048 { 2049 struct nfs_inode *nfsi; 2050 nfsi = (struct nfs_inode *)kmem_cache_alloc(nfs_inode_cachep, SLAB_KERNEL); 2051 if (!nfsi) 2052 return NULL; 2053 nfsi->flags = 0UL; 2054 nfsi->cache_validity = 0UL; 2055 nfsi->cache_change_attribute = jiffies; 2056 #ifdef CONFIG_NFS_V3_ACL 2057 nfsi->acl_access = ERR_PTR(-EAGAIN); 2058 nfsi->acl_default = ERR_PTR(-EAGAIN); 2059 #endif 2060 #ifdef CONFIG_NFS_V4 2061 nfsi->nfs4_acl = NULL; 2062 #endif /* CONFIG_NFS_V4 */ 2063 return &nfsi->vfs_inode; 2064 } 2065 2066 static void nfs_destroy_inode(struct inode *inode) 2067 { 2068 kmem_cache_free(nfs_inode_cachep, NFS_I(inode)); 2069 } 2070 2071 static void init_once(void * foo, kmem_cache_t * cachep, unsigned long flags) 2072 { 2073 struct nfs_inode *nfsi = (struct nfs_inode *) foo; 2074 2075 if ((flags & (SLAB_CTOR_VERIFY|SLAB_CTOR_CONSTRUCTOR)) == 2076 SLAB_CTOR_CONSTRUCTOR) { 2077 inode_init_once(&nfsi->vfs_inode); 2078 spin_lock_init(&nfsi->req_lock); 2079 INIT_LIST_HEAD(&nfsi->dirty); 2080 INIT_LIST_HEAD(&nfsi->commit); 2081 INIT_LIST_HEAD(&nfsi->open_files); 2082 INIT_RADIX_TREE(&nfsi->nfs_page_tree, GFP_ATOMIC); 2083 atomic_set(&nfsi->data_updates, 0); 2084 nfsi->ndirty = 0; 2085 nfsi->ncommit = 0; 2086 nfsi->npages = 0; 2087 nfs4_init_once(nfsi); 2088 } 2089 } 2090 2091 static int nfs_init_inodecache(void) 2092 { 2093 nfs_inode_cachep = kmem_cache_create("nfs_inode_cache", 2094 sizeof(struct nfs_inode), 2095 0, SLAB_RECLAIM_ACCOUNT, 2096 init_once, NULL); 2097 if (nfs_inode_cachep == NULL) 2098 return -ENOMEM; 2099 2100 return 0; 2101 } 2102 2103 static void nfs_destroy_inodecache(void) 2104 { 2105 if (kmem_cache_destroy(nfs_inode_cachep)) 2106 printk(KERN_INFO "nfs_inode_cache: not all structures were freed\n"); 2107 } 2108 2109 /* 2110 * Initialize NFS 2111 */ 2112 static int __init init_nfs_fs(void) 2113 { 2114 int err; 2115 2116 err = nfs_init_nfspagecache(); 2117 if (err) 2118 goto out4; 2119 2120 err = nfs_init_inodecache(); 2121 if (err) 2122 goto out3; 2123 2124 err = nfs_init_readpagecache(); 2125 if (err) 2126 goto out2; 2127 2128 err = nfs_init_writepagecache(); 2129 if (err) 2130 goto out1; 2131 2132 #ifdef CONFIG_NFS_DIRECTIO 2133 err = nfs_init_directcache(); 2134 if (err) 2135 goto out0; 2136 #endif 2137 2138 #ifdef CONFIG_PROC_FS 2139 rpc_proc_register(&nfs_rpcstat); 2140 #endif 2141 err = register_filesystem(&nfs_fs_type); 2142 if (err) 2143 goto out; 2144 if ((err = register_nfs4fs()) != 0) 2145 goto out; 2146 return 0; 2147 out: 2148 #ifdef CONFIG_PROC_FS 2149 rpc_proc_unregister("nfs"); 2150 #endif 2151 nfs_destroy_writepagecache(); 2152 #ifdef CONFIG_NFS_DIRECTIO 2153 out0: 2154 nfs_destroy_directcache(); 2155 #endif 2156 out1: 2157 nfs_destroy_readpagecache(); 2158 out2: 2159 nfs_destroy_inodecache(); 2160 out3: 2161 nfs_destroy_nfspagecache(); 2162 out4: 2163 return err; 2164 } 2165 2166 static void __exit exit_nfs_fs(void) 2167 { 2168 #ifdef CONFIG_NFS_DIRECTIO 2169 nfs_destroy_directcache(); 2170 #endif 2171 nfs_destroy_writepagecache(); 2172 nfs_destroy_readpagecache(); 2173 nfs_destroy_inodecache(); 2174 nfs_destroy_nfspagecache(); 2175 #ifdef CONFIG_PROC_FS 2176 rpc_proc_unregister("nfs"); 2177 #endif 2178 unregister_filesystem(&nfs_fs_type); 2179 unregister_nfs4fs(); 2180 } 2181 2182 /* Not quite true; I just maintain it */ 2183 MODULE_AUTHOR("Olaf Kirch <okir@monad.swb.de>"); 2184 MODULE_LICENSE("GPL"); 2185 2186 module_init(init_nfs_fs) 2187 module_exit(exit_nfs_fs) 2188