1 /* 2 * CDDL HEADER START 3 * 4 * The contents of this file are subject to the terms of the 5 * Common Development and Distribution License (the "License"). 6 * You may not use this file except in compliance with the License. 7 * 8 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 9 * or http://www.opensolaris.org/os/licensing. 10 * See the License for the specific language governing permissions 11 * and limitations under the License. 12 * 13 * When distributing Covered Code, include this CDDL HEADER in each 14 * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 15 * If applicable, add the following below this CDDL HEADER, with the 16 * fields enclosed by brackets "[]" replaced with your own identifying 17 * information: Portions Copyright [yyyy] [name of copyright owner] 18 * 19 * CDDL HEADER END 20 */ 21 /* 22 * Copyright (c) 2005, 2010, Oracle and/or its affiliates. All rights reserved. 23 * Copyright (c) 2013 by Delphix. All rights reserved. 24 * Copyright 2017 Nexenta Systems, Inc. All rights reserved. 25 */ 26 27 #include <sys/types.h> 28 #include <sys/param.h> 29 #include <sys/time.h> 30 #include <sys/systm.h> 31 #include <sys/sysmacros.h> 32 #include <sys/resource.h> 33 #include <sys/vfs.h> 34 #include <sys/vnode.h> 35 #include <sys/file.h> 36 #include <sys/stat.h> 37 #include <sys/kmem.h> 38 #include <sys/cmn_err.h> 39 #include <sys/errno.h> 40 #include <sys/unistd.h> 41 #include <sys/sdt.h> 42 #include <sys/fs/zfs.h> 43 #include <sys/policy.h> 44 #include <sys/zfs_znode.h> 45 #include <sys/zfs_fuid.h> 46 #include <sys/zfs_acl.h> 47 #include <sys/zfs_dir.h> 48 #include <sys/zfs_quota.h> 49 #include <sys/zfs_vfsops.h> 50 #include <sys/dmu.h> 51 #include <sys/dnode.h> 52 #include <sys/zap.h> 53 #include <sys/sa.h> 54 #include <acl/acl_common.h> 55 56 57 #define ALLOW ACE_ACCESS_ALLOWED_ACE_TYPE 58 #define DENY ACE_ACCESS_DENIED_ACE_TYPE 59 #define MAX_ACE_TYPE ACE_SYSTEM_ALARM_CALLBACK_OBJECT_ACE_TYPE 60 #define MIN_ACE_TYPE ALLOW 61 62 #define OWNING_GROUP (ACE_GROUP|ACE_IDENTIFIER_GROUP) 63 #define EVERYONE_ALLOW_MASK (ACE_READ_ACL|ACE_READ_ATTRIBUTES | \ 64 ACE_READ_NAMED_ATTRS|ACE_SYNCHRONIZE) 65 #define EVERYONE_DENY_MASK (ACE_WRITE_ACL|ACE_WRITE_OWNER | \ 66 ACE_WRITE_ATTRIBUTES|ACE_WRITE_NAMED_ATTRS) 67 #define OWNER_ALLOW_MASK (ACE_WRITE_ACL | ACE_WRITE_OWNER | \ 68 ACE_WRITE_ATTRIBUTES|ACE_WRITE_NAMED_ATTRS) 69 70 #define ZFS_CHECKED_MASKS (ACE_READ_ACL|ACE_READ_ATTRIBUTES|ACE_READ_DATA| \ 71 ACE_READ_NAMED_ATTRS|ACE_WRITE_DATA|ACE_WRITE_ATTRIBUTES| \ 72 ACE_WRITE_NAMED_ATTRS|ACE_APPEND_DATA|ACE_EXECUTE|ACE_WRITE_OWNER| \ 73 ACE_WRITE_ACL|ACE_DELETE|ACE_DELETE_CHILD|ACE_SYNCHRONIZE) 74 75 #define WRITE_MASK_DATA (ACE_WRITE_DATA|ACE_APPEND_DATA|ACE_WRITE_NAMED_ATTRS) 76 #define WRITE_MASK_ATTRS (ACE_WRITE_ACL|ACE_WRITE_OWNER|ACE_WRITE_ATTRIBUTES| \ 77 ACE_DELETE|ACE_DELETE_CHILD) 78 #define WRITE_MASK (WRITE_MASK_DATA|WRITE_MASK_ATTRS) 79 80 #define OGE_CLEAR (ACE_READ_DATA|ACE_LIST_DIRECTORY|ACE_WRITE_DATA| \ 81 ACE_ADD_FILE|ACE_APPEND_DATA|ACE_ADD_SUBDIRECTORY|ACE_EXECUTE) 82 83 #define OKAY_MASK_BITS (ACE_READ_DATA|ACE_LIST_DIRECTORY|ACE_WRITE_DATA| \ 84 ACE_ADD_FILE|ACE_APPEND_DATA|ACE_ADD_SUBDIRECTORY|ACE_EXECUTE) 85 86 #define ALL_INHERIT (ACE_FILE_INHERIT_ACE|ACE_DIRECTORY_INHERIT_ACE | \ 87 ACE_NO_PROPAGATE_INHERIT_ACE|ACE_INHERIT_ONLY_ACE|ACE_INHERITED_ACE) 88 89 #define RESTRICTED_CLEAR (ACE_WRITE_ACL|ACE_WRITE_OWNER) 90 91 #define V4_ACL_WIDE_FLAGS (ZFS_ACL_AUTO_INHERIT|ZFS_ACL_DEFAULTED|\ 92 ZFS_ACL_PROTECTED) 93 94 #define ZFS_ACL_WIDE_FLAGS (V4_ACL_WIDE_FLAGS|ZFS_ACL_TRIVIAL|ZFS_INHERIT_ACE|\ 95 ZFS_ACL_OBJ_ACE) 96 97 #define ALL_MODE_EXECS (S_IXUSR | S_IXGRP | S_IXOTH) 98 99 static uint16_t 100 zfs_ace_v0_get_type(void *acep) 101 { 102 return (((zfs_oldace_t *)acep)->z_type); 103 } 104 105 static uint16_t 106 zfs_ace_v0_get_flags(void *acep) 107 { 108 return (((zfs_oldace_t *)acep)->z_flags); 109 } 110 111 static uint32_t 112 zfs_ace_v0_get_mask(void *acep) 113 { 114 return (((zfs_oldace_t *)acep)->z_access_mask); 115 } 116 117 static uint64_t 118 zfs_ace_v0_get_who(void *acep) 119 { 120 return (((zfs_oldace_t *)acep)->z_fuid); 121 } 122 123 static void 124 zfs_ace_v0_set_type(void *acep, uint16_t type) 125 { 126 ((zfs_oldace_t *)acep)->z_type = type; 127 } 128 129 static void 130 zfs_ace_v0_set_flags(void *acep, uint16_t flags) 131 { 132 ((zfs_oldace_t *)acep)->z_flags = flags; 133 } 134 135 static void 136 zfs_ace_v0_set_mask(void *acep, uint32_t mask) 137 { 138 ((zfs_oldace_t *)acep)->z_access_mask = mask; 139 } 140 141 static void 142 zfs_ace_v0_set_who(void *acep, uint64_t who) 143 { 144 ((zfs_oldace_t *)acep)->z_fuid = who; 145 } 146 147 /*ARGSUSED*/ 148 static size_t 149 zfs_ace_v0_size(void *acep) 150 { 151 return (sizeof (zfs_oldace_t)); 152 } 153 154 static size_t 155 zfs_ace_v0_abstract_size(void) 156 { 157 return (sizeof (zfs_oldace_t)); 158 } 159 160 static int 161 zfs_ace_v0_mask_off(void) 162 { 163 return (offsetof(zfs_oldace_t, z_access_mask)); 164 } 165 166 /*ARGSUSED*/ 167 static int 168 zfs_ace_v0_data(void *acep, void **datap) 169 { 170 *datap = NULL; 171 return (0); 172 } 173 174 static acl_ops_t zfs_acl_v0_ops = { 175 zfs_ace_v0_get_mask, 176 zfs_ace_v0_set_mask, 177 zfs_ace_v0_get_flags, 178 zfs_ace_v0_set_flags, 179 zfs_ace_v0_get_type, 180 zfs_ace_v0_set_type, 181 zfs_ace_v0_get_who, 182 zfs_ace_v0_set_who, 183 zfs_ace_v0_size, 184 zfs_ace_v0_abstract_size, 185 zfs_ace_v0_mask_off, 186 zfs_ace_v0_data 187 }; 188 189 static uint16_t 190 zfs_ace_fuid_get_type(void *acep) 191 { 192 return (((zfs_ace_hdr_t *)acep)->z_type); 193 } 194 195 static uint16_t 196 zfs_ace_fuid_get_flags(void *acep) 197 { 198 return (((zfs_ace_hdr_t *)acep)->z_flags); 199 } 200 201 static uint32_t 202 zfs_ace_fuid_get_mask(void *acep) 203 { 204 return (((zfs_ace_hdr_t *)acep)->z_access_mask); 205 } 206 207 static uint64_t 208 zfs_ace_fuid_get_who(void *args) 209 { 210 uint16_t entry_type; 211 zfs_ace_t *acep = args; 212 213 entry_type = acep->z_hdr.z_flags & ACE_TYPE_FLAGS; 214 215 if (entry_type == ACE_OWNER || entry_type == OWNING_GROUP || 216 entry_type == ACE_EVERYONE) 217 return (-1); 218 return (((zfs_ace_t *)acep)->z_fuid); 219 } 220 221 static void 222 zfs_ace_fuid_set_type(void *acep, uint16_t type) 223 { 224 ((zfs_ace_hdr_t *)acep)->z_type = type; 225 } 226 227 static void 228 zfs_ace_fuid_set_flags(void *acep, uint16_t flags) 229 { 230 ((zfs_ace_hdr_t *)acep)->z_flags = flags; 231 } 232 233 static void 234 zfs_ace_fuid_set_mask(void *acep, uint32_t mask) 235 { 236 ((zfs_ace_hdr_t *)acep)->z_access_mask = mask; 237 } 238 239 static void 240 zfs_ace_fuid_set_who(void *arg, uint64_t who) 241 { 242 zfs_ace_t *acep = arg; 243 244 uint16_t entry_type = acep->z_hdr.z_flags & ACE_TYPE_FLAGS; 245 246 if (entry_type == ACE_OWNER || entry_type == OWNING_GROUP || 247 entry_type == ACE_EVERYONE) 248 return; 249 acep->z_fuid = who; 250 } 251 252 static size_t 253 zfs_ace_fuid_size(void *acep) 254 { 255 zfs_ace_hdr_t *zacep = acep; 256 uint16_t entry_type; 257 258 switch (zacep->z_type) { 259 case ACE_ACCESS_ALLOWED_OBJECT_ACE_TYPE: 260 case ACE_ACCESS_DENIED_OBJECT_ACE_TYPE: 261 case ACE_SYSTEM_AUDIT_OBJECT_ACE_TYPE: 262 case ACE_SYSTEM_ALARM_OBJECT_ACE_TYPE: 263 return (sizeof (zfs_object_ace_t)); 264 case ALLOW: 265 case DENY: 266 entry_type = 267 (((zfs_ace_hdr_t *)acep)->z_flags & ACE_TYPE_FLAGS); 268 if (entry_type == ACE_OWNER || 269 entry_type == OWNING_GROUP || 270 entry_type == ACE_EVERYONE) 271 return (sizeof (zfs_ace_hdr_t)); 272 /*FALLTHROUGH*/ 273 default: 274 return (sizeof (zfs_ace_t)); 275 } 276 } 277 278 static size_t 279 zfs_ace_fuid_abstract_size(void) 280 { 281 return (sizeof (zfs_ace_hdr_t)); 282 } 283 284 static int 285 zfs_ace_fuid_mask_off(void) 286 { 287 return (offsetof(zfs_ace_hdr_t, z_access_mask)); 288 } 289 290 static int 291 zfs_ace_fuid_data(void *acep, void **datap) 292 { 293 zfs_ace_t *zacep = acep; 294 zfs_object_ace_t *zobjp; 295 296 switch (zacep->z_hdr.z_type) { 297 case ACE_ACCESS_ALLOWED_OBJECT_ACE_TYPE: 298 case ACE_ACCESS_DENIED_OBJECT_ACE_TYPE: 299 case ACE_SYSTEM_AUDIT_OBJECT_ACE_TYPE: 300 case ACE_SYSTEM_ALARM_OBJECT_ACE_TYPE: 301 zobjp = acep; 302 *datap = (caddr_t)zobjp + sizeof (zfs_ace_t); 303 return (sizeof (zfs_object_ace_t) - sizeof (zfs_ace_t)); 304 default: 305 *datap = NULL; 306 return (0); 307 } 308 } 309 310 static acl_ops_t zfs_acl_fuid_ops = { 311 zfs_ace_fuid_get_mask, 312 zfs_ace_fuid_set_mask, 313 zfs_ace_fuid_get_flags, 314 zfs_ace_fuid_set_flags, 315 zfs_ace_fuid_get_type, 316 zfs_ace_fuid_set_type, 317 zfs_ace_fuid_get_who, 318 zfs_ace_fuid_set_who, 319 zfs_ace_fuid_size, 320 zfs_ace_fuid_abstract_size, 321 zfs_ace_fuid_mask_off, 322 zfs_ace_fuid_data 323 }; 324 325 /* 326 * The following three functions are provided for compatibility with 327 * older ZPL version in order to determine if the file use to have 328 * an external ACL and what version of ACL previously existed on the 329 * file. Would really be nice to not need this, sigh. 330 */ 331 uint64_t 332 zfs_external_acl(znode_t *zp) 333 { 334 zfs_acl_phys_t acl_phys; 335 int error; 336 337 if (zp->z_is_sa) 338 return (0); 339 340 /* 341 * Need to deal with a potential 342 * race where zfs_sa_upgrade could cause 343 * z_isa_sa to change. 344 * 345 * If the lookup fails then the state of z_is_sa should have 346 * changed. 347 */ 348 349 if ((error = sa_lookup(zp->z_sa_hdl, SA_ZPL_ZNODE_ACL(zp->z_zfsvfs), 350 &acl_phys, sizeof (acl_phys))) == 0) 351 return (acl_phys.z_acl_extern_obj); 352 else { 353 /* 354 * after upgrade the SA_ZPL_ZNODE_ACL should have been 355 * removed 356 */ 357 VERIFY(zp->z_is_sa && error == ENOENT); 358 return (0); 359 } 360 } 361 362 /* 363 * Determine size of ACL in bytes 364 * 365 * This is more complicated than it should be since we have to deal 366 * with old external ACLs. 367 */ 368 static int 369 zfs_acl_znode_info(znode_t *zp, int *aclsize, int *aclcount, 370 zfs_acl_phys_t *aclphys) 371 { 372 zfsvfs_t *zfsvfs = zp->z_zfsvfs; 373 uint64_t acl_count; 374 int size; 375 int error; 376 377 ASSERT(MUTEX_HELD(&zp->z_acl_lock)); 378 if (zp->z_is_sa) { 379 if ((error = sa_size(zp->z_sa_hdl, SA_ZPL_DACL_ACES(zfsvfs), 380 &size)) != 0) 381 return (error); 382 *aclsize = size; 383 if ((error = sa_lookup(zp->z_sa_hdl, SA_ZPL_DACL_COUNT(zfsvfs), 384 &acl_count, sizeof (acl_count))) != 0) 385 return (error); 386 *aclcount = acl_count; 387 } else { 388 if ((error = sa_lookup(zp->z_sa_hdl, SA_ZPL_ZNODE_ACL(zfsvfs), 389 aclphys, sizeof (*aclphys))) != 0) 390 return (error); 391 392 if (aclphys->z_acl_version == ZFS_ACL_VERSION_INITIAL) { 393 *aclsize = ZFS_ACL_SIZE(aclphys->z_acl_size); 394 *aclcount = aclphys->z_acl_size; 395 } else { 396 *aclsize = aclphys->z_acl_size; 397 *aclcount = aclphys->z_acl_count; 398 } 399 } 400 return (0); 401 } 402 403 int 404 zfs_znode_acl_version(znode_t *zp) 405 { 406 zfs_acl_phys_t acl_phys; 407 408 if (zp->z_is_sa) 409 return (ZFS_ACL_VERSION_FUID); 410 else { 411 int error; 412 413 /* 414 * Need to deal with a potential 415 * race where zfs_sa_upgrade could cause 416 * z_isa_sa to change. 417 * 418 * If the lookup fails then the state of z_is_sa should have 419 * changed. 420 */ 421 if ((error = sa_lookup(zp->z_sa_hdl, 422 SA_ZPL_ZNODE_ACL(zp->z_zfsvfs), 423 &acl_phys, sizeof (acl_phys))) == 0) 424 return (acl_phys.z_acl_version); 425 else { 426 /* 427 * After upgrade SA_ZPL_ZNODE_ACL should have 428 * been removed. 429 */ 430 VERIFY(zp->z_is_sa && error == ENOENT); 431 return (ZFS_ACL_VERSION_FUID); 432 } 433 } 434 } 435 436 static int 437 zfs_acl_version(int version) 438 { 439 if (version < ZPL_VERSION_FUID) 440 return (ZFS_ACL_VERSION_INITIAL); 441 else 442 return (ZFS_ACL_VERSION_FUID); 443 } 444 445 static int 446 zfs_acl_version_zp(znode_t *zp) 447 { 448 return (zfs_acl_version(zp->z_zfsvfs->z_version)); 449 } 450 451 zfs_acl_t * 452 zfs_acl_alloc(int vers) 453 { 454 zfs_acl_t *aclp; 455 456 aclp = kmem_zalloc(sizeof (zfs_acl_t), KM_SLEEP); 457 list_create(&aclp->z_acl, sizeof (zfs_acl_node_t), 458 offsetof(zfs_acl_node_t, z_next)); 459 aclp->z_version = vers; 460 if (vers == ZFS_ACL_VERSION_FUID) 461 aclp->z_ops = &zfs_acl_fuid_ops; 462 else 463 aclp->z_ops = &zfs_acl_v0_ops; 464 return (aclp); 465 } 466 467 zfs_acl_node_t * 468 zfs_acl_node_alloc(size_t bytes) 469 { 470 zfs_acl_node_t *aclnode; 471 472 aclnode = kmem_zalloc(sizeof (zfs_acl_node_t), KM_SLEEP); 473 if (bytes) { 474 aclnode->z_acldata = kmem_alloc(bytes, KM_SLEEP); 475 aclnode->z_allocdata = aclnode->z_acldata; 476 aclnode->z_allocsize = bytes; 477 aclnode->z_size = bytes; 478 } 479 480 return (aclnode); 481 } 482 483 static void 484 zfs_acl_node_free(zfs_acl_node_t *aclnode) 485 { 486 if (aclnode->z_allocsize) 487 kmem_free(aclnode->z_allocdata, aclnode->z_allocsize); 488 kmem_free(aclnode, sizeof (zfs_acl_node_t)); 489 } 490 491 static void 492 zfs_acl_release_nodes(zfs_acl_t *aclp) 493 { 494 zfs_acl_node_t *aclnode; 495 496 while ((aclnode = list_head(&aclp->z_acl))) { 497 list_remove(&aclp->z_acl, aclnode); 498 zfs_acl_node_free(aclnode); 499 } 500 aclp->z_acl_count = 0; 501 aclp->z_acl_bytes = 0; 502 } 503 504 void 505 zfs_acl_free(zfs_acl_t *aclp) 506 { 507 zfs_acl_release_nodes(aclp); 508 list_destroy(&aclp->z_acl); 509 kmem_free(aclp, sizeof (zfs_acl_t)); 510 } 511 512 static boolean_t 513 zfs_acl_valid_ace_type(uint_t type, uint_t flags) 514 { 515 uint16_t entry_type; 516 517 switch (type) { 518 case ALLOW: 519 case DENY: 520 case ACE_SYSTEM_AUDIT_ACE_TYPE: 521 case ACE_SYSTEM_ALARM_ACE_TYPE: 522 entry_type = flags & ACE_TYPE_FLAGS; 523 return (entry_type == ACE_OWNER || 524 entry_type == OWNING_GROUP || 525 entry_type == ACE_EVERYONE || entry_type == 0 || 526 entry_type == ACE_IDENTIFIER_GROUP); 527 default: 528 if (type >= MIN_ACE_TYPE && type <= MAX_ACE_TYPE) 529 return (B_TRUE); 530 } 531 return (B_FALSE); 532 } 533 534 static boolean_t 535 zfs_ace_valid(vtype_t obj_type, zfs_acl_t *aclp, uint16_t type, uint16_t iflags) 536 { 537 /* 538 * first check type of entry 539 */ 540 541 if (!zfs_acl_valid_ace_type(type, iflags)) 542 return (B_FALSE); 543 544 switch (type) { 545 case ACE_ACCESS_ALLOWED_OBJECT_ACE_TYPE: 546 case ACE_ACCESS_DENIED_OBJECT_ACE_TYPE: 547 case ACE_SYSTEM_AUDIT_OBJECT_ACE_TYPE: 548 case ACE_SYSTEM_ALARM_OBJECT_ACE_TYPE: 549 if (aclp->z_version < ZFS_ACL_VERSION_FUID) 550 return (B_FALSE); 551 aclp->z_hints |= ZFS_ACL_OBJ_ACE; 552 } 553 554 /* 555 * next check inheritance level flags 556 */ 557 558 if (obj_type == VDIR && 559 (iflags & (ACE_FILE_INHERIT_ACE|ACE_DIRECTORY_INHERIT_ACE))) 560 aclp->z_hints |= ZFS_INHERIT_ACE; 561 562 if (iflags & (ACE_INHERIT_ONLY_ACE|ACE_NO_PROPAGATE_INHERIT_ACE)) { 563 if ((iflags & (ACE_FILE_INHERIT_ACE| 564 ACE_DIRECTORY_INHERIT_ACE)) == 0) { 565 return (B_FALSE); 566 } 567 } 568 569 return (B_TRUE); 570 } 571 572 static void * 573 zfs_acl_next_ace(zfs_acl_t *aclp, void *start, uint64_t *who, 574 uint32_t *access_mask, uint16_t *iflags, uint16_t *type) 575 { 576 zfs_acl_node_t *aclnode; 577 578 ASSERT(aclp); 579 580 if (start == NULL) { 581 aclnode = list_head(&aclp->z_acl); 582 if (aclnode == NULL) 583 return (NULL); 584 585 aclp->z_next_ace = aclnode->z_acldata; 586 aclp->z_curr_node = aclnode; 587 aclnode->z_ace_idx = 0; 588 } 589 590 aclnode = aclp->z_curr_node; 591 592 if (aclnode == NULL) 593 return (NULL); 594 595 if (aclnode->z_ace_idx >= aclnode->z_ace_count) { 596 aclnode = list_next(&aclp->z_acl, aclnode); 597 if (aclnode == NULL) 598 return (NULL); 599 else { 600 aclp->z_curr_node = aclnode; 601 aclnode->z_ace_idx = 0; 602 aclp->z_next_ace = aclnode->z_acldata; 603 } 604 } 605 606 if (aclnode->z_ace_idx < aclnode->z_ace_count) { 607 void *acep = aclp->z_next_ace; 608 size_t ace_size; 609 610 /* 611 * Make sure we don't overstep our bounds 612 */ 613 ace_size = aclp->z_ops->ace_size(acep); 614 615 if (((caddr_t)acep + ace_size) > 616 ((caddr_t)aclnode->z_acldata + aclnode->z_size)) { 617 return (NULL); 618 } 619 620 *iflags = aclp->z_ops->ace_flags_get(acep); 621 *type = aclp->z_ops->ace_type_get(acep); 622 *access_mask = aclp->z_ops->ace_mask_get(acep); 623 *who = aclp->z_ops->ace_who_get(acep); 624 aclp->z_next_ace = (caddr_t)aclp->z_next_ace + ace_size; 625 aclnode->z_ace_idx++; 626 627 return ((void *)acep); 628 } 629 return (NULL); 630 } 631 632 /*ARGSUSED*/ 633 static uint64_t 634 zfs_ace_walk(void *datap, uint64_t cookie, int aclcnt, 635 uint16_t *flags, uint16_t *type, uint32_t *mask) 636 { 637 zfs_acl_t *aclp = datap; 638 zfs_ace_hdr_t *acep = (zfs_ace_hdr_t *)(uintptr_t)cookie; 639 uint64_t who; 640 641 acep = zfs_acl_next_ace(aclp, acep, &who, mask, 642 flags, type); 643 return ((uint64_t)(uintptr_t)acep); 644 } 645 646 /* 647 * Copy ACE to internal ZFS format. 648 * While processing the ACL each ACE will be validated for correctness. 649 * ACE FUIDs will be created later. 650 */ 651 static int 652 zfs_copy_ace_2_fuid(zfsvfs_t *zfsvfs, vtype_t obj_type, zfs_acl_t *aclp, 653 void *datap, zfs_ace_t *z_acl, uint64_t aclcnt, size_t *size, 654 zfs_fuid_info_t **fuidp, cred_t *cr) 655 { 656 int i; 657 uint16_t entry_type; 658 zfs_ace_t *aceptr = z_acl; 659 ace_t *acep = datap; 660 zfs_object_ace_t *zobjacep; 661 ace_object_t *aceobjp; 662 663 for (i = 0; i != aclcnt; i++) { 664 aceptr->z_hdr.z_access_mask = acep->a_access_mask; 665 aceptr->z_hdr.z_flags = acep->a_flags; 666 aceptr->z_hdr.z_type = acep->a_type; 667 entry_type = aceptr->z_hdr.z_flags & ACE_TYPE_FLAGS; 668 if (entry_type != ACE_OWNER && entry_type != OWNING_GROUP && 669 entry_type != ACE_EVERYONE) { 670 aceptr->z_fuid = zfs_fuid_create(zfsvfs, acep->a_who, 671 cr, (entry_type == 0) ? 672 ZFS_ACE_USER : ZFS_ACE_GROUP, fuidp); 673 } 674 675 /* 676 * Make sure ACE is valid 677 */ 678 if (zfs_ace_valid(obj_type, aclp, aceptr->z_hdr.z_type, 679 aceptr->z_hdr.z_flags) != B_TRUE) 680 return (SET_ERROR(EINVAL)); 681 682 switch (acep->a_type) { 683 case ACE_ACCESS_ALLOWED_OBJECT_ACE_TYPE: 684 case ACE_ACCESS_DENIED_OBJECT_ACE_TYPE: 685 case ACE_SYSTEM_AUDIT_OBJECT_ACE_TYPE: 686 case ACE_SYSTEM_ALARM_OBJECT_ACE_TYPE: 687 zobjacep = (zfs_object_ace_t *)aceptr; 688 aceobjp = (ace_object_t *)acep; 689 690 bcopy(aceobjp->a_obj_type, zobjacep->z_object_type, 691 sizeof (aceobjp->a_obj_type)); 692 bcopy(aceobjp->a_inherit_obj_type, 693 zobjacep->z_inherit_type, 694 sizeof (aceobjp->a_inherit_obj_type)); 695 acep = (ace_t *)((caddr_t)acep + sizeof (ace_object_t)); 696 break; 697 default: 698 acep = (ace_t *)((caddr_t)acep + sizeof (ace_t)); 699 } 700 701 aceptr = (zfs_ace_t *)((caddr_t)aceptr + 702 aclp->z_ops->ace_size(aceptr)); 703 } 704 705 *size = (caddr_t)aceptr - (caddr_t)z_acl; 706 707 return (0); 708 } 709 710 /* 711 * Copy ZFS ACEs to fixed size ace_t layout 712 */ 713 static void 714 zfs_copy_fuid_2_ace(zfsvfs_t *zfsvfs, zfs_acl_t *aclp, cred_t *cr, 715 void *datap, int filter) 716 { 717 uint64_t who; 718 uint32_t access_mask; 719 uint16_t iflags, type; 720 zfs_ace_hdr_t *zacep = NULL; 721 ace_t *acep = datap; 722 ace_object_t *objacep; 723 zfs_object_ace_t *zobjacep; 724 size_t ace_size; 725 uint16_t entry_type; 726 727 while ((zacep = zfs_acl_next_ace(aclp, zacep, 728 &who, &access_mask, &iflags, &type))) { 729 730 switch (type) { 731 case ACE_ACCESS_ALLOWED_OBJECT_ACE_TYPE: 732 case ACE_ACCESS_DENIED_OBJECT_ACE_TYPE: 733 case ACE_SYSTEM_AUDIT_OBJECT_ACE_TYPE: 734 case ACE_SYSTEM_ALARM_OBJECT_ACE_TYPE: 735 if (filter) { 736 continue; 737 } 738 zobjacep = (zfs_object_ace_t *)zacep; 739 objacep = (ace_object_t *)acep; 740 bcopy(zobjacep->z_object_type, 741 objacep->a_obj_type, 742 sizeof (zobjacep->z_object_type)); 743 bcopy(zobjacep->z_inherit_type, 744 objacep->a_inherit_obj_type, 745 sizeof (zobjacep->z_inherit_type)); 746 ace_size = sizeof (ace_object_t); 747 break; 748 default: 749 ace_size = sizeof (ace_t); 750 break; 751 } 752 753 entry_type = (iflags & ACE_TYPE_FLAGS); 754 if ((entry_type != ACE_OWNER && 755 entry_type != OWNING_GROUP && 756 entry_type != ACE_EVERYONE)) { 757 acep->a_who = zfs_fuid_map_id(zfsvfs, who, 758 cr, (entry_type & ACE_IDENTIFIER_GROUP) ? 759 ZFS_ACE_GROUP : ZFS_ACE_USER); 760 } else { 761 acep->a_who = (uid_t)(int64_t)who; 762 } 763 acep->a_access_mask = access_mask; 764 acep->a_flags = iflags; 765 acep->a_type = type; 766 acep = (ace_t *)((caddr_t)acep + ace_size); 767 } 768 } 769 770 static int 771 zfs_copy_ace_2_oldace(vtype_t obj_type, zfs_acl_t *aclp, ace_t *acep, 772 zfs_oldace_t *z_acl, int aclcnt, size_t *size) 773 { 774 int i; 775 zfs_oldace_t *aceptr = z_acl; 776 777 for (i = 0; i != aclcnt; i++, aceptr++) { 778 aceptr->z_access_mask = acep[i].a_access_mask; 779 aceptr->z_type = acep[i].a_type; 780 aceptr->z_flags = acep[i].a_flags; 781 aceptr->z_fuid = acep[i].a_who; 782 /* 783 * Make sure ACE is valid 784 */ 785 if (zfs_ace_valid(obj_type, aclp, aceptr->z_type, 786 aceptr->z_flags) != B_TRUE) 787 return (SET_ERROR(EINVAL)); 788 } 789 *size = (caddr_t)aceptr - (caddr_t)z_acl; 790 return (0); 791 } 792 793 /* 794 * convert old ACL format to new 795 */ 796 void 797 zfs_acl_xform(znode_t *zp, zfs_acl_t *aclp, cred_t *cr) 798 { 799 zfs_oldace_t *oldaclp; 800 int i; 801 uint16_t type, iflags; 802 uint32_t access_mask; 803 uint64_t who; 804 void *cookie = NULL; 805 zfs_acl_node_t *newaclnode; 806 807 ASSERT(aclp->z_version == ZFS_ACL_VERSION_INITIAL); 808 /* 809 * First create the ACE in a contiguous piece of memory 810 * for zfs_copy_ace_2_fuid(). 811 * 812 * We only convert an ACL once, so this won't happen 813 * everytime. 814 */ 815 oldaclp = kmem_alloc(sizeof (zfs_oldace_t) * aclp->z_acl_count, 816 KM_SLEEP); 817 i = 0; 818 while ((cookie = zfs_acl_next_ace(aclp, cookie, &who, 819 &access_mask, &iflags, &type))) { 820 oldaclp[i].z_flags = iflags; 821 oldaclp[i].z_type = type; 822 oldaclp[i].z_fuid = who; 823 oldaclp[i++].z_access_mask = access_mask; 824 } 825 826 newaclnode = zfs_acl_node_alloc(aclp->z_acl_count * 827 sizeof (zfs_object_ace_t)); 828 aclp->z_ops = &zfs_acl_fuid_ops; 829 VERIFY(zfs_copy_ace_2_fuid(zp->z_zfsvfs, ZTOV(zp)->v_type, aclp, 830 oldaclp, newaclnode->z_acldata, aclp->z_acl_count, 831 &newaclnode->z_size, NULL, cr) == 0); 832 newaclnode->z_ace_count = aclp->z_acl_count; 833 aclp->z_version = ZFS_ACL_VERSION; 834 kmem_free(oldaclp, aclp->z_acl_count * sizeof (zfs_oldace_t)); 835 836 /* 837 * Release all previous ACL nodes 838 */ 839 840 zfs_acl_release_nodes(aclp); 841 842 list_insert_head(&aclp->z_acl, newaclnode); 843 844 aclp->z_acl_bytes = newaclnode->z_size; 845 aclp->z_acl_count = newaclnode->z_ace_count; 846 847 } 848 849 /* 850 * Convert unix access mask to v4 access mask 851 */ 852 static uint32_t 853 zfs_unix_to_v4(uint32_t access_mask) 854 { 855 uint32_t new_mask = 0; 856 857 if (access_mask & S_IXOTH) 858 new_mask |= ACE_EXECUTE; 859 if (access_mask & S_IWOTH) 860 new_mask |= ACE_WRITE_DATA; 861 if (access_mask & S_IROTH) 862 new_mask |= ACE_READ_DATA; 863 return (new_mask); 864 } 865 866 static void 867 zfs_set_ace(zfs_acl_t *aclp, void *acep, uint32_t access_mask, 868 uint16_t access_type, uint64_t fuid, uint16_t entry_type) 869 { 870 uint16_t type = entry_type & ACE_TYPE_FLAGS; 871 872 aclp->z_ops->ace_mask_set(acep, access_mask); 873 aclp->z_ops->ace_type_set(acep, access_type); 874 aclp->z_ops->ace_flags_set(acep, entry_type); 875 if ((type != ACE_OWNER && type != OWNING_GROUP && 876 type != ACE_EVERYONE)) 877 aclp->z_ops->ace_who_set(acep, fuid); 878 } 879 880 /* 881 * Determine mode of file based on ACL. 882 */ 883 uint64_t 884 zfs_mode_compute(uint64_t fmode, zfs_acl_t *aclp, 885 uint64_t *pflags, uint64_t fuid, uint64_t fgid) 886 { 887 int entry_type; 888 mode_t mode; 889 mode_t seen = 0; 890 zfs_ace_hdr_t *acep = NULL; 891 uint64_t who; 892 uint16_t iflags, type; 893 uint32_t access_mask; 894 boolean_t an_exec_denied = B_FALSE; 895 896 mode = (fmode & (S_IFMT | S_ISUID | S_ISGID | S_ISVTX)); 897 898 while ((acep = zfs_acl_next_ace(aclp, acep, &who, 899 &access_mask, &iflags, &type))) { 900 901 if (!zfs_acl_valid_ace_type(type, iflags)) 902 continue; 903 904 entry_type = (iflags & ACE_TYPE_FLAGS); 905 906 /* 907 * Skip over any inherit_only ACEs 908 */ 909 if (iflags & ACE_INHERIT_ONLY_ACE) 910 continue; 911 912 if (entry_type == ACE_OWNER || (entry_type == 0 && 913 who == fuid)) { 914 if ((access_mask & ACE_READ_DATA) && 915 (!(seen & S_IRUSR))) { 916 seen |= S_IRUSR; 917 if (type == ALLOW) { 918 mode |= S_IRUSR; 919 } 920 } 921 if ((access_mask & ACE_WRITE_DATA) && 922 (!(seen & S_IWUSR))) { 923 seen |= S_IWUSR; 924 if (type == ALLOW) { 925 mode |= S_IWUSR; 926 } 927 } 928 if ((access_mask & ACE_EXECUTE) && 929 (!(seen & S_IXUSR))) { 930 seen |= S_IXUSR; 931 if (type == ALLOW) { 932 mode |= S_IXUSR; 933 } 934 } 935 } else if (entry_type == OWNING_GROUP || 936 (entry_type == ACE_IDENTIFIER_GROUP && who == fgid)) { 937 if ((access_mask & ACE_READ_DATA) && 938 (!(seen & S_IRGRP))) { 939 seen |= S_IRGRP; 940 if (type == ALLOW) { 941 mode |= S_IRGRP; 942 } 943 } 944 if ((access_mask & ACE_WRITE_DATA) && 945 (!(seen & S_IWGRP))) { 946 seen |= S_IWGRP; 947 if (type == ALLOW) { 948 mode |= S_IWGRP; 949 } 950 } 951 if ((access_mask & ACE_EXECUTE) && 952 (!(seen & S_IXGRP))) { 953 seen |= S_IXGRP; 954 if (type == ALLOW) { 955 mode |= S_IXGRP; 956 } 957 } 958 } else if (entry_type == ACE_EVERYONE) { 959 if ((access_mask & ACE_READ_DATA)) { 960 if (!(seen & S_IRUSR)) { 961 seen |= S_IRUSR; 962 if (type == ALLOW) { 963 mode |= S_IRUSR; 964 } 965 } 966 if (!(seen & S_IRGRP)) { 967 seen |= S_IRGRP; 968 if (type == ALLOW) { 969 mode |= S_IRGRP; 970 } 971 } 972 if (!(seen & S_IROTH)) { 973 seen |= S_IROTH; 974 if (type == ALLOW) { 975 mode |= S_IROTH; 976 } 977 } 978 } 979 if ((access_mask & ACE_WRITE_DATA)) { 980 if (!(seen & S_IWUSR)) { 981 seen |= S_IWUSR; 982 if (type == ALLOW) { 983 mode |= S_IWUSR; 984 } 985 } 986 if (!(seen & S_IWGRP)) { 987 seen |= S_IWGRP; 988 if (type == ALLOW) { 989 mode |= S_IWGRP; 990 } 991 } 992 if (!(seen & S_IWOTH)) { 993 seen |= S_IWOTH; 994 if (type == ALLOW) { 995 mode |= S_IWOTH; 996 } 997 } 998 } 999 if ((access_mask & ACE_EXECUTE)) { 1000 if (!(seen & S_IXUSR)) { 1001 seen |= S_IXUSR; 1002 if (type == ALLOW) { 1003 mode |= S_IXUSR; 1004 } 1005 } 1006 if (!(seen & S_IXGRP)) { 1007 seen |= S_IXGRP; 1008 if (type == ALLOW) { 1009 mode |= S_IXGRP; 1010 } 1011 } 1012 if (!(seen & S_IXOTH)) { 1013 seen |= S_IXOTH; 1014 if (type == ALLOW) { 1015 mode |= S_IXOTH; 1016 } 1017 } 1018 } 1019 } else { 1020 /* 1021 * Only care if this IDENTIFIER_GROUP or 1022 * USER ACE denies execute access to someone, 1023 * mode is not affected 1024 */ 1025 if ((access_mask & ACE_EXECUTE) && type == DENY) 1026 an_exec_denied = B_TRUE; 1027 } 1028 } 1029 1030 /* 1031 * Failure to allow is effectively a deny, so execute permission 1032 * is denied if it was never mentioned or if we explicitly 1033 * weren't allowed it. 1034 */ 1035 if (!an_exec_denied && 1036 ((seen & ALL_MODE_EXECS) != ALL_MODE_EXECS || 1037 (mode & ALL_MODE_EXECS) != ALL_MODE_EXECS)) 1038 an_exec_denied = B_TRUE; 1039 1040 if (an_exec_denied) 1041 *pflags &= ~ZFS_NO_EXECS_DENIED; 1042 else 1043 *pflags |= ZFS_NO_EXECS_DENIED; 1044 1045 return (mode); 1046 } 1047 1048 /* 1049 * Read an external acl object. If the intent is to modify, always 1050 * create a new acl and leave any cached acl in place. 1051 */ 1052 int 1053 zfs_acl_node_read(znode_t *zp, boolean_t have_lock, zfs_acl_t **aclpp, 1054 boolean_t will_modify) 1055 { 1056 zfs_acl_t *aclp; 1057 int aclsize; 1058 int acl_count; 1059 zfs_acl_node_t *aclnode; 1060 zfs_acl_phys_t znode_acl; 1061 int version; 1062 int error; 1063 1064 ASSERT(MUTEX_HELD(&zp->z_acl_lock)); 1065 if (zp->z_zfsvfs->z_replay == B_FALSE) 1066 ASSERT_VOP_LOCKED(ZTOV(zp), __func__); 1067 1068 if (zp->z_acl_cached && !will_modify) { 1069 *aclpp = zp->z_acl_cached; 1070 return (0); 1071 } 1072 1073 version = zfs_znode_acl_version(zp); 1074 1075 if ((error = zfs_acl_znode_info(zp, &aclsize, 1076 &acl_count, &znode_acl)) != 0) { 1077 goto done; 1078 } 1079 1080 aclp = zfs_acl_alloc(version); 1081 1082 aclp->z_acl_count = acl_count; 1083 aclp->z_acl_bytes = aclsize; 1084 1085 aclnode = zfs_acl_node_alloc(aclsize); 1086 aclnode->z_ace_count = aclp->z_acl_count; 1087 aclnode->z_size = aclsize; 1088 1089 if (!zp->z_is_sa) { 1090 if (znode_acl.z_acl_extern_obj) { 1091 error = dmu_read(zp->z_zfsvfs->z_os, 1092 znode_acl.z_acl_extern_obj, 0, aclnode->z_size, 1093 aclnode->z_acldata, DMU_READ_PREFETCH); 1094 } else { 1095 bcopy(znode_acl.z_ace_data, aclnode->z_acldata, 1096 aclnode->z_size); 1097 } 1098 } else { 1099 error = sa_lookup(zp->z_sa_hdl, SA_ZPL_DACL_ACES(zp->z_zfsvfs), 1100 aclnode->z_acldata, aclnode->z_size); 1101 } 1102 1103 if (error != 0) { 1104 zfs_acl_free(aclp); 1105 zfs_acl_node_free(aclnode); 1106 /* convert checksum errors into IO errors */ 1107 if (error == ECKSUM) 1108 error = SET_ERROR(EIO); 1109 goto done; 1110 } 1111 1112 list_insert_head(&aclp->z_acl, aclnode); 1113 1114 *aclpp = aclp; 1115 if (!will_modify) 1116 zp->z_acl_cached = aclp; 1117 done: 1118 return (error); 1119 } 1120 1121 /*ARGSUSED*/ 1122 void 1123 zfs_acl_data_locator(void **dataptr, uint32_t *length, uint32_t buflen, 1124 boolean_t start, void *userdata) 1125 { 1126 zfs_acl_locator_cb_t *cb = (zfs_acl_locator_cb_t *)userdata; 1127 1128 if (start) { 1129 cb->cb_acl_node = list_head(&cb->cb_aclp->z_acl); 1130 } else { 1131 cb->cb_acl_node = list_next(&cb->cb_aclp->z_acl, 1132 cb->cb_acl_node); 1133 } 1134 *dataptr = cb->cb_acl_node->z_acldata; 1135 *length = cb->cb_acl_node->z_size; 1136 } 1137 1138 int 1139 zfs_acl_chown_setattr(znode_t *zp) 1140 { 1141 int error; 1142 zfs_acl_t *aclp; 1143 1144 if (zp->z_zfsvfs->z_replay == B_FALSE) { 1145 ASSERT_VOP_ELOCKED(ZTOV(zp), __func__); 1146 ASSERT_VOP_IN_SEQC(ZTOV(zp)); 1147 } 1148 ASSERT(MUTEX_HELD(&zp->z_acl_lock)); 1149 1150 if ((error = zfs_acl_node_read(zp, B_TRUE, &aclp, B_FALSE)) == 0) 1151 zp->z_mode = zfs_mode_compute(zp->z_mode, aclp, 1152 &zp->z_pflags, zp->z_uid, zp->z_gid); 1153 return (error); 1154 } 1155 1156 /* 1157 * common code for setting ACLs. 1158 * 1159 * This function is called from zfs_mode_update, zfs_perm_init, and zfs_setacl. 1160 * zfs_setacl passes a non-NULL inherit pointer (ihp) to indicate that it's 1161 * already checked the acl and knows whether to inherit. 1162 */ 1163 int 1164 zfs_aclset_common(znode_t *zp, zfs_acl_t *aclp, cred_t *cr, dmu_tx_t *tx) 1165 { 1166 int error; 1167 zfsvfs_t *zfsvfs = zp->z_zfsvfs; 1168 dmu_object_type_t otype; 1169 zfs_acl_locator_cb_t locate = { 0 }; 1170 uint64_t mode; 1171 sa_bulk_attr_t bulk[5]; 1172 uint64_t ctime[2]; 1173 int count = 0; 1174 zfs_acl_phys_t acl_phys; 1175 1176 if (zp->z_zfsvfs->z_replay == B_FALSE) { 1177 ASSERT_VOP_IN_SEQC(ZTOV(zp)); 1178 } 1179 1180 mode = zp->z_mode; 1181 1182 mode = zfs_mode_compute(mode, aclp, &zp->z_pflags, 1183 zp->z_uid, zp->z_gid); 1184 1185 zp->z_mode = mode; 1186 SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_MODE(zfsvfs), NULL, 1187 &mode, sizeof (mode)); 1188 SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_FLAGS(zfsvfs), NULL, 1189 &zp->z_pflags, sizeof (zp->z_pflags)); 1190 SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_CTIME(zfsvfs), NULL, 1191 &ctime, sizeof (ctime)); 1192 1193 if (zp->z_acl_cached) { 1194 zfs_acl_free(zp->z_acl_cached); 1195 zp->z_acl_cached = NULL; 1196 } 1197 1198 /* 1199 * Upgrade needed? 1200 */ 1201 if (!zfsvfs->z_use_fuids) { 1202 otype = DMU_OT_OLDACL; 1203 } else { 1204 if ((aclp->z_version == ZFS_ACL_VERSION_INITIAL) && 1205 (zfsvfs->z_version >= ZPL_VERSION_FUID)) 1206 zfs_acl_xform(zp, aclp, cr); 1207 ASSERT(aclp->z_version >= ZFS_ACL_VERSION_FUID); 1208 otype = DMU_OT_ACL; 1209 } 1210 1211 /* 1212 * Arrgh, we have to handle old on disk format 1213 * as well as newer (preferred) SA format. 1214 */ 1215 1216 if (zp->z_is_sa) { /* the easy case, just update the ACL attribute */ 1217 locate.cb_aclp = aclp; 1218 SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_DACL_ACES(zfsvfs), 1219 zfs_acl_data_locator, &locate, aclp->z_acl_bytes); 1220 SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_DACL_COUNT(zfsvfs), 1221 NULL, &aclp->z_acl_count, sizeof (uint64_t)); 1222 } else { /* Painful legacy way */ 1223 zfs_acl_node_t *aclnode; 1224 uint64_t off = 0; 1225 uint64_t aoid; 1226 1227 if ((error = sa_lookup(zp->z_sa_hdl, SA_ZPL_ZNODE_ACL(zfsvfs), 1228 &acl_phys, sizeof (acl_phys))) != 0) 1229 return (error); 1230 1231 aoid = acl_phys.z_acl_extern_obj; 1232 1233 if (aclp->z_acl_bytes > ZFS_ACE_SPACE) { 1234 /* 1235 * If ACL was previously external and we are now 1236 * converting to new ACL format then release old 1237 * ACL object and create a new one. 1238 */ 1239 if (aoid && 1240 aclp->z_version != acl_phys.z_acl_version) { 1241 error = dmu_object_free(zfsvfs->z_os, aoid, tx); 1242 if (error) 1243 return (error); 1244 aoid = 0; 1245 } 1246 if (aoid == 0) { 1247 aoid = dmu_object_alloc(zfsvfs->z_os, 1248 otype, aclp->z_acl_bytes, 1249 otype == DMU_OT_ACL ? 1250 DMU_OT_SYSACL : DMU_OT_NONE, 1251 otype == DMU_OT_ACL ? 1252 DN_OLD_MAX_BONUSLEN : 0, tx); 1253 } else { 1254 (void) dmu_object_set_blocksize(zfsvfs->z_os, 1255 aoid, aclp->z_acl_bytes, 0, tx); 1256 } 1257 acl_phys.z_acl_extern_obj = aoid; 1258 for (aclnode = list_head(&aclp->z_acl); aclnode; 1259 aclnode = list_next(&aclp->z_acl, aclnode)) { 1260 if (aclnode->z_ace_count == 0) 1261 continue; 1262 dmu_write(zfsvfs->z_os, aoid, off, 1263 aclnode->z_size, aclnode->z_acldata, tx); 1264 off += aclnode->z_size; 1265 } 1266 } else { 1267 void *start = acl_phys.z_ace_data; 1268 /* 1269 * Migrating back embedded? 1270 */ 1271 if (acl_phys.z_acl_extern_obj) { 1272 error = dmu_object_free(zfsvfs->z_os, 1273 acl_phys.z_acl_extern_obj, tx); 1274 if (error) 1275 return (error); 1276 acl_phys.z_acl_extern_obj = 0; 1277 } 1278 1279 for (aclnode = list_head(&aclp->z_acl); aclnode; 1280 aclnode = list_next(&aclp->z_acl, aclnode)) { 1281 if (aclnode->z_ace_count == 0) 1282 continue; 1283 bcopy(aclnode->z_acldata, start, 1284 aclnode->z_size); 1285 start = (caddr_t)start + aclnode->z_size; 1286 } 1287 } 1288 /* 1289 * If Old version then swap count/bytes to match old 1290 * layout of znode_acl_phys_t. 1291 */ 1292 if (aclp->z_version == ZFS_ACL_VERSION_INITIAL) { 1293 acl_phys.z_acl_size = aclp->z_acl_count; 1294 acl_phys.z_acl_count = aclp->z_acl_bytes; 1295 } else { 1296 acl_phys.z_acl_size = aclp->z_acl_bytes; 1297 acl_phys.z_acl_count = aclp->z_acl_count; 1298 } 1299 acl_phys.z_acl_version = aclp->z_version; 1300 1301 SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_ZNODE_ACL(zfsvfs), NULL, 1302 &acl_phys, sizeof (acl_phys)); 1303 } 1304 1305 /* 1306 * Replace ACL wide bits, but first clear them. 1307 */ 1308 zp->z_pflags &= ~ZFS_ACL_WIDE_FLAGS; 1309 1310 zp->z_pflags |= aclp->z_hints; 1311 1312 if (ace_trivial_common(aclp, 0, zfs_ace_walk) == 0) 1313 zp->z_pflags |= ZFS_ACL_TRIVIAL; 1314 1315 zfs_tstamp_update_setup(zp, STATE_CHANGED, NULL, ctime); 1316 return (sa_bulk_update(zp->z_sa_hdl, bulk, count, tx)); 1317 } 1318 1319 static void 1320 zfs_acl_chmod(vtype_t vtype, uint64_t mode, boolean_t split, boolean_t trim, 1321 zfs_acl_t *aclp) 1322 { 1323 void *acep = NULL; 1324 uint64_t who; 1325 int new_count, new_bytes; 1326 int ace_size; 1327 int entry_type; 1328 uint16_t iflags, type; 1329 uint32_t access_mask; 1330 zfs_acl_node_t *newnode; 1331 size_t abstract_size = aclp->z_ops->ace_abstract_size(); 1332 void *zacep; 1333 boolean_t isdir; 1334 trivial_acl_t masks; 1335 1336 new_count = new_bytes = 0; 1337 1338 isdir = (vtype == VDIR); 1339 1340 acl_trivial_access_masks((mode_t)mode, isdir, &masks); 1341 1342 newnode = zfs_acl_node_alloc((abstract_size * 6) + aclp->z_acl_bytes); 1343 1344 zacep = newnode->z_acldata; 1345 if (masks.allow0) { 1346 zfs_set_ace(aclp, zacep, masks.allow0, ALLOW, -1, ACE_OWNER); 1347 zacep = (void *)((uintptr_t)zacep + abstract_size); 1348 new_count++; 1349 new_bytes += abstract_size; 1350 } 1351 if (masks.deny1) { 1352 zfs_set_ace(aclp, zacep, masks.deny1, DENY, -1, ACE_OWNER); 1353 zacep = (void *)((uintptr_t)zacep + abstract_size); 1354 new_count++; 1355 new_bytes += abstract_size; 1356 } 1357 if (masks.deny2) { 1358 zfs_set_ace(aclp, zacep, masks.deny2, DENY, -1, OWNING_GROUP); 1359 zacep = (void *)((uintptr_t)zacep + abstract_size); 1360 new_count++; 1361 new_bytes += abstract_size; 1362 } 1363 1364 while ((acep = zfs_acl_next_ace(aclp, acep, &who, &access_mask, 1365 &iflags, &type))) { 1366 entry_type = (iflags & ACE_TYPE_FLAGS); 1367 /* 1368 * ACEs used to represent the file mode may be divided 1369 * into an equivalent pair of inherit-only and regular 1370 * ACEs, if they are inheritable. 1371 * Skip regular ACEs, which are replaced by the new mode. 1372 */ 1373 if (split && (entry_type == ACE_OWNER || 1374 entry_type == OWNING_GROUP || 1375 entry_type == ACE_EVERYONE)) { 1376 if (!isdir || !(iflags & 1377 (ACE_FILE_INHERIT_ACE|ACE_DIRECTORY_INHERIT_ACE))) 1378 continue; 1379 /* 1380 * We preserve owner@, group@, or @everyone 1381 * permissions, if they are inheritable, by 1382 * copying them to inherit_only ACEs. This 1383 * prevents inheritable permissions from being 1384 * altered along with the file mode. 1385 */ 1386 iflags |= ACE_INHERIT_ONLY_ACE; 1387 } 1388 1389 /* 1390 * If this ACL has any inheritable ACEs, mark that in 1391 * the hints (which are later masked into the pflags) 1392 * so create knows to do inheritance. 1393 */ 1394 if (isdir && (iflags & 1395 (ACE_FILE_INHERIT_ACE|ACE_DIRECTORY_INHERIT_ACE))) 1396 aclp->z_hints |= ZFS_INHERIT_ACE; 1397 1398 if ((type != ALLOW && type != DENY) || 1399 (iflags & ACE_INHERIT_ONLY_ACE)) { 1400 switch (type) { 1401 case ACE_ACCESS_ALLOWED_OBJECT_ACE_TYPE: 1402 case ACE_ACCESS_DENIED_OBJECT_ACE_TYPE: 1403 case ACE_SYSTEM_AUDIT_OBJECT_ACE_TYPE: 1404 case ACE_SYSTEM_ALARM_OBJECT_ACE_TYPE: 1405 aclp->z_hints |= ZFS_ACL_OBJ_ACE; 1406 break; 1407 } 1408 } else { 1409 /* 1410 * Limit permissions granted by ACEs to be no greater 1411 * than permissions of the requested group mode. 1412 * Applies when the "aclmode" property is set to 1413 * "groupmask". 1414 */ 1415 if ((type == ALLOW) && trim) 1416 access_mask &= masks.group; 1417 } 1418 zfs_set_ace(aclp, zacep, access_mask, type, who, iflags); 1419 ace_size = aclp->z_ops->ace_size(acep); 1420 zacep = (void *)((uintptr_t)zacep + ace_size); 1421 new_count++; 1422 new_bytes += ace_size; 1423 } 1424 zfs_set_ace(aclp, zacep, masks.owner, ALLOW, -1, ACE_OWNER); 1425 zacep = (void *)((uintptr_t)zacep + abstract_size); 1426 zfs_set_ace(aclp, zacep, masks.group, ALLOW, -1, OWNING_GROUP); 1427 zacep = (void *)((uintptr_t)zacep + abstract_size); 1428 zfs_set_ace(aclp, zacep, masks.everyone, ALLOW, -1, ACE_EVERYONE); 1429 1430 new_count += 3; 1431 new_bytes += abstract_size * 3; 1432 zfs_acl_release_nodes(aclp); 1433 aclp->z_acl_count = new_count; 1434 aclp->z_acl_bytes = new_bytes; 1435 newnode->z_ace_count = new_count; 1436 newnode->z_size = new_bytes; 1437 list_insert_tail(&aclp->z_acl, newnode); 1438 } 1439 1440 int 1441 zfs_acl_chmod_setattr(znode_t *zp, zfs_acl_t **aclp, uint64_t mode) 1442 { 1443 int error = 0; 1444 1445 mutex_enter(&zp->z_acl_lock); 1446 if (zp->z_zfsvfs->z_replay == B_FALSE) 1447 ASSERT_VOP_ELOCKED(ZTOV(zp), __func__); 1448 if (zp->z_zfsvfs->z_acl_mode == ZFS_ACL_DISCARD) 1449 *aclp = zfs_acl_alloc(zfs_acl_version_zp(zp)); 1450 else 1451 error = zfs_acl_node_read(zp, B_TRUE, aclp, B_TRUE); 1452 1453 if (error == 0) { 1454 (*aclp)->z_hints = zp->z_pflags & V4_ACL_WIDE_FLAGS; 1455 zfs_acl_chmod(ZTOV(zp)->v_type, mode, B_TRUE, 1456 (zp->z_zfsvfs->z_acl_mode == ZFS_ACL_GROUPMASK), *aclp); 1457 } 1458 mutex_exit(&zp->z_acl_lock); 1459 1460 return (error); 1461 } 1462 1463 /* 1464 * Should ACE be inherited? 1465 */ 1466 static int 1467 zfs_ace_can_use(vtype_t vtype, uint16_t acep_flags) 1468 { 1469 int iflags = (acep_flags & 0xf); 1470 1471 if ((vtype == VDIR) && (iflags & ACE_DIRECTORY_INHERIT_ACE)) 1472 return (1); 1473 else if (iflags & ACE_FILE_INHERIT_ACE) 1474 return (!((vtype == VDIR) && 1475 (iflags & ACE_NO_PROPAGATE_INHERIT_ACE))); 1476 return (0); 1477 } 1478 1479 /* 1480 * inherit inheritable ACEs from parent 1481 */ 1482 static zfs_acl_t * 1483 zfs_acl_inherit(zfsvfs_t *zfsvfs, vtype_t vtype, zfs_acl_t *paclp, 1484 uint64_t mode, boolean_t *need_chmod) 1485 { 1486 void *pacep = NULL; 1487 void *acep; 1488 zfs_acl_node_t *aclnode; 1489 zfs_acl_t *aclp = NULL; 1490 uint64_t who; 1491 uint32_t access_mask; 1492 uint16_t iflags, newflags, type; 1493 size_t ace_size; 1494 void *data1, *data2; 1495 size_t data1sz, data2sz; 1496 uint_t aclinherit; 1497 boolean_t isdir = (vtype == VDIR); 1498 boolean_t isreg = (vtype == VREG); 1499 1500 *need_chmod = B_TRUE; 1501 1502 aclp = zfs_acl_alloc(paclp->z_version); 1503 aclinherit = zfsvfs->z_acl_inherit; 1504 if (aclinherit == ZFS_ACL_DISCARD || vtype == VLNK) 1505 return (aclp); 1506 1507 while ((pacep = zfs_acl_next_ace(paclp, pacep, &who, 1508 &access_mask, &iflags, &type))) { 1509 1510 /* 1511 * don't inherit bogus ACEs 1512 */ 1513 if (!zfs_acl_valid_ace_type(type, iflags)) 1514 continue; 1515 1516 /* 1517 * Check if ACE is inheritable by this vnode 1518 */ 1519 if ((aclinherit == ZFS_ACL_NOALLOW && type == ALLOW) || 1520 !zfs_ace_can_use(vtype, iflags)) 1521 continue; 1522 1523 /* 1524 * If owner@, group@, or everyone@ inheritable 1525 * then zfs_acl_chmod() isn't needed. 1526 */ 1527 if ((aclinherit == ZFS_ACL_PASSTHROUGH || 1528 aclinherit == ZFS_ACL_PASSTHROUGH_X) && 1529 ((iflags & (ACE_OWNER|ACE_EVERYONE)) || 1530 ((iflags & OWNING_GROUP) == OWNING_GROUP)) && 1531 (isreg || (isdir && (iflags & ACE_DIRECTORY_INHERIT_ACE)))) 1532 *need_chmod = B_FALSE; 1533 1534 /* 1535 * Strip inherited execute permission from file if 1536 * not in mode 1537 */ 1538 if (aclinherit == ZFS_ACL_PASSTHROUGH_X && type == ALLOW && 1539 !isdir && ((mode & (S_IXUSR|S_IXGRP|S_IXOTH)) == 0)) { 1540 access_mask &= ~ACE_EXECUTE; 1541 } 1542 1543 /* 1544 * Strip write_acl and write_owner from permissions 1545 * when inheriting an ACE 1546 */ 1547 if (aclinherit == ZFS_ACL_RESTRICTED && type == ALLOW) { 1548 access_mask &= ~RESTRICTED_CLEAR; 1549 } 1550 1551 ace_size = aclp->z_ops->ace_size(pacep); 1552 aclnode = zfs_acl_node_alloc(ace_size); 1553 list_insert_tail(&aclp->z_acl, aclnode); 1554 acep = aclnode->z_acldata; 1555 1556 zfs_set_ace(aclp, acep, access_mask, type, 1557 who, iflags|ACE_INHERITED_ACE); 1558 1559 /* 1560 * Copy special opaque data if any 1561 */ 1562 if ((data1sz = paclp->z_ops->ace_data(pacep, &data1)) != 0) { 1563 VERIFY((data2sz = aclp->z_ops->ace_data(acep, 1564 &data2)) == data1sz); 1565 bcopy(data1, data2, data2sz); 1566 } 1567 1568 aclp->z_acl_count++; 1569 aclnode->z_ace_count++; 1570 aclp->z_acl_bytes += aclnode->z_size; 1571 newflags = aclp->z_ops->ace_flags_get(acep); 1572 1573 /* 1574 * If ACE is not to be inherited further, or if the vnode is 1575 * not a directory, remove all inheritance flags 1576 */ 1577 if (!isdir || (iflags & ACE_NO_PROPAGATE_INHERIT_ACE)) { 1578 newflags &= ~ALL_INHERIT; 1579 aclp->z_ops->ace_flags_set(acep, 1580 newflags|ACE_INHERITED_ACE); 1581 continue; 1582 } 1583 1584 /* 1585 * This directory has an inheritable ACE 1586 */ 1587 aclp->z_hints |= ZFS_INHERIT_ACE; 1588 1589 /* 1590 * If only FILE_INHERIT is set then turn on 1591 * inherit_only 1592 */ 1593 if ((iflags & (ACE_FILE_INHERIT_ACE | 1594 ACE_DIRECTORY_INHERIT_ACE)) == ACE_FILE_INHERIT_ACE) { 1595 newflags |= ACE_INHERIT_ONLY_ACE; 1596 aclp->z_ops->ace_flags_set(acep, 1597 newflags|ACE_INHERITED_ACE); 1598 } else { 1599 newflags &= ~ACE_INHERIT_ONLY_ACE; 1600 aclp->z_ops->ace_flags_set(acep, 1601 newflags|ACE_INHERITED_ACE); 1602 } 1603 } 1604 if (zfsvfs->z_acl_mode == ZFS_ACL_RESTRICTED && 1605 aclp->z_acl_count != 0) { 1606 *need_chmod = B_FALSE; 1607 } 1608 1609 return (aclp); 1610 } 1611 1612 /* 1613 * Create file system object initial permissions 1614 * including inheritable ACEs. 1615 * Also, create FUIDs for owner and group. 1616 */ 1617 int 1618 zfs_acl_ids_create(znode_t *dzp, int flag, vattr_t *vap, cred_t *cr, 1619 vsecattr_t *vsecp, zfs_acl_ids_t *acl_ids) 1620 { 1621 int error; 1622 zfsvfs_t *zfsvfs = dzp->z_zfsvfs; 1623 zfs_acl_t *paclp; 1624 gid_t gid; 1625 boolean_t need_chmod = B_TRUE; 1626 boolean_t trim = B_FALSE; 1627 boolean_t inherited = B_FALSE; 1628 1629 if ((flag & IS_ROOT_NODE) == 0) { 1630 if (zfsvfs->z_replay == B_FALSE) 1631 ASSERT_VOP_ELOCKED(ZTOV(dzp), __func__); 1632 } else 1633 ASSERT(dzp->z_vnode == NULL); 1634 bzero(acl_ids, sizeof (zfs_acl_ids_t)); 1635 acl_ids->z_mode = MAKEIMODE(vap->va_type, vap->va_mode); 1636 1637 if (vsecp) 1638 if ((error = zfs_vsec_2_aclp(zfsvfs, vap->va_type, vsecp, cr, 1639 &acl_ids->z_fuidp, &acl_ids->z_aclp)) != 0) 1640 return (error); 1641 /* 1642 * Determine uid and gid. 1643 */ 1644 if ((flag & IS_ROOT_NODE) || zfsvfs->z_replay || 1645 ((flag & IS_XATTR) && (vap->va_type == VDIR))) { 1646 acl_ids->z_fuid = zfs_fuid_create(zfsvfs, 1647 (uint64_t)vap->va_uid, cr, 1648 ZFS_OWNER, &acl_ids->z_fuidp); 1649 acl_ids->z_fgid = zfs_fuid_create(zfsvfs, 1650 (uint64_t)vap->va_gid, cr, 1651 ZFS_GROUP, &acl_ids->z_fuidp); 1652 gid = vap->va_gid; 1653 } else { 1654 acl_ids->z_fuid = zfs_fuid_create_cred(zfsvfs, ZFS_OWNER, 1655 cr, &acl_ids->z_fuidp); 1656 acl_ids->z_fgid = 0; 1657 if (vap->va_mask & AT_GID) { 1658 acl_ids->z_fgid = zfs_fuid_create(zfsvfs, 1659 (uint64_t)vap->va_gid, 1660 cr, ZFS_GROUP, &acl_ids->z_fuidp); 1661 gid = vap->va_gid; 1662 if (acl_ids->z_fgid != dzp->z_gid && 1663 !groupmember(vap->va_gid, cr) && 1664 secpolicy_vnode_create_gid(cr) != 0) 1665 acl_ids->z_fgid = 0; 1666 } 1667 if (acl_ids->z_fgid == 0) { 1668 char *domain; 1669 uint32_t rid; 1670 1671 acl_ids->z_fgid = dzp->z_gid; 1672 gid = zfs_fuid_map_id(zfsvfs, acl_ids->z_fgid, 1673 cr, ZFS_GROUP); 1674 1675 if (zfsvfs->z_use_fuids && 1676 IS_EPHEMERAL(acl_ids->z_fgid)) { 1677 domain = 1678 zfs_fuid_idx_domain(&zfsvfs->z_fuid_idx, 1679 FUID_INDEX(acl_ids->z_fgid)); 1680 rid = FUID_RID(acl_ids->z_fgid); 1681 zfs_fuid_node_add(&acl_ids->z_fuidp, 1682 domain, rid, FUID_INDEX(acl_ids->z_fgid), 1683 acl_ids->z_fgid, ZFS_GROUP); 1684 } 1685 } 1686 } 1687 1688 /* 1689 * If we're creating a directory, and the parent directory has the 1690 * set-GID bit set, set in on the new directory. 1691 * Otherwise, if the user is neither privileged nor a member of the 1692 * file's new group, clear the file's set-GID bit. 1693 */ 1694 1695 if (!(flag & IS_ROOT_NODE) && (dzp->z_mode & S_ISGID) && 1696 (vap->va_type == VDIR)) { 1697 acl_ids->z_mode |= S_ISGID; 1698 } else { 1699 if ((acl_ids->z_mode & S_ISGID) && 1700 secpolicy_vnode_setids_setgids(ZTOV(dzp), cr, gid) != 0) 1701 acl_ids->z_mode &= ~S_ISGID; 1702 } 1703 1704 if (acl_ids->z_aclp == NULL) { 1705 mutex_enter(&dzp->z_acl_lock); 1706 if (!(flag & IS_ROOT_NODE) && 1707 (dzp->z_pflags & ZFS_INHERIT_ACE) && 1708 !(dzp->z_pflags & ZFS_XATTR)) { 1709 VERIFY0(zfs_acl_node_read(dzp, B_TRUE, 1710 &paclp, B_FALSE)); 1711 acl_ids->z_aclp = zfs_acl_inherit(zfsvfs, 1712 vap->va_type, paclp, acl_ids->z_mode, &need_chmod); 1713 inherited = B_TRUE; 1714 } else { 1715 acl_ids->z_aclp = 1716 zfs_acl_alloc(zfs_acl_version_zp(dzp)); 1717 acl_ids->z_aclp->z_hints |= ZFS_ACL_TRIVIAL; 1718 } 1719 mutex_exit(&dzp->z_acl_lock); 1720 1721 if (need_chmod) { 1722 if (vap->va_type == VDIR) 1723 acl_ids->z_aclp->z_hints |= 1724 ZFS_ACL_AUTO_INHERIT; 1725 1726 if (zfsvfs->z_acl_mode == ZFS_ACL_GROUPMASK && 1727 zfsvfs->z_acl_inherit != ZFS_ACL_PASSTHROUGH && 1728 zfsvfs->z_acl_inherit != ZFS_ACL_PASSTHROUGH_X) 1729 trim = B_TRUE; 1730 zfs_acl_chmod(vap->va_type, acl_ids->z_mode, B_FALSE, 1731 trim, acl_ids->z_aclp); 1732 } 1733 } 1734 1735 if (inherited || vsecp) { 1736 acl_ids->z_mode = zfs_mode_compute(acl_ids->z_mode, 1737 acl_ids->z_aclp, &acl_ids->z_aclp->z_hints, 1738 acl_ids->z_fuid, acl_ids->z_fgid); 1739 if (ace_trivial_common(acl_ids->z_aclp, 0, zfs_ace_walk) == 0) 1740 acl_ids->z_aclp->z_hints |= ZFS_ACL_TRIVIAL; 1741 } 1742 1743 return (0); 1744 } 1745 1746 /* 1747 * Free ACL and fuid_infop, but not the acl_ids structure 1748 */ 1749 void 1750 zfs_acl_ids_free(zfs_acl_ids_t *acl_ids) 1751 { 1752 if (acl_ids->z_aclp) 1753 zfs_acl_free(acl_ids->z_aclp); 1754 if (acl_ids->z_fuidp) 1755 zfs_fuid_info_free(acl_ids->z_fuidp); 1756 acl_ids->z_aclp = NULL; 1757 acl_ids->z_fuidp = NULL; 1758 } 1759 1760 boolean_t 1761 zfs_acl_ids_overquota(zfsvfs_t *zv, zfs_acl_ids_t *acl_ids, uint64_t projid) 1762 { 1763 return (zfs_id_overquota(zv, DMU_USERUSED_OBJECT, acl_ids->z_fuid) || 1764 zfs_id_overquota(zv, DMU_GROUPUSED_OBJECT, acl_ids->z_fgid) || 1765 (projid != ZFS_DEFAULT_PROJID && projid != ZFS_INVALID_PROJID && 1766 zfs_id_overquota(zv, DMU_PROJECTUSED_OBJECT, projid))); 1767 } 1768 1769 /* 1770 * Retrieve a file's ACL 1771 */ 1772 int 1773 zfs_getacl(znode_t *zp, vsecattr_t *vsecp, boolean_t skipaclchk, cred_t *cr) 1774 { 1775 zfs_acl_t *aclp; 1776 ulong_t mask; 1777 int error; 1778 int count = 0; 1779 int largeace = 0; 1780 1781 mask = vsecp->vsa_mask & (VSA_ACE | VSA_ACECNT | 1782 VSA_ACE_ACLFLAGS | VSA_ACE_ALLTYPES); 1783 1784 if (mask == 0) 1785 return (SET_ERROR(ENOSYS)); 1786 1787 if ((error = zfs_zaccess(zp, ACE_READ_ACL, 0, skipaclchk, cr))) 1788 return (error); 1789 1790 mutex_enter(&zp->z_acl_lock); 1791 1792 if (zp->z_zfsvfs->z_replay == B_FALSE) 1793 ASSERT_VOP_LOCKED(ZTOV(zp), __func__); 1794 error = zfs_acl_node_read(zp, B_TRUE, &aclp, B_FALSE); 1795 if (error != 0) { 1796 mutex_exit(&zp->z_acl_lock); 1797 return (error); 1798 } 1799 1800 /* 1801 * Scan ACL to determine number of ACEs 1802 */ 1803 if ((zp->z_pflags & ZFS_ACL_OBJ_ACE) && !(mask & VSA_ACE_ALLTYPES)) { 1804 void *zacep = NULL; 1805 uint64_t who; 1806 uint32_t access_mask; 1807 uint16_t type, iflags; 1808 1809 while ((zacep = zfs_acl_next_ace(aclp, zacep, 1810 &who, &access_mask, &iflags, &type))) { 1811 switch (type) { 1812 case ACE_ACCESS_ALLOWED_OBJECT_ACE_TYPE: 1813 case ACE_ACCESS_DENIED_OBJECT_ACE_TYPE: 1814 case ACE_SYSTEM_AUDIT_OBJECT_ACE_TYPE: 1815 case ACE_SYSTEM_ALARM_OBJECT_ACE_TYPE: 1816 largeace++; 1817 continue; 1818 default: 1819 count++; 1820 } 1821 } 1822 vsecp->vsa_aclcnt = count; 1823 } else 1824 count = (int)aclp->z_acl_count; 1825 1826 if (mask & VSA_ACECNT) { 1827 vsecp->vsa_aclcnt = count; 1828 } 1829 1830 if (mask & VSA_ACE) { 1831 size_t aclsz; 1832 1833 aclsz = count * sizeof (ace_t) + 1834 sizeof (ace_object_t) * largeace; 1835 1836 vsecp->vsa_aclentp = kmem_alloc(aclsz, KM_SLEEP); 1837 vsecp->vsa_aclentsz = aclsz; 1838 1839 if (aclp->z_version == ZFS_ACL_VERSION_FUID) 1840 zfs_copy_fuid_2_ace(zp->z_zfsvfs, aclp, cr, 1841 vsecp->vsa_aclentp, !(mask & VSA_ACE_ALLTYPES)); 1842 else { 1843 zfs_acl_node_t *aclnode; 1844 void *start = vsecp->vsa_aclentp; 1845 1846 for (aclnode = list_head(&aclp->z_acl); aclnode; 1847 aclnode = list_next(&aclp->z_acl, aclnode)) { 1848 bcopy(aclnode->z_acldata, start, 1849 aclnode->z_size); 1850 start = (caddr_t)start + aclnode->z_size; 1851 } 1852 ASSERT((caddr_t)start - (caddr_t)vsecp->vsa_aclentp == 1853 aclp->z_acl_bytes); 1854 } 1855 } 1856 if (mask & VSA_ACE_ACLFLAGS) { 1857 vsecp->vsa_aclflags = 0; 1858 if (zp->z_pflags & ZFS_ACL_DEFAULTED) 1859 vsecp->vsa_aclflags |= ACL_DEFAULTED; 1860 if (zp->z_pflags & ZFS_ACL_PROTECTED) 1861 vsecp->vsa_aclflags |= ACL_PROTECTED; 1862 if (zp->z_pflags & ZFS_ACL_AUTO_INHERIT) 1863 vsecp->vsa_aclflags |= ACL_AUTO_INHERIT; 1864 } 1865 1866 mutex_exit(&zp->z_acl_lock); 1867 1868 return (0); 1869 } 1870 1871 int 1872 zfs_vsec_2_aclp(zfsvfs_t *zfsvfs, umode_t obj_type, 1873 vsecattr_t *vsecp, cred_t *cr, zfs_fuid_info_t **fuidp, zfs_acl_t **zaclp) 1874 { 1875 zfs_acl_t *aclp; 1876 zfs_acl_node_t *aclnode; 1877 int aclcnt = vsecp->vsa_aclcnt; 1878 int error; 1879 1880 if (vsecp->vsa_aclcnt > MAX_ACL_ENTRIES || vsecp->vsa_aclcnt <= 0) 1881 return (SET_ERROR(EINVAL)); 1882 1883 aclp = zfs_acl_alloc(zfs_acl_version(zfsvfs->z_version)); 1884 1885 aclp->z_hints = 0; 1886 aclnode = zfs_acl_node_alloc(aclcnt * sizeof (zfs_object_ace_t)); 1887 if (aclp->z_version == ZFS_ACL_VERSION_INITIAL) { 1888 if ((error = zfs_copy_ace_2_oldace(obj_type, aclp, 1889 (ace_t *)vsecp->vsa_aclentp, aclnode->z_acldata, 1890 aclcnt, &aclnode->z_size)) != 0) { 1891 zfs_acl_free(aclp); 1892 zfs_acl_node_free(aclnode); 1893 return (error); 1894 } 1895 } else { 1896 if ((error = zfs_copy_ace_2_fuid(zfsvfs, obj_type, aclp, 1897 vsecp->vsa_aclentp, aclnode->z_acldata, aclcnt, 1898 &aclnode->z_size, fuidp, cr)) != 0) { 1899 zfs_acl_free(aclp); 1900 zfs_acl_node_free(aclnode); 1901 return (error); 1902 } 1903 } 1904 aclp->z_acl_bytes = aclnode->z_size; 1905 aclnode->z_ace_count = aclcnt; 1906 aclp->z_acl_count = aclcnt; 1907 list_insert_head(&aclp->z_acl, aclnode); 1908 1909 /* 1910 * If flags are being set then add them to z_hints 1911 */ 1912 if (vsecp->vsa_mask & VSA_ACE_ACLFLAGS) { 1913 if (vsecp->vsa_aclflags & ACL_PROTECTED) 1914 aclp->z_hints |= ZFS_ACL_PROTECTED; 1915 if (vsecp->vsa_aclflags & ACL_DEFAULTED) 1916 aclp->z_hints |= ZFS_ACL_DEFAULTED; 1917 if (vsecp->vsa_aclflags & ACL_AUTO_INHERIT) 1918 aclp->z_hints |= ZFS_ACL_AUTO_INHERIT; 1919 } 1920 1921 *zaclp = aclp; 1922 1923 return (0); 1924 } 1925 1926 /* 1927 * Set a file's ACL 1928 */ 1929 int 1930 zfs_setacl(znode_t *zp, vsecattr_t *vsecp, boolean_t skipaclchk, cred_t *cr) 1931 { 1932 zfsvfs_t *zfsvfs = zp->z_zfsvfs; 1933 zilog_t *zilog = zfsvfs->z_log; 1934 ulong_t mask = vsecp->vsa_mask & (VSA_ACE | VSA_ACECNT); 1935 dmu_tx_t *tx; 1936 int error; 1937 zfs_acl_t *aclp; 1938 zfs_fuid_info_t *fuidp = NULL; 1939 boolean_t fuid_dirtied; 1940 uint64_t acl_obj; 1941 1942 if (zp->z_zfsvfs->z_replay == B_FALSE) 1943 ASSERT_VOP_ELOCKED(ZTOV(zp), __func__); 1944 if (mask == 0) 1945 return (SET_ERROR(ENOSYS)); 1946 1947 if (zp->z_pflags & ZFS_IMMUTABLE) 1948 return (SET_ERROR(EPERM)); 1949 1950 if ((error = zfs_zaccess(zp, ACE_WRITE_ACL, 0, skipaclchk, cr))) 1951 return (error); 1952 1953 error = zfs_vsec_2_aclp(zfsvfs, ZTOV(zp)->v_type, vsecp, cr, &fuidp, 1954 &aclp); 1955 if (error) 1956 return (error); 1957 1958 /* 1959 * If ACL wide flags aren't being set then preserve any 1960 * existing flags. 1961 */ 1962 if (!(vsecp->vsa_mask & VSA_ACE_ACLFLAGS)) { 1963 aclp->z_hints |= 1964 (zp->z_pflags & V4_ACL_WIDE_FLAGS); 1965 } 1966 top: 1967 mutex_enter(&zp->z_acl_lock); 1968 1969 tx = dmu_tx_create(zfsvfs->z_os); 1970 1971 dmu_tx_hold_sa(tx, zp->z_sa_hdl, B_TRUE); 1972 1973 fuid_dirtied = zfsvfs->z_fuid_dirty; 1974 if (fuid_dirtied) 1975 zfs_fuid_txhold(zfsvfs, tx); 1976 1977 /* 1978 * If old version and ACL won't fit in bonus and we aren't 1979 * upgrading then take out necessary DMU holds 1980 */ 1981 1982 if ((acl_obj = zfs_external_acl(zp)) != 0) { 1983 if (zfsvfs->z_version >= ZPL_VERSION_FUID && 1984 zfs_znode_acl_version(zp) <= ZFS_ACL_VERSION_INITIAL) { 1985 dmu_tx_hold_free(tx, acl_obj, 0, 1986 DMU_OBJECT_END); 1987 dmu_tx_hold_write(tx, DMU_NEW_OBJECT, 0, 1988 aclp->z_acl_bytes); 1989 } else { 1990 dmu_tx_hold_write(tx, acl_obj, 0, aclp->z_acl_bytes); 1991 } 1992 } else if (!zp->z_is_sa && aclp->z_acl_bytes > ZFS_ACE_SPACE) { 1993 dmu_tx_hold_write(tx, DMU_NEW_OBJECT, 0, aclp->z_acl_bytes); 1994 } 1995 1996 zfs_sa_upgrade_txholds(tx, zp); 1997 error = dmu_tx_assign(tx, TXG_NOWAIT); 1998 if (error) { 1999 mutex_exit(&zp->z_acl_lock); 2000 2001 if (error == ERESTART) { 2002 dmu_tx_wait(tx); 2003 dmu_tx_abort(tx); 2004 goto top; 2005 } 2006 dmu_tx_abort(tx); 2007 zfs_acl_free(aclp); 2008 return (error); 2009 } 2010 2011 error = zfs_aclset_common(zp, aclp, cr, tx); 2012 ASSERT(error == 0); 2013 ASSERT(zp->z_acl_cached == NULL); 2014 zp->z_acl_cached = aclp; 2015 2016 if (fuid_dirtied) 2017 zfs_fuid_sync(zfsvfs, tx); 2018 2019 zfs_log_acl(zilog, tx, zp, vsecp, fuidp); 2020 2021 if (fuidp) 2022 zfs_fuid_info_free(fuidp); 2023 dmu_tx_commit(tx); 2024 mutex_exit(&zp->z_acl_lock); 2025 2026 return (error); 2027 } 2028 2029 /* 2030 * Check accesses of interest (AoI) against attributes of the dataset 2031 * such as read-only. Returns zero if no AoI conflict with dataset 2032 * attributes, otherwise an appropriate errno is returned. 2033 */ 2034 static int 2035 zfs_zaccess_dataset_check(znode_t *zp, uint32_t v4_mode) 2036 { 2037 if ((v4_mode & WRITE_MASK) && 2038 (zp->z_zfsvfs->z_vfs->vfs_flag & VFS_RDONLY) && 2039 (!IS_DEVVP(ZTOV(zp)) || 2040 (IS_DEVVP(ZTOV(zp)) && (v4_mode & WRITE_MASK_ATTRS)))) { 2041 return (SET_ERROR(EROFS)); 2042 } 2043 2044 /* 2045 * Intentionally allow ZFS_READONLY through here. 2046 * See zfs_zaccess_common(). 2047 */ 2048 if ((v4_mode & WRITE_MASK_DATA) && 2049 (zp->z_pflags & ZFS_IMMUTABLE)) { 2050 return (SET_ERROR(EPERM)); 2051 } 2052 2053 /* 2054 * In FreeBSD we allow to modify directory's content is ZFS_NOUNLINK 2055 * (sunlnk) is set. We just don't allow directory removal, which is 2056 * handled in zfs_zaccess_delete(). 2057 */ 2058 if ((v4_mode & ACE_DELETE) && 2059 (zp->z_pflags & ZFS_NOUNLINK)) { 2060 return (EPERM); 2061 } 2062 2063 if (((v4_mode & (ACE_READ_DATA|ACE_EXECUTE)) && 2064 (zp->z_pflags & ZFS_AV_QUARANTINED))) { 2065 return (SET_ERROR(EACCES)); 2066 } 2067 2068 return (0); 2069 } 2070 2071 /* 2072 * The primary usage of this function is to loop through all of the 2073 * ACEs in the znode, determining what accesses of interest (AoI) to 2074 * the caller are allowed or denied. The AoI are expressed as bits in 2075 * the working_mode parameter. As each ACE is processed, bits covered 2076 * by that ACE are removed from the working_mode. This removal 2077 * facilitates two things. The first is that when the working mode is 2078 * empty (= 0), we know we've looked at all the AoI. The second is 2079 * that the ACE interpretation rules don't allow a later ACE to undo 2080 * something granted or denied by an earlier ACE. Removing the 2081 * discovered access or denial enforces this rule. At the end of 2082 * processing the ACEs, all AoI that were found to be denied are 2083 * placed into the working_mode, giving the caller a mask of denied 2084 * accesses. Returns: 2085 * 0 if all AoI granted 2086 * EACCESS if the denied mask is non-zero 2087 * other error if abnormal failure (e.g., IO error) 2088 * 2089 * A secondary usage of the function is to determine if any of the 2090 * AoI are granted. If an ACE grants any access in 2091 * the working_mode, we immediately short circuit out of the function. 2092 * This mode is chosen by setting anyaccess to B_TRUE. The 2093 * working_mode is not a denied access mask upon exit if the function 2094 * is used in this manner. 2095 */ 2096 static int 2097 zfs_zaccess_aces_check(znode_t *zp, uint32_t *working_mode, 2098 boolean_t anyaccess, cred_t *cr) 2099 { 2100 zfsvfs_t *zfsvfs = zp->z_zfsvfs; 2101 zfs_acl_t *aclp; 2102 int error; 2103 uid_t uid = crgetuid(cr); 2104 uint64_t who; 2105 uint16_t type, iflags; 2106 uint16_t entry_type; 2107 uint32_t access_mask; 2108 uint32_t deny_mask = 0; 2109 zfs_ace_hdr_t *acep = NULL; 2110 boolean_t checkit; 2111 uid_t gowner; 2112 uid_t fowner; 2113 2114 zfs_fuid_map_ids(zp, cr, &fowner, &gowner); 2115 2116 mutex_enter(&zp->z_acl_lock); 2117 2118 if (zp->z_zfsvfs->z_replay == B_FALSE) 2119 ASSERT_VOP_LOCKED(ZTOV(zp), __func__); 2120 error = zfs_acl_node_read(zp, B_TRUE, &aclp, B_FALSE); 2121 if (error != 0) { 2122 mutex_exit(&zp->z_acl_lock); 2123 return (error); 2124 } 2125 2126 ASSERT(zp->z_acl_cached); 2127 2128 while ((acep = zfs_acl_next_ace(aclp, acep, &who, &access_mask, 2129 &iflags, &type))) { 2130 uint32_t mask_matched; 2131 2132 if (!zfs_acl_valid_ace_type(type, iflags)) 2133 continue; 2134 2135 if (ZTOV(zp)->v_type == VDIR && (iflags & ACE_INHERIT_ONLY_ACE)) 2136 continue; 2137 2138 /* Skip ACE if it does not affect any AoI */ 2139 mask_matched = (access_mask & *working_mode); 2140 if (!mask_matched) 2141 continue; 2142 2143 entry_type = (iflags & ACE_TYPE_FLAGS); 2144 2145 checkit = B_FALSE; 2146 2147 switch (entry_type) { 2148 case ACE_OWNER: 2149 if (uid == fowner) 2150 checkit = B_TRUE; 2151 break; 2152 case OWNING_GROUP: 2153 who = gowner; 2154 /*FALLTHROUGH*/ 2155 case ACE_IDENTIFIER_GROUP: 2156 checkit = zfs_groupmember(zfsvfs, who, cr); 2157 break; 2158 case ACE_EVERYONE: 2159 checkit = B_TRUE; 2160 break; 2161 2162 /* USER Entry */ 2163 default: 2164 if (entry_type == 0) { 2165 uid_t newid; 2166 2167 newid = zfs_fuid_map_id(zfsvfs, who, cr, 2168 ZFS_ACE_USER); 2169 if (newid != UID_NOBODY && 2170 uid == newid) 2171 checkit = B_TRUE; 2172 break; 2173 } else { 2174 mutex_exit(&zp->z_acl_lock); 2175 return (SET_ERROR(EIO)); 2176 } 2177 } 2178 2179 if (checkit) { 2180 if (type == DENY) { 2181 DTRACE_PROBE3(zfs__ace__denies, 2182 znode_t *, zp, 2183 zfs_ace_hdr_t *, acep, 2184 uint32_t, mask_matched); 2185 deny_mask |= mask_matched; 2186 } else { 2187 DTRACE_PROBE3(zfs__ace__allows, 2188 znode_t *, zp, 2189 zfs_ace_hdr_t *, acep, 2190 uint32_t, mask_matched); 2191 if (anyaccess) { 2192 mutex_exit(&zp->z_acl_lock); 2193 return (0); 2194 } 2195 } 2196 *working_mode &= ~mask_matched; 2197 } 2198 2199 /* Are we done? */ 2200 if (*working_mode == 0) 2201 break; 2202 } 2203 2204 mutex_exit(&zp->z_acl_lock); 2205 2206 /* Put the found 'denies' back on the working mode */ 2207 if (deny_mask) { 2208 *working_mode |= deny_mask; 2209 return (SET_ERROR(EACCES)); 2210 } else if (*working_mode) { 2211 return (-1); 2212 } 2213 2214 return (0); 2215 } 2216 2217 /* 2218 * Return true if any access whatsoever granted, we don't actually 2219 * care what access is granted. 2220 */ 2221 boolean_t 2222 zfs_has_access(znode_t *zp, cred_t *cr) 2223 { 2224 uint32_t have = ACE_ALL_PERMS; 2225 2226 if (zfs_zaccess_aces_check(zp, &have, B_TRUE, cr) != 0) { 2227 uid_t owner; 2228 2229 owner = zfs_fuid_map_id(zp->z_zfsvfs, zp->z_uid, cr, ZFS_OWNER); 2230 return (secpolicy_vnode_any_access(cr, ZTOV(zp), owner) == 0); 2231 } 2232 return (B_TRUE); 2233 } 2234 2235 static int 2236 zfs_zaccess_common(znode_t *zp, uint32_t v4_mode, uint32_t *working_mode, 2237 boolean_t *check_privs, boolean_t skipaclchk, cred_t *cr) 2238 { 2239 zfsvfs_t *zfsvfs = zp->z_zfsvfs; 2240 int err; 2241 2242 *working_mode = v4_mode; 2243 *check_privs = B_TRUE; 2244 2245 /* 2246 * Short circuit empty requests 2247 */ 2248 if (v4_mode == 0 || zfsvfs->z_replay) { 2249 *working_mode = 0; 2250 return (0); 2251 } 2252 2253 if ((err = zfs_zaccess_dataset_check(zp, v4_mode)) != 0) { 2254 *check_privs = B_FALSE; 2255 return (err); 2256 } 2257 2258 /* 2259 * The caller requested that the ACL check be skipped. This 2260 * would only happen if the caller checked VOP_ACCESS() with a 2261 * 32 bit ACE mask and already had the appropriate permissions. 2262 */ 2263 if (skipaclchk) { 2264 *working_mode = 0; 2265 return (0); 2266 } 2267 2268 /* 2269 * Note: ZFS_READONLY represents the "DOS R/O" attribute. 2270 * When that flag is set, we should behave as if write access 2271 * were not granted by anything in the ACL. In particular: 2272 * We _must_ allow writes after opening the file r/w, then 2273 * setting the DOS R/O attribute, and writing some more. 2274 * (Similar to how you can write after fchmod(fd, 0444).) 2275 * 2276 * Therefore ZFS_READONLY is ignored in the dataset check 2277 * above, and checked here as if part of the ACL check. 2278 * Also note: DOS R/O is ignored for directories. 2279 */ 2280 if ((v4_mode & WRITE_MASK_DATA) && 2281 (ZTOV(zp)->v_type != VDIR) && 2282 (zp->z_pflags & ZFS_READONLY)) { 2283 return (SET_ERROR(EPERM)); 2284 } 2285 2286 return (zfs_zaccess_aces_check(zp, working_mode, B_FALSE, cr)); 2287 } 2288 2289 static int 2290 zfs_zaccess_append(znode_t *zp, uint32_t *working_mode, boolean_t *check_privs, 2291 cred_t *cr) 2292 { 2293 if (*working_mode != ACE_WRITE_DATA) 2294 return (SET_ERROR(EACCES)); 2295 2296 return (zfs_zaccess_common(zp, ACE_APPEND_DATA, working_mode, 2297 check_privs, B_FALSE, cr)); 2298 } 2299 2300 /* 2301 * Check if VEXEC is allowed. 2302 * 2303 * This routine is based on zfs_fastaccesschk_execute which has slowpath 2304 * calling zfs_zaccess. This would be incorrect on FreeBSD (see 2305 * zfs_freebsd_access for the difference). Thus this variant let's the 2306 * caller handle the slowpath (if necessary). 2307 * 2308 * On top of that we perform a lockless check for ZFS_NO_EXECS_DENIED. 2309 * 2310 * Safe access to znode_t is provided by the vnode lock. 2311 */ 2312 int 2313 zfs_fastaccesschk_execute(znode_t *zdp, cred_t *cr) 2314 { 2315 boolean_t is_attr; 2316 2317 if (zdp->z_pflags & ZFS_AV_QUARANTINED) 2318 return (1); 2319 2320 is_attr = ((zdp->z_pflags & ZFS_XATTR) && 2321 (ZTOV(zdp)->v_type == VDIR)); 2322 if (is_attr) 2323 return (1); 2324 2325 if (zdp->z_pflags & ZFS_NO_EXECS_DENIED) 2326 return (0); 2327 2328 return (1); 2329 } 2330 2331 2332 /* 2333 * Determine whether Access should be granted/denied. 2334 * 2335 * The least priv subsystem is always consulted as a basic privilege 2336 * can define any form of access. 2337 */ 2338 int 2339 zfs_zaccess(znode_t *zp, int mode, int flags, boolean_t skipaclchk, cred_t *cr) 2340 { 2341 uint32_t working_mode; 2342 int error; 2343 int is_attr; 2344 boolean_t check_privs; 2345 znode_t *xzp = NULL; 2346 znode_t *check_zp = zp; 2347 mode_t needed_bits; 2348 uid_t owner; 2349 2350 is_attr = ((zp->z_pflags & ZFS_XATTR) && (ZTOV(zp)->v_type == VDIR)); 2351 2352 #ifdef __FreeBSD_kernel__ 2353 /* 2354 * In FreeBSD, we don't care about permissions of individual ADS. 2355 * Note that not checking them is not just an optimization - without 2356 * this shortcut, EA operations may bogusly fail with EACCES. 2357 */ 2358 if (zp->z_pflags & ZFS_XATTR) 2359 return (0); 2360 #else 2361 /* 2362 * If attribute then validate against base file 2363 */ 2364 if (is_attr) { 2365 uint64_t parent; 2366 2367 if ((error = sa_lookup(zp->z_sa_hdl, 2368 SA_ZPL_PARENT(zp->z_zfsvfs), &parent, 2369 sizeof (parent))) != 0) 2370 return (error); 2371 2372 if ((error = zfs_zget(zp->z_zfsvfs, 2373 parent, &xzp)) != 0) { 2374 return (error); 2375 } 2376 2377 check_zp = xzp; 2378 2379 /* 2380 * fixup mode to map to xattr perms 2381 */ 2382 2383 if (mode & (ACE_WRITE_DATA|ACE_APPEND_DATA)) { 2384 mode &= ~(ACE_WRITE_DATA|ACE_APPEND_DATA); 2385 mode |= ACE_WRITE_NAMED_ATTRS; 2386 } 2387 2388 if (mode & (ACE_READ_DATA|ACE_EXECUTE)) { 2389 mode &= ~(ACE_READ_DATA|ACE_EXECUTE); 2390 mode |= ACE_READ_NAMED_ATTRS; 2391 } 2392 } 2393 #endif 2394 2395 owner = zfs_fuid_map_id(zp->z_zfsvfs, zp->z_uid, cr, ZFS_OWNER); 2396 /* 2397 * Map the bits required to the standard vnode flags VREAD|VWRITE|VEXEC 2398 * in needed_bits. Map the bits mapped by working_mode (currently 2399 * missing) in missing_bits. 2400 * Call secpolicy_vnode_access2() with (needed_bits & ~checkmode), 2401 * needed_bits. 2402 */ 2403 needed_bits = 0; 2404 2405 working_mode = mode; 2406 if ((working_mode & (ACE_READ_ACL|ACE_READ_ATTRIBUTES)) && 2407 owner == crgetuid(cr)) 2408 working_mode &= ~(ACE_READ_ACL|ACE_READ_ATTRIBUTES); 2409 2410 if (working_mode & (ACE_READ_DATA|ACE_READ_NAMED_ATTRS| 2411 ACE_READ_ACL|ACE_READ_ATTRIBUTES|ACE_SYNCHRONIZE)) 2412 needed_bits |= VREAD; 2413 if (working_mode & (ACE_WRITE_DATA|ACE_WRITE_NAMED_ATTRS| 2414 ACE_APPEND_DATA|ACE_WRITE_ATTRIBUTES|ACE_SYNCHRONIZE)) 2415 needed_bits |= VWRITE; 2416 if (working_mode & ACE_EXECUTE) 2417 needed_bits |= VEXEC; 2418 2419 if ((error = zfs_zaccess_common(check_zp, mode, &working_mode, 2420 &check_privs, skipaclchk, cr)) == 0) { 2421 if (is_attr) 2422 VN_RELE(ZTOV(xzp)); 2423 return (secpolicy_vnode_access2(cr, ZTOV(zp), owner, 2424 needed_bits, needed_bits)); 2425 } 2426 2427 if (error && !check_privs) { 2428 if (is_attr) 2429 VN_RELE(ZTOV(xzp)); 2430 return (error); 2431 } 2432 2433 if (error && (flags & V_APPEND)) { 2434 error = zfs_zaccess_append(zp, &working_mode, &check_privs, cr); 2435 } 2436 2437 if (error && check_privs) { 2438 mode_t checkmode = 0; 2439 vnode_t *check_vp = ZTOV(check_zp); 2440 2441 /* 2442 * First check for implicit owner permission on 2443 * read_acl/read_attributes 2444 */ 2445 2446 error = 0; 2447 ASSERT(working_mode != 0); 2448 2449 if ((working_mode & (ACE_READ_ACL|ACE_READ_ATTRIBUTES) && 2450 owner == crgetuid(cr))) 2451 working_mode &= ~(ACE_READ_ACL|ACE_READ_ATTRIBUTES); 2452 2453 if (working_mode & (ACE_READ_DATA|ACE_READ_NAMED_ATTRS| 2454 ACE_READ_ACL|ACE_READ_ATTRIBUTES|ACE_SYNCHRONIZE)) 2455 checkmode |= VREAD; 2456 if (working_mode & (ACE_WRITE_DATA|ACE_WRITE_NAMED_ATTRS| 2457 ACE_APPEND_DATA|ACE_WRITE_ATTRIBUTES|ACE_SYNCHRONIZE)) 2458 checkmode |= VWRITE; 2459 if (working_mode & ACE_EXECUTE) 2460 checkmode |= VEXEC; 2461 2462 error = secpolicy_vnode_access2(cr, check_vp, owner, 2463 needed_bits & ~checkmode, needed_bits); 2464 2465 if (error == 0 && (working_mode & ACE_WRITE_OWNER)) 2466 error = secpolicy_vnode_chown(check_vp, cr, owner); 2467 if (error == 0 && (working_mode & ACE_WRITE_ACL)) 2468 error = secpolicy_vnode_setdac(check_vp, cr, owner); 2469 2470 if (error == 0 && (working_mode & 2471 (ACE_DELETE|ACE_DELETE_CHILD))) 2472 error = secpolicy_vnode_remove(check_vp, cr); 2473 2474 if (error == 0 && (working_mode & ACE_SYNCHRONIZE)) { 2475 error = secpolicy_vnode_chown(check_vp, cr, owner); 2476 } 2477 if (error == 0) { 2478 /* 2479 * See if any bits other than those already checked 2480 * for are still present. If so then return EACCES 2481 */ 2482 if (working_mode & ~(ZFS_CHECKED_MASKS)) { 2483 error = SET_ERROR(EACCES); 2484 } 2485 } 2486 } else if (error == 0) { 2487 error = secpolicy_vnode_access2(cr, ZTOV(zp), owner, 2488 needed_bits, needed_bits); 2489 } 2490 2491 2492 if (is_attr) 2493 VN_RELE(ZTOV(xzp)); 2494 2495 return (error); 2496 } 2497 2498 /* 2499 * Translate traditional unix VREAD/VWRITE/VEXEC mode into 2500 * NFSv4-style ZFS ACL format and call zfs_zaccess() 2501 */ 2502 int 2503 zfs_zaccess_rwx(znode_t *zp, mode_t mode, int flags, cred_t *cr) 2504 { 2505 return (zfs_zaccess(zp, zfs_unix_to_v4(mode >> 6), flags, B_FALSE, cr)); 2506 } 2507 2508 /* 2509 * Access function for secpolicy_vnode_setattr 2510 */ 2511 int 2512 zfs_zaccess_unix(znode_t *zp, mode_t mode, cred_t *cr) 2513 { 2514 int v4_mode = zfs_unix_to_v4(mode >> 6); 2515 2516 return (zfs_zaccess(zp, v4_mode, 0, B_FALSE, cr)); 2517 } 2518 2519 static int 2520 zfs_delete_final_check(znode_t *zp, znode_t *dzp, 2521 mode_t available_perms, cred_t *cr) 2522 { 2523 int error; 2524 uid_t downer; 2525 2526 downer = zfs_fuid_map_id(dzp->z_zfsvfs, dzp->z_uid, cr, ZFS_OWNER); 2527 2528 error = secpolicy_vnode_access2(cr, ZTOV(dzp), 2529 downer, available_perms, VWRITE|VEXEC); 2530 2531 if (error == 0) 2532 error = zfs_sticky_remove_access(dzp, zp, cr); 2533 2534 return (error); 2535 } 2536 2537 /* 2538 * Determine whether Access should be granted/deny, without 2539 * consulting least priv subsystem. 2540 * 2541 * The following chart is the recommended NFSv4 enforcement for 2542 * ability to delete an object. 2543 * 2544 * ------------------------------------------------------- 2545 * | Parent Dir | Target Object Permissions | 2546 * | permissions | | 2547 * ------------------------------------------------------- 2548 * | | ACL Allows | ACL Denies| Delete | 2549 * | | Delete | Delete | unspecified| 2550 * ------------------------------------------------------- 2551 * | ACL Allows | Permit | Permit | Permit | 2552 * | DELETE_CHILD | | 2553 * ------------------------------------------------------- 2554 * | ACL Denies | Permit | Deny | Deny | 2555 * | DELETE_CHILD | | | | 2556 * ------------------------------------------------------- 2557 * | ACL specifies | | | | 2558 * | only allow | Permit | Permit | Permit | 2559 * | write and | | | | 2560 * | execute | | | | 2561 * ------------------------------------------------------- 2562 * | ACL denies | | | | 2563 * | write and | Permit | Deny | Deny | 2564 * | execute | | | | 2565 * ------------------------------------------------------- 2566 * ^ 2567 * | 2568 * No search privilege, can't even look up file? 2569 * 2570 */ 2571 int 2572 zfs_zaccess_delete(znode_t *dzp, znode_t *zp, cred_t *cr) 2573 { 2574 uint32_t dzp_working_mode = 0; 2575 uint32_t zp_working_mode = 0; 2576 int dzp_error, zp_error; 2577 mode_t available_perms; 2578 boolean_t dzpcheck_privs = B_TRUE; 2579 boolean_t zpcheck_privs = B_TRUE; 2580 2581 /* 2582 * We want specific DELETE permissions to 2583 * take precedence over WRITE/EXECUTE. We don't 2584 * want an ACL such as this to mess us up. 2585 * user:joe:write_data:deny,user:joe:delete:allow 2586 * 2587 * However, deny permissions may ultimately be overridden 2588 * by secpolicy_vnode_access(). 2589 * 2590 * We will ask for all of the necessary permissions and then 2591 * look at the working modes from the directory and target object 2592 * to determine what was found. 2593 */ 2594 2595 if (zp->z_pflags & (ZFS_IMMUTABLE | ZFS_NOUNLINK)) 2596 return (SET_ERROR(EPERM)); 2597 2598 /* 2599 * First row 2600 * If the directory permissions allow the delete, we are done. 2601 */ 2602 if ((dzp_error = zfs_zaccess_common(dzp, ACE_DELETE_CHILD, 2603 &dzp_working_mode, &dzpcheck_privs, B_FALSE, cr)) == 0) 2604 return (0); 2605 2606 /* 2607 * If target object has delete permission then we are done 2608 */ 2609 if ((zp_error = zfs_zaccess_common(zp, ACE_DELETE, &zp_working_mode, 2610 &zpcheck_privs, B_FALSE, cr)) == 0) 2611 return (0); 2612 2613 ASSERT(dzp_error && zp_error); 2614 2615 if (!dzpcheck_privs) 2616 return (dzp_error); 2617 if (!zpcheck_privs) 2618 return (zp_error); 2619 2620 /* 2621 * Second row 2622 * 2623 * If directory returns EACCES then delete_child was denied 2624 * due to deny delete_child. In this case send the request through 2625 * secpolicy_vnode_remove(). We don't use zfs_delete_final_check() 2626 * since that *could* allow the delete based on write/execute permission 2627 * and we want delete permissions to override write/execute. 2628 */ 2629 2630 if (dzp_error == EACCES) { 2631 /* XXXPJD: s/dzp/zp/ ? */ 2632 return (secpolicy_vnode_remove(ZTOV(dzp), cr)); 2633 } 2634 /* 2635 * Third Row 2636 * only need to see if we have write/execute on directory. 2637 */ 2638 2639 dzp_error = zfs_zaccess_common(dzp, ACE_EXECUTE|ACE_WRITE_DATA, 2640 &dzp_working_mode, &dzpcheck_privs, B_FALSE, cr); 2641 2642 if (dzp_error != 0 && !dzpcheck_privs) 2643 return (dzp_error); 2644 2645 /* 2646 * Fourth row 2647 */ 2648 2649 available_perms = (dzp_working_mode & ACE_WRITE_DATA) ? 0 : VWRITE; 2650 available_perms |= (dzp_working_mode & ACE_EXECUTE) ? 0 : VEXEC; 2651 2652 return (zfs_delete_final_check(zp, dzp, available_perms, cr)); 2653 2654 } 2655 2656 int 2657 zfs_zaccess_rename(znode_t *sdzp, znode_t *szp, znode_t *tdzp, 2658 znode_t *tzp, cred_t *cr) 2659 { 2660 int add_perm; 2661 int error; 2662 2663 if (szp->z_pflags & ZFS_AV_QUARANTINED) 2664 return (SET_ERROR(EACCES)); 2665 2666 add_perm = (ZTOV(szp)->v_type == VDIR) ? 2667 ACE_ADD_SUBDIRECTORY : ACE_ADD_FILE; 2668 2669 /* 2670 * Rename permissions are combination of delete permission + 2671 * add file/subdir permission. 2672 * 2673 * BSD operating systems also require write permission 2674 * on the directory being moved from one parent directory 2675 * to another. 2676 */ 2677 if (ZTOV(szp)->v_type == VDIR && ZTOV(sdzp) != ZTOV(tdzp)) { 2678 if ((error = zfs_zaccess(szp, ACE_WRITE_DATA, 0, B_FALSE, cr))) 2679 return (error); 2680 } 2681 2682 /* 2683 * first make sure we do the delete portion. 2684 * 2685 * If that succeeds then check for add_file/add_subdir permissions 2686 */ 2687 2688 if ((error = zfs_zaccess_delete(sdzp, szp, cr))) 2689 return (error); 2690 2691 /* 2692 * If we have a tzp, see if we can delete it? 2693 */ 2694 if (tzp && (error = zfs_zaccess_delete(tdzp, tzp, cr))) 2695 return (error); 2696 2697 /* 2698 * Now check for add permissions 2699 */ 2700 error = zfs_zaccess(tdzp, add_perm, 0, B_FALSE, cr); 2701 2702 return (error); 2703 } 2704