1 // SPDX-License-Identifier: GPL-2.0-only 2 /* 3 * Landlock LSM - Ruleset management 4 * 5 * Copyright © 2016-2020 Mickaël Salaün <mic@digikod.net> 6 * Copyright © 2018-2020 ANSSI 7 */ 8 9 #include <linux/bits.h> 10 #include <linux/bug.h> 11 #include <linux/cleanup.h> 12 #include <linux/compiler_types.h> 13 #include <linux/err.h> 14 #include <linux/errno.h> 15 #include <linux/kernel.h> 16 #include <linux/lockdep.h> 17 #include <linux/mutex.h> 18 #include <linux/overflow.h> 19 #include <linux/rbtree.h> 20 #include <linux/refcount.h> 21 #include <linux/slab.h> 22 #include <linux/spinlock.h> 23 #include <linux/workqueue.h> 24 25 #include "access.h" 26 #include "domain.h" 27 #include "limits.h" 28 #include "object.h" 29 #include "ruleset.h" 30 31 static struct landlock_ruleset *create_ruleset(const u32 num_layers) 32 { 33 struct landlock_ruleset *new_ruleset; 34 35 new_ruleset = kzalloc_flex(*new_ruleset, access_masks, num_layers, 36 GFP_KERNEL_ACCOUNT); 37 if (!new_ruleset) 38 return ERR_PTR(-ENOMEM); 39 refcount_set(&new_ruleset->usage, 1); 40 mutex_init(&new_ruleset->lock); 41 new_ruleset->root_inode = RB_ROOT; 42 43 #if IS_ENABLED(CONFIG_INET) 44 new_ruleset->root_net_port = RB_ROOT; 45 #endif /* IS_ENABLED(CONFIG_INET) */ 46 47 new_ruleset->num_layers = num_layers; 48 /* 49 * hierarchy = NULL 50 * num_rules = 0 51 * access_masks[] = 0 52 */ 53 return new_ruleset; 54 } 55 56 struct landlock_ruleset * 57 landlock_create_ruleset(const access_mask_t fs_access_mask, 58 const access_mask_t net_access_mask, 59 const access_mask_t scope_mask) 60 { 61 struct landlock_ruleset *new_ruleset; 62 63 /* Informs about useless ruleset. */ 64 if (!fs_access_mask && !net_access_mask && !scope_mask) 65 return ERR_PTR(-ENOMSG); 66 new_ruleset = create_ruleset(1); 67 if (IS_ERR(new_ruleset)) 68 return new_ruleset; 69 if (fs_access_mask) 70 landlock_add_fs_access_mask(new_ruleset, fs_access_mask, 0); 71 if (net_access_mask) 72 landlock_add_net_access_mask(new_ruleset, net_access_mask, 0); 73 if (scope_mask) 74 landlock_add_scope_mask(new_ruleset, scope_mask, 0); 75 return new_ruleset; 76 } 77 78 static void build_check_rule(void) 79 { 80 const struct landlock_rule rule = { 81 .num_layers = ~0, 82 }; 83 84 /* 85 * Checks that .num_layers is large enough for at least 86 * LANDLOCK_MAX_NUM_LAYERS layers. 87 */ 88 BUILD_BUG_ON(rule.num_layers < LANDLOCK_MAX_NUM_LAYERS); 89 } 90 91 static bool is_object_pointer(const enum landlock_key_type key_type) 92 { 93 switch (key_type) { 94 case LANDLOCK_KEY_INODE: 95 return true; 96 97 #if IS_ENABLED(CONFIG_INET) 98 case LANDLOCK_KEY_NET_PORT: 99 return false; 100 #endif /* IS_ENABLED(CONFIG_INET) */ 101 102 default: 103 WARN_ON_ONCE(1); 104 return false; 105 } 106 } 107 108 static struct landlock_rule * 109 create_rule(const struct landlock_id id, 110 const struct landlock_layer (*layers)[], const u32 num_layers, 111 const struct landlock_layer *const new_layer) 112 { 113 struct landlock_rule *new_rule; 114 u32 new_num_layers; 115 116 build_check_rule(); 117 if (new_layer) { 118 /* Should already be checked by landlock_merge_ruleset(). */ 119 if (WARN_ON_ONCE(num_layers >= LANDLOCK_MAX_NUM_LAYERS)) 120 return ERR_PTR(-E2BIG); 121 new_num_layers = num_layers + 1; 122 } else { 123 new_num_layers = num_layers; 124 } 125 new_rule = kzalloc_flex(*new_rule, layers, new_num_layers, 126 GFP_KERNEL_ACCOUNT); 127 if (!new_rule) 128 return ERR_PTR(-ENOMEM); 129 RB_CLEAR_NODE(&new_rule->node); 130 if (is_object_pointer(id.type)) { 131 /* This should have been caught by insert_rule(). */ 132 WARN_ON_ONCE(!id.key.object); 133 landlock_get_object(id.key.object); 134 } 135 136 new_rule->key = id.key; 137 new_rule->num_layers = new_num_layers; 138 /* Copies the original layer stack. */ 139 memcpy(new_rule->layers, layers, 140 flex_array_size(new_rule, layers, num_layers)); 141 if (new_layer) 142 /* Adds a copy of @new_layer on the layer stack. */ 143 new_rule->layers[new_rule->num_layers - 1] = *new_layer; 144 return new_rule; 145 } 146 147 static struct rb_root *get_root(struct landlock_ruleset *const ruleset, 148 const enum landlock_key_type key_type) 149 { 150 switch (key_type) { 151 case LANDLOCK_KEY_INODE: 152 return &ruleset->root_inode; 153 154 #if IS_ENABLED(CONFIG_INET) 155 case LANDLOCK_KEY_NET_PORT: 156 return &ruleset->root_net_port; 157 #endif /* IS_ENABLED(CONFIG_INET) */ 158 159 default: 160 WARN_ON_ONCE(1); 161 return ERR_PTR(-EINVAL); 162 } 163 } 164 165 static void free_rule(struct landlock_rule *const rule, 166 const enum landlock_key_type key_type) 167 { 168 might_sleep(); 169 if (!rule) 170 return; 171 if (is_object_pointer(key_type)) 172 landlock_put_object(rule->key.object); 173 kfree(rule); 174 } 175 176 static void build_check_ruleset(void) 177 { 178 const struct landlock_ruleset ruleset = { 179 .num_rules = ~0, 180 .num_layers = ~0, 181 }; 182 183 BUILD_BUG_ON(ruleset.num_rules < LANDLOCK_MAX_NUM_RULES); 184 BUILD_BUG_ON(ruleset.num_layers < LANDLOCK_MAX_NUM_LAYERS); 185 } 186 187 /** 188 * insert_rule - Create and insert a rule in a ruleset 189 * 190 * @ruleset: The ruleset to be updated. 191 * @id: The ID to build the new rule with. The underlying kernel object, if 192 * any, must be held by the caller. 193 * @layers: One or multiple layers to be copied into the new rule. 194 * @num_layers: The number of @layers entries. 195 * 196 * When user space requests to add a new rule to a ruleset, @layers only 197 * contains one entry and this entry is not assigned to any level. In this 198 * case, the new rule will extend @ruleset, similarly to a boolean OR between 199 * access rights. 200 * 201 * When merging a ruleset in a domain, or copying a domain, @layers will be 202 * added to @ruleset as new constraints, similarly to a boolean AND between 203 * access rights. 204 * 205 * Return: 0 on success, -errno on failure. 206 */ 207 static int insert_rule(struct landlock_ruleset *const ruleset, 208 const struct landlock_id id, 209 const struct landlock_layer (*layers)[], 210 const size_t num_layers) 211 { 212 struct rb_node **walker_node; 213 struct rb_node *parent_node = NULL; 214 struct landlock_rule *new_rule; 215 struct rb_root *root; 216 217 might_sleep(); 218 lockdep_assert_held(&ruleset->lock); 219 if (WARN_ON_ONCE(!layers)) 220 return -ENOENT; 221 222 if (is_object_pointer(id.type) && WARN_ON_ONCE(!id.key.object)) 223 return -ENOENT; 224 225 root = get_root(ruleset, id.type); 226 if (IS_ERR(root)) 227 return PTR_ERR(root); 228 229 walker_node = &root->rb_node; 230 while (*walker_node) { 231 struct landlock_rule *const this = 232 rb_entry(*walker_node, struct landlock_rule, node); 233 234 if (this->key.data != id.key.data) { 235 parent_node = *walker_node; 236 if (this->key.data < id.key.data) 237 walker_node = &((*walker_node)->rb_right); 238 else 239 walker_node = &((*walker_node)->rb_left); 240 continue; 241 } 242 243 /* Only a single-level layer should match an existing rule. */ 244 if (WARN_ON_ONCE(num_layers != 1)) 245 return -EINVAL; 246 247 /* If there is a matching rule, updates it. */ 248 if ((*layers)[0].level == 0) { 249 /* 250 * Extends access rights when the request comes from 251 * landlock_add_rule(2), i.e. @ruleset is not a domain. 252 */ 253 if (WARN_ON_ONCE(this->num_layers != 1)) 254 return -EINVAL; 255 if (WARN_ON_ONCE(this->layers[0].level != 0)) 256 return -EINVAL; 257 this->layers[0].access |= (*layers)[0].access; 258 return 0; 259 } 260 261 if (WARN_ON_ONCE(this->layers[0].level == 0)) 262 return -EINVAL; 263 264 /* 265 * Intersects access rights when it is a merge between a 266 * ruleset and a domain. 267 */ 268 new_rule = create_rule(id, &this->layers, this->num_layers, 269 &(*layers)[0]); 270 if (IS_ERR(new_rule)) 271 return PTR_ERR(new_rule); 272 rb_replace_node(&this->node, &new_rule->node, root); 273 free_rule(this, id.type); 274 return 0; 275 } 276 277 /* There is no match for @id. */ 278 build_check_ruleset(); 279 if (ruleset->num_rules >= LANDLOCK_MAX_NUM_RULES) 280 return -E2BIG; 281 new_rule = create_rule(id, layers, num_layers, NULL); 282 if (IS_ERR(new_rule)) 283 return PTR_ERR(new_rule); 284 rb_link_node(&new_rule->node, parent_node, walker_node); 285 rb_insert_color(&new_rule->node, root); 286 ruleset->num_rules++; 287 return 0; 288 } 289 290 static void build_check_layer(void) 291 { 292 const struct landlock_layer layer = { 293 .level = ~0, 294 .access = ~0, 295 }; 296 297 /* 298 * Checks that .level and .access are large enough to contain their expected 299 * maximum values. 300 */ 301 BUILD_BUG_ON(layer.level < LANDLOCK_MAX_NUM_LAYERS); 302 BUILD_BUG_ON(layer.access < LANDLOCK_MASK_ACCESS_FS); 303 } 304 305 /* @ruleset must be locked by the caller. */ 306 int landlock_insert_rule(struct landlock_ruleset *const ruleset, 307 const struct landlock_id id, 308 const access_mask_t access) 309 { 310 struct landlock_layer layers[] = { { 311 .access = access, 312 /* When @level is zero, insert_rule() extends @ruleset. */ 313 .level = 0, 314 } }; 315 316 build_check_layer(); 317 return insert_rule(ruleset, id, &layers, ARRAY_SIZE(layers)); 318 } 319 320 static int merge_tree(struct landlock_ruleset *const dst, 321 struct landlock_ruleset *const src, 322 const enum landlock_key_type key_type) 323 { 324 struct landlock_rule *walker_rule, *next_rule; 325 struct rb_root *src_root; 326 int err = 0; 327 328 might_sleep(); 329 lockdep_assert_held(&dst->lock); 330 lockdep_assert_held(&src->lock); 331 332 src_root = get_root(src, key_type); 333 if (IS_ERR(src_root)) 334 return PTR_ERR(src_root); 335 336 /* Merges the @src tree. */ 337 rbtree_postorder_for_each_entry_safe(walker_rule, next_rule, src_root, 338 node) { 339 struct landlock_layer layers[] = { { 340 .level = dst->num_layers, 341 } }; 342 const struct landlock_id id = { 343 .key = walker_rule->key, 344 .type = key_type, 345 }; 346 347 if (WARN_ON_ONCE(walker_rule->num_layers != 1)) 348 return -EINVAL; 349 350 if (WARN_ON_ONCE(walker_rule->layers[0].level != 0)) 351 return -EINVAL; 352 353 layers[0].access = walker_rule->layers[0].access; 354 355 err = insert_rule(dst, id, &layers, ARRAY_SIZE(layers)); 356 if (err) 357 return err; 358 } 359 return err; 360 } 361 362 static int merge_ruleset(struct landlock_ruleset *const dst, 363 struct landlock_ruleset *const src) 364 { 365 int err = 0; 366 367 might_sleep(); 368 /* Should already be checked by landlock_merge_ruleset() */ 369 if (WARN_ON_ONCE(!src)) 370 return 0; 371 /* Only merge into a domain. */ 372 if (WARN_ON_ONCE(!dst || !dst->hierarchy)) 373 return -EINVAL; 374 375 /* Locks @dst first because we are its only owner. */ 376 mutex_lock(&dst->lock); 377 mutex_lock_nested(&src->lock, SINGLE_DEPTH_NESTING); 378 379 /* Stacks the new layer. */ 380 if (WARN_ON_ONCE(src->num_layers != 1 || dst->num_layers < 1)) { 381 err = -EINVAL; 382 goto out_unlock; 383 } 384 dst->access_masks[dst->num_layers - 1] = 385 landlock_upgrade_handled_access_masks(src->access_masks[0]); 386 387 /* Merges the @src inode tree. */ 388 err = merge_tree(dst, src, LANDLOCK_KEY_INODE); 389 if (err) 390 goto out_unlock; 391 392 #if IS_ENABLED(CONFIG_INET) 393 /* Merges the @src network port tree. */ 394 err = merge_tree(dst, src, LANDLOCK_KEY_NET_PORT); 395 if (err) 396 goto out_unlock; 397 #endif /* IS_ENABLED(CONFIG_INET) */ 398 399 out_unlock: 400 mutex_unlock(&src->lock); 401 mutex_unlock(&dst->lock); 402 return err; 403 } 404 405 static int inherit_tree(struct landlock_ruleset *const parent, 406 struct landlock_ruleset *const child, 407 const enum landlock_key_type key_type) 408 { 409 struct landlock_rule *walker_rule, *next_rule; 410 struct rb_root *parent_root; 411 int err = 0; 412 413 might_sleep(); 414 lockdep_assert_held(&parent->lock); 415 lockdep_assert_held(&child->lock); 416 417 parent_root = get_root(parent, key_type); 418 if (IS_ERR(parent_root)) 419 return PTR_ERR(parent_root); 420 421 /* Copies the @parent inode or network tree. */ 422 rbtree_postorder_for_each_entry_safe(walker_rule, next_rule, 423 parent_root, node) { 424 const struct landlock_id id = { 425 .key = walker_rule->key, 426 .type = key_type, 427 }; 428 429 err = insert_rule(child, id, &walker_rule->layers, 430 walker_rule->num_layers); 431 if (err) 432 return err; 433 } 434 return err; 435 } 436 437 static int inherit_ruleset(struct landlock_ruleset *const parent, 438 struct landlock_ruleset *const child) 439 { 440 int err = 0; 441 442 might_sleep(); 443 if (!parent) 444 return 0; 445 446 /* Locks @child first because we are its only owner. */ 447 mutex_lock(&child->lock); 448 mutex_lock_nested(&parent->lock, SINGLE_DEPTH_NESTING); 449 450 /* Copies the @parent inode tree. */ 451 err = inherit_tree(parent, child, LANDLOCK_KEY_INODE); 452 if (err) 453 goto out_unlock; 454 455 #if IS_ENABLED(CONFIG_INET) 456 /* Copies the @parent network port tree. */ 457 err = inherit_tree(parent, child, LANDLOCK_KEY_NET_PORT); 458 if (err) 459 goto out_unlock; 460 #endif /* IS_ENABLED(CONFIG_INET) */ 461 462 if (WARN_ON_ONCE(child->num_layers <= parent->num_layers)) { 463 err = -EINVAL; 464 goto out_unlock; 465 } 466 /* Copies the parent layer stack and leaves a space for the new layer. */ 467 memcpy(child->access_masks, parent->access_masks, 468 flex_array_size(parent, access_masks, parent->num_layers)); 469 470 if (WARN_ON_ONCE(!parent->hierarchy)) { 471 err = -EINVAL; 472 goto out_unlock; 473 } 474 landlock_get_hierarchy(parent->hierarchy); 475 child->hierarchy->parent = parent->hierarchy; 476 477 out_unlock: 478 mutex_unlock(&parent->lock); 479 mutex_unlock(&child->lock); 480 return err; 481 } 482 483 static void free_ruleset(struct landlock_ruleset *const ruleset) 484 { 485 struct landlock_rule *freeme, *next; 486 487 might_sleep(); 488 rbtree_postorder_for_each_entry_safe(freeme, next, &ruleset->root_inode, 489 node) 490 free_rule(freeme, LANDLOCK_KEY_INODE); 491 492 #if IS_ENABLED(CONFIG_INET) 493 rbtree_postorder_for_each_entry_safe(freeme, next, 494 &ruleset->root_net_port, node) 495 free_rule(freeme, LANDLOCK_KEY_NET_PORT); 496 #endif /* IS_ENABLED(CONFIG_INET) */ 497 498 landlock_put_hierarchy(ruleset->hierarchy); 499 kfree(ruleset); 500 } 501 502 void landlock_put_ruleset(struct landlock_ruleset *const ruleset) 503 { 504 might_sleep(); 505 if (ruleset && refcount_dec_and_test(&ruleset->usage)) 506 free_ruleset(ruleset); 507 } 508 509 static void free_ruleset_work(struct work_struct *const work) 510 { 511 struct landlock_ruleset *ruleset; 512 513 ruleset = container_of(work, struct landlock_ruleset, work_free); 514 free_ruleset(ruleset); 515 } 516 517 /* Only called by hook_cred_free(). */ 518 void landlock_put_ruleset_deferred(struct landlock_ruleset *const ruleset) 519 { 520 if (ruleset && refcount_dec_and_test(&ruleset->usage)) { 521 INIT_WORK(&ruleset->work_free, free_ruleset_work); 522 schedule_work(&ruleset->work_free); 523 } 524 } 525 526 /** 527 * landlock_merge_ruleset - Merge a ruleset with a domain 528 * 529 * @parent: Parent domain. 530 * @ruleset: New ruleset to be merged. 531 * 532 * The current task is requesting to be restricted. The subjective credentials 533 * must not be in an overridden state. cf. landlock_init_hierarchy_log(). 534 * 535 * Return: A new domain merging @parent and @ruleset on success, or ERR_PTR() 536 * on failure. If @parent is NULL, the new domain duplicates @ruleset. 537 */ 538 struct landlock_ruleset * 539 landlock_merge_ruleset(struct landlock_ruleset *const parent, 540 struct landlock_ruleset *const ruleset) 541 { 542 struct landlock_ruleset *new_dom __free(landlock_put_ruleset) = NULL; 543 u32 num_layers; 544 int err; 545 546 might_sleep(); 547 if (WARN_ON_ONCE(!ruleset || parent == ruleset)) 548 return ERR_PTR(-EINVAL); 549 550 if (parent) { 551 if (parent->num_layers >= LANDLOCK_MAX_NUM_LAYERS) 552 return ERR_PTR(-E2BIG); 553 num_layers = parent->num_layers + 1; 554 } else { 555 num_layers = 1; 556 } 557 558 /* Creates a new domain... */ 559 new_dom = create_ruleset(num_layers); 560 if (IS_ERR(new_dom)) 561 return new_dom; 562 563 new_dom->hierarchy = 564 kzalloc_obj(*new_dom->hierarchy, GFP_KERNEL_ACCOUNT); 565 if (!new_dom->hierarchy) 566 return ERR_PTR(-ENOMEM); 567 568 refcount_set(&new_dom->hierarchy->usage, 1); 569 570 /* ...as a child of @parent... */ 571 err = inherit_ruleset(parent, new_dom); 572 if (err) 573 return ERR_PTR(err); 574 575 /* ...and including @ruleset. */ 576 err = merge_ruleset(new_dom, ruleset); 577 if (err) 578 return ERR_PTR(err); 579 580 err = landlock_init_hierarchy_log(new_dom->hierarchy); 581 if (err) 582 return ERR_PTR(err); 583 584 return no_free_ptr(new_dom); 585 } 586 587 /* 588 * The returned access has the same lifetime as @ruleset. 589 */ 590 const struct landlock_rule * 591 landlock_find_rule(const struct landlock_ruleset *const ruleset, 592 const struct landlock_id id) 593 { 594 const struct rb_root *root; 595 const struct rb_node *node; 596 597 root = get_root((struct landlock_ruleset *)ruleset, id.type); 598 if (IS_ERR(root)) 599 return NULL; 600 node = root->rb_node; 601 602 while (node) { 603 struct landlock_rule *this = 604 rb_entry(node, struct landlock_rule, node); 605 606 if (this->key.data == id.key.data) 607 return this; 608 if (this->key.data < id.key.data) 609 node = node->rb_right; 610 else 611 node = node->rb_left; 612 } 613 return NULL; 614 } 615 616 /** 617 * landlock_unmask_layers - Remove the access rights in @masks 618 * which are granted in @rule 619 * 620 * Updates the set of (per-layer) unfulfilled access rights @masks 621 * so that all the access rights granted in @rule are removed from it 622 * (because they are now fulfilled). 623 * 624 * @rule: A rule that grants a set of access rights for each layer 625 * @masks: A matrix of unfulfilled access rights for each layer 626 * 627 * Return: True if the request is allowed (i.e. the access rights granted all 628 * remaining unfulfilled access rights and masks has no leftover set bits). 629 */ 630 bool landlock_unmask_layers(const struct landlock_rule *const rule, 631 struct layer_access_masks *masks) 632 { 633 if (!masks) 634 return true; 635 if (!rule) 636 return false; 637 638 /* 639 * An access is granted if, for each policy layer, at least one rule 640 * encountered on the pathwalk grants the requested access, 641 * regardless of its position in the layer stack. We must then check 642 * the remaining layers for each inode, from the first added layer to 643 * the last one. When there is multiple requested accesses, for each 644 * policy layer, the full set of requested accesses may not be granted 645 * by only one rule, but by the union (binary OR) of multiple rules. 646 * E.g. /a/b <execute> + /a <read> => /a/b <execute + read> 647 */ 648 for (size_t i = 0; i < rule->num_layers; i++) { 649 const struct landlock_layer *const layer = &rule->layers[i]; 650 651 /* Clear the bits where the layer in the rule grants access. */ 652 masks->access[layer->level - 1] &= ~layer->access; 653 } 654 655 for (size_t i = 0; i < ARRAY_SIZE(masks->access); i++) { 656 if (masks->access[i]) 657 return false; 658 } 659 return true; 660 } 661 662 typedef access_mask_t 663 get_access_mask_t(const struct landlock_ruleset *const ruleset, 664 const u16 layer_level); 665 666 /** 667 * landlock_init_layer_masks - Initialize layer masks from an access request 668 * 669 * Populates @masks such that for each access right in @access_request, 670 * the bits for all the layers are set where this access right is handled. 671 * 672 * @domain: The domain that defines the current restrictions. 673 * @access_request: The requested access rights to check. 674 * @masks: Layer access masks to populate. 675 * @key_type: The key type to switch between access masks of different types. 676 * 677 * Return: An access mask where each access right bit is set which is handled 678 * in any of the active layers in @domain. 679 */ 680 access_mask_t 681 landlock_init_layer_masks(const struct landlock_ruleset *const domain, 682 const access_mask_t access_request, 683 struct layer_access_masks *const masks, 684 const enum landlock_key_type key_type) 685 { 686 access_mask_t handled_accesses = 0; 687 get_access_mask_t *get_access_mask; 688 689 switch (key_type) { 690 case LANDLOCK_KEY_INODE: 691 get_access_mask = landlock_get_fs_access_mask; 692 break; 693 694 #if IS_ENABLED(CONFIG_INET) 695 case LANDLOCK_KEY_NET_PORT: 696 get_access_mask = landlock_get_net_access_mask; 697 break; 698 #endif /* IS_ENABLED(CONFIG_INET) */ 699 700 default: 701 WARN_ON_ONCE(1); 702 return 0; 703 } 704 705 /* An empty access request can happen because of O_WRONLY | O_RDWR. */ 706 if (!access_request) 707 return 0; 708 709 for (size_t i = 0; i < domain->num_layers; i++) { 710 const access_mask_t handled = get_access_mask(domain, i); 711 712 masks->access[i] = access_request & handled; 713 handled_accesses |= masks->access[i]; 714 } 715 for (size_t i = domain->num_layers; i < ARRAY_SIZE(masks->access); i++) 716 masks->access[i] = 0; 717 718 return handled_accesses; 719 } 720