1 // SPDX-License-Identifier: GPL-2.0-or-later 2 /* Task credentials management - see Documentation/security/credentials.rst 3 * 4 * Copyright (C) 2008 Red Hat, Inc. All Rights Reserved. 5 * Written by David Howells (dhowells@redhat.com) 6 */ 7 8 #define pr_fmt(fmt) "CRED: " fmt 9 10 #include <linux/export.h> 11 #include <linux/cred.h> 12 #include <linux/slab.h> 13 #include <linux/sched.h> 14 #include <linux/sched/coredump.h> 15 #include <linux/key.h> 16 #include <linux/keyctl.h> 17 #include <linux/init_task.h> 18 #include <linux/security.h> 19 #include <linux/binfmts.h> 20 #include <linux/cn_proc.h> 21 #include <linux/uidgid.h> 22 23 #if 0 24 #define kdebug(FMT, ...) \ 25 printk("[%-5.5s%5u] " FMT "\n", \ 26 current->comm, current->pid, ##__VA_ARGS__) 27 #else 28 #define kdebug(FMT, ...) \ 29 do { \ 30 if (0) \ 31 no_printk("[%-5.5s%5u] " FMT "\n", \ 32 current->comm, current->pid, ##__VA_ARGS__); \ 33 } while (0) 34 #endif 35 36 static struct kmem_cache *cred_jar; 37 38 /* init to 2 - one for init_task, one to ensure it is never freed */ 39 static struct group_info init_groups = { .usage = REFCOUNT_INIT(2) }; 40 41 /* 42 * The initial credentials for the initial task 43 */ 44 struct cred init_cred = { 45 .usage = ATOMIC_INIT(4), 46 .uid = GLOBAL_ROOT_UID, 47 .gid = GLOBAL_ROOT_GID, 48 .suid = GLOBAL_ROOT_UID, 49 .sgid = GLOBAL_ROOT_GID, 50 .euid = GLOBAL_ROOT_UID, 51 .egid = GLOBAL_ROOT_GID, 52 .fsuid = GLOBAL_ROOT_UID, 53 .fsgid = GLOBAL_ROOT_GID, 54 .securebits = SECUREBITS_DEFAULT, 55 .cap_inheritable = CAP_EMPTY_SET, 56 .cap_permitted = CAP_FULL_SET, 57 .cap_effective = CAP_FULL_SET, 58 .cap_bset = CAP_FULL_SET, 59 .user = INIT_USER, 60 .user_ns = &init_user_ns, 61 .group_info = &init_groups, 62 .ucounts = &init_ucounts, 63 }; 64 65 /* 66 * The RCU callback to actually dispose of a set of credentials 67 */ 68 static void put_cred_rcu(struct rcu_head *rcu) 69 { 70 struct cred *cred = container_of(rcu, struct cred, rcu); 71 72 kdebug("put_cred_rcu(%p)", cred); 73 74 if (atomic_long_read(&cred->usage) != 0) 75 panic("CRED: put_cred_rcu() sees %p with usage %ld\n", 76 cred, atomic_long_read(&cred->usage)); 77 78 security_cred_free(cred); 79 key_put(cred->session_keyring); 80 key_put(cred->process_keyring); 81 key_put(cred->thread_keyring); 82 key_put(cred->request_key_auth); 83 if (cred->group_info) 84 put_group_info(cred->group_info); 85 free_uid(cred->user); 86 if (cred->ucounts) 87 put_ucounts(cred->ucounts); 88 put_user_ns(cred->user_ns); 89 kmem_cache_free(cred_jar, cred); 90 } 91 92 /** 93 * __put_cred - Destroy a set of credentials 94 * @cred: The record to release 95 * 96 * Destroy a set of credentials on which no references remain. 97 */ 98 void __put_cred(struct cred *cred) 99 { 100 kdebug("__put_cred(%p{%ld})", cred, 101 atomic_long_read(&cred->usage)); 102 103 BUG_ON(atomic_long_read(&cred->usage) != 0); 104 BUG_ON(cred == current->cred); 105 BUG_ON(cred == current->real_cred); 106 107 if (cred->non_rcu) 108 put_cred_rcu(&cred->rcu); 109 else 110 call_rcu(&cred->rcu, put_cred_rcu); 111 } 112 EXPORT_SYMBOL(__put_cred); 113 114 /* 115 * Clean up a task's credentials when it exits 116 */ 117 void exit_creds(struct task_struct *tsk) 118 { 119 struct cred *real_cred, *cred; 120 121 kdebug("exit_creds(%u,%p,%p,{%ld})", tsk->pid, tsk->real_cred, tsk->cred, 122 atomic_long_read(&tsk->cred->usage)); 123 124 real_cred = (struct cred *) tsk->real_cred; 125 tsk->real_cred = NULL; 126 127 cred = (struct cred *) tsk->cred; 128 tsk->cred = NULL; 129 130 if (real_cred == cred) { 131 put_cred_many(cred, 2); 132 } else { 133 put_cred(real_cred); 134 put_cred(cred); 135 } 136 137 #ifdef CONFIG_KEYS_REQUEST_CACHE 138 key_put(tsk->cached_requested_key); 139 tsk->cached_requested_key = NULL; 140 #endif 141 } 142 143 /** 144 * get_task_cred - Get another task's objective credentials 145 * @task: The task to query 146 * 147 * Get the objective credentials of a task, pinning them so that they can't go 148 * away. Accessing a task's credentials directly is not permitted. 149 * 150 * The caller must also make sure task doesn't get deleted, either by holding a 151 * ref on task or by holding tasklist_lock to prevent it from being unlinked. 152 */ 153 const struct cred *get_task_cred(struct task_struct *task) 154 { 155 const struct cred *cred; 156 157 rcu_read_lock(); 158 159 do { 160 cred = __task_cred((task)); 161 BUG_ON(!cred); 162 } while (!get_cred_rcu(cred)); 163 164 rcu_read_unlock(); 165 return cred; 166 } 167 EXPORT_SYMBOL(get_task_cred); 168 169 /* 170 * Allocate blank credentials, such that the credentials can be filled in at a 171 * later date without risk of ENOMEM. 172 */ 173 struct cred *cred_alloc_blank(void) 174 { 175 struct cred *new; 176 177 new = kmem_cache_zalloc(cred_jar, GFP_KERNEL); 178 if (!new) 179 return NULL; 180 181 atomic_long_set(&new->usage, 1); 182 if (security_cred_alloc_blank(new, GFP_KERNEL_ACCOUNT) < 0) 183 goto error; 184 185 return new; 186 187 error: 188 abort_creds(new); 189 return NULL; 190 } 191 192 /** 193 * prepare_creds - Prepare a new set of credentials for modification 194 * 195 * Prepare a new set of task credentials for modification. A task's creds 196 * shouldn't generally be modified directly, therefore this function is used to 197 * prepare a new copy, which the caller then modifies and then commits by 198 * calling commit_creds(). 199 * 200 * Preparation involves making a copy of the objective creds for modification. 201 * 202 * Returns a pointer to the new creds-to-be if successful, NULL otherwise. 203 * 204 * Call commit_creds() or abort_creds() to clean up. 205 */ 206 struct cred *prepare_creds(void) 207 { 208 struct task_struct *task = current; 209 const struct cred *old; 210 struct cred *new; 211 212 new = kmem_cache_alloc(cred_jar, GFP_KERNEL); 213 if (!new) 214 return NULL; 215 216 kdebug("prepare_creds() alloc %p", new); 217 218 old = task->cred; 219 memcpy(new, old, sizeof(struct cred)); 220 221 new->non_rcu = 0; 222 atomic_long_set(&new->usage, 1); 223 get_group_info(new->group_info); 224 get_uid(new->user); 225 get_user_ns(new->user_ns); 226 227 #ifdef CONFIG_KEYS 228 key_get(new->session_keyring); 229 key_get(new->process_keyring); 230 key_get(new->thread_keyring); 231 key_get(new->request_key_auth); 232 #endif 233 234 #ifdef CONFIG_SECURITY 235 new->security = NULL; 236 #endif 237 238 new->ucounts = get_ucounts(new->ucounts); 239 if (!new->ucounts) 240 goto error; 241 242 if (security_prepare_creds(new, old, GFP_KERNEL_ACCOUNT) < 0) 243 goto error; 244 245 return new; 246 247 error: 248 abort_creds(new); 249 return NULL; 250 } 251 EXPORT_SYMBOL(prepare_creds); 252 253 /* 254 * Prepare credentials for current to perform an execve() 255 * - The caller must hold ->cred_guard_mutex 256 */ 257 struct cred *prepare_exec_creds(void) 258 { 259 struct cred *new; 260 261 new = prepare_creds(); 262 if (!new) 263 return new; 264 265 #ifdef CONFIG_KEYS 266 /* newly exec'd tasks don't get a thread keyring */ 267 key_put(new->thread_keyring); 268 new->thread_keyring = NULL; 269 270 /* inherit the session keyring; new process keyring */ 271 key_put(new->process_keyring); 272 new->process_keyring = NULL; 273 #endif 274 275 new->suid = new->fsuid = new->euid; 276 new->sgid = new->fsgid = new->egid; 277 278 return new; 279 } 280 281 /* 282 * Copy credentials for the new process created by fork() 283 * 284 * We share if we can, but under some circumstances we have to generate a new 285 * set. 286 * 287 * The new process gets the current process's subjective credentials as its 288 * objective and subjective credentials 289 */ 290 int copy_creds(struct task_struct *p, u64 clone_flags) 291 { 292 struct cred *new; 293 int ret; 294 295 #ifdef CONFIG_KEYS_REQUEST_CACHE 296 p->cached_requested_key = NULL; 297 #endif 298 299 if ( 300 #ifdef CONFIG_KEYS 301 !p->cred->thread_keyring && 302 #endif 303 clone_flags & CLONE_THREAD 304 ) { 305 p->real_cred = get_cred_many(p->cred, 2); 306 kdebug("share_creds(%p{%ld})", 307 p->cred, atomic_long_read(&p->cred->usage)); 308 inc_rlimit_ucounts(task_ucounts(p), UCOUNT_RLIMIT_NPROC, 1); 309 get_cred_namespaces(p); 310 return 0; 311 } 312 313 new = prepare_creds(); 314 if (!new) 315 return -ENOMEM; 316 317 if (clone_flags & CLONE_NEWUSER) { 318 ret = create_user_ns(new); 319 if (ret < 0) 320 goto error_put; 321 ret = set_cred_ucounts(new); 322 if (ret < 0) 323 goto error_put; 324 } 325 326 #ifdef CONFIG_KEYS 327 /* new threads get their own thread keyrings if their parent already 328 * had one */ 329 if (new->thread_keyring) { 330 key_put(new->thread_keyring); 331 new->thread_keyring = NULL; 332 if (clone_flags & CLONE_THREAD) 333 install_thread_keyring_to_cred(new); 334 } 335 336 /* The process keyring is only shared between the threads in a process; 337 * anything outside of those threads doesn't inherit. 338 */ 339 if (!(clone_flags & CLONE_THREAD)) { 340 key_put(new->process_keyring); 341 new->process_keyring = NULL; 342 } 343 #endif 344 345 p->cred = p->real_cred = get_cred(new); 346 inc_rlimit_ucounts(task_ucounts(p), UCOUNT_RLIMIT_NPROC, 1); 347 get_cred_namespaces(p); 348 349 return 0; 350 351 error_put: 352 put_cred(new); 353 return ret; 354 } 355 356 static bool cred_cap_issubset(const struct cred *set, const struct cred *subset) 357 { 358 const struct user_namespace *set_ns = set->user_ns; 359 const struct user_namespace *subset_ns = subset->user_ns; 360 361 /* If the two credentials are in the same user namespace see if 362 * the capabilities of subset are a subset of set. 363 */ 364 if (set_ns == subset_ns) 365 return cap_issubset(subset->cap_permitted, set->cap_permitted); 366 367 /* The credentials are in a different user namespaces 368 * therefore one is a subset of the other only if a set is an 369 * ancestor of subset and set->euid is owner of subset or one 370 * of subsets ancestors. 371 */ 372 for (;subset_ns != &init_user_ns; subset_ns = subset_ns->parent) { 373 if ((set_ns == subset_ns->parent) && 374 uid_eq(subset_ns->owner, set->euid)) 375 return true; 376 } 377 378 return false; 379 } 380 381 /** 382 * commit_creds - Install new credentials upon the current task 383 * @new: The credentials to be assigned 384 * 385 * Install a new set of credentials to the current task, using RCU to replace 386 * the old set. Both the objective and the subjective credentials pointers are 387 * updated. This function may not be called if the subjective credentials are 388 * in an overridden state. 389 * 390 * This function eats the caller's reference to the new credentials. 391 * 392 * Always returns 0 thus allowing this function to be tail-called at the end 393 * of, say, sys_setgid(). 394 */ 395 int commit_creds(struct cred *new) 396 { 397 struct task_struct *task = current; 398 const struct cred *old = task->real_cred; 399 400 kdebug("commit_creds(%p{%ld})", new, 401 atomic_long_read(&new->usage)); 402 403 BUG_ON(task->cred != old); 404 BUG_ON(atomic_long_read(&new->usage) < 1); 405 406 get_cred(new); /* we will require a ref for the subj creds too */ 407 408 /* dumpability changes */ 409 if (!uid_eq(old->euid, new->euid) || 410 !gid_eq(old->egid, new->egid) || 411 !uid_eq(old->fsuid, new->fsuid) || 412 !gid_eq(old->fsgid, new->fsgid) || 413 !cred_cap_issubset(old, new)) { 414 if (task->mm) 415 set_dumpable(task->mm, suid_dumpable); 416 task->pdeath_signal = 0; 417 /* 418 * If a task drops privileges and becomes nondumpable, 419 * the dumpability change must become visible before 420 * the credential change; otherwise, a __ptrace_may_access() 421 * racing with this change may be able to attach to a task it 422 * shouldn't be able to attach to (as if the task had dropped 423 * privileges without becoming nondumpable). 424 * Pairs with a read barrier in __ptrace_may_access(). 425 */ 426 smp_wmb(); 427 } 428 429 /* alter the thread keyring */ 430 if (!uid_eq(new->fsuid, old->fsuid)) 431 key_fsuid_changed(new); 432 if (!gid_eq(new->fsgid, old->fsgid)) 433 key_fsgid_changed(new); 434 435 /* do it 436 * RLIMIT_NPROC limits on user->processes have already been checked 437 * in set_user(). 438 */ 439 if (new->user != old->user || new->user_ns != old->user_ns) 440 inc_rlimit_ucounts(new->ucounts, UCOUNT_RLIMIT_NPROC, 1); 441 442 rcu_assign_pointer(task->real_cred, new); 443 rcu_assign_pointer(task->cred, new); 444 if (new->user != old->user || new->user_ns != old->user_ns) 445 dec_rlimit_ucounts(old->ucounts, UCOUNT_RLIMIT_NPROC, 1); 446 if (new->user_ns != old->user_ns) 447 switch_cred_namespaces(old, new); 448 449 /* send notifications */ 450 if (!uid_eq(new->uid, old->uid) || 451 !uid_eq(new->euid, old->euid) || 452 !uid_eq(new->suid, old->suid) || 453 !uid_eq(new->fsuid, old->fsuid)) 454 proc_id_connector(task, PROC_EVENT_UID); 455 456 if (!gid_eq(new->gid, old->gid) || 457 !gid_eq(new->egid, old->egid) || 458 !gid_eq(new->sgid, old->sgid) || 459 !gid_eq(new->fsgid, old->fsgid)) 460 proc_id_connector(task, PROC_EVENT_GID); 461 462 /* release the old obj and subj refs both */ 463 put_cred_many(old, 2); 464 return 0; 465 } 466 EXPORT_SYMBOL(commit_creds); 467 468 /** 469 * abort_creds - Discard a set of credentials and unlock the current task 470 * @new: The credentials that were going to be applied 471 * 472 * Discard a set of credentials that were under construction and unlock the 473 * current task. 474 */ 475 void abort_creds(struct cred *new) 476 { 477 kdebug("abort_creds(%p{%ld})", new, 478 atomic_long_read(&new->usage)); 479 480 BUG_ON(atomic_long_read(&new->usage) < 1); 481 put_cred(new); 482 } 483 EXPORT_SYMBOL(abort_creds); 484 485 /** 486 * cred_fscmp - Compare two credentials with respect to filesystem access. 487 * @a: The first credential 488 * @b: The second credential 489 * 490 * cred_cmp() will return zero if both credentials have the same 491 * fsuid, fsgid, and supplementary groups. That is, if they will both 492 * provide the same access to files based on mode/uid/gid. 493 * If the credentials are different, then either -1 or 1 will 494 * be returned depending on whether @a comes before or after @b 495 * respectively in an arbitrary, but stable, ordering of credentials. 496 * 497 * Return: -1, 0, or 1 depending on comparison 498 */ 499 int cred_fscmp(const struct cred *a, const struct cred *b) 500 { 501 struct group_info *ga, *gb; 502 int g; 503 504 if (a == b) 505 return 0; 506 if (uid_lt(a->fsuid, b->fsuid)) 507 return -1; 508 if (uid_gt(a->fsuid, b->fsuid)) 509 return 1; 510 511 if (gid_lt(a->fsgid, b->fsgid)) 512 return -1; 513 if (gid_gt(a->fsgid, b->fsgid)) 514 return 1; 515 516 ga = a->group_info; 517 gb = b->group_info; 518 if (ga == gb) 519 return 0; 520 if (ga == NULL) 521 return -1; 522 if (gb == NULL) 523 return 1; 524 if (ga->ngroups < gb->ngroups) 525 return -1; 526 if (ga->ngroups > gb->ngroups) 527 return 1; 528 529 for (g = 0; g < ga->ngroups; g++) { 530 if (gid_lt(ga->gid[g], gb->gid[g])) 531 return -1; 532 if (gid_gt(ga->gid[g], gb->gid[g])) 533 return 1; 534 } 535 return 0; 536 } 537 EXPORT_SYMBOL(cred_fscmp); 538 539 int set_cred_ucounts(struct cred *new) 540 { 541 struct ucounts *new_ucounts, *old_ucounts = new->ucounts; 542 543 /* 544 * This optimization is needed because alloc_ucounts() uses locks 545 * for table lookups. 546 */ 547 if (old_ucounts->ns == new->user_ns && uid_eq(old_ucounts->uid, new->uid)) 548 return 0; 549 550 if (!(new_ucounts = alloc_ucounts(new->user_ns, new->uid))) 551 return -EAGAIN; 552 553 new->ucounts = new_ucounts; 554 put_ucounts(old_ucounts); 555 556 return 0; 557 } 558 559 /* 560 * initialise the credentials stuff 561 */ 562 void __init cred_init(void) 563 { 564 /* allocate a slab in which we can store credentials */ 565 cred_jar = KMEM_CACHE(cred, 566 SLAB_HWCACHE_ALIGN | SLAB_PANIC | SLAB_ACCOUNT); 567 } 568 569 /** 570 * prepare_kernel_cred - Prepare a set of credentials for a kernel service 571 * @daemon: A userspace daemon to be used as a reference 572 * 573 * Prepare a set of credentials for a kernel service. This can then be used to 574 * override a task's own credentials so that work can be done on behalf of that 575 * task that requires a different subjective context. 576 * 577 * @daemon is used to provide a base cred, with the security data derived from 578 * that; if this is "&init_task", they'll be set to 0, no groups, full 579 * capabilities, and no keys. 580 * 581 * The caller may change these controls afterwards if desired. 582 * 583 * Returns the new credentials or NULL if out of memory. 584 */ 585 struct cred *prepare_kernel_cred(struct task_struct *daemon) 586 { 587 const struct cred *old; 588 struct cred *new; 589 590 if (WARN_ON_ONCE(!daemon)) 591 return NULL; 592 593 new = kmem_cache_alloc(cred_jar, GFP_KERNEL); 594 if (!new) 595 return NULL; 596 597 kdebug("prepare_kernel_cred() alloc %p", new); 598 599 old = get_task_cred(daemon); 600 601 *new = *old; 602 new->non_rcu = 0; 603 atomic_long_set(&new->usage, 1); 604 get_uid(new->user); 605 get_user_ns(new->user_ns); 606 get_group_info(new->group_info); 607 608 #ifdef CONFIG_KEYS 609 new->session_keyring = NULL; 610 new->process_keyring = NULL; 611 new->thread_keyring = NULL; 612 new->request_key_auth = NULL; 613 new->jit_keyring = KEY_REQKEY_DEFL_THREAD_KEYRING; 614 #endif 615 616 #ifdef CONFIG_SECURITY 617 new->security = NULL; 618 #endif 619 new->ucounts = get_ucounts(new->ucounts); 620 if (!new->ucounts) 621 goto error; 622 623 if (security_prepare_creds(new, old, GFP_KERNEL_ACCOUNT) < 0) 624 goto error; 625 626 put_cred(old); 627 return new; 628 629 error: 630 put_cred(new); 631 put_cred(old); 632 return NULL; 633 } 634 EXPORT_SYMBOL(prepare_kernel_cred); 635 636 /** 637 * set_security_override - Set the security ID in a set of credentials 638 * @new: The credentials to alter 639 * @secid: The LSM security ID to set 640 * 641 * Set the LSM security ID in a set of credentials so that the subjective 642 * security is overridden when an alternative set of credentials is used. 643 */ 644 int set_security_override(struct cred *new, u32 secid) 645 { 646 return security_kernel_act_as(new, secid); 647 } 648 EXPORT_SYMBOL(set_security_override); 649 650 /** 651 * set_security_override_from_ctx - Set the security ID in a set of credentials 652 * @new: The credentials to alter 653 * @secctx: The LSM security context to generate the security ID from. 654 * 655 * Set the LSM security ID in a set of credentials so that the subjective 656 * security is overridden when an alternative set of credentials is used. The 657 * security ID is specified in string form as a security context to be 658 * interpreted by the LSM. 659 */ 660 int set_security_override_from_ctx(struct cred *new, const char *secctx) 661 { 662 u32 secid; 663 int ret; 664 665 ret = security_secctx_to_secid(secctx, strlen(secctx), &secid); 666 if (ret < 0) 667 return ret; 668 669 return set_security_override(new, secid); 670 } 671 EXPORT_SYMBOL(set_security_override_from_ctx); 672 673 /** 674 * set_create_files_as - Set the LSM file create context in a set of credentials 675 * @new: The credentials to alter 676 * @inode: The inode to take the context from 677 * 678 * Change the LSM file creation context in a set of credentials to be the same 679 * as the object context of the specified inode, so that the new inodes have 680 * the same MAC context as that inode. 681 */ 682 int set_create_files_as(struct cred *new, struct inode *inode) 683 { 684 if (!uid_valid(inode->i_uid) || !gid_valid(inode->i_gid)) 685 return -EINVAL; 686 new->fsuid = inode->i_uid; 687 new->fsgid = inode->i_gid; 688 return security_kernel_create_files_as(new, inode); 689 } 690 EXPORT_SYMBOL(set_create_files_as); 691