/*
 * Copyright (c) 1989, 1993
 *	The Regents of the University of California.  All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 4. Neither the name of the University nor the names of its contributors
 *    may be used to endorse or promote products derived from this software
 *    without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 *
 *	@(#)kern_ktrace.c	8.2 (Berkeley) 9/23/93
 */

#include <sys/cdefs.h>
__FBSDID("$FreeBSD$");

#include "opt_ktrace.h"
#include "opt_mac.h"

#include <sys/param.h>
#include <sys/systm.h>
#include <sys/fcntl.h>
#include <sys/kernel.h>
#include <sys/kthread.h>
#include <sys/lock.h>
#include <sys/mutex.h>
#include <sys/mac.h>
#include <sys/malloc.h>
#include <sys/namei.h>
#include <sys/proc.h>
#include <sys/unistd.h>
#include <sys/vnode.h>
#include <sys/ktrace.h>
#include <sys/sx.h>
#include <sys/sysctl.h>
#include <sys/syslog.h>
#include <sys/sysproto.h>

static MALLOC_DEFINE(M_KTRACE, "KTRACE", "KTRACE");

#ifdef KTRACE

#ifndef KTRACE_REQUEST_POOL
#define	KTRACE_REQUEST_POOL	100
#endif

struct ktr_request {
	struct	ktr_header ktr_header;
	struct	ucred *ktr_cred;
	struct	vnode *ktr_vp;
	union {
		struct	ktr_syscall ktr_syscall;
		struct	ktr_sysret ktr_sysret;
		struct	ktr_genio ktr_genio;
		struct	ktr_psig ktr_psig;
		struct	ktr_csw ktr_csw;
	} ktr_data;
	STAILQ_ENTRY(ktr_request) ktr_list;
};

static int data_lengths[] = {
	0,					/* none */
	offsetof(struct ktr_syscall, ktr_args),	/* KTR_SYSCALL */
	sizeof(struct ktr_sysret),		/* KTR_SYSRET */
	0,					/* KTR_NAMEI */
	sizeof(struct ktr_genio),		/* KTR_GENIO */
	sizeof(struct ktr_psig),		/* KTR_PSIG */
	sizeof(struct ktr_csw),			/* KTR_CSW */
	0					/* KTR_USER */
};

static STAILQ_HEAD(, ktr_request) ktr_todo;
static STAILQ_HEAD(, ktr_request) ktr_free;

SYSCTL_NODE(_kern, OID_AUTO, ktrace, CTLFLAG_RD, 0, "KTRACE options");

static u_int ktr_requestpool = KTRACE_REQUEST_POOL;
TUNABLE_INT("kern.ktrace.request_pool", &ktr_requestpool);

static u_int ktr_geniosize = PAGE_SIZE;
TUNABLE_INT("kern.ktrace.genio_size", &ktr_geniosize);
SYSCTL_UINT(_kern_ktrace, OID_AUTO, genio_size, CTLFLAG_RW,
    &ktr_geniosize, 0, "Maximum size of genio event payload");
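
/*
 * print_message rate-limits the console warning printed when the
 * request pool runs dry.  ktrace_mtx protects the free pool, the todo
 * queue, and updates to the per-process p_trace* fields; ktrace_cv
 * wakes the worker thread when a new request is queued.
 */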
static int print_message = 1;
struct mtx ktrace_mtx;
static struct cv ktrace_cv;

static void ktrace_init(void *dummy);
static int sysctl_kern_ktrace_request_pool(SYSCTL_HANDLER_ARGS);
static u_int ktrace_resize_pool(u_int newsize);
static struct ktr_request *ktr_getrequest(int type);
static void ktr_submitrequest(struct ktr_request *req);
static void ktr_freerequest(struct ktr_request *req);
static void ktr_loop(void *dummy);
static void ktr_writerequest(struct ktr_request *req);
static int ktrcanset(struct thread *, struct proc *);
static int ktrsetchildren(struct thread *, struct proc *, int, int, struct vnode *);
static int ktrops(struct thread *, struct proc *, int, int, struct vnode *);

static void
ktrace_init(void *dummy)
{
	struct ktr_request *req;
	int i;

	mtx_init(&ktrace_mtx, "ktrace", NULL, MTX_DEF | MTX_QUIET);
	cv_init(&ktrace_cv, "ktrace");
	STAILQ_INIT(&ktr_todo);
	STAILQ_INIT(&ktr_free);
	for (i = 0; i < ktr_requestpool; i++) {
		req = malloc(sizeof(struct ktr_request), M_KTRACE, M_WAITOK);
		STAILQ_INSERT_HEAD(&ktr_free, req, ktr_list);
	}
	kthread_create(ktr_loop, NULL, NULL, RFHIGHPID, 0, "ktrace");
}
SYSINIT(ktrace_init, SI_SUB_KTRACE, SI_ORDER_ANY, ktrace_init, NULL);

static int
sysctl_kern_ktrace_request_pool(SYSCTL_HANDLER_ARGS)
{
	struct thread *td;
	u_int newsize, oldsize, wantsize;
	int error;

	/* Handle easy read-only case first to avoid warnings from GCC. */
	if (!req->newptr) {
		mtx_lock(&ktrace_mtx);
		oldsize = ktr_requestpool;
		mtx_unlock(&ktrace_mtx);
		return (SYSCTL_OUT(req, &oldsize, sizeof(u_int)));
	}

	error = SYSCTL_IN(req, &wantsize, sizeof(u_int));
	if (error)
		return (error);
	td = curthread;
	td->td_pflags |= TDP_INKTRACE;
	mtx_lock(&ktrace_mtx);
	oldsize = ktr_requestpool;
	newsize = ktrace_resize_pool(wantsize);
	mtx_unlock(&ktrace_mtx);
	td->td_pflags &= ~TDP_INKTRACE;
	error = SYSCTL_OUT(req, &oldsize, sizeof(u_int));
	if (error)
		return (error);
	if (wantsize > oldsize && newsize < wantsize)
		return (ENOSPC);
	return (0);
}
SYSCTL_PROC(_kern_ktrace, OID_AUTO, request_pool, CTLTYPE_UINT|CTLFLAG_RW,
    &ktr_requestpool, 0, sysctl_kern_ktrace_request_pool, "IU", "");

static u_int
ktrace_resize_pool(u_int newsize)
{
	struct ktr_request *req;
	int bound;

	mtx_assert(&ktrace_mtx, MA_OWNED);
	print_message = 1;
	bound = newsize - ktr_requestpool;
	if (bound == 0)
		return (ktr_requestpool);
	if (bound < 0)
		/* Shrink pool down to newsize if possible. */
		while (bound++ < 0) {
			req = STAILQ_FIRST(&ktr_free);
			if (req == NULL)
				return (ktr_requestpool);
			STAILQ_REMOVE_HEAD(&ktr_free, ktr_list);
			ktr_requestpool--;
			mtx_unlock(&ktrace_mtx);
			free(req, M_KTRACE);
			mtx_lock(&ktrace_mtx);
		}
	else
		/* Grow pool up to newsize. */
		while (bound-- > 0) {
			mtx_unlock(&ktrace_mtx);
			req = malloc(sizeof(struct ktr_request), M_KTRACE,
			    M_WAITOK);
			mtx_lock(&ktrace_mtx);
			STAILQ_INSERT_HEAD(&ktr_free, req, ktr_list);
			ktr_requestpool++;
		}
	return (ktr_requestpool);
}
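
/*
 * Allocate a request structure from the free pool and pre-initialize
 * its header for an event of the given type.  Returns NULL if the
 * process is not tracing this event type or if the pool is empty, in
 * which case KTRFAC_DROP is latched so that the next record written
 * is flagged with KTR_DROP.
 */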
static struct ktr_request *
ktr_getrequest(int type)
{
	struct ktr_request *req;
	struct thread *td = curthread;
	struct proc *p = td->td_proc;
	int pm;

	td->td_pflags |= TDP_INKTRACE;
	mtx_lock(&ktrace_mtx);
	if (!KTRCHECK(td, type)) {
		mtx_unlock(&ktrace_mtx);
		td->td_pflags &= ~TDP_INKTRACE;
		return (NULL);
	}
	req = STAILQ_FIRST(&ktr_free);
	if (req != NULL) {
		STAILQ_REMOVE_HEAD(&ktr_free, ktr_list);
		req->ktr_header.ktr_type = type;
		if (p->p_traceflag & KTRFAC_DROP) {
			req->ktr_header.ktr_type |= KTR_DROP;
			p->p_traceflag &= ~KTRFAC_DROP;
		}
		KASSERT(p->p_tracevp != NULL, ("ktrace: no trace vnode"));
		KASSERT(p->p_tracecred != NULL, ("ktrace: no trace cred"));
		req->ktr_vp = p->p_tracevp;
		VREF(p->p_tracevp);
		req->ktr_cred = crhold(p->p_tracecred);
		mtx_unlock(&ktrace_mtx);
		microtime(&req->ktr_header.ktr_time);
		req->ktr_header.ktr_pid = p->p_pid;
		bcopy(p->p_comm, req->ktr_header.ktr_comm, MAXCOMLEN + 1);
		req->ktr_header.ktr_buffer = NULL;
		req->ktr_header.ktr_len = 0;
	} else {
		p->p_traceflag |= KTRFAC_DROP;
		pm = print_message;
		print_message = 0;
		mtx_unlock(&ktrace_mtx);
		if (pm)
			printf("Out of ktrace request objects.\n");
		td->td_pflags &= ~TDP_INKTRACE;
	}
	return (req);
}

static void
ktr_submitrequest(struct ktr_request *req)
{

	mtx_lock(&ktrace_mtx);
	STAILQ_INSERT_TAIL(&ktr_todo, req, ktr_list);
	cv_signal(&ktrace_cv);
	mtx_unlock(&ktrace_mtx);
	curthread->td_pflags &= ~TDP_INKTRACE;
}

static void
ktr_freerequest(struct ktr_request *req)
{

	crfree(req->ktr_cred);
	if (req->ktr_vp != NULL) {
		mtx_lock(&Giant);
		vrele(req->ktr_vp);
		mtx_unlock(&Giant);
	}
	if (req->ktr_header.ktr_buffer != NULL)
		free(req->ktr_header.ktr_buffer, M_KTRACE);
	mtx_lock(&ktrace_mtx);
	STAILQ_INSERT_HEAD(&ktr_free, req, ktr_list);
	mtx_unlock(&ktrace_mtx);
}
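
/*
 * The dedicated ktrace worker thread: it sleeps until requests are
 * queued, then dequeues and writes them out one at a time, so that
 * traced threads never block in the filesystem themselves.
 */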
static void
ktr_loop(void *dummy)
{
	struct ktr_request *req;
	struct thread *td;
	struct ucred *cred;

	/* Only cache these values once. */
	td = curthread;
	cred = td->td_ucred;
	for (;;) {
		mtx_lock(&ktrace_mtx);
		while (STAILQ_EMPTY(&ktr_todo))
			cv_wait(&ktrace_cv, &ktrace_mtx);
		req = STAILQ_FIRST(&ktr_todo);
		STAILQ_REMOVE_HEAD(&ktr_todo, ktr_list);
		KASSERT(req != NULL, ("got a NULL request"));
		mtx_unlock(&ktrace_mtx);
		/*
		 * It is not enough just to pass the cached cred
		 * to the VOP's in ktr_writerequest().  Some VFS
		 * operations use curthread->td_ucred, so we need
		 * to modify our thread's credentials as well.
		 * Evil.
		 */
		td->td_ucred = req->ktr_cred;
		ktr_writerequest(req);
		td->td_ucred = cred;
		ktr_freerequest(req);
	}
}

/*
 * MPSAFE
 */
void
ktrsyscall(code, narg, args)
	int code, narg;
	register_t args[];
{
	struct ktr_request *req;
	struct ktr_syscall *ktp;
	size_t buflen;
	char *buf = NULL;

	buflen = sizeof(register_t) * narg;
	if (buflen > 0) {
		buf = malloc(buflen, M_KTRACE, M_WAITOK);
		bcopy(args, buf, buflen);
	}
	req = ktr_getrequest(KTR_SYSCALL);
	if (req == NULL) {
		if (buf != NULL)
			free(buf, M_KTRACE);
		return;
	}
	ktp = &req->ktr_data.ktr_syscall;
	ktp->ktr_code = code;
	ktp->ktr_narg = narg;
	if (buflen > 0) {
		req->ktr_header.ktr_len = buflen;
		req->ktr_header.ktr_buffer = buf;
	}
	ktr_submitrequest(req);
}

/*
 * MPSAFE
 */
void
ktrsysret(code, error, retval)
	int code, error;
	register_t retval;
{
	struct ktr_request *req;
	struct ktr_sysret *ktp;

	req = ktr_getrequest(KTR_SYSRET);
	if (req == NULL)
		return;
	ktp = &req->ktr_data.ktr_sysret;
	ktp->ktr_code = code;
	ktp->ktr_error = error;
	ktp->ktr_retval = retval;		/* what about val2 ? */
	ktr_submitrequest(req);
}
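
/*
 * Record the path being looked up by namei().  Only the string bytes
 * are logged (no terminating NUL); ktr_len carries the length.
 */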
void
ktrnamei(path)
	char *path;
{
	struct ktr_request *req;
	int namelen;
	char *buf = NULL;

	namelen = strlen(path);
	if (namelen > 0) {
		buf = malloc(namelen, M_KTRACE, M_WAITOK);
		bcopy(path, buf, namelen);
	}
	req = ktr_getrequest(KTR_NAMEI);
	if (req == NULL) {
		if (buf != NULL)
			free(buf, M_KTRACE);
		return;
	}
	if (namelen > 0) {
		req->ktr_header.ktr_len = namelen;
		req->ktr_header.ktr_buffer = buf;
	}
	ktr_submitrequest(req);
}

/*
 * Since the uio may not stay valid after we return, we cannot hand
 * the uio itself to the worker thread.  Instead, copy up to
 * ktr_geniosize bytes of the data into a private buffer here and
 * attach that buffer to the request before handing it off.
 */
void
ktrgenio(fd, rw, uio, error)
	int fd;
	enum uio_rw rw;
	struct uio *uio;
	int error;
{
	struct ktr_request *req;
	struct ktr_genio *ktg;
	int datalen;
	char *buf;

	if (error)
		return;
	uio->uio_offset = 0;
	uio->uio_rw = UIO_WRITE;
	datalen = imin(uio->uio_resid, ktr_geniosize);
	buf = malloc(datalen, M_KTRACE, M_WAITOK);
	if (uiomove(buf, datalen, uio)) {
		free(buf, M_KTRACE);
		return;
	}
	req = ktr_getrequest(KTR_GENIO);
	if (req == NULL) {
		free(buf, M_KTRACE);
		return;
	}
	ktg = &req->ktr_data.ktr_genio;
	ktg->ktr_fd = fd;
	ktg->ktr_rw = rw;
	req->ktr_header.ktr_len = datalen;
	req->ktr_header.ktr_buffer = buf;
	ktr_submitrequest(req);
}

void
ktrpsig(sig, action, mask, code)
	int sig;
	sig_t action;
	sigset_t *mask;
	int code;
{
	struct ktr_request *req;
	struct ktr_psig *kp;

	req = ktr_getrequest(KTR_PSIG);
	if (req == NULL)
		return;
	kp = &req->ktr_data.ktr_psig;
	kp->signo = (char)sig;
	kp->action = action;
	kp->mask = *mask;
	kp->code = code;
	ktr_submitrequest(req);
}

void
ktrcsw(out, user)
	int out, user;
{
	struct ktr_request *req;
	struct ktr_csw *kc;

	req = ktr_getrequest(KTR_CSW);
	if (req == NULL)
		return;
	kc = &req->ktr_data.ktr_csw;
	kc->out = out;
	kc->user = user;
	ktr_submitrequest(req);
}
#endif /* KTRACE */

/* Interface and common routines */

/*
 * ktrace system call
 *
 * MPSAFE
 */
#ifndef _SYS_SYSPROTO_H_
struct ktrace_args {
	char	*fname;
	int	ops;
	int	facs;
	int	pid;
};
#endif
/* ARGSUSED */
int
ktrace(td, uap)
	struct thread *td;
	register struct ktrace_args *uap;
{
#ifdef KTRACE
	register struct vnode *vp = NULL;
	register struct proc *p;
	struct pgrp *pg;
	int facs = uap->facs & ~KTRFAC_ROOT;
	int ops = KTROP(uap->ops);
	int descend = uap->ops & KTRFLAG_DESCEND;
	int ret = 0;
	int flags, error = 0;
	struct nameidata nd;
	struct ucred *cred;

	/*
	 * Need something to (un)trace.
	 */
	if (ops != KTROP_CLEARFILE && facs == 0)
		return (EINVAL);

	td->td_pflags |= TDP_INKTRACE;
	if (ops != KTROP_CLEAR) {
		/*
		 * an operation which requires a file argument.
		 */
		NDINIT(&nd, LOOKUP, NOFOLLOW, UIO_USERSPACE, uap->fname, td);
		flags = FREAD | FWRITE | O_NOFOLLOW;
		mtx_lock(&Giant);
		error = vn_open(&nd, &flags, 0, -1);
		if (error) {
			mtx_unlock(&Giant);
			td->td_pflags &= ~TDP_INKTRACE;
			return (error);
		}
		NDFREE(&nd, NDF_ONLY_PNBUF);
		vp = nd.ni_vp;
		VOP_UNLOCK(vp, 0, td);
		if (vp->v_type != VREG) {
			(void) vn_close(vp, FREAD|FWRITE, td->td_ucred, td);
			mtx_unlock(&Giant);
			td->td_pflags &= ~TDP_INKTRACE;
			return (EACCES);
		}
		mtx_unlock(&Giant);
	}
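	/*
	 * At this point vp (if any) holds a reference from vn_open() but
	 * is unlocked; ktr_writerequest() relocks it around each write.
	 */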
	/*
	 * Clear all uses of the tracefile.
	 */
	if (ops == KTROP_CLEARFILE) {
		sx_slock(&allproc_lock);
		LIST_FOREACH(p, &allproc, p_list) {
			PROC_LOCK(p);
			if (p->p_tracevp == vp) {
				if (ktrcanset(td, p)) {
					mtx_lock(&ktrace_mtx);
					cred = p->p_tracecred;
					p->p_tracecred = NULL;
					p->p_tracevp = NULL;
					p->p_traceflag = 0;
					mtx_unlock(&ktrace_mtx);
					PROC_UNLOCK(p);
					mtx_lock(&Giant);
					(void) vn_close(vp, FREAD|FWRITE,
						cred, td);
					mtx_unlock(&Giant);
					crfree(cred);
				} else {
					PROC_UNLOCK(p);
					error = EPERM;
				}
			} else
				PROC_UNLOCK(p);
		}
		sx_sunlock(&allproc_lock);
		goto done;
	}
	/*
	 * do it
	 */
	sx_slock(&proctree_lock);
	if (uap->pid < 0) {
		/*
		 * by process group
		 */
		pg = pgfind(-uap->pid);
		if (pg == NULL) {
			sx_sunlock(&proctree_lock);
			error = ESRCH;
			goto done;
		}
		/*
		 * ktrops() may call vrele(). Lock pg_members
		 * by the proctree_lock rather than pg_mtx.
		 */
		PGRP_UNLOCK(pg);
		LIST_FOREACH(p, &pg->pg_members, p_pglist)
			if (descend)
				ret |= ktrsetchildren(td, p, ops, facs, vp);
			else
				ret |= ktrops(td, p, ops, facs, vp);
	} else {
		/*
		 * by pid
		 */
		p = pfind(uap->pid);
		if (p == NULL) {
			sx_sunlock(&proctree_lock);
			error = ESRCH;
			goto done;
		}
		/*
		 * The slock of the proctree lock will keep this process
		 * from going away, so unlocking the proc here is ok.
		 */
		PROC_UNLOCK(p);
		if (descend)
			ret |= ktrsetchildren(td, p, ops, facs, vp);
		else
			ret |= ktrops(td, p, ops, facs, vp);
	}
	sx_sunlock(&proctree_lock);
	if (!ret)
		error = EPERM;
done:
	if (vp != NULL) {
		mtx_lock(&Giant);
		(void) vn_close(vp, FWRITE, td->td_ucred, td);
		mtx_unlock(&Giant);
	}
	td->td_pflags &= ~TDP_INKTRACE;
	return (error);
#else /* !KTRACE */
	return (ENOSYS);
#endif /* KTRACE */
}

/*
 * utrace system call
 *
 * MPSAFE
 */
/* ARGSUSED */
int
utrace(td, uap)
	struct thread *td;
	register struct utrace_args *uap;
{

#ifdef KTRACE
	struct ktr_request *req;
	void *cp;
	int error;

	if (!KTRPOINT(td, KTR_USER))
		return (0);
	if (uap->len > KTR_USER_MAXLEN)
		return (EINVAL);
	cp = malloc(uap->len, M_KTRACE, M_WAITOK);
	error = copyin(uap->addr, cp, uap->len);
	if (error) {
		free(cp, M_KTRACE);
		return (error);
	}
	req = ktr_getrequest(KTR_USER);
	if (req == NULL) {
		free(cp, M_KTRACE);
		return (ENOMEM);
	}
	req->ktr_header.ktr_buffer = cp;
	req->ktr_header.ktr_len = uap->len;
	ktr_submitrequest(req);
	return (0);
#else /* !KTRACE */
	return (ENOSYS);
#endif /* KTRACE */
}

#ifdef KTRACE
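/*
 * Apply a single set or clear operation to one process.  Returns 1 on
 * success and 0 if the caller may not change the target's tracing
 * state.  Any displaced trace vnode and credential references are
 * released only after all locks have been dropped.
 */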
static int
ktrops(td, p, ops, facs, vp)
	struct thread *td;
	struct proc *p;
	int ops, facs;
	struct vnode *vp;
{
	struct vnode *tracevp = NULL;
	struct ucred *tracecred = NULL;

	PROC_LOCK(p);
	if (!ktrcanset(td, p)) {
		PROC_UNLOCK(p);
		return (0);
	}
	mtx_lock(&ktrace_mtx);
	if (ops == KTROP_SET) {
		if (p->p_tracevp != vp) {
			/*
			 * if trace file already in use, relinquish below
			 */
			tracevp = p->p_tracevp;
			VREF(vp);
			p->p_tracevp = vp;
		}
		if (p->p_tracecred != td->td_ucred) {
			tracecred = p->p_tracecred;
			p->p_tracecred = crhold(td->td_ucred);
		}
		p->p_traceflag |= facs;
		if (td->td_ucred->cr_uid == 0)
			p->p_traceflag |= KTRFAC_ROOT;
	} else {
		/* KTROP_CLEAR */
		if (((p->p_traceflag &= ~facs) & KTRFAC_MASK) == 0) {
			/* no more tracing */
			p->p_traceflag = 0;
			tracevp = p->p_tracevp;
			p->p_tracevp = NULL;
			tracecred = p->p_tracecred;
			p->p_tracecred = NULL;
		}
	}
	mtx_unlock(&ktrace_mtx);
	PROC_UNLOCK(p);
	if (tracevp != NULL) {
		mtx_lock(&Giant);
		vrele(tracevp);
		mtx_unlock(&Giant);
	}
	if (tracecred != NULL)
		crfree(tracecred);

	return (1);
}

static int
ktrsetchildren(td, top, ops, facs, vp)
	struct thread *td;
	struct proc *top;
	int ops, facs;
	struct vnode *vp;
{
	register struct proc *p;
	register int ret = 0;

	p = top;
	sx_assert(&proctree_lock, SX_LOCKED);
	for (;;) {
		ret |= ktrops(td, p, ops, facs, vp);
		/*
		 * If this process has children, descend to them next,
		 * otherwise do any siblings, and if done with this level,
		 * follow back up the tree (but not past top).
		 */
		if (!LIST_EMPTY(&p->p_children))
			p = LIST_FIRST(&p->p_children);
		else for (;;) {
			if (p == top)
				return (ret);
			if (LIST_NEXT(p, p_sibling)) {
				p = LIST_NEXT(p, p_sibling);
				break;
			}
			p = p->p_pptr;
		}
	}
	/*NOTREACHED*/
}
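
/*
 * Write one request to its trace vnode as a single appending write:
 * the header, then any fixed-size event payload, then any variable
 * length buffer.  On a write error, tracing to this vnode is revoked
 * for every process and every queued request that references it.
 */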
static void
ktr_writerequest(struct ktr_request *req)
{
	struct ktr_header *kth;
	struct vnode *vp;
	struct proc *p;
	struct thread *td;
	struct ucred *cred;
	struct uio auio;
	struct iovec aiov[3];
	struct mount *mp;
	int datalen, buflen, vrele_count;
	int error;

	vp = req->ktr_vp;
	/*
	 * If vp is NULL, the vp has been cleared out from under this
	 * request, so just drop it.
	 */
	if (vp == NULL)
		return;
	kth = &req->ktr_header;
	datalen = data_lengths[(u_short)kth->ktr_type & ~KTR_DROP];
	buflen = kth->ktr_len;
	cred = req->ktr_cred;
	td = curthread;
	auio.uio_iov = &aiov[0];
	auio.uio_offset = 0;
	auio.uio_segflg = UIO_SYSSPACE;
	auio.uio_rw = UIO_WRITE;
	aiov[0].iov_base = (caddr_t)kth;
	aiov[0].iov_len = sizeof(struct ktr_header);
	auio.uio_resid = sizeof(struct ktr_header);
	auio.uio_iovcnt = 1;
	auio.uio_td = td;
	if (datalen != 0) {
		aiov[1].iov_base = (caddr_t)&req->ktr_data;
		aiov[1].iov_len = datalen;
		auio.uio_resid += datalen;
		auio.uio_iovcnt++;
		kth->ktr_len += datalen;
	}
	if (buflen != 0) {
		KASSERT(kth->ktr_buffer != NULL, ("ktrace: nothing to write"));
		aiov[auio.uio_iovcnt].iov_base = kth->ktr_buffer;
		aiov[auio.uio_iovcnt].iov_len = buflen;
		auio.uio_resid += buflen;
		auio.uio_iovcnt++;
	}
	mtx_lock(&Giant);
	vn_start_write(vp, &mp, V_WAIT);
	vn_lock(vp, LK_EXCLUSIVE | LK_RETRY, td);
	(void)VOP_LEASE(vp, td, cred, LEASE_WRITE);
#ifdef MAC
	error = mac_check_vnode_write(cred, NOCRED, vp);
	if (error == 0)
#endif
		error = VOP_WRITE(vp, &auio, IO_UNIT | IO_APPEND, cred);
	VOP_UNLOCK(vp, 0, td);
	vn_finished_write(mp);
	mtx_unlock(&Giant);
	if (!error)
		return;
	/*
	 * If error encountered, give up tracing on this vnode.  We defer
	 * all the vrele()'s on the vnode until after we are finished walking
	 * the various lists to avoid needlessly holding locks.
	 */
	log(LOG_NOTICE, "ktrace write failed, errno %d, tracing stopped\n",
	    error);
	vrele_count = 0;
	/*
	 * First, clear this vnode from being used by any processes in the
	 * system.
	 * XXX - If one process gets an EPERM writing to the vnode, should
	 * we really do this?  Other processes might have suitable
	 * credentials for the operation.
	 */
	cred = NULL;
	sx_slock(&allproc_lock);
	LIST_FOREACH(p, &allproc, p_list) {
		PROC_LOCK(p);
		if (p->p_tracevp == vp) {
			mtx_lock(&ktrace_mtx);
			p->p_tracevp = NULL;
			p->p_traceflag = 0;
			cred = p->p_tracecred;
			p->p_tracecred = NULL;
			mtx_unlock(&ktrace_mtx);
			vrele_count++;
		}
		PROC_UNLOCK(p);
		if (cred != NULL) {
			crfree(cred);
			cred = NULL;
		}
	}
	sx_sunlock(&allproc_lock);
	/*
	 * Second, clear this vnode from any pending requests.
	 */
	mtx_lock(&ktrace_mtx);
	STAILQ_FOREACH(req, &ktr_todo, ktr_list) {
		if (req->ktr_vp == vp) {
			req->ktr_vp = NULL;
			vrele_count++;
		}
	}
	mtx_unlock(&ktrace_mtx);
	mtx_lock(&Giant);
	while (vrele_count-- > 0)
		vrele(vp);
	mtx_unlock(&Giant);
}

/*
 * Return true if caller has permission to set the ktracing state
 * of target.  Essentially, the target can't possess any
 * more permissions than the caller.  KTRFAC_ROOT signifies that
 * root previously set the tracing status on the target process, and
 * so, only root may further change it.
 */
static int
ktrcanset(td, targetp)
	struct thread *td;
	struct proc *targetp;
{

	PROC_LOCK_ASSERT(targetp, MA_OWNED);
	if (targetp->p_traceflag & KTRFAC_ROOT &&
	    suser_cred(td->td_ucred, PRISON_ROOT))
		return (0);

	if (p_candebug(td, targetp) != 0)
		return (0);

	return (1);
}

#endif /* KTRACE */