1 /* 2 * Copyright (c) 1997, Stefan Esser <se@freebsd.org> 3 * All rights reserved. 4 * 5 * Redistribution and use in source and binary forms, with or without 6 * modification, are permitted provided that the following conditions 7 * are met: 8 * 1. Redistributions of source code must retain the above copyright 9 * notice unmodified, this list of conditions, and the following 10 * disclaimer. 11 * 2. Redistributions in binary form must reproduce the above copyright 12 * notice, this list of conditions and the following disclaimer in the 13 * documentation and/or other materials provided with the distribution. 14 * 15 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR 16 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES 17 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. 18 * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, 19 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT 20 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 21 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 22 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 23 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF 24 * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 25 * 26 * $FreeBSD$ 27 * 28 */ 29 30 31 #include <sys/param.h> 32 #include <sys/bus.h> 33 #include <sys/rtprio.h> 34 #include <sys/systm.h> 35 #include <sys/interrupt.h> 36 #include <sys/kernel.h> 37 #include <sys/kthread.h> 38 #include <sys/ktr.h> 39 #include <sys/lock.h> 40 #include <sys/malloc.h> 41 #include <sys/mutex.h> 42 #include <sys/proc.h> 43 #include <sys/random.h> 44 #include <sys/resourcevar.h> 45 #include <sys/sysctl.h> 46 #include <sys/unistd.h> 47 #include <sys/vmmeter.h> 48 #include <machine/atomic.h> 49 #include <machine/cpu.h> 50 #include <machine/md_var.h> 51 #include <machine/stdarg.h> 52 53 #include <net/netisr.h> /* prototype for legacy_setsoftnet */ 54 55 struct int_entropy { 56 struct proc *proc; 57 int vector; 58 }; 59 60 void *net_ih; 61 void *vm_ih; 62 void *softclock_ih; 63 struct ithd *clk_ithd; 64 struct ithd *tty_ithd; 65 66 static MALLOC_DEFINE(M_ITHREAD, "ithread", "Interrupt Threads"); 67 68 static void ithread_update(struct ithd *); 69 static void ithread_loop(void *); 70 static void start_softintr(void *); 71 static void swi_net(void *); 72 73 u_char 74 ithread_priority(enum intr_type flags) 75 { 76 u_char pri; 77 78 flags &= (INTR_TYPE_TTY | INTR_TYPE_BIO | INTR_TYPE_NET | 79 INTR_TYPE_CAM | INTR_TYPE_MISC | INTR_TYPE_CLK | INTR_TYPE_AV); 80 switch (flags) { 81 case INTR_TYPE_TTY: 82 pri = PI_TTYLOW; 83 break; 84 case INTR_TYPE_BIO: 85 /* 86 * XXX We need to refine this. BSD/OS distinguishes 87 * between tape and disk priorities. 88 */ 89 pri = PI_DISK; 90 break; 91 case INTR_TYPE_NET: 92 pri = PI_NET; 93 break; 94 case INTR_TYPE_CAM: 95 pri = PI_DISK; /* XXX or PI_CAM? */ 96 break; 97 case INTR_TYPE_AV: /* Audio/video */ 98 pri = PI_AV; 99 break; 100 case INTR_TYPE_CLK: 101 pri = PI_REALTIME; 102 break; 103 case INTR_TYPE_MISC: 104 pri = PI_DULL; /* don't care */ 105 break; 106 default: 107 /* We didn't specify an interrupt level. */ 108 panic("ithread_priority: no interrupt type in flags"); 109 } 110 111 return pri; 112 } 113 114 /* 115 * Regenerate the name (p_comm) and priority for a threaded interrupt thread. 116 */ 117 static void 118 ithread_update(struct ithd *ithd) 119 { 120 struct intrhand *ih; 121 struct proc *p; 122 int entropy; 123 124 mtx_assert(&ithd->it_lock, MA_OWNED); 125 p = ithd->it_proc; 126 if (p == NULL) 127 return; 128 129 strncpy(p->p_comm, ithd->it_name, sizeof(ithd->it_name)); 130 ih = TAILQ_FIRST(&ithd->it_handlers); 131 if (ih == NULL) { 132 p->p_pri.pri_level = PRI_MAX_ITHD; 133 ithd->it_flags &= ~IT_ENTROPY; 134 return; 135 } 136 137 entropy = 0; 138 p->p_pri.pri_level = ih->ih_pri; 139 p->p_pri.pri_native = ih->ih_pri; 140 TAILQ_FOREACH(ih, &ithd->it_handlers, ih_next) { 141 if (strlen(p->p_comm) + strlen(ih->ih_name) + 1 < 142 sizeof(p->p_comm)) { 143 strcat(p->p_comm, " "); 144 strcat(p->p_comm, ih->ih_name); 145 } else if (strlen(p->p_comm) + 1 == sizeof(p->p_comm)) { 146 if (p->p_comm[sizeof(p->p_comm) - 2] == '+') 147 p->p_comm[sizeof(p->p_comm) - 2] = '*'; 148 else 149 p->p_comm[sizeof(p->p_comm) - 2] = '+'; 150 } else 151 strcat(p->p_comm, "+"); 152 if (ih->ih_flags & IH_ENTROPY) 153 entropy++; 154 } 155 156 if (entropy) 157 ithd->it_flags |= IT_ENTROPY; 158 else 159 ithd->it_flags &= ~IT_ENTROPY; 160 161 CTR1(KTR_INTR, __func__ ": updated %s\n", p->p_comm); 162 } 163 164 int 165 ithread_create(struct ithd **ithread, int vector, int flags, 166 void (*disable)(int), void (*enable)(int), const char *fmt, ...) 167 { 168 struct ithd *ithd; 169 struct proc *p; 170 int error; 171 va_list ap; 172 173 /* The only valid flag during creation is IT_SOFT. */ 174 if ((flags & ~IT_SOFT) != 0) 175 return (EINVAL); 176 177 ithd = malloc(sizeof(struct ithd), M_ITHREAD, M_WAITOK | M_ZERO); 178 ithd->it_vector = vector; 179 ithd->it_disable = disable; 180 ithd->it_enable = enable; 181 ithd->it_flags = flags; 182 TAILQ_INIT(&ithd->it_handlers); 183 mtx_init(&ithd->it_lock, "ithread", MTX_DEF); 184 mtx_lock(&ithd->it_lock); 185 186 va_start(ap, fmt); 187 vsnprintf(ithd->it_name, sizeof(ithd->it_name), fmt, ap); 188 va_end(ap); 189 190 error = kthread_create(ithread_loop, ithd, &p, RFSTOPPED | RFHIGHPID, 191 "%s", ithd->it_name); 192 if (error) { 193 mtx_destroy(&ithd->it_lock); 194 free(ithd, M_ITHREAD); 195 return (error); 196 } 197 p->p_pri.pri_class = PRI_ITHD; 198 p->p_pri.pri_level = PRI_MAX_ITHD; 199 p->p_stat = SWAIT; 200 ithd->it_proc = p; 201 p->p_ithd = ithd; 202 if (ithread != NULL) 203 *ithread = ithd; 204 mtx_unlock(&ithd->it_lock); 205 206 CTR1(KTR_INTR, __func__ ": created %s", ithd->it_name); 207 return (0); 208 } 209 210 int 211 ithread_destroy(struct ithd *ithread) 212 { 213 214 if (ithread == NULL) 215 return (EINVAL); 216 217 mtx_lock(&ithread->it_lock); 218 if (!TAILQ_EMPTY(&ithread->it_handlers)) { 219 mtx_unlock(&ithread->it_lock); 220 return (EINVAL); 221 } 222 ithread->it_flags |= IT_DEAD; 223 mtx_lock_spin(&sched_lock); 224 if (ithread->it_proc->p_stat == SWAIT) { 225 ithread->it_proc->p_stat = SRUN; 226 setrunqueue(ithread->it_proc); 227 } 228 mtx_unlock_spin(&sched_lock); 229 mtx_unlock(&ithread->it_lock); 230 CTR1(KTR_INTR, __func__ ": killing %s", ithread->it_name); 231 return (0); 232 } 233 234 int 235 ithread_add_handler(struct ithd* ithread, const char *name, 236 driver_intr_t handler, void *arg, u_char pri, enum intr_type flags, 237 void **cookiep) 238 { 239 struct intrhand *ih, *temp_ih; 240 241 if (ithread == NULL || name == NULL || handler == NULL) 242 return (EINVAL); 243 if ((flags & INTR_FAST) !=0) 244 flags |= INTR_EXCL; 245 246 ih = malloc(sizeof(struct intrhand), M_ITHREAD, M_WAITOK | M_ZERO); 247 ih->ih_handler = handler; 248 ih->ih_argument = arg; 249 ih->ih_name = name; 250 ih->ih_ithread = ithread; 251 ih->ih_pri = pri; 252 if (flags & INTR_FAST) 253 ih->ih_flags = IH_FAST | IH_EXCLUSIVE; 254 else if (flags & INTR_EXCL) 255 ih->ih_flags = IH_EXCLUSIVE; 256 if (flags & INTR_MPSAFE) 257 ih->ih_flags |= IH_MPSAFE; 258 if (flags & INTR_ENTROPY) 259 ih->ih_flags |= IH_ENTROPY; 260 261 mtx_lock(&ithread->it_lock); 262 if ((flags & INTR_EXCL) !=0 && !TAILQ_EMPTY(&ithread->it_handlers)) 263 goto fail; 264 if (!TAILQ_EMPTY(&ithread->it_handlers) && 265 (TAILQ_FIRST(&ithread->it_handlers)->ih_flags & IH_EXCLUSIVE) != 0) 266 goto fail; 267 268 TAILQ_FOREACH(temp_ih, &ithread->it_handlers, ih_next) 269 if (temp_ih->ih_pri > ih->ih_pri) 270 break; 271 if (temp_ih == NULL) 272 TAILQ_INSERT_TAIL(&ithread->it_handlers, ih, ih_next); 273 else 274 TAILQ_INSERT_BEFORE(temp_ih, ih, ih_next); 275 ithread_update(ithread); 276 mtx_unlock(&ithread->it_lock); 277 278 if (cookiep != NULL) 279 *cookiep = ih; 280 CTR2(KTR_INTR, __func__ ": added %s to %s", ih->ih_name, 281 ithread->it_name); 282 return (0); 283 284 fail: 285 mtx_unlock(&ithread->it_lock); 286 free(ih, M_ITHREAD); 287 return (EINVAL); 288 } 289 290 int 291 ithread_remove_handler(void *cookie) 292 { 293 struct intrhand *handler = (struct intrhand *)cookie; 294 struct ithd *ithread; 295 #ifdef INVARIANTS 296 struct intrhand *ih; 297 #endif 298 299 if (handler == NULL) 300 return (EINVAL); 301 ithread = handler->ih_ithread; 302 KASSERT(ithread != NULL, 303 ("interrupt handler \"%s\" has a NULL interrupt thread", 304 handler->ih_name)); 305 CTR2(KTR_INTR, __func__ ": removing %s from %s", handler->ih_name, 306 ithread->it_name); 307 mtx_lock(&ithread->it_lock); 308 #ifdef INVARIANTS 309 TAILQ_FOREACH(ih, &ithread->it_handlers, ih_next) 310 if (ih == handler) 311 goto ok; 312 mtx_unlock(&ithread->it_lock); 313 panic("interrupt handler \"%s\" not found in interrupt thread \"%s\"", 314 ih->ih_name, ithread->it_name); 315 ok: 316 #endif 317 /* 318 * If the interrupt thread is already running, then just mark this 319 * handler as being dead and let the ithread do the actual removal. 320 */ 321 mtx_lock_spin(&sched_lock); 322 if (ithread->it_proc->p_stat != SWAIT) { 323 handler->ih_flags |= IH_DEAD; 324 325 /* 326 * Ensure that the thread will process the handler list 327 * again and remove this handler if it has already passed 328 * it on the list. 329 */ 330 ithread->it_need = 1; 331 } else 332 TAILQ_REMOVE(&ithread->it_handlers, handler, ih_next); 333 mtx_unlock_spin(&sched_lock); 334 if ((handler->ih_flags & IH_DEAD) != 0) 335 msleep(handler, &ithread->it_lock, PUSER, "itrmh", 0); 336 ithread_update(ithread); 337 mtx_unlock(&ithread->it_lock); 338 free(handler, M_ITHREAD); 339 return (0); 340 } 341 342 int 343 ithread_schedule(struct ithd *ithread, int do_switch) 344 { 345 struct int_entropy entropy; 346 struct proc *p; 347 348 /* 349 * If no ithread or no handlers, then we have a stray interrupt. 350 */ 351 if ((ithread == NULL) || TAILQ_EMPTY(&ithread->it_handlers)) 352 return (EINVAL); 353 354 /* 355 * If any of the handlers for this ithread claim to be good 356 * sources of entropy, then gather some. 357 */ 358 if (harvest.interrupt && ithread->it_flags & IT_ENTROPY) { 359 entropy.vector = ithread->it_vector; 360 entropy.proc = CURPROC; 361 random_harvest(&entropy, sizeof(entropy), 2, 0, 362 RANDOM_INTERRUPT); 363 } 364 365 p = ithread->it_proc; 366 KASSERT(p != NULL, ("ithread %s has no process", ithread->it_name)); 367 CTR3(KTR_INTR, __func__ ": pid %d: (%s) need = %d", p->p_pid, p->p_comm, 368 ithread->it_need); 369 370 /* 371 * Set it_need to tell the thread to keep running if it is already 372 * running. Then, grab sched_lock and see if we actually need to 373 * put this thread on the runqueue. If so and the do_switch flag is 374 * true, then switch to the ithread immediately. Otherwise, use 375 * need_resched() to guarantee that this ithread will run before any 376 * userland processes. 377 */ 378 ithread->it_need = 1; 379 mtx_lock_spin(&sched_lock); 380 if (p->p_stat == SWAIT) { 381 CTR1(KTR_INTR, __func__ ": setrunqueue %d", p->p_pid); 382 p->p_stat = SRUN; 383 setrunqueue(p); 384 if (do_switch && curproc->p_stat == SRUN) { 385 if (curproc != PCPU_GET(idleproc)) 386 setrunqueue(curproc); 387 curproc->p_stats->p_ru.ru_nivcsw++; 388 mi_switch(); 389 } else 390 need_resched(curproc); 391 } else { 392 CTR3(KTR_INTR, __func__ ": pid %d: it_need %d, state %d", 393 p->p_pid, ithread->it_need, p->p_stat); 394 } 395 mtx_unlock_spin(&sched_lock); 396 397 return (0); 398 } 399 400 int 401 swi_add(struct ithd **ithdp, const char *name, driver_intr_t handler, 402 void *arg, int pri, enum intr_type flags, void **cookiep) 403 { 404 struct ithd *ithd; 405 int error; 406 407 if (flags & (INTR_FAST | INTR_ENTROPY)) 408 return (EINVAL); 409 410 ithd = (ithdp != NULL) ? *ithdp : NULL; 411 412 if (ithd != NULL) { 413 if ((ithd->it_flags & IT_SOFT) == 0) 414 return(EINVAL); 415 } else { 416 error = ithread_create(&ithd, pri, IT_SOFT, NULL, NULL, 417 "swi%d:", pri); 418 if (error) 419 return (error); 420 421 if (ithdp != NULL) 422 *ithdp = ithd; 423 } 424 return (ithread_add_handler(ithd, name, handler, arg, 425 (pri * RQ_PPQ) + PI_SOFT, flags, cookiep)); 426 } 427 428 429 /* 430 * Schedule a heavyweight software interrupt process. 431 */ 432 void 433 swi_sched(void *cookie, int flags) 434 { 435 struct intrhand *ih = (struct intrhand *)cookie; 436 struct ithd *it = ih->ih_ithread; 437 int error; 438 439 atomic_add_int(&cnt.v_intr, 1); /* one more global interrupt */ 440 441 CTR3(KTR_INTR, "swi_sched pid %d(%s) need=%d", 442 it->it_proc->p_pid, it->it_proc->p_comm, it->it_need); 443 444 /* 445 * Set ih_need for this handler so that if the ithread is already 446 * running it will execute this handler on the next pass. Otherwise, 447 * it will execute it the next time it runs. 448 */ 449 atomic_store_rel_int(&ih->ih_need, 1); 450 if (!(flags & SWI_DELAY)) { 451 error = ithread_schedule(it, !cold && flags & SWI_SWITCH); 452 KASSERT(error == 0, ("stray software interrupt")); 453 } 454 } 455 456 /* 457 * This is the main code for interrupt threads. 458 */ 459 void 460 ithread_loop(void *arg) 461 { 462 struct ithd *ithd; /* our thread context */ 463 struct intrhand *ih; /* and our interrupt handler chain */ 464 struct proc *p; 465 466 p = curproc; 467 ithd = (struct ithd *)arg; /* point to myself */ 468 KASSERT(ithd->it_proc == p && p->p_ithd == ithd, 469 (__func__ ": ithread and proc linkage out of sync")); 470 471 /* 472 * As long as we have interrupts outstanding, go through the 473 * list of handlers, giving each one a go at it. 474 */ 475 for (;;) { 476 /* 477 * If we are an orphaned thread, then just die. 478 */ 479 if (ithd->it_flags & IT_DEAD) { 480 CTR2(KTR_INTR, __func__ ": pid %d: (%s) exiting", 481 p->p_pid, p->p_comm); 482 p->p_ithd = NULL; 483 mtx_destroy(&ithd->it_lock); 484 mtx_lock(&Giant); 485 free(ithd, M_ITHREAD); 486 kthread_exit(0); 487 } 488 489 CTR3(KTR_INTR, __func__ ": pid %d: (%s) need=%d", 490 p->p_pid, p->p_comm, ithd->it_need); 491 while (ithd->it_need) { 492 /* 493 * Service interrupts. If another interrupt 494 * arrives while we are running, they will set 495 * it_need to denote that we should make 496 * another pass. 497 */ 498 atomic_store_rel_int(&ithd->it_need, 0); 499 restart: 500 TAILQ_FOREACH(ih, &ithd->it_handlers, ih_next) { 501 if (ithd->it_flags & IT_SOFT && !ih->ih_need) 502 continue; 503 atomic_store_rel_int(&ih->ih_need, 0); 504 CTR5(KTR_INTR, 505 __func__ ": pid %d ih=%p: %p(%p) flg=%x", 506 p->p_pid, (void *)ih, 507 (void *)ih->ih_handler, ih->ih_argument, 508 ih->ih_flags); 509 510 if ((ih->ih_flags & IH_DEAD) != 0) { 511 mtx_lock(&ithd->it_lock); 512 TAILQ_REMOVE(&ithd->it_handlers, ih, 513 ih_next); 514 wakeup(ih); 515 mtx_unlock(&ithd->it_lock); 516 goto restart; 517 } 518 if ((ih->ih_flags & IH_MPSAFE) == 0) 519 mtx_lock(&Giant); 520 ih->ih_handler(ih->ih_argument); 521 if ((ih->ih_flags & IH_MPSAFE) == 0) 522 mtx_unlock(&Giant); 523 } 524 } 525 526 /* 527 * Processed all our interrupts. Now get the sched 528 * lock. This may take a while and it_need may get 529 * set again, so we have to check it again. 530 */ 531 mtx_assert(&Giant, MA_NOTOWNED); 532 mtx_lock_spin(&sched_lock); 533 if (!ithd->it_need) { 534 /* 535 * Should we call this earlier in the loop above? 536 */ 537 if (ithd->it_enable != NULL) 538 ithd->it_enable(ithd->it_vector); 539 p->p_stat = SWAIT; /* we're idle */ 540 p->p_stats->p_ru.ru_nvcsw++; 541 CTR1(KTR_INTR, __func__ ": pid %d: done", p->p_pid); 542 mi_switch(); 543 CTR1(KTR_INTR, __func__ ": pid %d: resumed", p->p_pid); 544 } 545 mtx_unlock_spin(&sched_lock); 546 } 547 } 548 549 /* 550 * Start standard software interrupt threads 551 */ 552 static void 553 start_softintr(void *dummy) 554 { 555 556 if (swi_add(NULL, "net", swi_net, NULL, SWI_NET, 0, &net_ih) || 557 swi_add(&clk_ithd, "clock", softclock, NULL, SWI_CLOCK, 558 INTR_MPSAFE, &softclock_ih) || 559 swi_add(NULL, "vm", swi_vm, NULL, SWI_VM, 0, &vm_ih)) 560 panic("died while creating standard software ithreads"); 561 562 PROC_LOCK(clk_ithd->it_proc); 563 clk_ithd->it_proc->p_flag |= P_NOLOAD; 564 PROC_UNLOCK(clk_ithd->it_proc); 565 } 566 SYSINIT(start_softintr, SI_SUB_SOFTINTR, SI_ORDER_FIRST, start_softintr, NULL) 567 568 void 569 legacy_setsoftnet(void) 570 { 571 swi_sched(net_ih, SWI_NOSWITCH); 572 } 573 574 /* 575 * XXX: This should really be in the network code somewhere and installed 576 * via a SI_SUB_SOFINTR, SI_ORDER_MIDDLE sysinit. 577 */ 578 void (*netisrs[32]) __P((void)); 579 u_int netisr; 580 581 int 582 register_netisr(num, handler) 583 int num; 584 netisr_t *handler; 585 { 586 587 if (num < 0 || num >= (sizeof(netisrs)/sizeof(*netisrs)) ) { 588 printf("register_netisr: bad isr number: %d\n", num); 589 return (EINVAL); 590 } 591 netisrs[num] = handler; 592 return (0); 593 } 594 595 int 596 unregister_netisr(num) 597 int num; 598 { 599 600 if (num < 0 || num >= (sizeof(netisrs)/sizeof(*netisrs)) ) { 601 printf("unregister_netisr: bad isr number: %d\n", num); 602 return (EINVAL); 603 } 604 netisrs[num] = NULL; 605 return (0); 606 } 607 608 static void 609 swi_net(void *dummy) 610 { 611 u_int bits; 612 int i; 613 614 bits = atomic_readandclear_int(&netisr); 615 while ((i = ffs(bits)) != 0) { 616 i--; 617 if (netisrs[i] != NULL) 618 netisrs[i](); 619 else 620 printf("swi_net: unregistered isr number: %d.\n", i); 621 bits &= ~(1 << i); 622 } 623 } 624 625 /* 626 * Sysctls used by systat and others: hw.intrnames and hw.intrcnt. 627 * The data for this machine dependent, and the declarations are in machine 628 * dependent code. The layout of intrnames and intrcnt however is machine 629 * independent. 630 * 631 * We do not know the length of intrcnt and intrnames at compile time, so 632 * calculate things at run time. 633 */ 634 static int 635 sysctl_intrnames(SYSCTL_HANDLER_ARGS) 636 { 637 return (sysctl_handle_opaque(oidp, intrnames, eintrnames - intrnames, 638 req)); 639 } 640 641 SYSCTL_PROC(_hw, OID_AUTO, intrnames, CTLTYPE_OPAQUE | CTLFLAG_RD, 642 NULL, 0, sysctl_intrnames, "", "Interrupt Names"); 643 644 static int 645 sysctl_intrcnt(SYSCTL_HANDLER_ARGS) 646 { 647 return (sysctl_handle_opaque(oidp, intrcnt, 648 (char *)eintrcnt - (char *)intrcnt, req)); 649 } 650 651 SYSCTL_PROC(_hw, OID_AUTO, intrcnt, CTLTYPE_OPAQUE | CTLFLAG_RD, 652 NULL, 0, sysctl_intrcnt, "", "Interrupt Counts"); 653