1 /*- 2 * Copyright (c) 1995 3 * The Regents of the University of California. All rights reserved. 4 * 5 * Copyright (C) 1997 6 * John S. Dyson. All rights reserved. 7 * 8 * This code contains ideas from software contributed to Berkeley by 9 * Avadis Tevanian, Jr., Michael Wayne Young, and the Mach Operating 10 * System project at Carnegie-Mellon University. 11 * 12 * Redistribution and use in source and binary forms, with or without 13 * modification, are permitted provided that the following conditions 14 * are met: 15 * 1. Redistributions of source code must retain the above copyright 16 * notice, this list of conditions and the following disclaimer. 17 * 2. Redistributions in binary form must reproduce the above copyright 18 * notice, this list of conditions and the following disclaimer in the 19 * documentation and/or other materials provided with the distribution. 20 * 3. All advertising materials mentioning features or use of this software 21 * must display the following acknowledgement: 22 * This product includes software developed by the University of 23 * California, Berkeley and its contributors. 24 * 4. Neither the name of the University nor the names of its contributors 25 * may be used to endorse or promote products derived from this software 26 * without specific prior written permission. 27 * 28 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 29 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 30 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 31 * ARE DISCLAIMED. 
IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 32 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 33 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 34 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 35 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 36 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 37 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 38 * SUCH DAMAGE. 39 * 40 * @(#)kern_lock.c 8.18 (Berkeley) 5/21/95 41 */ 42 43 #include <sys/cdefs.h> 44 __FBSDID("$FreeBSD$"); 45 46 #include <sys/param.h> 47 #include <sys/kdb.h> 48 #include <sys/kernel.h> 49 #include <sys/ktr.h> 50 #include <sys/lock.h> 51 #include <sys/lockmgr.h> 52 #include <sys/mutex.h> 53 #include <sys/proc.h> 54 #include <sys/systm.h> 55 #ifdef DEBUG_LOCKS 56 #include <sys/stack.h> 57 #include <sys/sysctl.h> 58 #endif 59 #include <sys/kdb.h> 60 61 /* 62 * Locking primitives implementation. 63 * Locks provide shared/exclusive synchronization.
64 */ 65 66 #define COUNT(td, x) if ((td)) (td)->td_locks += (x) 67 #define LK_ALL (LK_HAVE_EXCL | LK_WANT_EXCL | LK_WANT_UPGRADE | \ 68 LK_SHARE_NONZERO | LK_WAIT_NONZERO) 69 70 static int acquire(struct lock **lkpp, int extflags, int wanted); 71 static int acquiredrain(struct lock *lkp, int extflags) ; 72 73 static __inline void 74 sharelock(struct thread *td, struct lock *lkp, int incr) { 75 lkp->lk_flags |= LK_SHARE_NONZERO; 76 lkp->lk_sharecount += incr; 77 COUNT(td, incr); 78 } 79 80 static __inline void 81 shareunlock(struct thread *td, struct lock *lkp, int decr) { 82 83 KASSERT(lkp->lk_sharecount >= decr, ("shareunlock: count < decr")); 84 85 COUNT(td, -decr); 86 if (lkp->lk_sharecount == decr) { 87 lkp->lk_flags &= ~LK_SHARE_NONZERO; 88 if (lkp->lk_flags & (LK_WANT_UPGRADE | LK_WANT_EXCL)) { 89 wakeup(lkp); 90 } 91 lkp->lk_sharecount = 0; 92 } else { 93 lkp->lk_sharecount -= decr; 94 } 95 } 96 97 static int 98 acquire(struct lock **lkpp, int extflags, int wanted) 99 { 100 struct lock *lkp = *lkpp; 101 int error; 102 CTR3(KTR_LOCK, 103 "acquire(): lkp == %p, extflags == 0x%x, wanted == 0x%x", 104 lkp, extflags, wanted); 105 106 if ((extflags & LK_NOWAIT) && (lkp->lk_flags & wanted)) 107 return EBUSY; 108 error = 0; 109 while ((lkp->lk_flags & wanted) != 0) { 110 CTR2(KTR_LOCK, 111 "acquire(): lkp == %p, lk_flags == 0x%x sleeping", 112 lkp, lkp->lk_flags); 113 lkp->lk_flags |= LK_WAIT_NONZERO; 114 lkp->lk_waitcount++; 115 error = msleep(lkp, lkp->lk_interlock, lkp->lk_prio, 116 lkp->lk_wmesg, 117 ((extflags & LK_TIMELOCK) ? 
lkp->lk_timo : 0)); 118 lkp->lk_waitcount--; 119 if (lkp->lk_waitcount == 0) 120 lkp->lk_flags &= ~LK_WAIT_NONZERO; 121 if (error) 122 break; 123 if (extflags & LK_SLEEPFAIL) { 124 error = ENOLCK; 125 break; 126 } 127 if (lkp->lk_newlock != NULL) { 128 mtx_lock(lkp->lk_newlock->lk_interlock); 129 mtx_unlock(lkp->lk_interlock); 130 if (lkp->lk_waitcount == 0) 131 wakeup((void *)(&lkp->lk_newlock)); 132 *lkpp = lkp = lkp->lk_newlock; 133 } 134 } 135 mtx_assert(lkp->lk_interlock, MA_OWNED); 136 return (error); 137 } 138 139 /* 140 * Set, change, or release a lock. 141 * 142 * Shared requests increment the shared count. Exclusive requests set the 143 * LK_WANT_EXCL flag (preventing further shared locks), and wait for already 144 * accepted shared locks and shared-to-exclusive upgrades to go away. 145 */ 146 int 147 lockmgr(lkp, flags, interlkp, td) 148 struct lock *lkp; 149 u_int flags; 150 struct mtx *interlkp; 151 struct thread *td; 152 { 153 int error; 154 struct thread *thr; 155 int extflags, lockflags; 156 157 error = 0; 158 if (td == NULL) 159 thr = LK_KERNPROC; 160 else 161 thr = td; 162 163 if ((flags & LK_INTERNAL) == 0) 164 mtx_lock(lkp->lk_interlock); 165 CTR6(KTR_LOCK, 166 "lockmgr(): lkp == %p (lk_wmesg == \"%s\"), owner == %p, exclusivecount == %d, flags == 0x%x, " 167 "td == %p", lkp, lkp->lk_wmesg, lkp->lk_lockholder, 168 lkp->lk_exclusivecount, flags, td); 169 #ifdef DEBUG_LOCKS 170 { 171 struct stack stack; /* XXX */ 172 stack_save(&stack); 173 CTRSTACK(KTR_LOCK, &stack, 0, 1); 174 } 175 #endif 176 177 if (flags & LK_INTERLOCK) { 178 mtx_assert(interlkp, MA_OWNED | MA_NOTRECURSED); 179 mtx_unlock(interlkp); 180 } 181 182 if ((flags & (LK_NOWAIT|LK_RELEASE)) == 0) 183 WITNESS_WARN(WARN_GIANTOK | WARN_SLEEPOK, 184 &lkp->lk_interlock->mtx_object, 185 "Acquiring lockmgr lock \"%s\"", lkp->lk_wmesg); 186 187 if (panicstr != NULL) { 188 mtx_unlock(lkp->lk_interlock); 189 return (0); 190 } 191 if ((lkp->lk_flags & LK_NOSHARE) && 192 (flags & LK_TYPE_MASK) == 
LK_SHARED) { 193 flags &= ~LK_TYPE_MASK; 194 flags |= LK_EXCLUSIVE; 195 } 196 extflags = (flags | lkp->lk_flags) & LK_EXTFLG_MASK; 197 198 switch (flags & LK_TYPE_MASK) { 199 200 case LK_SHARED: 201 /* 202 * If we are not the exclusive lock holder, we have to block 203 * while there is an exclusive lock holder or while an 204 * exclusive lock request or upgrade request is in progress. 205 * 206 * However, if TDP_DEADLKTREAT is set, we override exclusive 207 * lock requests or upgrade requests ( but not the exclusive 208 * lock itself ). 209 */ 210 if (lkp->lk_lockholder != thr) { 211 lockflags = LK_HAVE_EXCL; 212 if (td != NULL && !(td->td_pflags & TDP_DEADLKTREAT)) 213 lockflags |= LK_WANT_EXCL | LK_WANT_UPGRADE; 214 error = acquire(&lkp, extflags, lockflags); 215 if (error) 216 break; 217 sharelock(td, lkp, 1); 218 #if defined(DEBUG_LOCKS) 219 stack_save(&lkp->lk_stack); 220 #endif 221 break; 222 } 223 /* 224 * We hold an exclusive lock, so downgrade it to shared. 225 * An alternative would be to fail with EDEADLK. 226 */ 227 sharelock(td, lkp, 1); 228 /* FALLTHROUGH downgrade */ 229 230 case LK_DOWNGRADE: 231 KASSERT(lkp->lk_lockholder == thr && lkp->lk_exclusivecount != 0, 232 ("lockmgr: not holding exclusive lock " 233 "(owner thread (%p) != thread (%p), exlcnt (%d) != 0", 234 lkp->lk_lockholder, thr, lkp->lk_exclusivecount)); 235 sharelock(td, lkp, lkp->lk_exclusivecount); 236 COUNT(td, -lkp->lk_exclusivecount); 237 lkp->lk_exclusivecount = 0; 238 lkp->lk_flags &= ~LK_HAVE_EXCL; 239 lkp->lk_lockholder = LK_NOPROC; 240 if (lkp->lk_waitcount) 241 wakeup((void *)lkp); 242 break; 243 244 case LK_EXCLUPGRADE: 245 /* 246 * If another process is ahead of us to get an upgrade, 247 * then we want to fail rather than have an intervening 248 * exclusive access. 
249 */ 250 if (lkp->lk_flags & LK_WANT_UPGRADE) { 251 shareunlock(td, lkp, 1); 252 error = EBUSY; 253 break; 254 } 255 /* FALLTHROUGH normal upgrade */ 256 257 case LK_UPGRADE: 258 /* 259 * Upgrade a shared lock to an exclusive one. If another 260 * shared lock has already requested an upgrade to an 261 * exclusive lock, our shared lock is released and an 262 * exclusive lock is requested (which will be granted 263 * after the upgrade). If we return an error, the file 264 * will always be unlocked. 265 */ 266 if (lkp->lk_lockholder == thr) 267 panic("lockmgr: upgrade exclusive lock"); 268 if (lkp->lk_sharecount <= 0) 269 panic("lockmgr: upgrade without shared"); 270 shareunlock(td, lkp, 1); 271 /* 272 * If we are just polling, check to see if we will block. 273 */ 274 if ((extflags & LK_NOWAIT) && 275 ((lkp->lk_flags & LK_WANT_UPGRADE) || 276 lkp->lk_sharecount > 1)) { 277 error = EBUSY; 278 break; 279 } 280 if ((lkp->lk_flags & LK_WANT_UPGRADE) == 0) { 281 /* 282 * We are first shared lock to request an upgrade, so 283 * request upgrade and wait for the shared count to 284 * drop to zero, then take exclusive lock. 285 */ 286 lkp->lk_flags |= LK_WANT_UPGRADE; 287 error = acquire(&lkp, extflags, LK_SHARE_NONZERO); 288 lkp->lk_flags &= ~LK_WANT_UPGRADE; 289 290 if (error) { 291 if ((lkp->lk_flags & ( LK_WANT_EXCL | LK_WAIT_NONZERO)) == (LK_WANT_EXCL | LK_WAIT_NONZERO)) 292 wakeup((void *)lkp); 293 break; 294 } 295 if (lkp->lk_exclusivecount != 0) 296 panic("lockmgr: non-zero exclusive count"); 297 lkp->lk_flags |= LK_HAVE_EXCL; 298 lkp->lk_lockholder = thr; 299 lkp->lk_exclusivecount = 1; 300 COUNT(td, 1); 301 #if defined(DEBUG_LOCKS) 302 stack_save(&lkp->lk_stack); 303 #endif 304 break; 305 } 306 /* 307 * Someone else has requested upgrade. Release our shared 308 * lock, awaken upgrade requestor if we are the last shared 309 * lock, then request an exclusive lock. 
310 */ 311 if ( (lkp->lk_flags & (LK_SHARE_NONZERO|LK_WAIT_NONZERO)) == 312 LK_WAIT_NONZERO) 313 wakeup((void *)lkp); 314 /* FALLTHROUGH exclusive request */ 315 316 case LK_EXCLUSIVE: 317 if (lkp->lk_lockholder == thr && thr != LK_KERNPROC) { 318 /* 319 * Recursive lock. 320 */ 321 if ((extflags & (LK_NOWAIT | LK_CANRECURSE)) == 0) 322 panic("lockmgr: locking against myself"); 323 if ((extflags & LK_CANRECURSE) != 0) { 324 lkp->lk_exclusivecount++; 325 COUNT(td, 1); 326 break; 327 } 328 } 329 /* 330 * If we are just polling, check to see if we will sleep. 331 */ 332 if ((extflags & LK_NOWAIT) && 333 (lkp->lk_flags & (LK_HAVE_EXCL | LK_WANT_EXCL | LK_WANT_UPGRADE | LK_SHARE_NONZERO))) { 334 error = EBUSY; 335 break; 336 } 337 /* 338 * Try to acquire the want_exclusive flag. 339 */ 340 error = acquire(&lkp, extflags, (LK_HAVE_EXCL | LK_WANT_EXCL)); 341 if (error) 342 break; 343 lkp->lk_flags |= LK_WANT_EXCL; 344 /* 345 * Wait for shared locks and upgrades to finish. 346 */ 347 error = acquire(&lkp, extflags, LK_HAVE_EXCL | LK_WANT_UPGRADE | LK_SHARE_NONZERO); 348 lkp->lk_flags &= ~LK_WANT_EXCL; 349 if (error) { 350 if (lkp->lk_flags & LK_WAIT_NONZERO) 351 wakeup((void *)lkp); 352 break; 353 } 354 lkp->lk_flags |= LK_HAVE_EXCL; 355 lkp->lk_lockholder = thr; 356 if (lkp->lk_exclusivecount != 0) 357 panic("lockmgr: non-zero exclusive count"); 358 lkp->lk_exclusivecount = 1; 359 COUNT(td, 1); 360 #if defined(DEBUG_LOCKS) 361 stack_save(&lkp->lk_stack); 362 #endif 363 break; 364 365 case LK_RELEASE: 366 if (lkp->lk_exclusivecount != 0) { 367 if (lkp->lk_lockholder != thr && 368 lkp->lk_lockholder != LK_KERNPROC) { 369 panic("lockmgr: thread %p, not %s %p unlocking", 370 thr, "exclusive lock holder", 371 lkp->lk_lockholder); 372 } 373 if (lkp->lk_lockholder != LK_KERNPROC) 374 COUNT(td, -1); 375 if (lkp->lk_exclusivecount == 1) { 376 lkp->lk_flags &= ~LK_HAVE_EXCL; 377 lkp->lk_lockholder = LK_NOPROC; 378 lkp->lk_exclusivecount = 0; 379 } else { 380 
lkp->lk_exclusivecount--; 381 } 382 } else if (lkp->lk_flags & LK_SHARE_NONZERO) 383 shareunlock(td, lkp, 1); 384 else { 385 printf("lockmgr: thread %p unlocking unheld lock\n", 386 thr); 387 kdb_backtrace(); 388 } 389 390 if (lkp->lk_flags & LK_WAIT_NONZERO) 391 wakeup((void *)lkp); 392 break; 393 394 case LK_DRAIN: 395 /* 396 * Check that we do not already hold the lock, as it can 397 * never drain if we do. Unfortunately, we have no way to 398 * check for holding a shared lock, but at least we can 399 * check for an exclusive one. 400 */ 401 if (lkp->lk_lockholder == thr) 402 panic("lockmgr: draining against myself"); 403 404 error = acquiredrain(lkp, extflags); 405 if (error) 406 break; 407 lkp->lk_flags |= LK_DRAINING | LK_HAVE_EXCL; 408 lkp->lk_lockholder = thr; 409 lkp->lk_exclusivecount = 1; 410 COUNT(td, 1); 411 #if defined(DEBUG_LOCKS) 412 stack_save(&lkp->lk_stack); 413 #endif 414 break; 415 416 default: 417 mtx_unlock(lkp->lk_interlock); 418 panic("lockmgr: unknown locktype request %d", 419 flags & LK_TYPE_MASK); 420 /* NOTREACHED */ 421 } 422 if ((lkp->lk_flags & LK_WAITDRAIN) && 423 (lkp->lk_flags & (LK_HAVE_EXCL | LK_WANT_EXCL | LK_WANT_UPGRADE | 424 LK_SHARE_NONZERO | LK_WAIT_NONZERO)) == 0) { 425 lkp->lk_flags &= ~LK_WAITDRAIN; 426 wakeup((void *)&lkp->lk_flags); 427 } 428 mtx_unlock(lkp->lk_interlock); 429 return (error); 430 } 431 432 static int 433 acquiredrain(struct lock *lkp, int extflags) { 434 int error; 435 436 if ((extflags & LK_NOWAIT) && (lkp->lk_flags & LK_ALL)) { 437 return EBUSY; 438 } 439 while (lkp->lk_flags & LK_ALL) { 440 lkp->lk_flags |= LK_WAITDRAIN; 441 error = msleep(&lkp->lk_flags, lkp->lk_interlock, lkp->lk_prio, 442 lkp->lk_wmesg, 443 ((extflags & LK_TIMELOCK) ? lkp->lk_timo : 0)); 444 if (error) 445 return error; 446 if (extflags & LK_SLEEPFAIL) { 447 return ENOLCK; 448 } 449 } 450 return 0; 451 } 452 453 /* 454 * Transfer any waiting processes from one lock to another. 
455 */ 456 void 457 transferlockers(from, to) 458 struct lock *from; 459 struct lock *to; 460 { 461 462 KASSERT(from != to, ("lock transfer to self")); 463 KASSERT((from->lk_flags&LK_WAITDRAIN) == 0, ("transfer draining lock")); 464 465 mtx_lock(from->lk_interlock); 466 if (from->lk_waitcount == 0) { 467 mtx_unlock(from->lk_interlock); 468 return; 469 } 470 from->lk_newlock = to; 471 wakeup((void *)from); 472 msleep(&from->lk_newlock, from->lk_interlock, from->lk_prio, 473 "lkxfer", 0); 474 from->lk_newlock = NULL; 475 from->lk_flags &= ~(LK_WANT_EXCL | LK_WANT_UPGRADE); 476 KASSERT(from->lk_waitcount == 0, ("active lock")); 477 mtx_unlock(from->lk_interlock); 478 } 479 480 481 /* 482 * Initialize a lock; required before use. 483 */ 484 void 485 lockinit(lkp, prio, wmesg, timo, flags) 486 struct lock *lkp; 487 int prio; 488 const char *wmesg; 489 int timo; 490 int flags; 491 { 492 CTR5(KTR_LOCK, "lockinit(): lkp == %p, prio == %d, wmesg == \"%s\", " 493 "timo == %d, flags = 0x%x\n", lkp, prio, wmesg, timo, flags); 494 495 lkp->lk_interlock = mtx_pool_alloc(mtxpool_lockbuilder); 496 lkp->lk_flags = (flags & LK_EXTFLG_MASK); 497 lkp->lk_sharecount = 0; 498 lkp->lk_waitcount = 0; 499 lkp->lk_exclusivecount = 0; 500 lkp->lk_prio = prio; 501 lkp->lk_wmesg = wmesg; 502 lkp->lk_timo = timo; 503 lkp->lk_lockholder = LK_NOPROC; 504 lkp->lk_newlock = NULL; 505 #ifdef DEBUG_LOCKS 506 stack_zero(&lkp->lk_stack); 507 #endif 508 } 509 510 /* 511 * Destroy a lock. 512 */ 513 void 514 lockdestroy(lkp) 515 struct lock *lkp; 516 { 517 CTR2(KTR_LOCK, "lockdestroy(): lkp == %p (lk_wmesg == \"%s\")", 518 lkp, lkp->lk_wmesg); 519 } 520 521 /* 522 * Determine the status of a lock. 
523 */ 524 int 525 lockstatus(lkp, td) 526 struct lock *lkp; 527 struct thread *td; 528 { 529 int lock_type = 0; 530 int interlocked; 531 532 if (!kdb_active) { 533 interlocked = 1; 534 mtx_lock(lkp->lk_interlock); 535 } else 536 interlocked = 0; 537 if (lkp->lk_exclusivecount != 0) { 538 if (td == NULL || lkp->lk_lockholder == td) 539 lock_type = LK_EXCLUSIVE; 540 else 541 lock_type = LK_EXCLOTHER; 542 } else if (lkp->lk_sharecount != 0) 543 lock_type = LK_SHARED; 544 if (interlocked) 545 mtx_unlock(lkp->lk_interlock); 546 return (lock_type); 547 } 548 549 /* 550 * Determine the number of holders of a lock. 551 */ 552 int 553 lockcount(lkp) 554 struct lock *lkp; 555 { 556 int count; 557 558 mtx_lock(lkp->lk_interlock); 559 count = lkp->lk_exclusivecount + lkp->lk_sharecount; 560 mtx_unlock(lkp->lk_interlock); 561 return (count); 562 } 563 564 /* 565 * Print out information about state of a lock. Used by VOP_PRINT 566 * routines to display status about contained locks. 567 */ 568 void 569 lockmgr_printinfo(lkp) 570 struct lock *lkp; 571 { 572 573 if (lkp->lk_sharecount) 574 printf(" lock type %s: SHARED (count %d)", lkp->lk_wmesg, 575 lkp->lk_sharecount); 576 else if (lkp->lk_flags & LK_HAVE_EXCL) 577 printf(" lock type %s: EXCL (count %d) by thread %p (pid %d)", 578 lkp->lk_wmesg, lkp->lk_exclusivecount, 579 lkp->lk_lockholder, lkp->lk_lockholder->td_proc->p_pid); 580 if (lkp->lk_waitcount > 0) 581 printf(" with %d pending", lkp->lk_waitcount); 582 #ifdef DEBUG_LOCKS 583 stack_print(&lkp->lk_stack); 584 #endif 585 } 586