168762Smckusick /* 268762Smckusick * Copyright (c) 1995 368762Smckusick * The Regents of the University of California. All rights reserved. 468762Smckusick * 568775Smckusick * This code contains ideas from software contributed to Berkeley by 668762Smckusick * Avadis Tevanian, Jr., Michael Wayne Young, and the Mach Operating 768762Smckusick * System project at Carnegie-Mellon University. 868762Smckusick * 968762Smckusick * %sccs.include.redist.c% 1068762Smckusick * 11*68933Smckusick * @(#)kern_lock.c 8.7 (Berkeley) 04/27/95 1268762Smckusick */ 1368762Smckusick 1468762Smckusick #include <sys/param.h> 1568762Smckusick #include <sys/proc.h> 1668762Smckusick #include <sys/lock.h> 1768762Smckusick 1868762Smckusick /* 1968762Smckusick * Locking primitives implementation. 2068762Smckusick * Locks provide shared/exclusive sychronization. 2168762Smckusick */ 2268762Smckusick 2368762Smckusick #if NCPUS > 1 2468762Smckusick 2568762Smckusick /* 2668762Smckusick * For multiprocessor system, try spin lock first. 2768762Smckusick * 2868762Smckusick * This should be inline expanded below, but we cannot have #if 2968762Smckusick * inside a multiline define. 3068762Smckusick */ 3168762Smckusick int lock_wait_time = 100; 3268762Smckusick #define PAUSE(lkp, wanted) \ 3368762Smckusick if (lock_wait_time > 0) { \ 3468762Smckusick int i; \ 3568762Smckusick \ 36*68933Smckusick simple_unlock(&lkp->lk_interlock); \ 3768762Smckusick for (i = lock_wait_time; i > 0; i--) \ 3868762Smckusick if (!(wanted)) \ 3968762Smckusick break; \ 40*68933Smckusick simple_lock(&lkp->lk_interlock); \ 4168762Smckusick } \ 4268762Smckusick if (!(wanted)) \ 4368762Smckusick break; 4468762Smckusick 4568762Smckusick #else /* NCPUS == 1 */ 4668762Smckusick 4768762Smckusick /* 4868762Smckusick * It is an error to spin on a uniprocessor as nothing will ever cause 49*68933Smckusick * the simple lock to clear while we are executing. 5068762Smckusick */ 5168762Smckusick #define PAUSE(lkp, wanted) 5268762Smckusick 53*68933Smckusick /* 54*68933Smckusick * Panic messages for inline expanded simple locks. 55*68933Smckusick * Put text here to avoid hundreds of copies. 56*68933Smckusick */ 57*68933Smckusick const char *simple_lock_held = "simple_lock: lock held"; 58*68933Smckusick const char *simple_lock_not_held = "simple_lock: lock not held"; 59*68933Smckusick 6068762Smckusick #endif /* NCPUS == 1 */ 6168762Smckusick 6268762Smckusick /* 6368762Smckusick * Acquire a resource. 6468762Smckusick */ 6568762Smckusick #define ACQUIRE(lkp, error, extflags, wanted) \ 6668762Smckusick PAUSE(lkp, wanted); \ 6768762Smckusick for (error = 0; wanted; ) { \ 6868800Smckusick (lkp)->lk_waitcount++; \ 69*68933Smckusick simple_unlock(&(lkp)->lk_interlock); \ 7068779Smckusick error = tsleep((void *)lkp, (lkp)->lk_prio, \ 7168779Smckusick (lkp)->lk_wmesg, (lkp)->lk_timo); \ 72*68933Smckusick simple_lock(&(lkp)->lk_interlock); \ 7368800Smckusick (lkp)->lk_waitcount--; \ 7468762Smckusick if (error) \ 7568762Smckusick break; \ 7668762Smckusick if ((extflags) & LK_SLEEPFAIL) { \ 7768762Smckusick error = ENOLCK; \ 7868762Smckusick break; \ 7968762Smckusick } \ 8068762Smckusick } 8168762Smckusick 8268762Smckusick /* 8368762Smckusick * Initialize a lock; required before use. 8468762Smckusick */ 8568782Smckusick void 8668782Smckusick lock_init(lkp, prio, wmesg, timo, flags) 8768762Smckusick struct lock *lkp; 8868762Smckusick int prio; 8968762Smckusick char *wmesg; 9068762Smckusick int timo; 9168762Smckusick int flags; 9268762Smckusick { 9368762Smckusick bzero(lkp, sizeof(struct lock)); 94*68933Smckusick simple_lock_init(&lkp->lk_interlock); 9568762Smckusick lkp->lk_flags = flags & LK_EXTFLG_MASK; 9668762Smckusick lkp->lk_prio = prio; 9768762Smckusick lkp->lk_timo = timo; 9868762Smckusick lkp->lk_wmesg = wmesg; 9968762Smckusick lkp->lk_lockholder = LK_NOPROC; 10068762Smckusick } 10168762Smckusick 10268762Smckusick /* 10368780Smckusick * Determine the status of a lock. 10468780Smckusick */ 10568780Smckusick int 10668780Smckusick lockstatus(lkp) 10768780Smckusick struct lock *lkp; 10868780Smckusick { 10968780Smckusick int lock_type = 0; 11068780Smckusick 111*68933Smckusick simple_lock(&lkp->lk_interlock); 11268780Smckusick if (lkp->lk_exclusivecount != 0) 11368780Smckusick lock_type = LK_EXCLUSIVE; 11468780Smckusick else if (lkp->lk_sharecount != 0) 11568780Smckusick lock_type = LK_SHARED; 116*68933Smckusick simple_unlock(&lkp->lk_interlock); 11768780Smckusick return (lock_type); 11868780Smckusick } 11968780Smckusick 12068780Smckusick /* 12168762Smckusick * Set, change, or release a lock. 12268762Smckusick * 12368762Smckusick * Shared requests increment the shared count. Exclusive requests set the 12468762Smckusick * LK_WANT_EXCL flag (preventing further shared locks), and wait for already 12568762Smckusick * accepted shared locks and shared-to-exclusive upgrades to go away. 12668762Smckusick */ 12768782Smckusick int 12868800Smckusick lockmgr(lkp, flags, p) 12968779Smckusick volatile struct lock *lkp; 13068800Smckusick u_int flags; 13168762Smckusick struct proc *p; 13268762Smckusick { 13368779Smckusick int error; 13468762Smckusick pid_t pid; 13568779Smckusick volatile int extflags; 13668762Smckusick 13768800Smckusick error = 0; 13868762Smckusick pid = p->p_pid; 139*68933Smckusick simple_lock(&lkp->lk_interlock); 14068762Smckusick extflags = (flags | lkp->lk_flags) & LK_EXTFLG_MASK; 14168800Smckusick if (lkp->lk_flags & LK_DRAINED) 14268800Smckusick panic("lockmgr: using decommissioned lock"); 14368762Smckusick 14468762Smckusick switch (flags & LK_TYPE_MASK) { 14568762Smckusick 14668762Smckusick case LK_SHARED: 14768762Smckusick if (lkp->lk_lockholder != pid) { 14868762Smckusick /* 14968762Smckusick * If just polling, check to see if we will block. 15068762Smckusick */ 15168762Smckusick if ((extflags & LK_NOWAIT) && (lkp->lk_flags & 15268762Smckusick (LK_HAVE_EXCL | LK_WANT_EXCL | LK_WANT_UPGRADE))) { 15368800Smckusick error = EBUSY; 15468800Smckusick break; 15568762Smckusick } 15668762Smckusick /* 15768762Smckusick * Wait for exclusive locks and upgrades to clear. 15868762Smckusick */ 15968762Smckusick ACQUIRE(lkp, error, extflags, lkp->lk_flags & 16068762Smckusick (LK_HAVE_EXCL | LK_WANT_EXCL | LK_WANT_UPGRADE)); 16168800Smckusick if (error) 16268800Smckusick break; 16368762Smckusick lkp->lk_sharecount++; 16468800Smckusick break; 16568762Smckusick } 16668762Smckusick /* 16768762Smckusick * We hold an exclusive lock, so downgrade it to shared. 16868762Smckusick * An alternative would be to fail with EDEADLK. 16968762Smckusick */ 17068762Smckusick lkp->lk_sharecount++; 17168762Smckusick /* fall into downgrade */ 17268762Smckusick 17368762Smckusick case LK_DOWNGRADE: 17468762Smckusick if (lkp->lk_lockholder != pid || lkp->lk_exclusivecount == 0) 17568762Smckusick panic("lockmgr: not holding exclusive lock"); 17668762Smckusick lkp->lk_sharecount += lkp->lk_exclusivecount; 17768762Smckusick lkp->lk_exclusivecount = 0; 17868762Smckusick lkp->lk_flags &= ~LK_HAVE_EXCL; 17968762Smckusick lkp->lk_lockholder = LK_NOPROC; 18068800Smckusick if (lkp->lk_waitcount) 18168779Smckusick wakeup((void *)lkp); 18268800Smckusick break; 18368762Smckusick 18468779Smckusick case LK_EXCLUPGRADE: 18568779Smckusick /* 18668779Smckusick * If another process is ahead of us to get an upgrade, 18768779Smckusick * then we want to fail rather than have an intervening 18868779Smckusick * exclusive access. 18968779Smckusick */ 19068779Smckusick if (lkp->lk_flags & LK_WANT_UPGRADE) { 19168779Smckusick lkp->lk_sharecount--; 19268800Smckusick error = EBUSY; 19368800Smckusick break; 19468779Smckusick } 19568779Smckusick /* fall into normal upgrade */ 19668779Smckusick 19768762Smckusick case LK_UPGRADE: 19868762Smckusick /* 19968762Smckusick * Upgrade a shared lock to an exclusive one. If another 20068762Smckusick * shared lock has already requested an upgrade to an 20168762Smckusick * exclusive lock, our shared lock is released and an 20268762Smckusick * exclusive lock is requested (which will be granted 20368775Smckusick * after the upgrade). If we return an error, the file 20468775Smckusick * will always be unlocked. 20568762Smckusick */ 20668762Smckusick if (lkp->lk_lockholder == pid || lkp->lk_sharecount <= 0) 20768762Smckusick panic("lockmgr: upgrade exclusive lock"); 20868775Smckusick lkp->lk_sharecount--; 20968762Smckusick /* 21068762Smckusick * If we are just polling, check to see if we will block. 21168762Smckusick */ 21268762Smckusick if ((extflags & LK_NOWAIT) && 21368762Smckusick ((lkp->lk_flags & LK_WANT_UPGRADE) || 21468762Smckusick lkp->lk_sharecount > 1)) { 21568800Smckusick error = EBUSY; 21668800Smckusick break; 21768762Smckusick } 21868762Smckusick if ((lkp->lk_flags & LK_WANT_UPGRADE) == 0) { 21968762Smckusick /* 22068762Smckusick * We are first shared lock to request an upgrade, so 22168762Smckusick * request upgrade and wait for the shared count to 22268762Smckusick * drop to zero, then take exclusive lock. 22368762Smckusick */ 22468762Smckusick lkp->lk_flags |= LK_WANT_UPGRADE; 22568762Smckusick ACQUIRE(lkp, error, extflags, lkp->lk_sharecount); 22668762Smckusick lkp->lk_flags &= ~LK_WANT_UPGRADE; 22768800Smckusick if (error) 22868800Smckusick break; 22968762Smckusick lkp->lk_flags |= LK_HAVE_EXCL; 23068762Smckusick lkp->lk_lockholder = pid; 23168762Smckusick if (lkp->lk_exclusivecount != 0) 23268762Smckusick panic("lockmgr: non-zero exclusive count"); 23368762Smckusick lkp->lk_exclusivecount = 1; 23468800Smckusick break; 23568762Smckusick } 23668762Smckusick /* 23768762Smckusick * Someone else has requested upgrade. Release our shared 23868762Smckusick * lock, awaken upgrade requestor if we are the last shared 23968762Smckusick * lock, then request an exclusive lock. 24068762Smckusick */ 24168800Smckusick if (lkp->lk_sharecount == 0 && lkp->lk_waitcount) 24268779Smckusick wakeup((void *)lkp); 24368762Smckusick /* fall into exclusive request */ 24468762Smckusick 24568762Smckusick case LK_EXCLUSIVE: 24668762Smckusick if (lkp->lk_lockholder == pid) { 24768762Smckusick /* 24868762Smckusick * Recursive lock. 24968762Smckusick */ 25068762Smckusick if ((extflags & LK_CANRECURSE) == 0) 25168762Smckusick panic("lockmgr: locking against myself"); 25268762Smckusick lkp->lk_exclusivecount++; 25368800Smckusick break; 25468762Smckusick } 25568762Smckusick /* 25668762Smckusick * If we are just polling, check to see if we will sleep. 25768762Smckusick */ 25868762Smckusick if ((extflags & LK_NOWAIT) && ((lkp->lk_flags & 25968762Smckusick (LK_HAVE_EXCL | LK_WANT_EXCL | LK_WANT_UPGRADE)) || 26068762Smckusick lkp->lk_sharecount != 0)) { 26168800Smckusick error = EBUSY; 26268800Smckusick break; 26368762Smckusick } 26468762Smckusick /* 26568762Smckusick * Try to acquire the want_exclusive flag. 26668762Smckusick */ 26768762Smckusick ACQUIRE(lkp, error, extflags, lkp->lk_flags & 26868762Smckusick (LK_HAVE_EXCL | LK_WANT_EXCL)); 26968800Smckusick if (error) 27068800Smckusick break; 27168762Smckusick lkp->lk_flags |= LK_WANT_EXCL; 27268762Smckusick /* 27368762Smckusick * Wait for shared locks and upgrades to finish. 27468762Smckusick */ 27568762Smckusick ACQUIRE(lkp, error, extflags, lkp->lk_sharecount != 0 || 27668762Smckusick (lkp->lk_flags & LK_WANT_UPGRADE)); 27768762Smckusick lkp->lk_flags &= ~LK_WANT_EXCL; 27868800Smckusick if (error) 27968800Smckusick break; 28068762Smckusick lkp->lk_flags |= LK_HAVE_EXCL; 28168762Smckusick lkp->lk_lockholder = pid; 28268762Smckusick if (lkp->lk_exclusivecount != 0) 28368762Smckusick panic("lockmgr: non-zero exclusive count"); 28468762Smckusick lkp->lk_exclusivecount = 1; 28568800Smckusick break; 28668762Smckusick 28768762Smckusick case LK_RELEASE: 28868762Smckusick if (lkp->lk_exclusivecount != 0) { 28968800Smckusick if (pid != lkp->lk_lockholder) 29068800Smckusick panic("lockmgr: pid %d, not %s %d unlocking", 29168800Smckusick pid, "exclusive lock holder", 29268800Smckusick lkp->lk_lockholder); 29368762Smckusick lkp->lk_exclusivecount--; 29468762Smckusick if (lkp->lk_exclusivecount == 0) { 29568762Smckusick lkp->lk_flags &= ~LK_HAVE_EXCL; 29668762Smckusick lkp->lk_lockholder = LK_NOPROC; 29768762Smckusick } 29868762Smckusick } else if (lkp->lk_sharecount != 0) 29968762Smckusick lkp->lk_sharecount--; 30068800Smckusick if (lkp->lk_waitcount) 30168779Smckusick wakeup((void *)lkp); 30268800Smckusick break; 30368800Smckusick 30468800Smckusick case LK_DRAIN: 30568800Smckusick /* 30668800Smckusick * If we are just polling, check to see if we will sleep. 30768800Smckusick */ 30868800Smckusick if ((extflags & LK_NOWAIT) && ((lkp->lk_flags & 30968800Smckusick (LK_HAVE_EXCL | LK_WANT_EXCL | LK_WANT_UPGRADE)) || 31068800Smckusick lkp->lk_sharecount != 0 || lkp->lk_waitcount != 0)) { 31168800Smckusick error = EBUSY; 31268800Smckusick break; 31368762Smckusick } 31468800Smckusick PAUSE(lkp, ((lkp->lk_flags & 31568800Smckusick (LK_HAVE_EXCL | LK_WANT_EXCL | LK_WANT_UPGRADE)) || 31668800Smckusick lkp->lk_sharecount != 0 || lkp->lk_waitcount != 0)); 31768800Smckusick for (error = 0; ((lkp->lk_flags & 31868800Smckusick (LK_HAVE_EXCL | LK_WANT_EXCL | LK_WANT_UPGRADE)) || 31968800Smckusick lkp->lk_sharecount != 0 || lkp->lk_waitcount != 0); ) { 32068800Smckusick lkp->lk_flags |= LK_WAITDRAIN; 321*68933Smckusick simple_unlock(&lkp->lk_interlock); 32268800Smckusick if (error = tsleep((void *)&lkp->lk_flags, lkp->lk_prio, 32368800Smckusick lkp->lk_wmesg, lkp->lk_timo)) 32468800Smckusick return (error); 32568800Smckusick if ((extflags) & LK_SLEEPFAIL) 32668800Smckusick return (ENOLCK); 327*68933Smckusick simple_lock(&lkp->lk_interlock); 32868800Smckusick } 32968800Smckusick lkp->lk_flags |= LK_DRAINED; 33068800Smckusick break; 33168762Smckusick 33268762Smckusick default: 333*68933Smckusick simple_unlock(&lkp->lk_interlock); 33468762Smckusick panic("lockmgr: unknown locktype request %d", 33568762Smckusick flags & LK_TYPE_MASK); 33668775Smckusick /* NOTREACHED */ 33768762Smckusick } 33868800Smckusick if ((lkp->lk_flags & LK_WAITDRAIN) && ((lkp->lk_flags & 33968800Smckusick (LK_HAVE_EXCL | LK_WANT_EXCL | LK_WANT_UPGRADE)) == 0 && 34068800Smckusick lkp->lk_sharecount == 0 && lkp->lk_waitcount == 0)) { 34168800Smckusick lkp->lk_flags &= ~LK_WAITDRAIN; 34268800Smckusick wakeup((void *)&lkp->lk_flags); 34368800Smckusick } 344*68933Smckusick simple_unlock(&lkp->lk_interlock); 34568800Smckusick return (error); 34668762Smckusick } 347