xref: /csrg-svn/sys/kern/kern_lock.c (revision 68933)
168762Smckusick /*
268762Smckusick  * Copyright (c) 1995
368762Smckusick  *	The Regents of the University of California.  All rights reserved.
468762Smckusick  *
568775Smckusick  * This code contains ideas from software contributed to Berkeley by
668762Smckusick  * Avadis Tevanian, Jr., Michael Wayne Young, and the Mach Operating
768762Smckusick  * System project at Carnegie-Mellon University.
868762Smckusick  *
968762Smckusick  * %sccs.include.redist.c%
1068762Smckusick  *
11*68933Smckusick  *	@(#)kern_lock.c	8.7 (Berkeley) 04/27/95
1268762Smckusick  */
1368762Smckusick 
1468762Smckusick #include <sys/param.h>
1568762Smckusick #include <sys/proc.h>
1668762Smckusick #include <sys/lock.h>
1768762Smckusick 
1868762Smckusick /*
1968762Smckusick  * Locking primitives implementation.
2068762Smckusick  * Locks provide shared/exclusive synchronization.
2168762Smckusick  */
2268762Smckusick 
2368762Smckusick #if NCPUS > 1
2468762Smckusick 
/*
 * For multiprocessor system, try spin lock first.
 *
 * PAUSE(lkp, wanted) drops the interlock, polls `wanted' up to
 * lock_wait_time times, and retakes the interlock.  It never sleeps.
 * `wanted' is evaluated repeatedly, so it must be free of side effects.
 *
 * The macro deliberately contains no `break' of its own: it is expanded
 * inside the switch in lockmgr(), where a bare break would leave the
 * switch and skip the bookkeeping that follows.  Every user follows
 * PAUSE with a loop that re-tests `wanted', so no early exit is needed.
 *
 * This should be inline expanded below, but we cannot have #if
 * inside a multiline define.
 */
int lock_wait_time = 100;
#define PAUSE(lkp, wanted)						\
	do {								\
		if (lock_wait_time > 0) {				\
			int i;						\
									\
			simple_unlock(&(lkp)->lk_interlock);		\
			for (i = lock_wait_time; i > 0; i--)		\
				if (!(wanted))				\
					break;				\
			simple_lock(&(lkp)->lk_interlock);		\
		}							\
	} while (0)
4468762Smckusick 
4568762Smckusick #else /* NCPUS == 1 */
4668762Smckusick 
/*
 * Uniprocessor case: PAUSE expands to nothing.  Spinning here would be
 * an error, since nothing will ever cause the simple lock to clear
 * while we are executing.
 */
#define PAUSE(lkp, wanted)	/* no spin phase */
5268762Smckusick 
/*
 * Message text for the panics raised by the inline expanded simple
 * locks.  The strings are defined once here to avoid hundreds of copies.
 */
const char *simple_lock_held = "simple_lock: lock held",
    *simple_lock_not_held = "simple_lock: lock not held";
59*68933Smckusick 
6068762Smckusick #endif /* NCPUS == 1 */
6168762Smckusick 
/*
 * Acquire a resource.
 *
 * Must be entered with lkp's interlock held; it is held again on exit.
 * After the optional PAUSE spin, sleeps on lkp until `wanted' becomes
 * false.  The interlock is dropped across each tsleep() and
 * lk_waitcount is raised while asleep so that releasers know a
 * wakeup() is needed.
 *
 * On completion `error' is:
 *	0	the resource is available (`wanted' is false);
 *	ENOLCK	we had to sleep and LK_SLEEPFAIL is set in extflags;
 *	other	whatever non-zero value tsleep() returned.
 *
 * `wanted' is evaluated many times and must have no side effects.
 * The body is wrapped in do/while(0) so the macro is a single statement
 * and so that no `break' inside it can reach the caller's switch.
 */
#define ACQUIRE(lkp, error, extflags, wanted)				\
	do {								\
		(error) = 0;						\
		PAUSE(lkp, wanted);					\
		while (wanted) {					\
			(lkp)->lk_waitcount++;				\
			simple_unlock(&(lkp)->lk_interlock);		\
			(error) = tsleep((void *)(lkp), (lkp)->lk_prio,	\
			    (lkp)->lk_wmesg, (lkp)->lk_timo);		\
			simple_lock(&(lkp)->lk_interlock);		\
			(lkp)->lk_waitcount--;				\
			if (error)					\
				break;					\
			if ((extflags) & LK_SLEEPFAIL) {		\
				(error) = ENOLCK;			\
				break;					\
			}						\
		}							\
	} while (0)
8168762Smckusick 
8268762Smckusick /*
8368762Smckusick  * Initialize a lock; required before use.
8468762Smckusick  */
8568782Smckusick void
8668782Smckusick lock_init(lkp, prio, wmesg, timo, flags)
8768762Smckusick 	struct lock *lkp;
8868762Smckusick 	int prio;
8968762Smckusick 	char *wmesg;
9068762Smckusick 	int timo;
9168762Smckusick 	int flags;
9268762Smckusick {
9368762Smckusick 	bzero(lkp, sizeof(struct lock));
94*68933Smckusick 	simple_lock_init(&lkp->lk_interlock);
9568762Smckusick 	lkp->lk_flags = flags & LK_EXTFLG_MASK;
9668762Smckusick 	lkp->lk_prio = prio;
9768762Smckusick 	lkp->lk_timo = timo;
9868762Smckusick 	lkp->lk_wmesg = wmesg;
9968762Smckusick 	lkp->lk_lockholder = LK_NOPROC;
10068762Smckusick }
10168762Smckusick 
10268762Smckusick /*
10368780Smckusick  * Determine the status of a lock.
10468780Smckusick  */
10568780Smckusick int
10668780Smckusick lockstatus(lkp)
10768780Smckusick 	struct lock *lkp;
10868780Smckusick {
10968780Smckusick 	int lock_type = 0;
11068780Smckusick 
111*68933Smckusick 	simple_lock(&lkp->lk_interlock);
11268780Smckusick 	if (lkp->lk_exclusivecount != 0)
11368780Smckusick 		lock_type = LK_EXCLUSIVE;
11468780Smckusick 	else if (lkp->lk_sharecount != 0)
11568780Smckusick 		lock_type = LK_SHARED;
116*68933Smckusick 	simple_unlock(&lkp->lk_interlock);
11768780Smckusick 	return (lock_type);
11868780Smckusick }
11968780Smckusick 
12068780Smckusick /*
12168762Smckusick  * Set, change, or release a lock.
12268762Smckusick  *
12368762Smckusick  * Shared requests increment the shared count. Exclusive requests set the
12468762Smckusick  * LK_WANT_EXCL flag (preventing further shared locks), and wait for already
12568762Smckusick  * accepted shared locks and shared-to-exclusive upgrades to go away.
12668762Smckusick  */
12768782Smckusick int
12868800Smckusick lockmgr(lkp, flags, p)
12968779Smckusick 	volatile struct lock *lkp;
13068800Smckusick 	u_int flags;
13168762Smckusick 	struct proc *p;
13268762Smckusick {
13368779Smckusick 	int error;
13468762Smckusick 	pid_t pid;
13568779Smckusick 	volatile int extflags;
13668762Smckusick 
13768800Smckusick 	error = 0;
13868762Smckusick 	pid = p->p_pid;
139*68933Smckusick 	simple_lock(&lkp->lk_interlock);
14068762Smckusick 	extflags = (flags | lkp->lk_flags) & LK_EXTFLG_MASK;
14168800Smckusick 	if (lkp->lk_flags & LK_DRAINED)
14268800Smckusick 		panic("lockmgr: using decommissioned lock");
14368762Smckusick 
14468762Smckusick 	switch (flags & LK_TYPE_MASK) {
14568762Smckusick 
14668762Smckusick 	case LK_SHARED:
14768762Smckusick 		if (lkp->lk_lockholder != pid) {
14868762Smckusick 			/*
14968762Smckusick 			 * If just polling, check to see if we will block.
15068762Smckusick 			 */
15168762Smckusick 			if ((extflags & LK_NOWAIT) && (lkp->lk_flags &
15268762Smckusick 			    (LK_HAVE_EXCL | LK_WANT_EXCL | LK_WANT_UPGRADE))) {
15368800Smckusick 				error = EBUSY;
15468800Smckusick 				break;
15568762Smckusick 			}
15668762Smckusick 			/*
15768762Smckusick 			 * Wait for exclusive locks and upgrades to clear.
15868762Smckusick 			 */
15968762Smckusick 			ACQUIRE(lkp, error, extflags, lkp->lk_flags &
16068762Smckusick 			    (LK_HAVE_EXCL | LK_WANT_EXCL | LK_WANT_UPGRADE));
16168800Smckusick 			if (error)
16268800Smckusick 				break;
16368762Smckusick 			lkp->lk_sharecount++;
16468800Smckusick 			break;
16568762Smckusick 		}
16668762Smckusick 		/*
16768762Smckusick 		 * We hold an exclusive lock, so downgrade it to shared.
16868762Smckusick 		 * An alternative would be to fail with EDEADLK.
16968762Smckusick 		 */
17068762Smckusick 		lkp->lk_sharecount++;
17168762Smckusick 		/* fall into downgrade */
17268762Smckusick 
17368762Smckusick 	case LK_DOWNGRADE:
17468762Smckusick 		if (lkp->lk_lockholder != pid || lkp->lk_exclusivecount == 0)
17568762Smckusick 			panic("lockmgr: not holding exclusive lock");
17668762Smckusick 		lkp->lk_sharecount += lkp->lk_exclusivecount;
17768762Smckusick 		lkp->lk_exclusivecount = 0;
17868762Smckusick 		lkp->lk_flags &= ~LK_HAVE_EXCL;
17968762Smckusick 		lkp->lk_lockholder = LK_NOPROC;
18068800Smckusick 		if (lkp->lk_waitcount)
18168779Smckusick 			wakeup((void *)lkp);
18268800Smckusick 		break;
18368762Smckusick 
18468779Smckusick 	case LK_EXCLUPGRADE:
18568779Smckusick 		/*
18668779Smckusick 		 * If another process is ahead of us to get an upgrade,
18768779Smckusick 		 * then we want to fail rather than have an intervening
18868779Smckusick 		 * exclusive access.
18968779Smckusick 		 */
19068779Smckusick 		if (lkp->lk_flags & LK_WANT_UPGRADE) {
19168779Smckusick 			lkp->lk_sharecount--;
19268800Smckusick 			error = EBUSY;
19368800Smckusick 			break;
19468779Smckusick 		}
19568779Smckusick 		/* fall into normal upgrade */
19668779Smckusick 
19768762Smckusick 	case LK_UPGRADE:
19868762Smckusick 		/*
19968762Smckusick 		 * Upgrade a shared lock to an exclusive one. If another
20068762Smckusick 		 * shared lock has already requested an upgrade to an
20168762Smckusick 		 * exclusive lock, our shared lock is released and an
20268762Smckusick 		 * exclusive lock is requested (which will be granted
20368775Smckusick 		 * after the upgrade). If we return an error, the file
20468775Smckusick 		 * will always be unlocked.
20568762Smckusick 		 */
20668762Smckusick 		if (lkp->lk_lockholder == pid || lkp->lk_sharecount <= 0)
20768762Smckusick 			panic("lockmgr: upgrade exclusive lock");
20868775Smckusick 		lkp->lk_sharecount--;
20968762Smckusick 		/*
21068762Smckusick 		 * If we are just polling, check to see if we will block.
21168762Smckusick 		 */
21268762Smckusick 		if ((extflags & LK_NOWAIT) &&
21368762Smckusick 		    ((lkp->lk_flags & LK_WANT_UPGRADE) ||
21468762Smckusick 		     lkp->lk_sharecount > 1)) {
21568800Smckusick 			error = EBUSY;
21668800Smckusick 			break;
21768762Smckusick 		}
21868762Smckusick 		if ((lkp->lk_flags & LK_WANT_UPGRADE) == 0) {
21968762Smckusick 			/*
22068762Smckusick 			 * We are first shared lock to request an upgrade, so
22168762Smckusick 			 * request upgrade and wait for the shared count to
22268762Smckusick 			 * drop to zero, then take exclusive lock.
22368762Smckusick 			 */
22468762Smckusick 			lkp->lk_flags |= LK_WANT_UPGRADE;
22568762Smckusick 			ACQUIRE(lkp, error, extflags, lkp->lk_sharecount);
22668762Smckusick 			lkp->lk_flags &= ~LK_WANT_UPGRADE;
22768800Smckusick 			if (error)
22868800Smckusick 				break;
22968762Smckusick 			lkp->lk_flags |= LK_HAVE_EXCL;
23068762Smckusick 			lkp->lk_lockholder = pid;
23168762Smckusick 			if (lkp->lk_exclusivecount != 0)
23268762Smckusick 				panic("lockmgr: non-zero exclusive count");
23368762Smckusick 			lkp->lk_exclusivecount = 1;
23468800Smckusick 			break;
23568762Smckusick 		}
23668762Smckusick 		/*
23768762Smckusick 		 * Someone else has requested upgrade. Release our shared
23868762Smckusick 		 * lock, awaken upgrade requestor if we are the last shared
23968762Smckusick 		 * lock, then request an exclusive lock.
24068762Smckusick 		 */
24168800Smckusick 		if (lkp->lk_sharecount == 0 && lkp->lk_waitcount)
24268779Smckusick 			wakeup((void *)lkp);
24368762Smckusick 		/* fall into exclusive request */
24468762Smckusick 
24568762Smckusick 	case LK_EXCLUSIVE:
24668762Smckusick 		if (lkp->lk_lockholder == pid) {
24768762Smckusick 			/*
24868762Smckusick 			 *	Recursive lock.
24968762Smckusick 			 */
25068762Smckusick 			if ((extflags & LK_CANRECURSE) == 0)
25168762Smckusick 				panic("lockmgr: locking against myself");
25268762Smckusick 			lkp->lk_exclusivecount++;
25368800Smckusick 			break;
25468762Smckusick 		}
25568762Smckusick 		/*
25668762Smckusick 		 * If we are just polling, check to see if we will sleep.
25768762Smckusick 		 */
25868762Smckusick 		if ((extflags & LK_NOWAIT) && ((lkp->lk_flags &
25968762Smckusick 		     (LK_HAVE_EXCL | LK_WANT_EXCL | LK_WANT_UPGRADE)) ||
26068762Smckusick 		     lkp->lk_sharecount != 0)) {
26168800Smckusick 			error = EBUSY;
26268800Smckusick 			break;
26368762Smckusick 		}
26468762Smckusick 		/*
26568762Smckusick 		 * Try to acquire the want_exclusive flag.
26668762Smckusick 		 */
26768762Smckusick 		ACQUIRE(lkp, error, extflags, lkp->lk_flags &
26868762Smckusick 		    (LK_HAVE_EXCL | LK_WANT_EXCL));
26968800Smckusick 		if (error)
27068800Smckusick 			break;
27168762Smckusick 		lkp->lk_flags |= LK_WANT_EXCL;
27268762Smckusick 		/*
27368762Smckusick 		 * Wait for shared locks and upgrades to finish.
27468762Smckusick 		 */
27568762Smckusick 		ACQUIRE(lkp, error, extflags, lkp->lk_sharecount != 0 ||
27668762Smckusick 		       (lkp->lk_flags & LK_WANT_UPGRADE));
27768762Smckusick 		lkp->lk_flags &= ~LK_WANT_EXCL;
27868800Smckusick 		if (error)
27968800Smckusick 			break;
28068762Smckusick 		lkp->lk_flags |= LK_HAVE_EXCL;
28168762Smckusick 		lkp->lk_lockholder = pid;
28268762Smckusick 		if (lkp->lk_exclusivecount != 0)
28368762Smckusick 			panic("lockmgr: non-zero exclusive count");
28468762Smckusick 		lkp->lk_exclusivecount = 1;
28568800Smckusick 		break;
28668762Smckusick 
28768762Smckusick 	case LK_RELEASE:
28868762Smckusick 		if (lkp->lk_exclusivecount != 0) {
28968800Smckusick 			if (pid != lkp->lk_lockholder)
29068800Smckusick 				panic("lockmgr: pid %d, not %s %d unlocking",
29168800Smckusick 				    pid, "exclusive lock holder",
29268800Smckusick 				    lkp->lk_lockholder);
29368762Smckusick 			lkp->lk_exclusivecount--;
29468762Smckusick 			if (lkp->lk_exclusivecount == 0) {
29568762Smckusick 				lkp->lk_flags &= ~LK_HAVE_EXCL;
29668762Smckusick 				lkp->lk_lockholder = LK_NOPROC;
29768762Smckusick 			}
29868762Smckusick 		} else if (lkp->lk_sharecount != 0)
29968762Smckusick 			lkp->lk_sharecount--;
30068800Smckusick 		if (lkp->lk_waitcount)
30168779Smckusick 			wakeup((void *)lkp);
30268800Smckusick 		break;
30368800Smckusick 
30468800Smckusick 	case LK_DRAIN:
30568800Smckusick 		/*
30668800Smckusick 		 * If we are just polling, check to see if we will sleep.
30768800Smckusick 		 */
30868800Smckusick 		if ((extflags & LK_NOWAIT) && ((lkp->lk_flags &
30968800Smckusick 		     (LK_HAVE_EXCL | LK_WANT_EXCL | LK_WANT_UPGRADE)) ||
31068800Smckusick 		     lkp->lk_sharecount != 0 || lkp->lk_waitcount != 0)) {
31168800Smckusick 			error = EBUSY;
31268800Smckusick 			break;
31368762Smckusick 		}
31468800Smckusick 		PAUSE(lkp, ((lkp->lk_flags &
31568800Smckusick 		     (LK_HAVE_EXCL | LK_WANT_EXCL | LK_WANT_UPGRADE)) ||
31668800Smckusick 		     lkp->lk_sharecount != 0 || lkp->lk_waitcount != 0));
31768800Smckusick 		for (error = 0; ((lkp->lk_flags &
31868800Smckusick 		     (LK_HAVE_EXCL | LK_WANT_EXCL | LK_WANT_UPGRADE)) ||
31968800Smckusick 		     lkp->lk_sharecount != 0 || lkp->lk_waitcount != 0); ) {
32068800Smckusick 			lkp->lk_flags |= LK_WAITDRAIN;
321*68933Smckusick 			simple_unlock(&lkp->lk_interlock);
32268800Smckusick 			if (error = tsleep((void *)&lkp->lk_flags, lkp->lk_prio,
32368800Smckusick 			    lkp->lk_wmesg, lkp->lk_timo))
32468800Smckusick 				return (error);
32568800Smckusick 			if ((extflags) & LK_SLEEPFAIL)
32668800Smckusick 				return (ENOLCK);
327*68933Smckusick 			simple_lock(&lkp->lk_interlock);
32868800Smckusick 		}
32968800Smckusick 		lkp->lk_flags |= LK_DRAINED;
33068800Smckusick 		break;
33168762Smckusick 
33268762Smckusick 	default:
333*68933Smckusick 		simple_unlock(&lkp->lk_interlock);
33468762Smckusick 		panic("lockmgr: unknown locktype request %d",
33568762Smckusick 		    flags & LK_TYPE_MASK);
33668775Smckusick 		/* NOTREACHED */
33768762Smckusick 	}
33868800Smckusick 	if ((lkp->lk_flags & LK_WAITDRAIN) && ((lkp->lk_flags &
33968800Smckusick 	     (LK_HAVE_EXCL | LK_WANT_EXCL | LK_WANT_UPGRADE)) == 0 &&
34068800Smckusick 	     lkp->lk_sharecount == 0 && lkp->lk_waitcount == 0)) {
34168800Smckusick 		lkp->lk_flags &= ~LK_WAITDRAIN;
34268800Smckusick 		wakeup((void *)&lkp->lk_flags);
34368800Smckusick 	}
344*68933Smckusick 	simple_unlock(&lkp->lk_interlock);
34568800Smckusick 	return (error);
34668762Smckusick }
347