xref: /openbsd-src/lib/libc/db/hash/hash_buf.c (revision aea60bee5e9bad0aab62f480f19c2fb34c068de4)
/*	$OpenBSD: hash_buf.c,v 1.19 2015/01/16 16:48:51 deraadt Exp $	*/
21b727fc6Smillert 
/*-
 * Copyright (c) 1990, 1993, 1994
 *	The Regents of the University of California.  All rights reserved.
 *
 * This code is derived from software contributed to Berkeley by
 * Margo Seltzer.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. Neither the name of the University nor the names of its contributors
 *    may be used to endorse or promote products derived from this software
 *    without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */
34df930be7Sderaadt 
/*
 * PACKAGE: hash
 *
 * DESCRIPTION:
 *	Contains buffer management
 *
 * ROUTINES:
 * External
 *	__buf_init
 *	__get_buf
 *	__buf_free
 *	__reclaim_buf
 * Internal
 *	newbuf
 */
50df930be7Sderaadt 
51df930be7Sderaadt #include <errno.h>
52df930be7Sderaadt #include <stddef.h>
53df930be7Sderaadt #include <stdio.h>
54df930be7Sderaadt #include <stdlib.h>
5584769496Sderaadt #include <string.h>
56df930be7Sderaadt 
57df930be7Sderaadt #ifdef DEBUG
58df930be7Sderaadt #include <assert.h>
59df930be7Sderaadt #endif
60df930be7Sderaadt 
61df930be7Sderaadt #include <db.h>
62df930be7Sderaadt #include "hash.h"
63df930be7Sderaadt #include "page.h"
64df930be7Sderaadt #include "extern.h"
65df930be7Sderaadt 
66*aea60beeSderaadt #define MAXIMUM(a, b)	(((a) > (b)) ? (a) : (b))
67*aea60beeSderaadt 
68c72b5b24Smillert static BUFHEAD *newbuf(HTAB *, u_int32_t, BUFHEAD *);
69df930be7Sderaadt 
/*
 * List primitives for the buffer LRU.  Buffers are chained through their
 * next/prev members on a doubly-linked list whose anchor is hashp->bufhead.
 *
 * The multi-statement macros are wrapped in do { } while (0) so that each
 * expands to exactly one statement and can be used safely as the body of an
 * unbraced if/else.  Note that the arguments are evaluated more than once;
 * do not pass expressions with side effects.
 */

/* Unlink B from its place in the lru */
#define BUF_REMOVE(B) do { \
	(B)->prev->next = (B)->next; \
	(B)->next->prev = (B)->prev; \
} while (0)

/* Insert B after P */
#define BUF_INSERT(B, P) do { \
	(B)->next = (P)->next; \
	(B)->prev = (P); \
	(P)->next = (B); \
	(B)->next->prev = (B); \
} while (0)

/*
 * Both ends of the list, relative to the anchor.  These (and the two insert
 * helpers below) expand to expressions on a variable named "hashp", which
 * must be in scope at the point of use.
 */
#define	MRU	hashp->bufhead.next
#define	LRU	hashp->bufhead.prev

/* Insert B directly after the anchor (B becomes MRU). */
#define MRU_INSERT(B)	BUF_INSERT((B), &hashp->bufhead)
/* Insert B directly after the current LRU element (B becomes LRU). */
#define LRU_INSERT(B)	BUF_INSERT((B), LRU)
89df930be7Sderaadt 
90df930be7Sderaadt /*
91df930be7Sderaadt  * We are looking for a buffer with address "addr".  If prev_bp is NULL, then
92df930be7Sderaadt  * address is a bucket index.  If prev_bp is not NULL, then it points to the
93df930be7Sderaadt  * page previous to an overflow page that we are trying to find.
94df930be7Sderaadt  *
95df930be7Sderaadt  * CAVEAT:  The buffer header accessed via prev_bp's ovfl field may no longer
96df930be7Sderaadt  * be valid.  Therefore, you must always verify that its address matches the
97df930be7Sderaadt  * address you are seeking.
98df930be7Sderaadt  */
99e20a56a5Sotto BUFHEAD *
__get_buf(HTAB * hashp,u_int32_t addr,BUFHEAD * prev_bp,int newpage)100e20a56a5Sotto __get_buf(HTAB *hashp, u_int32_t addr,
101e20a56a5Sotto     BUFHEAD *prev_bp,	/* If prev_bp set, indicates a new overflow page. */
102e20a56a5Sotto     int newpage)
103df930be7Sderaadt {
1046c51c909Smillert 	BUFHEAD *bp;
1056c51c909Smillert 	u_int32_t is_disk_mask;
1066c51c909Smillert 	int is_disk, segment_ndx;
107df930be7Sderaadt 	SEGMENT segp;
108df930be7Sderaadt 
109df930be7Sderaadt 	is_disk = 0;
110df930be7Sderaadt 	is_disk_mask = 0;
111df930be7Sderaadt 	if (prev_bp) {
112df930be7Sderaadt 		bp = prev_bp->ovfl;
113df930be7Sderaadt 		if (!bp || (bp->addr != addr))
114df930be7Sderaadt 			bp = NULL;
115df930be7Sderaadt 		if (!newpage)
116df930be7Sderaadt 			is_disk = BUF_DISK;
117df930be7Sderaadt 	} else {
118df930be7Sderaadt 		/* Grab buffer out of directory */
119df930be7Sderaadt 		segment_ndx = addr & (hashp->SGSIZE - 1);
120df930be7Sderaadt 
121df930be7Sderaadt 		/* valid segment ensured by __call_hash() */
122df930be7Sderaadt 		segp = hashp->dir[addr >> hashp->SSHIFT];
123df930be7Sderaadt #ifdef DEBUG
124df930be7Sderaadt 		assert(segp != NULL);
125df930be7Sderaadt #endif
126df930be7Sderaadt 		bp = PTROF(segp[segment_ndx]);
127df930be7Sderaadt 		is_disk_mask = ISDISK(segp[segment_ndx]);
128df930be7Sderaadt 		is_disk = is_disk_mask || !hashp->new_file;
129df930be7Sderaadt 	}
130df930be7Sderaadt 
131df930be7Sderaadt 	if (!bp) {
132df930be7Sderaadt 		bp = newbuf(hashp, addr, prev_bp);
133df930be7Sderaadt 		if (!bp ||
134df930be7Sderaadt 		    __get_page(hashp, bp->page, addr, !prev_bp, is_disk, 0))
135df930be7Sderaadt 			return (NULL);
136df930be7Sderaadt 		if (!prev_bp)
137df930be7Sderaadt 			segp[segment_ndx] =
138df930be7Sderaadt 			    (BUFHEAD *)((ptrdiff_t)bp | is_disk_mask);
139df930be7Sderaadt 	} else {
140df930be7Sderaadt 		BUF_REMOVE(bp);
141df930be7Sderaadt 		MRU_INSERT(bp);
142df930be7Sderaadt 	}
143df930be7Sderaadt 	return (bp);
144df930be7Sderaadt }
145df930be7Sderaadt 
146df930be7Sderaadt /*
147df930be7Sderaadt  * We need a buffer for this page. Either allocate one, or evict a resident
148df930be7Sderaadt  * one (if we have as many buffers as we're allowed) and put this one in.
149df930be7Sderaadt  *
150df930be7Sderaadt  * If newbuf finds an error (returning NULL), it also sets errno.
151df930be7Sderaadt  */
152df930be7Sderaadt static BUFHEAD *
newbuf(HTAB * hashp,u_int32_t addr,BUFHEAD * prev_bp)153e20a56a5Sotto newbuf(HTAB *hashp, u_int32_t addr, BUFHEAD *prev_bp)
154df930be7Sderaadt {
1556c51c909Smillert 	BUFHEAD *bp;		/* The buffer we're going to use */
1566c51c909Smillert 	BUFHEAD *xbp;		/* Temp pointer */
1576c51c909Smillert 	BUFHEAD *next_xbp;
158df930be7Sderaadt 	SEGMENT segp;
159df930be7Sderaadt 	int segment_ndx;
160df930be7Sderaadt 	u_int16_t oaddr, *shortp;
161df930be7Sderaadt 
162df930be7Sderaadt 	oaddr = 0;
163df930be7Sderaadt 	bp = LRU;
164f19f124aSotto 
165f19f124aSotto         /* It is bad to overwrite the page under the cursor. */
166f19f124aSotto         if (bp == hashp->cpage) {
167f19f124aSotto                 BUF_REMOVE(bp);
168f19f124aSotto                 MRU_INSERT(bp);
169f19f124aSotto                 bp = LRU;
170f19f124aSotto         }
171f19f124aSotto 
172a4d2df78Smillert 	/* If prev_bp is part of bp overflow, create a new buffer. */
173e68688f2Smillert 	if (hashp->nbufs == 0 && prev_bp && bp->ovfl) {
174e68688f2Smillert 		BUFHEAD *ovfl;
175a4d2df78Smillert 
176e68688f2Smillert 		for (ovfl = bp->ovfl; ovfl ; ovfl = ovfl->ovfl) {
177e68688f2Smillert 			if (ovfl == prev_bp) {
178a4d2df78Smillert 				hashp->nbufs++;
179a4d2df78Smillert 				break;
180a4d2df78Smillert 			}
181a4d2df78Smillert 		}
182a4d2df78Smillert 	}
183a4d2df78Smillert 
184df930be7Sderaadt 	/*
185df930be7Sderaadt 	 * If LRU buffer is pinned, the buffer pool is too small. We need to
186df930be7Sderaadt 	 * allocate more buffers.
187df930be7Sderaadt 	 */
188f19f124aSotto 	if (hashp->nbufs || (bp->flags & BUF_PIN) || bp == hashp->cpage) {
189df930be7Sderaadt 		/* Allocate a new one */
190df930be7Sderaadt 		if ((bp = (BUFHEAD *)malloc(sizeof(BUFHEAD))) == NULL)
191df930be7Sderaadt 			return (NULL);
192bec2d00aSderaadt 		memset(bp, 0xff, sizeof(BUFHEAD));
193df930be7Sderaadt 		if ((bp->page = (char *)malloc(hashp->BSIZE)) == NULL) {
194df930be7Sderaadt 			free(bp);
195df930be7Sderaadt 			return (NULL);
196df930be7Sderaadt 		}
197bec2d00aSderaadt 		memset(bp->page, 0xff, hashp->BSIZE);
198df930be7Sderaadt 		if (hashp->nbufs)
199df930be7Sderaadt 			hashp->nbufs--;
200df930be7Sderaadt 	} else {
201df930be7Sderaadt 		/* Kick someone out */
202df930be7Sderaadt 		BUF_REMOVE(bp);
203df930be7Sderaadt 		/*
204df930be7Sderaadt 		 * If this is an overflow page with addr 0, it's already been
205df930be7Sderaadt 		 * flushed back in an overflow chain and initialized.
206df930be7Sderaadt 		 */
207df930be7Sderaadt 		if ((bp->addr != 0) || (bp->flags & BUF_BUCKET)) {
208df930be7Sderaadt 			/*
209df930be7Sderaadt 			 * Set oaddr before __put_page so that you get it
210df930be7Sderaadt 			 * before bytes are swapped.
211df930be7Sderaadt 			 */
212df930be7Sderaadt 			shortp = (u_int16_t *)bp->page;
213df930be7Sderaadt 			if (shortp[0])
214df930be7Sderaadt 				oaddr = shortp[shortp[0] - 1];
215df930be7Sderaadt 			if ((bp->flags & BUF_MOD) && __put_page(hashp, bp->page,
216df930be7Sderaadt 			    bp->addr, (int)IS_BUCKET(bp->flags), 0))
217df930be7Sderaadt 				return (NULL);
218df930be7Sderaadt 			/*
219df930be7Sderaadt 			 * Update the pointer to this page (i.e. invalidate it).
220df930be7Sderaadt 			 *
221df930be7Sderaadt 			 * If this is a new file (i.e. we created it at open
222df930be7Sderaadt 			 * time), make sure that we mark pages which have been
223df930be7Sderaadt 			 * written to disk so we retrieve them from disk later,
224df930be7Sderaadt 			 * rather than allocating new pages.
225df930be7Sderaadt 			 */
226df930be7Sderaadt 			if (IS_BUCKET(bp->flags)) {
227df930be7Sderaadt 				segment_ndx = bp->addr & (hashp->SGSIZE - 1);
228df930be7Sderaadt 				segp = hashp->dir[bp->addr >> hashp->SSHIFT];
229df930be7Sderaadt #ifdef DEBUG
230df930be7Sderaadt 				assert(segp != NULL);
231df930be7Sderaadt #endif
232df930be7Sderaadt 
233df930be7Sderaadt 				if (hashp->new_file &&
234df930be7Sderaadt 				    ((bp->flags & BUF_MOD) ||
235df930be7Sderaadt 				    ISDISK(segp[segment_ndx])))
236df930be7Sderaadt 					segp[segment_ndx] = (BUFHEAD *)BUF_DISK;
237df930be7Sderaadt 				else
238df930be7Sderaadt 					segp[segment_ndx] = NULL;
239df930be7Sderaadt 			}
240df930be7Sderaadt 			/*
241df930be7Sderaadt 			 * Since overflow pages can only be access by means of
242df930be7Sderaadt 			 * their bucket, free overflow pages associated with
243df930be7Sderaadt 			 * this bucket.
244df930be7Sderaadt 			 */
245df930be7Sderaadt 			for (xbp = bp; xbp->ovfl;) {
246df930be7Sderaadt 				next_xbp = xbp->ovfl;
247df930be7Sderaadt 				xbp->ovfl = 0;
248df930be7Sderaadt 				xbp = next_xbp;
249df930be7Sderaadt 
250df930be7Sderaadt 				/* Check that ovfl pointer is up date. */
251df930be7Sderaadt 				if (IS_BUCKET(xbp->flags) ||
252df930be7Sderaadt 				    (oaddr != xbp->addr))
253df930be7Sderaadt 					break;
254df930be7Sderaadt 
255df930be7Sderaadt 				shortp = (u_int16_t *)xbp->page;
256df930be7Sderaadt 				if (shortp[0])
257df930be7Sderaadt 					/* set before __put_page */
258df930be7Sderaadt 					oaddr = shortp[shortp[0] - 1];
259df930be7Sderaadt 				if ((xbp->flags & BUF_MOD) && __put_page(hashp,
260df930be7Sderaadt 				    xbp->page, xbp->addr, 0, 0))
261df930be7Sderaadt 					return (NULL);
262df930be7Sderaadt 				xbp->addr = 0;
263df930be7Sderaadt 				xbp->flags = 0;
264df930be7Sderaadt 				BUF_REMOVE(xbp);
265df930be7Sderaadt 				LRU_INSERT(xbp);
266df930be7Sderaadt 			}
267df930be7Sderaadt 		}
268df930be7Sderaadt 	}
269df930be7Sderaadt 
270df930be7Sderaadt 	/* Now assign this buffer */
271df930be7Sderaadt 	bp->addr = addr;
272df930be7Sderaadt #ifdef DEBUG1
273df930be7Sderaadt 	(void)fprintf(stderr, "NEWBUF1: %d->ovfl was %d is now %d\n",
274df930be7Sderaadt 	    bp->addr, (bp->ovfl ? bp->ovfl->addr : 0), 0);
275df930be7Sderaadt #endif
276df95a199Smillert 	bp->ovfl = NULL;
277df930be7Sderaadt 	if (prev_bp) {
278df930be7Sderaadt 		/*
279df930be7Sderaadt 		 * If prev_bp is set, this is an overflow page, hook it in to
280df930be7Sderaadt 		 * the buffer overflow links.
281df930be7Sderaadt 		 */
282df930be7Sderaadt #ifdef DEBUG1
283df930be7Sderaadt 		(void)fprintf(stderr, "NEWBUF2: %d->ovfl was %d is now %d\n",
28451c9e5abSmickey 		    prev_bp->addr, (prev_bp->ovfl ? prev_bp->ovfl->addr : 0),
285df930be7Sderaadt 		    (bp ? bp->addr : 0));
286df930be7Sderaadt #endif
287df95a199Smillert 		prev_bp->ovfl = bp;
288df930be7Sderaadt 		bp->flags = 0;
289df930be7Sderaadt 	} else
290df930be7Sderaadt 		bp->flags = BUF_BUCKET;
291df930be7Sderaadt 	MRU_INSERT(bp);
292df930be7Sderaadt 	return (bp);
293df930be7Sderaadt }
294df930be7Sderaadt 
295e20a56a5Sotto void
__buf_init(HTAB * hashp,int nbytes)296e20a56a5Sotto __buf_init(HTAB *hashp, int nbytes)
297df930be7Sderaadt {
298df930be7Sderaadt 	BUFHEAD *bfp;
299df930be7Sderaadt 	int npages;
300df930be7Sderaadt 
301df930be7Sderaadt 	bfp = &(hashp->bufhead);
302df930be7Sderaadt 	npages = (nbytes + hashp->BSIZE - 1) >> hashp->BSHIFT;
303*aea60beeSderaadt 	npages = MAXIMUM(npages, MIN_BUFFERS);
304df930be7Sderaadt 
305df930be7Sderaadt 	hashp->nbufs = npages;
306df930be7Sderaadt 	bfp->next = bfp;
307df930be7Sderaadt 	bfp->prev = bfp;
308df930be7Sderaadt 	/*
309df930be7Sderaadt 	 * This space is calloc'd so these are already null.
310df930be7Sderaadt 	 *
311df930be7Sderaadt 	 * bfp->ovfl = NULL;
312df930be7Sderaadt 	 * bfp->flags = 0;
313df930be7Sderaadt 	 * bfp->page = NULL;
314df930be7Sderaadt 	 * bfp->addr = 0;
315df930be7Sderaadt 	 */
316df930be7Sderaadt }
317df930be7Sderaadt 
318e20a56a5Sotto int
__buf_free(HTAB * hashp,int do_free,int to_disk)319e20a56a5Sotto __buf_free(HTAB *hashp, int do_free, int to_disk)
320df930be7Sderaadt {
321df930be7Sderaadt 	BUFHEAD *bp;
322df930be7Sderaadt 
323df930be7Sderaadt 	/* Need to make sure that buffer manager has been initialized */
324df930be7Sderaadt 	if (!LRU)
325df930be7Sderaadt 		return (0);
326df930be7Sderaadt 	for (bp = LRU; bp != &hashp->bufhead;) {
327df930be7Sderaadt 		/* Check that the buffer is valid */
328df930be7Sderaadt 		if (bp->addr || IS_BUCKET(bp->flags)) {
329df930be7Sderaadt 			if (to_disk && (bp->flags & BUF_MOD) &&
330df930be7Sderaadt 			    __put_page(hashp, bp->page,
331df930be7Sderaadt 			    bp->addr, IS_BUCKET(bp->flags), 0))
332df930be7Sderaadt 				return (-1);
333df930be7Sderaadt 		}
334df930be7Sderaadt 		/* Check if we are freeing stuff */
335df930be7Sderaadt 		if (do_free) {
3361f4695f0Sdownsj 			if (bp->page) {
3371f4695f0Sdownsj 				(void)memset(bp->page, 0, hashp->BSIZE);
338df930be7Sderaadt 				free(bp->page);
3391f4695f0Sdownsj 			}
340df930be7Sderaadt 			BUF_REMOVE(bp);
341df930be7Sderaadt 			free(bp);
342df930be7Sderaadt 			bp = LRU;
343df930be7Sderaadt 		} else
344df930be7Sderaadt 			bp = bp->prev;
345df930be7Sderaadt 	}
346df930be7Sderaadt 	return (0);
347df930be7Sderaadt }
348df930be7Sderaadt 
349e20a56a5Sotto void
__reclaim_buf(HTAB * hashp,BUFHEAD * bp)350e20a56a5Sotto __reclaim_buf(HTAB *hashp, BUFHEAD *bp)
351df930be7Sderaadt {
352df930be7Sderaadt 	bp->ovfl = 0;
353df930be7Sderaadt 	bp->addr = 0;
354df930be7Sderaadt 	bp->flags = 0;
355df930be7Sderaadt 	BUF_REMOVE(bp);
356df930be7Sderaadt 	LRU_INSERT(bp);
357df930be7Sderaadt }
358