xref: /onnv-gate/usr/src/lib/libumem/common/vmem_sbrk.c (revision 6812:febeba71273d)
10Sstevel@tonic-gate /*
20Sstevel@tonic-gate  * CDDL HEADER START
30Sstevel@tonic-gate  *
40Sstevel@tonic-gate  * The contents of this file are subject to the terms of the
51528Sjwadams  * Common Development and Distribution License (the "License").
61528Sjwadams  * You may not use this file except in compliance with the License.
70Sstevel@tonic-gate  *
80Sstevel@tonic-gate  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
90Sstevel@tonic-gate  * or http://www.opensolaris.org/os/licensing.
100Sstevel@tonic-gate  * See the License for the specific language governing permissions
110Sstevel@tonic-gate  * and limitations under the License.
120Sstevel@tonic-gate  *
130Sstevel@tonic-gate  * When distributing Covered Code, include this CDDL HEADER in each
140Sstevel@tonic-gate  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
150Sstevel@tonic-gate  * If applicable, add the following below this CDDL HEADER, with the
160Sstevel@tonic-gate  * fields enclosed by brackets "[]" replaced with your own identifying
170Sstevel@tonic-gate  * information: Portions Copyright [yyyy] [name of copyright owner]
180Sstevel@tonic-gate  *
190Sstevel@tonic-gate  * CDDL HEADER END
200Sstevel@tonic-gate  */
211219Sraf 
220Sstevel@tonic-gate /*
23*6812Sraf  * Copyright 2008 Sun Microsystems, Inc.  All rights reserved.
240Sstevel@tonic-gate  * Use is subject to license terms.
250Sstevel@tonic-gate  */
260Sstevel@tonic-gate 
270Sstevel@tonic-gate #pragma ident	"%Z%%M%	%I%	%E% SMI"
280Sstevel@tonic-gate 
/*
 * The structure of the sbrk backend:
 *
 * +-----------+
 * | sbrk_top  |
 * +-----------+
 *      | (vmem_sbrk_alloc(), vmem_free())
 *      |
 * +-----------+
 * | sbrk_heap |
 * +-----------+
 *   | | ... |  (vmem_alloc(), vmem_free())
 * <other arenas>
 *
 * The sbrk_top arena holds all controlled memory.  vmem_sbrk_alloc() handles
 * allocations from it, including growing the heap when we run low.
 *
 * Growing the heap is complicated by the fact that we have to extend the
 * sbrk_top arena (using _vmem_extend_alloc()), and that can fail.  Since
 * other threads may be actively allocating, we can't return the memory.
 *
 * Instead, we put it on a doubly-linked list, sbrk_fails, which we search
 * before calling sbrk().
 */
530Sstevel@tonic-gate 
540Sstevel@tonic-gate #include <errno.h>
550Sstevel@tonic-gate #include <limits.h>
560Sstevel@tonic-gate #include <sys/sysmacros.h>
570Sstevel@tonic-gate #include <sys/mman.h>
580Sstevel@tonic-gate #include <unistd.h>
590Sstevel@tonic-gate 
600Sstevel@tonic-gate #include "vmem_base.h"
610Sstevel@tonic-gate 
620Sstevel@tonic-gate #include "misc.h"
630Sstevel@tonic-gate 
640Sstevel@tonic-gate size_t vmem_sbrk_pagesize = 0; /* the preferred page size of the heap */
650Sstevel@tonic-gate 
661528Sjwadams #define	VMEM_SBRK_MINALLOC	(64 * 1024)
671528Sjwadams size_t vmem_sbrk_minalloc = VMEM_SBRK_MINALLOC; /* minimum allocation */
680Sstevel@tonic-gate 
690Sstevel@tonic-gate static size_t real_pagesize;
700Sstevel@tonic-gate static vmem_t *sbrk_heap;
710Sstevel@tonic-gate 
/*
 * Bookkeeping record for a buffer that could not be added to the arena.
 * The record is stored at the start of the buffer it describes, and is
 * linked onto the sbrk_fails list.
 */
typedef struct sbrk_fail {
	struct sbrk_fail *sf_next;	/* next record on the list */
	struct sbrk_fail *sf_prev;	/* previous record on the list */
	void *sf_base;			/* == the sbrk_fail's address */
	size_t sf_size;			/* the size of this buffer */
} sbrk_fail_t;
780Sstevel@tonic-gate 
790Sstevel@tonic-gate static sbrk_fail_t sbrk_fails = {
800Sstevel@tonic-gate 	&sbrk_fails,
810Sstevel@tonic-gate 	&sbrk_fails,
820Sstevel@tonic-gate 	NULL,
830Sstevel@tonic-gate 	0
840Sstevel@tonic-gate };
850Sstevel@tonic-gate 
860Sstevel@tonic-gate static mutex_t sbrk_faillock = DEFAULTMUTEX;
870Sstevel@tonic-gate 
880Sstevel@tonic-gate /*
890Sstevel@tonic-gate  * Try to extend src with [pos, pos + size).
900Sstevel@tonic-gate  *
910Sstevel@tonic-gate  * If it fails, add the block to the sbrk_fails list.
920Sstevel@tonic-gate  */
930Sstevel@tonic-gate static void *
vmem_sbrk_extend_alloc(vmem_t * src,void * pos,size_t size,size_t alloc,int vmflags)940Sstevel@tonic-gate vmem_sbrk_extend_alloc(vmem_t *src, void *pos, size_t size, size_t alloc,
950Sstevel@tonic-gate     int vmflags)
960Sstevel@tonic-gate {
970Sstevel@tonic-gate 	sbrk_fail_t *fnext, *fprev, *fp;
980Sstevel@tonic-gate 	void *ret;
990Sstevel@tonic-gate 
1000Sstevel@tonic-gate 	ret = _vmem_extend_alloc(src, pos, size, alloc, vmflags);
1010Sstevel@tonic-gate 	if (ret != NULL)
1020Sstevel@tonic-gate 		return (ret);
1030Sstevel@tonic-gate 
1040Sstevel@tonic-gate 	fp = (sbrk_fail_t *)pos;
1050Sstevel@tonic-gate 
1060Sstevel@tonic-gate 	ASSERT(sizeof (sbrk_fail_t) <= size);
1070Sstevel@tonic-gate 
1080Sstevel@tonic-gate 	fp->sf_base = pos;
1090Sstevel@tonic-gate 	fp->sf_size = size;
1100Sstevel@tonic-gate 
1110Sstevel@tonic-gate 	(void) mutex_lock(&sbrk_faillock);
1120Sstevel@tonic-gate 	fp->sf_next = fnext = &sbrk_fails;
1130Sstevel@tonic-gate 	fp->sf_prev = fprev = sbrk_fails.sf_prev;
1140Sstevel@tonic-gate 	fnext->sf_prev = fp;
1150Sstevel@tonic-gate 	fprev->sf_next = fp;
1160Sstevel@tonic-gate 	(void) mutex_unlock(&sbrk_faillock);
1170Sstevel@tonic-gate 
1180Sstevel@tonic-gate 	return (NULL);
1190Sstevel@tonic-gate }
1200Sstevel@tonic-gate 
1210Sstevel@tonic-gate /*
1220Sstevel@tonic-gate  * Try to add at least size bytes to src, using the sbrk_fails list
1230Sstevel@tonic-gate  */
1240Sstevel@tonic-gate static void *
vmem_sbrk_tryfail(vmem_t * src,size_t size,int vmflags)1250Sstevel@tonic-gate vmem_sbrk_tryfail(vmem_t *src, size_t size, int vmflags)
1260Sstevel@tonic-gate {
1270Sstevel@tonic-gate 	sbrk_fail_t *fp;
1280Sstevel@tonic-gate 
1290Sstevel@tonic-gate 	(void) mutex_lock(&sbrk_faillock);
1300Sstevel@tonic-gate 	for (fp = sbrk_fails.sf_next; fp != &sbrk_fails; fp = fp->sf_next) {
1310Sstevel@tonic-gate 		if (fp->sf_size >= size) {
1320Sstevel@tonic-gate 			fp->sf_next->sf_prev = fp->sf_prev;
1330Sstevel@tonic-gate 			fp->sf_prev->sf_next = fp->sf_next;
1340Sstevel@tonic-gate 			fp->sf_next = fp->sf_prev = NULL;
1350Sstevel@tonic-gate 			break;
1360Sstevel@tonic-gate 		}
1370Sstevel@tonic-gate 	}
1380Sstevel@tonic-gate 	(void) mutex_unlock(&sbrk_faillock);
1390Sstevel@tonic-gate 
1400Sstevel@tonic-gate 	if (fp != &sbrk_fails) {
1410Sstevel@tonic-gate 		ASSERT(fp->sf_base == (void *)fp);
1420Sstevel@tonic-gate 		return (vmem_sbrk_extend_alloc(src, fp, fp->sf_size, size,
1430Sstevel@tonic-gate 		    vmflags));
1440Sstevel@tonic-gate 	}
1450Sstevel@tonic-gate 	/*
1460Sstevel@tonic-gate 	 * nothing of the right size on the freelist
1470Sstevel@tonic-gate 	 */
1480Sstevel@tonic-gate 	return (NULL);
1490Sstevel@tonic-gate }
1500Sstevel@tonic-gate 
1510Sstevel@tonic-gate static void *
vmem_sbrk_alloc(vmem_t * src,size_t size,int vmflags)1520Sstevel@tonic-gate vmem_sbrk_alloc(vmem_t *src, size_t size, int vmflags)
1530Sstevel@tonic-gate {
1540Sstevel@tonic-gate 	extern void *_sbrk_grow_aligned(size_t min_size, size_t low_align,
1550Sstevel@tonic-gate 	    size_t high_align, size_t *actual_size);
1560Sstevel@tonic-gate 
1570Sstevel@tonic-gate 	void *ret;
1580Sstevel@tonic-gate 	void *buf;
1590Sstevel@tonic-gate 	size_t buf_size;
1600Sstevel@tonic-gate 
1610Sstevel@tonic-gate 	int old_errno = errno;
1620Sstevel@tonic-gate 
1630Sstevel@tonic-gate 	ret = vmem_alloc(src, size, VM_NOSLEEP);
1640Sstevel@tonic-gate 	if (ret != NULL) {
1650Sstevel@tonic-gate 		errno = old_errno;
1660Sstevel@tonic-gate 		return (ret);
1670Sstevel@tonic-gate 	}
1680Sstevel@tonic-gate 
1690Sstevel@tonic-gate 	/*
1700Sstevel@tonic-gate 	 * The allocation failed.  We need to grow the heap.
1710Sstevel@tonic-gate 	 *
1720Sstevel@tonic-gate 	 * First, try to use any buffers which failed earlier.
1730Sstevel@tonic-gate 	 */
1740Sstevel@tonic-gate 	if (sbrk_fails.sf_next != &sbrk_fails &&
1750Sstevel@tonic-gate 	    (ret = vmem_sbrk_tryfail(src, size, vmflags)) != NULL)
1760Sstevel@tonic-gate 		return (ret);
1770Sstevel@tonic-gate 
1781528Sjwadams 	buf_size = MAX(size, vmem_sbrk_minalloc);
1790Sstevel@tonic-gate 
1800Sstevel@tonic-gate 	/*
1810Sstevel@tonic-gate 	 * buf_size gets overwritten with the actual allocated size
1820Sstevel@tonic-gate 	 */
1830Sstevel@tonic-gate 	buf = _sbrk_grow_aligned(buf_size, real_pagesize, vmem_sbrk_pagesize,
1840Sstevel@tonic-gate 	    &buf_size);
1850Sstevel@tonic-gate 
1860Sstevel@tonic-gate 	if (buf != MAP_FAILED) {
1870Sstevel@tonic-gate 		ret = vmem_sbrk_extend_alloc(src, buf, buf_size, size, vmflags);
1880Sstevel@tonic-gate 		if (ret != NULL) {
1890Sstevel@tonic-gate 			errno = old_errno;
1900Sstevel@tonic-gate 			return (ret);
1910Sstevel@tonic-gate 		}
1920Sstevel@tonic-gate 	}
1930Sstevel@tonic-gate 
1940Sstevel@tonic-gate 	/*
1950Sstevel@tonic-gate 	 * Growing the heap failed. The vmem_alloc() above called umem_reap().
1960Sstevel@tonic-gate 	 */
1970Sstevel@tonic-gate 	ASSERT((vmflags & VM_NOSLEEP) == VM_NOSLEEP);
1980Sstevel@tonic-gate 
1990Sstevel@tonic-gate 	errno = old_errno;
2000Sstevel@tonic-gate 	return (NULL);
2010Sstevel@tonic-gate }
2020Sstevel@tonic-gate 
2030Sstevel@tonic-gate /*
2040Sstevel@tonic-gate  * fork1() support
2050Sstevel@tonic-gate  */
2060Sstevel@tonic-gate void
vmem_sbrk_lockup(void)2070Sstevel@tonic-gate vmem_sbrk_lockup(void)
2080Sstevel@tonic-gate {
2090Sstevel@tonic-gate 	(void) mutex_lock(&sbrk_faillock);
2100Sstevel@tonic-gate }
2110Sstevel@tonic-gate 
2120Sstevel@tonic-gate void
vmem_sbrk_release(void)2130Sstevel@tonic-gate vmem_sbrk_release(void)
2140Sstevel@tonic-gate {
2150Sstevel@tonic-gate 	(void) mutex_unlock(&sbrk_faillock);
2160Sstevel@tonic-gate }
2170Sstevel@tonic-gate 
2180Sstevel@tonic-gate vmem_t *
vmem_sbrk_arena(vmem_alloc_t ** a_out,vmem_free_t ** f_out)2190Sstevel@tonic-gate vmem_sbrk_arena(vmem_alloc_t **a_out, vmem_free_t **f_out)
2200Sstevel@tonic-gate {
2210Sstevel@tonic-gate 	if (sbrk_heap == NULL) {
2220Sstevel@tonic-gate 		size_t heap_size;
2230Sstevel@tonic-gate 
2240Sstevel@tonic-gate 		real_pagesize = sysconf(_SC_PAGESIZE);
2250Sstevel@tonic-gate 
2260Sstevel@tonic-gate 		heap_size = vmem_sbrk_pagesize;
2270Sstevel@tonic-gate 
2280Sstevel@tonic-gate 		if (issetugid()) {
2290Sstevel@tonic-gate 			heap_size = 0;
2300Sstevel@tonic-gate 		} else if (heap_size != 0 && !ISP2(heap_size)) {
2310Sstevel@tonic-gate 			heap_size = 0;
2320Sstevel@tonic-gate 			log_message("ignoring bad pagesize: 0x%p\n", heap_size);
2330Sstevel@tonic-gate 		}
2340Sstevel@tonic-gate 		if (heap_size <= real_pagesize) {
2350Sstevel@tonic-gate 			heap_size = real_pagesize;
2360Sstevel@tonic-gate 		} else {
2370Sstevel@tonic-gate 			struct memcntl_mha mha;
2380Sstevel@tonic-gate 			mha.mha_cmd = MHA_MAPSIZE_BSSBRK;
2390Sstevel@tonic-gate 			mha.mha_flags = 0;
2400Sstevel@tonic-gate 			mha.mha_pagesize = heap_size;
2410Sstevel@tonic-gate 
2420Sstevel@tonic-gate 			if (memcntl(NULL, 0, MC_HAT_ADVISE, (char *)&mha, 0, 0)
2430Sstevel@tonic-gate 			    == -1) {
2440Sstevel@tonic-gate 				log_message("unable to set MAPSIZE_BSSBRK to "
2450Sstevel@tonic-gate 				    "0x%p\n", heap_size);
2460Sstevel@tonic-gate 				heap_size = real_pagesize;
2470Sstevel@tonic-gate 			}
2480Sstevel@tonic-gate 		}
2490Sstevel@tonic-gate 		vmem_sbrk_pagesize = heap_size;
2500Sstevel@tonic-gate 
2511528Sjwadams 		/* validate vmem_sbrk_minalloc */
2521528Sjwadams 		if (vmem_sbrk_minalloc < VMEM_SBRK_MINALLOC)
2531528Sjwadams 			vmem_sbrk_minalloc = VMEM_SBRK_MINALLOC;
2541528Sjwadams 		vmem_sbrk_minalloc = P2ROUNDUP(vmem_sbrk_minalloc, heap_size);
2551528Sjwadams 
2560Sstevel@tonic-gate 		sbrk_heap = vmem_init("sbrk_top", real_pagesize,
2570Sstevel@tonic-gate 		    vmem_sbrk_alloc, vmem_free,
2580Sstevel@tonic-gate 		    "sbrk_heap", NULL, 0, real_pagesize,
2590Sstevel@tonic-gate 		    vmem_alloc, vmem_free);
2600Sstevel@tonic-gate 	}
2610Sstevel@tonic-gate 
2620Sstevel@tonic-gate 	if (a_out != NULL)
2630Sstevel@tonic-gate 		*a_out = vmem_alloc;
2640Sstevel@tonic-gate 	if (f_out != NULL)
2650Sstevel@tonic-gate 		*f_out = vmem_free;
2660Sstevel@tonic-gate 
2670Sstevel@tonic-gate 	return (sbrk_heap);
2680Sstevel@tonic-gate }
269