xref: /onnv-gate/usr/src/uts/common/vm/seg.h (revision 3247)
10Sstevel@tonic-gate /*
20Sstevel@tonic-gate  * CDDL HEADER START
30Sstevel@tonic-gate  *
40Sstevel@tonic-gate  * The contents of this file are subject to the terms of the
5*3247Sgjelinek  * Common Development and Distribution License (the "License").
6*3247Sgjelinek  * You may not use this file except in compliance with the License.
70Sstevel@tonic-gate  *
80Sstevel@tonic-gate  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
90Sstevel@tonic-gate  * or http://www.opensolaris.org/os/licensing.
100Sstevel@tonic-gate  * See the License for the specific language governing permissions
110Sstevel@tonic-gate  * and limitations under the License.
120Sstevel@tonic-gate  *
130Sstevel@tonic-gate  * When distributing Covered Code, include this CDDL HEADER in each
140Sstevel@tonic-gate  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
150Sstevel@tonic-gate  * If applicable, add the following below this CDDL HEADER, with the
160Sstevel@tonic-gate  * fields enclosed by brackets "[]" replaced with your own identifying
170Sstevel@tonic-gate  * information: Portions Copyright [yyyy] [name of copyright owner]
180Sstevel@tonic-gate  *
190Sstevel@tonic-gate  * CDDL HEADER END
200Sstevel@tonic-gate  */
210Sstevel@tonic-gate /*
22*3247Sgjelinek  * Copyright 2006 Sun Microsystems, Inc.  All rights reserved.
230Sstevel@tonic-gate  * Use is subject to license terms.
240Sstevel@tonic-gate  */
250Sstevel@tonic-gate 
260Sstevel@tonic-gate /*	Copyright (c) 1984, 1986, 1987, 1988, 1989 AT&T	*/
270Sstevel@tonic-gate /*	  All Rights Reserved  	*/
280Sstevel@tonic-gate 
290Sstevel@tonic-gate /*
300Sstevel@tonic-gate  * University Copyright- Copyright (c) 1982, 1986, 1988
310Sstevel@tonic-gate  * The Regents of the University of California
320Sstevel@tonic-gate  * All Rights Reserved
330Sstevel@tonic-gate  *
340Sstevel@tonic-gate  * University Acknowledgment- Portions of this document are derived from
350Sstevel@tonic-gate  * software developed by the University of California, Berkeley, and its
360Sstevel@tonic-gate  * contributors.
370Sstevel@tonic-gate  */
380Sstevel@tonic-gate 
390Sstevel@tonic-gate #ifndef	_VM_SEG_H
400Sstevel@tonic-gate #define	_VM_SEG_H
410Sstevel@tonic-gate 
420Sstevel@tonic-gate #pragma ident	"%Z%%M%	%I%	%E% SMI"
430Sstevel@tonic-gate 
440Sstevel@tonic-gate #include <sys/vnode.h>
450Sstevel@tonic-gate #include <sys/avl.h>
460Sstevel@tonic-gate #include <vm/seg_enum.h>
470Sstevel@tonic-gate #include <vm/faultcode.h>
480Sstevel@tonic-gate #include <vm/hat.h>
490Sstevel@tonic-gate 
500Sstevel@tonic-gate #ifdef	__cplusplus
510Sstevel@tonic-gate extern "C" {
520Sstevel@tonic-gate #endif
530Sstevel@tonic-gate 
540Sstevel@tonic-gate /*
550Sstevel@tonic-gate  * VM - Segments.
560Sstevel@tonic-gate  */
570Sstevel@tonic-gate 
580Sstevel@tonic-gate /*
590Sstevel@tonic-gate  * kstat statistics for segment advise
600Sstevel@tonic-gate  */
610Sstevel@tonic-gate typedef struct {
620Sstevel@tonic-gate 	kstat_named_t MADV_FREE_hit;
630Sstevel@tonic-gate 	kstat_named_t MADV_FREE_miss;
640Sstevel@tonic-gate } segadvstat_t;
650Sstevel@tonic-gate 
660Sstevel@tonic-gate /*
670Sstevel@tonic-gate  * memory object ids
680Sstevel@tonic-gate  */
690Sstevel@tonic-gate typedef struct memid { u_longlong_t val[2]; } memid_t;
700Sstevel@tonic-gate 
710Sstevel@tonic-gate /*
720Sstevel@tonic-gate  * An address space contains a set of segments, managed by drivers.
730Sstevel@tonic-gate  * Drivers support mapped devices, sharing, copy-on-write, etc.
740Sstevel@tonic-gate  *
750Sstevel@tonic-gate  * The seg structure contains a lock to prevent races, the base virtual
760Sstevel@tonic-gate  * address and size of the segment, a back pointer to the containing
770Sstevel@tonic-gate  * address space, pointers to maintain an AVL tree of segments in the
780Sstevel@tonic-gate  * same address space, and procedure and data hooks for the driver.
790Sstevel@tonic-gate  * The AVL tree of segments for the address space is sorted by
800Sstevel@tonic-gate  * ascending base addresses and overlapping segments are not allowed.
810Sstevel@tonic-gate  *
820Sstevel@tonic-gate  * After a segment is created, faults may occur on pages of the segment.
830Sstevel@tonic-gate  * When a fault occurs, the fault handling code must get the desired
840Sstevel@tonic-gate  * object and set up the hardware translation to the object.  For some
850Sstevel@tonic-gate  * objects, the fault handling code also implements copy-on-write.
860Sstevel@tonic-gate  *
870Sstevel@tonic-gate  * When the hat wants to unload a translation, it can call the unload
880Sstevel@tonic-gate  * routine which is responsible for processing reference and modify bits.
890Sstevel@tonic-gate  *
 * Each segment is protected by its containing address space lock.  To
910Sstevel@tonic-gate  * access any field in the segment structure, the "as" must be locked.
920Sstevel@tonic-gate  * If a segment field is to be modified, the address space lock must be
930Sstevel@tonic-gate  * write locked.
940Sstevel@tonic-gate  */
950Sstevel@tonic-gate 
960Sstevel@tonic-gate struct seg {
970Sstevel@tonic-gate 	caddr_t	s_base;			/* base virtual address */
980Sstevel@tonic-gate 	size_t	s_size;			/* size in bytes */
990Sstevel@tonic-gate 	uint_t	s_szc;			/* max page size code */
1000Sstevel@tonic-gate 	uint_t	s_flags;		/* flags for segment, see below */
1010Sstevel@tonic-gate 	struct	as *s_as;		/* containing address space */
1020Sstevel@tonic-gate 	avl_node_t s_tree;		/* AVL tree links to segs in this as */
1030Sstevel@tonic-gate 	struct	seg_ops *s_ops;		/* ops vector: see below */
1040Sstevel@tonic-gate 	void *s_data;			/* private data for instance */
1050Sstevel@tonic-gate };
1060Sstevel@tonic-gate 
/* s_flags bit: this seg should be purged in as_gap() */
#define	S_PURGE		(0x01)
1080Sstevel@tonic-gate 
1090Sstevel@tonic-gate struct	seg_ops {
1100Sstevel@tonic-gate 	int	(*dup)(struct seg *, struct seg *);
1110Sstevel@tonic-gate 	int	(*unmap)(struct seg *, caddr_t, size_t);
1120Sstevel@tonic-gate 	void	(*free)(struct seg *);
1130Sstevel@tonic-gate 	faultcode_t (*fault)(struct hat *, struct seg *, caddr_t, size_t,
1140Sstevel@tonic-gate 	    enum fault_type, enum seg_rw);
1150Sstevel@tonic-gate 	faultcode_t (*faulta)(struct seg *, caddr_t);
1160Sstevel@tonic-gate 	int	(*setprot)(struct seg *, caddr_t, size_t, uint_t);
1170Sstevel@tonic-gate 	int	(*checkprot)(struct seg *, caddr_t, size_t, uint_t);
1180Sstevel@tonic-gate 	int	(*kluster)(struct seg *, caddr_t, ssize_t);
1190Sstevel@tonic-gate 	size_t	(*swapout)(struct seg *);
1200Sstevel@tonic-gate 	int	(*sync)(struct seg *, caddr_t, size_t, int, uint_t);
1210Sstevel@tonic-gate 	size_t	(*incore)(struct seg *, caddr_t, size_t, char *);
1220Sstevel@tonic-gate 	int	(*lockop)(struct seg *, caddr_t, size_t, int, int, ulong_t *,
1230Sstevel@tonic-gate 			size_t);
1240Sstevel@tonic-gate 	int	(*getprot)(struct seg *, caddr_t, size_t, uint_t *);
1250Sstevel@tonic-gate 	u_offset_t	(*getoffset)(struct seg *, caddr_t);
1260Sstevel@tonic-gate 	int	(*gettype)(struct seg *, caddr_t);
1270Sstevel@tonic-gate 	int	(*getvp)(struct seg *, caddr_t, struct vnode **);
1280Sstevel@tonic-gate 	int	(*advise)(struct seg *, caddr_t, size_t, uint_t);
1290Sstevel@tonic-gate 	void	(*dump)(struct seg *);
1300Sstevel@tonic-gate 	int	(*pagelock)(struct seg *, caddr_t, size_t, struct page ***,
1310Sstevel@tonic-gate 			enum lock_type, enum seg_rw);
1320Sstevel@tonic-gate 	int	(*setpagesize)(struct seg *, caddr_t, size_t, uint_t);
1330Sstevel@tonic-gate 	int	(*getmemid)(struct seg *, caddr_t, memid_t *);
1340Sstevel@tonic-gate 	struct lgrp_mem_policy_info	*(*getpolicy)(struct seg *, caddr_t);
135670Selowe 	int	(*capable)(struct seg *, segcapability_t);
1360Sstevel@tonic-gate };
1370Sstevel@tonic-gate 
1380Sstevel@tonic-gate #ifdef _KERNEL
1390Sstevel@tonic-gate /*
1400Sstevel@tonic-gate  * Generic segment operations
1410Sstevel@tonic-gate  */
1420Sstevel@tonic-gate extern	void	seg_init(void);
1430Sstevel@tonic-gate extern	struct	seg *seg_alloc(struct as *as, caddr_t base, size_t size);
1440Sstevel@tonic-gate extern	int	seg_attach(struct as *as, caddr_t base, size_t size,
1450Sstevel@tonic-gate 			struct seg *seg);
1460Sstevel@tonic-gate extern	void	seg_unmap(struct seg *seg);
1470Sstevel@tonic-gate extern	void	seg_free(struct seg *seg);
1480Sstevel@tonic-gate 
1490Sstevel@tonic-gate /*
1500Sstevel@tonic-gate  * functions for pagelock cache support
1510Sstevel@tonic-gate  */
1520Sstevel@tonic-gate extern	void	seg_ppurge(struct seg *seg);
1530Sstevel@tonic-gate extern	void	seg_ppurge_seg(int (*callback)());
1540Sstevel@tonic-gate extern	void	seg_pinactive(struct seg *seg, caddr_t addr, size_t len,
1550Sstevel@tonic-gate 			struct page **pp, enum seg_rw rw, int (*callback)());
1560Sstevel@tonic-gate extern	int	seg_pinsert_check(struct seg *seg, size_t len, uint_t flags);
1570Sstevel@tonic-gate extern	int	seg_pinsert(struct seg *seg, caddr_t addr, size_t len,
1580Sstevel@tonic-gate 			struct page **pp, enum seg_rw rw, uint_t flags,
1590Sstevel@tonic-gate 			int (*callback)());
1600Sstevel@tonic-gate extern	struct	page **seg_plookup(struct seg *seg, caddr_t addr,
1610Sstevel@tonic-gate 			size_t len, enum seg_rw rw);
1620Sstevel@tonic-gate extern	void	seg_pasync_thread(void);
1630Sstevel@tonic-gate extern	void	seg_preap(void);
1640Sstevel@tonic-gate 
1650Sstevel@tonic-gate extern	int	seg_preapahead;
1660Sstevel@tonic-gate extern	segadvstat_t  segadvstat;
/*
 * Pagelock cache flag bits.
 */
#define	SEGP_ASYNC_FLUSH	0x1	/* async thread does the flush */
#define	SEGP_FORCE_WIRED	0x2	/* bypass the seg_pwindow check */
1720Sstevel@tonic-gate 
/*
 * Result codes returned by seg_pinsert() and seg_pinsert_check().
 */
#define	SEGP_SUCCESS		0	/* the insert succeeded */
#define	SEGP_FAIL		1	/* the insert failed */
1780Sstevel@tonic-gate 
/*
 * Per-page status bits for segop_incore.  Each constant is a distinct
 * single bit, so they can be OR-ed together.
 */
#define	SEG_PAGE_INCORE		0x01	/* a page backs this VA */
#define	SEG_PAGE_LOCKED		0x02	/* the page at this VA is locked */
#define	SEG_PAGE_HASCOW		0x04	/* the page has a copy-on-write */
#define	SEG_PAGE_SOFTLOCK	0x08	/* a softlock is held on the page */
#define	SEG_PAGE_VNODEBACKED	0x10	/* the segment is vnode backed */
#define	SEG_PAGE_ANON		0x20	/* the page is anonymous */
#define	SEG_PAGE_VNODE		0x40	/* the backing page is a vnode page */
1870Sstevel@tonic-gate 
/*
 * Dispatch wrappers for the seg_ops vector: SEGOP_X(seg, ...) calls
 * member x of (seg)->s_ops and hands the segment through to it.
 *
 * The seg argument appears twice in every expansion (once to reach the
 * ops vector, once as a call argument), so it must be an expression
 * without side effects.
 */
#define	SEGOP_DUP(seg, n) \
	(*(seg)->s_ops->dup)((seg), (n))
#define	SEGOP_UNMAP(seg, addr, len) \
	(*(seg)->s_ops->unmap)((seg), (addr), (len))
#define	SEGOP_FREE(seg) \
	(*(seg)->s_ops->free)((seg))
#define	SEGOP_FAULT(hat, seg, addr, len, t, rw) \
	(*(seg)->s_ops->fault)((hat), (seg), (addr), (len), (t), (rw))
#define	SEGOP_FAULTA(seg, addr) \
	(*(seg)->s_ops->faulta)((seg), (addr))
#define	SEGOP_SETPROT(seg, addr, len, p) \
	(*(seg)->s_ops->setprot)((seg), (addr), (len), (p))
#define	SEGOP_CHECKPROT(seg, addr, len, p) \
	(*(seg)->s_ops->checkprot)((seg), (addr), (len), (p))
#define	SEGOP_KLUSTER(seg, addr, d) \
	(*(seg)->s_ops->kluster)((seg), (addr), (d))
#define	SEGOP_SWAPOUT(seg) \
	(*(seg)->s_ops->swapout)((seg))
#define	SEGOP_SYNC(seg, addr, len, atr, f) \
	(*(seg)->s_ops->sync)((seg), (addr), (len), (atr), (f))
#define	SEGOP_INCORE(seg, addr, len, v) \
	(*(seg)->s_ops->incore)((seg), (addr), (len), (v))
#define	SEGOP_LOCKOP(seg, addr, len, atr, op, b, p) \
	(*(seg)->s_ops->lockop)((seg), (addr), (len), (atr), (op), (b), (p))
#define	SEGOP_GETPROT(seg, addr, len, p) \
	(*(seg)->s_ops->getprot)((seg), (addr), (len), (p))
#define	SEGOP_GETOFFSET(seg, addr) \
	(*(seg)->s_ops->getoffset)((seg), (addr))
#define	SEGOP_GETTYPE(seg, addr) \
	(*(seg)->s_ops->gettype)((seg), (addr))
#define	SEGOP_GETVP(seg, addr, vpp) \
	(*(seg)->s_ops->getvp)((seg), (addr), (vpp))
#define	SEGOP_ADVISE(seg, addr, len, b) \
	(*(seg)->s_ops->advise)((seg), (addr), (len), (b))
#define	SEGOP_DUMP(seg) \
	(*(seg)->s_ops->dump)((seg))
#define	SEGOP_PAGELOCK(seg, addr, len, p, t, rw) \
	(*(seg)->s_ops->pagelock)((seg), (addr), (len), (p), (t), (rw))
#define	SEGOP_SETPAGESIZE(seg, addr, len, szc) \
	(*(seg)->s_ops->setpagesize)((seg), (addr), (len), (szc))
#define	SEGOP_GETMEMID(seg, addr, mp) \
	(*(seg)->s_ops->getmemid)((seg), (addr), (mp))
#define	SEGOP_GETPOLICY(seg, addr) \
	(*(seg)->s_ops->getpolicy)((seg), (addr))
#define	SEGOP_CAPABLE(seg, c) \
	(*(seg)->s_ops->capable)((seg), (c))
2160Sstevel@tonic-gate 
/*
 * seg_page(seg, addr): byte offset of addr from the segment's s_base,
 * shifted right by PAGESHIFT.
 */
#define	seg_page(seg, addr)	\
	((uintptr_t)((addr) - (seg)->s_base) >> PAGESHIFT)

/*
 * seg_pages(seg): s_size plus PAGEOFFSET, shifted right by PAGESHIFT,
 * i.e. the segment size in pages with a partial last page rounded up.
 */
#define	seg_pages(seg)	\
	((uintptr_t)((seg)->s_size + PAGEOFFSET) >> PAGESHIFT)
2220Sstevel@tonic-gate 
/*
 * Error codes internal to the seg layer.
 *
 * The values are negative, so each replacement list is wrapped in
 * parentheses: the macro then always expands to a single primary
 * expression regardless of the operators that surround its use.
 */
#define	IE_NOMEM	(-1)	/* internal to seg layer */
#define	IE_RETRY	(-2)	/* internal to seg layer */
#define	IE_REATTACH	(-3)	/* internal to seg layer */
2260Sstevel@tonic-gate 
/* Delay/retry factor used by seg_p_mem_config_pre_del */
#define	SEGP_PREDEL_DELAY_FACTOR	4

/*
 * The pagelock cache cannot be purged during a DR delete memory
 * operation.  As a workaround the stall threshold is set to twice the
 * maximum that was seen during testing; the workaround is to be
 * removed once a suitable fix is found.
 *
 * SEGP_STALL_THRESHOLD is SEGP_STALL_SECONDS scaled by the delay
 * factor above.
 */
#define	SEGP_STALL_SECONDS		25
#define	SEGP_STALL_THRESHOLD		\
	(SEGP_STALL_SECONDS * SEGP_PREDEL_DELAY_FACTOR)
2390Sstevel@tonic-gate 
#ifdef VMDEBUG

/*
 * Function prototypes for the VMDEBUG build.
 *
 * seg_page() and seg_pages() are also defined as function-like macros
 * earlier in this header, unconditionally.  Written as
 * `uint_t seg_page(struct seg *, caddr_t);' the prototype would itself
 * be macro-expanded and fail to compile.  A function-like macro is only
 * expanded when its name is followed by `(', so the names are
 * parenthesized here to declare the real functions.
 *
 * NOTE(review): ordinary call sites still pick up the macros; a caller
 * that wants the out-of-line function must write (seg_page)(seg, addr)
 * or #undef the macro first.  The macros yield a uintptr_t while these
 * functions return uint_t.
 */
uint_t	(seg_page)(struct seg *, caddr_t);
uint_t	(seg_pages)(struct seg *);

#endif	/* VMDEBUG */
2460Sstevel@tonic-gate 
247*3247Sgjelinek boolean_t	seg_can_change_zones(struct seg *);
248*3247Sgjelinek size_t		seg_swresv(struct seg *);
249*3247Sgjelinek 
2500Sstevel@tonic-gate #endif	/* _KERNEL */
2510Sstevel@tonic-gate 
2520Sstevel@tonic-gate #ifdef	__cplusplus
2530Sstevel@tonic-gate }
2540Sstevel@tonic-gate #endif
2550Sstevel@tonic-gate 
2560Sstevel@tonic-gate #endif	/* _VM_SEG_H */
257