141490Smckusick /* 241490Smckusick * Copyright (c) 1988 University of Utah. 341490Smckusick * Copyright (c) 1990 The Regents of the University of California. 441490Smckusick * All rights reserved. 541490Smckusick * 641490Smckusick * This code is derived from software contributed to Berkeley by 741490Smckusick * the Systems Programming Group of the University of Utah Computer 841490Smckusick * Science Department. Originally from University of Wisconsin. 941490Smckusick * 1041490Smckusick * %sccs.include.redist.c% 1141490Smckusick * 1241490Smckusick * from: Utah $Hdr: uipc_shm.c 1.9 89/08/14$ 1341490Smckusick * 14*42964Smckusick * @(#)sysv_shm.c 7.6 (Berkeley) 06/07/90 1541490Smckusick */ 1641490Smckusick 1741490Smckusick /* 1841490Smckusick * System V shared memory routines. 1941490Smckusick */ 2041490Smckusick 2141490Smckusick #ifdef SYSVSHM 2241490Smckusick 2341490Smckusick #include "machine/pte.h" 2441490Smckusick 2541490Smckusick #include "param.h" 2641490Smckusick #include "systm.h" 2742961Smckusick #include "syscontext.h" 2841490Smckusick #include "kernel.h" 2941490Smckusick #include "proc.h" 3041490Smckusick #include "vm.h" 3141490Smckusick #include "shm.h" 3241490Smckusick #include "mapmem.h" 3341490Smckusick #include "malloc.h" 3441490Smckusick 3541490Smckusick #ifdef HPUXCOMPAT 3641490Smckusick #include "../hpux/hpux.h" 3741490Smckusick #endif 3841490Smckusick 3941490Smckusick int shmat(), shmctl(), shmdt(), shmget(); 4041490Smckusick int (*shmcalls[])() = { shmat, shmctl, shmdt, shmget }; 4141490Smckusick int shmtot = 0; 4241490Smckusick 4341490Smckusick int shmfork(), shmexit(); 4441490Smckusick struct mapmemops shmops = { shmfork, (int (*)())0, shmexit, shmexit }; 4541490Smckusick 4641490Smckusick shminit() 4741490Smckusick { 4841490Smckusick register int i; 4941490Smckusick 5041490Smckusick if (shminfo.shmmni > SHMMMNI) 5141490Smckusick shminfo.shmmni = SHMMMNI; 5241490Smckusick for (i = 0; i < shminfo.shmmni; i++) { 5341490Smckusick shmsegs[i].shm_perm.mode = 0; 5441490Smckusick shmsegs[i].shm_perm.seq = 0; 5541490Smckusick } 5641490Smckusick } 5741490Smckusick 5842961Smckusick /* 5942961Smckusick * Entry point for all SHM calls 6042961Smckusick */ 6142961Smckusick shmsys(p, uap, retval) 6242961Smckusick struct proc *p; 6342961Smckusick struct args { 6442961Smckusick int which; 6542961Smckusick } *uap; 6642961Smckusick int *retval; 6741490Smckusick { 6841490Smckusick 6942961Smckusick if (uap->which >= sizeof(shmcalls)/sizeof(shmcalls[0])) 7042961Smckusick RETURN (EINVAL); 7142961Smckusick RETURN ((*shmcalls[uap->which])(p, &uap[1], retval)); 7241490Smckusick } 7341490Smckusick 7442961Smckusick /* 7542961Smckusick * Get a shared memory segment 7642961Smckusick */ 7742961Smckusick shmget(p, uap, retval) 7842961Smckusick struct proc *p; 7942961Smckusick register struct args { 8041490Smckusick key_t key; 8141490Smckusick int size; 8241490Smckusick int shmflg; 8342961Smckusick } *uap; 8442961Smckusick int *retval; 8542961Smckusick { 8641490Smckusick register struct shmid_ds *shp; 8742961Smckusick register struct ucred *cred = u.u_cred; 8841490Smckusick register int i; 8942961Smckusick int error, size, rval = 0; 9041490Smckusick caddr_t kva; 9141490Smckusick 9241490Smckusick /* look up the specified shm_id */ 9341490Smckusick if (uap->key != IPC_PRIVATE) { 9441490Smckusick for (i = 0; i < shminfo.shmmni; i++) 9541490Smckusick if ((shmsegs[i].shm_perm.mode & SHM_ALLOC) && 9641490Smckusick shmsegs[i].shm_perm.key == uap->key) { 9741490Smckusick rval = i; 9841490Smckusick break; 9941490Smckusick } 10041490Smckusick } else 10141490Smckusick i = shminfo.shmmni; 10241490Smckusick 10341490Smckusick /* create a new shared segment if necessary */ 10441490Smckusick if (i == shminfo.shmmni) { 10542961Smckusick if ((uap->shmflg & IPC_CREAT) == 0) 10642961Smckusick return (ENOENT); 10742961Smckusick if (uap->size < shminfo.shmmin || uap->size > shminfo.shmmax) 10842961Smckusick return (EINVAL); 10941490Smckusick for (i = 0; i < shminfo.shmmni; i++) 11041490Smckusick if ((shmsegs[i].shm_perm.mode & SHM_ALLOC) == 0) { 11141490Smckusick rval = i; 11241490Smckusick break; 11341490Smckusick } 11442961Smckusick if (i == shminfo.shmmni) 11542961Smckusick return (ENOSPC); 11641490Smckusick size = clrnd(btoc(uap->size)); 11742961Smckusick if (shmtot + size > shminfo.shmall) 11842961Smckusick return (ENOMEM); 11941490Smckusick shp = &shmsegs[rval]; 12041490Smckusick /* 12141490Smckusick * We need to do a couple of things to ensure consistency 12241490Smckusick * in case we sleep in malloc(). We mark segment as 12341490Smckusick * allocated so that other shmgets() will not allocate it. 12441490Smckusick * We mark it as "destroyed" to insure that shmvalid() is 12541490Smckusick * false making most operations fail (XXX). We set the key, 12641490Smckusick * so that other shmget()s will fail. 12741490Smckusick */ 12841490Smckusick shp->shm_perm.mode = SHM_ALLOC | SHM_DEST; 12941490Smckusick shp->shm_perm.key = uap->key; 13041490Smckusick kva = (caddr_t) malloc((u_long)ctob(size), M_SHM, M_WAITOK); 13141490Smckusick if (kva == NULL) { 13241490Smckusick shp->shm_perm.mode = 0; 13342961Smckusick return (ENOMEM); 13441490Smckusick } 13541490Smckusick if (!claligned(kva)) 13641490Smckusick panic("shmget: non-aligned memory"); 13741490Smckusick bzero(kva, (u_int)ctob(size)); 13841490Smckusick shmtot += size; 13942961Smckusick shp->shm_perm.cuid = shp->shm_perm.uid = cred->cr_uid; 14042961Smckusick shp->shm_perm.cgid = shp->shm_perm.gid = cred->cr_gid; 14141490Smckusick shp->shm_perm.mode = SHM_ALLOC | (uap->shmflg&0777); 14241490Smckusick shp->shm_handle = (void *) kvtopte(kva); 14341490Smckusick shp->shm_segsz = uap->size; 14442922Smckusick shp->shm_cpid = p->p_pid; 14541490Smckusick shp->shm_lpid = shp->shm_nattch = 0; 14641490Smckusick shp->shm_atime = shp->shm_dtime = 0; 14741490Smckusick shp->shm_ctime = time.tv_sec; 14841490Smckusick } else { 14941490Smckusick shp = &shmsegs[rval]; 15041490Smckusick /* XXX: probably not the right thing to do */ 15142961Smckusick if (shp->shm_perm.mode & SHM_DEST) 15242961Smckusick return (EBUSY); 15342961Smckusick if (error = ipcaccess(cred, &shp->shm_perm, uap->shmflg&0777)) 15442961Smckusick return (error); 15542961Smckusick if (uap->size && uap->size > shp->shm_segsz) 15642961Smckusick return (EINVAL); 15742961Smckusick if ((uap->shmflg&IPC_CREAT) && (uap->shmflg&IPC_EXCL)) 15842961Smckusick return (EEXIST); 15941490Smckusick } 16042961Smckusick *retval = shp->shm_perm.seq * SHMMMNI + rval; 16141490Smckusick } 16241490Smckusick 16342961Smckusick /* 16442961Smckusick * Shared memory control 16542961Smckusick */ 16642961Smckusick /* ARGSUSED */ 16742961Smckusick shmctl(p, uap, retval) 16842961Smckusick struct proc *p; 16942961Smckusick register struct args { 17041490Smckusick int shmid; 17141490Smckusick int cmd; 17241490Smckusick caddr_t buf; 17342961Smckusick } *uap; 17442961Smckusick int *retval; 17542961Smckusick { 17641490Smckusick register struct shmid_ds *shp; 17742961Smckusick register struct ucred *cred = u.u_cred; 17841490Smckusick struct shmid_ds sbuf; 17942961Smckusick int error; 18041490Smckusick 18142961Smckusick if (error = shmvalid(uap->shmid)) 18242961Smckusick return (error); 18341490Smckusick shp = &shmsegs[uap->shmid % SHMMMNI]; 18441490Smckusick switch (uap->cmd) { 18541490Smckusick case IPC_STAT: 18642961Smckusick if (error = ipcaccess(cred, &shp->shm_perm, IPC_R)) 18742961Smckusick return (error); 18842961Smckusick return (copyout((caddr_t)shp, uap->buf, sizeof(*shp))); 18941490Smckusick 19041490Smckusick case IPC_SET: 19142961Smckusick if (cred->cr_uid && cred->cr_uid != shp->shm_perm.uid && 19242961Smckusick cred->cr_uid != shp->shm_perm.cuid) 19342961Smckusick return (EPERM); 19442961Smckusick if (error = copyin(uap->buf, (caddr_t)&sbuf, sizeof sbuf)) 19542961Smckusick return (error); 19642961Smckusick shp->shm_perm.uid = sbuf.shm_perm.uid; 19742961Smckusick shp->shm_perm.gid = sbuf.shm_perm.gid; 19842961Smckusick shp->shm_perm.mode = (shp->shm_perm.mode & ~0777) 19942961Smckusick | (sbuf.shm_perm.mode & 0777); 20042961Smckusick shp->shm_ctime = time.tv_sec; 20141490Smckusick break; 20241490Smckusick 20341490Smckusick case IPC_RMID: 20442961Smckusick if (cred->cr_uid && cred->cr_uid != shp->shm_perm.uid && 20542961Smckusick cred->cr_uid != shp->shm_perm.cuid) 20642961Smckusick return (EPERM); 20741490Smckusick /* set ctime? */ 20841490Smckusick shp->shm_perm.key = IPC_PRIVATE; 20941490Smckusick shp->shm_perm.mode |= SHM_DEST; 21041490Smckusick if (shp->shm_nattch <= 0) 21141490Smckusick shmfree(shp); 21241490Smckusick break; 21341490Smckusick 21441490Smckusick #ifdef HPUXCOMPAT 21541490Smckusick case SHM_LOCK: 21641490Smckusick case SHM_UNLOCK: 21741490Smckusick /* don't really do anything, but make them think we did */ 21842922Smckusick if ((p->p_flag & SHPUX) == 0) 21942961Smckusick return (EINVAL); 22042961Smckusick if (cred->cr_uid && cred->cr_uid != shp->shm_perm.uid && 22142961Smckusick cred->cr_uid != shp->shm_perm.cuid) 22242961Smckusick return (EPERM); 22341490Smckusick break; 22441490Smckusick #endif 22541490Smckusick 22641490Smckusick default: 22742961Smckusick return (EINVAL); 22841490Smckusick } 22942961Smckusick return (0); 23041490Smckusick } 23141490Smckusick 23242961Smckusick /* 23342961Smckusick * Attach to shared memory segment. 23442961Smckusick */ 23542961Smckusick shmat(p, uap, retval) 23642961Smckusick struct proc *p; 23742961Smckusick register struct args { 23841490Smckusick int shmid; 23941490Smckusick caddr_t shmaddr; 24041490Smckusick int shmflg; 24142961Smckusick } *uap; 24242961Smckusick int *retval; 24342961Smckusick { 24441490Smckusick register struct shmid_ds *shp; 24541490Smckusick register int size; 24641490Smckusick struct mapmem *mp; 24741490Smckusick caddr_t uva; 24842961Smckusick int error, error1, prot, shmmapin(); 24941490Smckusick 25042961Smckusick if (error = shmvalid(uap->shmid)) 25142961Smckusick return (error); 25241490Smckusick shp = &shmsegs[uap->shmid % SHMMMNI]; 25341490Smckusick if (shp->shm_handle == NULL) 25442349Smckusick panic("shmat NULL handle"); 25542961Smckusick if (error = ipcaccess(u.u_cred, &shp->shm_perm, 25641490Smckusick (uap->shmflg&SHM_RDONLY) ? IPC_R : IPC_R|IPC_W)) 25742961Smckusick return (error); 25841490Smckusick uva = uap->shmaddr; 25941490Smckusick if (uva && ((int)uva & (SHMLBA-1))) { 26041490Smckusick if (uap->shmflg & SHM_RND) 26141490Smckusick uva = (caddr_t) ((int)uva & ~(SHMLBA-1)); 26242961Smckusick else 26342961Smckusick return (EINVAL); 26441490Smckusick } 26541490Smckusick /* 26641490Smckusick * Make sure user doesn't use more than their fair share 26741490Smckusick */ 26841490Smckusick size = 0; 26941490Smckusick for (mp = u.u_mmap; mp; mp = mp->mm_next) 27041490Smckusick if (mp->mm_ops == &shmops) 27141490Smckusick size++; 27242961Smckusick if (size >= shminfo.shmseg) 27342961Smckusick return (EMFILE); 27441490Smckusick /* 27541490Smckusick * Allocate a mapped memory region descriptor and 27641490Smckusick * attempt to expand the user page table to allow for region 27741490Smckusick */ 27841490Smckusick prot = (uap->shmflg & SHM_RDONLY) ? MM_RO : MM_RW; 27941490Smckusick #if defined(hp300) 28041490Smckusick prot |= MM_CI; 28141490Smckusick #endif 28241490Smckusick size = ctob(clrnd(btoc(shp->shm_segsz))); 28342922Smckusick error = mmalloc(p, uap->shmid, &uva, (segsz_t)size, prot, &shmops, &mp); 28442961Smckusick if (error) 28542961Smckusick return (error); 28642961Smckusick if (error = mmmapin(p, mp, shmmapin)) { 28742961Smckusick if (error1 = mmfree(p, mp)) 28842961Smckusick return (error1); 28942961Smckusick return (error); 29042922Smckusick } 29141490Smckusick /* 29241490Smckusick * Fill in the remaining fields 29341490Smckusick */ 29442922Smckusick shp->shm_lpid = p->p_pid; 29541490Smckusick shp->shm_atime = time.tv_sec; 29641490Smckusick shp->shm_nattch++; 29742961Smckusick *retval = (int) uva; 29841490Smckusick } 29941490Smckusick 30042961Smckusick /* 30142961Smckusick * Detach from shared memory segment. 30242961Smckusick */ 30342961Smckusick /* ARGSUSED */ 30442961Smckusick shmdt(p, uap, retval) 30542961Smckusick struct proc *p; 30642961Smckusick struct args { 30742961Smckusick caddr_t shmaddr; 30842961Smckusick } *uap; 30942961Smckusick int *retval; 31041490Smckusick { 31141490Smckusick register struct mapmem *mp; 31241490Smckusick 31341490Smckusick for (mp = u.u_mmap; mp; mp = mp->mm_next) 31441490Smckusick if (mp->mm_ops == &shmops && mp->mm_uva == uap->shmaddr) 31541490Smckusick break; 31642961Smckusick if (mp == MMNIL) 31742961Smckusick return (EINVAL); 31842922Smckusick shmsegs[mp->mm_id % SHMMMNI].shm_lpid = p->p_pid; 31942961Smckusick return (shmufree(p, mp)); 32041490Smckusick } 32141490Smckusick 32241490Smckusick shmmapin(mp, off) 32341490Smckusick struct mapmem *mp; 32441490Smckusick { 32541490Smckusick register struct shmid_ds *shp; 32641490Smckusick 32741490Smckusick shp = &shmsegs[mp->mm_id % SHMMMNI]; 32841490Smckusick if (off >= ctob(clrnd(btoc(shp->shm_segsz)))) 32941490Smckusick return(-1); 33041490Smckusick return(((struct pte *)shp->shm_handle)[btop(off)].pg_pfnum); 33141490Smckusick } 33241490Smckusick 33341490Smckusick /* 33441490Smckusick * Increment attach count on fork 33541490Smckusick */ 336*42964Smckusick /* ARGSUSED */ 33741490Smckusick shmfork(mp, ischild) 33841490Smckusick register struct mapmem *mp; 33941490Smckusick { 34041490Smckusick if (!ischild) 34141490Smckusick shmsegs[mp->mm_id % SHMMMNI].shm_nattch++; 34241490Smckusick } 34341490Smckusick 34441490Smckusick /* 34541490Smckusick * Detach from shared memory segment on exit (or exec) 34641490Smckusick */ 347*42964Smckusick shmexit(p, mp) 348*42964Smckusick struct proc *p; 349*42964Smckusick struct mapmem *mp; 35041490Smckusick { 35142922Smckusick 35242961Smckusick return (shmufree(p, mp)); 35341490Smckusick } 35441490Smckusick 35541490Smckusick shmvalid(id) 35641490Smckusick register int id; 35741490Smckusick { 35841490Smckusick register struct shmid_ds *shp; 35941490Smckusick 36041490Smckusick if (id < 0 || (id % SHMMMNI) >= shminfo.shmmni) 36142961Smckusick return(EINVAL); 36241490Smckusick shp = &shmsegs[id % SHMMMNI]; 36341490Smckusick if (shp->shm_perm.seq == (id / SHMMMNI) && 36441490Smckusick (shp->shm_perm.mode & (SHM_ALLOC|SHM_DEST)) == SHM_ALLOC) 36542961Smckusick return(0); 36642961Smckusick return(EINVAL); 36741490Smckusick } 36841490Smckusick 36941490Smckusick /* 37041490Smckusick * Free user resources associated with a shared memory segment 37141490Smckusick */ 37242922Smckusick shmufree(p, mp) 37342922Smckusick struct proc *p; 37441490Smckusick struct mapmem *mp; 37541490Smckusick { 37641490Smckusick register struct shmid_ds *shp; 37742922Smckusick int error; 37841490Smckusick 37941490Smckusick shp = &shmsegs[mp->mm_id % SHMMMNI]; 38042922Smckusick mmmapout(p, mp); 38142922Smckusick error = mmfree(p, mp); 38241490Smckusick shp->shm_dtime = time.tv_sec; 38341490Smckusick if (--shp->shm_nattch <= 0 && (shp->shm_perm.mode & SHM_DEST)) 38441490Smckusick shmfree(shp); 38542922Smckusick return (error); 38641490Smckusick } 38741490Smckusick 38841490Smckusick /* 38941490Smckusick * Deallocate resources associated with a shared memory segment 39041490Smckusick */ 39141490Smckusick shmfree(shp) 39241490Smckusick register struct shmid_ds *shp; 39341490Smckusick { 39441490Smckusick caddr_t kva; 39541490Smckusick 39641490Smckusick if (shp->shm_handle == NULL) 39741490Smckusick panic("shmfree"); 39841490Smckusick kva = (caddr_t) ptetokv(shp->shm_handle); 39941490Smckusick free(kva, M_SHM); 40041490Smckusick shp->shm_handle = NULL; 40141490Smckusick shmtot -= clrnd(btoc(shp->shm_segsz)); 40241490Smckusick shp->shm_perm.mode = 0; 40341490Smckusick /* 40441490Smckusick * Increment the sequence number to ensure that outstanding 40541490Smckusick * shmids for this segment will be invalid in the event that 40641490Smckusick * the segment is reallocated. Note that shmids must be 40741490Smckusick * positive as decreed by SVID. 40841490Smckusick */ 40941490Smckusick shp->shm_perm.seq++; 41041490Smckusick if ((int)(shp->shm_perm.seq * SHMMMNI) < 0) 41141490Smckusick shp->shm_perm.seq = 0; 41241490Smckusick } 41341490Smckusick 41441490Smckusick /* 41541490Smckusick * XXX This routine would be common to all sysV style IPC 41641490Smckusick * (if the others were implemented). 41741490Smckusick */ 41842961Smckusick ipcaccess(ipc, mode, cred) 41941490Smckusick register struct ipc_perm *ipc; 42042961Smckusick int mode; 42142961Smckusick register struct ucred *cred; 42241490Smckusick { 42341490Smckusick register int m; 42441490Smckusick 42542961Smckusick if (cred->cr_uid == 0) 42641490Smckusick return(0); 42741490Smckusick /* 42841490Smckusick * Access check is based on only one of owner, group, public. 42941490Smckusick * If not owner, then check group. 43041490Smckusick * If not a member of the group, then check public access. 43141490Smckusick */ 43241490Smckusick mode &= 0700; 43341490Smckusick m = ipc->mode; 43442961Smckusick if (cred->cr_uid != ipc->uid && cred->cr_uid != ipc->cuid) { 43541490Smckusick m <<= 3; 43642961Smckusick if (!groupmember(ipc->gid, cred) && 43742961Smckusick !groupmember(ipc->cgid, cred)) 43841490Smckusick m <<= 3; 43941490Smckusick } 44041490Smckusick if ((mode&m) == mode) 44142961Smckusick return (0); 44242961Smckusick return (EACCES); 44341490Smckusick } 44441490Smckusick 44541490Smckusick #endif /* SYSVSHM */ 446