xref: /freebsd/sys/kern/sysv_shm.c (revision cb1f0db9dbf89ed25f16308c33a721e7ed6ba531)
1c3aac50fSPeter Wemm /* $FreeBSD$ */
23d903220SDoug Rabson /*	$NetBSD: sysv_shm.c,v 1.23 1994/07/04 23:25:12 glass Exp $	*/
33d903220SDoug Rabson 
43d903220SDoug Rabson /*
53d903220SDoug Rabson  * Copyright (c) 1994 Adam Glass and Charles Hannum.  All rights reserved.
63d903220SDoug Rabson  *
73d903220SDoug Rabson  * Redistribution and use in source and binary forms, with or without
83d903220SDoug Rabson  * modification, are permitted provided that the following conditions
93d903220SDoug Rabson  * are met:
103d903220SDoug Rabson  * 1. Redistributions of source code must retain the above copyright
113d903220SDoug Rabson  *    notice, this list of conditions and the following disclaimer.
123d903220SDoug Rabson  * 2. Redistributions in binary form must reproduce the above copyright
133d903220SDoug Rabson  *    notice, this list of conditions and the following disclaimer in the
143d903220SDoug Rabson  *    documentation and/or other materials provided with the distribution.
153d903220SDoug Rabson  * 3. All advertising materials mentioning features or use of this software
163d903220SDoug Rabson  *    must display the following acknowledgement:
173d903220SDoug Rabson  *	This product includes software developed by Adam Glass and Charles
183d903220SDoug Rabson  *	Hannum.
193d903220SDoug Rabson  * 4. The names of the authors may not be used to endorse or promote products
203d903220SDoug Rabson  *    derived from this software without specific prior written permission.
213d903220SDoug Rabson  *
223d903220SDoug Rabson  * THIS SOFTWARE IS PROVIDED BY THE AUTHORS ``AS IS'' AND ANY EXPRESS OR
233d903220SDoug Rabson  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
243d903220SDoug Rabson  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
253d903220SDoug Rabson  * IN NO EVENT SHALL THE AUTHORS BE LIABLE FOR ANY DIRECT, INDIRECT,
263d903220SDoug Rabson  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
273d903220SDoug Rabson  * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
283d903220SDoug Rabson  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
293d903220SDoug Rabson  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
303d903220SDoug Rabson  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
313d903220SDoug Rabson  * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
323d903220SDoug Rabson  */
333d903220SDoug Rabson 
345591b823SEivind Eklund #include "opt_compat.h"
35e9822d92SJoerg Wunsch #include "opt_rlimit.h"
36255108f3SPeter Wemm #include "opt_sysvipc.h"
37511b67b7SGarrett Wollman 
383d903220SDoug Rabson #include <sys/param.h>
39725db531SBruce Evans #include <sys/systm.h>
40725db531SBruce Evans #include <sys/sysproto.h>
413d903220SDoug Rabson #include <sys/kernel.h>
42255108f3SPeter Wemm #include <sys/sysctl.h>
433d903220SDoug Rabson #include <sys/shm.h>
443d903220SDoug Rabson #include <sys/proc.h>
453d903220SDoug Rabson #include <sys/malloc.h>
463d903220SDoug Rabson #include <sys/mman.h>
473d903220SDoug Rabson #include <sys/stat.h>
48725db531SBruce Evans #include <sys/sysent.h>
49cb1f0db9SRobert Watson #include <sys/jail.h>
503d903220SDoug Rabson 
513d903220SDoug Rabson #include <vm/vm.h>
52efeaf95aSDavid Greenman #include <vm/vm_param.h>
53996c772fSJohn Dyson #include <sys/lock.h>
54efeaf95aSDavid Greenman #include <vm/pmap.h>
55a51f7119SJohn Dyson #include <vm/vm_object.h>
563d903220SDoug Rabson #include <vm/vm_map.h>
571c7c3c6aSMatthew Dillon #include <vm/vm_page.h>
58ae9b8c3aSJohn Dyson #include <vm/vm_pager.h>
593d903220SDoug Rabson 
60a1c995b6SPoul-Henning Kamp static MALLOC_DEFINE(M_SHM, "shm", "SVID compatible shared memory segments");
6155166637SPoul-Henning Kamp 
62725db531SBruce Evans struct oshmctl_args;
63cb226aaaSPoul-Henning Kamp static int oshmctl __P((struct proc *p, struct oshmctl_args *uap));
64255108f3SPeter Wemm 
65cb226aaaSPoul-Henning Kamp static int shmget_allocate_segment __P((struct proc *p, struct shmget_args *uap, int mode));
66cb226aaaSPoul-Henning Kamp static int shmget_existing __P((struct proc *p, struct shmget_args *uap, int mode, int segnum));
67725db531SBruce Evans 
68725db531SBruce Evans /* XXX casting to (sy_call_t *) is bogus, as usual. */
69303b270bSEivind Eklund static sy_call_t *shmcalls[] = {
70725db531SBruce Evans 	(sy_call_t *)shmat, (sy_call_t *)oshmctl,
71725db531SBruce Evans 	(sy_call_t *)shmdt, (sy_call_t *)shmget,
72725db531SBruce Evans 	(sy_call_t *)shmctl
73725db531SBruce Evans };
743d903220SDoug Rabson 
753d903220SDoug Rabson #define	SHMSEG_FREE     	0x0200
763d903220SDoug Rabson #define	SHMSEG_REMOVED  	0x0400
773d903220SDoug Rabson #define	SHMSEG_ALLOCATED	0x0800
783d903220SDoug Rabson #define	SHMSEG_WANTED		0x1000
793d903220SDoug Rabson 
80255108f3SPeter Wemm static int shm_last_free, shm_nused, shm_committed, shmalloced;
81255108f3SPeter Wemm static struct shmid_ds	*shmsegs;
823d903220SDoug Rabson 
833d903220SDoug Rabson struct shm_handle {
84a51f7119SJohn Dyson 	/* vm_offset_t kva; */
85a51f7119SJohn Dyson 	vm_object_t shm_object;
863d903220SDoug Rabson };
873d903220SDoug Rabson 
883d903220SDoug Rabson struct shmmap_state {
893d903220SDoug Rabson 	vm_offset_t va;
903d903220SDoug Rabson 	int shmid;
913d903220SDoug Rabson };
923d903220SDoug Rabson 
933d903220SDoug Rabson static void shm_deallocate_segment __P((struct shmid_ds *));
943d903220SDoug Rabson static int shm_find_segment_by_key __P((key_t));
953d903220SDoug Rabson static struct shmid_ds *shm_find_segment_by_shmid __P((int));
963d903220SDoug Rabson static int shm_delete_mapping __P((struct proc *, struct shmmap_state *));
97255108f3SPeter Wemm static void shmrealloc __P((void));
98255108f3SPeter Wemm static void shminit __P((void *));
99255108f3SPeter Wemm 
100255108f3SPeter Wemm /*
101255108f3SPeter Wemm  * Tuneable values
102255108f3SPeter Wemm  */
103255108f3SPeter Wemm #ifndef SHMMAXPGS
104255108f3SPeter Wemm #define	SHMMAXPGS	1024	/* XXX increase this, it's not in kva! */
105255108f3SPeter Wemm #endif
106255108f3SPeter Wemm #ifndef SHMMAX
107255108f3SPeter Wemm #define	SHMMAX	(SHMMAXPGS*PAGE_SIZE)
108255108f3SPeter Wemm #endif
109255108f3SPeter Wemm #ifndef SHMMIN
110255108f3SPeter Wemm #define	SHMMIN	1
111255108f3SPeter Wemm #endif
112255108f3SPeter Wemm #ifndef SHMMNI
113255108f3SPeter Wemm #define	SHMMNI	96
114255108f3SPeter Wemm #endif
115255108f3SPeter Wemm #ifndef SHMSEG
116255108f3SPeter Wemm #define	SHMSEG	64
117255108f3SPeter Wemm #endif
118255108f3SPeter Wemm #ifndef SHMALL
119255108f3SPeter Wemm #define	SHMALL	(SHMMAXPGS)
120255108f3SPeter Wemm #endif
121255108f3SPeter Wemm 
122255108f3SPeter Wemm struct	shminfo shminfo = {
123255108f3SPeter Wemm 	SHMMAX,
124255108f3SPeter Wemm 	SHMMIN,
125255108f3SPeter Wemm 	SHMMNI,
126255108f3SPeter Wemm 	SHMSEG,
127255108f3SPeter Wemm 	SHMALL
128255108f3SPeter Wemm };
129255108f3SPeter Wemm 
1308b03c8edSMatthew Dillon static int shm_use_phys;
1318b03c8edSMatthew Dillon 
132255108f3SPeter Wemm SYSCTL_DECL(_kern_ipc);
133255108f3SPeter Wemm SYSCTL_INT(_kern_ipc, OID_AUTO, shmmax, CTLFLAG_RW, &shminfo.shmmax, 0, "");
134255108f3SPeter Wemm SYSCTL_INT(_kern_ipc, OID_AUTO, shmmin, CTLFLAG_RW, &shminfo.shmmin, 0, "");
135255108f3SPeter Wemm SYSCTL_INT(_kern_ipc, OID_AUTO, shmmni, CTLFLAG_RD, &shminfo.shmmni, 0, "");
136255108f3SPeter Wemm SYSCTL_INT(_kern_ipc, OID_AUTO, shmseg, CTLFLAG_RW, &shminfo.shmseg, 0, "");
137255108f3SPeter Wemm SYSCTL_INT(_kern_ipc, OID_AUTO, shmall, CTLFLAG_RW, &shminfo.shmall, 0, "");
1388b03c8edSMatthew Dillon SYSCTL_INT(_kern_ipc, OID_AUTO, shm_use_phys, CTLFLAG_RW, &shm_use_phys, 0, "");
1393d903220SDoug Rabson 
1403d903220SDoug Rabson static int
1413d903220SDoug Rabson shm_find_segment_by_key(key)
1423d903220SDoug Rabson 	key_t key;
1433d903220SDoug Rabson {
1443d903220SDoug Rabson 	int i;
1453d903220SDoug Rabson 
146255108f3SPeter Wemm 	for (i = 0; i < shmalloced; i++)
1473d903220SDoug Rabson 		if ((shmsegs[i].shm_perm.mode & SHMSEG_ALLOCATED) &&
1483d903220SDoug Rabson 		    shmsegs[i].shm_perm.key == key)
1493d903220SDoug Rabson 			return i;
1503d903220SDoug Rabson 	return -1;
1513d903220SDoug Rabson }
1523d903220SDoug Rabson 
1533d903220SDoug Rabson static struct shmid_ds *
1543d903220SDoug Rabson shm_find_segment_by_shmid(shmid)
1553d903220SDoug Rabson 	int shmid;
1563d903220SDoug Rabson {
1573d903220SDoug Rabson 	int segnum;
1583d903220SDoug Rabson 	struct shmid_ds *shmseg;
1593d903220SDoug Rabson 
1603d903220SDoug Rabson 	segnum = IPCID_TO_IX(shmid);
161255108f3SPeter Wemm 	if (segnum < 0 || segnum >= shmalloced)
1623d903220SDoug Rabson 		return NULL;
1633d903220SDoug Rabson 	shmseg = &shmsegs[segnum];
1643d903220SDoug Rabson 	if ((shmseg->shm_perm.mode & (SHMSEG_ALLOCATED | SHMSEG_REMOVED))
1653d903220SDoug Rabson 	    != SHMSEG_ALLOCATED ||
1663d903220SDoug Rabson 	    shmseg->shm_perm.seq != IPCID_TO_SEQ(shmid))
1673d903220SDoug Rabson 		return NULL;
1683d903220SDoug Rabson 	return shmseg;
1693d903220SDoug Rabson }
1703d903220SDoug Rabson 
1713d903220SDoug Rabson static void
1723d903220SDoug Rabson shm_deallocate_segment(shmseg)
1733d903220SDoug Rabson 	struct shmid_ds *shmseg;
1743d903220SDoug Rabson {
1753d903220SDoug Rabson 	struct shm_handle *shm_handle;
1763d903220SDoug Rabson 	size_t size;
1773d903220SDoug Rabson 
1783d903220SDoug Rabson 	shm_handle = shmseg->shm_internal;
179a51f7119SJohn Dyson 	vm_object_deallocate(shm_handle->shm_object);
1803d903220SDoug Rabson 	free((caddr_t)shm_handle, M_SHM);
1813d903220SDoug Rabson 	shmseg->shm_internal = NULL;
182a51f7119SJohn Dyson 	size = round_page(shmseg->shm_segsz);
1833d903220SDoug Rabson 	shm_committed -= btoc(size);
1843d903220SDoug Rabson 	shm_nused--;
1853d903220SDoug Rabson 	shmseg->shm_perm.mode = SHMSEG_FREE;
1863d903220SDoug Rabson }
1873d903220SDoug Rabson 
1883d903220SDoug Rabson static int
1893d903220SDoug Rabson shm_delete_mapping(p, shmmap_s)
1903d903220SDoug Rabson 	struct proc *p;
1913d903220SDoug Rabson 	struct shmmap_state *shmmap_s;
1923d903220SDoug Rabson {
1933d903220SDoug Rabson 	struct shmid_ds *shmseg;
1943d903220SDoug Rabson 	int segnum, result;
1953d903220SDoug Rabson 	size_t size;
1963d903220SDoug Rabson 
1973d903220SDoug Rabson 	segnum = IPCID_TO_IX(shmmap_s->shmid);
1983d903220SDoug Rabson 	shmseg = &shmsegs[segnum];
199aa8de40aSPoul-Henning Kamp 	size = round_page(shmseg->shm_segsz);
20068940ac1SDavid Greenman 	result = vm_map_remove(&p->p_vmspace->vm_map, shmmap_s->va, shmmap_s->va + size);
2013d903220SDoug Rabson 	if (result != KERN_SUCCESS)
2023d903220SDoug Rabson 		return EINVAL;
2033d903220SDoug Rabson 	shmmap_s->shmid = -1;
204227ee8a1SPoul-Henning Kamp 	shmseg->shm_dtime = time_second;
2053d903220SDoug Rabson 	if ((--shmseg->shm_nattch <= 0) &&
2063d903220SDoug Rabson 	    (shmseg->shm_perm.mode & SHMSEG_REMOVED)) {
2073d903220SDoug Rabson 		shm_deallocate_segment(shmseg);
2083d903220SDoug Rabson 		shm_last_free = segnum;
2093d903220SDoug Rabson 	}
2103d903220SDoug Rabson 	return 0;
2113d903220SDoug Rabson }
2123d903220SDoug Rabson 
213b5d5c0c9SPeter Wemm #ifndef _SYS_SYSPROTO_H_
2143d903220SDoug Rabson struct shmdt_args {
2153d903220SDoug Rabson 	void *shmaddr;
2163d903220SDoug Rabson };
217b5d5c0c9SPeter Wemm #endif
218b5d5c0c9SPeter Wemm 
2193d903220SDoug Rabson int
220cb226aaaSPoul-Henning Kamp shmdt(p, uap)
2213d903220SDoug Rabson 	struct proc *p;
2223d903220SDoug Rabson 	struct shmdt_args *uap;
2233d903220SDoug Rabson {
2243d903220SDoug Rabson 	struct shmmap_state *shmmap_s;
2253d903220SDoug Rabson 	int i;
2263d903220SDoug Rabson 
227cb1f0db9SRobert Watson 	if (!jail_sysvipc_allowed && p->p_prison != NULL)
228cb1f0db9SRobert Watson 		return (ENOSYS);
229cb1f0db9SRobert Watson 
2303d903220SDoug Rabson 	shmmap_s = (struct shmmap_state *)p->p_vmspace->vm_shm;
231f205c887SJordan K. Hubbard  	if (shmmap_s == NULL)
232f205c887SJordan K. Hubbard  	    return EINVAL;
2333d903220SDoug Rabson 	for (i = 0; i < shminfo.shmseg; i++, shmmap_s++)
2343d903220SDoug Rabson 		if (shmmap_s->shmid != -1 &&
2353d903220SDoug Rabson 		    shmmap_s->va == (vm_offset_t)uap->shmaddr)
2363d903220SDoug Rabson 			break;
2373d903220SDoug Rabson 	if (i == shminfo.shmseg)
2383d903220SDoug Rabson 		return EINVAL;
2393d903220SDoug Rabson 	return shm_delete_mapping(p, shmmap_s);
2403d903220SDoug Rabson }
2413d903220SDoug Rabson 
242b5d5c0c9SPeter Wemm #ifndef _SYS_SYSPROTO_H_
2433d903220SDoug Rabson struct shmat_args {
2443d903220SDoug Rabson 	int shmid;
2453d903220SDoug Rabson 	void *shmaddr;
2463d903220SDoug Rabson 	int shmflg;
2473d903220SDoug Rabson };
248b5d5c0c9SPeter Wemm #endif
249b5d5c0c9SPeter Wemm 
2503d903220SDoug Rabson int
251cb226aaaSPoul-Henning Kamp shmat(p, uap)
2523d903220SDoug Rabson 	struct proc *p;
2533d903220SDoug Rabson 	struct shmat_args *uap;
2543d903220SDoug Rabson {
2553d903220SDoug Rabson 	int error, i, flags;
2563d903220SDoug Rabson 	struct shmid_ds *shmseg;
2573d903220SDoug Rabson 	struct shmmap_state *shmmap_s = NULL;
258a51f7119SJohn Dyson 	struct shm_handle *shm_handle;
2593d903220SDoug Rabson 	vm_offset_t attach_va;
2603d903220SDoug Rabson 	vm_prot_t prot;
2613d903220SDoug Rabson 	vm_size_t size;
262a51f7119SJohn Dyson 	int rv;
2633d903220SDoug Rabson 
264cb1f0db9SRobert Watson 	if (!jail_sysvipc_allowed && p->p_prison != NULL)
265cb1f0db9SRobert Watson 		return (ENOSYS);
266cb1f0db9SRobert Watson 
2673d903220SDoug Rabson 	shmmap_s = (struct shmmap_state *)p->p_vmspace->vm_shm;
2683d903220SDoug Rabson 	if (shmmap_s == NULL) {
2693d903220SDoug Rabson 		size = shminfo.shmseg * sizeof(struct shmmap_state);
2703d903220SDoug Rabson 		shmmap_s = malloc(size, M_SHM, M_WAITOK);
2713d903220SDoug Rabson 		for (i = 0; i < shminfo.shmseg; i++)
2723d903220SDoug Rabson 			shmmap_s[i].shmid = -1;
2733d903220SDoug Rabson 		p->p_vmspace->vm_shm = (caddr_t)shmmap_s;
2743d903220SDoug Rabson 	}
2753d903220SDoug Rabson 	shmseg = shm_find_segment_by_shmid(uap->shmid);
2763d903220SDoug Rabson 	if (shmseg == NULL)
2773d903220SDoug Rabson 		return EINVAL;
2781c308b81SPoul-Henning Kamp 	error = ipcperm(p, &shmseg->shm_perm,
279797f2d22SPoul-Henning Kamp 	    (uap->shmflg & SHM_RDONLY) ? IPC_R : IPC_R|IPC_W);
280797f2d22SPoul-Henning Kamp 	if (error)
2813d903220SDoug Rabson 		return error;
2823d903220SDoug Rabson 	for (i = 0; i < shminfo.shmseg; i++) {
2833d903220SDoug Rabson 		if (shmmap_s->shmid == -1)
2843d903220SDoug Rabson 			break;
2853d903220SDoug Rabson 		shmmap_s++;
2863d903220SDoug Rabson 	}
2873d903220SDoug Rabson 	if (i >= shminfo.shmseg)
2883d903220SDoug Rabson 		return EMFILE;
289aa8de40aSPoul-Henning Kamp 	size = round_page(shmseg->shm_segsz);
290af25d10cSAlan Cox #ifdef VM_PROT_READ_IS_EXEC
291af25d10cSAlan Cox 	prot = VM_PROT_READ | VM_PROT_EXECUTE;
292af25d10cSAlan Cox #else
2933d903220SDoug Rabson 	prot = VM_PROT_READ;
294af25d10cSAlan Cox #endif
2953d903220SDoug Rabson 	if ((uap->shmflg & SHM_RDONLY) == 0)
2963d903220SDoug Rabson 		prot |= VM_PROT_WRITE;
2973d903220SDoug Rabson 	flags = MAP_ANON | MAP_SHARED;
2983d903220SDoug Rabson 	if (uap->shmaddr) {
2993d903220SDoug Rabson 		flags |= MAP_FIXED;
3003d903220SDoug Rabson 		if (uap->shmflg & SHM_RND)
3013d903220SDoug Rabson 			attach_va = (vm_offset_t)uap->shmaddr & ~(SHMLBA-1);
3023d903220SDoug Rabson 		else if (((vm_offset_t)uap->shmaddr & (SHMLBA-1)) == 0)
3033d903220SDoug Rabson 			attach_va = (vm_offset_t)uap->shmaddr;
3043d903220SDoug Rabson 		else
3053d903220SDoug Rabson 			return EINVAL;
3063d903220SDoug Rabson 	} else {
307a51f7119SJohn Dyson 		/* This is just a hint to vm_map_find() about where to put it. */
3086cde7a16SDavid Greenman 		attach_va = round_page((vm_offset_t)p->p_vmspace->vm_taddr + MAXTSIZ + MAXDSIZ);
3093d903220SDoug Rabson 	}
310a51f7119SJohn Dyson 
311a51f7119SJohn Dyson 	shm_handle = shmseg->shm_internal;
312a51f7119SJohn Dyson 	vm_object_reference(shm_handle->shm_object);
313a51f7119SJohn Dyson 	rv = vm_map_find(&p->p_vmspace->vm_map, shm_handle->shm_object,
314a51f7119SJohn Dyson 		0, &attach_va, size, (flags & MAP_FIXED)?0:1, prot, prot, 0);
315a51f7119SJohn Dyson 	if (rv != KERN_SUCCESS) {
316a51f7119SJohn Dyson 		return ENOMEM;
317a51f7119SJohn Dyson 	}
3180463028cSJohn Dyson 	vm_map_inherit(&p->p_vmspace->vm_map,
3190463028cSJohn Dyson 		attach_va, attach_va + size, VM_INHERIT_SHARE);
3200463028cSJohn Dyson 
3213d903220SDoug Rabson 	shmmap_s->va = attach_va;
3223d903220SDoug Rabson 	shmmap_s->shmid = uap->shmid;
3233d903220SDoug Rabson 	shmseg->shm_lpid = p->p_pid;
324227ee8a1SPoul-Henning Kamp 	shmseg->shm_atime = time_second;
3253d903220SDoug Rabson 	shmseg->shm_nattch++;
326cb226aaaSPoul-Henning Kamp 	p->p_retval[0] = attach_va;
3273d903220SDoug Rabson 	return 0;
3283d903220SDoug Rabson }
3293d903220SDoug Rabson 
3308bec0921SDoug Rabson struct oshmid_ds {
3318bec0921SDoug Rabson 	struct	ipc_perm shm_perm;	/* operation perms */
3328bec0921SDoug Rabson 	int	shm_segsz;		/* size of segment (bytes) */
3338bec0921SDoug Rabson 	ushort	shm_cpid;		/* pid, creator */
3348bec0921SDoug Rabson 	ushort	shm_lpid;		/* pid, last operation */
3358bec0921SDoug Rabson 	short	shm_nattch;		/* no. of current attaches */
3368bec0921SDoug Rabson 	time_t	shm_atime;		/* last attach time */
3378bec0921SDoug Rabson 	time_t	shm_dtime;		/* last detach time */
3388bec0921SDoug Rabson 	time_t	shm_ctime;		/* last change time */
3398bec0921SDoug Rabson 	void	*shm_handle;		/* internal handle for shm segment */
3408bec0921SDoug Rabson };
3418bec0921SDoug Rabson 
3428bec0921SDoug Rabson struct oshmctl_args {
3438bec0921SDoug Rabson 	int shmid;
3448bec0921SDoug Rabson 	int cmd;
3458bec0921SDoug Rabson 	struct oshmid_ds *ubuf;
3468bec0921SDoug Rabson };
3478bec0921SDoug Rabson 
34887b6de2bSPoul-Henning Kamp static int
349cb226aaaSPoul-Henning Kamp oshmctl(p, uap)
3508bec0921SDoug Rabson 	struct proc *p;
3518bec0921SDoug Rabson 	struct oshmctl_args *uap;
3528bec0921SDoug Rabson {
3538bec0921SDoug Rabson #ifdef COMPAT_43
354797f2d22SPoul-Henning Kamp 	int error;
3558bec0921SDoug Rabson 	struct shmid_ds *shmseg;
3568bec0921SDoug Rabson 	struct oshmid_ds outbuf;
3578bec0921SDoug Rabson 
358cb1f0db9SRobert Watson 	if (!jail_sysvipc_allowed && p->p_prison != NULL)
359cb1f0db9SRobert Watson 		return (ENOSYS);
360cb1f0db9SRobert Watson 
3618bec0921SDoug Rabson 	shmseg = shm_find_segment_by_shmid(uap->shmid);
3628bec0921SDoug Rabson 	if (shmseg == NULL)
3638bec0921SDoug Rabson 		return EINVAL;
3648bec0921SDoug Rabson 	switch (uap->cmd) {
3658bec0921SDoug Rabson 	case IPC_STAT:
3661c308b81SPoul-Henning Kamp 		error = ipcperm(p, &shmseg->shm_perm, IPC_R);
367797f2d22SPoul-Henning Kamp 		if (error)
3688bec0921SDoug Rabson 			return error;
3698bec0921SDoug Rabson 		outbuf.shm_perm = shmseg->shm_perm;
3708bec0921SDoug Rabson 		outbuf.shm_segsz = shmseg->shm_segsz;
3718bec0921SDoug Rabson 		outbuf.shm_cpid = shmseg->shm_cpid;
3728bec0921SDoug Rabson 		outbuf.shm_lpid = shmseg->shm_lpid;
3738bec0921SDoug Rabson 		outbuf.shm_nattch = shmseg->shm_nattch;
3748bec0921SDoug Rabson 		outbuf.shm_atime = shmseg->shm_atime;
3758bec0921SDoug Rabson 		outbuf.shm_dtime = shmseg->shm_dtime;
3768bec0921SDoug Rabson 		outbuf.shm_ctime = shmseg->shm_ctime;
3778bec0921SDoug Rabson 		outbuf.shm_handle = shmseg->shm_internal;
378797f2d22SPoul-Henning Kamp 		error = copyout((caddr_t)&outbuf, uap->ubuf, sizeof(outbuf));
379797f2d22SPoul-Henning Kamp 		if (error)
3808bec0921SDoug Rabson 			return error;
3818bec0921SDoug Rabson 		break;
3828bec0921SDoug Rabson 	default:
383725db531SBruce Evans 		/* XXX casting to (sy_call_t *) is bogus, as usual. */
384cb226aaaSPoul-Henning Kamp 		return ((sy_call_t *)shmctl)(p, uap);
3858bec0921SDoug Rabson 	}
3868bec0921SDoug Rabson 	return 0;
3878bec0921SDoug Rabson #else
3888bec0921SDoug Rabson 	return EINVAL;
3898bec0921SDoug Rabson #endif
3908bec0921SDoug Rabson }
3918bec0921SDoug Rabson 
392b5d5c0c9SPeter Wemm #ifndef _SYS_SYSPROTO_H_
3933d903220SDoug Rabson struct shmctl_args {
3943d903220SDoug Rabson 	int shmid;
3953d903220SDoug Rabson 	int cmd;
396b5d5c0c9SPeter Wemm 	struct shmid_ds *buf;
3973d903220SDoug Rabson };
398b5d5c0c9SPeter Wemm #endif
399b5d5c0c9SPeter Wemm 
4003d903220SDoug Rabson int
401cb226aaaSPoul-Henning Kamp shmctl(p, uap)
4023d903220SDoug Rabson 	struct proc *p;
4033d903220SDoug Rabson 	struct shmctl_args *uap;
4043d903220SDoug Rabson {
405797f2d22SPoul-Henning Kamp 	int error;
4063d903220SDoug Rabson 	struct shmid_ds inbuf;
4073d903220SDoug Rabson 	struct shmid_ds *shmseg;
4083d903220SDoug Rabson 
409cb1f0db9SRobert Watson 	if (!jail_sysvipc_allowed && p->p_prison != NULL)
410cb1f0db9SRobert Watson 		return (ENOSYS);
411cb1f0db9SRobert Watson 
4123d903220SDoug Rabson 	shmseg = shm_find_segment_by_shmid(uap->shmid);
4133d903220SDoug Rabson 	if (shmseg == NULL)
4143d903220SDoug Rabson 		return EINVAL;
4153d903220SDoug Rabson 	switch (uap->cmd) {
4163d903220SDoug Rabson 	case IPC_STAT:
4171c308b81SPoul-Henning Kamp 		error = ipcperm(p, &shmseg->shm_perm, IPC_R);
418797f2d22SPoul-Henning Kamp 		if (error)
4193d903220SDoug Rabson 			return error;
420b5d5c0c9SPeter Wemm 		error = copyout((caddr_t)shmseg, uap->buf, sizeof(inbuf));
421797f2d22SPoul-Henning Kamp 		if (error)
4223d903220SDoug Rabson 			return error;
4233d903220SDoug Rabson 		break;
4243d903220SDoug Rabson 	case IPC_SET:
4251c308b81SPoul-Henning Kamp 		error = ipcperm(p, &shmseg->shm_perm, IPC_M);
426797f2d22SPoul-Henning Kamp 		if (error)
4273d903220SDoug Rabson 			return error;
428b5d5c0c9SPeter Wemm 		error = copyin(uap->buf, (caddr_t)&inbuf, sizeof(inbuf));
429797f2d22SPoul-Henning Kamp 		if (error)
4303d903220SDoug Rabson 			return error;
4313d903220SDoug Rabson 		shmseg->shm_perm.uid = inbuf.shm_perm.uid;
4323d903220SDoug Rabson 		shmseg->shm_perm.gid = inbuf.shm_perm.gid;
4333d903220SDoug Rabson 		shmseg->shm_perm.mode =
4343d903220SDoug Rabson 		    (shmseg->shm_perm.mode & ~ACCESSPERMS) |
4353d903220SDoug Rabson 		    (inbuf.shm_perm.mode & ACCESSPERMS);
436227ee8a1SPoul-Henning Kamp 		shmseg->shm_ctime = time_second;
4373d903220SDoug Rabson 		break;
4383d903220SDoug Rabson 	case IPC_RMID:
4391c308b81SPoul-Henning Kamp 		error = ipcperm(p, &shmseg->shm_perm, IPC_M);
440797f2d22SPoul-Henning Kamp 		if (error)
4413d903220SDoug Rabson 			return error;
4423d903220SDoug Rabson 		shmseg->shm_perm.key = IPC_PRIVATE;
4433d903220SDoug Rabson 		shmseg->shm_perm.mode |= SHMSEG_REMOVED;
4443d903220SDoug Rabson 		if (shmseg->shm_nattch <= 0) {
4453d903220SDoug Rabson 			shm_deallocate_segment(shmseg);
4463d903220SDoug Rabson 			shm_last_free = IPCID_TO_IX(uap->shmid);
4473d903220SDoug Rabson 		}
4483d903220SDoug Rabson 		break;
4493d903220SDoug Rabson #if 0
4503d903220SDoug Rabson 	case SHM_LOCK:
4513d903220SDoug Rabson 	case SHM_UNLOCK:
4523d903220SDoug Rabson #endif
4533d903220SDoug Rabson 	default:
4543d903220SDoug Rabson 		return EINVAL;
4553d903220SDoug Rabson 	}
4563d903220SDoug Rabson 	return 0;
4573d903220SDoug Rabson }
4583d903220SDoug Rabson 
459b5d5c0c9SPeter Wemm #ifndef _SYS_SYSPROTO_H_
4603d903220SDoug Rabson struct shmget_args {
4613d903220SDoug Rabson 	key_t key;
4623d903220SDoug Rabson 	size_t size;
4633d903220SDoug Rabson 	int shmflg;
4643d903220SDoug Rabson };
465b5d5c0c9SPeter Wemm #endif
466b5d5c0c9SPeter Wemm 
4673d903220SDoug Rabson static int
468cb226aaaSPoul-Henning Kamp shmget_existing(p, uap, mode, segnum)
4693d903220SDoug Rabson 	struct proc *p;
4703d903220SDoug Rabson 	struct shmget_args *uap;
4713d903220SDoug Rabson 	int mode;
4723d903220SDoug Rabson 	int segnum;
4733d903220SDoug Rabson {
4743d903220SDoug Rabson 	struct shmid_ds *shmseg;
4753d903220SDoug Rabson 	int error;
4763d903220SDoug Rabson 
4773d903220SDoug Rabson 	shmseg = &shmsegs[segnum];
4783d903220SDoug Rabson 	if (shmseg->shm_perm.mode & SHMSEG_REMOVED) {
4793d903220SDoug Rabson 		/*
4803d903220SDoug Rabson 		 * This segment is in the process of being allocated.  Wait
4813d903220SDoug Rabson 		 * until it's done, and look the key up again (in case the
4823d903220SDoug Rabson 		 * allocation failed or it was freed).
4833d903220SDoug Rabson 		 */
4843d903220SDoug Rabson 		shmseg->shm_perm.mode |= SHMSEG_WANTED;
485797f2d22SPoul-Henning Kamp 		error = tsleep((caddr_t)shmseg, PLOCK | PCATCH, "shmget", 0);
486797f2d22SPoul-Henning Kamp 		if (error)
4873d903220SDoug Rabson 			return error;
4883d903220SDoug Rabson 		return EAGAIN;
4893d903220SDoug Rabson 	}
490dc92aa57SAlan Cox 	if ((uap->shmflg & (IPC_CREAT | IPC_EXCL)) == (IPC_CREAT | IPC_EXCL))
491dc92aa57SAlan Cox 		return EEXIST;
4921c308b81SPoul-Henning Kamp 	error = ipcperm(p, &shmseg->shm_perm, mode);
493797f2d22SPoul-Henning Kamp 	if (error)
4943d903220SDoug Rabson 		return error;
4953d903220SDoug Rabson 	if (uap->size && uap->size > shmseg->shm_segsz)
4963d903220SDoug Rabson 		return EINVAL;
497cb226aaaSPoul-Henning Kamp 	p->p_retval[0] = IXSEQ_TO_IPCID(segnum, shmseg->shm_perm);
4983d903220SDoug Rabson 	return 0;
4993d903220SDoug Rabson }
5003d903220SDoug Rabson 
5013d903220SDoug Rabson static int
502cb226aaaSPoul-Henning Kamp shmget_allocate_segment(p, uap, mode)
5033d903220SDoug Rabson 	struct proc *p;
5043d903220SDoug Rabson 	struct shmget_args *uap;
5053d903220SDoug Rabson 	int mode;
5063d903220SDoug Rabson {
507a51f7119SJohn Dyson 	int i, segnum, shmid, size;
5083d903220SDoug Rabson 	struct ucred *cred = p->p_ucred;
5093d903220SDoug Rabson 	struct shmid_ds *shmseg;
5103d903220SDoug Rabson 	struct shm_handle *shm_handle;
5113d903220SDoug Rabson 
5123d903220SDoug Rabson 	if (uap->size < shminfo.shmmin || uap->size > shminfo.shmmax)
5133d903220SDoug Rabson 		return EINVAL;
5143d903220SDoug Rabson 	if (shm_nused >= shminfo.shmmni) /* any shmids left? */
5153d903220SDoug Rabson 		return ENOSPC;
5169e609ddeSJoerg Wunsch 	size = round_page(uap->size);
5173d903220SDoug Rabson 	if (shm_committed + btoc(size) > shminfo.shmall)
5183d903220SDoug Rabson 		return ENOMEM;
5193d903220SDoug Rabson 	if (shm_last_free < 0) {
520255108f3SPeter Wemm 		shmrealloc();	/* maybe expand the shmsegs[] array */
521255108f3SPeter Wemm 		for (i = 0; i < shmalloced; i++)
5223d903220SDoug Rabson 			if (shmsegs[i].shm_perm.mode & SHMSEG_FREE)
5233d903220SDoug Rabson 				break;
524255108f3SPeter Wemm 		if (i == shmalloced)
525255108f3SPeter Wemm 			return ENOSPC;
5263d903220SDoug Rabson 		segnum = i;
5273d903220SDoug Rabson 	} else  {
5283d903220SDoug Rabson 		segnum = shm_last_free;
5293d903220SDoug Rabson 		shm_last_free = -1;
5303d903220SDoug Rabson 	}
5313d903220SDoug Rabson 	shmseg = &shmsegs[segnum];
5323d903220SDoug Rabson 	/*
5333d903220SDoug Rabson 	 * In case we sleep in malloc(), mark the segment present but deleted
5343d903220SDoug Rabson 	 * so that noone else tries to create the same key.
5353d903220SDoug Rabson 	 */
5363d903220SDoug Rabson 	shmseg->shm_perm.mode = SHMSEG_ALLOCATED | SHMSEG_REMOVED;
5373d903220SDoug Rabson 	shmseg->shm_perm.key = uap->key;
5383d903220SDoug Rabson 	shmseg->shm_perm.seq = (shmseg->shm_perm.seq + 1) & 0x7fff;
5393d903220SDoug Rabson 	shm_handle = (struct shm_handle *)
5403d903220SDoug Rabson 	    malloc(sizeof(struct shm_handle), M_SHM, M_WAITOK);
5413d903220SDoug Rabson 	shmid = IXSEQ_TO_IPCID(segnum, shmseg->shm_perm);
542a51f7119SJohn Dyson 
543ae9b8c3aSJohn Dyson 	/*
544ae9b8c3aSJohn Dyson 	 * We make sure that we have allocated a pager before we need
545ae9b8c3aSJohn Dyson 	 * to.
546ae9b8c3aSJohn Dyson 	 */
5478b03c8edSMatthew Dillon 	if (shm_use_phys) {
54824488c74SPeter Wemm 		shm_handle->shm_object =
54924488c74SPeter Wemm 		    vm_pager_allocate(OBJT_PHYS, 0, size, VM_PROT_DEFAULT, 0);
5508b03c8edSMatthew Dillon 	} else {
551a51f7119SJohn Dyson 		shm_handle->shm_object =
5526cde7a16SDavid Greenman 		    vm_pager_allocate(OBJT_SWAP, 0, size, VM_PROT_DEFAULT, 0);
5538b03c8edSMatthew Dillon 	}
554069e9bc1SDoug Rabson 	vm_object_clear_flag(shm_handle->shm_object, OBJ_ONEMAPPING);
555069e9bc1SDoug Rabson 	vm_object_set_flag(shm_handle->shm_object, OBJ_NOSPLIT);
556cbd8ec09SJohn Dyson 
5573d903220SDoug Rabson 	shmseg->shm_internal = shm_handle;
5583d903220SDoug Rabson 	shmseg->shm_perm.cuid = shmseg->shm_perm.uid = cred->cr_uid;
5593d903220SDoug Rabson 	shmseg->shm_perm.cgid = shmseg->shm_perm.gid = cred->cr_gid;
5603d903220SDoug Rabson 	shmseg->shm_perm.mode = (shmseg->shm_perm.mode & SHMSEG_WANTED) |
5613d903220SDoug Rabson 	    (mode & ACCESSPERMS) | SHMSEG_ALLOCATED;
5623d903220SDoug Rabson 	shmseg->shm_segsz = uap->size;
5633d903220SDoug Rabson 	shmseg->shm_cpid = p->p_pid;
5643d903220SDoug Rabson 	shmseg->shm_lpid = shmseg->shm_nattch = 0;
5653d903220SDoug Rabson 	shmseg->shm_atime = shmseg->shm_dtime = 0;
566227ee8a1SPoul-Henning Kamp 	shmseg->shm_ctime = time_second;
5673d903220SDoug Rabson 	shm_committed += btoc(size);
5683d903220SDoug Rabson 	shm_nused++;
5693d903220SDoug Rabson 	if (shmseg->shm_perm.mode & SHMSEG_WANTED) {
5703d903220SDoug Rabson 		/*
5713d903220SDoug Rabson 		 * Somebody else wanted this key while we were asleep.  Wake
5723d903220SDoug Rabson 		 * them up now.
5733d903220SDoug Rabson 		 */
5743d903220SDoug Rabson 		shmseg->shm_perm.mode &= ~SHMSEG_WANTED;
5753d903220SDoug Rabson 		wakeup((caddr_t)shmseg);
5763d903220SDoug Rabson 	}
577cb226aaaSPoul-Henning Kamp 	p->p_retval[0] = shmid;
5783d903220SDoug Rabson 	return 0;
5793d903220SDoug Rabson }
5803d903220SDoug Rabson 
5813d903220SDoug Rabson int
582cb226aaaSPoul-Henning Kamp shmget(p, uap)
5833d903220SDoug Rabson 	struct proc *p;
5843d903220SDoug Rabson 	struct shmget_args *uap;
5853d903220SDoug Rabson {
5863d903220SDoug Rabson 	int segnum, mode, error;
5873d903220SDoug Rabson 
588cb1f0db9SRobert Watson 	if (!jail_sysvipc_allowed && p->p_prison != NULL)
589cb1f0db9SRobert Watson 		return (ENOSYS);
590cb1f0db9SRobert Watson 
5913d903220SDoug Rabson 	mode = uap->shmflg & ACCESSPERMS;
5923d903220SDoug Rabson 	if (uap->key != IPC_PRIVATE) {
5933d903220SDoug Rabson 	again:
5943d903220SDoug Rabson 		segnum = shm_find_segment_by_key(uap->key);
5953d903220SDoug Rabson 		if (segnum >= 0) {
596cb226aaaSPoul-Henning Kamp 			error = shmget_existing(p, uap, mode, segnum);
5973d903220SDoug Rabson 			if (error == EAGAIN)
5983d903220SDoug Rabson 				goto again;
5993d903220SDoug Rabson 			return error;
6003d903220SDoug Rabson 		}
6013d903220SDoug Rabson 		if ((uap->shmflg & IPC_CREAT) == 0)
6023d903220SDoug Rabson 			return ENOENT;
6033d903220SDoug Rabson 	}
604cb226aaaSPoul-Henning Kamp 	return shmget_allocate_segment(p, uap, mode);
6053d903220SDoug Rabson }
6063d903220SDoug Rabson 
6073d903220SDoug Rabson int
608cb226aaaSPoul-Henning Kamp shmsys(p, uap)
6093d903220SDoug Rabson 	struct proc *p;
610725db531SBruce Evans 	/* XXX actually varargs. */
611725db531SBruce Evans 	struct shmsys_args /* {
612725db531SBruce Evans 		u_int	which;
613725db531SBruce Evans 		int	a2;
614725db531SBruce Evans 		int	a3;
615725db531SBruce Evans 		int	a4;
616725db531SBruce Evans 	} */ *uap;
6173d903220SDoug Rabson {
6183d903220SDoug Rabson 
619cb1f0db9SRobert Watson 	if (!jail_sysvipc_allowed && p->p_prison != NULL)
620cb1f0db9SRobert Watson 		return (ENOSYS);
621cb1f0db9SRobert Watson 
6223d903220SDoug Rabson 	if (uap->which >= sizeof(shmcalls)/sizeof(shmcalls[0]))
6233d903220SDoug Rabson 		return EINVAL;
624cb226aaaSPoul-Henning Kamp 	return ((*shmcalls[uap->which])(p, &uap->a2));
6253d903220SDoug Rabson }
6263d903220SDoug Rabson 
6273d903220SDoug Rabson void
628dabee6feSPeter Wemm shmfork(p1, p2)
6293d903220SDoug Rabson 	struct proc *p1, *p2;
6303d903220SDoug Rabson {
6313d903220SDoug Rabson 	struct shmmap_state *shmmap_s;
6323d903220SDoug Rabson 	size_t size;
6333d903220SDoug Rabson 	int i;
6343d903220SDoug Rabson 
6353d903220SDoug Rabson 	size = shminfo.shmseg * sizeof(struct shmmap_state);
6363d903220SDoug Rabson 	shmmap_s = malloc(size, M_SHM, M_WAITOK);
6373d903220SDoug Rabson 	bcopy((caddr_t)p1->p_vmspace->vm_shm, (caddr_t)shmmap_s, size);
6383d903220SDoug Rabson 	p2->p_vmspace->vm_shm = (caddr_t)shmmap_s;
6393d903220SDoug Rabson 	for (i = 0; i < shminfo.shmseg; i++, shmmap_s++)
6403d903220SDoug Rabson 		if (shmmap_s->shmid != -1)
6413d903220SDoug Rabson 			shmsegs[IPCID_TO_IX(shmmap_s->shmid)].shm_nattch++;
6423d903220SDoug Rabson }
6433d903220SDoug Rabson 
6443d903220SDoug Rabson void
6453d903220SDoug Rabson shmexit(p)
6463d903220SDoug Rabson 	struct proc *p;
6473d903220SDoug Rabson {
6483d903220SDoug Rabson 	struct shmmap_state *shmmap_s;
6493d903220SDoug Rabson 	int i;
6503d903220SDoug Rabson 
6513d903220SDoug Rabson 	shmmap_s = (struct shmmap_state *)p->p_vmspace->vm_shm;
6523d903220SDoug Rabson 	for (i = 0; i < shminfo.shmseg; i++, shmmap_s++)
6533d903220SDoug Rabson 		if (shmmap_s->shmid != -1)
6543d903220SDoug Rabson 			shm_delete_mapping(p, shmmap_s);
6553d903220SDoug Rabson 	free((caddr_t)p->p_vmspace->vm_shm, M_SHM);
6563d903220SDoug Rabson 	p->p_vmspace->vm_shm = NULL;
6573d903220SDoug Rabson }
6583d903220SDoug Rabson 
659255108f3SPeter Wemm static void
660255108f3SPeter Wemm shmrealloc(void)
661255108f3SPeter Wemm {
662255108f3SPeter Wemm 	int i;
663255108f3SPeter Wemm 	struct shmid_ds *newsegs;
664255108f3SPeter Wemm 
665255108f3SPeter Wemm 	if (shmalloced >= shminfo.shmmni)
666255108f3SPeter Wemm 		return;
667255108f3SPeter Wemm 
668255108f3SPeter Wemm 	newsegs = malloc(shminfo.shmmni * sizeof(*newsegs), M_SHM, M_WAITOK);
669255108f3SPeter Wemm 	if (newsegs == NULL)
670255108f3SPeter Wemm 		return;
671255108f3SPeter Wemm 	for (i = 0; i < shmalloced; i++)
672255108f3SPeter Wemm 		bcopy(&shmsegs[i], &newsegs[i], sizeof(newsegs[0]));
673255108f3SPeter Wemm 	for (; i < shminfo.shmmni; i++) {
674255108f3SPeter Wemm 		shmsegs[i].shm_perm.mode = SHMSEG_FREE;
675255108f3SPeter Wemm 		shmsegs[i].shm_perm.seq = 0;
676255108f3SPeter Wemm 	}
677255108f3SPeter Wemm 	free(shmsegs, M_SHM);
678255108f3SPeter Wemm 	shmsegs = newsegs;
679255108f3SPeter Wemm 	shmalloced = shminfo.shmmni;
680255108f3SPeter Wemm }
681255108f3SPeter Wemm 
682255108f3SPeter Wemm static void
683725db531SBruce Evans shminit(dummy)
684725db531SBruce Evans 	void *dummy;
6853d903220SDoug Rabson {
6863d903220SDoug Rabson 	int i;
687255108f3SPeter Wemm 
688255108f3SPeter Wemm 	shmalloced = shminfo.shmmni;
689255108f3SPeter Wemm 	shmsegs = malloc(shmalloced * sizeof(shmsegs[0]), M_SHM, M_WAITOK);
690255108f3SPeter Wemm 	if (shmsegs == NULL)
691255108f3SPeter Wemm 		panic("cannot allocate initial memory for sysvshm");
692255108f3SPeter Wemm 	for (i = 0; i < shmalloced; i++) {
6933d903220SDoug Rabson 		shmsegs[i].shm_perm.mode = SHMSEG_FREE;
6943d903220SDoug Rabson 		shmsegs[i].shm_perm.seq = 0;
6953d903220SDoug Rabson 	}
6963d903220SDoug Rabson 	shm_last_free = 0;
6973d903220SDoug Rabson 	shm_nused = 0;
6983d903220SDoug Rabson 	shm_committed = 0;
6993d903220SDoug Rabson }
700255108f3SPeter Wemm SYSINIT(sysv_shm, SI_SUB_SYSV_SHM, SI_ORDER_FIRST, shminit, NULL);
701