xref: /f-stack/freebsd/kern/sysv_msg.c (revision 22ce4aff)
/*-
 * Implementation of SVID messages
 *
 * Author:  Daniel Boulet
 *
 * Copyright 1993 Daniel Boulet and RTMX Inc.
 *
 * This system call was implemented by Daniel Boulet under contract from RTMX.
 *
 * Redistribution and use in source forms, with and without modification,
 * are permitted provided that this entire comment appears intact.
 *
 * Redistribution in binary form may occur without any restrictions.
 * Obviously, it would be nice if you gave credit where credit is due
 * but requiring it would be too onerous.
 *
 * This software is provided ``AS IS'' without any warranties of any kind.
 */
/*-
 * SPDX-License-Identifier: BSD-2-Clause-FreeBSD
 *
 * Copyright (c) 2003-2005 McAfee, Inc.
 * Copyright (c) 2016-2017 Robert N. M. Watson
 * All rights reserved.
 *
 * This software was developed for the FreeBSD Project in part by McAfee
 * Research, the Security Research Division of McAfee, Inc under DARPA/SPAWAR
 * contract N66001-01-C-8035 ("CBOSS"), as part of the DARPA CHATS research
 * program.
 *
 * Portions of this software were developed by BAE Systems, the University of
 * Cambridge Computer Laboratory, and Memorial University under DARPA/AFRL
 * contract FA8650-15-C-7558 ("CADETS"), as part of the DARPA Transparent
 * Computing (TC) research program.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */
57a9643ea8Slogwang 
58a9643ea8Slogwang #include <sys/cdefs.h>
59a9643ea8Slogwang __FBSDID("$FreeBSD$");
60a9643ea8Slogwang 
61a9643ea8Slogwang #include "opt_sysvipc.h"
62a9643ea8Slogwang 
63a9643ea8Slogwang #include <sys/param.h>
64a9643ea8Slogwang #include <sys/systm.h>
65a9643ea8Slogwang #include <sys/sysproto.h>
66a9643ea8Slogwang #include <sys/kernel.h>
67a9643ea8Slogwang #include <sys/priv.h>
68a9643ea8Slogwang #include <sys/proc.h>
69a9643ea8Slogwang #include <sys/lock.h>
70a9643ea8Slogwang #include <sys/mutex.h>
71a9643ea8Slogwang #include <sys/module.h>
72a9643ea8Slogwang #include <sys/mount.h>
73a9643ea8Slogwang #include <sys/msg.h>
74a9643ea8Slogwang #include <sys/racct.h>
75a9643ea8Slogwang #include <sys/sx.h>
76a9643ea8Slogwang #include <sys/syscall.h>
77a9643ea8Slogwang #include <sys/syscallsubr.h>
78a9643ea8Slogwang #include <sys/sysent.h>
79a9643ea8Slogwang #include <sys/sysctl.h>
80a9643ea8Slogwang #include <sys/malloc.h>
81a9643ea8Slogwang #include <sys/jail.h>
82a9643ea8Slogwang 
83*22ce4affSfengbojiang #include <security/audit/audit.h>
84a9643ea8Slogwang #include <security/mac/mac_framework.h>
85a9643ea8Slogwang 
86a9643ea8Slogwang FEATURE(sysv_msg, "System V message queues support");
87a9643ea8Slogwang 
88a9643ea8Slogwang static MALLOC_DEFINE(M_MSG, "msg", "SVID compatible message queues");
89a9643ea8Slogwang 
90a9643ea8Slogwang static int msginit(void);
91a9643ea8Slogwang static int msgunload(void);
92a9643ea8Slogwang static int sysvmsg_modload(struct module *, int, void *);
93a9643ea8Slogwang static void msq_remove(struct msqid_kernel *);
94a9643ea8Slogwang static struct prison *msg_find_prison(struct ucred *);
95a9643ea8Slogwang static int msq_prison_cansee(struct prison *, struct msqid_kernel *);
96a9643ea8Slogwang static int msg_prison_check(void *, void *);
97a9643ea8Slogwang static int msg_prison_set(void *, void *);
98a9643ea8Slogwang static int msg_prison_get(void *, void *);
99a9643ea8Slogwang static int msg_prison_remove(void *, void *);
100a9643ea8Slogwang static void msg_prison_cleanup(struct prison *);
101a9643ea8Slogwang 
/*
 * Debug tracing.  The argument is a complete, parenthesized printf
 * argument list, e.g. DPRINTF(("x=%d\n", x)).  When MSG_DEBUG is not
 * defined the macro expands to a no-op expression and the arguments are
 * not evaluated.
 */
#ifdef MSG_DEBUG
#define DPRINTF(a)	printf a
#else
#define DPRINTF(a)	(void)0
#endif
107a9643ea8Slogwang 
/* Release a message header and its segments (defined below). */
static void msg_freehdr(struct msg *msghdr);
109a9643ea8Slogwang 
/*
 * Compile-time defaults for the message queue limits.  Each one may be
 * overridden by defining the macro before this point (e.g. from the
 * kernel configuration); MSGMAX is always derived from MSGSSZ and MSGSEG.
 */
#ifndef MSGSSZ
#define MSGSSZ	8		/* Each segment must be 2^N long */
#endif
#ifndef MSGSEG
#define MSGSEG	2048		/* must be less than 32767 */
#endif
#define MSGMAX	(MSGSSZ*MSGSEG)
#ifndef MSGMNB
#define MSGMNB	2048		/* max # of bytes in a queue */
#endif
#ifndef MSGMNI
#define MSGMNI	40
#endif
#ifndef MSGTQL
#define MSGTQL	40
#endif
126a9643ea8Slogwang 
127a9643ea8Slogwang /*
128a9643ea8Slogwang  * Based on the configuration parameters described in an SVR2 (yes, two)
129a9643ea8Slogwang  * config(1m) man page.
130a9643ea8Slogwang  *
131a9643ea8Slogwang  * Each message is broken up and stored in segments that are msgssz bytes
132a9643ea8Slogwang  * long.  For efficiency reasons, this should be a power of two.  Also,
133a9643ea8Slogwang  * it doesn't make sense if it is less than 8 or greater than about 256.
134a9643ea8Slogwang  * Consequently, msginit in kern/sysv_msg.c checks that msgssz is a power of
135a9643ea8Slogwang  * two between 8 and 1024 inclusive (and panic's if it isn't).
136a9643ea8Slogwang  */
137a9643ea8Slogwang struct msginfo msginfo = {
138a9643ea8Slogwang                 MSGMAX,         /* max chars in a message */
139a9643ea8Slogwang                 MSGMNI,         /* # of message queue identifiers */
140a9643ea8Slogwang                 MSGMNB,         /* max chars in a queue */
141a9643ea8Slogwang                 MSGTQL,         /* max messages in system */
142a9643ea8Slogwang                 MSGSSZ,         /* size of a message segment */
143a9643ea8Slogwang                 		/* (must be small power of 2 greater than 4) */
144a9643ea8Slogwang                 MSGSEG          /* number of message segments */
145a9643ea8Slogwang };
146a9643ea8Slogwang 
/*
 * macros to convert between msqid_ds's and msqid's.
 * (specific to this implementation)
 *
 * An id packs the table index into the low 16 bits and the slot's
 * sequence number into the high 16 bits.  The sequence number is widened
 * to unsigned before shifting so that values with bit 15 set do not
 * overflow a signed int.
 */
#define MSQID(ix,ds)	(((ix) & 0xffff) | \
			    (((unsigned)(ds).msg_perm.seq << 16) & 0xffff0000))
#define MSQID_IX(id)	((id) & 0xffff)
#define MSQID_SEQ(id)	(((id) >> 16) & 0xffff)
154a9643ea8Slogwang 
/*
 * The rest of this file is specific to this particular implementation.
 */

/*
 * One entry per message segment.  Entries are chained through 'next',
 * either on the free list or as part of a stored message.
 */
struct msgmap {
	short	next;		/* next segment in buffer */
    				/* -1 -> available */
    				/* 0..(MSGSEG-1) -> index of next segment */
};
164a9643ea8Slogwang 
/* Flag kept in msg_perm.mode, outside the 0777 permission bits. */
#define MSG_LOCKED	01000	/* Is this msqid_ds locked? */
166a9643ea8Slogwang 
167a9643ea8Slogwang static int nfree_msgmaps;	/* # of free map entries */
168a9643ea8Slogwang static short free_msgmaps;	/* head of linked list of free map entries */
169a9643ea8Slogwang static struct msg *free_msghdrs;/* list of free msg headers */
170a9643ea8Slogwang static char *msgpool;		/* MSGMAX byte long msg buffer pool */
171a9643ea8Slogwang static struct msgmap *msgmaps;	/* MSGSEG msgmap structures */
172a9643ea8Slogwang static struct msg *msghdrs;	/* MSGTQL msg headers */
173a9643ea8Slogwang static struct msqid_kernel *msqids;	/* MSGMNI msqid_kernel struct's */
174a9643ea8Slogwang static struct mtx msq_mtx;	/* global mutex for message queues. */
175a9643ea8Slogwang static unsigned msg_prison_slot;/* prison OSD slot */
176a9643ea8Slogwang 
177a9643ea8Slogwang static struct syscall_helper_data msg_syscalls[] = {
178a9643ea8Slogwang 	SYSCALL_INIT_HELPER(msgctl),
179a9643ea8Slogwang 	SYSCALL_INIT_HELPER(msgget),
180a9643ea8Slogwang 	SYSCALL_INIT_HELPER(msgsnd),
181a9643ea8Slogwang 	SYSCALL_INIT_HELPER(msgrcv),
182a9643ea8Slogwang #if defined(COMPAT_FREEBSD4) || defined(COMPAT_FREEBSD5) || \
183a9643ea8Slogwang     defined(COMPAT_FREEBSD6) || defined(COMPAT_FREEBSD7)
184a9643ea8Slogwang 	SYSCALL_INIT_HELPER(msgsys),
185a9643ea8Slogwang 	SYSCALL_INIT_HELPER_COMPAT(freebsd7_msgctl),
186a9643ea8Slogwang #endif
187a9643ea8Slogwang 	SYSCALL_INIT_LAST
188a9643ea8Slogwang };
189a9643ea8Slogwang 
#ifdef COMPAT_FREEBSD32
#include <compat/freebsd32/freebsd32.h>
#include <compat/freebsd32/freebsd32_ipc.h>
#include <compat/freebsd32/freebsd32_proto.h>
#include <compat/freebsd32/freebsd32_signal.h>
#include <compat/freebsd32/freebsd32_syscall.h>
#include <compat/freebsd32/freebsd32_util.h>

/*
 * 32-bit compatibility system calls, registered alongside msg_syscalls
 * when COMPAT_FREEBSD32 is configured.
 */
static struct syscall_helper_data msg32_syscalls[] = {
	SYSCALL32_INIT_HELPER(freebsd32_msgctl),
	SYSCALL32_INIT_HELPER(freebsd32_msgsnd),
	SYSCALL32_INIT_HELPER(freebsd32_msgrcv),
	SYSCALL32_INIT_HELPER_COMPAT(msgget),
	SYSCALL32_INIT_HELPER(freebsd32_msgsys),
#if defined(COMPAT_FREEBSD4) || defined(COMPAT_FREEBSD5) || \
    defined(COMPAT_FREEBSD6) || defined(COMPAT_FREEBSD7)
	SYSCALL32_INIT_HELPER(freebsd7_freebsd32_msgctl),
#endif
	SYSCALL_INIT_LAST
};
#endif
211a9643ea8Slogwang 
212a9643ea8Slogwang static int
msginit()213a9643ea8Slogwang msginit()
214a9643ea8Slogwang {
215a9643ea8Slogwang 	struct prison *pr;
216a9643ea8Slogwang 	void **rsv;
217a9643ea8Slogwang 	int i, error;
218a9643ea8Slogwang 	osd_method_t methods[PR_MAXMETHOD] = {
219a9643ea8Slogwang 	    [PR_METHOD_CHECK] =		msg_prison_check,
220a9643ea8Slogwang 	    [PR_METHOD_SET] =		msg_prison_set,
221a9643ea8Slogwang 	    [PR_METHOD_GET] =		msg_prison_get,
222a9643ea8Slogwang 	    [PR_METHOD_REMOVE] =	msg_prison_remove,
223a9643ea8Slogwang 	};
224a9643ea8Slogwang 
225a9643ea8Slogwang 	msginfo.msgmax = msginfo.msgseg * msginfo.msgssz;
226a9643ea8Slogwang 	msgpool = malloc(msginfo.msgmax, M_MSG, M_WAITOK);
227a9643ea8Slogwang 	msgmaps = malloc(sizeof(struct msgmap) * msginfo.msgseg, M_MSG, M_WAITOK);
228a9643ea8Slogwang 	msghdrs = malloc(sizeof(struct msg) * msginfo.msgtql, M_MSG, M_WAITOK);
229a9643ea8Slogwang 	msqids = malloc(sizeof(struct msqid_kernel) * msginfo.msgmni, M_MSG,
230*22ce4affSfengbojiang 	    M_WAITOK | M_ZERO);
231a9643ea8Slogwang 
232a9643ea8Slogwang 	/*
233a9643ea8Slogwang 	 * msginfo.msgssz should be a power of two for efficiency reasons.
234a9643ea8Slogwang 	 * It is also pretty silly if msginfo.msgssz is less than 8
235a9643ea8Slogwang 	 * or greater than about 256 so ...
236a9643ea8Slogwang 	 */
237a9643ea8Slogwang 
238a9643ea8Slogwang 	i = 8;
239a9643ea8Slogwang 	while (i < 1024 && i != msginfo.msgssz)
240a9643ea8Slogwang 		i <<= 1;
241a9643ea8Slogwang     	if (i != msginfo.msgssz) {
242a9643ea8Slogwang 		DPRINTF(("msginfo.msgssz=%d (0x%x)\n", msginfo.msgssz,
243a9643ea8Slogwang 		    msginfo.msgssz));
244a9643ea8Slogwang 		panic("msginfo.msgssz not a small power of 2");
245a9643ea8Slogwang 	}
246a9643ea8Slogwang 
247a9643ea8Slogwang 	if (msginfo.msgseg > 32767) {
248a9643ea8Slogwang 		DPRINTF(("msginfo.msgseg=%d\n", msginfo.msgseg));
249a9643ea8Slogwang 		panic("msginfo.msgseg > 32767");
250a9643ea8Slogwang 	}
251a9643ea8Slogwang 
252a9643ea8Slogwang 	for (i = 0; i < msginfo.msgseg; i++) {
253a9643ea8Slogwang 		if (i > 0)
254a9643ea8Slogwang 			msgmaps[i-1].next = i;
255a9643ea8Slogwang 		msgmaps[i].next = -1;	/* implies entry is available */
256a9643ea8Slogwang 	}
257a9643ea8Slogwang 	free_msgmaps = 0;
258a9643ea8Slogwang 	nfree_msgmaps = msginfo.msgseg;
259a9643ea8Slogwang 
260a9643ea8Slogwang 	for (i = 0; i < msginfo.msgtql; i++) {
261a9643ea8Slogwang 		msghdrs[i].msg_type = 0;
262a9643ea8Slogwang 		if (i > 0)
263a9643ea8Slogwang 			msghdrs[i-1].msg_next = &msghdrs[i];
264a9643ea8Slogwang 		msghdrs[i].msg_next = NULL;
265a9643ea8Slogwang #ifdef MAC
266a9643ea8Slogwang 		mac_sysvmsg_init(&msghdrs[i]);
267a9643ea8Slogwang #endif
268a9643ea8Slogwang     	}
269a9643ea8Slogwang 	free_msghdrs = &msghdrs[0];
270a9643ea8Slogwang 
271a9643ea8Slogwang 	for (i = 0; i < msginfo.msgmni; i++) {
272a9643ea8Slogwang 		msqids[i].u.msg_qbytes = 0;	/* implies entry is available */
273a9643ea8Slogwang 		msqids[i].u.msg_perm.seq = 0;	/* reset to a known value */
274a9643ea8Slogwang 		msqids[i].u.msg_perm.mode = 0;
275a9643ea8Slogwang #ifdef MAC
276a9643ea8Slogwang 		mac_sysvmsq_init(&msqids[i]);
277a9643ea8Slogwang #endif
278a9643ea8Slogwang 	}
279a9643ea8Slogwang 	mtx_init(&msq_mtx, "msq", NULL, MTX_DEF);
280a9643ea8Slogwang 
281a9643ea8Slogwang 	/* Set current prisons according to their allow.sysvipc. */
282a9643ea8Slogwang 	msg_prison_slot = osd_jail_register(NULL, methods);
283a9643ea8Slogwang 	rsv = osd_reserve(msg_prison_slot);
284a9643ea8Slogwang 	prison_lock(&prison0);
285a9643ea8Slogwang 	(void)osd_jail_set_reserved(&prison0, msg_prison_slot, rsv, &prison0);
286a9643ea8Slogwang 	prison_unlock(&prison0);
287a9643ea8Slogwang 	rsv = NULL;
288a9643ea8Slogwang 	sx_slock(&allprison_lock);
289a9643ea8Slogwang 	TAILQ_FOREACH(pr, &allprison, pr_list) {
290a9643ea8Slogwang 		if (rsv == NULL)
291a9643ea8Slogwang 			rsv = osd_reserve(msg_prison_slot);
292a9643ea8Slogwang 		prison_lock(pr);
293*22ce4affSfengbojiang 		if (prison_isvalid(pr) && (pr->pr_allow & PR_ALLOW_SYSVIPC)) {
294a9643ea8Slogwang 			(void)osd_jail_set_reserved(pr, msg_prison_slot, rsv,
295a9643ea8Slogwang 			    &prison0);
296a9643ea8Slogwang 			rsv = NULL;
297a9643ea8Slogwang 		}
298a9643ea8Slogwang 		prison_unlock(pr);
299a9643ea8Slogwang 	}
300a9643ea8Slogwang 	if (rsv != NULL)
301a9643ea8Slogwang 		osd_free_reserved(rsv);
302a9643ea8Slogwang 	sx_sunlock(&allprison_lock);
303a9643ea8Slogwang 
304a9643ea8Slogwang 	error = syscall_helper_register(msg_syscalls, SY_THR_STATIC_KLD);
305a9643ea8Slogwang 	if (error != 0)
306a9643ea8Slogwang 		return (error);
307a9643ea8Slogwang #ifdef COMPAT_FREEBSD32
308a9643ea8Slogwang 	error = syscall32_helper_register(msg32_syscalls, SY_THR_STATIC_KLD);
309a9643ea8Slogwang 	if (error != 0)
310a9643ea8Slogwang 		return (error);
311a9643ea8Slogwang #endif
312a9643ea8Slogwang 	return (0);
313a9643ea8Slogwang }
314a9643ea8Slogwang 
315a9643ea8Slogwang static int
msgunload()316a9643ea8Slogwang msgunload()
317a9643ea8Slogwang {
318a9643ea8Slogwang 	struct msqid_kernel *msqkptr;
319a9643ea8Slogwang 	int msqid;
320a9643ea8Slogwang #ifdef MAC
321a9643ea8Slogwang 	int i;
322a9643ea8Slogwang #endif
323a9643ea8Slogwang 
324a9643ea8Slogwang 	syscall_helper_unregister(msg_syscalls);
325a9643ea8Slogwang #ifdef COMPAT_FREEBSD32
326a9643ea8Slogwang 	syscall32_helper_unregister(msg32_syscalls);
327a9643ea8Slogwang #endif
328a9643ea8Slogwang 
329a9643ea8Slogwang 	for (msqid = 0; msqid < msginfo.msgmni; msqid++) {
330a9643ea8Slogwang 		msqkptr = &msqids[msqid];
331a9643ea8Slogwang 		if (msqkptr->u.msg_qbytes != 0 ||
332a9643ea8Slogwang 		    (msqkptr->u.msg_perm.mode & MSG_LOCKED) != 0)
333a9643ea8Slogwang 			break;
334a9643ea8Slogwang 	}
335a9643ea8Slogwang 	if (msqid != msginfo.msgmni)
336a9643ea8Slogwang 		return (EBUSY);
337a9643ea8Slogwang 
338a9643ea8Slogwang 	if (msg_prison_slot != 0)
339a9643ea8Slogwang 		osd_jail_deregister(msg_prison_slot);
340a9643ea8Slogwang #ifdef MAC
341a9643ea8Slogwang 	for (i = 0; i < msginfo.msgtql; i++)
342a9643ea8Slogwang 		mac_sysvmsg_destroy(&msghdrs[i]);
343a9643ea8Slogwang 	for (msqid = 0; msqid < msginfo.msgmni; msqid++)
344a9643ea8Slogwang 		mac_sysvmsq_destroy(&msqids[msqid]);
345a9643ea8Slogwang #endif
346a9643ea8Slogwang 	free(msgpool, M_MSG);
347a9643ea8Slogwang 	free(msgmaps, M_MSG);
348a9643ea8Slogwang 	free(msghdrs, M_MSG);
349a9643ea8Slogwang 	free(msqids, M_MSG);
350a9643ea8Slogwang 	mtx_destroy(&msq_mtx);
351a9643ea8Slogwang 	return (0);
352a9643ea8Slogwang }
353a9643ea8Slogwang 
354a9643ea8Slogwang static int
sysvmsg_modload(struct module * module,int cmd,void * arg)355a9643ea8Slogwang sysvmsg_modload(struct module *module, int cmd, void *arg)
356a9643ea8Slogwang {
357a9643ea8Slogwang 	int error = 0;
358a9643ea8Slogwang 
359a9643ea8Slogwang 	switch (cmd) {
360a9643ea8Slogwang 	case MOD_LOAD:
361a9643ea8Slogwang 		error = msginit();
362a9643ea8Slogwang 		if (error != 0)
363a9643ea8Slogwang 			msgunload();
364a9643ea8Slogwang 		break;
365a9643ea8Slogwang 	case MOD_UNLOAD:
366a9643ea8Slogwang 		error = msgunload();
367a9643ea8Slogwang 		break;
368a9643ea8Slogwang 	case MOD_SHUTDOWN:
369a9643ea8Slogwang 		break;
370a9643ea8Slogwang 	default:
371a9643ea8Slogwang 		error = EINVAL;
372a9643ea8Slogwang 		break;
373a9643ea8Slogwang 	}
374a9643ea8Slogwang 	return (error);
375a9643ea8Slogwang }
376a9643ea8Slogwang 
377a9643ea8Slogwang static moduledata_t sysvmsg_mod = {
378a9643ea8Slogwang 	"sysvmsg",
379a9643ea8Slogwang 	&sysvmsg_modload,
380a9643ea8Slogwang 	NULL
381a9643ea8Slogwang };
382a9643ea8Slogwang 
383a9643ea8Slogwang DECLARE_MODULE(sysvmsg, sysvmsg_mod, SI_SUB_SYSV_MSG, SI_ORDER_FIRST);
384a9643ea8Slogwang MODULE_VERSION(sysvmsg, 1);
385a9643ea8Slogwang 
386a9643ea8Slogwang static void
msg_freehdr(struct msg * msghdr)387*22ce4affSfengbojiang msg_freehdr(struct msg *msghdr)
388a9643ea8Slogwang {
389a9643ea8Slogwang 	while (msghdr->msg_ts > 0) {
390a9643ea8Slogwang 		short next;
391a9643ea8Slogwang 		if (msghdr->msg_spot < 0 || msghdr->msg_spot >= msginfo.msgseg)
392a9643ea8Slogwang 			panic("msghdr->msg_spot out of range");
393a9643ea8Slogwang 		next = msgmaps[msghdr->msg_spot].next;
394a9643ea8Slogwang 		msgmaps[msghdr->msg_spot].next = free_msgmaps;
395a9643ea8Slogwang 		free_msgmaps = msghdr->msg_spot;
396a9643ea8Slogwang 		nfree_msgmaps++;
397a9643ea8Slogwang 		msghdr->msg_spot = next;
398a9643ea8Slogwang 		if (msghdr->msg_ts >= msginfo.msgssz)
399a9643ea8Slogwang 			msghdr->msg_ts -= msginfo.msgssz;
400a9643ea8Slogwang 		else
401a9643ea8Slogwang 			msghdr->msg_ts = 0;
402a9643ea8Slogwang 	}
403a9643ea8Slogwang 	if (msghdr->msg_spot != -1)
404a9643ea8Slogwang 		panic("msghdr->msg_spot != -1");
405a9643ea8Slogwang 	msghdr->msg_next = free_msghdrs;
406a9643ea8Slogwang 	free_msghdrs = msghdr;
407a9643ea8Slogwang #ifdef MAC
408a9643ea8Slogwang 	mac_sysvmsg_cleanup(msghdr);
409a9643ea8Slogwang #endif
410a9643ea8Slogwang }
411a9643ea8Slogwang 
412a9643ea8Slogwang static void
msq_remove(struct msqid_kernel * msqkptr)413a9643ea8Slogwang msq_remove(struct msqid_kernel *msqkptr)
414a9643ea8Slogwang {
415a9643ea8Slogwang 	struct msg *msghdr;
416a9643ea8Slogwang 
417a9643ea8Slogwang 	racct_sub_cred(msqkptr->cred, RACCT_NMSGQ, 1);
418a9643ea8Slogwang 	racct_sub_cred(msqkptr->cred, RACCT_MSGQQUEUED, msqkptr->u.msg_qnum);
419a9643ea8Slogwang 	racct_sub_cred(msqkptr->cred, RACCT_MSGQSIZE, msqkptr->u.msg_cbytes);
420a9643ea8Slogwang 	crfree(msqkptr->cred);
421a9643ea8Slogwang 	msqkptr->cred = NULL;
422a9643ea8Slogwang 
423a9643ea8Slogwang 	/* Free the message headers */
424*22ce4affSfengbojiang 	msghdr = msqkptr->u.__msg_first;
425a9643ea8Slogwang 	while (msghdr != NULL) {
426a9643ea8Slogwang 		struct msg *msghdr_tmp;
427a9643ea8Slogwang 
428a9643ea8Slogwang 		/* Free the segments of each message */
429a9643ea8Slogwang 		msqkptr->u.msg_cbytes -= msghdr->msg_ts;
430a9643ea8Slogwang 		msqkptr->u.msg_qnum--;
431a9643ea8Slogwang 		msghdr_tmp = msghdr;
432a9643ea8Slogwang 		msghdr = msghdr->msg_next;
433a9643ea8Slogwang 		msg_freehdr(msghdr_tmp);
434a9643ea8Slogwang 	}
435a9643ea8Slogwang 
436a9643ea8Slogwang 	if (msqkptr->u.msg_cbytes != 0)
437a9643ea8Slogwang 		panic("msg_cbytes is screwed up");
438a9643ea8Slogwang 	if (msqkptr->u.msg_qnum != 0)
439a9643ea8Slogwang 		panic("msg_qnum is screwed up");
440a9643ea8Slogwang 
441a9643ea8Slogwang 	msqkptr->u.msg_qbytes = 0;	/* Mark it as free */
442a9643ea8Slogwang 
443a9643ea8Slogwang #ifdef MAC
444a9643ea8Slogwang 	mac_sysvmsq_cleanup(msqkptr);
445a9643ea8Slogwang #endif
446a9643ea8Slogwang 
447a9643ea8Slogwang 	wakeup(msqkptr);
448a9643ea8Slogwang }
449a9643ea8Slogwang 
450a9643ea8Slogwang static struct prison *
msg_find_prison(struct ucred * cred)451a9643ea8Slogwang msg_find_prison(struct ucred *cred)
452a9643ea8Slogwang {
453a9643ea8Slogwang 	struct prison *pr, *rpr;
454a9643ea8Slogwang 
455a9643ea8Slogwang 	pr = cred->cr_prison;
456a9643ea8Slogwang 	prison_lock(pr);
457a9643ea8Slogwang 	rpr = osd_jail_get(pr, msg_prison_slot);
458a9643ea8Slogwang 	prison_unlock(pr);
459a9643ea8Slogwang 	return rpr;
460a9643ea8Slogwang }
461a9643ea8Slogwang 
462a9643ea8Slogwang static int
msq_prison_cansee(struct prison * rpr,struct msqid_kernel * msqkptr)463a9643ea8Slogwang msq_prison_cansee(struct prison *rpr, struct msqid_kernel *msqkptr)
464a9643ea8Slogwang {
465a9643ea8Slogwang 
466a9643ea8Slogwang 	if (msqkptr->cred == NULL ||
467a9643ea8Slogwang 	    !(rpr == msqkptr->cred->cr_prison ||
468a9643ea8Slogwang 	      prison_ischild(rpr, msqkptr->cred->cr_prison)))
469a9643ea8Slogwang 		return (EINVAL);
470a9643ea8Slogwang 	return (0);
471a9643ea8Slogwang }
472a9643ea8Slogwang 
473a9643ea8Slogwang #ifndef _SYS_SYSPROTO_H_
474a9643ea8Slogwang struct msgctl_args {
475a9643ea8Slogwang 	int	msqid;
476a9643ea8Slogwang 	int	cmd;
477a9643ea8Slogwang 	struct	msqid_ds *buf;
478a9643ea8Slogwang };
479a9643ea8Slogwang #endif
480a9643ea8Slogwang int
sys_msgctl(struct thread * td,struct msgctl_args * uap)481*22ce4affSfengbojiang sys_msgctl(struct thread *td, struct msgctl_args *uap)
482a9643ea8Slogwang {
483a9643ea8Slogwang 	int msqid = uap->msqid;
484a9643ea8Slogwang 	int cmd = uap->cmd;
485a9643ea8Slogwang 	struct msqid_ds msqbuf;
486a9643ea8Slogwang 	int error;
487a9643ea8Slogwang 
488a9643ea8Slogwang 	DPRINTF(("call to msgctl(%d, %d, %p)\n", msqid, cmd, uap->buf));
489a9643ea8Slogwang 	if (cmd == IPC_SET &&
490a9643ea8Slogwang 	    (error = copyin(uap->buf, &msqbuf, sizeof(msqbuf))) != 0)
491a9643ea8Slogwang 		return (error);
492a9643ea8Slogwang 	error = kern_msgctl(td, msqid, cmd, &msqbuf);
493a9643ea8Slogwang 	if (cmd == IPC_STAT && error == 0)
494a9643ea8Slogwang 		error = copyout(&msqbuf, uap->buf, sizeof(struct msqid_ds));
495a9643ea8Slogwang 	return (error);
496a9643ea8Slogwang }
497a9643ea8Slogwang 
498a9643ea8Slogwang int
kern_msgctl(struct thread * td,int msqid,int cmd,struct msqid_ds * msqbuf)499*22ce4affSfengbojiang kern_msgctl(struct thread *td, int msqid, int cmd, struct msqid_ds *msqbuf)
500a9643ea8Slogwang {
501a9643ea8Slogwang 	int rval, error, msqix;
502*22ce4affSfengbojiang 	struct msqid_kernel *msqkptr;
503a9643ea8Slogwang 	struct prison *rpr;
504a9643ea8Slogwang 
505a9643ea8Slogwang 	rpr = msg_find_prison(td->td_ucred);
506a9643ea8Slogwang 	if (rpr == NULL)
507a9643ea8Slogwang 		return (ENOSYS);
508a9643ea8Slogwang 
509*22ce4affSfengbojiang 	AUDIT_ARG_SVIPC_CMD(cmd);
510*22ce4affSfengbojiang 	AUDIT_ARG_SVIPC_ID(msqid);
511a9643ea8Slogwang 	msqix = IPCID_TO_IX(msqid);
512a9643ea8Slogwang 
513a9643ea8Slogwang 	if (msqix < 0 || msqix >= msginfo.msgmni) {
514a9643ea8Slogwang 		DPRINTF(("msqid (%d) out of range (0<=msqid<%d)\n", msqix,
515a9643ea8Slogwang 		    msginfo.msgmni));
516a9643ea8Slogwang 		return (EINVAL);
517a9643ea8Slogwang 	}
518a9643ea8Slogwang 
519a9643ea8Slogwang 	msqkptr = &msqids[msqix];
520a9643ea8Slogwang 
521a9643ea8Slogwang 	mtx_lock(&msq_mtx);
522a9643ea8Slogwang 	if (msqkptr->u.msg_qbytes == 0) {
523a9643ea8Slogwang 		DPRINTF(("no such msqid\n"));
524a9643ea8Slogwang 		error = EINVAL;
525a9643ea8Slogwang 		goto done2;
526a9643ea8Slogwang 	}
527a9643ea8Slogwang 	if (msqkptr->u.msg_perm.seq != IPCID_TO_SEQ(msqid)) {
528a9643ea8Slogwang 		DPRINTF(("wrong sequence number\n"));
529a9643ea8Slogwang 		error = EINVAL;
530a9643ea8Slogwang 		goto done2;
531a9643ea8Slogwang 	}
532a9643ea8Slogwang 
533a9643ea8Slogwang 	error = msq_prison_cansee(rpr, msqkptr);
534a9643ea8Slogwang 	if (error != 0) {
535a9643ea8Slogwang 		DPRINTF(("requester can't see prison\n"));
536a9643ea8Slogwang 		goto done2;
537a9643ea8Slogwang 	}
538a9643ea8Slogwang 
539a9643ea8Slogwang #ifdef MAC
540a9643ea8Slogwang 	error = mac_sysvmsq_check_msqctl(td->td_ucred, msqkptr, cmd);
541a9643ea8Slogwang 	if (error != 0)
542a9643ea8Slogwang 		goto done2;
543a9643ea8Slogwang #endif
544a9643ea8Slogwang 
545a9643ea8Slogwang 	error = 0;
546a9643ea8Slogwang 	rval = 0;
547a9643ea8Slogwang 
548a9643ea8Slogwang 	switch (cmd) {
549a9643ea8Slogwang 	case IPC_RMID:
550a9643ea8Slogwang 	{
551a9643ea8Slogwang #ifdef MAC
552a9643ea8Slogwang 		struct msg *msghdr;
553a9643ea8Slogwang #endif
554a9643ea8Slogwang 		if ((error = ipcperm(td, &msqkptr->u.msg_perm, IPC_M)))
555a9643ea8Slogwang 			goto done2;
556a9643ea8Slogwang 
557a9643ea8Slogwang #ifdef MAC
558a9643ea8Slogwang 		/*
559a9643ea8Slogwang 		 * Check that the thread has MAC access permissions to
560a9643ea8Slogwang 		 * individual msghdrs.  Note: We need to do this in a
561a9643ea8Slogwang 		 * separate loop because the actual loop alters the
562a9643ea8Slogwang 		 * msq/msghdr info as it progresses, and there is no going
563a9643ea8Slogwang 		 * back if half the way through we discover that the
564a9643ea8Slogwang 		 * thread cannot free a certain msghdr.  The msq will get
565a9643ea8Slogwang 		 * into an inconsistent state.
566a9643ea8Slogwang 		 */
567*22ce4affSfengbojiang 		for (msghdr = msqkptr->u.__msg_first; msghdr != NULL;
568a9643ea8Slogwang 		    msghdr = msghdr->msg_next) {
569a9643ea8Slogwang 			error = mac_sysvmsq_check_msgrmid(td->td_ucred, msghdr);
570a9643ea8Slogwang 			if (error != 0)
571a9643ea8Slogwang 				goto done2;
572a9643ea8Slogwang 		}
573a9643ea8Slogwang #endif
574a9643ea8Slogwang 
575a9643ea8Slogwang 		msq_remove(msqkptr);
576a9643ea8Slogwang 	}
577a9643ea8Slogwang 
578a9643ea8Slogwang 		break;
579a9643ea8Slogwang 
580a9643ea8Slogwang 	case IPC_SET:
581*22ce4affSfengbojiang 		AUDIT_ARG_SVIPC_PERM(&msqbuf->msg_perm);
582a9643ea8Slogwang 		if ((error = ipcperm(td, &msqkptr->u.msg_perm, IPC_M)))
583a9643ea8Slogwang 			goto done2;
584a9643ea8Slogwang 		if (msqbuf->msg_qbytes > msqkptr->u.msg_qbytes) {
585a9643ea8Slogwang 			error = priv_check(td, PRIV_IPC_MSGSIZE);
586a9643ea8Slogwang 			if (error)
587a9643ea8Slogwang 				goto done2;
588a9643ea8Slogwang 		}
589a9643ea8Slogwang 		if (msqbuf->msg_qbytes > msginfo.msgmnb) {
590a9643ea8Slogwang 			DPRINTF(("can't increase msg_qbytes beyond %d"
591a9643ea8Slogwang 			    "(truncating)\n", msginfo.msgmnb));
592a9643ea8Slogwang 			msqbuf->msg_qbytes = msginfo.msgmnb;	/* silently restrict qbytes to system limit */
593a9643ea8Slogwang 		}
594a9643ea8Slogwang 		if (msqbuf->msg_qbytes == 0) {
595a9643ea8Slogwang 			DPRINTF(("can't reduce msg_qbytes to 0\n"));
596a9643ea8Slogwang 			error = EINVAL;		/* non-standard errno! */
597a9643ea8Slogwang 			goto done2;
598a9643ea8Slogwang 		}
599a9643ea8Slogwang 		msqkptr->u.msg_perm.uid = msqbuf->msg_perm.uid;	/* change the owner */
600a9643ea8Slogwang 		msqkptr->u.msg_perm.gid = msqbuf->msg_perm.gid;	/* change the owner */
601a9643ea8Slogwang 		msqkptr->u.msg_perm.mode = (msqkptr->u.msg_perm.mode & ~0777) |
602a9643ea8Slogwang 		    (msqbuf->msg_perm.mode & 0777);
603a9643ea8Slogwang 		msqkptr->u.msg_qbytes = msqbuf->msg_qbytes;
604a9643ea8Slogwang 		msqkptr->u.msg_ctime = time_second;
605a9643ea8Slogwang 		break;
606a9643ea8Slogwang 
607a9643ea8Slogwang 	case IPC_STAT:
608a9643ea8Slogwang 		if ((error = ipcperm(td, &msqkptr->u.msg_perm, IPC_R))) {
609a9643ea8Slogwang 			DPRINTF(("requester doesn't have read access\n"));
610a9643ea8Slogwang 			goto done2;
611a9643ea8Slogwang 		}
612a9643ea8Slogwang 		*msqbuf = msqkptr->u;
613a9643ea8Slogwang 		if (td->td_ucred->cr_prison != msqkptr->cred->cr_prison)
614a9643ea8Slogwang 			msqbuf->msg_perm.key = IPC_PRIVATE;
615*22ce4affSfengbojiang 
616*22ce4affSfengbojiang 		/*
617*22ce4affSfengbojiang 		 * Try to hide the fact that the structure layout is shared by
618*22ce4affSfengbojiang 		 * both the kernel and userland.  These pointers are not useful
619*22ce4affSfengbojiang 		 * to userspace.
620*22ce4affSfengbojiang 		 */
621*22ce4affSfengbojiang 		msqbuf->__msg_first = msqbuf->__msg_last = NULL;
622a9643ea8Slogwang 		break;
623a9643ea8Slogwang 
624a9643ea8Slogwang 	default:
625a9643ea8Slogwang 		DPRINTF(("invalid command %d\n", cmd));
626a9643ea8Slogwang 		error = EINVAL;
627a9643ea8Slogwang 		goto done2;
628a9643ea8Slogwang 	}
629a9643ea8Slogwang 
630a9643ea8Slogwang 	if (error == 0)
631a9643ea8Slogwang 		td->td_retval[0] = rval;
632a9643ea8Slogwang done2:
633a9643ea8Slogwang 	mtx_unlock(&msq_mtx);
634a9643ea8Slogwang 	return (error);
635a9643ea8Slogwang }
636a9643ea8Slogwang 
637a9643ea8Slogwang #ifndef _SYS_SYSPROTO_H_
638a9643ea8Slogwang struct msgget_args {
639a9643ea8Slogwang 	key_t	key;
640a9643ea8Slogwang 	int	msgflg;
641a9643ea8Slogwang };
642a9643ea8Slogwang #endif
643a9643ea8Slogwang 
644a9643ea8Slogwang int
sys_msgget(struct thread * td,struct msgget_args * uap)645*22ce4affSfengbojiang sys_msgget(struct thread *td, struct msgget_args *uap)
646a9643ea8Slogwang {
647a9643ea8Slogwang 	int msqid, error = 0;
648a9643ea8Slogwang 	int key = uap->key;
649a9643ea8Slogwang 	int msgflg = uap->msgflg;
650a9643ea8Slogwang 	struct ucred *cred = td->td_ucred;
651*22ce4affSfengbojiang 	struct msqid_kernel *msqkptr = NULL;
652a9643ea8Slogwang 
653a9643ea8Slogwang 	DPRINTF(("msgget(0x%x, 0%o)\n", key, msgflg));
654a9643ea8Slogwang 
655a9643ea8Slogwang 	if (msg_find_prison(cred) == NULL)
656a9643ea8Slogwang 		return (ENOSYS);
657a9643ea8Slogwang 
658a9643ea8Slogwang 	mtx_lock(&msq_mtx);
659a9643ea8Slogwang 	if (key != IPC_PRIVATE) {
660a9643ea8Slogwang 		for (msqid = 0; msqid < msginfo.msgmni; msqid++) {
661a9643ea8Slogwang 			msqkptr = &msqids[msqid];
662a9643ea8Slogwang 			if (msqkptr->u.msg_qbytes != 0 &&
663a9643ea8Slogwang 			    msqkptr->cred != NULL &&
664a9643ea8Slogwang 			    msqkptr->cred->cr_prison == cred->cr_prison &&
665a9643ea8Slogwang 			    msqkptr->u.msg_perm.key == key)
666a9643ea8Slogwang 				break;
667a9643ea8Slogwang 		}
668a9643ea8Slogwang 		if (msqid < msginfo.msgmni) {
669a9643ea8Slogwang 			DPRINTF(("found public key\n"));
670a9643ea8Slogwang 			if ((msgflg & IPC_CREAT) && (msgflg & IPC_EXCL)) {
671a9643ea8Slogwang 				DPRINTF(("not exclusive\n"));
672a9643ea8Slogwang 				error = EEXIST;
673a9643ea8Slogwang 				goto done2;
674a9643ea8Slogwang 			}
675*22ce4affSfengbojiang 			AUDIT_ARG_SVIPC_ID(IXSEQ_TO_IPCID(msqid,
676*22ce4affSfengbojiang 			    msqkptr->u.msg_perm));
677a9643ea8Slogwang 			if ((error = ipcperm(td, &msqkptr->u.msg_perm,
678a9643ea8Slogwang 			    msgflg & 0700))) {
679a9643ea8Slogwang 				DPRINTF(("requester doesn't have 0%o access\n",
680a9643ea8Slogwang 				    msgflg & 0700));
681a9643ea8Slogwang 				goto done2;
682a9643ea8Slogwang 			}
683a9643ea8Slogwang #ifdef MAC
684a9643ea8Slogwang 			error = mac_sysvmsq_check_msqget(cred, msqkptr);
685a9643ea8Slogwang 			if (error != 0)
686a9643ea8Slogwang 				goto done2;
687a9643ea8Slogwang #endif
688a9643ea8Slogwang 			goto found;
689a9643ea8Slogwang 		}
690a9643ea8Slogwang 	}
691a9643ea8Slogwang 
692a9643ea8Slogwang 	DPRINTF(("need to allocate the msqid_ds\n"));
693a9643ea8Slogwang 	if (key == IPC_PRIVATE || (msgflg & IPC_CREAT)) {
694a9643ea8Slogwang 		for (msqid = 0; msqid < msginfo.msgmni; msqid++) {
695a9643ea8Slogwang 			/*
696a9643ea8Slogwang 			 * Look for an unallocated and unlocked msqid_ds.
697a9643ea8Slogwang 			 * msqid_ds's can be locked by msgsnd or msgrcv while
698a9643ea8Slogwang 			 * they are copying the message in/out.  We can't
699a9643ea8Slogwang 			 * re-use the entry until they release it.
700a9643ea8Slogwang 			 */
701a9643ea8Slogwang 			msqkptr = &msqids[msqid];
702a9643ea8Slogwang 			if (msqkptr->u.msg_qbytes == 0 &&
703a9643ea8Slogwang 			    (msqkptr->u.msg_perm.mode & MSG_LOCKED) == 0)
704a9643ea8Slogwang 				break;
705a9643ea8Slogwang 		}
706a9643ea8Slogwang 		if (msqid == msginfo.msgmni) {
707a9643ea8Slogwang 			DPRINTF(("no more msqid_ds's available\n"));
708a9643ea8Slogwang 			error = ENOSPC;
709a9643ea8Slogwang 			goto done2;
710a9643ea8Slogwang 		}
711a9643ea8Slogwang #ifdef RACCT
712a9643ea8Slogwang 		if (racct_enable) {
713a9643ea8Slogwang 			PROC_LOCK(td->td_proc);
714a9643ea8Slogwang 			error = racct_add(td->td_proc, RACCT_NMSGQ, 1);
715a9643ea8Slogwang 			PROC_UNLOCK(td->td_proc);
716a9643ea8Slogwang 			if (error != 0) {
717a9643ea8Slogwang 				error = ENOSPC;
718a9643ea8Slogwang 				goto done2;
719a9643ea8Slogwang 			}
720a9643ea8Slogwang 		}
721a9643ea8Slogwang #endif
722a9643ea8Slogwang 		DPRINTF(("msqid %d is available\n", msqid));
723a9643ea8Slogwang 		msqkptr->u.msg_perm.key = key;
724a9643ea8Slogwang 		msqkptr->u.msg_perm.cuid = cred->cr_uid;
725a9643ea8Slogwang 		msqkptr->u.msg_perm.uid = cred->cr_uid;
726a9643ea8Slogwang 		msqkptr->u.msg_perm.cgid = cred->cr_gid;
727a9643ea8Slogwang 		msqkptr->u.msg_perm.gid = cred->cr_gid;
728a9643ea8Slogwang 		msqkptr->u.msg_perm.mode = (msgflg & 0777);
729a9643ea8Slogwang 		msqkptr->cred = crhold(cred);
730a9643ea8Slogwang 		/* Make sure that the returned msqid is unique */
731a9643ea8Slogwang 		msqkptr->u.msg_perm.seq = (msqkptr->u.msg_perm.seq + 1) & 0x7fff;
732*22ce4affSfengbojiang 		msqkptr->u.__msg_first = NULL;
733*22ce4affSfengbojiang 		msqkptr->u.__msg_last = NULL;
734a9643ea8Slogwang 		msqkptr->u.msg_cbytes = 0;
735a9643ea8Slogwang 		msqkptr->u.msg_qnum = 0;
736a9643ea8Slogwang 		msqkptr->u.msg_qbytes = msginfo.msgmnb;
737a9643ea8Slogwang 		msqkptr->u.msg_lspid = 0;
738a9643ea8Slogwang 		msqkptr->u.msg_lrpid = 0;
739a9643ea8Slogwang 		msqkptr->u.msg_stime = 0;
740a9643ea8Slogwang 		msqkptr->u.msg_rtime = 0;
741a9643ea8Slogwang 		msqkptr->u.msg_ctime = time_second;
742a9643ea8Slogwang #ifdef MAC
743a9643ea8Slogwang 		mac_sysvmsq_create(cred, msqkptr);
744a9643ea8Slogwang #endif
745*22ce4affSfengbojiang 		AUDIT_ARG_SVIPC_PERM(&msqkptr->u.msg_perm);
746a9643ea8Slogwang 	} else {
747a9643ea8Slogwang 		DPRINTF(("didn't find it and wasn't asked to create it\n"));
748a9643ea8Slogwang 		error = ENOENT;
749a9643ea8Slogwang 		goto done2;
750a9643ea8Slogwang 	}
751a9643ea8Slogwang 
752a9643ea8Slogwang found:
753a9643ea8Slogwang 	/* Construct the unique msqid */
754a9643ea8Slogwang 	td->td_retval[0] = IXSEQ_TO_IPCID(msqid, msqkptr->u.msg_perm);
755a9643ea8Slogwang done2:
756a9643ea8Slogwang 	mtx_unlock(&msq_mtx);
757a9643ea8Slogwang 	return (error);
758a9643ea8Slogwang }
759a9643ea8Slogwang 
#ifndef _SYS_SYSPROTO_H_
/*
 * Argument block handed to sys_msgsnd().  Only declared here when
 * <sys/sysproto.h> has not already provided it.
 */
struct msgsnd_args {
	int		msqid;	/* queue identifier */
	const void	*msgp;	/* user buffer: a long mtype, then the text */
	size_t		msgsz;	/* length of the text that follows mtype */
	int		msgflg;	/* flags, e.g. IPC_NOWAIT */
};
#endif
768a9643ea8Slogwang int
kern_msgsnd(struct thread * td,int msqid,const void * msgp,size_t msgsz,int msgflg,long mtype)769*22ce4affSfengbojiang kern_msgsnd(struct thread *td, int msqid, const void *msgp,
770*22ce4affSfengbojiang     size_t msgsz, int msgflg, long mtype)
771a9643ea8Slogwang {
772a9643ea8Slogwang 	int msqix, segs_needed, error = 0;
773*22ce4affSfengbojiang 	struct msqid_kernel *msqkptr;
774*22ce4affSfengbojiang 	struct msg *msghdr;
775a9643ea8Slogwang 	struct prison *rpr;
776a9643ea8Slogwang 	short next;
777a9643ea8Slogwang #ifdef RACCT
778*22ce4affSfengbojiang 	size_t saved_msgsz = 0;
779a9643ea8Slogwang #endif
780a9643ea8Slogwang 
781a9643ea8Slogwang 	rpr = msg_find_prison(td->td_ucred);
782a9643ea8Slogwang 	if (rpr == NULL)
783a9643ea8Slogwang 		return (ENOSYS);
784a9643ea8Slogwang 
785a9643ea8Slogwang 	mtx_lock(&msq_mtx);
786*22ce4affSfengbojiang 	AUDIT_ARG_SVIPC_ID(msqid);
787a9643ea8Slogwang 	msqix = IPCID_TO_IX(msqid);
788a9643ea8Slogwang 
789a9643ea8Slogwang 	if (msqix < 0 || msqix >= msginfo.msgmni) {
790a9643ea8Slogwang 		DPRINTF(("msqid (%d) out of range (0<=msqid<%d)\n", msqix,
791a9643ea8Slogwang 		    msginfo.msgmni));
792a9643ea8Slogwang 		error = EINVAL;
793a9643ea8Slogwang 		goto done2;
794a9643ea8Slogwang 	}
795a9643ea8Slogwang 
796a9643ea8Slogwang 	msqkptr = &msqids[msqix];
797*22ce4affSfengbojiang 	AUDIT_ARG_SVIPC_PERM(&msqkptr->u.msg_perm);
798a9643ea8Slogwang 	if (msqkptr->u.msg_qbytes == 0) {
799a9643ea8Slogwang 		DPRINTF(("no such message queue id\n"));
800a9643ea8Slogwang 		error = EINVAL;
801a9643ea8Slogwang 		goto done2;
802a9643ea8Slogwang 	}
803a9643ea8Slogwang 	if (msqkptr->u.msg_perm.seq != IPCID_TO_SEQ(msqid)) {
804a9643ea8Slogwang 		DPRINTF(("wrong sequence number\n"));
805a9643ea8Slogwang 		error = EINVAL;
806a9643ea8Slogwang 		goto done2;
807a9643ea8Slogwang 	}
808a9643ea8Slogwang 
809a9643ea8Slogwang 	if ((error = msq_prison_cansee(rpr, msqkptr))) {
810a9643ea8Slogwang 		DPRINTF(("requester can't see prison\n"));
811a9643ea8Slogwang 		goto done2;
812a9643ea8Slogwang 	}
813a9643ea8Slogwang 
814a9643ea8Slogwang 	if ((error = ipcperm(td, &msqkptr->u.msg_perm, IPC_W))) {
815a9643ea8Slogwang 		DPRINTF(("requester doesn't have write access\n"));
816a9643ea8Slogwang 		goto done2;
817a9643ea8Slogwang 	}
818a9643ea8Slogwang 
819a9643ea8Slogwang #ifdef MAC
820a9643ea8Slogwang 	error = mac_sysvmsq_check_msqsnd(td->td_ucred, msqkptr);
821a9643ea8Slogwang 	if (error != 0)
822a9643ea8Slogwang 		goto done2;
823a9643ea8Slogwang #endif
824a9643ea8Slogwang 
825a9643ea8Slogwang #ifdef RACCT
826a9643ea8Slogwang 	if (racct_enable) {
827a9643ea8Slogwang 		PROC_LOCK(td->td_proc);
828a9643ea8Slogwang 		if (racct_add(td->td_proc, RACCT_MSGQQUEUED, 1)) {
829a9643ea8Slogwang 			PROC_UNLOCK(td->td_proc);
830a9643ea8Slogwang 			error = EAGAIN;
831a9643ea8Slogwang 			goto done2;
832a9643ea8Slogwang 		}
833a9643ea8Slogwang 		saved_msgsz = msgsz;
834a9643ea8Slogwang 		if (racct_add(td->td_proc, RACCT_MSGQSIZE, msgsz)) {
835a9643ea8Slogwang 			racct_sub(td->td_proc, RACCT_MSGQQUEUED, 1);
836a9643ea8Slogwang 			PROC_UNLOCK(td->td_proc);
837a9643ea8Slogwang 			error = EAGAIN;
838a9643ea8Slogwang 			goto done2;
839a9643ea8Slogwang 		}
840a9643ea8Slogwang 		PROC_UNLOCK(td->td_proc);
841a9643ea8Slogwang 	}
842a9643ea8Slogwang #endif
843a9643ea8Slogwang 
844a9643ea8Slogwang 	segs_needed = howmany(msgsz, msginfo.msgssz);
845a9643ea8Slogwang 	DPRINTF(("msgsz=%zu, msgssz=%d, segs_needed=%d\n", msgsz,
846a9643ea8Slogwang 	    msginfo.msgssz, segs_needed));
847a9643ea8Slogwang 	for (;;) {
848a9643ea8Slogwang 		int need_more_resources = 0;
849a9643ea8Slogwang 
850a9643ea8Slogwang 		/*
851a9643ea8Slogwang 		 * check msgsz
852a9643ea8Slogwang 		 * (inside this loop in case msg_qbytes changes while we sleep)
853a9643ea8Slogwang 		 */
854a9643ea8Slogwang 
855a9643ea8Slogwang 		if (msgsz > msqkptr->u.msg_qbytes) {
856a9643ea8Slogwang 			DPRINTF(("msgsz > msqkptr->u.msg_qbytes\n"));
857a9643ea8Slogwang 			error = EINVAL;
858a9643ea8Slogwang 			goto done3;
859a9643ea8Slogwang 		}
860a9643ea8Slogwang 
861a9643ea8Slogwang 		if (msqkptr->u.msg_perm.mode & MSG_LOCKED) {
862a9643ea8Slogwang 			DPRINTF(("msqid is locked\n"));
863a9643ea8Slogwang 			need_more_resources = 1;
864a9643ea8Slogwang 		}
865a9643ea8Slogwang 		if (msgsz + msqkptr->u.msg_cbytes > msqkptr->u.msg_qbytes) {
866a9643ea8Slogwang 			DPRINTF(("msgsz + msg_cbytes > msg_qbytes\n"));
867a9643ea8Slogwang 			need_more_resources = 1;
868a9643ea8Slogwang 		}
869a9643ea8Slogwang 		if (segs_needed > nfree_msgmaps) {
870a9643ea8Slogwang 			DPRINTF(("segs_needed > nfree_msgmaps\n"));
871a9643ea8Slogwang 			need_more_resources = 1;
872a9643ea8Slogwang 		}
873a9643ea8Slogwang 		if (free_msghdrs == NULL) {
874a9643ea8Slogwang 			DPRINTF(("no more msghdrs\n"));
875a9643ea8Slogwang 			need_more_resources = 1;
876a9643ea8Slogwang 		}
877a9643ea8Slogwang 
878a9643ea8Slogwang 		if (need_more_resources) {
879a9643ea8Slogwang 			int we_own_it;
880a9643ea8Slogwang 
881a9643ea8Slogwang 			if ((msgflg & IPC_NOWAIT) != 0) {
882a9643ea8Slogwang 				DPRINTF(("need more resources but caller "
883a9643ea8Slogwang 				    "doesn't want to wait\n"));
884a9643ea8Slogwang 				error = EAGAIN;
885a9643ea8Slogwang 				goto done3;
886a9643ea8Slogwang 			}
887a9643ea8Slogwang 
888a9643ea8Slogwang 			if ((msqkptr->u.msg_perm.mode & MSG_LOCKED) != 0) {
889a9643ea8Slogwang 				DPRINTF(("we don't own the msqid_ds\n"));
890a9643ea8Slogwang 				we_own_it = 0;
891a9643ea8Slogwang 			} else {
892a9643ea8Slogwang 				/* Force later arrivals to wait for our
893a9643ea8Slogwang 				   request */
894a9643ea8Slogwang 				DPRINTF(("we own the msqid_ds\n"));
895a9643ea8Slogwang 				msqkptr->u.msg_perm.mode |= MSG_LOCKED;
896a9643ea8Slogwang 				we_own_it = 1;
897a9643ea8Slogwang 			}
898a9643ea8Slogwang 			DPRINTF(("msgsnd:  goodnight\n"));
899a9643ea8Slogwang 			error = msleep(msqkptr, &msq_mtx, (PZERO - 4) | PCATCH,
900a9643ea8Slogwang 			    "msgsnd", hz);
901a9643ea8Slogwang 			DPRINTF(("msgsnd:  good morning, error=%d\n", error));
902a9643ea8Slogwang 			if (we_own_it)
903a9643ea8Slogwang 				msqkptr->u.msg_perm.mode &= ~MSG_LOCKED;
904a9643ea8Slogwang 			if (error == EWOULDBLOCK) {
905a9643ea8Slogwang 				DPRINTF(("msgsnd:  timed out\n"));
906a9643ea8Slogwang 				continue;
907a9643ea8Slogwang 			}
908a9643ea8Slogwang 			if (error != 0) {
909a9643ea8Slogwang 				DPRINTF(("msgsnd:  interrupted system call\n"));
910a9643ea8Slogwang 				error = EINTR;
911a9643ea8Slogwang 				goto done3;
912a9643ea8Slogwang 			}
913a9643ea8Slogwang 
914a9643ea8Slogwang 			/*
915a9643ea8Slogwang 			 * Make sure that the msq queue still exists
916a9643ea8Slogwang 			 */
917a9643ea8Slogwang 
918a9643ea8Slogwang 			if (msqkptr->u.msg_qbytes == 0) {
919a9643ea8Slogwang 				DPRINTF(("msqid deleted\n"));
920a9643ea8Slogwang 				error = EIDRM;
921a9643ea8Slogwang 				goto done3;
922a9643ea8Slogwang 			}
923a9643ea8Slogwang 
924a9643ea8Slogwang 		} else {
925a9643ea8Slogwang 			DPRINTF(("got all the resources that we need\n"));
926a9643ea8Slogwang 			break;
927a9643ea8Slogwang 		}
928a9643ea8Slogwang 	}
929a9643ea8Slogwang 
930a9643ea8Slogwang 	/*
931a9643ea8Slogwang 	 * We have the resources that we need.
932a9643ea8Slogwang 	 * Make sure!
933a9643ea8Slogwang 	 */
934a9643ea8Slogwang 
935a9643ea8Slogwang 	if (msqkptr->u.msg_perm.mode & MSG_LOCKED)
936a9643ea8Slogwang 		panic("msg_perm.mode & MSG_LOCKED");
937a9643ea8Slogwang 	if (segs_needed > nfree_msgmaps)
938a9643ea8Slogwang 		panic("segs_needed > nfree_msgmaps");
939a9643ea8Slogwang 	if (msgsz + msqkptr->u.msg_cbytes > msqkptr->u.msg_qbytes)
940a9643ea8Slogwang 		panic("msgsz + msg_cbytes > msg_qbytes");
941a9643ea8Slogwang 	if (free_msghdrs == NULL)
942a9643ea8Slogwang 		panic("no more msghdrs");
943a9643ea8Slogwang 
944a9643ea8Slogwang 	/*
945a9643ea8Slogwang 	 * Re-lock the msqid_ds in case we page-fault when copying in the
946a9643ea8Slogwang 	 * message
947a9643ea8Slogwang 	 */
948a9643ea8Slogwang 
949a9643ea8Slogwang 	if ((msqkptr->u.msg_perm.mode & MSG_LOCKED) != 0)
950a9643ea8Slogwang 		panic("msqid_ds is already locked");
951a9643ea8Slogwang 	msqkptr->u.msg_perm.mode |= MSG_LOCKED;
952a9643ea8Slogwang 
953a9643ea8Slogwang 	/*
954a9643ea8Slogwang 	 * Allocate a message header
955a9643ea8Slogwang 	 */
956a9643ea8Slogwang 
957a9643ea8Slogwang 	msghdr = free_msghdrs;
958a9643ea8Slogwang 	free_msghdrs = msghdr->msg_next;
959a9643ea8Slogwang 	msghdr->msg_spot = -1;
960a9643ea8Slogwang 	msghdr->msg_ts = msgsz;
961a9643ea8Slogwang 	msghdr->msg_type = mtype;
962a9643ea8Slogwang #ifdef MAC
963a9643ea8Slogwang 	/*
964a9643ea8Slogwang 	 * XXXMAC: Should the mac_sysvmsq_check_msgmsq check follow here
965a9643ea8Slogwang 	 * immediately?  Or, should it be checked just before the msg is
966a9643ea8Slogwang 	 * enqueued in the msgq (as it is done now)?
967a9643ea8Slogwang 	 */
968a9643ea8Slogwang 	mac_sysvmsg_create(td->td_ucred, msqkptr, msghdr);
969a9643ea8Slogwang #endif
970a9643ea8Slogwang 
971a9643ea8Slogwang 	/*
972a9643ea8Slogwang 	 * Allocate space for the message
973a9643ea8Slogwang 	 */
974a9643ea8Slogwang 
975a9643ea8Slogwang 	while (segs_needed > 0) {
976a9643ea8Slogwang 		if (nfree_msgmaps <= 0)
977a9643ea8Slogwang 			panic("not enough msgmaps");
978a9643ea8Slogwang 		if (free_msgmaps == -1)
979a9643ea8Slogwang 			panic("nil free_msgmaps");
980a9643ea8Slogwang 		next = free_msgmaps;
981a9643ea8Slogwang 		if (next <= -1)
982a9643ea8Slogwang 			panic("next too low #1");
983a9643ea8Slogwang 		if (next >= msginfo.msgseg)
984a9643ea8Slogwang 			panic("next out of range #1");
985a9643ea8Slogwang 		DPRINTF(("allocating segment %d to message\n", next));
986a9643ea8Slogwang 		free_msgmaps = msgmaps[next].next;
987a9643ea8Slogwang 		nfree_msgmaps--;
988a9643ea8Slogwang 		msgmaps[next].next = msghdr->msg_spot;
989a9643ea8Slogwang 		msghdr->msg_spot = next;
990a9643ea8Slogwang 		segs_needed--;
991a9643ea8Slogwang 	}
992a9643ea8Slogwang 
993a9643ea8Slogwang 	/*
994a9643ea8Slogwang 	 * Validate the message type
995a9643ea8Slogwang 	 */
996a9643ea8Slogwang 
997a9643ea8Slogwang 	if (msghdr->msg_type < 1) {
998a9643ea8Slogwang 		msg_freehdr(msghdr);
999a9643ea8Slogwang 		msqkptr->u.msg_perm.mode &= ~MSG_LOCKED;
1000a9643ea8Slogwang 		wakeup(msqkptr);
1001a9643ea8Slogwang 		DPRINTF(("mtype (%ld) < 1\n", msghdr->msg_type));
1002a9643ea8Slogwang 		error = EINVAL;
1003a9643ea8Slogwang 		goto done3;
1004a9643ea8Slogwang 	}
1005a9643ea8Slogwang 
1006a9643ea8Slogwang 	/*
1007a9643ea8Slogwang 	 * Copy in the message body
1008a9643ea8Slogwang 	 */
1009a9643ea8Slogwang 
1010a9643ea8Slogwang 	next = msghdr->msg_spot;
1011a9643ea8Slogwang 	while (msgsz > 0) {
1012a9643ea8Slogwang 		size_t tlen;
1013a9643ea8Slogwang 		if (msgsz > msginfo.msgssz)
1014a9643ea8Slogwang 			tlen = msginfo.msgssz;
1015a9643ea8Slogwang 		else
1016a9643ea8Slogwang 			tlen = msgsz;
1017a9643ea8Slogwang 		if (next <= -1)
1018a9643ea8Slogwang 			panic("next too low #2");
1019a9643ea8Slogwang 		if (next >= msginfo.msgseg)
1020a9643ea8Slogwang 			panic("next out of range #2");
1021a9643ea8Slogwang 		mtx_unlock(&msq_mtx);
1022a9643ea8Slogwang 		if ((error = copyin(msgp, &msgpool[next * msginfo.msgssz],
1023a9643ea8Slogwang 		    tlen)) != 0) {
1024a9643ea8Slogwang 			mtx_lock(&msq_mtx);
1025a9643ea8Slogwang 			DPRINTF(("error %d copying in message segment\n",
1026a9643ea8Slogwang 			    error));
1027a9643ea8Slogwang 			msg_freehdr(msghdr);
1028a9643ea8Slogwang 			msqkptr->u.msg_perm.mode &= ~MSG_LOCKED;
1029a9643ea8Slogwang 			wakeup(msqkptr);
1030a9643ea8Slogwang 			goto done3;
1031a9643ea8Slogwang 		}
1032a9643ea8Slogwang 		mtx_lock(&msq_mtx);
1033a9643ea8Slogwang 		msgsz -= tlen;
1034a9643ea8Slogwang 		msgp = (const char *)msgp + tlen;
1035a9643ea8Slogwang 		next = msgmaps[next].next;
1036a9643ea8Slogwang 	}
1037a9643ea8Slogwang 	if (next != -1)
1038a9643ea8Slogwang 		panic("didn't use all the msg segments");
1039a9643ea8Slogwang 
1040a9643ea8Slogwang 	/*
1041a9643ea8Slogwang 	 * We've got the message.  Unlock the msqid_ds.
1042a9643ea8Slogwang 	 */
1043a9643ea8Slogwang 
1044a9643ea8Slogwang 	msqkptr->u.msg_perm.mode &= ~MSG_LOCKED;
1045a9643ea8Slogwang 
1046a9643ea8Slogwang 	/*
1047a9643ea8Slogwang 	 * Make sure that the msqid_ds is still allocated.
1048a9643ea8Slogwang 	 */
1049a9643ea8Slogwang 
1050a9643ea8Slogwang 	if (msqkptr->u.msg_qbytes == 0) {
1051a9643ea8Slogwang 		msg_freehdr(msghdr);
1052a9643ea8Slogwang 		wakeup(msqkptr);
1053a9643ea8Slogwang 		error = EIDRM;
1054a9643ea8Slogwang 		goto done3;
1055a9643ea8Slogwang 	}
1056a9643ea8Slogwang 
1057a9643ea8Slogwang #ifdef MAC
1058a9643ea8Slogwang 	/*
1059a9643ea8Slogwang 	 * Note: Since the task/thread allocates the msghdr and usually
1060a9643ea8Slogwang 	 * primes it with its own MAC label, for a majority of policies, it
1061a9643ea8Slogwang 	 * won't be necessary to check whether the msghdr has access
1062a9643ea8Slogwang 	 * permissions to the msgq.  The mac_sysvmsq_check_msqsnd check would
1063a9643ea8Slogwang 	 * suffice in that case.  However, this hook may be required where
1064a9643ea8Slogwang 	 * individual policies derive a non-identical label for the msghdr
1065a9643ea8Slogwang 	 * from the current thread label and may want to check the msghdr
1066a9643ea8Slogwang 	 * enqueue permissions, along with read/write permissions to the
1067a9643ea8Slogwang 	 * msgq.
1068a9643ea8Slogwang 	 */
1069a9643ea8Slogwang 	error = mac_sysvmsq_check_msgmsq(td->td_ucred, msghdr, msqkptr);
1070a9643ea8Slogwang 	if (error != 0) {
1071a9643ea8Slogwang 		msg_freehdr(msghdr);
1072a9643ea8Slogwang 		wakeup(msqkptr);
1073a9643ea8Slogwang 		goto done3;
1074a9643ea8Slogwang 	}
1075a9643ea8Slogwang #endif
1076a9643ea8Slogwang 
1077a9643ea8Slogwang 	/*
1078a9643ea8Slogwang 	 * Put the message into the queue
1079a9643ea8Slogwang 	 */
1080*22ce4affSfengbojiang 	if (msqkptr->u.__msg_first == NULL) {
1081*22ce4affSfengbojiang 		msqkptr->u.__msg_first = msghdr;
1082*22ce4affSfengbojiang 		msqkptr->u.__msg_last = msghdr;
1083a9643ea8Slogwang 	} else {
1084*22ce4affSfengbojiang 		msqkptr->u.__msg_last->msg_next = msghdr;
1085*22ce4affSfengbojiang 		msqkptr->u.__msg_last = msghdr;
1086a9643ea8Slogwang 	}
1087*22ce4affSfengbojiang 	msqkptr->u.__msg_last->msg_next = NULL;
1088a9643ea8Slogwang 
1089a9643ea8Slogwang 	msqkptr->u.msg_cbytes += msghdr->msg_ts;
1090a9643ea8Slogwang 	msqkptr->u.msg_qnum++;
1091a9643ea8Slogwang 	msqkptr->u.msg_lspid = td->td_proc->p_pid;
1092a9643ea8Slogwang 	msqkptr->u.msg_stime = time_second;
1093a9643ea8Slogwang 
1094a9643ea8Slogwang 	wakeup(msqkptr);
1095a9643ea8Slogwang 	td->td_retval[0] = 0;
1096a9643ea8Slogwang done3:
1097a9643ea8Slogwang #ifdef RACCT
1098a9643ea8Slogwang 	if (racct_enable && error != 0) {
1099a9643ea8Slogwang 		PROC_LOCK(td->td_proc);
1100a9643ea8Slogwang 		racct_sub(td->td_proc, RACCT_MSGQQUEUED, 1);
1101a9643ea8Slogwang 		racct_sub(td->td_proc, RACCT_MSGQSIZE, saved_msgsz);
1102a9643ea8Slogwang 		PROC_UNLOCK(td->td_proc);
1103a9643ea8Slogwang 	}
1104a9643ea8Slogwang #endif
1105a9643ea8Slogwang done2:
1106a9643ea8Slogwang 	mtx_unlock(&msq_mtx);
1107a9643ea8Slogwang 	return (error);
1108a9643ea8Slogwang }
1109a9643ea8Slogwang 
1110a9643ea8Slogwang int
sys_msgsnd(struct thread * td,struct msgsnd_args * uap)1111*22ce4affSfengbojiang sys_msgsnd(struct thread *td, struct msgsnd_args *uap)
1112a9643ea8Slogwang {
1113a9643ea8Slogwang 	int error;
1114a9643ea8Slogwang 	long mtype;
1115a9643ea8Slogwang 
1116a9643ea8Slogwang 	DPRINTF(("call to msgsnd(%d, %p, %zu, %d)\n", uap->msqid, uap->msgp,
1117a9643ea8Slogwang 	    uap->msgsz, uap->msgflg));
1118a9643ea8Slogwang 
1119a9643ea8Slogwang 	if ((error = copyin(uap->msgp, &mtype, sizeof(mtype))) != 0) {
1120a9643ea8Slogwang 		DPRINTF(("error %d copying the message type\n", error));
1121a9643ea8Slogwang 		return (error);
1122a9643ea8Slogwang 	}
1123a9643ea8Slogwang 	return (kern_msgsnd(td, uap->msqid,
1124a9643ea8Slogwang 	    (const char *)uap->msgp + sizeof(mtype),
1125a9643ea8Slogwang 	    uap->msgsz, uap->msgflg, mtype));
1126a9643ea8Slogwang }
1127a9643ea8Slogwang 
#ifndef _SYS_SYSPROTO_H_
/*
 * Argument block handed to sys_msgrcv().  Only declared here when
 * <sys/sysproto.h> has not already provided it.
 */
struct msgrcv_args {
	int	msqid;		/* queue identifier */
	void	*msgp;		/* user buffer: a long mtype, then the text */
	size_t	msgsz;		/* room available for the text */
	long	msgtyp;		/* type selector (0, positive or negative) */
	int	msgflg;		/* flags, e.g. IPC_NOWAIT, MSG_NOERROR */
};
#endif
1137*22ce4affSfengbojiang /* XXX msgp is actually mtext. */
1138a9643ea8Slogwang int
kern_msgrcv(struct thread * td,int msqid,void * msgp,size_t msgsz,long msgtyp,int msgflg,long * mtype)1139*22ce4affSfengbojiang kern_msgrcv(struct thread *td, int msqid, void *msgp, size_t msgsz, long msgtyp,
1140*22ce4affSfengbojiang     int msgflg, long *mtype)
1141a9643ea8Slogwang {
1142a9643ea8Slogwang 	size_t len;
1143*22ce4affSfengbojiang 	struct msqid_kernel *msqkptr;
1144*22ce4affSfengbojiang 	struct msg *msghdr;
1145a9643ea8Slogwang 	struct prison *rpr;
1146a9643ea8Slogwang 	int msqix, error = 0;
1147a9643ea8Slogwang 	short next;
1148a9643ea8Slogwang 
1149a9643ea8Slogwang 	rpr = msg_find_prison(td->td_ucred);
1150a9643ea8Slogwang 	if (rpr == NULL)
1151a9643ea8Slogwang 		return (ENOSYS);
1152a9643ea8Slogwang 
1153*22ce4affSfengbojiang 	AUDIT_ARG_SVIPC_ID(msqid);
1154a9643ea8Slogwang 	msqix = IPCID_TO_IX(msqid);
1155a9643ea8Slogwang 
1156a9643ea8Slogwang 	if (msqix < 0 || msqix >= msginfo.msgmni) {
1157a9643ea8Slogwang 		DPRINTF(("msqid (%d) out of range (0<=msqid<%d)\n", msqix,
1158a9643ea8Slogwang 		    msginfo.msgmni));
1159a9643ea8Slogwang 		return (EINVAL);
1160a9643ea8Slogwang 	}
1161a9643ea8Slogwang 
1162a9643ea8Slogwang 	msqkptr = &msqids[msqix];
1163a9643ea8Slogwang 	mtx_lock(&msq_mtx);
1164*22ce4affSfengbojiang 	AUDIT_ARG_SVIPC_PERM(&msqkptr->u.msg_perm);
1165a9643ea8Slogwang 	if (msqkptr->u.msg_qbytes == 0) {
1166a9643ea8Slogwang 		DPRINTF(("no such message queue id\n"));
1167a9643ea8Slogwang 		error = EINVAL;
1168a9643ea8Slogwang 		goto done2;
1169a9643ea8Slogwang 	}
1170a9643ea8Slogwang 	if (msqkptr->u.msg_perm.seq != IPCID_TO_SEQ(msqid)) {
1171a9643ea8Slogwang 		DPRINTF(("wrong sequence number\n"));
1172a9643ea8Slogwang 		error = EINVAL;
1173a9643ea8Slogwang 		goto done2;
1174a9643ea8Slogwang 	}
1175a9643ea8Slogwang 
1176a9643ea8Slogwang 	if ((error = msq_prison_cansee(rpr, msqkptr))) {
1177a9643ea8Slogwang 		DPRINTF(("requester can't see prison\n"));
1178a9643ea8Slogwang 		goto done2;
1179a9643ea8Slogwang 	}
1180a9643ea8Slogwang 
1181a9643ea8Slogwang 	if ((error = ipcperm(td, &msqkptr->u.msg_perm, IPC_R))) {
1182a9643ea8Slogwang 		DPRINTF(("requester doesn't have read access\n"));
1183a9643ea8Slogwang 		goto done2;
1184a9643ea8Slogwang 	}
1185a9643ea8Slogwang 
1186a9643ea8Slogwang #ifdef MAC
1187a9643ea8Slogwang 	error = mac_sysvmsq_check_msqrcv(td->td_ucred, msqkptr);
1188a9643ea8Slogwang 	if (error != 0)
1189a9643ea8Slogwang 		goto done2;
1190a9643ea8Slogwang #endif
1191a9643ea8Slogwang 
1192a9643ea8Slogwang 	msghdr = NULL;
1193a9643ea8Slogwang 	while (msghdr == NULL) {
1194a9643ea8Slogwang 		if (msgtyp == 0) {
1195*22ce4affSfengbojiang 			msghdr = msqkptr->u.__msg_first;
1196a9643ea8Slogwang 			if (msghdr != NULL) {
1197a9643ea8Slogwang 				if (msgsz < msghdr->msg_ts &&
1198a9643ea8Slogwang 				    (msgflg & MSG_NOERROR) == 0) {
1199a9643ea8Slogwang 					DPRINTF(("first message on the queue "
1200a9643ea8Slogwang 					    "is too big (want %zu, got %d)\n",
1201a9643ea8Slogwang 					    msgsz, msghdr->msg_ts));
1202a9643ea8Slogwang 					error = E2BIG;
1203a9643ea8Slogwang 					goto done2;
1204a9643ea8Slogwang 				}
1205a9643ea8Slogwang #ifdef MAC
1206a9643ea8Slogwang 				error = mac_sysvmsq_check_msgrcv(td->td_ucred,
1207a9643ea8Slogwang 				    msghdr);
1208a9643ea8Slogwang 				if (error != 0)
1209a9643ea8Slogwang 					goto done2;
1210a9643ea8Slogwang #endif
1211*22ce4affSfengbojiang 				if (msqkptr->u.__msg_first ==
1212*22ce4affSfengbojiang 				    msqkptr->u.__msg_last) {
1213*22ce4affSfengbojiang 					msqkptr->u.__msg_first = NULL;
1214*22ce4affSfengbojiang 					msqkptr->u.__msg_last = NULL;
1215a9643ea8Slogwang 				} else {
1216*22ce4affSfengbojiang 					msqkptr->u.__msg_first = msghdr->msg_next;
1217*22ce4affSfengbojiang 					if (msqkptr->u.__msg_first == NULL)
1218a9643ea8Slogwang 						panic("msg_first/last screwed up #1");
1219a9643ea8Slogwang 				}
1220a9643ea8Slogwang 			}
1221a9643ea8Slogwang 		} else {
1222a9643ea8Slogwang 			struct msg *previous;
1223a9643ea8Slogwang 			struct msg **prev;
1224a9643ea8Slogwang 
1225a9643ea8Slogwang 			previous = NULL;
1226*22ce4affSfengbojiang 			prev = &(msqkptr->u.__msg_first);
1227a9643ea8Slogwang 			while ((msghdr = *prev) != NULL) {
1228a9643ea8Slogwang 				/*
1229a9643ea8Slogwang 				 * Is this message's type an exact match or is
1230a9643ea8Slogwang 				 * this message's type less than or equal to
1231a9643ea8Slogwang 				 * the absolute value of a negative msgtyp?
1232a9643ea8Slogwang 				 * Note that the second half of this test can
1233a9643ea8Slogwang 				 * NEVER be true if msgtyp is positive since
1234a9643ea8Slogwang 				 * msg_type is always positive!
1235a9643ea8Slogwang 				 */
1236a9643ea8Slogwang 
1237a9643ea8Slogwang 				if (msgtyp == msghdr->msg_type ||
1238a9643ea8Slogwang 				    msghdr->msg_type <= -msgtyp) {
1239a9643ea8Slogwang 					DPRINTF(("found message type %ld, "
1240a9643ea8Slogwang 					    "requested %ld\n",
1241a9643ea8Slogwang 					    msghdr->msg_type, msgtyp));
1242a9643ea8Slogwang 					if (msgsz < msghdr->msg_ts &&
1243a9643ea8Slogwang 					    (msgflg & MSG_NOERROR) == 0) {
1244a9643ea8Slogwang 						DPRINTF(("requested message "
1245a9643ea8Slogwang 						    "on the queue is too big "
1246a9643ea8Slogwang 						    "(want %zu, got %hu)\n",
1247a9643ea8Slogwang 						    msgsz, msghdr->msg_ts));
1248a9643ea8Slogwang 						error = E2BIG;
1249a9643ea8Slogwang 						goto done2;
1250a9643ea8Slogwang 					}
1251a9643ea8Slogwang #ifdef MAC
1252a9643ea8Slogwang 					error = mac_sysvmsq_check_msgrcv(
1253a9643ea8Slogwang 					    td->td_ucred, msghdr);
1254a9643ea8Slogwang 					if (error != 0)
1255a9643ea8Slogwang 						goto done2;
1256a9643ea8Slogwang #endif
1257a9643ea8Slogwang 					*prev = msghdr->msg_next;
1258*22ce4affSfengbojiang 					if (msghdr == msqkptr->u.__msg_last) {
1259a9643ea8Slogwang 						if (previous == NULL) {
1260a9643ea8Slogwang 							if (prev !=
1261*22ce4affSfengbojiang 							    &msqkptr->u.__msg_first)
1262*22ce4affSfengbojiang 								panic("__msg_first/last screwed up #2");
1263*22ce4affSfengbojiang 							msqkptr->u.__msg_first =
1264a9643ea8Slogwang 							    NULL;
1265*22ce4affSfengbojiang 							msqkptr->u.__msg_last =
1266a9643ea8Slogwang 							    NULL;
1267a9643ea8Slogwang 						} else {
1268a9643ea8Slogwang 							if (prev ==
1269*22ce4affSfengbojiang 							    &msqkptr->u.__msg_first)
1270*22ce4affSfengbojiang 								panic("__msg_first/last screwed up #3");
1271*22ce4affSfengbojiang 							msqkptr->u.__msg_last =
1272a9643ea8Slogwang 							    previous;
1273a9643ea8Slogwang 						}
1274a9643ea8Slogwang 					}
1275a9643ea8Slogwang 					break;
1276a9643ea8Slogwang 				}
1277a9643ea8Slogwang 				previous = msghdr;
1278a9643ea8Slogwang 				prev = &(msghdr->msg_next);
1279a9643ea8Slogwang 			}
1280a9643ea8Slogwang 		}
1281a9643ea8Slogwang 
1282a9643ea8Slogwang 		/*
1283a9643ea8Slogwang 		 * We've either extracted the msghdr for the appropriate
1284a9643ea8Slogwang 		 * message or there isn't one.
1285a9643ea8Slogwang 		 * If there is one then bail out of this loop.
1286a9643ea8Slogwang 		 */
1287a9643ea8Slogwang 
1288a9643ea8Slogwang 		if (msghdr != NULL)
1289a9643ea8Slogwang 			break;
1290a9643ea8Slogwang 
1291a9643ea8Slogwang 		/*
1292a9643ea8Slogwang 		 * Hmph!  No message found.  Does the user want to wait?
1293a9643ea8Slogwang 		 */
1294a9643ea8Slogwang 
1295a9643ea8Slogwang 		if ((msgflg & IPC_NOWAIT) != 0) {
1296a9643ea8Slogwang 			DPRINTF(("no appropriate message found (msgtyp=%ld)\n",
1297a9643ea8Slogwang 			    msgtyp));
1298a9643ea8Slogwang 			/* The SVID says to return ENOMSG. */
1299a9643ea8Slogwang 			error = ENOMSG;
1300a9643ea8Slogwang 			goto done2;
1301a9643ea8Slogwang 		}
1302a9643ea8Slogwang 
1303a9643ea8Slogwang 		/*
1304a9643ea8Slogwang 		 * Wait for something to happen
1305a9643ea8Slogwang 		 */
1306a9643ea8Slogwang 
1307a9643ea8Slogwang 		DPRINTF(("msgrcv:  goodnight\n"));
1308a9643ea8Slogwang 		error = msleep(msqkptr, &msq_mtx, (PZERO - 4) | PCATCH,
1309a9643ea8Slogwang 		    "msgrcv", 0);
1310a9643ea8Slogwang 		DPRINTF(("msgrcv:  good morning (error=%d)\n", error));
1311a9643ea8Slogwang 
1312a9643ea8Slogwang 		if (error != 0) {
1313a9643ea8Slogwang 			DPRINTF(("msgrcv:  interrupted system call\n"));
1314a9643ea8Slogwang 			error = EINTR;
1315a9643ea8Slogwang 			goto done2;
1316a9643ea8Slogwang 		}
1317a9643ea8Slogwang 
1318a9643ea8Slogwang 		/*
1319a9643ea8Slogwang 		 * Make sure that the msq queue still exists
1320a9643ea8Slogwang 		 */
1321a9643ea8Slogwang 
1322a9643ea8Slogwang 		if (msqkptr->u.msg_qbytes == 0 ||
1323a9643ea8Slogwang 		    msqkptr->u.msg_perm.seq != IPCID_TO_SEQ(msqid)) {
1324a9643ea8Slogwang 			DPRINTF(("msqid deleted\n"));
1325a9643ea8Slogwang 			error = EIDRM;
1326a9643ea8Slogwang 			goto done2;
1327a9643ea8Slogwang 		}
1328a9643ea8Slogwang 	}
1329a9643ea8Slogwang 
1330a9643ea8Slogwang 	/*
1331a9643ea8Slogwang 	 * Return the message to the user.
1332a9643ea8Slogwang 	 *
1333a9643ea8Slogwang 	 * First, do the bookkeeping (before we risk being interrupted).
1334a9643ea8Slogwang 	 */
1335a9643ea8Slogwang 
1336a9643ea8Slogwang 	msqkptr->u.msg_cbytes -= msghdr->msg_ts;
1337a9643ea8Slogwang 	msqkptr->u.msg_qnum--;
1338a9643ea8Slogwang 	msqkptr->u.msg_lrpid = td->td_proc->p_pid;
1339a9643ea8Slogwang 	msqkptr->u.msg_rtime = time_second;
1340a9643ea8Slogwang 
1341a9643ea8Slogwang 	racct_sub_cred(msqkptr->cred, RACCT_MSGQQUEUED, 1);
1342a9643ea8Slogwang 	racct_sub_cred(msqkptr->cred, RACCT_MSGQSIZE, msghdr->msg_ts);
1343a9643ea8Slogwang 
1344a9643ea8Slogwang 	/*
1345a9643ea8Slogwang 	 * Make msgsz the actual amount that we'll be returning.
1346a9643ea8Slogwang 	 * Note that this effectively truncates the message if it is too long
1347a9643ea8Slogwang 	 * (since msgsz is never increased).
1348a9643ea8Slogwang 	 */
1349a9643ea8Slogwang 
1350a9643ea8Slogwang 	DPRINTF(("found a message, msgsz=%zu, msg_ts=%hu\n", msgsz,
1351a9643ea8Slogwang 	    msghdr->msg_ts));
1352a9643ea8Slogwang 	if (msgsz > msghdr->msg_ts)
1353a9643ea8Slogwang 		msgsz = msghdr->msg_ts;
1354a9643ea8Slogwang 	*mtype = msghdr->msg_type;
1355a9643ea8Slogwang 
1356a9643ea8Slogwang 	/*
1357a9643ea8Slogwang 	 * Return the segments to the user
1358a9643ea8Slogwang 	 */
1359a9643ea8Slogwang 
1360a9643ea8Slogwang 	next = msghdr->msg_spot;
1361a9643ea8Slogwang 	for (len = 0; len < msgsz; len += msginfo.msgssz) {
1362a9643ea8Slogwang 		size_t tlen;
1363a9643ea8Slogwang 
1364a9643ea8Slogwang 		if (msgsz - len > msginfo.msgssz)
1365a9643ea8Slogwang 			tlen = msginfo.msgssz;
1366a9643ea8Slogwang 		else
1367a9643ea8Slogwang 			tlen = msgsz - len;
1368a9643ea8Slogwang 		if (next <= -1)
1369a9643ea8Slogwang 			panic("next too low #3");
1370a9643ea8Slogwang 		if (next >= msginfo.msgseg)
1371a9643ea8Slogwang 			panic("next out of range #3");
1372a9643ea8Slogwang 		mtx_unlock(&msq_mtx);
1373a9643ea8Slogwang 		error = copyout(&msgpool[next * msginfo.msgssz], msgp, tlen);
1374a9643ea8Slogwang 		mtx_lock(&msq_mtx);
1375a9643ea8Slogwang 		if (error != 0) {
1376a9643ea8Slogwang 			DPRINTF(("error (%d) copying out message segment\n",
1377a9643ea8Slogwang 			    error));
1378a9643ea8Slogwang 			msg_freehdr(msghdr);
1379a9643ea8Slogwang 			wakeup(msqkptr);
1380a9643ea8Slogwang 			goto done2;
1381a9643ea8Slogwang 		}
1382a9643ea8Slogwang 		msgp = (char *)msgp + tlen;
1383a9643ea8Slogwang 		next = msgmaps[next].next;
1384a9643ea8Slogwang 	}
1385a9643ea8Slogwang 
1386a9643ea8Slogwang 	/*
1387a9643ea8Slogwang 	 * Done, return the actual number of bytes copied out.
1388a9643ea8Slogwang 	 */
1389a9643ea8Slogwang 
1390a9643ea8Slogwang 	msg_freehdr(msghdr);
1391a9643ea8Slogwang 	wakeup(msqkptr);
1392a9643ea8Slogwang 	td->td_retval[0] = msgsz;
1393a9643ea8Slogwang done2:
1394a9643ea8Slogwang 	mtx_unlock(&msq_mtx);
1395a9643ea8Slogwang 	return (error);
1396a9643ea8Slogwang }
1397a9643ea8Slogwang 
1398a9643ea8Slogwang int
sys_msgrcv(struct thread * td,struct msgrcv_args * uap)1399*22ce4affSfengbojiang sys_msgrcv(struct thread *td, struct msgrcv_args *uap)
1400a9643ea8Slogwang {
1401a9643ea8Slogwang 	int error;
1402a9643ea8Slogwang 	long mtype;
1403a9643ea8Slogwang 
1404a9643ea8Slogwang 	DPRINTF(("call to msgrcv(%d, %p, %zu, %ld, %d)\n", uap->msqid,
1405a9643ea8Slogwang 	    uap->msgp, uap->msgsz, uap->msgtyp, uap->msgflg));
1406a9643ea8Slogwang 
1407a9643ea8Slogwang 	if ((error = kern_msgrcv(td, uap->msqid,
1408a9643ea8Slogwang 	    (char *)uap->msgp + sizeof(mtype), uap->msgsz,
1409a9643ea8Slogwang 	    uap->msgtyp, uap->msgflg, &mtype)) != 0)
1410a9643ea8Slogwang 		return (error);
1411a9643ea8Slogwang 	if ((error = copyout(&mtype, uap->msgp, sizeof(mtype))) != 0)
1412a9643ea8Slogwang 		DPRINTF(("error %d copying the message type\n", error));
1413a9643ea8Slogwang 	return (error);
1414a9643ea8Slogwang }
1415a9643ea8Slogwang 
1416a9643ea8Slogwang static int
sysctl_msqids(SYSCTL_HANDLER_ARGS)1417a9643ea8Slogwang sysctl_msqids(SYSCTL_HANDLER_ARGS)
1418a9643ea8Slogwang {
1419a9643ea8Slogwang 	struct msqid_kernel tmsqk;
1420*22ce4affSfengbojiang #ifdef COMPAT_FREEBSD32
1421*22ce4affSfengbojiang 	struct msqid_kernel32 tmsqk32;
1422*22ce4affSfengbojiang #endif
1423a9643ea8Slogwang 	struct prison *pr, *rpr;
1424*22ce4affSfengbojiang 	void *outaddr;
1425*22ce4affSfengbojiang 	size_t outsize;
1426a9643ea8Slogwang 	int error, i;
1427a9643ea8Slogwang 
1428a9643ea8Slogwang 	pr = req->td->td_ucred->cr_prison;
1429a9643ea8Slogwang 	rpr = msg_find_prison(req->td->td_ucred);
1430a9643ea8Slogwang 	error = 0;
1431a9643ea8Slogwang 	for (i = 0; i < msginfo.msgmni; i++) {
1432a9643ea8Slogwang 		mtx_lock(&msq_mtx);
1433a9643ea8Slogwang 		if (msqids[i].u.msg_qbytes == 0 || rpr == NULL ||
1434a9643ea8Slogwang 		    msq_prison_cansee(rpr, &msqids[i]) != 0)
1435a9643ea8Slogwang 			bzero(&tmsqk, sizeof(tmsqk));
1436a9643ea8Slogwang 		else {
1437a9643ea8Slogwang 			tmsqk = msqids[i];
1438a9643ea8Slogwang 			if (tmsqk.cred->cr_prison != pr)
1439a9643ea8Slogwang 				tmsqk.u.msg_perm.key = IPC_PRIVATE;
1440a9643ea8Slogwang 		}
1441a9643ea8Slogwang 		mtx_unlock(&msq_mtx);
1442*22ce4affSfengbojiang #ifdef COMPAT_FREEBSD32
1443*22ce4affSfengbojiang 		if (SV_CURPROC_FLAG(SV_ILP32)) {
1444*22ce4affSfengbojiang 			bzero(&tmsqk32, sizeof(tmsqk32));
1445*22ce4affSfengbojiang 			freebsd32_ipcperm_out(&tmsqk.u.msg_perm,
1446*22ce4affSfengbojiang 			    &tmsqk32.u.msg_perm);
1447*22ce4affSfengbojiang 			/* Don't copy u.msg_first or u.msg_last */
1448*22ce4affSfengbojiang 			CP(tmsqk, tmsqk32, u.msg_cbytes);
1449*22ce4affSfengbojiang 			CP(tmsqk, tmsqk32, u.msg_qnum);
1450*22ce4affSfengbojiang 			CP(tmsqk, tmsqk32, u.msg_qbytes);
1451*22ce4affSfengbojiang 			CP(tmsqk, tmsqk32, u.msg_lspid);
1452*22ce4affSfengbojiang 			CP(tmsqk, tmsqk32, u.msg_lrpid);
1453*22ce4affSfengbojiang 			CP(tmsqk, tmsqk32, u.msg_stime);
1454*22ce4affSfengbojiang 			CP(tmsqk, tmsqk32, u.msg_rtime);
1455*22ce4affSfengbojiang 			CP(tmsqk, tmsqk32, u.msg_ctime);
1456*22ce4affSfengbojiang 			/* Don't copy label or cred */
1457*22ce4affSfengbojiang 			outaddr = &tmsqk32;
1458*22ce4affSfengbojiang 			outsize = sizeof(tmsqk32);
1459*22ce4affSfengbojiang 		} else
1460*22ce4affSfengbojiang #endif
1461*22ce4affSfengbojiang 		{
1462*22ce4affSfengbojiang 			/* Don't leak kernel pointers */
1463*22ce4affSfengbojiang 			tmsqk.u.__msg_first = NULL;
1464*22ce4affSfengbojiang 			tmsqk.u.__msg_last = NULL;
1465*22ce4affSfengbojiang 			tmsqk.label = NULL;
1466*22ce4affSfengbojiang 			tmsqk.cred = NULL;
1467*22ce4affSfengbojiang 			/*
1468*22ce4affSfengbojiang 			 * XXX: some padding also exists, but we take care to
1469*22ce4affSfengbojiang 			 * allocate our pool of msqid_kernel structs with
1470*22ce4affSfengbojiang 			 * zeroed memory so this should be OK.
1471*22ce4affSfengbojiang 			 */
1472*22ce4affSfengbojiang 			outaddr = &tmsqk;
1473*22ce4affSfengbojiang 			outsize = sizeof(tmsqk);
1474*22ce4affSfengbojiang 		}
1475*22ce4affSfengbojiang 		error = SYSCTL_OUT(req, outaddr, outsize);
1476a9643ea8Slogwang 		if (error != 0)
1477a9643ea8Slogwang 			break;
1478a9643ea8Slogwang 	}
1479a9643ea8Slogwang 	return (error);
1480a9643ea8Slogwang }
1481a9643ea8Slogwang 
1482a9643ea8Slogwang SYSCTL_INT(_kern_ipc, OID_AUTO, msgmax, CTLFLAG_RD, &msginfo.msgmax, 0,
1483a9643ea8Slogwang     "Maximum message size");
1484a9643ea8Slogwang SYSCTL_INT(_kern_ipc, OID_AUTO, msgmni, CTLFLAG_RDTUN, &msginfo.msgmni, 0,
1485a9643ea8Slogwang     "Number of message queue identifiers");
1486a9643ea8Slogwang SYSCTL_INT(_kern_ipc, OID_AUTO, msgmnb, CTLFLAG_RDTUN, &msginfo.msgmnb, 0,
1487a9643ea8Slogwang     "Maximum number of bytes in a queue");
1488a9643ea8Slogwang SYSCTL_INT(_kern_ipc, OID_AUTO, msgtql, CTLFLAG_RDTUN, &msginfo.msgtql, 0,
1489a9643ea8Slogwang     "Maximum number of messages in the system");
1490a9643ea8Slogwang SYSCTL_INT(_kern_ipc, OID_AUTO, msgssz, CTLFLAG_RDTUN, &msginfo.msgssz, 0,
1491a9643ea8Slogwang     "Size of a message segment");
1492a9643ea8Slogwang SYSCTL_INT(_kern_ipc, OID_AUTO, msgseg, CTLFLAG_RDTUN, &msginfo.msgseg, 0,
1493a9643ea8Slogwang     "Number of message segments");
1494a9643ea8Slogwang SYSCTL_PROC(_kern_ipc, OID_AUTO, msqids,
1495a9643ea8Slogwang     CTLTYPE_OPAQUE | CTLFLAG_RD | CTLFLAG_MPSAFE,
1496*22ce4affSfengbojiang     NULL, 0, sysctl_msqids, "",
1497*22ce4affSfengbojiang     "Array of struct msqid_kernel for each potential message queue");
1498a9643ea8Slogwang 
1499a9643ea8Slogwang static int
msg_prison_check(void * obj,void * data)1500a9643ea8Slogwang msg_prison_check(void *obj, void *data)
1501a9643ea8Slogwang {
1502a9643ea8Slogwang 	struct prison *pr = obj;
1503a9643ea8Slogwang 	struct prison *prpr;
1504a9643ea8Slogwang 	struct vfsoptlist *opts = data;
1505a9643ea8Slogwang 	int error, jsys;
1506a9643ea8Slogwang 
1507a9643ea8Slogwang 	/*
1508a9643ea8Slogwang 	 * sysvmsg is a jailsys integer.
1509a9643ea8Slogwang 	 * It must be "disable" if the parent jail is disabled.
1510a9643ea8Slogwang 	 */
1511a9643ea8Slogwang 	error = vfs_copyopt(opts, "sysvmsg", &jsys, sizeof(jsys));
1512a9643ea8Slogwang 	if (error != ENOENT) {
1513a9643ea8Slogwang 		if (error != 0)
1514a9643ea8Slogwang 			return (error);
1515a9643ea8Slogwang 		switch (jsys) {
1516a9643ea8Slogwang 		case JAIL_SYS_DISABLE:
1517a9643ea8Slogwang 			break;
1518a9643ea8Slogwang 		case JAIL_SYS_NEW:
1519a9643ea8Slogwang 		case JAIL_SYS_INHERIT:
1520a9643ea8Slogwang 			prison_lock(pr->pr_parent);
1521a9643ea8Slogwang 			prpr = osd_jail_get(pr->pr_parent, msg_prison_slot);
1522a9643ea8Slogwang 			prison_unlock(pr->pr_parent);
1523a9643ea8Slogwang 			if (prpr == NULL)
1524a9643ea8Slogwang 				return (EPERM);
1525a9643ea8Slogwang 			break;
1526a9643ea8Slogwang 		default:
1527a9643ea8Slogwang 			return (EINVAL);
1528a9643ea8Slogwang 		}
1529a9643ea8Slogwang 	}
1530a9643ea8Slogwang 
1531a9643ea8Slogwang 	return (0);
1532a9643ea8Slogwang }
1533a9643ea8Slogwang 
1534a9643ea8Slogwang static int
msg_prison_set(void * obj,void * data)1535a9643ea8Slogwang msg_prison_set(void *obj, void *data)
1536a9643ea8Slogwang {
1537a9643ea8Slogwang 	struct prison *pr = obj;
1538a9643ea8Slogwang 	struct prison *tpr, *orpr, *nrpr, *trpr;
1539a9643ea8Slogwang 	struct vfsoptlist *opts = data;
1540a9643ea8Slogwang 	void *rsv;
1541a9643ea8Slogwang 	int jsys, descend;
1542a9643ea8Slogwang 
1543a9643ea8Slogwang 	/*
1544a9643ea8Slogwang 	 * sysvmsg controls which jail is the root of the associated msgs (this
1545a9643ea8Slogwang 	 * jail or same as the parent), or if the feature is available at all.
1546a9643ea8Slogwang 	 */
1547a9643ea8Slogwang 	if (vfs_copyopt(opts, "sysvmsg", &jsys, sizeof(jsys)) == ENOENT)
1548a9643ea8Slogwang 		jsys = vfs_flagopt(opts, "allow.sysvipc", NULL, 0)
1549a9643ea8Slogwang 		    ? JAIL_SYS_INHERIT
1550a9643ea8Slogwang 		    : vfs_flagopt(opts, "allow.nosysvipc", NULL, 0)
1551a9643ea8Slogwang 		    ? JAIL_SYS_DISABLE
1552a9643ea8Slogwang 		    : -1;
1553a9643ea8Slogwang 	if (jsys == JAIL_SYS_DISABLE) {
1554a9643ea8Slogwang 		prison_lock(pr);
1555a9643ea8Slogwang 		orpr = osd_jail_get(pr, msg_prison_slot);
1556a9643ea8Slogwang 		if (orpr != NULL)
1557a9643ea8Slogwang 			osd_jail_del(pr, msg_prison_slot);
1558a9643ea8Slogwang 		prison_unlock(pr);
1559a9643ea8Slogwang 		if (orpr != NULL) {
1560a9643ea8Slogwang 			if (orpr == pr)
1561a9643ea8Slogwang 				msg_prison_cleanup(pr);
1562a9643ea8Slogwang 			/* Disable all child jails as well. */
1563a9643ea8Slogwang 			FOREACH_PRISON_DESCENDANT(pr, tpr, descend) {
1564a9643ea8Slogwang 				prison_lock(tpr);
1565a9643ea8Slogwang 				trpr = osd_jail_get(tpr, msg_prison_slot);
1566a9643ea8Slogwang 				if (trpr != NULL) {
1567a9643ea8Slogwang 					osd_jail_del(tpr, msg_prison_slot);
1568a9643ea8Slogwang 					prison_unlock(tpr);
1569a9643ea8Slogwang 					if (trpr == tpr)
1570a9643ea8Slogwang 						msg_prison_cleanup(tpr);
1571a9643ea8Slogwang 				} else {
1572a9643ea8Slogwang 					prison_unlock(tpr);
1573a9643ea8Slogwang 					descend = 0;
1574a9643ea8Slogwang 				}
1575a9643ea8Slogwang 			}
1576a9643ea8Slogwang 		}
1577a9643ea8Slogwang 	} else if (jsys != -1) {
1578a9643ea8Slogwang 		if (jsys == JAIL_SYS_NEW)
1579a9643ea8Slogwang 			nrpr = pr;
1580a9643ea8Slogwang 		else {
1581a9643ea8Slogwang 			prison_lock(pr->pr_parent);
1582a9643ea8Slogwang 			nrpr = osd_jail_get(pr->pr_parent, msg_prison_slot);
1583a9643ea8Slogwang 			prison_unlock(pr->pr_parent);
1584a9643ea8Slogwang 		}
1585a9643ea8Slogwang 		rsv = osd_reserve(msg_prison_slot);
1586a9643ea8Slogwang 		prison_lock(pr);
1587a9643ea8Slogwang 		orpr = osd_jail_get(pr, msg_prison_slot);
1588a9643ea8Slogwang 		if (orpr != nrpr)
1589a9643ea8Slogwang 			(void)osd_jail_set_reserved(pr, msg_prison_slot, rsv,
1590a9643ea8Slogwang 			    nrpr);
1591a9643ea8Slogwang 		else
1592a9643ea8Slogwang 			osd_free_reserved(rsv);
1593a9643ea8Slogwang 		prison_unlock(pr);
1594a9643ea8Slogwang 		if (orpr != nrpr) {
1595a9643ea8Slogwang 			if (orpr == pr)
1596a9643ea8Slogwang 				msg_prison_cleanup(pr);
1597a9643ea8Slogwang 			if (orpr != NULL) {
1598a9643ea8Slogwang 				/* Change child jails matching the old root, */
1599a9643ea8Slogwang 				FOREACH_PRISON_DESCENDANT(pr, tpr, descend) {
1600a9643ea8Slogwang 					prison_lock(tpr);
1601a9643ea8Slogwang 					trpr = osd_jail_get(tpr,
1602a9643ea8Slogwang 					    msg_prison_slot);
1603a9643ea8Slogwang 					if (trpr == orpr) {
1604a9643ea8Slogwang 						(void)osd_jail_set(tpr,
1605a9643ea8Slogwang 						    msg_prison_slot, nrpr);
1606a9643ea8Slogwang 						prison_unlock(tpr);
1607a9643ea8Slogwang 						if (trpr == tpr)
1608a9643ea8Slogwang 							msg_prison_cleanup(tpr);
1609a9643ea8Slogwang 					} else {
1610a9643ea8Slogwang 						prison_unlock(tpr);
1611a9643ea8Slogwang 						descend = 0;
1612a9643ea8Slogwang 					}
1613a9643ea8Slogwang 				}
1614a9643ea8Slogwang 			}
1615a9643ea8Slogwang 		}
1616a9643ea8Slogwang 	}
1617a9643ea8Slogwang 
1618a9643ea8Slogwang 	return (0);
1619a9643ea8Slogwang }
1620a9643ea8Slogwang 
1621a9643ea8Slogwang static int
msg_prison_get(void * obj,void * data)1622a9643ea8Slogwang msg_prison_get(void *obj, void *data)
1623a9643ea8Slogwang {
1624a9643ea8Slogwang 	struct prison *pr = obj;
1625a9643ea8Slogwang 	struct prison *rpr;
1626a9643ea8Slogwang 	struct vfsoptlist *opts = data;
1627a9643ea8Slogwang 	int error, jsys;
1628a9643ea8Slogwang 
1629a9643ea8Slogwang 	/* Set sysvmsg based on the jail's root prison. */
1630a9643ea8Slogwang 	prison_lock(pr);
1631a9643ea8Slogwang 	rpr = osd_jail_get(pr, msg_prison_slot);
1632a9643ea8Slogwang 	prison_unlock(pr);
1633a9643ea8Slogwang 	jsys = rpr == NULL ? JAIL_SYS_DISABLE
1634a9643ea8Slogwang 	    : rpr == pr ? JAIL_SYS_NEW : JAIL_SYS_INHERIT;
1635a9643ea8Slogwang 	error = vfs_setopt(opts, "sysvmsg", &jsys, sizeof(jsys));
1636a9643ea8Slogwang 	if (error == ENOENT)
1637a9643ea8Slogwang 		error = 0;
1638a9643ea8Slogwang 	return (error);
1639a9643ea8Slogwang }
1640a9643ea8Slogwang 
1641a9643ea8Slogwang static int
msg_prison_remove(void * obj,void * data __unused)1642a9643ea8Slogwang msg_prison_remove(void *obj, void *data __unused)
1643a9643ea8Slogwang {
1644a9643ea8Slogwang 	struct prison *pr = obj;
1645a9643ea8Slogwang 	struct prison *rpr;
1646a9643ea8Slogwang 
1647a9643ea8Slogwang 	prison_lock(pr);
1648a9643ea8Slogwang 	rpr = osd_jail_get(pr, msg_prison_slot);
1649a9643ea8Slogwang 	prison_unlock(pr);
1650a9643ea8Slogwang 	if (rpr == pr)
1651a9643ea8Slogwang 		msg_prison_cleanup(pr);
1652a9643ea8Slogwang 	return (0);
1653a9643ea8Slogwang }
1654a9643ea8Slogwang 
1655a9643ea8Slogwang static void
msg_prison_cleanup(struct prison * pr)1656a9643ea8Slogwang msg_prison_cleanup(struct prison *pr)
1657a9643ea8Slogwang {
1658a9643ea8Slogwang 	struct msqid_kernel *msqkptr;
1659a9643ea8Slogwang 	int i;
1660a9643ea8Slogwang 
1661a9643ea8Slogwang 	/* Remove any msqs that belong to this jail. */
1662a9643ea8Slogwang 	mtx_lock(&msq_mtx);
1663a9643ea8Slogwang 	for (i = 0; i < msginfo.msgmni; i++) {
1664a9643ea8Slogwang 		msqkptr = &msqids[i];
1665a9643ea8Slogwang 		if (msqkptr->u.msg_qbytes != 0 &&
1666a9643ea8Slogwang 		    msqkptr->cred != NULL && msqkptr->cred->cr_prison == pr)
1667a9643ea8Slogwang 			msq_remove(msqkptr);
1668a9643ea8Slogwang 	}
1669a9643ea8Slogwang 	mtx_unlock(&msq_mtx);
1670a9643ea8Slogwang }
1671a9643ea8Slogwang 
1672a9643ea8Slogwang SYSCTL_JAIL_PARAM_SYS_NODE(sysvmsg, CTLFLAG_RW, "SYSV message queues");
1673a9643ea8Slogwang 
1674a9643ea8Slogwang #ifdef COMPAT_FREEBSD32
1675a9643ea8Slogwang int
freebsd32_msgsys(struct thread * td,struct freebsd32_msgsys_args * uap)1676a9643ea8Slogwang freebsd32_msgsys(struct thread *td, struct freebsd32_msgsys_args *uap)
1677a9643ea8Slogwang {
1678a9643ea8Slogwang 
1679a9643ea8Slogwang #if defined(COMPAT_FREEBSD4) || defined(COMPAT_FREEBSD5) || \
1680a9643ea8Slogwang     defined(COMPAT_FREEBSD6) || defined(COMPAT_FREEBSD7)
1681*22ce4affSfengbojiang 	AUDIT_ARG_SVIPC_WHICH(uap->which);
1682a9643ea8Slogwang 	switch (uap->which) {
1683a9643ea8Slogwang 	case 0:
1684a9643ea8Slogwang 		return (freebsd7_freebsd32_msgctl(td,
1685a9643ea8Slogwang 		    (struct freebsd7_freebsd32_msgctl_args *)&uap->a2));
1686a9643ea8Slogwang 	case 2:
1687a9643ea8Slogwang 		return (freebsd32_msgsnd(td,
1688a9643ea8Slogwang 		    (struct freebsd32_msgsnd_args *)&uap->a2));
1689a9643ea8Slogwang 	case 3:
1690a9643ea8Slogwang 		return (freebsd32_msgrcv(td,
1691a9643ea8Slogwang 		    (struct freebsd32_msgrcv_args *)&uap->a2));
1692a9643ea8Slogwang 	default:
1693a9643ea8Slogwang 		return (sys_msgsys(td, (struct msgsys_args *)uap));
1694a9643ea8Slogwang 	}
1695a9643ea8Slogwang #else
1696a9643ea8Slogwang 	return (nosys(td, NULL));
1697a9643ea8Slogwang #endif
1698a9643ea8Slogwang }
1699a9643ea8Slogwang 
#if defined(COMPAT_FREEBSD4) || defined(COMPAT_FREEBSD5) || \
    defined(COMPAT_FREEBSD6) || defined(COMPAT_FREEBSD7)
/*
 * msgctl() for 32-bit processes using the old (FreeBSD 7 and earlier)
 * struct msqid_ds32_old layout.
 *
 * For IPC_SET the user's structure is copied in and converted to the native
 * struct msqid_ds before kern_msgctl() is called.  For IPC_STAT the native
 * result is converted into a zeroed struct msqid_ds32_old and copied out.
 *
 * Returns 0 on success or the error from copyin(), kern_msgctl() or
 * copyout().
 */
int
freebsd7_freebsd32_msgctl(struct thread *td,
    struct freebsd7_freebsd32_msgctl_args *uap)
{
	struct msqid_ds msqbuf;
	struct msqid_ds32_old msqbuf32;
	int error;

	if (uap->cmd == IPC_SET) {
		error = copyin(uap->buf, &msqbuf32, sizeof(msqbuf32));
		if (error)
			return (error);
		freebsd32_ipcperm_old_in(&msqbuf32.msg_perm, &msqbuf.msg_perm);
		PTRIN_CP(msqbuf32, msqbuf, __msg_first);
		PTRIN_CP(msqbuf32, msqbuf, __msg_last);
		CP(msqbuf32, msqbuf, msg_cbytes);
		CP(msqbuf32, msqbuf, msg_qnum);
		CP(msqbuf32, msqbuf, msg_qbytes);
		CP(msqbuf32, msqbuf, msg_lspid);
		CP(msqbuf32, msqbuf, msg_lrpid);
		CP(msqbuf32, msqbuf, msg_stime);
		CP(msqbuf32, msqbuf, msg_rtime);
		CP(msqbuf32, msqbuf, msg_ctime);
	}
	error = kern_msgctl(td, uap->msqid, uap->cmd, &msqbuf);
	if (error)
		return (error);
	if (uap->cmd == IPC_STAT) {
		/* Zero first so unset members are not copied out as garbage. */
		bzero(&msqbuf32, sizeof(msqbuf32));
		freebsd32_ipcperm_old_out(&msqbuf.msg_perm, &msqbuf32.msg_perm);
		PTROUT_CP(msqbuf, msqbuf32, __msg_first);
		PTROUT_CP(msqbuf, msqbuf32, __msg_last);
		CP(msqbuf, msqbuf32, msg_cbytes);
		CP(msqbuf, msqbuf32, msg_qnum);
		CP(msqbuf, msqbuf32, msg_qbytes);
		CP(msqbuf, msqbuf32, msg_lspid);
		CP(msqbuf, msqbuf32, msg_lrpid);
		CP(msqbuf, msqbuf32, msg_stime);
		CP(msqbuf, msqbuf32, msg_rtime);
		CP(msqbuf, msqbuf32, msg_ctime);
		/*
		 * Size the copy by the buffer actually being copied (the old
		 * layout), matching the copyin() above, rather than by the
		 * unrelated current struct msqid_ds32.
		 */
		error = copyout(&msqbuf32, uap->buf, sizeof(msqbuf32));
	}
	return (error);
}
#endif
1747a9643ea8Slogwang 
1748a9643ea8Slogwang int
freebsd32_msgctl(struct thread * td,struct freebsd32_msgctl_args * uap)1749a9643ea8Slogwang freebsd32_msgctl(struct thread *td, struct freebsd32_msgctl_args *uap)
1750a9643ea8Slogwang {
1751a9643ea8Slogwang 	struct msqid_ds msqbuf;
1752a9643ea8Slogwang 	struct msqid_ds32 msqbuf32;
1753a9643ea8Slogwang 	int error;
1754a9643ea8Slogwang 
1755a9643ea8Slogwang 	if (uap->cmd == IPC_SET) {
1756a9643ea8Slogwang 		error = copyin(uap->buf, &msqbuf32, sizeof(msqbuf32));
1757a9643ea8Slogwang 		if (error)
1758a9643ea8Slogwang 			return (error);
1759a9643ea8Slogwang 		freebsd32_ipcperm_in(&msqbuf32.msg_perm, &msqbuf.msg_perm);
1760*22ce4affSfengbojiang 		PTRIN_CP(msqbuf32, msqbuf, __msg_first);
1761*22ce4affSfengbojiang 		PTRIN_CP(msqbuf32, msqbuf, __msg_last);
1762a9643ea8Slogwang 		CP(msqbuf32, msqbuf, msg_cbytes);
1763a9643ea8Slogwang 		CP(msqbuf32, msqbuf, msg_qnum);
1764a9643ea8Slogwang 		CP(msqbuf32, msqbuf, msg_qbytes);
1765a9643ea8Slogwang 		CP(msqbuf32, msqbuf, msg_lspid);
1766a9643ea8Slogwang 		CP(msqbuf32, msqbuf, msg_lrpid);
1767a9643ea8Slogwang 		CP(msqbuf32, msqbuf, msg_stime);
1768a9643ea8Slogwang 		CP(msqbuf32, msqbuf, msg_rtime);
1769a9643ea8Slogwang 		CP(msqbuf32, msqbuf, msg_ctime);
1770a9643ea8Slogwang 	}
1771a9643ea8Slogwang 	error = kern_msgctl(td, uap->msqid, uap->cmd, &msqbuf);
1772a9643ea8Slogwang 	if (error)
1773a9643ea8Slogwang 		return (error);
1774a9643ea8Slogwang 	if (uap->cmd == IPC_STAT) {
1775a9643ea8Slogwang 		freebsd32_ipcperm_out(&msqbuf.msg_perm, &msqbuf32.msg_perm);
1776*22ce4affSfengbojiang 		PTROUT_CP(msqbuf, msqbuf32, __msg_first);
1777*22ce4affSfengbojiang 		PTROUT_CP(msqbuf, msqbuf32, __msg_last);
1778a9643ea8Slogwang 		CP(msqbuf, msqbuf32, msg_cbytes);
1779a9643ea8Slogwang 		CP(msqbuf, msqbuf32, msg_qnum);
1780a9643ea8Slogwang 		CP(msqbuf, msqbuf32, msg_qbytes);
1781a9643ea8Slogwang 		CP(msqbuf, msqbuf32, msg_lspid);
1782a9643ea8Slogwang 		CP(msqbuf, msqbuf32, msg_lrpid);
1783a9643ea8Slogwang 		CP(msqbuf, msqbuf32, msg_stime);
1784a9643ea8Slogwang 		CP(msqbuf, msqbuf32, msg_rtime);
1785a9643ea8Slogwang 		CP(msqbuf, msqbuf32, msg_ctime);
1786a9643ea8Slogwang 		error = copyout(&msqbuf32, uap->buf, sizeof(struct msqid_ds32));
1787a9643ea8Slogwang 	}
1788a9643ea8Slogwang 	return (error);
1789a9643ea8Slogwang }
1790a9643ea8Slogwang 
1791a9643ea8Slogwang int
freebsd32_msgsnd(struct thread * td,struct freebsd32_msgsnd_args * uap)1792a9643ea8Slogwang freebsd32_msgsnd(struct thread *td, struct freebsd32_msgsnd_args *uap)
1793a9643ea8Slogwang {
1794a9643ea8Slogwang 	const void *msgp;
1795a9643ea8Slogwang 	long mtype;
1796a9643ea8Slogwang 	int32_t mtype32;
1797a9643ea8Slogwang 	int error;
1798a9643ea8Slogwang 
1799a9643ea8Slogwang 	msgp = PTRIN(uap->msgp);
1800a9643ea8Slogwang 	if ((error = copyin(msgp, &mtype32, sizeof(mtype32))) != 0)
1801a9643ea8Slogwang 		return (error);
1802a9643ea8Slogwang 	mtype = mtype32;
1803a9643ea8Slogwang 	return (kern_msgsnd(td, uap->msqid,
1804a9643ea8Slogwang 	    (const char *)msgp + sizeof(mtype32),
1805a9643ea8Slogwang 	    uap->msgsz, uap->msgflg, mtype));
1806a9643ea8Slogwang }
1807a9643ea8Slogwang 
1808a9643ea8Slogwang int
freebsd32_msgrcv(struct thread * td,struct freebsd32_msgrcv_args * uap)1809a9643ea8Slogwang freebsd32_msgrcv(struct thread *td, struct freebsd32_msgrcv_args *uap)
1810a9643ea8Slogwang {
1811a9643ea8Slogwang 	void *msgp;
1812a9643ea8Slogwang 	long mtype;
1813a9643ea8Slogwang 	int32_t mtype32;
1814a9643ea8Slogwang 	int error;
1815a9643ea8Slogwang 
1816a9643ea8Slogwang 	msgp = PTRIN(uap->msgp);
1817a9643ea8Slogwang 	if ((error = kern_msgrcv(td, uap->msqid,
1818a9643ea8Slogwang 	    (char *)msgp + sizeof(mtype32), uap->msgsz,
1819a9643ea8Slogwang 	    uap->msgtyp, uap->msgflg, &mtype)) != 0)
1820a9643ea8Slogwang 		return (error);
1821a9643ea8Slogwang 	mtype32 = (int32_t)mtype;
1822a9643ea8Slogwang 	return (copyout(&mtype32, msgp, sizeof(mtype32)));
1823a9643ea8Slogwang }
1824a9643ea8Slogwang #endif
1825a9643ea8Slogwang 
1826a9643ea8Slogwang #if defined(COMPAT_FREEBSD4) || defined(COMPAT_FREEBSD5) || \
1827a9643ea8Slogwang     defined(COMPAT_FREEBSD6) || defined(COMPAT_FREEBSD7)
1828a9643ea8Slogwang 
1829a9643ea8Slogwang /* XXX casting to (sy_call_t *) is bogus, as usual. */
1830a9643ea8Slogwang static sy_call_t *msgcalls[] = {
1831a9643ea8Slogwang 	(sy_call_t *)freebsd7_msgctl, (sy_call_t *)sys_msgget,
1832a9643ea8Slogwang 	(sy_call_t *)sys_msgsnd, (sy_call_t *)sys_msgrcv
1833a9643ea8Slogwang };
1834a9643ea8Slogwang 
1835a9643ea8Slogwang /*
1836a9643ea8Slogwang  * Entry point for all MSG calls.
1837*22ce4affSfengbojiang  *
1838*22ce4affSfengbojiang  * XXX actually varargs.
1839*22ce4affSfengbojiang  * struct msgsys_args {
1840*22ce4affSfengbojiang  *		int	which;
1841*22ce4affSfengbojiang  *		int	a2;
1842*22ce4affSfengbojiang  *		int	a3;
1843*22ce4affSfengbojiang  *		int	a4;
1844*22ce4affSfengbojiang  *		int	a5;
1845*22ce4affSfengbojiang  *		int	a6;
1846*22ce4affSfengbojiang  *	} *uap;
1847a9643ea8Slogwang  */
1848a9643ea8Slogwang int
sys_msgsys(struct thread * td,struct msgsys_args * uap)1849*22ce4affSfengbojiang sys_msgsys(struct thread *td, struct msgsys_args *uap)
1850a9643ea8Slogwang {
1851a9643ea8Slogwang 	int error;
1852a9643ea8Slogwang 
1853*22ce4affSfengbojiang 	AUDIT_ARG_SVIPC_WHICH(uap->which);
1854a9643ea8Slogwang 	if (uap->which < 0 || uap->which >= nitems(msgcalls))
1855a9643ea8Slogwang 		return (EINVAL);
1856a9643ea8Slogwang 	error = (*msgcalls[uap->which])(td, &uap->a2);
1857a9643ea8Slogwang 	return (error);
1858a9643ea8Slogwang }
1859a9643ea8Slogwang 
/*
 * Fallback definition of CP(): copy the member named fld from src to dst.
 * Only defined here when no CP macro is already in scope.
 */
#ifndef CP
#define CP(src, dst, fld)	do { (dst).fld = (src).fld; } while (0)
#endif
1863a9643ea8Slogwang 
/*
 * Argument structure for freebsd7_msgctl(); declared here only when
 * <sys/sysproto.h> has not been included.
 */
#ifndef _SYS_SYSPROTO_H_
struct freebsd7_msgctl_args {
	int	msqid;
	int	cmd;
	struct	msqid_ds_old *buf;
};
#endif
1871a9643ea8Slogwang int
freebsd7_msgctl(struct thread * td,struct freebsd7_msgctl_args * uap)1872*22ce4affSfengbojiang freebsd7_msgctl(struct thread *td, struct freebsd7_msgctl_args *uap)
1873a9643ea8Slogwang {
1874a9643ea8Slogwang 	struct msqid_ds_old msqold;
1875a9643ea8Slogwang 	struct msqid_ds msqbuf;
1876a9643ea8Slogwang 	int error;
1877a9643ea8Slogwang 
1878a9643ea8Slogwang 	DPRINTF(("call to freebsd7_msgctl(%d, %d, %p)\n", uap->msqid, uap->cmd,
1879a9643ea8Slogwang 	    uap->buf));
1880a9643ea8Slogwang 	if (uap->cmd == IPC_SET) {
1881a9643ea8Slogwang 		error = copyin(uap->buf, &msqold, sizeof(msqold));
1882a9643ea8Slogwang 		if (error)
1883a9643ea8Slogwang 			return (error);
1884a9643ea8Slogwang 		ipcperm_old2new(&msqold.msg_perm, &msqbuf.msg_perm);
1885*22ce4affSfengbojiang 		CP(msqold, msqbuf, __msg_first);
1886*22ce4affSfengbojiang 		CP(msqold, msqbuf, __msg_last);
1887a9643ea8Slogwang 		CP(msqold, msqbuf, msg_cbytes);
1888a9643ea8Slogwang 		CP(msqold, msqbuf, msg_qnum);
1889a9643ea8Slogwang 		CP(msqold, msqbuf, msg_qbytes);
1890a9643ea8Slogwang 		CP(msqold, msqbuf, msg_lspid);
1891a9643ea8Slogwang 		CP(msqold, msqbuf, msg_lrpid);
1892a9643ea8Slogwang 		CP(msqold, msqbuf, msg_stime);
1893a9643ea8Slogwang 		CP(msqold, msqbuf, msg_rtime);
1894a9643ea8Slogwang 		CP(msqold, msqbuf, msg_ctime);
1895a9643ea8Slogwang 	}
1896a9643ea8Slogwang 	error = kern_msgctl(td, uap->msqid, uap->cmd, &msqbuf);
1897a9643ea8Slogwang 	if (error)
1898a9643ea8Slogwang 		return (error);
1899a9643ea8Slogwang 	if (uap->cmd == IPC_STAT) {
1900a9643ea8Slogwang 		bzero(&msqold, sizeof(msqold));
1901a9643ea8Slogwang 		ipcperm_new2old(&msqbuf.msg_perm, &msqold.msg_perm);
1902*22ce4affSfengbojiang 		CP(msqbuf, msqold, __msg_first);
1903*22ce4affSfengbojiang 		CP(msqbuf, msqold, __msg_last);
1904a9643ea8Slogwang 		CP(msqbuf, msqold, msg_cbytes);
1905a9643ea8Slogwang 		CP(msqbuf, msqold, msg_qnum);
1906a9643ea8Slogwang 		CP(msqbuf, msqold, msg_qbytes);
1907a9643ea8Slogwang 		CP(msqbuf, msqold, msg_lspid);
1908a9643ea8Slogwang 		CP(msqbuf, msqold, msg_lrpid);
1909a9643ea8Slogwang 		CP(msqbuf, msqold, msg_stime);
1910a9643ea8Slogwang 		CP(msqbuf, msqold, msg_rtime);
1911a9643ea8Slogwang 		CP(msqbuf, msqold, msg_ctime);
1912a9643ea8Slogwang 		error = copyout(&msqold, uap->buf, sizeof(struct msqid_ds_old));
1913a9643ea8Slogwang 	}
1914a9643ea8Slogwang 	return (error);
1915a9643ea8Slogwang }
1916a9643ea8Slogwang 
1917a9643ea8Slogwang #undef CP
1918a9643ea8Slogwang 
1919a9643ea8Slogwang #endif	/* COMPAT_FREEBSD4 || COMPAT_FREEBSD5 || COMPAT_FREEBSD6 ||
1920a9643ea8Slogwang 	   COMPAT_FREEBSD7 */
1921