sysv_msg.c revision 141471
1139749Simp/*-
265942Sgibbs * Implementation of SVID messages
365942Sgibbs *
465942Sgibbs * Author:  Daniel Boulet
571717Sgibbs *
665942Sgibbs * Copyright 1993 Daniel Boulet and RTMX Inc.
765942Sgibbs *
865942Sgibbs * This system call was implemented by Daniel Boulet under contract from RTMX.
965942Sgibbs *
1065942Sgibbs * Redistribution and use in source forms, with and without modification,
1165942Sgibbs * are permitted provided that this entire comment appears intact.
1295378Sgibbs *
1395378Sgibbs * Redistribution in binary form may occur without any restrictions.
1495378Sgibbs * Obviously, it would be nice if you gave credit where credit is due
1595378Sgibbs * but requiring it would be too onerous.
1695378Sgibbs *
1795378Sgibbs * This software is provided ``AS IS'' without any warranties of any kind.
1895378Sgibbs */
1995378Sgibbs/*-
2095378Sgibbs * Copyright (c) 2003-2005 McAfee, Inc.
2195378Sgibbs * All rights reserved.
2265942Sgibbs *
2371717Sgibbs * This software was developed for the FreeBSD Project in part by McAfee
2495378Sgibbs * Research, the Security Research Division of McAfee, Inc under DARPA/SPAWAR
2595378Sgibbs * contract N66001-01-C-8035 ("CBOSS"), as part of the DARPA CHATS research
2671717Sgibbs * program.
2795378Sgibbs *
2895378Sgibbs * Redistribution and use in source and binary forms, with or without
2995378Sgibbs * modification, are permitted provided that the following conditions
3095378Sgibbs * are met:
3195378Sgibbs * 1. Redistributions of source code must retain the above copyright
3295378Sgibbs *    notice, this list of conditions and the following disclaimer.
3365942Sgibbs * 2. Redistributions in binary form must reproduce the above copyright
3465942Sgibbs *    notice, this list of conditions and the following disclaimer in the
3595378Sgibbs *    documentation and/or other materials provided with the distribution.
3695378Sgibbs *
3795378Sgibbs * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
3895378Sgibbs * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
3965942Sgibbs * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
40123579Sgibbs * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
4165942Sgibbs * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
4265942Sgibbs * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
4395378Sgibbs * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
4495378Sgibbs * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
4595378Sgibbs * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
4695378Sgibbs * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
4795378Sgibbs * SUCH DAMAGE.
48123579Sgibbs */
49123579Sgibbs
5095378Sgibbs#include <sys/cdefs.h>
5165942Sgibbs__FBSDID("$FreeBSD: head/sys/kern/sysv_msg.c 141471 2005-02-07 18:44:55Z jhb $");
5265942Sgibbs
5395378Sgibbs#include "opt_sysvipc.h"
5465942Sgibbs#include "opt_mac.h"
5565942Sgibbs
5665942Sgibbs#include <sys/param.h>
5765942Sgibbs#include <sys/systm.h>
5865942Sgibbs#include <sys/sysproto.h>
59107411Sscottl#include <sys/kernel.h>
60107411Sscottl#include <sys/proc.h>
6165942Sgibbs#include <sys/lock.h>
62114621Sgibbs#include <sys/mac.h>
63114621Sgibbs#include <sys/mutex.h>
64114621Sgibbs#include <sys/module.h>
65102669Sgibbs#include <sys/msg.h>
6665942Sgibbs#include <sys/syscall.h>
67132107Sstefanf#include <sys/syscallsubr.h>
6865942Sgibbs#include <sys/sysent.h>
6965942Sgibbs#include <sys/sysctl.h>
70115915Sgibbs#include <sys/malloc.h>
7165942Sgibbs#include <sys/jail.h>
7265942Sgibbs
7365942Sgibbsstatic MALLOC_DEFINE(M_MSG, "msg", "SVID compatible message queues");
7465942Sgibbs
7565942Sgibbsstatic void msginit(void);
7665942Sgibbsstatic int msgunload(void);
7765942Sgibbsstatic int sysvmsg_modload(struct module *, int, void *);
7865942Sgibbs
/*
 * Debug tracing helpers.  Both take a fully parenthesized printf argument
 * list, e.g. DPRINTF(("x=%d\n", x)), and expand to nothing (arguments are
 * not evaluated) unless the matching *_DEBUG symbol is defined.
 */
#if defined(MSG_DEBUG)
#define DPRINTF(a)	printf a
#else
#define DPRINTF(a)
#endif

#if defined(MAC_DEBUG)
#define MPRINTF(a)	printf a
#else
#define MPRINTF(a)
#endif
89115915Sgibbs
90115915Sgibbsstatic void msg_freehdr(struct msg *msghdr);
91107411Sscottl
92107411Sscottl/* XXX casting to (sy_call_t *) is bogus, as usual. */
93107411Sscottlstatic sy_call_t *msgcalls[] = {
94107411Sscottl	(sy_call_t *)msgctl, (sy_call_t *)msgget,
95107411Sscottl	(sy_call_t *)msgsnd, (sy_call_t *)msgrcv
96107411Sscottl};
97107411Sscottl
/*
 * Compile-time defaults for the message queue limits.  Each one may be
 * overridden from the kernel configuration; MSGMAX is always derived.
 */
#if !defined(MSGSSZ)
#define MSGSSZ	8		/* Each segment must be 2^N long */
#endif

#if !defined(MSGSEG)
#define MSGSEG	2048		/* must be less than 32767 */
#endif

#define MSGMAX	(MSGSSZ * MSGSEG)

#if !defined(MSGMNB)
#define MSGMNB	2048		/* max # of bytes in a queue */
#endif

#if !defined(MSGMNI)
#define MSGMNI	40
#endif

#if !defined(MSGTQL)
#define MSGTQL	40
#endif
11465942Sgibbs
11565942Sgibbs/*
11665942Sgibbs * Based on the configuration parameters described in an SVR2 (yes, two)
11765942Sgibbs * config(1m) man page.
11865942Sgibbs *
11965942Sgibbs * Each message is broken up and stored in segments that are msgssz bytes
12065942Sgibbs * long.  For efficiency reasons, this should be a power of two.  Also,
12165942Sgibbs * it doesn't make sense if it is less than 8 or greater than about 256.
12265942Sgibbs * Consequently, msginit in kern/sysv_msg.c checks that msgssz is a power of
12365942Sgibbs * two between 8 and 1024 inclusive (and panic's if it isn't).
12465942Sgibbs */
12565942Sgibbsstruct msginfo msginfo = {
12665942Sgibbs                MSGMAX,         /* max chars in a message */
12795378Sgibbs                MSGMNI,         /* # of message queue identifiers */
12865942Sgibbs                MSGMNB,         /* max chars in a queue */
12965942Sgibbs                MSGTQL,         /* max messages in system */
130102669Sgibbs                MSGSSZ,         /* size of a message segment */
13165942Sgibbs                		/* (must be small power of 2 greater than 4) */
13274094Sgibbs                MSGSEG          /* number of message segments */
13374094Sgibbs};
13465942Sgibbs
/*
 * Implementation-specific conversions between a queue table slot and the
 * user-visible msqid: the low 16 bits hold the slot index and the high
 * 16 bits hold the slot's sequence number.
 */
#define MSQID(ix,ds)	\
	(((ix) & 0xffff) | (((ds).msg_perm.seq << 16) & 0xffff0000))
#define MSQID_IX(id)	((id) & 0xffff)
#define MSQID_SEQ(id)	(((id) >> 16) & 0xffff)
14265942Sgibbs
14365942Sgibbs/*
14495378Sgibbs * The rest of this file is specific to this particular implementation.
14595378Sgibbs */
14695378Sgibbs
/*
 * One entry per message segment.  "next" links segments into chains:
 * -1 terminates a chain (and marks an unlinked entry), any other value
 * in 0..(MSGSEG-1) is the index of the following segment.
 */
struct msgmap {
	short	next;
};
15279874Sgibbs
15379874Sgibbs#define MSG_LOCKED	01000	/* Is this msqid_ds locked? */
154114621Sgibbs
155114621Sgibbsstatic int nfree_msgmaps;	/* # of free map entries */
15665942Sgibbsstatic short free_msgmaps;	/* head of linked list of free map entries */
157114621Sgibbsstatic struct msg *free_msghdrs;/* list of free msg headers */
158114621Sgibbsstatic char *msgpool;		/* MSGMAX byte long msg buffer pool */
159114621Sgibbsstatic struct msgmap *msgmaps;	/* MSGSEG msgmap structures */
160114621Sgibbsstatic struct msg *msghdrs;	/* MSGTQL msg headers */
161115917Sgibbsstatic struct msqid_kernel *msqids;	/* MSGMNI msqid_kernel struct's */
16265942Sgibbsstatic struct mtx msq_mtx;	/* global mutex for message queues. */
16365942Sgibbs
16465942Sgibbsstatic void
16574094Sgibbsmsginit()
16674094Sgibbs{
16774094Sgibbs	register int i;
16874094Sgibbs
16974094Sgibbs	TUNABLE_INT_FETCH("kern.ipc.msgseg", &msginfo.msgseg);
17074094Sgibbs	TUNABLE_INT_FETCH("kern.ipc.msgssz", &msginfo.msgssz);
17174094Sgibbs	msginfo.msgmax = msginfo.msgseg * msginfo.msgssz;
17274094Sgibbs	TUNABLE_INT_FETCH("kern.ipc.msgmni", &msginfo.msgmni);
17374094Sgibbs	TUNABLE_INT_FETCH("kern.ipc.msgmnb", &msginfo.msgmnb);
17474094Sgibbs	TUNABLE_INT_FETCH("kern.ipc.msgtql", &msginfo.msgtql);
17574094Sgibbs
17674094Sgibbs	msgpool = malloc(msginfo.msgmax, M_MSG, M_WAITOK);
177123579Sgibbs	if (msgpool == NULL)
17874094Sgibbs		panic("msgpool is NULL");
17974094Sgibbs	msgmaps = malloc(sizeof(struct msgmap) * msginfo.msgseg, M_MSG, M_WAITOK);
18074094Sgibbs	if (msgmaps == NULL)
18174094Sgibbs		panic("msgmaps is NULL");
18274094Sgibbs	msghdrs = malloc(sizeof(struct msg) * msginfo.msgtql, M_MSG, M_WAITOK);
18374094Sgibbs	if (msghdrs == NULL)
18479874Sgibbs		panic("msghdrs is NULL");
18565942Sgibbs	msqids = malloc(sizeof(struct msqid_kernel) * msginfo.msgmni, M_MSG,
18665942Sgibbs	    M_WAITOK);
18765942Sgibbs	if (msqids == NULL)
18865942Sgibbs		panic("msqids is NULL");
18965942Sgibbs
19065942Sgibbs	/*
19165942Sgibbs	 * msginfo.msgssz should be a power of two for efficiency reasons.
19265942Sgibbs	 * It is also pretty silly if msginfo.msgssz is less than 8
19365942Sgibbs	 * or greater than about 256 so ...
19465942Sgibbs	 */
19565942Sgibbs
19665942Sgibbs	i = 8;
19774094Sgibbs	while (i < 1024 && i != msginfo.msgssz)
19865942Sgibbs		i <<= 1;
19965942Sgibbs    	if (i != msginfo.msgssz) {
20065942Sgibbs		DPRINTF(("msginfo.msgssz=%d (0x%x)\n", msginfo.msgssz,
20165942Sgibbs		    msginfo.msgssz));
20265942Sgibbs		panic("msginfo.msgssz not a small power of 2");
20365942Sgibbs	}
20465942Sgibbs
20565942Sgibbs	if (msginfo.msgseg > 32767) {
20665942Sgibbs		DPRINTF(("msginfo.msgseg=%d\n", msginfo.msgseg));
20765942Sgibbs		panic("msginfo.msgseg > 32767");
20865942Sgibbs	}
20965942Sgibbs
21065942Sgibbs	if (msgmaps == NULL)
21165942Sgibbs		panic("msgmaps is NULL");
21265942Sgibbs
21365942Sgibbs	for (i = 0; i < msginfo.msgseg; i++) {
21465942Sgibbs		if (i > 0)
215102669Sgibbs			msgmaps[i-1].next = i;
216102669Sgibbs		msgmaps[i].next = -1;	/* implies entry is available */
21765942Sgibbs	}
21865942Sgibbs	free_msgmaps = 0;
21965942Sgibbs	nfree_msgmaps = msginfo.msgseg;
22065942Sgibbs
221102669Sgibbs	if (msghdrs == NULL)
22265942Sgibbs		panic("msghdrs is NULL");
22365942Sgibbs
22465942Sgibbs	for (i = 0; i < msginfo.msgtql; i++) {
22565942Sgibbs		msghdrs[i].msg_type = 0;
22665942Sgibbs		if (i > 0)
227102669Sgibbs			msghdrs[i-1].msg_next = &msghdrs[i];
228102669Sgibbs		msghdrs[i].msg_next = NULL;
229102669Sgibbs#ifdef MAC
230102669Sgibbs		mac_init_sysv_msgmsg(&msghdrs[i]);
23165942Sgibbs#endif
23265942Sgibbs    	}
23365942Sgibbs	free_msghdrs = &msghdrs[0];
23465942Sgibbs
23565942Sgibbs	if (msqids == NULL)
23665942Sgibbs		panic("msqids is NULL");
23765942Sgibbs
23865942Sgibbs	for (i = 0; i < msginfo.msgmni; i++) {
23965942Sgibbs		msqids[i].u.msg_qbytes = 0;	/* implies entry is available */
24065942Sgibbs		msqids[i].u.msg_perm.seq = 0;	/* reset to a known value */
24165942Sgibbs		msqids[i].u.msg_perm.mode = 0;
242114621Sgibbs#ifdef MAC
243114621Sgibbs		mac_init_sysv_msgqueue(&msqids[i]);
244114621Sgibbs#endif
24565942Sgibbs	}
24665942Sgibbs	mtx_init(&msq_mtx, "msq", NULL, MTX_DEF);
24765942Sgibbs}
24865942Sgibbs
24965942Sgibbsstatic int
25065942Sgibbsmsgunload()
25165942Sgibbs{
252102669Sgibbs	struct msqid_kernel *msqkptr;
253102669Sgibbs	int msqid;
254102669Sgibbs#ifdef MAC
255102669Sgibbs	int i;
256168807Sscottl#endif
25765942Sgibbs
25871390Sgibbs	for (msqid = 0; msqid < msginfo.msgmni; msqid++) {
25971390Sgibbs		/*
26071390Sgibbs		 * Look for an unallocated and unlocked msqid_ds.
26171390Sgibbs		 * msqid_ds's can be locked by msgsnd or msgrcv while
26271390Sgibbs		 * they are copying the message in/out.  We can't
26365942Sgibbs		 * re-use the entry until they release it.
26465942Sgibbs		 */
26565942Sgibbs		msqkptr = &msqids[msqid];
26665942Sgibbs		if (msqkptr->u.msg_qbytes != 0 ||
267168807Sscottl		    (msqkptr->u.msg_perm.mode & MSG_LOCKED) != 0)
26874972Sgibbs			break;
26965942Sgibbs	}
27065942Sgibbs	if (msqid != msginfo.msgmni)
27165942Sgibbs		return (EBUSY);
272114621Sgibbs
273114621Sgibbs#ifdef MAC
274114621Sgibbs	for (i = 0; i < msginfo.msgtql; i++)
275114621Sgibbs		mac_destroy_sysv_msgmsg(&msghdrs[i]);
276114621Sgibbs	for (msqid = 0; msqid < msginfo.msgmni; msqid++)
277114621Sgibbs		mac_destroy_sysv_msgqueue(&msqids[msqid]);
278114621Sgibbs#endif
279114621Sgibbs	free(msgpool, M_MSG);
280114621Sgibbs	free(msgmaps, M_MSG);
281114621Sgibbs	free(msghdrs, M_MSG);
282114621Sgibbs	free(msqids, M_MSG);
283114621Sgibbs	mtx_destroy(&msq_mtx);
284114621Sgibbs	return (0);
285114621Sgibbs}
286114621Sgibbs
287114621Sgibbs
288114621Sgibbsstatic int
289114621Sgibbssysvmsg_modload(struct module *module, int cmd, void *arg)
290114621Sgibbs{
291114621Sgibbs	int error = 0;
292114621Sgibbs
293114621Sgibbs	switch (cmd) {
29465942Sgibbs	case MOD_LOAD:
29565942Sgibbs		msginit();
29665942Sgibbs		break;
297102669Sgibbs	case MOD_UNLOAD:
29865942Sgibbs		error = msgunload();
29965942Sgibbs		break;
300102669Sgibbs	case MOD_SHUTDOWN:
301102669Sgibbs		break;
302102669Sgibbs	default:
303102669Sgibbs		error = EINVAL;
30465942Sgibbs		break;
30565942Sgibbs	}
30665942Sgibbs	return (error);
30765942Sgibbs}
30865942Sgibbs
30965942Sgibbsstatic moduledata_t sysvmsg_mod = {
31065942Sgibbs	"sysvmsg",
31165942Sgibbs	&sysvmsg_modload,
31265942Sgibbs	NULL
31365942Sgibbs};
31465942Sgibbs
31565942SgibbsSYSCALL_MODULE_HELPER(msgsys);
316102669SgibbsSYSCALL_MODULE_HELPER(msgctl);
31765942SgibbsSYSCALL_MODULE_HELPER(msgget);
31865942SgibbsSYSCALL_MODULE_HELPER(msgsnd);
31965942SgibbsSYSCALL_MODULE_HELPER(msgrcv);
320104231Sgibbs
321114621SgibbsDECLARE_MODULE(sysvmsg, sysvmsg_mod,
32265942Sgibbs	SI_SUB_SYSV_MSG, SI_ORDER_FIRST);
32365942SgibbsMODULE_VERSION(sysvmsg, 1);
32465942Sgibbs
325102669Sgibbs/*
32665942Sgibbs * Entry point for all MSG calls
32765942Sgibbs *
32865942Sgibbs * MPSAFE
32965942Sgibbs */
33065942Sgibbsint
33165942Sgibbsmsgsys(td, uap)
33265942Sgibbs	struct thread *td;
33365942Sgibbs	/* XXX actually varargs. */
33465942Sgibbs	struct msgsys_args /* {
33565942Sgibbs		int	which;
33665942Sgibbs		int	a2;
33765942Sgibbs		int	a3;
33865942Sgibbs		int	a4;
33965942Sgibbs		int	a5;
34065942Sgibbs		int	a6;
34165942Sgibbs	} */ *uap;
34265942Sgibbs{
343102669Sgibbs	int error;
344102669Sgibbs
34565942Sgibbs	if (!jail_sysvipc_allowed && jailed(td->td_ucred))
34665942Sgibbs		return (ENOSYS);
347102669Sgibbs	if (uap->which < 0 ||
34865942Sgibbs	    uap->which >= sizeof(msgcalls)/sizeof(msgcalls[0]))
34965942Sgibbs		return (EINVAL);
350102669Sgibbs	error = (*msgcalls[uap->which])(td, &uap->a2);
351102669Sgibbs	return (error);
352102669Sgibbs}
353102669Sgibbs
35465942Sgibbsstatic void
355102669Sgibbsmsg_freehdr(msghdr)
35665942Sgibbs	struct msg *msghdr;
357102669Sgibbs{
35865942Sgibbs	while (msghdr->msg_ts > 0) {
35965942Sgibbs		short next;
36065942Sgibbs		if (msghdr->msg_spot < 0 || msghdr->msg_spot >= msginfo.msgseg)
36165942Sgibbs			panic("msghdr->msg_spot out of range");
36265942Sgibbs		next = msgmaps[msghdr->msg_spot].next;
36365942Sgibbs		msgmaps[msghdr->msg_spot].next = free_msgmaps;
364102669Sgibbs		free_msgmaps = msghdr->msg_spot;
36565942Sgibbs		nfree_msgmaps++;
36665942Sgibbs		msghdr->msg_spot = next;
367102669Sgibbs		if (msghdr->msg_ts >= msginfo.msgssz)
36865942Sgibbs			msghdr->msg_ts -= msginfo.msgssz;
369102669Sgibbs		else
37065942Sgibbs			msghdr->msg_ts = 0;
37165942Sgibbs	}
372102669Sgibbs	if (msghdr->msg_spot != -1)
37365942Sgibbs		panic("msghdr->msg_spot != -1");
37465942Sgibbs	msghdr->msg_next = free_msghdrs;
37565942Sgibbs	free_msghdrs = msghdr;
37665942Sgibbs#ifdef MAC
377102669Sgibbs	mac_cleanup_sysv_msgmsg(msghdr);
37865942Sgibbs#endif
37965942Sgibbs}
380102669Sgibbs
38165942Sgibbs#ifndef _SYS_SYSPROTO_H_
38265942Sgibbsstruct msgctl_args {
38365942Sgibbs	int	msqid;
38479874Sgibbs	int	cmd;
38565942Sgibbs	struct	msqid_ds *buf;
38665942Sgibbs};
38765942Sgibbs#endif
38879874Sgibbs
38979874Sgibbs/*
39065942Sgibbs * MPSAFE
39165942Sgibbs */
39265942Sgibbsint
39365942Sgibbsmsgctl(td, uap)
39479874Sgibbs	struct thread *td;
39565942Sgibbs	register struct msgctl_args *uap;
39665942Sgibbs{
39765942Sgibbs	int msqid = uap->msqid;
39879874Sgibbs	int cmd = uap->cmd;
39979874Sgibbs	struct msqid_ds msqbuf;
40065942Sgibbs	int error;
40165942Sgibbs
40265942Sgibbs	DPRINTF(("call to msgctl(%d, %d, 0x%x)\n", msqid, cmd, uap->buf));
40365942Sgibbs	if (cmd == IPC_SET &&
40479874Sgibbs	    (error = copyin(uap->buf, &msqbuf, sizeof(msqbuf))) != 0)
40565942Sgibbs		return (error);
40679874Sgibbs	error = kern_msgctl(td, msqid, cmd, &msqbuf);
40779874Sgibbs	if (cmd == IPC_STAT && error == 0)
40879874Sgibbs		error = copyout(&msqbuf, uap->buf, sizeof(struct msqid_ds));
40979874Sgibbs	return (error);
41079874Sgibbs}
41179874Sgibbs
412114621Sgibbsint
41365942Sgibbskern_msgctl(td, msqid, cmd, msqbuf)
41465942Sgibbs	struct thread *td;
415	int msqid;
416	int cmd;
417	struct msqid_ds *msqbuf;
418{
419	int rval, error, msqix;
420	register struct msqid_kernel *msqkptr;
421
422	if (!jail_sysvipc_allowed && jailed(td->td_ucred))
423		return (ENOSYS);
424
425	msqix = IPCID_TO_IX(msqid);
426
427	if (msqix < 0 || msqix >= msginfo.msgmni) {
428		DPRINTF(("msqid (%d) out of range (0<=msqid<%d)\n", msqix,
429		    msginfo.msgmni));
430		return (EINVAL);
431	}
432
433	msqkptr = &msqids[msqix];
434
435	mtx_lock(&msq_mtx);
436	if (msqkptr->u.msg_qbytes == 0) {
437		DPRINTF(("no such msqid\n"));
438		error = EINVAL;
439		goto done2;
440	}
441	if (msqkptr->u.msg_perm.seq != IPCID_TO_SEQ(msqid)) {
442		DPRINTF(("wrong sequence number\n"));
443		error = EINVAL;
444		goto done2;
445	}
446#ifdef MAC
447	error = mac_check_sysv_msqctl(td->td_ucred, msqkptr, cmd);
448	if (error != 0) {
449		MPRINTF(("mac_check_sysv_msqctl returned %d\n", error));
450		goto done2;
451	}
452#endif
453
454	error = 0;
455	rval = 0;
456
457	switch (cmd) {
458
459	case IPC_RMID:
460	{
461		struct msg *msghdr;
462		if ((error = ipcperm(td, &msqkptr->u.msg_perm, IPC_M)))
463			goto done2;
464
465#ifdef MAC
466		/*
467		 * Check that the thread has MAC access permissions to
468		 * individual msghdrs.  Note: We need to do this in a
469		 * separate loop because the actual loop alters the
470		 * msq/msghdr info as it progresses, and there is no going
471		 * back if half the way through we discover that the
472		 * thread cannot free a certain msghdr.  The msq will get
473		 * into an inconsistent state.
474		 */
475		for (msghdr = msqkptr->u.msg_first; msghdr != NULL;
476		    msghdr = msghdr->msg_next) {
477			error = mac_check_sysv_msgrmid(td->td_ucred, msghdr);
478			if (error != 0) {
479				MPRINTF(("mac_check_sysv_msgrmid returned %d\n",
480				    error));
481				goto done2;
482			}
483		}
484#endif
485
486		/* Free the message headers */
487		msghdr = msqkptr->u.msg_first;
488		while (msghdr != NULL) {
489			struct msg *msghdr_tmp;
490
491			/* Free the segments of each message */
492			msqkptr->u.msg_cbytes -= msghdr->msg_ts;
493			msqkptr->u.msg_qnum--;
494			msghdr_tmp = msghdr;
495			msghdr = msghdr->msg_next;
496			msg_freehdr(msghdr_tmp);
497		}
498
499		if (msqkptr->u.msg_cbytes != 0)
500			panic("msg_cbytes is screwed up");
501		if (msqkptr->u.msg_qnum != 0)
502			panic("msg_qnum is screwed up");
503
504		msqkptr->u.msg_qbytes = 0;	/* Mark it as free */
505
506#ifdef MAC
507		mac_cleanup_sysv_msgqueue(msqkptr);
508#endif
509
510		wakeup(msqkptr);
511	}
512
513		break;
514
515	case IPC_SET:
516		if ((error = ipcperm(td, &msqkptr->u.msg_perm, IPC_M)))
517			goto done2;
518		if (msqbuf->msg_qbytes > msqkptr->u.msg_qbytes) {
519			error = suser(td);
520			if (error)
521				goto done2;
522		}
523		if (msqbuf->msg_qbytes > msginfo.msgmnb) {
524			DPRINTF(("can't increase msg_qbytes beyond %d"
525			    "(truncating)\n", msginfo.msgmnb));
526			msqbuf->msg_qbytes = msginfo.msgmnb;	/* silently restrict qbytes to system limit */
527		}
528		if (msqbuf->msg_qbytes == 0) {
529			DPRINTF(("can't reduce msg_qbytes to 0\n"));
530			error = EINVAL;		/* non-standard errno! */
531			goto done2;
532		}
533		msqkptr->u.msg_perm.uid = msqbuf->msg_perm.uid;	/* change the owner */
534		msqkptr->u.msg_perm.gid = msqbuf->msg_perm.gid;	/* change the owner */
535		msqkptr->u.msg_perm.mode = (msqkptr->u.msg_perm.mode & ~0777) |
536		    (msqbuf->msg_perm.mode & 0777);
537		msqkptr->u.msg_qbytes = msqbuf->msg_qbytes;
538		msqkptr->u.msg_ctime = time_second;
539		break;
540
541	case IPC_STAT:
542		if ((error = ipcperm(td, &msqkptr->u.msg_perm, IPC_R))) {
543			DPRINTF(("requester doesn't have read access\n"));
544			goto done2;
545		}
546		*msqbuf = msqkptr->u;
547		break;
548
549	default:
550		DPRINTF(("invalid command %d\n", cmd));
551		error = EINVAL;
552		goto done2;
553	}
554
555	if (error == 0)
556		td->td_retval[0] = rval;
557done2:
558	mtx_unlock(&msq_mtx);
559	return (error);
560}
561
562#ifndef _SYS_SYSPROTO_H_
563struct msgget_args {
564	key_t	key;
565	int	msgflg;
566};
567#endif
568
569/*
570 * MPSAFE
571 */
572int
573msgget(td, uap)
574	struct thread *td;
575	register struct msgget_args *uap;
576{
577	int msqid, error = 0;
578	int key = uap->key;
579	int msgflg = uap->msgflg;
580	struct ucred *cred = td->td_ucred;
581	register struct msqid_kernel *msqkptr = NULL;
582
583	DPRINTF(("msgget(0x%x, 0%o)\n", key, msgflg));
584
585	if (!jail_sysvipc_allowed && jailed(td->td_ucred))
586		return (ENOSYS);
587
588	mtx_lock(&msq_mtx);
589	if (key != IPC_PRIVATE) {
590		for (msqid = 0; msqid < msginfo.msgmni; msqid++) {
591			msqkptr = &msqids[msqid];
592			if (msqkptr->u.msg_qbytes != 0 &&
593			    msqkptr->u.msg_perm.key == key)
594				break;
595		}
596		if (msqid < msginfo.msgmni) {
597			DPRINTF(("found public key\n"));
598			if ((msgflg & IPC_CREAT) && (msgflg & IPC_EXCL)) {
599				DPRINTF(("not exclusive\n"));
600				error = EEXIST;
601				goto done2;
602			}
603			if ((error = ipcperm(td, &msqkptr->u.msg_perm,
604			    msgflg & 0700))) {
605				DPRINTF(("requester doesn't have 0%o access\n",
606				    msgflg & 0700));
607				goto done2;
608			}
609#ifdef MAC
610			error = mac_check_sysv_msqget(cred, msqkptr);
611			if (error != 0) {
612				MPRINTF(("mac_check_sysv_msqget returned %d\n",
613				    error));
614				goto done2;
615			}
616#endif
617			goto found;
618		}
619	}
620
621	DPRINTF(("need to allocate the msqid_ds\n"));
622	if (key == IPC_PRIVATE || (msgflg & IPC_CREAT)) {
623		for (msqid = 0; msqid < msginfo.msgmni; msqid++) {
624			/*
625			 * Look for an unallocated and unlocked msqid_ds.
626			 * msqid_ds's can be locked by msgsnd or msgrcv while
627			 * they are copying the message in/out.  We can't
628			 * re-use the entry until they release it.
629			 */
630			msqkptr = &msqids[msqid];
631			if (msqkptr->u.msg_qbytes == 0 &&
632			    (msqkptr->u.msg_perm.mode & MSG_LOCKED) == 0)
633				break;
634		}
635		if (msqid == msginfo.msgmni) {
636			DPRINTF(("no more msqid_ds's available\n"));
637			error = ENOSPC;
638			goto done2;
639		}
640		DPRINTF(("msqid %d is available\n", msqid));
641		msqkptr->u.msg_perm.key = key;
642		msqkptr->u.msg_perm.cuid = cred->cr_uid;
643		msqkptr->u.msg_perm.uid = cred->cr_uid;
644		msqkptr->u.msg_perm.cgid = cred->cr_gid;
645		msqkptr->u.msg_perm.gid = cred->cr_gid;
646		msqkptr->u.msg_perm.mode = (msgflg & 0777);
647		/* Make sure that the returned msqid is unique */
648		msqkptr->u.msg_perm.seq = (msqkptr->u.msg_perm.seq + 1) & 0x7fff;
649		msqkptr->u.msg_first = NULL;
650		msqkptr->u.msg_last = NULL;
651		msqkptr->u.msg_cbytes = 0;
652		msqkptr->u.msg_qnum = 0;
653		msqkptr->u.msg_qbytes = msginfo.msgmnb;
654		msqkptr->u.msg_lspid = 0;
655		msqkptr->u.msg_lrpid = 0;
656		msqkptr->u.msg_stime = 0;
657		msqkptr->u.msg_rtime = 0;
658		msqkptr->u.msg_ctime = time_second;
659#ifdef MAC
660		mac_create_sysv_msgqueue(cred, msqkptr);
661#endif
662	} else {
663		DPRINTF(("didn't find it and wasn't asked to create it\n"));
664		error = ENOENT;
665		goto done2;
666	}
667
668found:
669	/* Construct the unique msqid */
670	td->td_retval[0] = IXSEQ_TO_IPCID(msqid, msqkptr->u.msg_perm);
671done2:
672	mtx_unlock(&msq_mtx);
673	return (error);
674}
675
676#ifndef _SYS_SYSPROTO_H_
677struct msgsnd_args {
678	int	msqid;
679	const void	*msgp;
680	size_t	msgsz;
681	int	msgflg;
682};
683#endif
684
685/*
686 * MPSAFE
687 */
688int
689msgsnd(td, uap)
690	struct thread *td;
691	register struct msgsnd_args *uap;
692{
693	int msqid = uap->msqid;
694	const void *user_msgp = uap->msgp;
695	size_t msgsz = uap->msgsz;
696	int msgflg = uap->msgflg;
697	int segs_needed, error = 0;
698	register struct msqid_kernel *msqkptr;
699	register struct msg *msghdr;
700	short next;
701
702	DPRINTF(("call to msgsnd(%d, 0x%x, %d, %d)\n", msqid, user_msgp, msgsz,
703	    msgflg));
704	if (!jail_sysvipc_allowed && jailed(td->td_ucred))
705		return (ENOSYS);
706
707	mtx_lock(&msq_mtx);
708	msqid = IPCID_TO_IX(msqid);
709
710	if (msqid < 0 || msqid >= msginfo.msgmni) {
711		DPRINTF(("msqid (%d) out of range (0<=msqid<%d)\n", msqid,
712		    msginfo.msgmni));
713		error = EINVAL;
714		goto done2;
715	}
716
717	msqkptr = &msqids[msqid];
718	if (msqkptr->u.msg_qbytes == 0) {
719		DPRINTF(("no such message queue id\n"));
720		error = EINVAL;
721		goto done2;
722	}
723	if (msqkptr->u.msg_perm.seq != IPCID_TO_SEQ(uap->msqid)) {
724		DPRINTF(("wrong sequence number\n"));
725		error = EINVAL;
726		goto done2;
727	}
728
729	if ((error = ipcperm(td, &msqkptr->u.msg_perm, IPC_W))) {
730		DPRINTF(("requester doesn't have write access\n"));
731		goto done2;
732	}
733
734#ifdef MAC
735	error = mac_check_sysv_msqsnd(td->td_ucred, msqkptr);
736	if (error != 0) {
737		MPRINTF(("mac_check_sysv_msqsnd returned %d\n", error));
738		goto done2;
739	}
740#endif
741
742	segs_needed = (msgsz + msginfo.msgssz - 1) / msginfo.msgssz;
743	DPRINTF(("msgsz=%d, msgssz=%d, segs_needed=%d\n", msgsz, msginfo.msgssz,
744	    segs_needed));
745	for (;;) {
746		int need_more_resources = 0;
747
748		/*
749		 * check msgsz
750		 * (inside this loop in case msg_qbytes changes while we sleep)
751		 */
752
753		if (msgsz > msqkptr->u.msg_qbytes) {
754			DPRINTF(("msgsz > msqkptr->u.msg_qbytes\n"));
755			error = EINVAL;
756			goto done2;
757		}
758
759		if (msqkptr->u.msg_perm.mode & MSG_LOCKED) {
760			DPRINTF(("msqid is locked\n"));
761			need_more_resources = 1;
762		}
763		if (msgsz + msqkptr->u.msg_cbytes > msqkptr->u.msg_qbytes) {
764			DPRINTF(("msgsz + msg_cbytes > msg_qbytes\n"));
765			need_more_resources = 1;
766		}
767		if (segs_needed > nfree_msgmaps) {
768			DPRINTF(("segs_needed > nfree_msgmaps\n"));
769			need_more_resources = 1;
770		}
771		if (free_msghdrs == NULL) {
772			DPRINTF(("no more msghdrs\n"));
773			need_more_resources = 1;
774		}
775
776		if (need_more_resources) {
777			int we_own_it;
778
779			if ((msgflg & IPC_NOWAIT) != 0) {
780				DPRINTF(("need more resources but caller "
781				    "doesn't want to wait\n"));
782				error = EAGAIN;
783				goto done2;
784			}
785
786			if ((msqkptr->u.msg_perm.mode & MSG_LOCKED) != 0) {
787				DPRINTF(("we don't own the msqid_ds\n"));
788				we_own_it = 0;
789			} else {
790				/* Force later arrivals to wait for our
791				   request */
792				DPRINTF(("we own the msqid_ds\n"));
793				msqkptr->u.msg_perm.mode |= MSG_LOCKED;
794				we_own_it = 1;
795			}
796			DPRINTF(("goodnight\n"));
797			error = msleep(msqkptr, &msq_mtx, (PZERO - 4) | PCATCH,
798			    "msgwait", 0);
799			DPRINTF(("good morning, error=%d\n", error));
800			if (we_own_it)
801				msqkptr->u.msg_perm.mode &= ~MSG_LOCKED;
802			if (error != 0) {
803				DPRINTF(("msgsnd:  interrupted system call\n"));
804				error = EINTR;
805				goto done2;
806			}
807
808			/*
809			 * Make sure that the msq queue still exists
810			 */
811
812			if (msqkptr->u.msg_qbytes == 0) {
813				DPRINTF(("msqid deleted\n"));
814				error = EIDRM;
815				goto done2;
816			}
817
818		} else {
819			DPRINTF(("got all the resources that we need\n"));
820			break;
821		}
822	}
823
824	/*
825	 * We have the resources that we need.
826	 * Make sure!
827	 */
828
829	if (msqkptr->u.msg_perm.mode & MSG_LOCKED)
830		panic("msg_perm.mode & MSG_LOCKED");
831	if (segs_needed > nfree_msgmaps)
832		panic("segs_needed > nfree_msgmaps");
833	if (msgsz + msqkptr->u.msg_cbytes > msqkptr->u.msg_qbytes)
834		panic("msgsz + msg_cbytes > msg_qbytes");
835	if (free_msghdrs == NULL)
836		panic("no more msghdrs");
837
838	/*
839	 * Re-lock the msqid_ds in case we page-fault when copying in the
840	 * message
841	 */
842
843	if ((msqkptr->u.msg_perm.mode & MSG_LOCKED) != 0)
844		panic("msqid_ds is already locked");
845	msqkptr->u.msg_perm.mode |= MSG_LOCKED;
846
847	/*
848	 * Allocate a message header
849	 */
850
851	msghdr = free_msghdrs;
852	free_msghdrs = msghdr->msg_next;
853	msghdr->msg_spot = -1;
854	msghdr->msg_ts = msgsz;
855#ifdef MAC
856	/*
857	 * XXXMAC: Should the mac_check_sysv_msgmsq check follow here
858	 * immediately?  Or, should it be checked just before the msg is
859	 * enqueued in the msgq (as it is done now)?
860	 */
861	mac_create_sysv_msgmsg(td->td_ucred, msqkptr, msghdr);
862#endif
863
864	/*
865	 * Allocate space for the message
866	 */
867
868	while (segs_needed > 0) {
869		if (nfree_msgmaps <= 0)
870			panic("not enough msgmaps");
871		if (free_msgmaps == -1)
872			panic("nil free_msgmaps");
873		next = free_msgmaps;
874		if (next <= -1)
875			panic("next too low #1");
876		if (next >= msginfo.msgseg)
877			panic("next out of range #1");
878		DPRINTF(("allocating segment %d to message\n", next));
879		free_msgmaps = msgmaps[next].next;
880		nfree_msgmaps--;
881		msgmaps[next].next = msghdr->msg_spot;
882		msghdr->msg_spot = next;
883		segs_needed--;
884	}
885
886	/*
887	 * Copy in the message type
888	 */
889
890	mtx_unlock(&msq_mtx);
891	if ((error = copyin(user_msgp, &msghdr->msg_type,
892	    sizeof(msghdr->msg_type))) != 0) {
893		mtx_lock(&msq_mtx);
894		DPRINTF(("error %d copying the message type\n", error));
895		msg_freehdr(msghdr);
896		msqkptr->u.msg_perm.mode &= ~MSG_LOCKED;
897		wakeup(msqkptr);
898		goto done2;
899	}
900	mtx_lock(&msq_mtx);
901	user_msgp = (const char *)user_msgp + sizeof(msghdr->msg_type);
902
903	/*
904	 * Validate the message type
905	 */
906
907	if (msghdr->msg_type < 1) {
908		msg_freehdr(msghdr);
909		msqkptr->u.msg_perm.mode &= ~MSG_LOCKED;
910		wakeup(msqkptr);
911		DPRINTF(("mtype (%d) < 1\n", msghdr->msg_type));
912		error = EINVAL;
913		goto done2;
914	}
915
916	/*
917	 * Copy in the message body
918	 */
919
920	next = msghdr->msg_spot;
921	while (msgsz > 0) {
922		size_t tlen;
923		if (msgsz > msginfo.msgssz)
924			tlen = msginfo.msgssz;
925		else
926			tlen = msgsz;
927		if (next <= -1)
928			panic("next too low #2");
929		if (next >= msginfo.msgseg)
930			panic("next out of range #2");
931		mtx_unlock(&msq_mtx);
932		if ((error = copyin(user_msgp, &msgpool[next * msginfo.msgssz],
933		    tlen)) != 0) {
934			mtx_lock(&msq_mtx);
935			DPRINTF(("error %d copying in message segment\n",
936			    error));
937			msg_freehdr(msghdr);
938			msqkptr->u.msg_perm.mode &= ~MSG_LOCKED;
939			wakeup(msqkptr);
940			goto done2;
941		}
942		mtx_lock(&msq_mtx);
943		msgsz -= tlen;
944		user_msgp = (const char *)user_msgp + tlen;
945		next = msgmaps[next].next;
946	}
947	if (next != -1)
948		panic("didn't use all the msg segments");
949
950	/*
951	 * We've got the message.  Unlock the msqid_ds.
952	 */
953
954	msqkptr->u.msg_perm.mode &= ~MSG_LOCKED;
955
956	/*
957	 * Make sure that the msqid_ds is still allocated.
958	 */
959
960	if (msqkptr->u.msg_qbytes == 0) {
961		msg_freehdr(msghdr);
962		wakeup(msqkptr);
963		error = EIDRM;
964		goto done2;
965	}
966
967#ifdef MAC
968	/*
969	 * Note: Since the task/thread allocates the msghdr and usually
970	 * primes it with its own MAC label, for a majority of policies, it
971	 * won't be necessary to check whether the msghdr has access
972	 * permissions to the msgq.  The mac_check_sysv_msqsnd check would
973	 * suffice in that case.  However, this hook may be required where
974	 * individual policies derive a non-identical label for the msghdr
975	 * from the current thread label and may want to check the msghdr
976	 * enqueue permissions, along with read/write permissions to the
977	 * msgq.
978	 */
979	error = mac_check_sysv_msgmsq(td->td_ucred, msghdr, msqkptr);
980	if (error != 0) {
981		MPRINTF(("mac_check_sysv_msqmsq returned %d\n", error));
982		msg_freehdr(msghdr);
983		wakeup(msqkptr);
984		goto done2;
985	}
986#endif
987
988	/*
989	 * Put the message into the queue
990	 */
991	if (msqkptr->u.msg_first == NULL) {
992		msqkptr->u.msg_first = msghdr;
993		msqkptr->u.msg_last = msghdr;
994	} else {
995		msqkptr->u.msg_last->msg_next = msghdr;
996		msqkptr->u.msg_last = msghdr;
997	}
998	msqkptr->u.msg_last->msg_next = NULL;
999
1000	msqkptr->u.msg_cbytes += msghdr->msg_ts;
1001	msqkptr->u.msg_qnum++;
1002	msqkptr->u.msg_lspid = td->td_proc->p_pid;
1003	msqkptr->u.msg_stime = time_second;
1004
1005	wakeup(msqkptr);
1006	td->td_retval[0] = 0;
1007done2:
1008	mtx_unlock(&msq_mtx);
1009	return (error);
1010}
1011
#ifndef _SYS_SYSPROTO_H_
/*
 * Argument block handed to msgrcv().  Declared here only when
 * _SYS_SYSPROTO_H_ is not defined (presumably <sys/sysproto.h> supplies
 * the same structure otherwise -- confirm against that header).
 */
struct msgrcv_args {
	int	msqid;		/* message queue identifier */
	void	*msgp;		/* user buffer: message type, then body */
	size_t	msgsz;		/* bytes available for the message body */
	long	msgtyp;		/* type selector: 0, positive or negative */
	int	msgflg;		/* flag bits (IPC_NOWAIT, MSG_NOERROR) */
};
#endif /* !_SYS_SYSPROTO_H_ */
1021
1022/*
1023 * MPSAFE
1024 */
1025int
1026msgrcv(td, uap)
1027	struct thread *td;
1028	register struct msgrcv_args *uap;
1029{
1030	int msqid = uap->msqid;
1031	void *user_msgp = uap->msgp;
1032	size_t msgsz = uap->msgsz;
1033	long msgtyp = uap->msgtyp;
1034	int msgflg = uap->msgflg;
1035	size_t len;
1036	register struct msqid_kernel *msqkptr;
1037	register struct msg *msghdr;
1038	int error = 0;
1039	short next;
1040
1041	DPRINTF(("call to msgrcv(%d, 0x%x, %d, %ld, %d)\n", msqid, user_msgp,
1042	    msgsz, msgtyp, msgflg));
1043
1044	if (!jail_sysvipc_allowed && jailed(td->td_ucred))
1045		return (ENOSYS);
1046
1047	msqid = IPCID_TO_IX(msqid);
1048
1049	if (msqid < 0 || msqid >= msginfo.msgmni) {
1050		DPRINTF(("msqid (%d) out of range (0<=msqid<%d)\n", msqid,
1051		    msginfo.msgmni));
1052		return (EINVAL);
1053	}
1054
1055	msqkptr = &msqids[msqid];
1056	mtx_lock(&msq_mtx);
1057	if (msqkptr->u.msg_qbytes == 0) {
1058		DPRINTF(("no such message queue id\n"));
1059		error = EINVAL;
1060		goto done2;
1061	}
1062	if (msqkptr->u.msg_perm.seq != IPCID_TO_SEQ(uap->msqid)) {
1063		DPRINTF(("wrong sequence number\n"));
1064		error = EINVAL;
1065		goto done2;
1066	}
1067
1068	if ((error = ipcperm(td, &msqkptr->u.msg_perm, IPC_R))) {
1069		DPRINTF(("requester doesn't have read access\n"));
1070		goto done2;
1071	}
1072
1073#ifdef MAC
1074	error = mac_check_sysv_msqrcv(td->td_ucred, msqkptr);
1075	if (error != 0) {
1076		MPRINTF(("mac_check_sysv_msqrcv returned %d\n", error));
1077		goto done2;
1078	}
1079#endif
1080
1081	msghdr = NULL;
1082	while (msghdr == NULL) {
1083		if (msgtyp == 0) {
1084			msghdr = msqkptr->u.msg_first;
1085			if (msghdr != NULL) {
1086				if (msgsz < msghdr->msg_ts &&
1087				    (msgflg & MSG_NOERROR) == 0) {
1088					DPRINTF(("first message on the queue "
1089					    "is too big (want %d, got %d)\n",
1090					    msgsz, msghdr->msg_ts));
1091					error = E2BIG;
1092					goto done2;
1093				}
1094#ifdef MAC
1095				error = mac_check_sysv_msgrcv(td->td_ucred,
1096				    msghdr);
1097				if (error != 0) {
1098					MPRINTF(("mac_check_sysv_msgrcv "
1099					    "returned %d\n", error));
1100					goto done2;
1101				}
1102#endif
1103				if (msqkptr->u.msg_first == msqkptr->u.msg_last) {
1104					msqkptr->u.msg_first = NULL;
1105					msqkptr->u.msg_last = NULL;
1106				} else {
1107					msqkptr->u.msg_first = msghdr->msg_next;
1108					if (msqkptr->u.msg_first == NULL)
1109						panic("msg_first/last screwed up #1");
1110				}
1111			}
1112		} else {
1113			struct msg *previous;
1114			struct msg **prev;
1115
1116			previous = NULL;
1117			prev = &(msqkptr->u.msg_first);
1118			while ((msghdr = *prev) != NULL) {
1119				/*
1120				 * Is this message's type an exact match or is
1121				 * this message's type less than or equal to
1122				 * the absolute value of a negative msgtyp?
1123				 * Note that the second half of this test can
1124				 * NEVER be true if msgtyp is positive since
1125				 * msg_type is always positive!
1126				 */
1127
1128				if (msgtyp == msghdr->msg_type ||
1129				    msghdr->msg_type <= -msgtyp) {
1130					DPRINTF(("found message type %d, "
1131					    "requested %d\n",
1132					    msghdr->msg_type, msgtyp));
1133					if (msgsz < msghdr->msg_ts &&
1134					    (msgflg & MSG_NOERROR) == 0) {
1135						DPRINTF(("requested message "
1136						    "on the queue is too big "
1137						    "(want %d, got %d)\n",
1138						    msgsz, msghdr->msg_ts));
1139						error = E2BIG;
1140						goto done2;
1141					}
1142#ifdef MAC
1143					error = mac_check_sysv_msgrcv(
1144					    td->td_ucred, msghdr);
1145					if (error != 0) {
1146						MPRINTF(("mac_check_sysv_"
1147						    "msgrcv returned %d\n",
1148						    error));
1149						goto done2;
1150					}
1151#endif
1152					*prev = msghdr->msg_next;
1153					if (msghdr == msqkptr->u.msg_last) {
1154						if (previous == NULL) {
1155							if (prev !=
1156							    &msqkptr->u.msg_first)
1157								panic("msg_first/last screwed up #2");
1158							msqkptr->u.msg_first =
1159							    NULL;
1160							msqkptr->u.msg_last =
1161							    NULL;
1162						} else {
1163							if (prev ==
1164							    &msqkptr->u.msg_first)
1165								panic("msg_first/last screwed up #3");
1166							msqkptr->u.msg_last =
1167							    previous;
1168						}
1169					}
1170					break;
1171				}
1172				previous = msghdr;
1173				prev = &(msghdr->msg_next);
1174			}
1175		}
1176
1177		/*
1178		 * We've either extracted the msghdr for the appropriate
1179		 * message or there isn't one.
1180		 * If there is one then bail out of this loop.
1181		 */
1182
1183		if (msghdr != NULL)
1184			break;
1185
1186		/*
1187		 * Hmph!  No message found.  Does the user want to wait?
1188		 */
1189
1190		if ((msgflg & IPC_NOWAIT) != 0) {
1191			DPRINTF(("no appropriate message found (msgtyp=%d)\n",
1192			    msgtyp));
1193			/* The SVID says to return ENOMSG. */
1194			error = ENOMSG;
1195			goto done2;
1196		}
1197
1198		/*
1199		 * Wait for something to happen
1200		 */
1201
1202		DPRINTF(("msgrcv:  goodnight\n"));
1203		error = msleep(msqkptr, &msq_mtx, (PZERO - 4) | PCATCH,
1204		    "msgwait", 0);
1205		DPRINTF(("msgrcv:  good morning (error=%d)\n", error));
1206
1207		if (error != 0) {
1208			DPRINTF(("msgsnd:  interrupted system call\n"));
1209			error = EINTR;
1210			goto done2;
1211		}
1212
1213		/*
1214		 * Make sure that the msq queue still exists
1215		 */
1216
1217		if (msqkptr->u.msg_qbytes == 0 ||
1218		    msqkptr->u.msg_perm.seq != IPCID_TO_SEQ(uap->msqid)) {
1219			DPRINTF(("msqid deleted\n"));
1220			error = EIDRM;
1221			goto done2;
1222		}
1223	}
1224
1225	/*
1226	 * Return the message to the user.
1227	 *
1228	 * First, do the bookkeeping (before we risk being interrupted).
1229	 */
1230
1231	msqkptr->u.msg_cbytes -= msghdr->msg_ts;
1232	msqkptr->u.msg_qnum--;
1233	msqkptr->u.msg_lrpid = td->td_proc->p_pid;
1234	msqkptr->u.msg_rtime = time_second;
1235
1236	/*
1237	 * Make msgsz the actual amount that we'll be returning.
1238	 * Note that this effectively truncates the message if it is too long
1239	 * (since msgsz is never increased).
1240	 */
1241
1242	DPRINTF(("found a message, msgsz=%d, msg_ts=%d\n", msgsz,
1243	    msghdr->msg_ts));
1244	if (msgsz > msghdr->msg_ts)
1245		msgsz = msghdr->msg_ts;
1246
1247	/*
1248	 * Return the type to the user.
1249	 */
1250
1251	mtx_unlock(&msq_mtx);
1252	error = copyout(&(msghdr->msg_type), user_msgp,
1253	    sizeof(msghdr->msg_type));
1254	mtx_lock(&msq_mtx);
1255	if (error != 0) {
1256		DPRINTF(("error (%d) copying out message type\n", error));
1257		msg_freehdr(msghdr);
1258		wakeup(msqkptr);
1259		goto done2;
1260	}
1261	user_msgp = (char *)user_msgp + sizeof(msghdr->msg_type);
1262
1263	/*
1264	 * Return the segments to the user
1265	 */
1266
1267	next = msghdr->msg_spot;
1268	for (len = 0; len < msgsz; len += msginfo.msgssz) {
1269		size_t tlen;
1270
1271		if (msgsz - len > msginfo.msgssz)
1272			tlen = msginfo.msgssz;
1273		else
1274			tlen = msgsz - len;
1275		if (next <= -1)
1276			panic("next too low #3");
1277		if (next >= msginfo.msgseg)
1278			panic("next out of range #3");
1279		mtx_unlock(&msq_mtx);
1280		error = copyout(&msgpool[next * msginfo.msgssz],
1281		    user_msgp, tlen);
1282		mtx_lock(&msq_mtx);
1283		if (error != 0) {
1284			DPRINTF(("error (%d) copying out message segment\n",
1285			    error));
1286			msg_freehdr(msghdr);
1287			wakeup(msqkptr);
1288			goto done2;
1289		}
1290		user_msgp = (char *)user_msgp + tlen;
1291		next = msgmaps[next].next;
1292	}
1293
1294	/*
1295	 * Done, return the actual number of bytes copied out.
1296	 */
1297
1298	msg_freehdr(msghdr);
1299	wakeup(msqkptr);
1300	td->td_retval[0] = msgsz;
1301done2:
1302	mtx_unlock(&msq_mtx);
1303	return (error);
1304}
1305
1306static int
1307sysctl_msqids(SYSCTL_HANDLER_ARGS)
1308{
1309
1310	return (SYSCTL_OUT(req, msqids,
1311	    sizeof(struct msqid_kernel) * msginfo.msgmni));
1312}
1313
1314SYSCTL_DECL(_kern_ipc);
1315SYSCTL_INT(_kern_ipc, OID_AUTO, msgmax, CTLFLAG_RD, &msginfo.msgmax, 0, "");
1316SYSCTL_INT(_kern_ipc, OID_AUTO, msgmni, CTLFLAG_RDTUN, &msginfo.msgmni, 0, "");
1317SYSCTL_INT(_kern_ipc, OID_AUTO, msgmnb, CTLFLAG_RDTUN, &msginfo.msgmnb, 0, "");
1318SYSCTL_INT(_kern_ipc, OID_AUTO, msgtql, CTLFLAG_RDTUN, &msginfo.msgtql, 0, "");
1319SYSCTL_INT(_kern_ipc, OID_AUTO, msgssz, CTLFLAG_RDTUN, &msginfo.msgssz, 0, "");
1320SYSCTL_INT(_kern_ipc, OID_AUTO, msgseg, CTLFLAG_RDTUN, &msginfo.msgseg, 0, "");
1321SYSCTL_PROC(_kern_ipc, OID_AUTO, msqids, CTLFLAG_RD,
1322    NULL, 0, sysctl_msqids, "", "Message queue IDs");
1323