/*
 * xref: /f-stack/freebsd/sys/socketvar.h (revision 22ce4aff)
 */
/*-
 * SPDX-License-Identifier: BSD-3-Clause
 *
 * Copyright (c) 1982, 1986, 1990, 1993
 *	The Regents of the University of California.  All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. Neither the name of the University nor the names of its contributors
 *    may be used to endorse or promote products derived from this software
 *    without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 *
 *	@(#)socketvar.h	8.3 (Berkeley) 2/19/95
 *
 * $FreeBSD$
 */

36a9643ea8Slogwang #ifndef _SYS_SOCKETVAR_H_
37a9643ea8Slogwang #define _SYS_SOCKETVAR_H_
38a9643ea8Slogwang 
/*
 * Socket generation count type.  Also used in xinpcb, xtcpcb, xunpcb.
 *
 * Declared outside the _KERNEL/_WANT_SOCKET section so that it is visible to
 * every includer of this header.
 */
typedef uint64_t so_gen_t;

44*22ce4affSfengbojiang #if defined(_KERNEL) || defined(_WANT_SOCKET)
45a9643ea8Slogwang #include <sys/queue.h>			/* for TAILQ macros */
46a9643ea8Slogwang #include <sys/selinfo.h>		/* for struct selinfo */
47a9643ea8Slogwang #include <sys/_lock.h>
48a9643ea8Slogwang #include <sys/_mutex.h>
49a9643ea8Slogwang #include <sys/osd.h>
50a9643ea8Slogwang #include <sys/_sx.h>
51a9643ea8Slogwang #include <sys/sockbuf.h>
52a9643ea8Slogwang #ifdef _KERNEL
53a9643ea8Slogwang #include <sys/caprights.h>
54a9643ea8Slogwang #include <sys/sockopt.h>
55a9643ea8Slogwang #endif
56a9643ea8Slogwang 
57a9643ea8Slogwang struct vnet;
58a9643ea8Slogwang 
/*
 * Kernel structure per socket.
 * Contains send and receive buffer queues,
 * handle on protocol and pointer to protocol
 * private data and error information.
 */
/*
 * Forward declaration.  It must precede the typedefs below: a struct tag
 * first introduced inside a prototype's parameter list has prototype scope
 * only, which would make the typedefs refer to a type distinct from the
 * struct socket defined later in this header.
 */
struct socket;

/*
 * so_upcall_t: function type of a socket upcall.  It receives the socket, an
 * opaque argument and an int, and returns an int (see the SU_* return values
 * declared further down in this header).
 * so_dtor_t: function type of the optional per-socket destructor stored in
 * so_dtor and installed with sodtor_set().
 */
typedef	int so_upcall_t(struct socket *, void *, int);
typedef	void so_dtor_t(struct socket *);

/*
 * Accept-queue membership of a socket, stored in so_qstate.
 * The values are single, non-overlapping bits.
 */
enum socket_qstate {
	SQ_NONE = 0,		/* on neither accept queue */
	SQ_INCOMP = 0x0800,	/* on sol_incomp */
	SQ_COMP = 0x1000,	/* on sol_comp */
};

76a9643ea8Slogwang /*-
77a9643ea8Slogwang  * Locking key to struct socket:
78a9643ea8Slogwang  * (a) constant after allocation, no locking required.
79a9643ea8Slogwang  * (b) locked by SOCK_LOCK(so).
80*22ce4affSfengbojiang  * (cr) locked by SOCKBUF_LOCK(&so->so_rcv).
81*22ce4affSfengbojiang  * (cs) locked by SOCKBUF_LOCK(&so->so_snd).
82*22ce4affSfengbojiang  * (e) locked by SOLISTEN_LOCK() of corresponding listening socket.
83a9643ea8Slogwang  * (f) not locked since integer reads/writes are atomic.
84a9643ea8Slogwang  * (g) used only as a sleep/wakeup address, no value.
85a9643ea8Slogwang  * (h) locked by global mutex so_global_mtx.
86*22ce4affSfengbojiang  * (k) locked by KTLS workqueue mutex
87a9643ea8Slogwang  */
88*22ce4affSfengbojiang TAILQ_HEAD(accept_queue, socket);
89a9643ea8Slogwang struct socket {
90*22ce4affSfengbojiang 	struct mtx	so_lock;
91*22ce4affSfengbojiang 	volatile u_int	so_count;	/* (b / refcount) */
92*22ce4affSfengbojiang 	struct selinfo	so_rdsel;	/* (b/cr) for so_rcv/so_comp */
93*22ce4affSfengbojiang 	struct selinfo	so_wrsel;	/* (b/cs) for so_snd */
94a9643ea8Slogwang 	short	so_type;		/* (a) generic type, see socket.h */
95*22ce4affSfengbojiang 	int	so_options;		/* (b) from socket call, see socket.h */
96*22ce4affSfengbojiang 	short	so_linger;		/* time to linger close(2) */
97a9643ea8Slogwang 	short	so_state;		/* (b) internal state flags SS_* */
98a9643ea8Slogwang 	void	*so_pcb;		/* protocol control block */
99a9643ea8Slogwang 	struct	vnet *so_vnet;		/* (a) network stack instance */
100a9643ea8Slogwang 	struct	protosw *so_proto;	/* (a) protocol handle */
101a9643ea8Slogwang 	short	so_timeo;		/* (g) connection timeout */
102a9643ea8Slogwang 	u_short	so_error;		/* (f) error affecting connection */
103a9643ea8Slogwang 	struct	sigio *so_sigio;	/* [sg] information for async I/O or
104a9643ea8Slogwang 					   out of band data (SIGURG) */
105a9643ea8Slogwang 	struct	ucred *so_cred;		/* (a) user credentials */
106a9643ea8Slogwang 	struct	label *so_label;	/* (b) MAC label for socket */
107a9643ea8Slogwang 	/* NB: generation count must not be first. */
108a9643ea8Slogwang 	so_gen_t so_gencnt;		/* (h) generation count */
109a9643ea8Slogwang 	void	*so_emuldata;		/* (b) private data for emulators */
110*22ce4affSfengbojiang 	so_dtor_t *so_dtor;		/* (b) optional destructor */
111a9643ea8Slogwang 	struct	osd	osd;		/* Object Specific extensions */
112a9643ea8Slogwang 	/*
113a9643ea8Slogwang 	 * so_fibnum, so_user_cookie and friends can be used to attach
114a9643ea8Slogwang 	 * some user-specified metadata to a socket, which then can be
115a9643ea8Slogwang 	 * used by the kernel for various actions.
116a9643ea8Slogwang 	 * so_user_cookie is used by ipfw/dummynet.
117a9643ea8Slogwang 	 */
118a9643ea8Slogwang 	int so_fibnum;		/* routing domain for this socket */
119a9643ea8Slogwang 	uint32_t so_user_cookie;
120a9643ea8Slogwang 
121*22ce4affSfengbojiang 	int so_ts_clock;	/* type of the clock used for timestamps */
122*22ce4affSfengbojiang 	uint32_t so_max_pacing_rate;	/* (f) TX rate limit in bytes/s */
123*22ce4affSfengbojiang 	union {
124*22ce4affSfengbojiang 		/* Regular (data flow) socket. */
125*22ce4affSfengbojiang 		struct {
126*22ce4affSfengbojiang 			/* (cr, cs) Receive and send buffers. */
127*22ce4affSfengbojiang 			struct sockbuf		so_rcv, so_snd;
128*22ce4affSfengbojiang 
129*22ce4affSfengbojiang 			/* (e) Our place on accept queue. */
130*22ce4affSfengbojiang 			TAILQ_ENTRY(socket)	so_list;
131*22ce4affSfengbojiang 			struct socket		*so_listen;	/* (b) */
132*22ce4affSfengbojiang 			enum socket_qstate so_qstate;		/* (b) */
133*22ce4affSfengbojiang 			/* (b) cached MAC label for peer */
134*22ce4affSfengbojiang 			struct	label		*so_peerlabel;
135*22ce4affSfengbojiang 			u_long	so_oobmark;	/* chars to oob mark */
136*22ce4affSfengbojiang 
137*22ce4affSfengbojiang 			/* (k) Our place on KTLS RX work queue. */
138*22ce4affSfengbojiang 			STAILQ_ENTRY(socket)	so_ktls_rx_list;
139*22ce4affSfengbojiang 		};
140*22ce4affSfengbojiang 		/*
141*22ce4affSfengbojiang 		 * Listening socket, where accepts occur, is so_listen in all
142*22ce4affSfengbojiang 		 * subsidiary sockets.  If so_listen is NULL, socket is not
143*22ce4affSfengbojiang 		 * related to an accept.  For a listening socket itself
144*22ce4affSfengbojiang 		 * sol_incomp queues partially completed connections, while
145*22ce4affSfengbojiang 		 * sol_comp is a queue of connections ready to be accepted.
146*22ce4affSfengbojiang 		 * If a connection is aborted and it has so_listen set, then
147*22ce4affSfengbojiang 		 * it has to be pulled out of either sol_incomp or sol_comp.
148*22ce4affSfengbojiang 		 * We allow connections to queue up based on current queue
149*22ce4affSfengbojiang 		 * lengths and limit on number of queued connections for this
150*22ce4affSfengbojiang 		 * socket.
151*22ce4affSfengbojiang 		 */
152*22ce4affSfengbojiang 		struct {
153*22ce4affSfengbojiang 			/* (e) queue of partial unaccepted connections */
154*22ce4affSfengbojiang 			struct accept_queue	sol_incomp;
155*22ce4affSfengbojiang 			/* (e) queue of complete unaccepted connections */
156*22ce4affSfengbojiang 			struct accept_queue	sol_comp;
157*22ce4affSfengbojiang 			u_int	sol_qlen;    /* (e) sol_comp length */
158*22ce4affSfengbojiang 			u_int	sol_incqlen; /* (e) sol_incomp length */
159*22ce4affSfengbojiang 			u_int	sol_qlimit;  /* (e) queue limit */
160*22ce4affSfengbojiang 
161*22ce4affSfengbojiang 			/* accept_filter(9) optional data */
162*22ce4affSfengbojiang 			struct	accept_filter	*sol_accept_filter;
163*22ce4affSfengbojiang 			void	*sol_accept_filter_arg;	/* saved filter args */
164*22ce4affSfengbojiang 			char	*sol_accept_filter_str;	/* saved user args */
165*22ce4affSfengbojiang 
166*22ce4affSfengbojiang 			/* Optional upcall, for kernel socket. */
167*22ce4affSfengbojiang 			so_upcall_t	*sol_upcall;	/* (e) */
168*22ce4affSfengbojiang 			void		*sol_upcallarg;	/* (e) */
169*22ce4affSfengbojiang 
170*22ce4affSfengbojiang 			/* Socket buffer parameters, to be copied to
171*22ce4affSfengbojiang 			 * dataflow sockets, accepted from this one. */
172*22ce4affSfengbojiang 			int		sol_sbrcv_lowat;
173*22ce4affSfengbojiang 			int		sol_sbsnd_lowat;
174*22ce4affSfengbojiang 			u_int		sol_sbrcv_hiwat;
175*22ce4affSfengbojiang 			u_int		sol_sbsnd_hiwat;
176*22ce4affSfengbojiang 			short		sol_sbrcv_flags;
177*22ce4affSfengbojiang 			short		sol_sbsnd_flags;
178*22ce4affSfengbojiang 			sbintime_t	sol_sbrcv_timeo;
179*22ce4affSfengbojiang 			sbintime_t	sol_sbsnd_timeo;
180*22ce4affSfengbojiang 
181*22ce4affSfengbojiang 			/* Information tracking listen queue overflows. */
182*22ce4affSfengbojiang 			struct timeval	sol_lastover;	/* (e) */
183*22ce4affSfengbojiang 			int		sol_overcount;	/* (e) */
184*22ce4affSfengbojiang 		};
185*22ce4affSfengbojiang 	};
18608dba010SAndy #ifdef LVS_TCPOPT_TOA
18708dba010SAndy 	uint8_t so_toa[8];  /* lvs toa option */
18808dba010SAndy #endif
189a9643ea8Slogwang };
190*22ce4affSfengbojiang #endif	/* defined(_KERNEL) || defined(_WANT_SOCKET) */
191a9643ea8Slogwang 
/*
 * Socket state bits.
 *
 * Historically, these bits were all kept in the so_state field.
 * They are now split into separate, lock-specific fields.
 * so_state maintains basic socket state protected by the socket lock.
 * so_qstate holds information about the socket accept queues.
 * Each socket buffer also has a state field holding information
 * relevant to that socket buffer (can't send, rcv).
 * Many fields will be read without locks to improve performance and avoid
 * lock order issues.  However, this approach must be used with caution.
 */
#define	SS_NOFDREF		0x0001	/* no file table ref any more */
#define	SS_ISCONNECTED		0x0002	/* socket connected to a peer */
#define	SS_ISCONNECTING		0x0004	/* in process of connecting to peer */
#define	SS_ISDISCONNECTING	0x0008	/* in process of disconnecting */
#define	SS_NBIO			0x0100	/* non-blocking ops */
#define	SS_ASYNC		0x0200	/* async i/o notify */
#define	SS_ISCONFIRMING		0x0400	/* deciding to accept connection req */
#define	SS_ISDISCONNECTED	0x2000	/* socket disconnected from peer */

/*
 * Protocols can mark a socket as SS_PROTOREF to indicate that, following
 * pru_detach, they still want the socket to persist, and will free it
 * themselves when they are done.  Protocols should only ever call sofree()
 * following setting this flag in pru_detach(), and never otherwise, as
 * sofree() bypasses socket reference counting.
 */
#define	SS_PROTOREF		0x4000	/* strong protocol reference */

222a9643ea8Slogwang #ifdef _KERNEL
223a9643ea8Slogwang 
/*
 * Per-socket mutex helpers.  All of them operate on so->so_lock.
 *
 * SOCK_MTX() yields a pointer to the mutex.  The expansion is fully
 * parenthesized so that it behaves as a single primary expression: without
 * the outer parentheses a postfix operator applied to the macro result
 * (e.g. SOCK_MTX(so)->field) would bind to so_lock itself rather than to
 * the address taken.
 */
#define	SOCK_MTX(so)		(&(so)->so_lock)
#define	SOCK_LOCK(so)		mtx_lock(&(so)->so_lock)
#define	SOCK_OWNED(so)		mtx_owned(&(so)->so_lock)
#define	SOCK_UNLOCK(so)		mtx_unlock(&(so)->so_lock)
#define	SOCK_LOCK_ASSERT(so)	mtx_assert(&(so)->so_lock, MA_OWNED)
#define	SOCK_UNLOCK_ASSERT(so)	mtx_assert(&(so)->so_lock, MA_NOTOWNED)

/*
 * Listening-socket helpers.
 *
 * SOLISTENING() is true when SO_ACCEPTCONN is set in so_options.
 * The SOLISTEN_* lock macros use the same so_lock mutex as SOCK_LOCK();
 * SOLISTEN_LOCK(), SOLISTEN_UNLOCK() and SOLISTEN_LOCK_ASSERT() additionally
 * KASSERT, while the mutex is held, that the socket is a listening one.
 * SOLISTEN_TRYLOCK() evaluates to the mtx_trylock() result and performs no
 * such assertion.
 */
#define	SOLISTENING(sol)	(((sol)->so_options & SO_ACCEPTCONN) != 0)
#define	SOLISTEN_LOCK(sol)	do {					\
	mtx_lock(&(sol)->so_lock);					\
	KASSERT(SOLISTENING(sol),					\
	    ("%s: %p not listening", __func__, (sol)));			\
} while (0)
#define	SOLISTEN_TRYLOCK(sol)	mtx_trylock(&(sol)->so_lock)
#define	SOLISTEN_UNLOCK(sol)	do {					\
	KASSERT(SOLISTENING(sol),					\
	    ("%s: %p not listening", __func__, (sol)));			\
	mtx_unlock(&(sol)->so_lock);					\
} while (0)
#define	SOLISTEN_LOCK_ASSERT(sol)	do {				\
	mtx_assert(&(sol)->so_lock, MA_OWNED);				\
	KASSERT(SOLISTENING(sol),					\
	    ("%s: %p not listening", __func__, (sol)));			\
} while (0)

/*
 * Macros for sockets and socket buffering.
 */

/*
 * Flags to sblock().
 * SBL_VALID is the mask of all flags defined here.
 */
#define	SBL_WAIT	0x00000001	/* Wait if not immediately available. */
#define	SBL_NOINTR	0x00000002	/* Force non-interruptible sleep. */
#define	SBL_VALID	(SBL_WAIT | SBL_NOINTR)

/*
 * Do we need to notify the other side when I/O is possible?
 *
 * Evaluates to 1 when any of SB_WAIT, SB_SEL, SB_ASYNC, SB_UPCALL, SB_AIO or
 * SB_KNOTE is set in sb->sb_flags, and to 0 otherwise.
 */
#define	sb_notify(sb)	(((sb)->sb_flags & (SB_WAIT | SB_SEL | SB_ASYNC | \
    SB_UPCALL | SB_AIO | SB_KNOTE)) != 0)

/*
 * do we have to send all at once on a socket?
 *
 * Non-zero when the protocol of 'so' has PR_ATOMIC set.  The value is the
 * masked flag itself, not a normalized 0/1.
 */
#define	sosendallatonce(so) \
    ((so)->so_proto->pr_flags & PR_ATOMIC)

/*
 * can we read something from so?
 *
 * soreadabledata(): the receive buffer holds at least sb_lowat available
 * bytes (per sbavail()), or an error is pending in so_error.
 * soreadable(): as above, or the receive side is marked SBS_CANTRCVMORE.
 */
#define	soreadabledata(so) \
	(sbavail(&(so)->so_rcv) >= (so)->so_rcv.sb_lowat ||  (so)->so_error)
#define	soreadable(so) \
	(soreadabledata(so) || ((so)->so_rcv.sb_state & SBS_CANTRCVMORE))

/*
 * can we write something to so?
 *
 * True when any of the following holds:
 *  - the send buffer has at least sb_lowat bytes of space (per sbspace())
 *    and the socket is either connected or its protocol does not require
 *    a connection (PR_CONNREQUIRED clear);
 *  - the send side is marked SBS_CANTSENDMORE;
 *  - an error is pending in so_error.
 */
#define	sowriteable(so) \
    ((sbspace(&(so)->so_snd) >= (so)->so_snd.sb_lowat && \
	(((so)->so_state&SS_ISCONNECTED) || \
	  ((so)->so_proto->pr_flags&PR_CONNREQUIRED)==0)) || \
     ((so)->so_snd.sb_state & SBS_CANTSENDMORE) || \
     (so)->so_error)

/*
 * soref()/sorele() ref-count the socket structure.
 * soref() may be called without owning socket lock, but in that case a
 * caller must own something that holds socket, and so_count must be not 0.
 * Note that you must still explicitly close the socket, but the last ref
 * count will free the structure.
 *
 * sorele() must be entered with the socket lock held (asserted).  It drops
 * one reference; if refcount_release() reports that this was the last one
 * it calls sofree(so), otherwise it unlocks the socket.  No unlock is issued
 * here on the sofree() path, so sofree() presumably takes over the lock --
 * confirm against its definition.
 */
#define	soref(so)	refcount_acquire(&(so)->so_count)
#define	sorele(so) do {							\
	SOCK_LOCK_ASSERT(so);						\
	if (refcount_release(&(so)->so_count))				\
		sofree(so);						\
	else								\
		SOCK_UNLOCK(so);					\
} while (0)

/*
 * In sorwakeup() and sowwakeup(), acquire the socket buffer lock to
 * avoid a non-atomic test-and-wakeup.  However, sowakeup is
 * responsible for releasing the lock if it is called.  We unlock only
 * if we don't call into sowakeup.  If any code is introduced that
 * directly invokes the underlying sowakeup() primitives, it must
 * maintain the same semantics.
 *
 * The *_locked variants expect the respective socket buffer lock to be held
 * on entry (asserted); in every case the lock has been released by the time
 * the macro completes, either here or by sowakeup().
 */
#define	sorwakeup_locked(so) do {					\
	SOCKBUF_LOCK_ASSERT(&(so)->so_rcv);				\
	if (sb_notify(&(so)->so_rcv))					\
		sowakeup((so), &(so)->so_rcv);	 			\
	else								\
		SOCKBUF_UNLOCK(&(so)->so_rcv);				\
} while (0)

#define	sorwakeup(so) do {						\
	SOCKBUF_LOCK(&(so)->so_rcv);					\
	sorwakeup_locked(so);						\
} while (0)

#define	sowwakeup_locked(so) do {					\
	SOCKBUF_LOCK_ASSERT(&(so)->so_snd);				\
	if (sb_notify(&(so)->so_snd))					\
		sowakeup((so), &(so)->so_snd); 				\
	else								\
		SOCKBUF_UNLOCK(&(so)->so_snd);				\
} while (0)

#define	sowwakeup(so) do {						\
	SOCKBUF_LOCK(&(so)->so_snd);					\
	sowwakeup_locked(so);						\
} while (0)

334a9643ea8Slogwang struct accept_filter {
335a9643ea8Slogwang 	char	accf_name[16];
336a9643ea8Slogwang 	int	(*accf_callback)
337a9643ea8Slogwang 		(struct socket *so, void *arg, int waitflag);
338a9643ea8Slogwang 	void *	(*accf_create)
339a9643ea8Slogwang 		(struct socket *so, char *arg);
340a9643ea8Slogwang 	void	(*accf_destroy)
341a9643ea8Slogwang 		(struct socket *so);
342a9643ea8Slogwang 	SLIST_ENTRY(accept_filter) accf_next;
343a9643ea8Slogwang };
344a9643ea8Slogwang 
/*
 * Boilerplate for an accept filter kernel module.
 *
 * Defines a static struct accept_filter named <modname>_filter initialized
 * from filtname/cb/create/destroy, a static moduledata_t named <modname>_mod
 * whose name is the stringified modname, whose event handler is
 * accept_filt_generic_mod_event and whose private data points at the filter,
 * and then declares the module and its version 'ver'.
 *
 * The expansion ends without a semicolon, so invoke it as
 * ACCEPT_FILTER_DEFINE(...);
 */
#define	ACCEPT_FILTER_DEFINE(modname, filtname, cb, create, destroy, ver) \
	static struct accept_filter modname##_filter = {		\
		.accf_name = filtname,					\
		.accf_callback = cb,					\
		.accf_create = create,					\
		.accf_destroy = destroy,				\
	};								\
	static moduledata_t modname##_mod = {				\
		.name = __XSTRING(modname),				\
		.evhand = accept_filt_generic_mod_event,		\
		.priv = &modname##_filter,				\
	};								\
	DECLARE_MODULE(modname, modname##_mod, SI_SUB_DRIVERS,		\
	    SI_ORDER_MIDDLE);						\
	MODULE_VERSION(modname, ver)

/*
 * malloc type declarations.  Emitted only when the includer has already
 * made the MALLOC_DECLARE macro available.
 */
#ifdef MALLOC_DECLARE
MALLOC_DECLARE(M_ACCF);
MALLOC_DECLARE(M_PCB);
MALLOC_DECLARE(M_SONAME);
#endif

/*
 * Socket specific helper hook point identifiers
 * Do not leave holes in the sequence, hook registration is a loop.
 * HHOOK_SOCKET_LAST must always alias the highest identifier.
 */
#define HHOOK_SOCKET_OPT		0
#define HHOOK_SOCKET_CREATE		1
#define HHOOK_SOCKET_RCV		2
#define HHOOK_SOCKET_SND		3
#define HHOOK_FILT_SOREAD		4
#define HHOOK_FILT_SOWRITE		5
#define HHOOK_SOCKET_CLOSE		6
#define HHOOK_SOCKET_LAST		HHOOK_SOCKET_CLOSE

/*
 * Data bundle associated with the socket helper hook points above: the
 * socket, an mbuf, a hook-point-specific context pointer and a status value.
 */
struct socket_hhook_data {
	struct socket	*so;
	struct mbuf	*m;
	void		*hctx;		/* hook point specific data */
	int		status;
};

387a9643ea8Slogwang extern int	maxsockets;
388a9643ea8Slogwang extern u_long	sb_max;
389a9643ea8Slogwang extern so_gen_t so_gencnt;
390a9643ea8Slogwang 
/*
 * Forward declarations for types that the prototypes below use only through
 * pointers.  struct task and struct thread are listed as well because
 * soaio_enqueue() and many of the so*() prototypes name them; declaring them
 * here keeps those prototypes from depending on an earlier include having
 * introduced the tags.
 */
struct file;
struct filecaps;
struct filedesc;
struct mbuf;
struct sockaddr;
struct task;
struct thread;
struct ucred;
struct uio;

/* 'which' values for socket upcalls. */
#define	SO_RCV		1
#define	SO_SND		2

/* Return values for socket upcalls. */
#define	SU_OK		0
#define	SU_ISCONNECTED	1

407a9643ea8Slogwang /*
408a9643ea8Slogwang  * From uipc_socket and friends
409a9643ea8Slogwang  */
410*22ce4affSfengbojiang int	getsockaddr(struct sockaddr **namp, const struct sockaddr *uaddr,
411*22ce4affSfengbojiang 	    size_t len);
412a9643ea8Slogwang int	getsock_cap(struct thread *td, int fd, cap_rights_t *rightsp,
413*22ce4affSfengbojiang 	    struct file **fpp, u_int *fflagp, struct filecaps *havecaps);
414a9643ea8Slogwang void	soabort(struct socket *so);
415a9643ea8Slogwang int	soaccept(struct socket *so, struct sockaddr **nam);
416a9643ea8Slogwang void	soaio_enqueue(struct task *task);
417a9643ea8Slogwang void	soaio_rcv(void *context, int pending);
418a9643ea8Slogwang void	soaio_snd(void *context, int pending);
419a9643ea8Slogwang int	socheckuid(struct socket *so, uid_t uid);
420a9643ea8Slogwang int	sobind(struct socket *so, struct sockaddr *nam, struct thread *td);
421a9643ea8Slogwang int	sobindat(int fd, struct socket *so, struct sockaddr *nam,
422a9643ea8Slogwang 	    struct thread *td);
423a9643ea8Slogwang int	soclose(struct socket *so);
424a9643ea8Slogwang int	soconnect(struct socket *so, struct sockaddr *nam, struct thread *td);
425a9643ea8Slogwang int	soconnectat(int fd, struct socket *so, struct sockaddr *nam,
426a9643ea8Slogwang 	    struct thread *td);
427a9643ea8Slogwang int	soconnect2(struct socket *so1, struct socket *so2);
428a9643ea8Slogwang int	socreate(int dom, struct socket **aso, int type, int proto,
429a9643ea8Slogwang 	    struct ucred *cred, struct thread *td);
430a9643ea8Slogwang int	sodisconnect(struct socket *so);
431*22ce4affSfengbojiang void	sodtor_set(struct socket *, so_dtor_t *);
432a9643ea8Slogwang struct	sockaddr *sodupsockaddr(const struct sockaddr *sa, int mflags);
433a9643ea8Slogwang void	sofree(struct socket *so);
434a9643ea8Slogwang void	sohasoutofband(struct socket *so);
435a9643ea8Slogwang int	solisten(struct socket *so, int backlog, struct thread *td);
436a9643ea8Slogwang void	solisten_proto(struct socket *so, int backlog);
437a9643ea8Slogwang int	solisten_proto_check(struct socket *so);
438*22ce4affSfengbojiang int	solisten_dequeue(struct socket *, struct socket **, int);
439a9643ea8Slogwang struct socket *
440a9643ea8Slogwang 	sonewconn(struct socket *head, int connstatus);
441*22ce4affSfengbojiang struct socket *
442*22ce4affSfengbojiang 	sopeeloff(struct socket *);
443a9643ea8Slogwang int	sopoll(struct socket *so, int events, struct ucred *active_cred,
444a9643ea8Slogwang 	    struct thread *td);
445a9643ea8Slogwang int	sopoll_generic(struct socket *so, int events,
446a9643ea8Slogwang 	    struct ucred *active_cred, struct thread *td);
447a9643ea8Slogwang int	soreceive(struct socket *so, struct sockaddr **paddr, struct uio *uio,
448a9643ea8Slogwang 	    struct mbuf **mp0, struct mbuf **controlp, int *flagsp);
449a9643ea8Slogwang int	soreceive_stream(struct socket *so, struct sockaddr **paddr,
450a9643ea8Slogwang 	    struct uio *uio, struct mbuf **mp0, struct mbuf **controlp,
451a9643ea8Slogwang 	    int *flagsp);
452a9643ea8Slogwang int	soreceive_dgram(struct socket *so, struct sockaddr **paddr,
453a9643ea8Slogwang 	    struct uio *uio, struct mbuf **mp0, struct mbuf **controlp,
454a9643ea8Slogwang 	    int *flagsp);
455a9643ea8Slogwang int	soreceive_generic(struct socket *so, struct sockaddr **paddr,
456a9643ea8Slogwang 	    struct uio *uio, struct mbuf **mp0, struct mbuf **controlp,
457a9643ea8Slogwang 	    int *flagsp);
458a9643ea8Slogwang int	soreserve(struct socket *so, u_long sndcc, u_long rcvcc);
459a9643ea8Slogwang void	sorflush(struct socket *so);
460a9643ea8Slogwang int	sosend(struct socket *so, struct sockaddr *addr, struct uio *uio,
461a9643ea8Slogwang 	    struct mbuf *top, struct mbuf *control, int flags,
462a9643ea8Slogwang 	    struct thread *td);
463a9643ea8Slogwang int	sosend_dgram(struct socket *so, struct sockaddr *addr,
464a9643ea8Slogwang 	    struct uio *uio, struct mbuf *top, struct mbuf *control,
465a9643ea8Slogwang 	    int flags, struct thread *td);
466a9643ea8Slogwang int	sosend_generic(struct socket *so, struct sockaddr *addr,
467a9643ea8Slogwang 	    struct uio *uio, struct mbuf *top, struct mbuf *control,
468a9643ea8Slogwang 	    int flags, struct thread *td);
469a9643ea8Slogwang int	soshutdown(struct socket *so, int how);
470*22ce4affSfengbojiang void	soupcall_clear(struct socket *, int);
471*22ce4affSfengbojiang void	soupcall_set(struct socket *, int, so_upcall_t, void *);
472*22ce4affSfengbojiang void	solisten_upcall_set(struct socket *, so_upcall_t, void *);
473a9643ea8Slogwang void	sowakeup(struct socket *so, struct sockbuf *sb);
474a9643ea8Slogwang void	sowakeup_aio(struct socket *so, struct sockbuf *sb);
475*22ce4affSfengbojiang void	solisten_wakeup(struct socket *);
476a9643ea8Slogwang int	selsocket(struct socket *so, int events, struct timeval *tv,
477a9643ea8Slogwang 	    struct thread *td);
478*22ce4affSfengbojiang void	soisconnected(struct socket *so);
479*22ce4affSfengbojiang void	soisconnecting(struct socket *so);
480*22ce4affSfengbojiang void	soisdisconnected(struct socket *so);
481*22ce4affSfengbojiang void	soisdisconnecting(struct socket *so);
482*22ce4affSfengbojiang void	socantrcvmore(struct socket *so);
483*22ce4affSfengbojiang void	socantrcvmore_locked(struct socket *so);
484*22ce4affSfengbojiang void	socantsendmore(struct socket *so);
485*22ce4affSfengbojiang void	socantsendmore_locked(struct socket *so);
486a9643ea8Slogwang 
487a9643ea8Slogwang /*
488a9643ea8Slogwang  * Accept filter functions (duh).
489a9643ea8Slogwang  */
490a9643ea8Slogwang int	accept_filt_add(struct accept_filter *filt);
491a9643ea8Slogwang int	accept_filt_del(char *name);
492a9643ea8Slogwang struct	accept_filter *accept_filt_get(char *name);
493a9643ea8Slogwang #ifdef ACCEPT_FILTER_MOD
494a9643ea8Slogwang #ifdef SYSCTL_DECL
495a9643ea8Slogwang SYSCTL_DECL(_net_inet_accf);
496a9643ea8Slogwang #endif
497a9643ea8Slogwang int	accept_filt_generic_mod_event(module_t mod, int event, void *data);
498a9643ea8Slogwang #endif
499a9643ea8Slogwang 
500a9643ea8Slogwang #endif /* _KERNEL */
501a9643ea8Slogwang 
502*22ce4affSfengbojiang /*
503*22ce4affSfengbojiang  * Structure to export socket from kernel to utilities, via sysctl(3).
504*22ce4affSfengbojiang  */
505*22ce4affSfengbojiang struct xsocket {
506*22ce4affSfengbojiang 	ksize_t		xso_len;	/* length of this structure */
507*22ce4affSfengbojiang 	kvaddr_t	xso_so;		/* kernel address of struct socket */
508*22ce4affSfengbojiang 	kvaddr_t	so_pcb;		/* kernel address of struct inpcb */
509*22ce4affSfengbojiang 	uint64_t	so_oobmark;
510*22ce4affSfengbojiang 	int64_t		so_spare64[8];
511*22ce4affSfengbojiang 	int32_t		xso_protocol;
512*22ce4affSfengbojiang 	int32_t		xso_family;
513*22ce4affSfengbojiang 	uint32_t	so_qlen;
514*22ce4affSfengbojiang 	uint32_t	so_incqlen;
515*22ce4affSfengbojiang 	uint32_t	so_qlimit;
516*22ce4affSfengbojiang 	pid_t		so_pgid;
517*22ce4affSfengbojiang 	uid_t		so_uid;
518*22ce4affSfengbojiang 	int32_t		so_spare32[8];
519*22ce4affSfengbojiang 	int16_t		so_type;
520*22ce4affSfengbojiang 	int16_t		so_options;
521*22ce4affSfengbojiang 	int16_t		so_linger;
522*22ce4affSfengbojiang 	int16_t		so_state;
523*22ce4affSfengbojiang 	int16_t		so_timeo;
524*22ce4affSfengbojiang 	uint16_t	so_error;
525*22ce4affSfengbojiang 	struct xsockbuf {
526*22ce4affSfengbojiang 		uint32_t	sb_cc;
527*22ce4affSfengbojiang 		uint32_t	sb_hiwat;
528*22ce4affSfengbojiang 		uint32_t	sb_mbcnt;
529*22ce4affSfengbojiang 		uint32_t	sb_mcnt;
530*22ce4affSfengbojiang 		uint32_t	sb_ccnt;
531*22ce4affSfengbojiang 		uint32_t	sb_mbmax;
532*22ce4affSfengbojiang 		int32_t		sb_lowat;
533*22ce4affSfengbojiang 		int32_t		sb_timeo;
534*22ce4affSfengbojiang 		int16_t		sb_flags;
535*22ce4affSfengbojiang 	} so_rcv, so_snd;
536*22ce4affSfengbojiang };
537*22ce4affSfengbojiang 
#ifdef _KERNEL
/*
 * Kernel-side converters into the export structures above: each takes the
 * kernel object first and the export structure to fill second.
 */
void	sotoxsocket(struct socket *so, struct xsocket *xso);
void	sbtoxsockbuf(struct sockbuf *sb, struct xsockbuf *xsb);
#endif

/*
 * Socket buffer state bits.  Exported via libprocstat(3).
 * Tested against a socket buffer's sb_state field.
 */
#define	SBS_CANTSENDMORE	0x0010	/* can't send more data to peer */
#define	SBS_CANTRCVMORE		0x0020	/* can't receive more data from peer */
#define	SBS_RCVATMARK		0x0040	/* at mark on input */

550a9643ea8Slogwang #endif /* !_SYS_SOCKETVAR_H_ */
551