1a9643ea8Slogwang /*- 2*22ce4affSfengbojiang * SPDX-License-Identifier: BSD-3-Clause 3*22ce4affSfengbojiang * 4a9643ea8Slogwang * Copyright (c) 1982, 1986, 1990, 1993 5a9643ea8Slogwang * The Regents of the University of California. All rights reserved. 6a9643ea8Slogwang * 7a9643ea8Slogwang * Redistribution and use in source and binary forms, with or without 8a9643ea8Slogwang * modification, are permitted provided that the following conditions 9a9643ea8Slogwang * are met: 10a9643ea8Slogwang * 1. Redistributions of source code must retain the above copyright 11a9643ea8Slogwang * notice, this list of conditions and the following disclaimer. 12a9643ea8Slogwang * 2. Redistributions in binary form must reproduce the above copyright 13a9643ea8Slogwang * notice, this list of conditions and the following disclaimer in the 14a9643ea8Slogwang * documentation and/or other materials provided with the distribution. 15*22ce4affSfengbojiang * 3. Neither the name of the University nor the names of its contributors 16a9643ea8Slogwang * may be used to endorse or promote products derived from this software 17a9643ea8Slogwang * without specific prior written permission. 18a9643ea8Slogwang * 19a9643ea8Slogwang * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 20a9643ea8Slogwang * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 21a9643ea8Slogwang * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 22a9643ea8Slogwang * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 23a9643ea8Slogwang * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 24a9643ea8Slogwang * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 25a9643ea8Slogwang * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 26a9643ea8Slogwang * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 27a9643ea8Slogwang * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 28a9643ea8Slogwang * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 29a9643ea8Slogwang * SUCH DAMAGE. 30a9643ea8Slogwang * 31a9643ea8Slogwang * @(#)socketvar.h 8.3 (Berkeley) 2/19/95 32a9643ea8Slogwang * 33a9643ea8Slogwang * $FreeBSD$ 34a9643ea8Slogwang */ 35a9643ea8Slogwang 36a9643ea8Slogwang #ifndef _SYS_SOCKETVAR_H_ 37a9643ea8Slogwang #define _SYS_SOCKETVAR_H_ 38a9643ea8Slogwang 39*22ce4affSfengbojiang /* 40*22ce4affSfengbojiang * Socket generation count type. Also used in xinpcb, xtcpcb, xunpcb. 41*22ce4affSfengbojiang */ 42*22ce4affSfengbojiang typedef uint64_t so_gen_t; 43*22ce4affSfengbojiang 44*22ce4affSfengbojiang #if defined(_KERNEL) || defined(_WANT_SOCKET) 45a9643ea8Slogwang #include <sys/queue.h> /* for TAILQ macros */ 46a9643ea8Slogwang #include <sys/selinfo.h> /* for struct selinfo */ 47a9643ea8Slogwang #include <sys/_lock.h> 48a9643ea8Slogwang #include <sys/_mutex.h> 49a9643ea8Slogwang #include <sys/osd.h> 50a9643ea8Slogwang #include <sys/_sx.h> 51a9643ea8Slogwang #include <sys/sockbuf.h> 52a9643ea8Slogwang #ifdef _KERNEL 53a9643ea8Slogwang #include <sys/caprights.h> 54a9643ea8Slogwang #include <sys/sockopt.h> 55a9643ea8Slogwang #endif 56a9643ea8Slogwang 57a9643ea8Slogwang struct vnet; 58a9643ea8Slogwang 59a9643ea8Slogwang /* 60a9643ea8Slogwang * Kernel structure per socket. 61a9643ea8Slogwang * Contains send and receive buffer queues, 62a9643ea8Slogwang * handle on protocol and pointer to protocol 63a9643ea8Slogwang * private data and error information. 64a9643ea8Slogwang */ 65*22ce4affSfengbojiang typedef int so_upcall_t(struct socket *, void *, int); 66*22ce4affSfengbojiang typedef void so_dtor_t(struct socket *); 67a9643ea8Slogwang 68a9643ea8Slogwang struct socket; 69a9643ea8Slogwang 70*22ce4affSfengbojiang enum socket_qstate { 71*22ce4affSfengbojiang SQ_NONE = 0, 72*22ce4affSfengbojiang SQ_INCOMP = 0x0800, /* on sol_incomp */ 73*22ce4affSfengbojiang SQ_COMP = 0x1000, /* on sol_comp */ 74*22ce4affSfengbojiang }; 75*22ce4affSfengbojiang 76a9643ea8Slogwang /*- 77a9643ea8Slogwang * Locking key to struct socket: 78a9643ea8Slogwang * (a) constant after allocation, no locking required. 79a9643ea8Slogwang * (b) locked by SOCK_LOCK(so). 80*22ce4affSfengbojiang * (cr) locked by SOCKBUF_LOCK(&so->so_rcv). 81*22ce4affSfengbojiang * (cs) locked by SOCKBUF_LOCK(&so->so_snd). 82*22ce4affSfengbojiang * (e) locked by SOLISTEN_LOCK() of corresponding listening socket. 83a9643ea8Slogwang * (f) not locked since integer reads/writes are atomic. 84a9643ea8Slogwang * (g) used only as a sleep/wakeup address, no value. 85a9643ea8Slogwang * (h) locked by global mutex so_global_mtx. 86*22ce4affSfengbojiang * (k) locked by KTLS workqueue mutex 87a9643ea8Slogwang */ 88*22ce4affSfengbojiang TAILQ_HEAD(accept_queue, socket); 89a9643ea8Slogwang struct socket { 90*22ce4affSfengbojiang struct mtx so_lock; 91*22ce4affSfengbojiang volatile u_int so_count; /* (b / refcount) */ 92*22ce4affSfengbojiang struct selinfo so_rdsel; /* (b/cr) for so_rcv/so_comp */ 93*22ce4affSfengbojiang struct selinfo so_wrsel; /* (b/cs) for so_snd */ 94a9643ea8Slogwang short so_type; /* (a) generic type, see socket.h */ 95*22ce4affSfengbojiang int so_options; /* (b) from socket call, see socket.h */ 96*22ce4affSfengbojiang short so_linger; /* time to linger close(2) */ 97a9643ea8Slogwang short so_state; /* (b) internal state flags SS_* */ 98a9643ea8Slogwang void *so_pcb; /* protocol control block */ 99a9643ea8Slogwang struct vnet *so_vnet; /* (a) network stack instance */ 100a9643ea8Slogwang struct protosw *so_proto; /* (a) protocol handle */ 101a9643ea8Slogwang short so_timeo; /* (g) connection timeout */ 102a9643ea8Slogwang u_short so_error; /* (f) error affecting connection */ 103a9643ea8Slogwang struct sigio *so_sigio; /* [sg] information for async I/O or 104a9643ea8Slogwang out of band data (SIGURG) */ 105a9643ea8Slogwang struct ucred *so_cred; /* (a) user credentials */ 106a9643ea8Slogwang struct label *so_label; /* (b) MAC label for socket */ 107a9643ea8Slogwang /* NB: generation count must not be first. */ 108a9643ea8Slogwang so_gen_t so_gencnt; /* (h) generation count */ 109a9643ea8Slogwang void *so_emuldata; /* (b) private data for emulators */ 110*22ce4affSfengbojiang so_dtor_t *so_dtor; /* (b) optional destructor */ 111a9643ea8Slogwang struct osd osd; /* Object Specific extensions */ 112a9643ea8Slogwang /* 113a9643ea8Slogwang * so_fibnum, so_user_cookie and friends can be used to attach 114a9643ea8Slogwang * some user-specified metadata to a socket, which then can be 115a9643ea8Slogwang * used by the kernel for various actions. 116a9643ea8Slogwang * so_user_cookie is used by ipfw/dummynet. 117a9643ea8Slogwang */ 118a9643ea8Slogwang int so_fibnum; /* routing domain for this socket */ 119a9643ea8Slogwang uint32_t so_user_cookie; 120a9643ea8Slogwang 121*22ce4affSfengbojiang int so_ts_clock; /* type of the clock used for timestamps */ 122*22ce4affSfengbojiang uint32_t so_max_pacing_rate; /* (f) TX rate limit in bytes/s */ 123*22ce4affSfengbojiang union { 124*22ce4affSfengbojiang /* Regular (data flow) socket. */ 125*22ce4affSfengbojiang struct { 126*22ce4affSfengbojiang /* (cr, cs) Receive and send buffers. */ 127*22ce4affSfengbojiang struct sockbuf so_rcv, so_snd; 128*22ce4affSfengbojiang 129*22ce4affSfengbojiang /* (e) Our place on accept queue. */ 130*22ce4affSfengbojiang TAILQ_ENTRY(socket) so_list; 131*22ce4affSfengbojiang struct socket *so_listen; /* (b) */ 132*22ce4affSfengbojiang enum socket_qstate so_qstate; /* (b) */ 133*22ce4affSfengbojiang /* (b) cached MAC label for peer */ 134*22ce4affSfengbojiang struct label *so_peerlabel; 135*22ce4affSfengbojiang u_long so_oobmark; /* chars to oob mark */ 136*22ce4affSfengbojiang 137*22ce4affSfengbojiang /* (k) Our place on KTLS RX work queue. */ 138*22ce4affSfengbojiang STAILQ_ENTRY(socket) so_ktls_rx_list; 139*22ce4affSfengbojiang }; 140*22ce4affSfengbojiang /* 141*22ce4affSfengbojiang * Listening socket, where accepts occur, is so_listen in all 142*22ce4affSfengbojiang * subsidiary sockets. If so_listen is NULL, socket is not 143*22ce4affSfengbojiang * related to an accept. For a listening socket itself 144*22ce4affSfengbojiang * sol_incomp queues partially completed connections, while 145*22ce4affSfengbojiang * sol_comp is a queue of connections ready to be accepted. 146*22ce4affSfengbojiang * If a connection is aborted and it has so_listen set, then 147*22ce4affSfengbojiang * it has to be pulled out of either sol_incomp or sol_comp. 148*22ce4affSfengbojiang * We allow connections to queue up based on current queue 149*22ce4affSfengbojiang * lengths and limit on number of queued connections for this 150*22ce4affSfengbojiang * socket. 151*22ce4affSfengbojiang */ 152*22ce4affSfengbojiang struct { 153*22ce4affSfengbojiang /* (e) queue of partial unaccepted connections */ 154*22ce4affSfengbojiang struct accept_queue sol_incomp; 155*22ce4affSfengbojiang /* (e) queue of complete unaccepted connections */ 156*22ce4affSfengbojiang struct accept_queue sol_comp; 157*22ce4affSfengbojiang u_int sol_qlen; /* (e) sol_comp length */ 158*22ce4affSfengbojiang u_int sol_incqlen; /* (e) sol_incomp length */ 159*22ce4affSfengbojiang u_int sol_qlimit; /* (e) queue limit */ 160*22ce4affSfengbojiang 161*22ce4affSfengbojiang /* accept_filter(9) optional data */ 162*22ce4affSfengbojiang struct accept_filter *sol_accept_filter; 163*22ce4affSfengbojiang void *sol_accept_filter_arg; /* saved filter args */ 164*22ce4affSfengbojiang char *sol_accept_filter_str; /* saved user args */ 165*22ce4affSfengbojiang 166*22ce4affSfengbojiang /* Optional upcall, for kernel socket. */ 167*22ce4affSfengbojiang so_upcall_t *sol_upcall; /* (e) */ 168*22ce4affSfengbojiang void *sol_upcallarg; /* (e) */ 169*22ce4affSfengbojiang 170*22ce4affSfengbojiang /* Socket buffer parameters, to be copied to 171*22ce4affSfengbojiang * dataflow sockets, accepted from this one. */ 172*22ce4affSfengbojiang int sol_sbrcv_lowat; 173*22ce4affSfengbojiang int sol_sbsnd_lowat; 174*22ce4affSfengbojiang u_int sol_sbrcv_hiwat; 175*22ce4affSfengbojiang u_int sol_sbsnd_hiwat; 176*22ce4affSfengbojiang short sol_sbrcv_flags; 177*22ce4affSfengbojiang short sol_sbsnd_flags; 178*22ce4affSfengbojiang sbintime_t sol_sbrcv_timeo; 179*22ce4affSfengbojiang sbintime_t sol_sbsnd_timeo; 180*22ce4affSfengbojiang 181*22ce4affSfengbojiang /* Information tracking listen queue overflows. */ 182*22ce4affSfengbojiang struct timeval sol_lastover; /* (e) */ 183*22ce4affSfengbojiang int sol_overcount; /* (e) */ 184*22ce4affSfengbojiang }; 185*22ce4affSfengbojiang }; 18608dba010SAndy #ifdef LVS_TCPOPT_TOA 18708dba010SAndy uint8_t so_toa[8]; /* lvs toa option */ 18808dba010SAndy #endif 189a9643ea8Slogwang }; 190*22ce4affSfengbojiang #endif /* defined(_KERNEL) || defined(_WANT_SOCKET) */ 191a9643ea8Slogwang 192a9643ea8Slogwang /* 193*22ce4affSfengbojiang * Socket state bits. 194*22ce4affSfengbojiang * 195*22ce4affSfengbojiang * Historically, these bits were all kept in the so_state field. 196*22ce4affSfengbojiang * They are now split into separate, lock-specific fields. 197*22ce4affSfengbojiang * so_state maintains basic socket state protected by the socket lock. 198*22ce4affSfengbojiang * so_qstate holds information about the socket accept queues. 199*22ce4affSfengbojiang * Each socket buffer also has a state field holding information 200*22ce4affSfengbojiang * relevant to that socket buffer (can't send, rcv). 201*22ce4affSfengbojiang * Many fields will be read without locks to improve performance and avoid 202*22ce4affSfengbojiang * lock order issues. However, this approach must be used with caution. 203a9643ea8Slogwang */ 204*22ce4affSfengbojiang #define SS_NOFDREF 0x0001 /* no file table ref any more */ 205*22ce4affSfengbojiang #define SS_ISCONNECTED 0x0002 /* socket connected to a peer */ 206*22ce4affSfengbojiang #define SS_ISCONNECTING 0x0004 /* in process of connecting to peer */ 207*22ce4affSfengbojiang #define SS_ISDISCONNECTING 0x0008 /* in process of disconnecting */ 208*22ce4affSfengbojiang #define SS_NBIO 0x0100 /* non-blocking ops */ 209*22ce4affSfengbojiang #define SS_ASYNC 0x0200 /* async i/o notify */ 210*22ce4affSfengbojiang #define SS_ISCONFIRMING 0x0400 /* deciding to accept connection req */ 211*22ce4affSfengbojiang #define SS_ISDISCONNECTED 0x2000 /* socket disconnected from peer */ 212a9643ea8Slogwang 213a9643ea8Slogwang /* 214*22ce4affSfengbojiang * Protocols can mark a socket as SS_PROTOREF to indicate that, following 215*22ce4affSfengbojiang * pru_detach, they still want the socket to persist, and will free it 216*22ce4affSfengbojiang * themselves when they are done. Protocols should only ever call sofree() 217*22ce4affSfengbojiang * following setting this flag in pru_detach(), and never otherwise, as 218*22ce4affSfengbojiang * sofree() bypasses socket reference counting. 219a9643ea8Slogwang */ 220*22ce4affSfengbojiang #define SS_PROTOREF 0x4000 /* strong protocol reference */ 221a9643ea8Slogwang 222a9643ea8Slogwang #ifdef _KERNEL 223a9643ea8Slogwang 224*22ce4affSfengbojiang #define SOCK_MTX(so) &(so)->so_lock 225*22ce4affSfengbojiang #define SOCK_LOCK(so) mtx_lock(&(so)->so_lock) 226*22ce4affSfengbojiang #define SOCK_OWNED(so) mtx_owned(&(so)->so_lock) 227*22ce4affSfengbojiang #define SOCK_UNLOCK(so) mtx_unlock(&(so)->so_lock) 228*22ce4affSfengbojiang #define SOCK_LOCK_ASSERT(so) mtx_assert(&(so)->so_lock, MA_OWNED) 229*22ce4affSfengbojiang #define SOCK_UNLOCK_ASSERT(so) mtx_assert(&(so)->so_lock, MA_NOTOWNED) 230*22ce4affSfengbojiang 231*22ce4affSfengbojiang #define SOLISTENING(sol) (((sol)->so_options & SO_ACCEPTCONN) != 0) 232*22ce4affSfengbojiang #define SOLISTEN_LOCK(sol) do { \ 233*22ce4affSfengbojiang mtx_lock(&(sol)->so_lock); \ 234*22ce4affSfengbojiang KASSERT(SOLISTENING(sol), \ 235*22ce4affSfengbojiang ("%s: %p not listening", __func__, (sol))); \ 236*22ce4affSfengbojiang } while (0) 237*22ce4affSfengbojiang #define SOLISTEN_TRYLOCK(sol) mtx_trylock(&(sol)->so_lock) 238*22ce4affSfengbojiang #define SOLISTEN_UNLOCK(sol) do { \ 239*22ce4affSfengbojiang KASSERT(SOLISTENING(sol), \ 240*22ce4affSfengbojiang ("%s: %p not listening", __func__, (sol))); \ 241*22ce4affSfengbojiang mtx_unlock(&(sol)->so_lock); \ 242*22ce4affSfengbojiang } while (0) 243*22ce4affSfengbojiang #define SOLISTEN_LOCK_ASSERT(sol) do { \ 244*22ce4affSfengbojiang mtx_assert(&(sol)->so_lock, MA_OWNED); \ 245*22ce4affSfengbojiang KASSERT(SOLISTENING(sol), \ 246*22ce4affSfengbojiang ("%s: %p not listening", __func__, (sol))); \ 247*22ce4affSfengbojiang } while (0) 248*22ce4affSfengbojiang 249a9643ea8Slogwang /* 250a9643ea8Slogwang * Macros for sockets and socket buffering. 251a9643ea8Slogwang */ 252a9643ea8Slogwang 253a9643ea8Slogwang /* 254a9643ea8Slogwang * Flags to sblock(). 255a9643ea8Slogwang */ 256a9643ea8Slogwang #define SBL_WAIT 0x00000001 /* Wait if not immediately available. */ 257a9643ea8Slogwang #define SBL_NOINTR 0x00000002 /* Force non-interruptible sleep. */ 258a9643ea8Slogwang #define SBL_VALID (SBL_WAIT | SBL_NOINTR) 259a9643ea8Slogwang 260a9643ea8Slogwang /* 261a9643ea8Slogwang * Do we need to notify the other side when I/O is possible? 262a9643ea8Slogwang */ 263a9643ea8Slogwang #define sb_notify(sb) (((sb)->sb_flags & (SB_WAIT | SB_SEL | SB_ASYNC | \ 264a9643ea8Slogwang SB_UPCALL | SB_AIO | SB_KNOTE)) != 0) 265a9643ea8Slogwang 266a9643ea8Slogwang /* do we have to send all at once on a socket? */ 267a9643ea8Slogwang #define sosendallatonce(so) \ 268a9643ea8Slogwang ((so)->so_proto->pr_flags & PR_ATOMIC) 269a9643ea8Slogwang 270a9643ea8Slogwang /* can we read something from so? */ 271a9643ea8Slogwang #define soreadabledata(so) \ 272*22ce4affSfengbojiang (sbavail(&(so)->so_rcv) >= (so)->so_rcv.sb_lowat || (so)->so_error) 273a9643ea8Slogwang #define soreadable(so) \ 274a9643ea8Slogwang (soreadabledata(so) || ((so)->so_rcv.sb_state & SBS_CANTRCVMORE)) 275a9643ea8Slogwang 276a9643ea8Slogwang /* can we write something to so? */ 277a9643ea8Slogwang #define sowriteable(so) \ 278a9643ea8Slogwang ((sbspace(&(so)->so_snd) >= (so)->so_snd.sb_lowat && \ 279a9643ea8Slogwang (((so)->so_state&SS_ISCONNECTED) || \ 280a9643ea8Slogwang ((so)->so_proto->pr_flags&PR_CONNREQUIRED)==0)) || \ 281a9643ea8Slogwang ((so)->so_snd.sb_state & SBS_CANTSENDMORE) || \ 282a9643ea8Slogwang (so)->so_error) 283a9643ea8Slogwang 284a9643ea8Slogwang /* 285*22ce4affSfengbojiang * soref()/sorele() ref-count the socket structure. 286*22ce4affSfengbojiang * soref() may be called without owning socket lock, but in that case a 287*22ce4affSfengbojiang * caller must own something that holds socket, and so_count must be not 0. 288*22ce4affSfengbojiang * Note that you must still explicitly close the socket, but the last ref 289*22ce4affSfengbojiang * count will free the structure. 290a9643ea8Slogwang */ 291*22ce4affSfengbojiang #define soref(so) refcount_acquire(&(so)->so_count) 292a9643ea8Slogwang #define sorele(so) do { \ 293a9643ea8Slogwang SOCK_LOCK_ASSERT(so); \ 294*22ce4affSfengbojiang if (refcount_release(&(so)->so_count)) \ 295a9643ea8Slogwang sofree(so); \ 296*22ce4affSfengbojiang else \ 297a9643ea8Slogwang SOCK_UNLOCK(so); \ 298a9643ea8Slogwang } while (0) 299a9643ea8Slogwang 300a9643ea8Slogwang /* 301a9643ea8Slogwang * In sorwakeup() and sowwakeup(), acquire the socket buffer lock to 302a9643ea8Slogwang * avoid a non-atomic test-and-wakeup. However, sowakeup is 303a9643ea8Slogwang * responsible for releasing the lock if it is called. We unlock only 304a9643ea8Slogwang * if we don't call into sowakeup. If any code is introduced that 305a9643ea8Slogwang * directly invokes the underlying sowakeup() primitives, it must 306a9643ea8Slogwang * maintain the same semantics. 307a9643ea8Slogwang */ 308a9643ea8Slogwang #define sorwakeup_locked(so) do { \ 309a9643ea8Slogwang SOCKBUF_LOCK_ASSERT(&(so)->so_rcv); \ 310a9643ea8Slogwang if (sb_notify(&(so)->so_rcv)) \ 311a9643ea8Slogwang sowakeup((so), &(so)->so_rcv); \ 312a9643ea8Slogwang else \ 313a9643ea8Slogwang SOCKBUF_UNLOCK(&(so)->so_rcv); \ 314a9643ea8Slogwang } while (0) 315a9643ea8Slogwang 316a9643ea8Slogwang #define sorwakeup(so) do { \ 317a9643ea8Slogwang SOCKBUF_LOCK(&(so)->so_rcv); \ 318a9643ea8Slogwang sorwakeup_locked(so); \ 319a9643ea8Slogwang } while (0) 320a9643ea8Slogwang 321a9643ea8Slogwang #define sowwakeup_locked(so) do { \ 322a9643ea8Slogwang SOCKBUF_LOCK_ASSERT(&(so)->so_snd); \ 323a9643ea8Slogwang if (sb_notify(&(so)->so_snd)) \ 324a9643ea8Slogwang sowakeup((so), &(so)->so_snd); \ 325a9643ea8Slogwang else \ 326a9643ea8Slogwang SOCKBUF_UNLOCK(&(so)->so_snd); \ 327a9643ea8Slogwang } while (0) 328a9643ea8Slogwang 329a9643ea8Slogwang #define sowwakeup(so) do { \ 330a9643ea8Slogwang SOCKBUF_LOCK(&(so)->so_snd); \ 331a9643ea8Slogwang sowwakeup_locked(so); \ 332a9643ea8Slogwang } while (0) 333a9643ea8Slogwang 334a9643ea8Slogwang struct accept_filter { 335a9643ea8Slogwang char accf_name[16]; 336a9643ea8Slogwang int (*accf_callback) 337a9643ea8Slogwang (struct socket *so, void *arg, int waitflag); 338a9643ea8Slogwang void * (*accf_create) 339a9643ea8Slogwang (struct socket *so, char *arg); 340a9643ea8Slogwang void (*accf_destroy) 341a9643ea8Slogwang (struct socket *so); 342a9643ea8Slogwang SLIST_ENTRY(accept_filter) accf_next; 343a9643ea8Slogwang }; 344a9643ea8Slogwang 345*22ce4affSfengbojiang #define ACCEPT_FILTER_DEFINE(modname, filtname, cb, create, destroy, ver) \ 346*22ce4affSfengbojiang static struct accept_filter modname##_filter = { \ 347*22ce4affSfengbojiang .accf_name = filtname, \ 348*22ce4affSfengbojiang .accf_callback = cb, \ 349*22ce4affSfengbojiang .accf_create = create, \ 350*22ce4affSfengbojiang .accf_destroy = destroy, \ 351*22ce4affSfengbojiang }; \ 352*22ce4affSfengbojiang static moduledata_t modname##_mod = { \ 353*22ce4affSfengbojiang .name = __XSTRING(modname), \ 354*22ce4affSfengbojiang .evhand = accept_filt_generic_mod_event, \ 355*22ce4affSfengbojiang .priv = &modname##_filter, \ 356*22ce4affSfengbojiang }; \ 357*22ce4affSfengbojiang DECLARE_MODULE(modname, modname##_mod, SI_SUB_DRIVERS, \ 358*22ce4affSfengbojiang SI_ORDER_MIDDLE); \ 359*22ce4affSfengbojiang MODULE_VERSION(modname, ver) 360*22ce4affSfengbojiang 361a9643ea8Slogwang #ifdef MALLOC_DECLARE 362a9643ea8Slogwang MALLOC_DECLARE(M_ACCF); 363a9643ea8Slogwang MALLOC_DECLARE(M_PCB); 364a9643ea8Slogwang MALLOC_DECLARE(M_SONAME); 365a9643ea8Slogwang #endif 366a9643ea8Slogwang 367a9643ea8Slogwang /* 368a9643ea8Slogwang * Socket specific helper hook point identifiers 369a9643ea8Slogwang * Do not leave holes in the sequence, hook registration is a loop. 370a9643ea8Slogwang */ 371a9643ea8Slogwang #define HHOOK_SOCKET_OPT 0 372a9643ea8Slogwang #define HHOOK_SOCKET_CREATE 1 373a9643ea8Slogwang #define HHOOK_SOCKET_RCV 2 374a9643ea8Slogwang #define HHOOK_SOCKET_SND 3 375a9643ea8Slogwang #define HHOOK_FILT_SOREAD 4 376a9643ea8Slogwang #define HHOOK_FILT_SOWRITE 5 377a9643ea8Slogwang #define HHOOK_SOCKET_CLOSE 6 378a9643ea8Slogwang #define HHOOK_SOCKET_LAST HHOOK_SOCKET_CLOSE 379a9643ea8Slogwang 380a9643ea8Slogwang struct socket_hhook_data { 381a9643ea8Slogwang struct socket *so; 382a9643ea8Slogwang struct mbuf *m; 383a9643ea8Slogwang void *hctx; /* hook point specific data*/ 384a9643ea8Slogwang int status; 385a9643ea8Slogwang }; 386a9643ea8Slogwang 387a9643ea8Slogwang extern int maxsockets; 388a9643ea8Slogwang extern u_long sb_max; 389a9643ea8Slogwang extern so_gen_t so_gencnt; 390a9643ea8Slogwang 391a9643ea8Slogwang struct file; 392*22ce4affSfengbojiang struct filecaps; 393a9643ea8Slogwang struct filedesc; 394a9643ea8Slogwang struct mbuf; 395a9643ea8Slogwang struct sockaddr; 396a9643ea8Slogwang struct ucred; 397a9643ea8Slogwang struct uio; 398a9643ea8Slogwang 399a9643ea8Slogwang /* 'which' values for socket upcalls. */ 400a9643ea8Slogwang #define SO_RCV 1 401a9643ea8Slogwang #define SO_SND 2 402a9643ea8Slogwang 403a9643ea8Slogwang /* Return values for socket upcalls. */ 404a9643ea8Slogwang #define SU_OK 0 405a9643ea8Slogwang #define SU_ISCONNECTED 1 406a9643ea8Slogwang 407a9643ea8Slogwang /* 408a9643ea8Slogwang * From uipc_socket and friends 409a9643ea8Slogwang */ 410*22ce4affSfengbojiang int getsockaddr(struct sockaddr **namp, const struct sockaddr *uaddr, 411*22ce4affSfengbojiang size_t len); 412a9643ea8Slogwang int getsock_cap(struct thread *td, int fd, cap_rights_t *rightsp, 413*22ce4affSfengbojiang struct file **fpp, u_int *fflagp, struct filecaps *havecaps); 414a9643ea8Slogwang void soabort(struct socket *so); 415a9643ea8Slogwang int soaccept(struct socket *so, struct sockaddr **nam); 416a9643ea8Slogwang void soaio_enqueue(struct task *task); 417a9643ea8Slogwang void soaio_rcv(void *context, int pending); 418a9643ea8Slogwang void soaio_snd(void *context, int pending); 419a9643ea8Slogwang int socheckuid(struct socket *so, uid_t uid); 420a9643ea8Slogwang int sobind(struct socket *so, struct sockaddr *nam, struct thread *td); 421a9643ea8Slogwang int sobindat(int fd, struct socket *so, struct sockaddr *nam, 422a9643ea8Slogwang struct thread *td); 423a9643ea8Slogwang int soclose(struct socket *so); 424a9643ea8Slogwang int soconnect(struct socket *so, struct sockaddr *nam, struct thread *td); 425a9643ea8Slogwang int soconnectat(int fd, struct socket *so, struct sockaddr *nam, 426a9643ea8Slogwang struct thread *td); 427a9643ea8Slogwang int soconnect2(struct socket *so1, struct socket *so2); 428a9643ea8Slogwang int socreate(int dom, struct socket **aso, int type, int proto, 429a9643ea8Slogwang struct ucred *cred, struct thread *td); 430a9643ea8Slogwang int sodisconnect(struct socket *so); 431*22ce4affSfengbojiang void sodtor_set(struct socket *, so_dtor_t *); 432a9643ea8Slogwang struct sockaddr *sodupsockaddr(const struct sockaddr *sa, int mflags); 433a9643ea8Slogwang void sofree(struct socket *so); 434a9643ea8Slogwang void sohasoutofband(struct socket *so); 435a9643ea8Slogwang int solisten(struct socket *so, int backlog, struct thread *td); 436a9643ea8Slogwang void solisten_proto(struct socket *so, int backlog); 437a9643ea8Slogwang int solisten_proto_check(struct socket *so); 438*22ce4affSfengbojiang int solisten_dequeue(struct socket *, struct socket **, int); 439a9643ea8Slogwang struct socket * 440a9643ea8Slogwang sonewconn(struct socket *head, int connstatus); 441*22ce4affSfengbojiang struct socket * 442*22ce4affSfengbojiang sopeeloff(struct socket *); 443a9643ea8Slogwang int sopoll(struct socket *so, int events, struct ucred *active_cred, 444a9643ea8Slogwang struct thread *td); 445a9643ea8Slogwang int sopoll_generic(struct socket *so, int events, 446a9643ea8Slogwang struct ucred *active_cred, struct thread *td); 447a9643ea8Slogwang int soreceive(struct socket *so, struct sockaddr **paddr, struct uio *uio, 448a9643ea8Slogwang struct mbuf **mp0, struct mbuf **controlp, int *flagsp); 449a9643ea8Slogwang int soreceive_stream(struct socket *so, struct sockaddr **paddr, 450a9643ea8Slogwang struct uio *uio, struct mbuf **mp0, struct mbuf **controlp, 451a9643ea8Slogwang int *flagsp); 452a9643ea8Slogwang int soreceive_dgram(struct socket *so, struct sockaddr **paddr, 453a9643ea8Slogwang struct uio *uio, struct mbuf **mp0, struct mbuf **controlp, 454a9643ea8Slogwang int *flagsp); 455a9643ea8Slogwang int soreceive_generic(struct socket *so, struct sockaddr **paddr, 456a9643ea8Slogwang struct uio *uio, struct mbuf **mp0, struct mbuf **controlp, 457a9643ea8Slogwang int *flagsp); 458a9643ea8Slogwang int soreserve(struct socket *so, u_long sndcc, u_long rcvcc); 459a9643ea8Slogwang void sorflush(struct socket *so); 460a9643ea8Slogwang int sosend(struct socket *so, struct sockaddr *addr, struct uio *uio, 461a9643ea8Slogwang struct mbuf *top, struct mbuf *control, int flags, 462a9643ea8Slogwang struct thread *td); 463a9643ea8Slogwang int sosend_dgram(struct socket *so, struct sockaddr *addr, 464a9643ea8Slogwang struct uio *uio, struct mbuf *top, struct mbuf *control, 465a9643ea8Slogwang int flags, struct thread *td); 466a9643ea8Slogwang int sosend_generic(struct socket *so, struct sockaddr *addr, 467a9643ea8Slogwang struct uio *uio, struct mbuf *top, struct mbuf *control, 468a9643ea8Slogwang int flags, struct thread *td); 469a9643ea8Slogwang int soshutdown(struct socket *so, int how); 470*22ce4affSfengbojiang void soupcall_clear(struct socket *, int); 471*22ce4affSfengbojiang void soupcall_set(struct socket *, int, so_upcall_t, void *); 472*22ce4affSfengbojiang void solisten_upcall_set(struct socket *, so_upcall_t, void *); 473a9643ea8Slogwang void sowakeup(struct socket *so, struct sockbuf *sb); 474a9643ea8Slogwang void sowakeup_aio(struct socket *so, struct sockbuf *sb); 475*22ce4affSfengbojiang void solisten_wakeup(struct socket *); 476a9643ea8Slogwang int selsocket(struct socket *so, int events, struct timeval *tv, 477a9643ea8Slogwang struct thread *td); 478*22ce4affSfengbojiang void soisconnected(struct socket *so); 479*22ce4affSfengbojiang void soisconnecting(struct socket *so); 480*22ce4affSfengbojiang void soisdisconnected(struct socket *so); 481*22ce4affSfengbojiang void soisdisconnecting(struct socket *so); 482*22ce4affSfengbojiang void socantrcvmore(struct socket *so); 483*22ce4affSfengbojiang void socantrcvmore_locked(struct socket *so); 484*22ce4affSfengbojiang void socantsendmore(struct socket *so); 485*22ce4affSfengbojiang void socantsendmore_locked(struct socket *so); 486a9643ea8Slogwang 487a9643ea8Slogwang /* 488a9643ea8Slogwang * Accept filter functions (duh). 489a9643ea8Slogwang */ 490a9643ea8Slogwang int accept_filt_add(struct accept_filter *filt); 491a9643ea8Slogwang int accept_filt_del(char *name); 492a9643ea8Slogwang struct accept_filter *accept_filt_get(char *name); 493a9643ea8Slogwang #ifdef ACCEPT_FILTER_MOD 494a9643ea8Slogwang #ifdef SYSCTL_DECL 495a9643ea8Slogwang SYSCTL_DECL(_net_inet_accf); 496a9643ea8Slogwang #endif 497a9643ea8Slogwang int accept_filt_generic_mod_event(module_t mod, int event, void *data); 498a9643ea8Slogwang #endif 499a9643ea8Slogwang 500a9643ea8Slogwang #endif /* _KERNEL */ 501a9643ea8Slogwang 502*22ce4affSfengbojiang /* 503*22ce4affSfengbojiang * Structure to export socket from kernel to utilities, via sysctl(3). 504*22ce4affSfengbojiang */ 505*22ce4affSfengbojiang struct xsocket { 506*22ce4affSfengbojiang ksize_t xso_len; /* length of this structure */ 507*22ce4affSfengbojiang kvaddr_t xso_so; /* kernel address of struct socket */ 508*22ce4affSfengbojiang kvaddr_t so_pcb; /* kernel address of struct inpcb */ 509*22ce4affSfengbojiang uint64_t so_oobmark; 510*22ce4affSfengbojiang int64_t so_spare64[8]; 511*22ce4affSfengbojiang int32_t xso_protocol; 512*22ce4affSfengbojiang int32_t xso_family; 513*22ce4affSfengbojiang uint32_t so_qlen; 514*22ce4affSfengbojiang uint32_t so_incqlen; 515*22ce4affSfengbojiang uint32_t so_qlimit; 516*22ce4affSfengbojiang pid_t so_pgid; 517*22ce4affSfengbojiang uid_t so_uid; 518*22ce4affSfengbojiang int32_t so_spare32[8]; 519*22ce4affSfengbojiang int16_t so_type; 520*22ce4affSfengbojiang int16_t so_options; 521*22ce4affSfengbojiang int16_t so_linger; 522*22ce4affSfengbojiang int16_t so_state; 523*22ce4affSfengbojiang int16_t so_timeo; 524*22ce4affSfengbojiang uint16_t so_error; 525*22ce4affSfengbojiang struct xsockbuf { 526*22ce4affSfengbojiang uint32_t sb_cc; 527*22ce4affSfengbojiang uint32_t sb_hiwat; 528*22ce4affSfengbojiang uint32_t sb_mbcnt; 529*22ce4affSfengbojiang uint32_t sb_mcnt; 530*22ce4affSfengbojiang uint32_t sb_ccnt; 531*22ce4affSfengbojiang uint32_t sb_mbmax; 532*22ce4affSfengbojiang int32_t sb_lowat; 533*22ce4affSfengbojiang int32_t sb_timeo; 534*22ce4affSfengbojiang int16_t sb_flags; 535*22ce4affSfengbojiang } so_rcv, so_snd; 536*22ce4affSfengbojiang }; 537*22ce4affSfengbojiang 538*22ce4affSfengbojiang #ifdef _KERNEL 539*22ce4affSfengbojiang void sotoxsocket(struct socket *so, struct xsocket *xso); 540*22ce4affSfengbojiang void sbtoxsockbuf(struct sockbuf *sb, struct xsockbuf *xsb); 541*22ce4affSfengbojiang #endif 542*22ce4affSfengbojiang 543*22ce4affSfengbojiang /* 544*22ce4affSfengbojiang * Socket buffer state bits. Exported via libprocstat(3). 545*22ce4affSfengbojiang */ 546*22ce4affSfengbojiang #define SBS_CANTSENDMORE 0x0010 /* can't send more data to peer */ 547*22ce4affSfengbojiang #define SBS_CANTRCVMORE 0x0020 /* can't receive more data from peer */ 548*22ce4affSfengbojiang #define SBS_RCVATMARK 0x0040 /* at mark on input */ 549*22ce4affSfengbojiang 550a9643ea8Slogwang #endif /* !_SYS_SOCKETVAR_H_ */ 551