/*-
 * SPDX-License-Identifier: BSD-3-Clause
 *
 * Copyright (c) 1982, 1986, 1993
 *	The Regents of the University of California.  All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. Neither the name of the University nor the names of its contributors
 *    may be used to endorse or promote products derived from this software
 *    without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 *
 *	@(#)tcp.h	8.1 (Berkeley) 6/10/93
 * $FreeBSD$
 */

#ifndef _NETINET_TCP_H_
#define _NETINET_TCP_H_

#include <sys/cdefs.h>
#include <sys/types.h>

#if __BSD_VISIBLE

typedef	u_int32_t tcp_seq;

#define tcp6_seq	tcp_seq	/* for KAME src sync over BSD*'s */
#define tcp6hdr		tcphdr	/* for KAME src sync over BSD*'s */

/*
 * TCP header.
 * Per RFC 793, September, 1981.
 */
struct tcphdr {
	u_short	th_sport;		/* source port */
	u_short	th_dport;		/* destination port */
	tcp_seq	th_seq;			/* sequence number */
	tcp_seq	th_ack;			/* acknowledgement number */
#if BYTE_ORDER == LITTLE_ENDIAN
	u_char	th_x2:4,		/* (unused) */
		th_off:4;		/* data offset */
#endif
#if BYTE_ORDER == BIG_ENDIAN
	u_char	th_off:4,		/* data offset */
		th_x2:4;		/* (unused) */
#endif
	u_char	th_flags;		/* control flags, TH_* bits below */
#define	TH_FIN	0x01
#define	TH_SYN	0x02
#define	TH_RST	0x04
#define	TH_PUSH	0x08
#define	TH_ACK	0x10
#define	TH_URG	0x20
#define	TH_ECE	0x40
#define	TH_CWR	0x80
#define	TH_AE	0x100			/* maps into th_x2 */
#define	TH_FLAGS	(TH_FIN|TH_SYN|TH_RST|TH_PUSH|TH_ACK|TH_URG|TH_ECE|TH_CWR)
#define	PRINT_TH_FLAGS	"\20\1FIN\2SYN\3RST\4PUSH\5ACK\6URG\7ECE\10CWR\11AE"

	u_short	th_win;			/* window */
	u_short	th_sum;			/* checksum */
	u_short	th_urp;			/* urgent pointer */
};

/*
 * Round an option length up to the next multiple of 4.
 * Note: (len) is evaluated twice, so avoid arguments with side effects.
 */
#define	PADTCPOLEN(len)	((((len) / 4) + !!((len) % 4)) * 4)

#define	TCPOPT_EOL		0
#define	   TCPOLEN_EOL			1
#define	TCPOPT_PAD		0		/* padding after EOL */
#define	   TCPOLEN_PAD			1
#define	TCPOPT_NOP		1
#define	   TCPOLEN_NOP			1
#define	TCPOPT_MAXSEG		2
#define	   TCPOLEN_MAXSEG		4
#define	TCPOPT_WINDOW		3
#define	   TCPOLEN_WINDOW		3
#define	TCPOPT_SACK_PERMITTED	4
#define	   TCPOLEN_SACK_PERMITTED	2
#define	TCPOPT_SACK		5
#define	   TCPOLEN_SACKHDR		2
#define	   TCPOLEN_SACK			8	/* 2*sizeof(tcp_seq) */
#define	TCPOPT_TIMESTAMP	8
#define	   TCPOLEN_TIMESTAMP		10
#define	   TCPOLEN_TSTAMP_APPA		(TCPOLEN_TIMESTAMP+2) /* appendix A */
#define	TCPOPT_SIGNATURE	19		/* Keyed MD5: RFC 2385 */
#define	   TCPOLEN_SIGNATURE		18
#define	TCPOPT_FAST_OPEN	34
#define	   TCPOLEN_FAST_OPEN_EMPTY	2

/* Miscellaneous constants */
#define	MAX_SACK_BLKS	6	/* Max # SACK blocks stored at receiver side */
#define	TCP_MAX_SACK	4	/* MAX # SACKs sent in any segment */

/*
 * The default maximum segment size (MSS) to be used for new TCP connections
 * when path MTU discovery is not enabled.
 *
 * RFC879 derives the default MSS from the largest datagram size hosts are
 * minimally required to handle directly or through IP reassembly minus the
 * size of the IP and TCP header.  With IPv6 the minimum MTU is specified
 * in RFC2460.
 *
 * For IPv4 the MSS is 576 - sizeof(struct tcpiphdr)
 * For IPv6 the MSS is IPV6_MMTU - sizeof(struct ip6_hdr) - sizeof(struct tcphdr)
 *
 * We use explicit numerical definition here to avoid header pollution.
 */
#define	TCP_MSS		536
#define	TCP6_MSS	1220

/*
 * Limit the lowest MSS we accept for path MTU discovery and the TCP SYN MSS
 * option.  Allowing low values of MSS can consume significant resources and
 * be used to mount a resource exhaustion attack.
 * Connections requesting lower MSS values will be rounded up to this value
 * and the IP_DF flag will be cleared to allow fragmentation along the path.
 *
 * See tcp_subr.c tcp_minmss SYSCTL declaration for more comments.  Setting
 * it to "0" disables the minmss check.
 *
 * The default value is fine for TCP across the Internet's smallest official
 * link MTU (256 bytes for AX.25 packet radio).  However, a connection is very
 * unlikely to come across such low MTU interfaces these days (anno domini 2003).
 */
#define	TCP_MINMSS 216

#define	TCP_MAXWIN	65535	/* largest value for (unscaled) window */
#define	TTCP_CLIENT_SND_WND	4096	/* dflt send window for T/TCP client */

#define	TCP_MAX_WINSHIFT	14	/* maximum window shift */

#define	TCP_MAXBURST		4	/* maximum segments in a burst */

#define	TCP_MAXHLEN	(0xf<<2)	/* max length of header in bytes */
#define	TCP_MAXOLEN	(TCP_MAXHLEN - sizeof(struct tcphdr))
					/* max space left for options */

#define	TCP_FASTOPEN_MIN_COOKIE_LEN	4	/* Per RFC7413 */
#define	TCP_FASTOPEN_MAX_COOKIE_LEN	16	/* Per RFC7413 */
#define	TCP_FASTOPEN_PSK_LEN		16	/* Same as TCP_FASTOPEN_KEY_LEN */
#endif /* __BSD_VISIBLE */

/*
 * User-settable options (used with setsockopt).  These are discrete
 * values and are not masked together.  Some values appear to be
 * bitmasks for historical reasons.
 */
#define	TCP_NODELAY	1	/* don't delay send to coalesce packets */
#if __BSD_VISIBLE
#define	TCP_MAXSEG	2	/* set maximum segment size */
#define	TCP_NOPUSH	4	/* don't push last block of write */
#define	TCP_NOOPT	8	/* don't use TCP options */
#define	TCP_MD5SIG	16	/* use MD5 digests (RFC2385) */
#define	TCP_INFO	32	/* retrieve tcp_info structure */
#define	TCP_STATS	33	/* retrieve stats blob structure */
#define	TCP_LOG		34	/* configure event logging for connection */
#define	TCP_LOGBUF	35	/* retrieve event log for connection */
#define	TCP_LOGID	36	/* configure log ID to correlate connections */
#define	TCP_LOGDUMP	37	/* dump connection log events to device */
#define	TCP_LOGDUMPID	38	/* dump events from connections with same ID to
				   device */
#define	TCP_TXTLS_ENABLE 39	/* TLS framing and encryption for transmit */
#define	TCP_TXTLS_MODE	40	/* Transmit TLS mode */
#define	TCP_RXTLS_ENABLE 41	/* TLS framing and encryption for receive */
#define	TCP_RXTLS_MODE	42	/* Receive TLS mode */
#define	TCP_CONGESTION	64	/* get/set congestion control algorithm */
#define	TCP_CCALGOOPT	65	/* get/set cc algorithm specific options */
#define	TCP_DELACK	72	/* socket option for delayed ack */
#define	TCP_FIN_IS_RST	73	/* A fin from the peer is treated as a RST */
#define	TCP_LOG_LIMIT	74	/* Limit to number of records in tcp-log */
#define	TCP_SHARED_CWND_ALLOWED 75	/* Use of a shared cwnd is allowed */
#define	TCP_KEEPINIT	128	/* N, time to establish connection */
#define	TCP_KEEPIDLE	256	/* L,N,X start keepalives after this period */
#define	TCP_KEEPINTVL	512	/* L,N interval between keepalives */
#define	TCP_KEEPCNT	1024	/* L,N number of keepalives before close */
#define	TCP_FASTOPEN	1025	/* enable TFO / was created via TFO */
#define	TCP_PCAP_OUT	2048	/* number of output packets to keep */
#define	TCP_PCAP_IN	4096	/* number of input packets to keep */
#define	TCP_FUNCTION_BLK 8192	/* Set the tcp function pointers to the specified stack */
/* Options for Rack and BBR */
#define	TCP_REUSPORT_LB_NUMA	1026	/* set listen socket numa domain */
#define	TCP_RACK_MBUF_QUEUE	1050	/* Do we allow mbuf queuing if supported */
#define	TCP_RACK_PROP		1051	/* RACK proportional rate reduction (bool) */
#define	TCP_RACK_TLP_REDUCE	1052	/* RACK TLP cwnd reduction (bool) */
#define	TCP_RACK_PACE_REDUCE	1053	/* RACK Pacing reduction factor (divisor) */
#define	TCP_RACK_PACE_MAX_SEG	1054	/* Max TSO size we will send */
#define	TCP_RACK_PACE_ALWAYS	1055	/* Use the always pace method */
#define	TCP_RACK_PROP_RATE	1056	/* The proportional reduction rate */
#define	TCP_RACK_PRR_SENDALOT	1057	/* Allow PRR to send more than one seg */
#define	TCP_RACK_MIN_TO		1058	/* Minimum time between rack t-o's in ms */
#define	TCP_RACK_EARLY_RECOV	1059	/* Should recovery happen early (bool) */
#define	TCP_RACK_EARLY_SEG	1060	/* If early recovery max segments */
#define	TCP_RACK_REORD_THRESH	1061	/* RACK reorder threshold (shift amount) */
#define	TCP_RACK_REORD_FADE	1062	/* Does reordering fade after ms time */
#define	TCP_RACK_TLP_THRESH	1063	/* RACK TLP threshold i.e. srtt+(srtt/N) */
#define	TCP_RACK_PKT_DELAY	1064	/* RACK added ms i.e. rack-rtt + reord + N */
#define	TCP_RACK_TLP_INC_VAR	1065	/* Does TLP include rtt variance in t-o */
#define	TCP_BBR_IWINTSO		1067	/* Initial TSO window for BBRs first sends */
#define	TCP_BBR_RECFORCE	1068	/* Enter recovery force out a segment disregard pacer no longer valid */
#define	TCP_BBR_STARTUP_PG	1069	/* Startup pacing gain */
#define	TCP_BBR_DRAIN_PG	1070	/* Drain pacing gain */
#define	TCP_BBR_RWND_IS_APP	1071	/* Rwnd limited is considered app limited */
#define	TCP_BBR_PROBE_RTT_INT	1072	/* How long in useconds between probe-rtt */
#define	TCP_BBR_ONE_RETRAN	1073	/* Is only one segment allowed out during retran */
#define	TCP_BBR_STARTUP_LOSS_EXIT 1074	/* Do we exit a loss during startup if not 20% incr */
#define	TCP_BBR_USE_LOWGAIN	1075	/* lower the gain in PROBE_BW enable */
#define	TCP_BBR_LOWGAIN_THRESH	1076	/* Unused after 2.3 morphs to TSLIMITS >= 2.3 */
#define	TCP_BBR_TSLIMITS	1076	/* Do we use experimental Timestamp limiting for our algo */
#define	TCP_BBR_LOWGAIN_HALF	1077	/* Unused after 2.3 */
#define	TCP_BBR_PACE_OH		1077	/* Reused in 4.2 for pacing overhead setting */
#define	TCP_BBR_LOWGAIN_FD	1078	/* Unused after 2.3 */
#define	TCP_BBR_HOLD_TARGET	1078	/* For 4.3 on */
#define	TCP_BBR_USEDEL_RATE	1079	/* Enable use of delivery rate for loss recovery */
#define	TCP_BBR_MIN_RTO		1080	/* Min RTO in milliseconds */
#define	TCP_BBR_MAX_RTO		1081	/* Max RTO in milliseconds */
#define	TCP_BBR_REC_OVER_HPTS	1082	/* Recovery override hpts settings 0/1/3 */
#define	TCP_BBR_UNLIMITED	1083	/* Not used before 2.3 and morphs to algorithm >= 2.3 */
#define	TCP_BBR_ALGORITHM	1083	/* What measurement algo does BBR use netflix=0, google=1 */
#define	TCP_BBR_DRAIN_INC_EXTRA	1084	/* Does the 3/4 drain target include the extra gain */
#define	TCP_BBR_STARTUP_EXIT_EPOCH 1085	/* what epoch gets us out of startup */
#define	TCP_BBR_PACE_PER_SEC	1086
#define	TCP_BBR_PACE_DEL_TAR	1087
#define	TCP_BBR_PACE_SEG_MAX	1088
#define	TCP_BBR_PACE_SEG_MIN	1089
#define	TCP_BBR_PACE_CROSS	1090
#define	TCP_RACK_IDLE_REDUCE_HIGH 1092	/* Reduce the highest cwnd seen to IW on idle */
#define	TCP_RACK_MIN_PACE	1093	/* Do we enforce rack min pace time */
#define	TCP_RACK_MIN_PACE_SEG	1094	/* If so what is the seg threshold */
#define	TCP_RACK_GP_INCREASE	1094	/* After 4.1 it's the GP increase in older rack */
#define	TCP_RACK_TLP_USE	1095
#define	TCP_BBR_ACK_COMP_ALG	1096	/* Not used */
#define	TCP_BBR_TMR_PACE_OH	1096	/* Recycled in 4.2 */
#define	TCP_BBR_EXTRA_GAIN	1097
#define	TCP_RACK_DO_DETECTION	1097	/* Recycle of extra gain for rack, attack detection */
#define	TCP_BBR_RACK_RTT_USE	1098	/* what RTT should we use 0, 1, or 2? */
#define	TCP_BBR_RETRAN_WTSO	1099
#define	TCP_DATA_AFTER_CLOSE	1100
#define	TCP_BBR_PROBE_RTT_GAIN	1101
#define	TCP_BBR_PROBE_RTT_LEN	1102
#define	TCP_BBR_SEND_IWND_IN_TSO 1103	/* Do we burst out whole iwin size chunks at start? */
#define	TCP_BBR_USE_RACK_RR	1104	/* Do we use the rack rapid recovery for pacing rxt's */
#define	TCP_BBR_USE_RACK_CHEAT	TCP_BBR_USE_RACK_RR /* Compat. */
#define	TCP_BBR_HDWR_PACE	1105	/* Enable/disable hardware pacing */
#define	TCP_BBR_UTTER_MAX_TSO	1106	/* Do we enforce an utter max TSO size */
#define	TCP_BBR_EXTRA_STATE	1107	/* Special exit-persist catch up */
#define	TCP_BBR_FLOOR_MIN_TSO	1108	/* The min tso size */
#define	TCP_BBR_MIN_TOPACEOUT	1109	/* Do we suspend pacing until */
#define	TCP_BBR_TSTMP_RAISES	1110	/* Can a timestamp measurement raise the b/w */
#define	TCP_BBR_POLICER_DETECT	1111	/* Turn on/off google mode policer detection */
#define	TCP_BBR_RACK_INIT_RATE	1112	/* Set an initial pacing rate for when we have no b/w in kbits per sec */
#define	TCP_RACK_RR_CONF	1113	/* Rack rapid recovery configuration control */
#define	TCP_RACK_CHEAT_NOT_CONF_RATE TCP_RACK_RR_CONF
#define	TCP_RACK_GP_INCREASE_CA	1114	/* GP increase for Congestion Avoidance */
#define	TCP_RACK_GP_INCREASE_SS	1115	/* GP increase for Slow Start */
#define	TCP_RACK_GP_INCREASE_REC 1116	/* GP increase for Recovery */
#define	TCP_RACK_FORCE_MSEG	1117	/* Override to use the user set max-seg value */
#define	TCP_RACK_PACE_RATE_CA	1118	/* Pacing rate for Congestion Avoidance */
#define	TCP_RACK_PACE_RATE_SS	1119	/* Pacing rate for Slow Start */
#define	TCP_RACK_PACE_RATE_REC	1120	/* Pacing rate for Recovery */
#define	TCP_NO_PRR		1122	/* If pacing, don't use prr */
#define	TCP_RACK_NONRXT_CFG_RATE 1123	/* In recovery does a non-rxt use the cfg rate */
#define	TCP_SHARED_CWND_ENABLE	1124	/* Use a shared cwnd if allowed */
#define	TCP_TIMELY_DYN_ADJ	1125	/* Do we attempt dynamic multiplier adjustment with timely. */
#define	TCP_RACK_NO_PUSH_AT_MAX	1126	/* For timely do not push if we are over max rtt */
#define	TCP_RACK_PACE_TO_FILL	1127	/* If we are not in recovery, always pace to fill the cwnd in 1 RTT */
#define	TCP_SHARED_CWND_TIME_LIMIT 1128	/* we should limit to low time values the scwnd life */
#define	TCP_RACK_PROFILE	1129	/* Select a profile that sets multiple options */

/* Start of reserved space for third-party user-settable options. */
#define	TCP_VENDOR	SO_VENDOR

#define	TCP_CA_NAME_MAX	16	/* max congestion control name length */

#define	TCPI_OPT_TIMESTAMPS	0x01
#define	TCPI_OPT_SACK		0x02
#define	TCPI_OPT_WSCALE		0x04
#define	TCPI_OPT_ECN		0x08
#define	TCPI_OPT_TOE		0x10

/* Maximum length of log ID. */
#define	TCP_LOG_ID_LEN	64

/*
 * The TCP_INFO socket option comes from the Linux 2.6 TCP API, and permits
 * the caller to query certain information about the state of a TCP
 * connection.  We provide an overlapping set of fields with the Linux
 * implementation, but since this is a fixed size structure, room has been
 * left for growth.  In order to maximize potential future compatibility with
 * the Linux API, the same variable names and order have been adopted, and
 * padding left to make room for omitted fields in case they are added later.
 *
 * XXX: This is currently an unstable ABI/API, in that it is expected to
 * change.
 */
struct tcp_info {
	u_int8_t	tcpi_state;		/* TCP FSM state. */
	u_int8_t	__tcpi_ca_state;
	u_int8_t	__tcpi_retransmits;
	u_int8_t	__tcpi_probes;
	u_int8_t	__tcpi_backoff;
	u_int8_t	tcpi_options;		/* Options enabled on conn. */
	u_int8_t	tcpi_snd_wscale:4,	/* RFC1323 send shift value. */
			tcpi_rcv_wscale:4;	/* RFC1323 recv shift value. */

	u_int32_t	tcpi_rto;		/* Retransmission timeout (usec). */
	u_int32_t	__tcpi_ato;
	u_int32_t	tcpi_snd_mss;		/* Max segment size for send. */
	u_int32_t	tcpi_rcv_mss;		/* Max segment size for receive. */

	u_int32_t	__tcpi_unacked;
	u_int32_t	__tcpi_sacked;
	u_int32_t	__tcpi_lost;
	u_int32_t	__tcpi_retrans;
	u_int32_t	__tcpi_fackets;

	/* Times; measurements in usecs. */
	u_int32_t	__tcpi_last_data_sent;
	u_int32_t	__tcpi_last_ack_sent;	/* Also unimpl. on Linux? */
	u_int32_t	tcpi_last_data_recv;	/* Time since last recv data. */
	u_int32_t	__tcpi_last_ack_recv;

	/* Metrics; variable units. */
	u_int32_t	__tcpi_pmtu;
	u_int32_t	__tcpi_rcv_ssthresh;
	u_int32_t	tcpi_rtt;		/* Smoothed RTT in usecs. */
	u_int32_t	tcpi_rttvar;		/* RTT variance in usecs. */
	u_int32_t	tcpi_snd_ssthresh;	/* Slow start threshold. */
	u_int32_t	tcpi_snd_cwnd;		/* Send congestion window. */
	u_int32_t	__tcpi_advmss;
	u_int32_t	__tcpi_reordering;

	u_int32_t	__tcpi_rcv_rtt;
	u_int32_t	tcpi_rcv_space;		/* Advertised recv window. */

	/* FreeBSD extensions to tcp_info. */
	u_int32_t	tcpi_snd_wnd;		/* Advertised send window. */
	u_int32_t	tcpi_snd_bwnd;		/* No longer used. */
	u_int32_t	tcpi_snd_nxt;		/* Next egress seqno */
	u_int32_t	tcpi_rcv_nxt;		/* Next ingress seqno */
	u_int32_t	tcpi_toe_tid;		/* HWTID for TOE endpoints */
	u_int32_t	tcpi_snd_rexmitpack;	/* Retransmitted packets */
	u_int32_t	tcpi_rcv_ooopack;	/* Out-of-order packets */
	u_int32_t	tcpi_snd_zerowin;	/* Zero-sized windows sent */

	/* Padding to grow without breaking ABI. */
	u_int32_t	__tcpi_pad[26];		/* Padding. */
};

/*
 * If this structure is provided when setting the TCP_FASTOPEN socket
 * option, and the enable member is non-zero, a subsequent connect will use
 * pre-shared key (PSK) mode using the provided key.
 */
struct tcp_fastopen {
	int enable;
	uint8_t psk[TCP_FASTOPEN_PSK_LEN];
};
#endif /* __BSD_VISIBLE */
#define	TCP_FUNCTION_NAME_LEN_MAX 32

struct tcp_function_set {
	char function_set_name[TCP_FUNCTION_NAME_LEN_MAX];
	uint32_t pcbcnt;
};

/* TLS modes for TCP_TXTLS_MODE */
#define	TCP_TLS_MODE_NONE	0
#define	TCP_TLS_MODE_SW		1
#define	TCP_TLS_MODE_IFNET	2
#define	TCP_TLS_MODE_TOE	3

/*
 * TCP Control message types
 */
#define	TLS_SET_RECORD_TYPE	1
#define	TLS_GET_RECORD		2

/*
 * TCP specific variables of interest for tp->t_stats stats(9) accounting.
 */
#define	VOI_TCP_TXPB		0 /* Transmit payload bytes */
#define	VOI_TCP_RETXPB		1 /* Retransmit payload bytes */
#define	VOI_TCP_FRWIN		2 /* Foreign receive window */
#define	VOI_TCP_LCWIN		3 /* Local congestion window */
#define	VOI_TCP_RTT		4 /* Round trip time */
#define	VOI_TCP_CSIG		5 /* Congestion signal */
#define	VOI_TCP_GPUT		6 /* Goodput */
#define	VOI_TCP_CALCFRWINDIFF	7 /* Congestion avoidance LCWIN - FRWIN */
#define	VOI_TCP_GPUT_ND		8 /* Goodput normalised delta */
#define	VOI_TCP_ACKLEN		9 /* Average ACKed bytes per ACK */

#define	TCP_REUSPORT_LB_NUMA_NODOM	(-2) /* remove numa binding */
#define	TCP_REUSPORT_LB_NUMA_CURDOM	(-1) /* bind to current domain */

#endif /* !_NETINET_TCP_H_ */