1a9643ea8Slogwang /*
2*22ce4affSfengbojiang * SPDX-License-Identifier: BSD-3-Clause
3*22ce4affSfengbojiang *
4a9643ea8Slogwang * Copyright (c) 1982, 1986, 1988, 1993
5a9643ea8Slogwang * The Regents of the University of California.
6a9643ea8Slogwang * Copyright (c) 2005 Andre Oppermann, Internet Business Solutions AG.
7a9643ea8Slogwang * All rights reserved.
8a9643ea8Slogwang *
9a9643ea8Slogwang * Redistribution and use in source and binary forms, with or without
10a9643ea8Slogwang * modification, are permitted provided that the following conditions
11a9643ea8Slogwang * are met:
12a9643ea8Slogwang * 1. Redistributions of source code must retain the above copyright
13a9643ea8Slogwang * notice, this list of conditions and the following disclaimer.
14a9643ea8Slogwang * 2. Redistributions in binary form must reproduce the above copyright
15a9643ea8Slogwang * notice, this list of conditions and the following disclaimer in the
16a9643ea8Slogwang * documentation and/or other materials provided with the distribution.
17*22ce4affSfengbojiang * 3. Neither the name of the University nor the names of its contributors
18a9643ea8Slogwang * may be used to endorse or promote products derived from this software
19a9643ea8Slogwang * without specific prior written permission.
20a9643ea8Slogwang *
21a9643ea8Slogwang * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
22a9643ea8Slogwang * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
23a9643ea8Slogwang * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
24a9643ea8Slogwang * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
25a9643ea8Slogwang * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
26a9643ea8Slogwang * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
27a9643ea8Slogwang * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
28a9643ea8Slogwang * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
29a9643ea8Slogwang * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
30a9643ea8Slogwang * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
31a9643ea8Slogwang * SUCH DAMAGE.
32a9643ea8Slogwang */
33a9643ea8Slogwang
34a9643ea8Slogwang #include <sys/cdefs.h>
35a9643ea8Slogwang __FBSDID("$FreeBSD$");
36a9643ea8Slogwang
37a9643ea8Slogwang #include "opt_ipstealth.h"
38a9643ea8Slogwang
39a9643ea8Slogwang #include <sys/param.h>
40a9643ea8Slogwang #include <sys/systm.h>
41a9643ea8Slogwang #include <sys/mbuf.h>
42a9643ea8Slogwang #include <sys/domain.h>
43a9643ea8Slogwang #include <sys/protosw.h>
44a9643ea8Slogwang #include <sys/socket.h>
45a9643ea8Slogwang #include <sys/time.h>
46a9643ea8Slogwang #include <sys/kernel.h>
47a9643ea8Slogwang #include <sys/syslog.h>
48a9643ea8Slogwang #include <sys/sysctl.h>
49a9643ea8Slogwang
50a9643ea8Slogwang #include <net/if.h>
51a9643ea8Slogwang #include <net/if_types.h>
52a9643ea8Slogwang #include <net/if_var.h>
53a9643ea8Slogwang #include <net/if_dl.h>
54a9643ea8Slogwang #include <net/route.h>
55*22ce4affSfengbojiang #include <net/route/nhop.h>
56a9643ea8Slogwang #include <net/netisr.h>
57a9643ea8Slogwang #include <net/vnet.h>
58a9643ea8Slogwang
59a9643ea8Slogwang #include <netinet/in.h>
60a9643ea8Slogwang #include <netinet/in_fib.h>
61a9643ea8Slogwang #include <netinet/in_systm.h>
62a9643ea8Slogwang #include <netinet/in_var.h>
63a9643ea8Slogwang #include <netinet/ip.h>
64a9643ea8Slogwang #include <netinet/in_pcb.h>
65a9643ea8Slogwang #include <netinet/ip_var.h>
66a9643ea8Slogwang #include <netinet/ip_options.h>
67a9643ea8Slogwang #include <netinet/ip_icmp.h>
68a9643ea8Slogwang #include <machine/in_cksum.h>
69a9643ea8Slogwang
70a9643ea8Slogwang #include <sys/socketvar.h>
71a9643ea8Slogwang
72*22ce4affSfengbojiang VNET_DEFINE_STATIC(int, ip_dosourceroute);
73a9643ea8Slogwang SYSCTL_INT(_net_inet_ip, IPCTL_SOURCEROUTE, sourceroute,
74a9643ea8Slogwang CTLFLAG_VNET | CTLFLAG_RW, &VNET_NAME(ip_dosourceroute), 0,
75a9643ea8Slogwang "Enable forwarding source routed IP packets");
76a9643ea8Slogwang #define V_ip_dosourceroute VNET(ip_dosourceroute)
77a9643ea8Slogwang
78*22ce4affSfengbojiang VNET_DEFINE_STATIC(int, ip_acceptsourceroute);
79a9643ea8Slogwang SYSCTL_INT(_net_inet_ip, IPCTL_ACCEPTSOURCEROUTE, accept_sourceroute,
80a9643ea8Slogwang CTLFLAG_VNET | CTLFLAG_RW, &VNET_NAME(ip_acceptsourceroute), 0,
81a9643ea8Slogwang "Enable accepting source routed IP packets");
82a9643ea8Slogwang #define V_ip_acceptsourceroute VNET(ip_acceptsourceroute)
83a9643ea8Slogwang
84a9643ea8Slogwang VNET_DEFINE(int, ip_doopts) = 1; /* 0 = ignore, 1 = process, 2 = reject */
85a9643ea8Slogwang SYSCTL_INT(_net_inet_ip, OID_AUTO, process_options, CTLFLAG_VNET | CTLFLAG_RW,
86a9643ea8Slogwang &VNET_NAME(ip_doopts), 0, "Enable IP options processing ([LS]SRR, RR, TS)");
87a9643ea8Slogwang
88a9643ea8Slogwang static void save_rte(struct mbuf *m, u_char *, struct in_addr);
89a9643ea8Slogwang
90a9643ea8Slogwang /*
91a9643ea8Slogwang * Do option processing on a datagram, possibly discarding it if bad options
92a9643ea8Slogwang * are encountered, or forwarding it if source-routed.
93a9643ea8Slogwang *
94a9643ea8Slogwang * The pass argument is used when operating in the IPSTEALTH mode to tell
95a9643ea8Slogwang * what options to process: [LS]SRR (pass 0) or the others (pass 1). The
96a9643ea8Slogwang * reason for as many as two passes is that when doing IPSTEALTH, non-routing
97a9643ea8Slogwang * options should be processed only if the packet is for us.
98a9643ea8Slogwang *
99a9643ea8Slogwang * Returns 1 if packet has been forwarded/freed, 0 if the packet should be
100a9643ea8Slogwang * processed further.
101a9643ea8Slogwang */
102a9643ea8Slogwang int
ip_dooptions(struct mbuf * m,int pass)103a9643ea8Slogwang ip_dooptions(struct mbuf *m, int pass)
104a9643ea8Slogwang {
105a9643ea8Slogwang struct ip *ip = mtod(m, struct ip *);
106a9643ea8Slogwang u_char *cp;
107a9643ea8Slogwang struct in_ifaddr *ia;
108a9643ea8Slogwang int opt, optlen, cnt, off, code, type = ICMP_PARAMPROB, forward = 0;
109a9643ea8Slogwang struct in_addr *sin, dst;
110a9643ea8Slogwang uint32_t ntime;
111*22ce4affSfengbojiang struct nhop_object *nh;
112a9643ea8Slogwang struct sockaddr_in ipaddr = { sizeof(ipaddr), AF_INET };
113a9643ea8Slogwang
114*22ce4affSfengbojiang NET_EPOCH_ASSERT();
115*22ce4affSfengbojiang
116a9643ea8Slogwang /* Ignore or reject packets with IP options. */
117a9643ea8Slogwang if (V_ip_doopts == 0)
118a9643ea8Slogwang return 0;
119a9643ea8Slogwang else if (V_ip_doopts == 2) {
120a9643ea8Slogwang type = ICMP_UNREACH;
121a9643ea8Slogwang code = ICMP_UNREACH_FILTER_PROHIB;
122a9643ea8Slogwang goto bad;
123a9643ea8Slogwang }
124a9643ea8Slogwang
125a9643ea8Slogwang dst = ip->ip_dst;
126a9643ea8Slogwang cp = (u_char *)(ip + 1);
127a9643ea8Slogwang cnt = (ip->ip_hl << 2) - sizeof (struct ip);
128a9643ea8Slogwang for (; cnt > 0; cnt -= optlen, cp += optlen) {
129a9643ea8Slogwang opt = cp[IPOPT_OPTVAL];
130a9643ea8Slogwang if (opt == IPOPT_EOL)
131a9643ea8Slogwang break;
132a9643ea8Slogwang if (opt == IPOPT_NOP)
133a9643ea8Slogwang optlen = 1;
134a9643ea8Slogwang else {
135a9643ea8Slogwang if (cnt < IPOPT_OLEN + sizeof(*cp)) {
136a9643ea8Slogwang code = &cp[IPOPT_OLEN] - (u_char *)ip;
137a9643ea8Slogwang goto bad;
138a9643ea8Slogwang }
139a9643ea8Slogwang optlen = cp[IPOPT_OLEN];
140a9643ea8Slogwang if (optlen < IPOPT_OLEN + sizeof(*cp) || optlen > cnt) {
141a9643ea8Slogwang code = &cp[IPOPT_OLEN] - (u_char *)ip;
142a9643ea8Slogwang goto bad;
143a9643ea8Slogwang }
144a9643ea8Slogwang }
145a9643ea8Slogwang switch (opt) {
146a9643ea8Slogwang default:
147a9643ea8Slogwang break;
148a9643ea8Slogwang
149a9643ea8Slogwang /*
150a9643ea8Slogwang * Source routing with record. Find interface with current
151a9643ea8Slogwang * destination address. If none on this machine then drop if
152a9643ea8Slogwang * strictly routed, or do nothing if loosely routed. Record
153a9643ea8Slogwang * interface address and bring up next address component. If
154a9643ea8Slogwang * strictly routed make sure next address is on directly
155a9643ea8Slogwang * accessible net.
156a9643ea8Slogwang */
157a9643ea8Slogwang case IPOPT_LSRR:
158a9643ea8Slogwang case IPOPT_SSRR:
159a9643ea8Slogwang #ifdef IPSTEALTH
160a9643ea8Slogwang if (V_ipstealth && pass > 0)
161a9643ea8Slogwang break;
162a9643ea8Slogwang #endif
163a9643ea8Slogwang if (optlen < IPOPT_OFFSET + sizeof(*cp)) {
164a9643ea8Slogwang code = &cp[IPOPT_OLEN] - (u_char *)ip;
165a9643ea8Slogwang goto bad;
166a9643ea8Slogwang }
167a9643ea8Slogwang if ((off = cp[IPOPT_OFFSET]) < IPOPT_MINOFF) {
168a9643ea8Slogwang code = &cp[IPOPT_OFFSET] - (u_char *)ip;
169a9643ea8Slogwang goto bad;
170a9643ea8Slogwang }
171a9643ea8Slogwang ipaddr.sin_addr = ip->ip_dst;
172a9643ea8Slogwang if (ifa_ifwithaddr_check((struct sockaddr *)&ipaddr)
173a9643ea8Slogwang == 0) {
174a9643ea8Slogwang if (opt == IPOPT_SSRR) {
175a9643ea8Slogwang type = ICMP_UNREACH;
176a9643ea8Slogwang code = ICMP_UNREACH_SRCFAIL;
177a9643ea8Slogwang goto bad;
178a9643ea8Slogwang }
179a9643ea8Slogwang if (!V_ip_dosourceroute)
180a9643ea8Slogwang goto nosourcerouting;
181a9643ea8Slogwang /*
182a9643ea8Slogwang * Loose routing, and not at next destination
183a9643ea8Slogwang * yet; nothing to do except forward.
184a9643ea8Slogwang */
185a9643ea8Slogwang break;
186a9643ea8Slogwang }
187a9643ea8Slogwang off--; /* 0 origin */
188a9643ea8Slogwang if (off > optlen - (int)sizeof(struct in_addr)) {
189a9643ea8Slogwang /*
190a9643ea8Slogwang * End of source route. Should be for us.
191a9643ea8Slogwang */
192a9643ea8Slogwang if (!V_ip_acceptsourceroute)
193a9643ea8Slogwang goto nosourcerouting;
194a9643ea8Slogwang save_rte(m, cp, ip->ip_src);
195a9643ea8Slogwang break;
196a9643ea8Slogwang }
197a9643ea8Slogwang #ifdef IPSTEALTH
198a9643ea8Slogwang if (V_ipstealth)
199a9643ea8Slogwang goto dropit;
200a9643ea8Slogwang #endif
201a9643ea8Slogwang if (!V_ip_dosourceroute) {
202a9643ea8Slogwang if (V_ipforwarding) {
203*22ce4affSfengbojiang char srcbuf[INET_ADDRSTRLEN];
204*22ce4affSfengbojiang char dstbuf[INET_ADDRSTRLEN];
205*22ce4affSfengbojiang
206a9643ea8Slogwang /*
207a9643ea8Slogwang * Acting as a router, so generate
208a9643ea8Slogwang * ICMP
209a9643ea8Slogwang */
210a9643ea8Slogwang nosourcerouting:
211a9643ea8Slogwang log(LOG_WARNING,
212*22ce4affSfengbojiang "attempted source route from %s "
213*22ce4affSfengbojiang "to %s\n",
214*22ce4affSfengbojiang inet_ntoa_r(ip->ip_src, srcbuf),
215*22ce4affSfengbojiang inet_ntoa_r(ip->ip_dst, dstbuf));
216a9643ea8Slogwang type = ICMP_UNREACH;
217a9643ea8Slogwang code = ICMP_UNREACH_SRCFAIL;
218a9643ea8Slogwang goto bad;
219a9643ea8Slogwang } else {
220a9643ea8Slogwang /*
221a9643ea8Slogwang * Not acting as a router, so
222a9643ea8Slogwang * silently drop.
223a9643ea8Slogwang */
224a9643ea8Slogwang #ifdef IPSTEALTH
225a9643ea8Slogwang dropit:
226a9643ea8Slogwang #endif
227a9643ea8Slogwang IPSTAT_INC(ips_cantforward);
228a9643ea8Slogwang m_freem(m);
229a9643ea8Slogwang return (1);
230a9643ea8Slogwang }
231a9643ea8Slogwang }
232a9643ea8Slogwang
233a9643ea8Slogwang /*
234a9643ea8Slogwang * locate outgoing interface
235a9643ea8Slogwang */
236a9643ea8Slogwang (void)memcpy(&ipaddr.sin_addr, cp + off,
237a9643ea8Slogwang sizeof(ipaddr.sin_addr));
238a9643ea8Slogwang
239a9643ea8Slogwang type = ICMP_UNREACH;
240a9643ea8Slogwang code = ICMP_UNREACH_SRCFAIL;
241a9643ea8Slogwang
242a9643ea8Slogwang if (opt == IPOPT_SSRR) {
243a9643ea8Slogwang #define INA struct in_ifaddr *
244a9643ea8Slogwang #define SA struct sockaddr *
245a9643ea8Slogwang ia = (INA)ifa_ifwithdstaddr((SA)&ipaddr,
246a9643ea8Slogwang RT_ALL_FIBS);
247a9643ea8Slogwang if (ia == NULL)
248a9643ea8Slogwang ia = (INA)ifa_ifwithnet((SA)&ipaddr, 0,
249a9643ea8Slogwang RT_ALL_FIBS);
250a9643ea8Slogwang if (ia == NULL)
251a9643ea8Slogwang goto bad;
252a9643ea8Slogwang
253a9643ea8Slogwang memcpy(cp + off, &(IA_SIN(ia)->sin_addr),
254a9643ea8Slogwang sizeof(struct in_addr));
255a9643ea8Slogwang } else {
256a9643ea8Slogwang /* XXX MRT 0 for routing */
257*22ce4affSfengbojiang nh = fib4_lookup(M_GETFIB(m), ipaddr.sin_addr,
258*22ce4affSfengbojiang 0, NHR_NONE, 0);
259*22ce4affSfengbojiang if (nh == NULL)
260a9643ea8Slogwang goto bad;
261a9643ea8Slogwang
262*22ce4affSfengbojiang memcpy(cp + off, &(IA_SIN(nh->nh_ifa)->sin_addr),
263a9643ea8Slogwang sizeof(struct in_addr));
264a9643ea8Slogwang }
265a9643ea8Slogwang
266a9643ea8Slogwang ip->ip_dst = ipaddr.sin_addr;
267a9643ea8Slogwang cp[IPOPT_OFFSET] += sizeof(struct in_addr);
268a9643ea8Slogwang /*
269a9643ea8Slogwang * Let ip_intr's mcast routing check handle mcast pkts
270a9643ea8Slogwang */
271a9643ea8Slogwang forward = !IN_MULTICAST(ntohl(ip->ip_dst.s_addr));
272a9643ea8Slogwang break;
273a9643ea8Slogwang
274a9643ea8Slogwang case IPOPT_RR:
275a9643ea8Slogwang #ifdef IPSTEALTH
276a9643ea8Slogwang if (V_ipstealth && pass == 0)
277a9643ea8Slogwang break;
278a9643ea8Slogwang #endif
279a9643ea8Slogwang if (optlen < IPOPT_OFFSET + sizeof(*cp)) {
280a9643ea8Slogwang code = &cp[IPOPT_OFFSET] - (u_char *)ip;
281a9643ea8Slogwang goto bad;
282a9643ea8Slogwang }
283a9643ea8Slogwang if ((off = cp[IPOPT_OFFSET]) < IPOPT_MINOFF) {
284a9643ea8Slogwang code = &cp[IPOPT_OFFSET] - (u_char *)ip;
285a9643ea8Slogwang goto bad;
286a9643ea8Slogwang }
287a9643ea8Slogwang /*
288a9643ea8Slogwang * If no space remains, ignore.
289a9643ea8Slogwang */
290a9643ea8Slogwang off--; /* 0 origin */
291a9643ea8Slogwang if (off > optlen - (int)sizeof(struct in_addr))
292a9643ea8Slogwang break;
293a9643ea8Slogwang (void)memcpy(&ipaddr.sin_addr, &ip->ip_dst,
294a9643ea8Slogwang sizeof(ipaddr.sin_addr));
295a9643ea8Slogwang /*
296a9643ea8Slogwang * Locate outgoing interface; if we're the
297a9643ea8Slogwang * destination, use the incoming interface (should be
298a9643ea8Slogwang * same).
299a9643ea8Slogwang */
300a9643ea8Slogwang if ((ia = (INA)ifa_ifwithaddr((SA)&ipaddr)) != NULL) {
301a9643ea8Slogwang memcpy(cp + off, &(IA_SIN(ia)->sin_addr),
302a9643ea8Slogwang sizeof(struct in_addr));
303*22ce4affSfengbojiang } else if ((nh = fib4_lookup(M_GETFIB(m),
304*22ce4affSfengbojiang ipaddr.sin_addr, 0, NHR_NONE, 0)) != NULL) {
305*22ce4affSfengbojiang memcpy(cp + off, &(IA_SIN(nh->nh_ifa)->sin_addr),
306a9643ea8Slogwang sizeof(struct in_addr));
307a9643ea8Slogwang } else {
308a9643ea8Slogwang type = ICMP_UNREACH;
309a9643ea8Slogwang code = ICMP_UNREACH_HOST;
310a9643ea8Slogwang goto bad;
311a9643ea8Slogwang }
312a9643ea8Slogwang cp[IPOPT_OFFSET] += sizeof(struct in_addr);
313a9643ea8Slogwang break;
314a9643ea8Slogwang
315a9643ea8Slogwang case IPOPT_TS:
316a9643ea8Slogwang #ifdef IPSTEALTH
317a9643ea8Slogwang if (V_ipstealth && pass == 0)
318a9643ea8Slogwang break;
319a9643ea8Slogwang #endif
320a9643ea8Slogwang code = cp - (u_char *)ip;
321a9643ea8Slogwang if (optlen < 4 || optlen > 40) {
322a9643ea8Slogwang code = &cp[IPOPT_OLEN] - (u_char *)ip;
323a9643ea8Slogwang goto bad;
324a9643ea8Slogwang }
325a9643ea8Slogwang if ((off = cp[IPOPT_OFFSET]) < 5) {
326a9643ea8Slogwang code = &cp[IPOPT_OLEN] - (u_char *)ip;
327a9643ea8Slogwang goto bad;
328a9643ea8Slogwang }
329a9643ea8Slogwang if (off > optlen - (int)sizeof(int32_t)) {
330a9643ea8Slogwang cp[IPOPT_OFFSET + 1] += (1 << 4);
331a9643ea8Slogwang if ((cp[IPOPT_OFFSET + 1] & 0xf0) == 0) {
332a9643ea8Slogwang code = &cp[IPOPT_OFFSET] - (u_char *)ip;
333a9643ea8Slogwang goto bad;
334a9643ea8Slogwang }
335a9643ea8Slogwang break;
336a9643ea8Slogwang }
337a9643ea8Slogwang off--; /* 0 origin */
338a9643ea8Slogwang sin = (struct in_addr *)(cp + off);
339a9643ea8Slogwang switch (cp[IPOPT_OFFSET + 1] & 0x0f) {
340a9643ea8Slogwang case IPOPT_TS_TSONLY:
341a9643ea8Slogwang break;
342a9643ea8Slogwang
343a9643ea8Slogwang case IPOPT_TS_TSANDADDR:
344a9643ea8Slogwang if (off + sizeof(uint32_t) +
345a9643ea8Slogwang sizeof(struct in_addr) > optlen) {
346a9643ea8Slogwang code = &cp[IPOPT_OFFSET] - (u_char *)ip;
347a9643ea8Slogwang goto bad;
348a9643ea8Slogwang }
349a9643ea8Slogwang ipaddr.sin_addr = dst;
350a9643ea8Slogwang ia = (INA)ifaof_ifpforaddr((SA)&ipaddr,
351a9643ea8Slogwang m->m_pkthdr.rcvif);
352a9643ea8Slogwang if (ia == NULL)
353a9643ea8Slogwang continue;
354a9643ea8Slogwang (void)memcpy(sin, &IA_SIN(ia)->sin_addr,
355a9643ea8Slogwang sizeof(struct in_addr));
356a9643ea8Slogwang cp[IPOPT_OFFSET] += sizeof(struct in_addr);
357a9643ea8Slogwang off += sizeof(struct in_addr);
358a9643ea8Slogwang break;
359a9643ea8Slogwang
360a9643ea8Slogwang case IPOPT_TS_PRESPEC:
361a9643ea8Slogwang if (off + sizeof(uint32_t) +
362a9643ea8Slogwang sizeof(struct in_addr) > optlen) {
363a9643ea8Slogwang code = &cp[IPOPT_OFFSET] - (u_char *)ip;
364a9643ea8Slogwang goto bad;
365a9643ea8Slogwang }
366a9643ea8Slogwang (void)memcpy(&ipaddr.sin_addr, sin,
367a9643ea8Slogwang sizeof(struct in_addr));
368a9643ea8Slogwang if (ifa_ifwithaddr_check((SA)&ipaddr) == 0)
369a9643ea8Slogwang continue;
370a9643ea8Slogwang cp[IPOPT_OFFSET] += sizeof(struct in_addr);
371a9643ea8Slogwang off += sizeof(struct in_addr);
372a9643ea8Slogwang break;
373a9643ea8Slogwang
374a9643ea8Slogwang default:
375a9643ea8Slogwang code = &cp[IPOPT_OFFSET + 1] - (u_char *)ip;
376a9643ea8Slogwang goto bad;
377a9643ea8Slogwang }
378a9643ea8Slogwang ntime = iptime();
379a9643ea8Slogwang (void)memcpy(cp + off, &ntime, sizeof(uint32_t));
380a9643ea8Slogwang cp[IPOPT_OFFSET] += sizeof(uint32_t);
381a9643ea8Slogwang }
382a9643ea8Slogwang }
383a9643ea8Slogwang if (forward && V_ipforwarding) {
384a9643ea8Slogwang ip_forward(m, 1);
385a9643ea8Slogwang return (1);
386a9643ea8Slogwang }
387a9643ea8Slogwang return (0);
388a9643ea8Slogwang bad:
389a9643ea8Slogwang icmp_error(m, type, code, 0, 0);
390a9643ea8Slogwang IPSTAT_INC(ips_badoptions);
391a9643ea8Slogwang return (1);
392a9643ea8Slogwang }
393a9643ea8Slogwang
394a9643ea8Slogwang /*
395a9643ea8Slogwang * Save incoming source route for use in replies, to be picked up later by
396a9643ea8Slogwang * ip_srcroute if the receiver is interested.
397a9643ea8Slogwang */
398a9643ea8Slogwang static void
save_rte(struct mbuf * m,u_char * option,struct in_addr dst)399a9643ea8Slogwang save_rte(struct mbuf *m, u_char *option, struct in_addr dst)
400a9643ea8Slogwang {
401a9643ea8Slogwang unsigned olen;
402a9643ea8Slogwang struct ipopt_tag *opts;
403a9643ea8Slogwang
404a9643ea8Slogwang opts = (struct ipopt_tag *)m_tag_get(PACKET_TAG_IPOPTIONS,
405a9643ea8Slogwang sizeof(struct ipopt_tag), M_NOWAIT);
406a9643ea8Slogwang if (opts == NULL)
407a9643ea8Slogwang return;
408a9643ea8Slogwang
409a9643ea8Slogwang olen = option[IPOPT_OLEN];
410a9643ea8Slogwang if (olen > sizeof(opts->ip_srcrt) - (1 + sizeof(dst))) {
411a9643ea8Slogwang m_tag_free((struct m_tag *)opts);
412a9643ea8Slogwang return;
413a9643ea8Slogwang }
414a9643ea8Slogwang bcopy(option, opts->ip_srcrt.srcopt, olen);
415a9643ea8Slogwang opts->ip_nhops = (olen - IPOPT_OFFSET - 1) / sizeof(struct in_addr);
416a9643ea8Slogwang opts->ip_srcrt.dst = dst;
417a9643ea8Slogwang m_tag_prepend(m, (struct m_tag *)opts);
418a9643ea8Slogwang }
419a9643ea8Slogwang
420a9643ea8Slogwang /*
421a9643ea8Slogwang * Retrieve incoming source route for use in replies, in the same form used
422a9643ea8Slogwang * by setsockopt. The first hop is placed before the options, will be
423a9643ea8Slogwang * removed later.
424a9643ea8Slogwang */
425a9643ea8Slogwang struct mbuf *
ip_srcroute(struct mbuf * m0)426a9643ea8Slogwang ip_srcroute(struct mbuf *m0)
427a9643ea8Slogwang {
428a9643ea8Slogwang struct in_addr *p, *q;
429a9643ea8Slogwang struct mbuf *m;
430a9643ea8Slogwang struct ipopt_tag *opts;
431a9643ea8Slogwang
432a9643ea8Slogwang opts = (struct ipopt_tag *)m_tag_find(m0, PACKET_TAG_IPOPTIONS, NULL);
433a9643ea8Slogwang if (opts == NULL)
434a9643ea8Slogwang return (NULL);
435a9643ea8Slogwang
436a9643ea8Slogwang if (opts->ip_nhops == 0)
437a9643ea8Slogwang return (NULL);
438a9643ea8Slogwang m = m_get(M_NOWAIT, MT_DATA);
439a9643ea8Slogwang if (m == NULL)
440a9643ea8Slogwang return (NULL);
441a9643ea8Slogwang
442a9643ea8Slogwang #define OPTSIZ (sizeof(opts->ip_srcrt.nop) + sizeof(opts->ip_srcrt.srcopt))
443a9643ea8Slogwang
444a9643ea8Slogwang /* length is (nhops+1)*sizeof(addr) + sizeof(nop + srcrt header) */
445a9643ea8Slogwang m->m_len = opts->ip_nhops * sizeof(struct in_addr) +
446a9643ea8Slogwang sizeof(struct in_addr) + OPTSIZ;
447a9643ea8Slogwang
448a9643ea8Slogwang /*
449a9643ea8Slogwang * First, save first hop for return route.
450a9643ea8Slogwang */
451a9643ea8Slogwang p = &(opts->ip_srcrt.route[opts->ip_nhops - 1]);
452a9643ea8Slogwang *(mtod(m, struct in_addr *)) = *p--;
453a9643ea8Slogwang
454a9643ea8Slogwang /*
455a9643ea8Slogwang * Copy option fields and padding (nop) to mbuf.
456a9643ea8Slogwang */
457a9643ea8Slogwang opts->ip_srcrt.nop = IPOPT_NOP;
458a9643ea8Slogwang opts->ip_srcrt.srcopt[IPOPT_OFFSET] = IPOPT_MINOFF;
459a9643ea8Slogwang (void)memcpy(mtod(m, caddr_t) + sizeof(struct in_addr),
460a9643ea8Slogwang &(opts->ip_srcrt.nop), OPTSIZ);
461a9643ea8Slogwang q = (struct in_addr *)(mtod(m, caddr_t) +
462a9643ea8Slogwang sizeof(struct in_addr) + OPTSIZ);
463a9643ea8Slogwang #undef OPTSIZ
464a9643ea8Slogwang /*
465a9643ea8Slogwang * Record return path as an IP source route, reversing the path
466a9643ea8Slogwang * (pointers are now aligned).
467a9643ea8Slogwang */
468a9643ea8Slogwang while (p >= opts->ip_srcrt.route) {
469a9643ea8Slogwang *q++ = *p--;
470a9643ea8Slogwang }
471a9643ea8Slogwang /*
472a9643ea8Slogwang * Last hop goes to final destination.
473a9643ea8Slogwang */
474a9643ea8Slogwang *q = opts->ip_srcrt.dst;
475a9643ea8Slogwang m_tag_delete(m0, (struct m_tag *)opts);
476a9643ea8Slogwang return (m);
477a9643ea8Slogwang }
478a9643ea8Slogwang
479a9643ea8Slogwang /*
480a9643ea8Slogwang * Strip out IP options, at higher level protocol in the kernel.
481a9643ea8Slogwang */
482a9643ea8Slogwang void
ip_stripoptions(struct mbuf * m)483a9643ea8Slogwang ip_stripoptions(struct mbuf *m)
484a9643ea8Slogwang {
485a9643ea8Slogwang struct ip *ip = mtod(m, struct ip *);
486a9643ea8Slogwang int olen;
487a9643ea8Slogwang
488a9643ea8Slogwang olen = (ip->ip_hl << 2) - sizeof(struct ip);
489a9643ea8Slogwang m->m_len -= olen;
490a9643ea8Slogwang if (m->m_flags & M_PKTHDR)
491a9643ea8Slogwang m->m_pkthdr.len -= olen;
492a9643ea8Slogwang ip->ip_len = htons(ntohs(ip->ip_len) - olen);
493a9643ea8Slogwang ip->ip_hl = sizeof(struct ip) >> 2;
494a9643ea8Slogwang
495a9643ea8Slogwang bcopy((char *)ip + sizeof(struct ip) + olen, (ip + 1),
496a9643ea8Slogwang (size_t )(m->m_len - sizeof(struct ip)));
497a9643ea8Slogwang }
498a9643ea8Slogwang
499a9643ea8Slogwang /*
500a9643ea8Slogwang * Insert IP options into preformed packet. Adjust IP destination as
501a9643ea8Slogwang * required for IP source routing, as indicated by a non-zero in_addr at the
502a9643ea8Slogwang * start of the options.
503a9643ea8Slogwang *
504a9643ea8Slogwang * XXX This routine assumes that the packet has no options in place.
505a9643ea8Slogwang */
506a9643ea8Slogwang struct mbuf *
ip_insertoptions(struct mbuf * m,struct mbuf * opt,int * phlen)507a9643ea8Slogwang ip_insertoptions(struct mbuf *m, struct mbuf *opt, int *phlen)
508a9643ea8Slogwang {
509a9643ea8Slogwang struct ipoption *p = mtod(opt, struct ipoption *);
510a9643ea8Slogwang struct mbuf *n;
511a9643ea8Slogwang struct ip *ip = mtod(m, struct ip *);
512a9643ea8Slogwang unsigned optlen;
513a9643ea8Slogwang
514a9643ea8Slogwang optlen = opt->m_len - sizeof(p->ipopt_dst);
515a9643ea8Slogwang if (optlen + ntohs(ip->ip_len) > IP_MAXPACKET) {
516a9643ea8Slogwang *phlen = 0;
517a9643ea8Slogwang return (m); /* XXX should fail */
518a9643ea8Slogwang }
519a9643ea8Slogwang if (p->ipopt_dst.s_addr)
520a9643ea8Slogwang ip->ip_dst = p->ipopt_dst;
521a9643ea8Slogwang if (!M_WRITABLE(m) || M_LEADINGSPACE(m) < optlen) {
522a9643ea8Slogwang n = m_gethdr(M_NOWAIT, MT_DATA);
523a9643ea8Slogwang if (n == NULL) {
524a9643ea8Slogwang *phlen = 0;
525a9643ea8Slogwang return (m);
526a9643ea8Slogwang }
527a9643ea8Slogwang m_move_pkthdr(n, m);
528a9643ea8Slogwang n->m_pkthdr.rcvif = NULL;
529a9643ea8Slogwang n->m_pkthdr.len += optlen;
530a9643ea8Slogwang m->m_len -= sizeof(struct ip);
531a9643ea8Slogwang m->m_data += sizeof(struct ip);
532a9643ea8Slogwang n->m_next = m;
533a9643ea8Slogwang m = n;
534a9643ea8Slogwang m->m_len = optlen + sizeof(struct ip);
535a9643ea8Slogwang m->m_data += max_linkhdr;
536a9643ea8Slogwang bcopy(ip, mtod(m, void *), sizeof(struct ip));
537a9643ea8Slogwang } else {
538a9643ea8Slogwang m->m_data -= optlen;
539a9643ea8Slogwang m->m_len += optlen;
540a9643ea8Slogwang m->m_pkthdr.len += optlen;
541a9643ea8Slogwang bcopy(ip, mtod(m, void *), sizeof(struct ip));
542a9643ea8Slogwang }
543a9643ea8Slogwang ip = mtod(m, struct ip *);
544a9643ea8Slogwang bcopy(p->ipopt_list, ip + 1, optlen);
545a9643ea8Slogwang *phlen = sizeof(struct ip) + optlen;
546a9643ea8Slogwang ip->ip_v = IPVERSION;
547a9643ea8Slogwang ip->ip_hl = *phlen >> 2;
548a9643ea8Slogwang ip->ip_len = htons(ntohs(ip->ip_len) + optlen);
549a9643ea8Slogwang return (m);
550a9643ea8Slogwang }
551a9643ea8Slogwang
552a9643ea8Slogwang /*
553a9643ea8Slogwang * Copy options from ip to jp, omitting those not copied during
554a9643ea8Slogwang * fragmentation.
555a9643ea8Slogwang */
556a9643ea8Slogwang int
ip_optcopy(struct ip * ip,struct ip * jp)557a9643ea8Slogwang ip_optcopy(struct ip *ip, struct ip *jp)
558a9643ea8Slogwang {
559a9643ea8Slogwang u_char *cp, *dp;
560a9643ea8Slogwang int opt, optlen, cnt;
561a9643ea8Slogwang
562a9643ea8Slogwang cp = (u_char *)(ip + 1);
563a9643ea8Slogwang dp = (u_char *)(jp + 1);
564a9643ea8Slogwang cnt = (ip->ip_hl << 2) - sizeof (struct ip);
565a9643ea8Slogwang for (; cnt > 0; cnt -= optlen, cp += optlen) {
566a9643ea8Slogwang opt = cp[0];
567a9643ea8Slogwang if (opt == IPOPT_EOL)
568a9643ea8Slogwang break;
569a9643ea8Slogwang if (opt == IPOPT_NOP) {
570a9643ea8Slogwang /* Preserve for IP mcast tunnel's LSRR alignment. */
571a9643ea8Slogwang *dp++ = IPOPT_NOP;
572a9643ea8Slogwang optlen = 1;
573a9643ea8Slogwang continue;
574a9643ea8Slogwang }
575a9643ea8Slogwang
576a9643ea8Slogwang KASSERT(cnt >= IPOPT_OLEN + sizeof(*cp),
577a9643ea8Slogwang ("ip_optcopy: malformed ipv4 option"));
578a9643ea8Slogwang optlen = cp[IPOPT_OLEN];
579a9643ea8Slogwang KASSERT(optlen >= IPOPT_OLEN + sizeof(*cp) && optlen <= cnt,
580a9643ea8Slogwang ("ip_optcopy: malformed ipv4 option"));
581a9643ea8Slogwang
582a9643ea8Slogwang /* Bogus lengths should have been caught by ip_dooptions. */
583a9643ea8Slogwang if (optlen > cnt)
584a9643ea8Slogwang optlen = cnt;
585a9643ea8Slogwang if (IPOPT_COPIED(opt)) {
586a9643ea8Slogwang bcopy(cp, dp, optlen);
587a9643ea8Slogwang dp += optlen;
588a9643ea8Slogwang }
589a9643ea8Slogwang }
590a9643ea8Slogwang for (optlen = dp - (u_char *)(jp+1); optlen & 0x3; optlen++)
591a9643ea8Slogwang *dp++ = IPOPT_EOL;
592a9643ea8Slogwang return (optlen);
593a9643ea8Slogwang }
594a9643ea8Slogwang
595a9643ea8Slogwang /*
596a9643ea8Slogwang * Set up IP options in pcb for insertion in output packets. Store in mbuf
597a9643ea8Slogwang * with pointer in pcbopt, adding pseudo-option with destination address if
598a9643ea8Slogwang * source routed.
599a9643ea8Slogwang */
600a9643ea8Slogwang int
ip_pcbopts(struct inpcb * inp,int optname,struct mbuf * m)601a9643ea8Slogwang ip_pcbopts(struct inpcb *inp, int optname, struct mbuf *m)
602a9643ea8Slogwang {
603a9643ea8Slogwang int cnt, optlen;
604a9643ea8Slogwang u_char *cp;
605a9643ea8Slogwang struct mbuf **pcbopt;
606a9643ea8Slogwang u_char opt;
607a9643ea8Slogwang
608a9643ea8Slogwang INP_WLOCK_ASSERT(inp);
609a9643ea8Slogwang
610a9643ea8Slogwang pcbopt = &inp->inp_options;
611a9643ea8Slogwang
612a9643ea8Slogwang /* turn off any old options */
613a9643ea8Slogwang if (*pcbopt)
614a9643ea8Slogwang (void)m_free(*pcbopt);
615a9643ea8Slogwang *pcbopt = NULL;
616a9643ea8Slogwang if (m == NULL || m->m_len == 0) {
617a9643ea8Slogwang /*
618a9643ea8Slogwang * Only turning off any previous options.
619a9643ea8Slogwang */
620a9643ea8Slogwang if (m != NULL)
621a9643ea8Slogwang (void)m_free(m);
622a9643ea8Slogwang return (0);
623a9643ea8Slogwang }
624a9643ea8Slogwang
625a9643ea8Slogwang if (m->m_len % sizeof(int32_t))
626a9643ea8Slogwang goto bad;
627a9643ea8Slogwang /*
628a9643ea8Slogwang * IP first-hop destination address will be stored before actual
629a9643ea8Slogwang * options; move other options back and clear it when none present.
630a9643ea8Slogwang */
631a9643ea8Slogwang if (m->m_data + m->m_len + sizeof(struct in_addr) >= &m->m_dat[MLEN])
632a9643ea8Slogwang goto bad;
633a9643ea8Slogwang cnt = m->m_len;
634a9643ea8Slogwang m->m_len += sizeof(struct in_addr);
635a9643ea8Slogwang cp = mtod(m, u_char *) + sizeof(struct in_addr);
636a9643ea8Slogwang bcopy(mtod(m, void *), cp, (unsigned)cnt);
637a9643ea8Slogwang bzero(mtod(m, void *), sizeof(struct in_addr));
638a9643ea8Slogwang
639a9643ea8Slogwang for (; cnt > 0; cnt -= optlen, cp += optlen) {
640a9643ea8Slogwang opt = cp[IPOPT_OPTVAL];
641a9643ea8Slogwang if (opt == IPOPT_EOL)
642a9643ea8Slogwang break;
643a9643ea8Slogwang if (opt == IPOPT_NOP)
644a9643ea8Slogwang optlen = 1;
645a9643ea8Slogwang else {
646a9643ea8Slogwang if (cnt < IPOPT_OLEN + sizeof(*cp))
647a9643ea8Slogwang goto bad;
648a9643ea8Slogwang optlen = cp[IPOPT_OLEN];
649a9643ea8Slogwang if (optlen < IPOPT_OLEN + sizeof(*cp) || optlen > cnt)
650a9643ea8Slogwang goto bad;
651a9643ea8Slogwang }
652a9643ea8Slogwang switch (opt) {
653a9643ea8Slogwang default:
654a9643ea8Slogwang break;
655a9643ea8Slogwang
656a9643ea8Slogwang case IPOPT_LSRR:
657a9643ea8Slogwang case IPOPT_SSRR:
658a9643ea8Slogwang /*
659a9643ea8Slogwang * User process specifies route as:
660a9643ea8Slogwang *
661a9643ea8Slogwang * ->A->B->C->D
662a9643ea8Slogwang *
663a9643ea8Slogwang * D must be our final destination (but we can't
664a9643ea8Slogwang * check that since we may not have connected yet).
665a9643ea8Slogwang * A is first hop destination, which doesn't appear
666a9643ea8Slogwang * in actual IP option, but is stored before the
667a9643ea8Slogwang * options.
668a9643ea8Slogwang */
669a9643ea8Slogwang /* XXX-BZ PRIV_NETINET_SETHDROPTS? */
670a9643ea8Slogwang if (optlen < IPOPT_MINOFF - 1 + sizeof(struct in_addr))
671a9643ea8Slogwang goto bad;
672a9643ea8Slogwang m->m_len -= sizeof(struct in_addr);
673a9643ea8Slogwang cnt -= sizeof(struct in_addr);
674a9643ea8Slogwang optlen -= sizeof(struct in_addr);
675a9643ea8Slogwang cp[IPOPT_OLEN] = optlen;
676a9643ea8Slogwang /*
677a9643ea8Slogwang * Move first hop before start of options.
678a9643ea8Slogwang */
679a9643ea8Slogwang bcopy((caddr_t)&cp[IPOPT_OFFSET+1], mtod(m, caddr_t),
680a9643ea8Slogwang sizeof(struct in_addr));
681a9643ea8Slogwang /*
682a9643ea8Slogwang * Then copy rest of options back
683a9643ea8Slogwang * to close up the deleted entry.
684a9643ea8Slogwang */
685a9643ea8Slogwang bcopy((&cp[IPOPT_OFFSET+1] + sizeof(struct in_addr)),
686a9643ea8Slogwang &cp[IPOPT_OFFSET+1],
687a9643ea8Slogwang (unsigned)cnt - (IPOPT_MINOFF - 1));
688a9643ea8Slogwang break;
689a9643ea8Slogwang }
690a9643ea8Slogwang }
691a9643ea8Slogwang if (m->m_len > MAX_IPOPTLEN + sizeof(struct in_addr))
692a9643ea8Slogwang goto bad;
693a9643ea8Slogwang *pcbopt = m;
694a9643ea8Slogwang return (0);
695a9643ea8Slogwang
696a9643ea8Slogwang bad:
697a9643ea8Slogwang (void)m_free(m);
698a9643ea8Slogwang return (EINVAL);
699a9643ea8Slogwang }
700a9643ea8Slogwang
701a9643ea8Slogwang /*
702a9643ea8Slogwang * Check for the presence of the IP Router Alert option [RFC2113]
703a9643ea8Slogwang * in the header of an IPv4 datagram.
704a9643ea8Slogwang *
705a9643ea8Slogwang * This call is not intended for use from the forwarding path; it is here
706a9643ea8Slogwang * so that protocol domains may check for the presence of the option.
707a9643ea8Slogwang * Given how FreeBSD's IPv4 stack is currently structured, the Router Alert
708a9643ea8Slogwang * option does not have much relevance to the implementation, though this
709a9643ea8Slogwang * may change in future.
710a9643ea8Slogwang * Router alert options SHOULD be passed if running in IPSTEALTH mode and
711a9643ea8Slogwang * we are not the endpoint.
712a9643ea8Slogwang * Length checks on individual options should already have been performed
713a9643ea8Slogwang * by ip_dooptions() therefore they are folded under INVARIANTS here.
714a9643ea8Slogwang *
715a9643ea8Slogwang * Return zero if not present or options are invalid, non-zero if present.
716a9643ea8Slogwang */
717a9643ea8Slogwang int
ip_checkrouteralert(struct mbuf * m)718a9643ea8Slogwang ip_checkrouteralert(struct mbuf *m)
719a9643ea8Slogwang {
720a9643ea8Slogwang struct ip *ip = mtod(m, struct ip *);
721a9643ea8Slogwang u_char *cp;
722a9643ea8Slogwang int opt, optlen, cnt, found_ra;
723a9643ea8Slogwang
724a9643ea8Slogwang found_ra = 0;
725a9643ea8Slogwang cp = (u_char *)(ip + 1);
726a9643ea8Slogwang cnt = (ip->ip_hl << 2) - sizeof (struct ip);
727a9643ea8Slogwang for (; cnt > 0; cnt -= optlen, cp += optlen) {
728a9643ea8Slogwang opt = cp[IPOPT_OPTVAL];
729a9643ea8Slogwang if (opt == IPOPT_EOL)
730a9643ea8Slogwang break;
731a9643ea8Slogwang if (opt == IPOPT_NOP)
732a9643ea8Slogwang optlen = 1;
733a9643ea8Slogwang else {
734a9643ea8Slogwang #ifdef INVARIANTS
735a9643ea8Slogwang if (cnt < IPOPT_OLEN + sizeof(*cp))
736a9643ea8Slogwang break;
737a9643ea8Slogwang #endif
738a9643ea8Slogwang optlen = cp[IPOPT_OLEN];
739a9643ea8Slogwang #ifdef INVARIANTS
740a9643ea8Slogwang if (optlen < IPOPT_OLEN + sizeof(*cp) || optlen > cnt)
741a9643ea8Slogwang break;
742a9643ea8Slogwang #endif
743a9643ea8Slogwang }
744a9643ea8Slogwang switch (opt) {
745a9643ea8Slogwang case IPOPT_RA:
746a9643ea8Slogwang #ifdef INVARIANTS
747a9643ea8Slogwang if (optlen != IPOPT_OFFSET + sizeof(uint16_t) ||
748a9643ea8Slogwang (*((uint16_t *)&cp[IPOPT_OFFSET]) != 0))
749a9643ea8Slogwang break;
750a9643ea8Slogwang else
751a9643ea8Slogwang #endif
752a9643ea8Slogwang found_ra = 1;
753a9643ea8Slogwang break;
754a9643ea8Slogwang default:
755a9643ea8Slogwang break;
756a9643ea8Slogwang }
757a9643ea8Slogwang }
758a9643ea8Slogwang
759a9643ea8Slogwang return (found_ra);
760a9643ea8Slogwang }
761