xref: /f-stack/freebsd/net/iflib_clone.c (revision 22ce4aff)
1*22ce4affSfengbojiang /*-
2*22ce4affSfengbojiang  * Copyright (c) 2014-2018, Matthew Macy <[email protected]>
3*22ce4affSfengbojiang  * Copyright (C) 2017-2018 Joyent Inc.
4*22ce4affSfengbojiang  * All rights reserved.
5*22ce4affSfengbojiang  *
6*22ce4affSfengbojiang  * Redistribution and use in source and binary forms, with or without
7*22ce4affSfengbojiang  * modification, are permitted provided that the following conditions are met:
8*22ce4affSfengbojiang  *
9*22ce4affSfengbojiang  *  1. Redistributions of source code must retain the above copyright notice,
10*22ce4affSfengbojiang  *     this list of conditions and the following disclaimer.
11*22ce4affSfengbojiang  *
12*22ce4affSfengbojiang  *  2. Neither the name of Matthew Macy nor the names of its
13*22ce4affSfengbojiang  *     contributors may be used to endorse or promote products derived from
14*22ce4affSfengbojiang  *     this software without specific prior written permission.
15*22ce4affSfengbojiang  *
16*22ce4affSfengbojiang  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
17*22ce4affSfengbojiang  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
18*22ce4affSfengbojiang  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
19*22ce4affSfengbojiang  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
20*22ce4affSfengbojiang  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
21*22ce4affSfengbojiang  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
22*22ce4affSfengbojiang  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
23*22ce4affSfengbojiang  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
24*22ce4affSfengbojiang  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
25*22ce4affSfengbojiang  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
26*22ce4affSfengbojiang  * POSSIBILITY OF SUCH DAMAGE.
27*22ce4affSfengbojiang  */
28*22ce4affSfengbojiang 
29*22ce4affSfengbojiang #include <sys/cdefs.h>
30*22ce4affSfengbojiang __FBSDID("$FreeBSD$");
31*22ce4affSfengbojiang 
32*22ce4affSfengbojiang #include "opt_inet.h"
33*22ce4affSfengbojiang #include "opt_inet6.h"
34*22ce4affSfengbojiang #include "opt_acpi.h"
35*22ce4affSfengbojiang #include "opt_sched.h"
36*22ce4affSfengbojiang 
37*22ce4affSfengbojiang #include <sys/param.h>
38*22ce4affSfengbojiang #include <sys/types.h>
39*22ce4affSfengbojiang #include <sys/bus.h>
40*22ce4affSfengbojiang #include <sys/eventhandler.h>
41*22ce4affSfengbojiang #include <sys/event.h>
42*22ce4affSfengbojiang #include <sys/sockio.h>
43*22ce4affSfengbojiang #include <sys/kernel.h>
44*22ce4affSfengbojiang #include <sys/lock.h>
45*22ce4affSfengbojiang #include <sys/mutex.h>
46*22ce4affSfengbojiang #include <sys/module.h>
47*22ce4affSfengbojiang #include <sys/kobj.h>
48*22ce4affSfengbojiang #include <sys/rman.h>
49*22ce4affSfengbojiang #include <sys/sbuf.h>
50*22ce4affSfengbojiang #include <sys/smp.h>
51*22ce4affSfengbojiang #include <sys/socket.h>
52*22ce4affSfengbojiang #include <sys/sysctl.h>
53*22ce4affSfengbojiang #include <sys/syslog.h>
54*22ce4affSfengbojiang #include <sys/taskqueue.h>
55*22ce4affSfengbojiang #include <sys/limits.h>
56*22ce4affSfengbojiang #include <sys/queue.h>
57*22ce4affSfengbojiang #include <sys/jail.h>
58*22ce4affSfengbojiang #include <sys/md5.h>
59*22ce4affSfengbojiang #include <sys/proc.h>
60*22ce4affSfengbojiang 
61*22ce4affSfengbojiang #include <net/if.h>
62*22ce4affSfengbojiang #include <net/if_var.h>
63*22ce4affSfengbojiang #include <net/if_types.h>
64*22ce4affSfengbojiang #include <net/if_media.h>
65*22ce4affSfengbojiang #include <net/if_clone.h>
66*22ce4affSfengbojiang #include <net/bpf.h>
67*22ce4affSfengbojiang #include <net/ethernet.h>
68*22ce4affSfengbojiang #include <net/vnet.h>
69*22ce4affSfengbojiang 
70*22ce4affSfengbojiang #include <net/iflib.h>
71*22ce4affSfengbojiang #include <net/iflib_private.h>
72*22ce4affSfengbojiang #include "ifdi_if.h"
73*22ce4affSfengbojiang 
74*22ce4affSfengbojiang int
noop_attach(device_t dev)75*22ce4affSfengbojiang noop_attach(device_t dev)
76*22ce4affSfengbojiang {
77*22ce4affSfengbojiang 	return (0);
78*22ce4affSfengbojiang }
79*22ce4affSfengbojiang 
80*22ce4affSfengbojiang int
iflib_pseudo_detach(device_t dev)81*22ce4affSfengbojiang iflib_pseudo_detach(device_t dev)
82*22ce4affSfengbojiang {
83*22ce4affSfengbojiang 	if_ctx_t ctx;
84*22ce4affSfengbojiang 	uint32_t ifc_flags;
85*22ce4affSfengbojiang 
86*22ce4affSfengbojiang 	ctx = device_get_softc(dev);
87*22ce4affSfengbojiang 	ifc_flags = iflib_get_flags(ctx);
88*22ce4affSfengbojiang 	if ((ifc_flags & IFC_INIT_DONE) == 0)
89*22ce4affSfengbojiang 		return (0);
90*22ce4affSfengbojiang 	return (IFDI_DETACH(ctx));
91*22ce4affSfengbojiang }
92*22ce4affSfengbojiang 
93*22ce4affSfengbojiang static device_t iflib_pseudodev;
94*22ce4affSfengbojiang 
95*22ce4affSfengbojiang static struct mtx pseudoif_mtx;
96*22ce4affSfengbojiang MTX_SYSINIT(pseudoif_mtx, &pseudoif_mtx, "pseudoif_mtx", MTX_DEF);
97*22ce4affSfengbojiang 
98*22ce4affSfengbojiang #define PSEUDO_LOCK() mtx_lock(&pseudoif_mtx);
99*22ce4affSfengbojiang #define PSEUDO_UNLOCK() mtx_unlock(&pseudoif_mtx);
100*22ce4affSfengbojiang 
101*22ce4affSfengbojiang struct if_pseudo {
102*22ce4affSfengbojiang 	eventhandler_tag ip_detach_tag;
103*22ce4affSfengbojiang 	eventhandler_tag ip_lladdr_tag;
104*22ce4affSfengbojiang 	struct if_clone *ip_ifc;
105*22ce4affSfengbojiang 	if_shared_ctx_t ip_sctx;
106*22ce4affSfengbojiang 	devclass_t ip_dc;
107*22ce4affSfengbojiang 	LIST_ENTRY(if_pseudo) ip_list;
108*22ce4affSfengbojiang 	int ip_on_list;
109*22ce4affSfengbojiang };
110*22ce4affSfengbojiang 
111*22ce4affSfengbojiang static LIST_HEAD(, if_pseudo) iflib_pseudos = LIST_HEAD_INITIALIZER(iflib_pseudos);
112*22ce4affSfengbojiang 
113*22ce4affSfengbojiang /*
114*22ce4affSfengbojiang  * XXX this assumes that the rest of the
115*22ce4affSfengbojiang  * code won't hang on to it after it's
116*22ce4affSfengbojiang  * removed / unloaded
117*22ce4affSfengbojiang  */
118*22ce4affSfengbojiang static if_pseudo_t
iflib_ip_lookup(const char * name)119*22ce4affSfengbojiang iflib_ip_lookup(const char *name)
120*22ce4affSfengbojiang {
121*22ce4affSfengbojiang 	if_pseudo_t ip = NULL;
122*22ce4affSfengbojiang 
123*22ce4affSfengbojiang 	PSEUDO_LOCK();
124*22ce4affSfengbojiang 	LIST_FOREACH(ip, &iflib_pseudos, ip_list) {
125*22ce4affSfengbojiang 		if (!strcmp(ip->ip_sctx->isc_name, name))
126*22ce4affSfengbojiang 			break;
127*22ce4affSfengbojiang 	}
128*22ce4affSfengbojiang 	PSEUDO_UNLOCK();
129*22ce4affSfengbojiang 	return (ip);
130*22ce4affSfengbojiang }
131*22ce4affSfengbojiang 
132*22ce4affSfengbojiang static void
iflib_ip_delete(if_pseudo_t ip)133*22ce4affSfengbojiang iflib_ip_delete(if_pseudo_t ip)
134*22ce4affSfengbojiang {
135*22ce4affSfengbojiang 	PSEUDO_LOCK();
136*22ce4affSfengbojiang 	if (ip->ip_on_list) {
137*22ce4affSfengbojiang 		LIST_REMOVE(ip, ip_list);
138*22ce4affSfengbojiang 		ip->ip_on_list = 0;
139*22ce4affSfengbojiang 	}
140*22ce4affSfengbojiang 	PSEUDO_UNLOCK();
141*22ce4affSfengbojiang }
142*22ce4affSfengbojiang 
143*22ce4affSfengbojiang static void
iflib_ip_insert(if_pseudo_t ip)144*22ce4affSfengbojiang iflib_ip_insert(if_pseudo_t ip)
145*22ce4affSfengbojiang {
146*22ce4affSfengbojiang 	PSEUDO_LOCK();
147*22ce4affSfengbojiang 	if (!ip->ip_on_list) {
148*22ce4affSfengbojiang 		LIST_INSERT_HEAD(&iflib_pseudos, ip, ip_list);
149*22ce4affSfengbojiang 		ip->ip_on_list = 1;
150*22ce4affSfengbojiang 	}
151*22ce4affSfengbojiang 	PSEUDO_UNLOCK();
152*22ce4affSfengbojiang }
153*22ce4affSfengbojiang 
154*22ce4affSfengbojiang static void
iflib_ifdetach(void * arg __unused,if_t ifp)155*22ce4affSfengbojiang iflib_ifdetach(void *arg __unused, if_t ifp)
156*22ce4affSfengbojiang {
157*22ce4affSfengbojiang 
158*22ce4affSfengbojiang 	/* If the ifnet is just being renamed, don't do anything. */
159*22ce4affSfengbojiang 	if (ifp->if_flags & IFF_RENAMING)
160*22ce4affSfengbojiang 		return;
161*22ce4affSfengbojiang }
162*22ce4affSfengbojiang 
163*22ce4affSfengbojiang static void
iflib_iflladdr(void * arg __unused,if_t ifp __unused)164*22ce4affSfengbojiang iflib_iflladdr(void *arg __unused, if_t ifp __unused)
165*22ce4affSfengbojiang {
166*22ce4affSfengbojiang 
167*22ce4affSfengbojiang }
168*22ce4affSfengbojiang 
169*22ce4affSfengbojiang static int
iflib_clone_create(struct if_clone * ifc,int unit,caddr_t params)170*22ce4affSfengbojiang iflib_clone_create(struct if_clone *ifc, int unit, caddr_t params)
171*22ce4affSfengbojiang {
172*22ce4affSfengbojiang 	const char *name = ifc_name(ifc);
173*22ce4affSfengbojiang 	struct iflib_cloneattach_ctx clctx;
174*22ce4affSfengbojiang 	if_ctx_t ctx;
175*22ce4affSfengbojiang 	if_pseudo_t ip;
176*22ce4affSfengbojiang 	device_t dev;
177*22ce4affSfengbojiang 	int rc;
178*22ce4affSfengbojiang 
179*22ce4affSfengbojiang 	clctx.cc_ifc = ifc;
180*22ce4affSfengbojiang 	clctx.cc_len = 0;
181*22ce4affSfengbojiang 	clctx.cc_params = params;
182*22ce4affSfengbojiang 	clctx.cc_name = name;
183*22ce4affSfengbojiang 
184*22ce4affSfengbojiang 	if (__predict_false(iflib_pseudodev == NULL)) {
185*22ce4affSfengbojiang 		/* SYSINIT initialization would panic !?! */
186*22ce4affSfengbojiang 		mtx_lock(&Giant);
187*22ce4affSfengbojiang 		iflib_pseudodev = device_add_child(root_bus, "ifpseudo", 0);
188*22ce4affSfengbojiang 		mtx_unlock(&Giant);
189*22ce4affSfengbojiang 		MPASS(iflib_pseudodev != NULL);
190*22ce4affSfengbojiang 	}
191*22ce4affSfengbojiang 	ip = iflib_ip_lookup(name);
192*22ce4affSfengbojiang 	if (ip == NULL) {
193*22ce4affSfengbojiang 		printf("no ip found for %s\n", name);
194*22ce4affSfengbojiang 		return (ENOENT);
195*22ce4affSfengbojiang 	}
196*22ce4affSfengbojiang 	if ((dev = devclass_get_device(ip->ip_dc, unit)) != NULL) {
197*22ce4affSfengbojiang 		printf("unit %d allocated\n", unit);
198*22ce4affSfengbojiang 		bus_generic_print_child(iflib_pseudodev, dev);
199*22ce4affSfengbojiang 		return (EBUSY);
200*22ce4affSfengbojiang 	}
201*22ce4affSfengbojiang 	PSEUDO_LOCK();
202*22ce4affSfengbojiang 	dev = device_add_child(iflib_pseudodev, name, unit);
203*22ce4affSfengbojiang 	device_set_driver(dev, &iflib_pseudodriver);
204*22ce4affSfengbojiang 	PSEUDO_UNLOCK();
205*22ce4affSfengbojiang 	device_quiet(dev);
206*22ce4affSfengbojiang 	rc = device_attach(dev);
207*22ce4affSfengbojiang 	MPASS(rc == 0);
208*22ce4affSfengbojiang 	MPASS(dev != NULL);
209*22ce4affSfengbojiang 	MPASS(devclass_get_device(ip->ip_dc, unit) == dev);
210*22ce4affSfengbojiang 	rc = iflib_pseudo_register(dev, ip->ip_sctx, &ctx, &clctx);
211*22ce4affSfengbojiang 	if (rc) {
212*22ce4affSfengbojiang 		mtx_lock(&Giant);
213*22ce4affSfengbojiang 		device_delete_child(iflib_pseudodev, dev);
214*22ce4affSfengbojiang 		mtx_unlock(&Giant);
215*22ce4affSfengbojiang 	} else
216*22ce4affSfengbojiang 		device_set_softc(dev, ctx);
217*22ce4affSfengbojiang 
218*22ce4affSfengbojiang 	return (rc);
219*22ce4affSfengbojiang }
220*22ce4affSfengbojiang 
221*22ce4affSfengbojiang static void
iflib_clone_destroy(if_t ifp)222*22ce4affSfengbojiang iflib_clone_destroy(if_t ifp)
223*22ce4affSfengbojiang {
224*22ce4affSfengbojiang 	if_ctx_t ctx;
225*22ce4affSfengbojiang 	device_t dev;
226*22ce4affSfengbojiang 	struct sx *ctx_lock;
227*22ce4affSfengbojiang 	int rc;
228*22ce4affSfengbojiang 
229*22ce4affSfengbojiang 	/*
230*22ce4affSfengbojiang 	 * Detach device / free / free unit
231*22ce4affSfengbojiang 	 */
232*22ce4affSfengbojiang 	ctx = if_getsoftc(ifp);
233*22ce4affSfengbojiang 	dev = iflib_get_dev(ctx);
234*22ce4affSfengbojiang 	ctx_lock = iflib_ctx_lock_get(ctx);
235*22ce4affSfengbojiang 	sx_xlock(ctx_lock);
236*22ce4affSfengbojiang 	iflib_set_detach(ctx);
237*22ce4affSfengbojiang 	iflib_stop(ctx);
238*22ce4affSfengbojiang 	sx_xunlock(ctx_lock);
239*22ce4affSfengbojiang 
240*22ce4affSfengbojiang 	mtx_lock(&Giant);
241*22ce4affSfengbojiang 	rc = device_delete_child(iflib_pseudodev, dev);
242*22ce4affSfengbojiang 	mtx_unlock(&Giant);
243*22ce4affSfengbojiang 	if (rc == 0)
244*22ce4affSfengbojiang 		iflib_pseudo_deregister(ctx);
245*22ce4affSfengbojiang }
246*22ce4affSfengbojiang 
247*22ce4affSfengbojiang if_pseudo_t
iflib_clone_register(if_shared_ctx_t sctx)248*22ce4affSfengbojiang iflib_clone_register(if_shared_ctx_t sctx)
249*22ce4affSfengbojiang {
250*22ce4affSfengbojiang 	if_pseudo_t ip;
251*22ce4affSfengbojiang 
252*22ce4affSfengbojiang 	if (sctx->isc_name == NULL) {
253*22ce4affSfengbojiang 		printf("iflib_clone_register failed - shared_ctx needs to have a device name\n");
254*22ce4affSfengbojiang 		return (NULL);
255*22ce4affSfengbojiang 	}
256*22ce4affSfengbojiang 	if (iflib_ip_lookup(sctx->isc_name) != NULL) {
257*22ce4affSfengbojiang 		printf("iflib_clone_register failed - shared_ctx %s alread registered\n",
258*22ce4affSfengbojiang 			   sctx->isc_name);
259*22ce4affSfengbojiang 		return (NULL);
260*22ce4affSfengbojiang 	}
261*22ce4affSfengbojiang 	ip = malloc(sizeof(*ip), M_IFLIB, M_WAITOK|M_ZERO);
262*22ce4affSfengbojiang 	ip->ip_sctx = sctx;
263*22ce4affSfengbojiang 	ip->ip_dc = devclass_create(sctx->isc_name);
264*22ce4affSfengbojiang 	if (ip->ip_dc == NULL)
265*22ce4affSfengbojiang 		goto fail_clone;
266*22ce4affSfengbojiang 	/* XXX --- we can handle clone_advanced later */
267*22ce4affSfengbojiang 	ip->ip_ifc  = if_clone_simple(sctx->isc_name, iflib_clone_create, iflib_clone_destroy, 0);
268*22ce4affSfengbojiang 	if (ip->ip_ifc == NULL) {
269*22ce4affSfengbojiang 		printf("clone_simple failed -- cloned %s  devices will not be available\n", sctx->isc_name);
270*22ce4affSfengbojiang 		goto fail_clone;
271*22ce4affSfengbojiang 	}
272*22ce4affSfengbojiang 	ip->ip_lladdr_tag = EVENTHANDLER_REGISTER(iflladdr_event,
273*22ce4affSfengbojiang 											 iflib_iflladdr, NULL, EVENTHANDLER_PRI_ANY);
274*22ce4affSfengbojiang 	if (ip->ip_lladdr_tag == NULL)
275*22ce4affSfengbojiang 		goto fail_addr;
276*22ce4affSfengbojiang 	ip->ip_detach_tag = EVENTHANDLER_REGISTER(ifnet_departure_event,
277*22ce4affSfengbojiang 											 iflib_ifdetach, NULL, EVENTHANDLER_PRI_ANY);
278*22ce4affSfengbojiang 
279*22ce4affSfengbojiang 	if (ip->ip_detach_tag == NULL)
280*22ce4affSfengbojiang 		goto fail_depart;
281*22ce4affSfengbojiang 
282*22ce4affSfengbojiang 	iflib_ip_insert(ip);
283*22ce4affSfengbojiang 	return (ip);
284*22ce4affSfengbojiang  fail_depart:
285*22ce4affSfengbojiang 	EVENTHANDLER_DEREGISTER(iflladdr_event, ip->ip_lladdr_tag);
286*22ce4affSfengbojiang  fail_addr:
287*22ce4affSfengbojiang 	if_clone_detach(ip->ip_ifc);
288*22ce4affSfengbojiang  fail_clone:
289*22ce4affSfengbojiang 	free(ip, M_IFLIB);
290*22ce4affSfengbojiang 	return (NULL);
291*22ce4affSfengbojiang }
292*22ce4affSfengbojiang 
293*22ce4affSfengbojiang void
iflib_clone_deregister(if_pseudo_t ip)294*22ce4affSfengbojiang iflib_clone_deregister(if_pseudo_t ip)
295*22ce4affSfengbojiang {
296*22ce4affSfengbojiang 	/* XXX check that is not still in use */
297*22ce4affSfengbojiang 	iflib_ip_delete(ip);
298*22ce4affSfengbojiang 	EVENTHANDLER_DEREGISTER(ifnet_departure_event, ip->ip_detach_tag);
299*22ce4affSfengbojiang 	EVENTHANDLER_DEREGISTER(iflladdr_event, ip->ip_lladdr_tag);
300*22ce4affSfengbojiang 	if_clone_detach(ip->ip_ifc);
301*22ce4affSfengbojiang 	/* XXX free devclass */
302*22ce4affSfengbojiang 	free(ip, M_IFLIB);
303*22ce4affSfengbojiang }
304