xref: /linux-6.15/drivers/net/netdevsim/netdev.c (revision 8ef890df)
1 /*
2  * Copyright (C) 2017 Netronome Systems, Inc.
3  *
4  * This software is licensed under the GNU General License Version 2,
5  * June 1991 as shown in the file COPYING in the top-level directory of this
6  * source tree.
7  *
8  * THE COPYRIGHT HOLDERS AND/OR OTHER PARTIES PROVIDE THE PROGRAM "AS IS"
9  * WITHOUT WARRANTY OF ANY KIND, EITHER EXPRESSED OR IMPLIED, INCLUDING,
10  * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
11  * FOR A PARTICULAR PURPOSE. THE ENTIRE RISK AS TO THE QUALITY AND PERFORMANCE
12  * OF THE PROGRAM IS WITH YOU. SHOULD THE PROGRAM PROVE DEFECTIVE, YOU ASSUME
13  * THE COST OF ALL NECESSARY SERVICING, REPAIR OR CORRECTION.
14  */
15 
16 #include <linux/debugfs.h>
17 #include <linux/etherdevice.h>
18 #include <linux/ethtool_netlink.h>
19 #include <linux/kernel.h>
20 #include <linux/module.h>
21 #include <linux/netdevice.h>
22 #include <linux/slab.h>
23 #include <net/netdev_queues.h>
24 #include <net/netdev_rx_queue.h>
25 #include <net/page_pool/helpers.h>
26 #include <net/netlink.h>
27 #include <net/net_shaper.h>
28 #include <net/netdev_lock.h>
29 #include <net/pkt_cls.h>
30 #include <net/rtnetlink.h>
31 #include <net/udp_tunnel.h>
32 
33 #include "netdevsim.h"
34 
35 MODULE_IMPORT_NS("NETDEV_INTERNAL");
36 
37 #define NSIM_RING_SIZE		256
38 
39 static int nsim_napi_rx(struct nsim_rq *rq, struct sk_buff *skb)
40 {
41 	if (skb_queue_len(&rq->skb_queue) > NSIM_RING_SIZE) {
42 		dev_kfree_skb_any(skb);
43 		return NET_RX_DROP;
44 	}
45 
46 	skb_queue_tail(&rq->skb_queue, skb);
47 	return NET_RX_SUCCESS;
48 }
49 
/*
 * Run @skb through __dev_forward_skb() towards @dev and, if that succeeds
 * (returns 0), queue it on @rq. A non-zero forwarding result is returned
 * unchanged and the skb is not queued.
 */
static int nsim_forward_skb(struct net_device *dev, struct sk_buff *skb,
			    struct nsim_rq *rq)
{
	int ret = __dev_forward_skb(dev, skb);

	if (ret)
		return ret;

	return nsim_napi_rx(rq, skb);
}
55 
56 static netdev_tx_t nsim_start_xmit(struct sk_buff *skb, struct net_device *dev)
57 {
58 	struct netdevsim *ns = netdev_priv(dev);
59 	struct net_device *peer_dev;
60 	unsigned int len = skb->len;
61 	struct netdevsim *peer_ns;
62 	struct netdev_config *cfg;
63 	struct nsim_rq *rq;
64 	int rxq;
65 
66 	rcu_read_lock();
67 	if (!nsim_ipsec_tx(ns, skb))
68 		goto out_drop_free;
69 
70 	peer_ns = rcu_dereference(ns->peer);
71 	if (!peer_ns)
72 		goto out_drop_free;
73 
74 	peer_dev = peer_ns->netdev;
75 	rxq = skb_get_queue_mapping(skb);
76 	if (rxq >= peer_dev->num_rx_queues)
77 		rxq = rxq % peer_dev->num_rx_queues;
78 	rq = peer_ns->rq[rxq];
79 
80 	cfg = peer_dev->cfg;
81 	if (skb_is_nonlinear(skb) &&
82 	    (cfg->hds_config != ETHTOOL_TCP_DATA_SPLIT_ENABLED ||
83 	     (cfg->hds_config == ETHTOOL_TCP_DATA_SPLIT_ENABLED &&
84 	      cfg->hds_thresh > len)))
85 		skb_linearize(skb);
86 
87 	skb_tx_timestamp(skb);
88 	if (unlikely(nsim_forward_skb(peer_dev, skb, rq) == NET_RX_DROP))
89 		goto out_drop_cnt;
90 
91 	if (!hrtimer_active(&rq->napi_timer))
92 		hrtimer_start(&rq->napi_timer, us_to_ktime(5), HRTIMER_MODE_REL);
93 
94 	rcu_read_unlock();
95 	u64_stats_update_begin(&ns->syncp);
96 	ns->tx_packets++;
97 	ns->tx_bytes += len;
98 	u64_stats_update_end(&ns->syncp);
99 	return NETDEV_TX_OK;
100 
101 out_drop_free:
102 	dev_kfree_skb(skb);
103 out_drop_cnt:
104 	rcu_read_unlock();
105 	u64_stats_update_begin(&ns->syncp);
106 	ns->tx_dropped++;
107 	u64_stats_update_end(&ns->syncp);
108 	return NETDEV_TX_OK;
109 }
110 
/* ndo_set_rx_mode: intentionally a no-op. */
static void nsim_set_rx_mode(struct net_device *dev)
{
}
114 
115 static int nsim_change_mtu(struct net_device *dev, int new_mtu)
116 {
117 	struct netdevsim *ns = netdev_priv(dev);
118 
119 	if (ns->xdp.prog && new_mtu > NSIM_XDP_MAX_MTU)
120 		return -EBUSY;
121 
122 	WRITE_ONCE(dev->mtu, new_mtu);
123 
124 	return 0;
125 }
126 
127 static void
128 nsim_get_stats64(struct net_device *dev, struct rtnl_link_stats64 *stats)
129 {
130 	struct netdevsim *ns = netdev_priv(dev);
131 	unsigned int start;
132 
133 	do {
134 		start = u64_stats_fetch_begin(&ns->syncp);
135 		stats->tx_bytes = ns->tx_bytes;
136 		stats->tx_packets = ns->tx_packets;
137 		stats->tx_dropped = ns->tx_dropped;
138 	} while (u64_stats_fetch_retry(&ns->syncp, start));
139 }
140 
141 static int
142 nsim_setup_tc_block_cb(enum tc_setup_type type, void *type_data, void *cb_priv)
143 {
144 	return nsim_bpf_setup_tc_block_cb(type, type_data, cb_priv);
145 }
146 
147 static int nsim_set_vf_mac(struct net_device *dev, int vf, u8 *mac)
148 {
149 	struct netdevsim *ns = netdev_priv(dev);
150 	struct nsim_dev *nsim_dev = ns->nsim_dev;
151 
152 	/* Only refuse multicast addresses, zero address can mean unset/any. */
153 	if (vf >= nsim_dev_get_vfs(nsim_dev) || is_multicast_ether_addr(mac))
154 		return -EINVAL;
155 	memcpy(nsim_dev->vfconfigs[vf].vf_mac, mac, ETH_ALEN);
156 
157 	return 0;
158 }
159 
160 static int nsim_set_vf_vlan(struct net_device *dev, int vf,
161 			    u16 vlan, u8 qos, __be16 vlan_proto)
162 {
163 	struct netdevsim *ns = netdev_priv(dev);
164 	struct nsim_dev *nsim_dev = ns->nsim_dev;
165 
166 	if (vf >= nsim_dev_get_vfs(nsim_dev) || vlan > 4095 || qos > 7)
167 		return -EINVAL;
168 
169 	nsim_dev->vfconfigs[vf].vlan = vlan;
170 	nsim_dev->vfconfigs[vf].qos = qos;
171 	nsim_dev->vfconfigs[vf].vlan_proto = vlan_proto;
172 
173 	return 0;
174 }
175 
176 static int nsim_set_vf_rate(struct net_device *dev, int vf, int min, int max)
177 {
178 	struct netdevsim *ns = netdev_priv(dev);
179 	struct nsim_dev *nsim_dev = ns->nsim_dev;
180 
181 	if (nsim_esw_mode_is_switchdev(ns->nsim_dev)) {
182 		pr_err("Not supported in switchdev mode. Please use devlink API.\n");
183 		return -EOPNOTSUPP;
184 	}
185 
186 	if (vf >= nsim_dev_get_vfs(nsim_dev))
187 		return -EINVAL;
188 
189 	nsim_dev->vfconfigs[vf].min_tx_rate = min;
190 	nsim_dev->vfconfigs[vf].max_tx_rate = max;
191 
192 	return 0;
193 }
194 
195 static int nsim_set_vf_spoofchk(struct net_device *dev, int vf, bool val)
196 {
197 	struct netdevsim *ns = netdev_priv(dev);
198 	struct nsim_dev *nsim_dev = ns->nsim_dev;
199 
200 	if (vf >= nsim_dev_get_vfs(nsim_dev))
201 		return -EINVAL;
202 	nsim_dev->vfconfigs[vf].spoofchk_enabled = val;
203 
204 	return 0;
205 }
206 
207 static int nsim_set_vf_rss_query_en(struct net_device *dev, int vf, bool val)
208 {
209 	struct netdevsim *ns = netdev_priv(dev);
210 	struct nsim_dev *nsim_dev = ns->nsim_dev;
211 
212 	if (vf >= nsim_dev_get_vfs(nsim_dev))
213 		return -EINVAL;
214 	nsim_dev->vfconfigs[vf].rss_query_enabled = val;
215 
216 	return 0;
217 }
218 
219 static int nsim_set_vf_trust(struct net_device *dev, int vf, bool val)
220 {
221 	struct netdevsim *ns = netdev_priv(dev);
222 	struct nsim_dev *nsim_dev = ns->nsim_dev;
223 
224 	if (vf >= nsim_dev_get_vfs(nsim_dev))
225 		return -EINVAL;
226 	nsim_dev->vfconfigs[vf].trusted = val;
227 
228 	return 0;
229 }
230 
231 static int
232 nsim_get_vf_config(struct net_device *dev, int vf, struct ifla_vf_info *ivi)
233 {
234 	struct netdevsim *ns = netdev_priv(dev);
235 	struct nsim_dev *nsim_dev = ns->nsim_dev;
236 
237 	if (vf >= nsim_dev_get_vfs(nsim_dev))
238 		return -EINVAL;
239 
240 	ivi->vf = vf;
241 	ivi->linkstate = nsim_dev->vfconfigs[vf].link_state;
242 	ivi->min_tx_rate = nsim_dev->vfconfigs[vf].min_tx_rate;
243 	ivi->max_tx_rate = nsim_dev->vfconfigs[vf].max_tx_rate;
244 	ivi->vlan = nsim_dev->vfconfigs[vf].vlan;
245 	ivi->vlan_proto = nsim_dev->vfconfigs[vf].vlan_proto;
246 	ivi->qos = nsim_dev->vfconfigs[vf].qos;
247 	memcpy(&ivi->mac, nsim_dev->vfconfigs[vf].vf_mac, ETH_ALEN);
248 	ivi->spoofchk = nsim_dev->vfconfigs[vf].spoofchk_enabled;
249 	ivi->trusted = nsim_dev->vfconfigs[vf].trusted;
250 	ivi->rss_query_en = nsim_dev->vfconfigs[vf].rss_query_enabled;
251 
252 	return 0;
253 }
254 
255 static int nsim_set_vf_link_state(struct net_device *dev, int vf, int state)
256 {
257 	struct netdevsim *ns = netdev_priv(dev);
258 	struct nsim_dev *nsim_dev = ns->nsim_dev;
259 
260 	if (vf >= nsim_dev_get_vfs(nsim_dev))
261 		return -EINVAL;
262 
263 	switch (state) {
264 	case IFLA_VF_LINK_STATE_AUTO:
265 	case IFLA_VF_LINK_STATE_ENABLE:
266 	case IFLA_VF_LINK_STATE_DISABLE:
267 		break;
268 	default:
269 		return -EINVAL;
270 	}
271 
272 	nsim_dev->vfconfigs[vf].link_state = state;
273 
274 	return 0;
275 }
276 
277 static void nsim_taprio_stats(struct tc_taprio_qopt_stats *stats)
278 {
279 	stats->window_drops = 0;
280 	stats->tx_overruns = 0;
281 }
282 
283 static int nsim_setup_tc_taprio(struct net_device *dev,
284 				struct tc_taprio_qopt_offload *offload)
285 {
286 	int err = 0;
287 
288 	switch (offload->cmd) {
289 	case TAPRIO_CMD_REPLACE:
290 	case TAPRIO_CMD_DESTROY:
291 		break;
292 	case TAPRIO_CMD_STATS:
293 		nsim_taprio_stats(&offload->stats);
294 		break;
295 	default:
296 		err = -EOPNOTSUPP;
297 	}
298 
299 	return err;
300 }
301 
/* Driver-wide list passed to flow_block_cb_setup_simple() for TC blocks. */
static LIST_HEAD(nsim_block_cb_list);
303 
304 static int
305 nsim_setup_tc(struct net_device *dev, enum tc_setup_type type, void *type_data)
306 {
307 	struct netdevsim *ns = netdev_priv(dev);
308 
309 	switch (type) {
310 	case TC_SETUP_QDISC_TAPRIO:
311 		return nsim_setup_tc_taprio(dev, type_data);
312 	case TC_SETUP_BLOCK:
313 		return flow_block_cb_setup_simple(type_data,
314 						  &nsim_block_cb_list,
315 						  nsim_setup_tc_block_cb,
316 						  ns, ns, true);
317 	default:
318 		return -EOPNOTSUPP;
319 	}
320 }
321 
322 static int
323 nsim_set_features(struct net_device *dev, netdev_features_t features)
324 {
325 	struct netdevsim *ns = netdev_priv(dev);
326 
327 	if ((dev->features & NETIF_F_HW_TC) > (features & NETIF_F_HW_TC))
328 		return nsim_bpf_disable_tc(ns);
329 
330 	return 0;
331 }
332 
333 static int nsim_get_iflink(const struct net_device *dev)
334 {
335 	struct netdevsim *nsim, *peer;
336 	int iflink;
337 
338 	nsim = netdev_priv(dev);
339 
340 	rcu_read_lock();
341 	peer = rcu_dereference(nsim->peer);
342 	iflink = peer ? READ_ONCE(peer->netdev->ifindex) :
343 			READ_ONCE(dev->ifindex);
344 	rcu_read_unlock();
345 
346 	return iflink;
347 }
348 
349 static int nsim_rcv(struct nsim_rq *rq, int budget)
350 {
351 	struct sk_buff *skb;
352 	int i;
353 
354 	for (i = 0; i < budget; i++) {
355 		if (skb_queue_empty(&rq->skb_queue))
356 			break;
357 
358 		skb = skb_dequeue(&rq->skb_queue);
359 		netif_receive_skb(skb);
360 	}
361 
362 	return i;
363 }
364 
365 static int nsim_poll(struct napi_struct *napi, int budget)
366 {
367 	struct nsim_rq *rq = container_of(napi, struct nsim_rq, napi);
368 	int done;
369 
370 	done = nsim_rcv(rq, budget);
371 	napi_complete(napi);
372 
373 	return done;
374 }
375 
376 static int nsim_create_page_pool(struct page_pool **p, struct napi_struct *napi)
377 {
378 	struct page_pool_params params = {
379 		.order = 0,
380 		.pool_size = NSIM_RING_SIZE,
381 		.nid = NUMA_NO_NODE,
382 		.dev = &napi->dev->dev,
383 		.napi = napi,
384 		.dma_dir = DMA_BIDIRECTIONAL,
385 		.netdev = napi->dev,
386 	};
387 	struct page_pool *pool;
388 
389 	pool = page_pool_create(&params);
390 	if (IS_ERR(pool))
391 		return PTR_ERR(pool);
392 
393 	*p = pool;
394 	return 0;
395 }
396 
397 static int nsim_init_napi(struct netdevsim *ns)
398 {
399 	struct net_device *dev = ns->netdev;
400 	struct nsim_rq *rq;
401 	int err, i;
402 
403 	for (i = 0; i < dev->num_rx_queues; i++) {
404 		rq = ns->rq[i];
405 
406 		netif_napi_add_config_locked(dev, &rq->napi, nsim_poll, i);
407 	}
408 
409 	for (i = 0; i < dev->num_rx_queues; i++) {
410 		rq = ns->rq[i];
411 
412 		err = nsim_create_page_pool(&rq->page_pool, &rq->napi);
413 		if (err)
414 			goto err_pp_destroy;
415 	}
416 
417 	return 0;
418 
419 err_pp_destroy:
420 	while (i--) {
421 		page_pool_destroy(ns->rq[i]->page_pool);
422 		ns->rq[i]->page_pool = NULL;
423 	}
424 
425 	for (i = 0; i < dev->num_rx_queues; i++)
426 		__netif_napi_del_locked(&ns->rq[i]->napi);
427 
428 	return err;
429 }
430 
431 static enum hrtimer_restart nsim_napi_schedule(struct hrtimer *timer)
432 {
433 	struct nsim_rq *rq;
434 
435 	rq = container_of(timer, struct nsim_rq, napi_timer);
436 	napi_schedule(&rq->napi);
437 
438 	return HRTIMER_NORESTART;
439 }
440 
441 static void nsim_rq_timer_init(struct nsim_rq *rq)
442 {
443 	hrtimer_init(&rq->napi_timer, CLOCK_MONOTONIC, HRTIMER_MODE_REL);
444 	rq->napi_timer.function = nsim_napi_schedule;
445 }
446 
447 static void nsim_enable_napi(struct netdevsim *ns)
448 {
449 	struct net_device *dev = ns->netdev;
450 	int i;
451 
452 	for (i = 0; i < dev->num_rx_queues; i++) {
453 		struct nsim_rq *rq = ns->rq[i];
454 
455 		netif_queue_set_napi(dev, i, NETDEV_QUEUE_TYPE_RX, &rq->napi);
456 		napi_enable_locked(&rq->napi);
457 	}
458 }
459 
460 static int nsim_open(struct net_device *dev)
461 {
462 	struct netdevsim *ns = netdev_priv(dev);
463 	int err;
464 
465 	netdev_assert_locked(dev);
466 
467 	err = nsim_init_napi(ns);
468 	if (err)
469 		return err;
470 
471 	nsim_enable_napi(ns);
472 
473 	return 0;
474 }
475 
476 static void nsim_del_napi(struct netdevsim *ns)
477 {
478 	struct net_device *dev = ns->netdev;
479 	int i;
480 
481 	for (i = 0; i < dev->num_rx_queues; i++) {
482 		struct nsim_rq *rq = ns->rq[i];
483 
484 		napi_disable_locked(&rq->napi);
485 		__netif_napi_del_locked(&rq->napi);
486 	}
487 	synchronize_net();
488 
489 	for (i = 0; i < dev->num_rx_queues; i++) {
490 		page_pool_destroy(ns->rq[i]->page_pool);
491 		ns->rq[i]->page_pool = NULL;
492 	}
493 }
494 
495 static int nsim_stop(struct net_device *dev)
496 {
497 	struct netdevsim *ns = netdev_priv(dev);
498 	struct netdevsim *peer;
499 
500 	netdev_assert_locked(dev);
501 
502 	netif_carrier_off(dev);
503 	peer = rtnl_dereference(ns->peer);
504 	if (peer)
505 		netif_carrier_off(peer->netdev);
506 
507 	nsim_del_napi(ns);
508 
509 	return 0;
510 }
511 
/* net_shaper .set stub: accepts every request and does nothing. */
static int nsim_shaper_set(struct net_shaper_binding *binding,
			   const struct net_shaper *shaper,
			   struct netlink_ext_ack *extack)
{
	return 0;
}
518 
/* net_shaper .delete stub: accepts every request and does nothing. */
static int nsim_shaper_del(struct net_shaper_binding *binding,
			   const struct net_shaper_handle *handle,
			   struct netlink_ext_ack *extack)
{
	return 0;
}
525 
/* net_shaper .group stub: accepts every request and does nothing. */
static int nsim_shaper_group(struct net_shaper_binding *binding,
			     int leaves_count,
			     const struct net_shaper *leaves,
			     const struct net_shaper *root,
			     struct netlink_ext_ack *extack)
{
	return 0;
}
534 
535 static void nsim_shaper_cap(struct net_shaper_binding *binding,
536 			    enum net_shaper_scope scope,
537 			    unsigned long *flags)
538 {
539 	*flags = ULONG_MAX;
540 }
541 
542 static const struct net_shaper_ops nsim_shaper_ops = {
543 	.set			= nsim_shaper_set,
544 	.delete			= nsim_shaper_del,
545 	.group			= nsim_shaper_group,
546 	.capabilities		= nsim_shaper_cap,
547 };
548 
549 static const struct net_device_ops nsim_netdev_ops = {
550 	.ndo_start_xmit		= nsim_start_xmit,
551 	.ndo_set_rx_mode	= nsim_set_rx_mode,
552 	.ndo_set_mac_address	= eth_mac_addr,
553 	.ndo_validate_addr	= eth_validate_addr,
554 	.ndo_change_mtu		= nsim_change_mtu,
555 	.ndo_get_stats64	= nsim_get_stats64,
556 	.ndo_set_vf_mac		= nsim_set_vf_mac,
557 	.ndo_set_vf_vlan	= nsim_set_vf_vlan,
558 	.ndo_set_vf_rate	= nsim_set_vf_rate,
559 	.ndo_set_vf_spoofchk	= nsim_set_vf_spoofchk,
560 	.ndo_set_vf_trust	= nsim_set_vf_trust,
561 	.ndo_get_vf_config	= nsim_get_vf_config,
562 	.ndo_set_vf_link_state	= nsim_set_vf_link_state,
563 	.ndo_set_vf_rss_query_en = nsim_set_vf_rss_query_en,
564 	.ndo_setup_tc		= nsim_setup_tc,
565 	.ndo_set_features	= nsim_set_features,
566 	.ndo_get_iflink		= nsim_get_iflink,
567 	.ndo_bpf		= nsim_bpf,
568 	.ndo_open		= nsim_open,
569 	.ndo_stop		= nsim_stop,
570 	.net_shaper_ops		= &nsim_shaper_ops,
571 };
572 
573 static const struct net_device_ops nsim_vf_netdev_ops = {
574 	.ndo_start_xmit		= nsim_start_xmit,
575 	.ndo_set_rx_mode	= nsim_set_rx_mode,
576 	.ndo_set_mac_address	= eth_mac_addr,
577 	.ndo_validate_addr	= eth_validate_addr,
578 	.ndo_change_mtu		= nsim_change_mtu,
579 	.ndo_get_stats64	= nsim_get_stats64,
580 	.ndo_setup_tc		= nsim_setup_tc,
581 	.ndo_set_features	= nsim_set_features,
582 };
583 
584 /* We don't have true per-queue stats, yet, so do some random fakery here.
585  * Only report stuff for queue 0.
586  */
587 static void nsim_get_queue_stats_rx(struct net_device *dev, int idx,
588 				    struct netdev_queue_stats_rx *stats)
589 {
590 	struct rtnl_link_stats64 rtstats = {};
591 
592 	if (!idx)
593 		nsim_get_stats64(dev, &rtstats);
594 
595 	stats->packets = rtstats.rx_packets - !!rtstats.rx_packets;
596 	stats->bytes = rtstats.rx_bytes;
597 }
598 
599 static void nsim_get_queue_stats_tx(struct net_device *dev, int idx,
600 				    struct netdev_queue_stats_tx *stats)
601 {
602 	struct rtnl_link_stats64 rtstats = {};
603 
604 	if (!idx)
605 		nsim_get_stats64(dev, &rtstats);
606 
607 	stats->packets = rtstats.tx_packets - !!rtstats.tx_packets;
608 	stats->bytes = rtstats.tx_bytes;
609 }
610 
611 static void nsim_get_base_stats(struct net_device *dev,
612 				struct netdev_queue_stats_rx *rx,
613 				struct netdev_queue_stats_tx *tx)
614 {
615 	struct rtnl_link_stats64 rtstats = {};
616 
617 	nsim_get_stats64(dev, &rtstats);
618 
619 	rx->packets = !!rtstats.rx_packets;
620 	rx->bytes = 0;
621 	tx->packets = !!rtstats.tx_packets;
622 	tx->bytes = 0;
623 }
624 
625 static const struct netdev_stat_ops nsim_stat_ops = {
626 	.get_queue_stats_tx	= nsim_get_queue_stats_tx,
627 	.get_queue_stats_rx	= nsim_get_queue_stats_rx,
628 	.get_base_stats		= nsim_get_base_stats,
629 };
630 
631 static struct nsim_rq *nsim_queue_alloc(void)
632 {
633 	struct nsim_rq *rq;
634 
635 	rq = kzalloc(sizeof(*rq), GFP_KERNEL_ACCOUNT);
636 	if (!rq)
637 		return NULL;
638 
639 	skb_queue_head_init(&rq->skb_queue);
640 	nsim_rq_timer_init(rq);
641 	return rq;
642 }
643 
644 static void nsim_queue_free(struct nsim_rq *rq)
645 {
646 	hrtimer_cancel(&rq->napi_timer);
647 	skb_queue_purge_reason(&rq->skb_queue, SKB_DROP_REASON_QUEUE_PURGE);
648 	kfree(rq);
649 }
650 
651 /* Queue reset mode is controlled by ns->rq_reset_mode.
652  * - normal - new NAPI new pool (old NAPI enabled when new added)
653  * - mode 1 - allocate new pool (NAPI is only disabled / enabled)
654  * - mode 2 - new NAPI new pool (old NAPI removed before new added)
655  * - mode 3 - new NAPI new pool (old NAPI disabled when new added)
656  */
struct nsim_queue_mem {
	/* Whole replacement (or retired) queue; used when reset mode != 1 */
	struct nsim_rq *rq;
	/* Replacement (or retired) page pool only; used in reset mode 1 */
	struct page_pool *pp;
};
661 
662 static int
663 nsim_queue_mem_alloc(struct net_device *dev, void *per_queue_mem, int idx)
664 {
665 	struct nsim_queue_mem *qmem = per_queue_mem;
666 	struct netdevsim *ns = netdev_priv(dev);
667 	int err;
668 
669 	if (ns->rq_reset_mode > 3)
670 		return -EINVAL;
671 
672 	if (ns->rq_reset_mode == 1) {
673 		if (!netif_running(ns->netdev))
674 			return -ENETDOWN;
675 		return nsim_create_page_pool(&qmem->pp, &ns->rq[idx]->napi);
676 	}
677 
678 	qmem->rq = nsim_queue_alloc();
679 	if (!qmem->rq)
680 		return -ENOMEM;
681 
682 	err = nsim_create_page_pool(&qmem->rq->page_pool, &qmem->rq->napi);
683 	if (err)
684 		goto err_free;
685 
686 	if (!ns->rq_reset_mode)
687 		netif_napi_add_config_locked(dev, &qmem->rq->napi, nsim_poll,
688 					     idx);
689 
690 	return 0;
691 
692 err_free:
693 	nsim_queue_free(qmem->rq);
694 	return err;
695 }
696 
697 static void nsim_queue_mem_free(struct net_device *dev, void *per_queue_mem)
698 {
699 	struct nsim_queue_mem *qmem = per_queue_mem;
700 	struct netdevsim *ns = netdev_priv(dev);
701 
702 	page_pool_destroy(qmem->pp);
703 	if (qmem->rq) {
704 		if (!ns->rq_reset_mode)
705 			netif_napi_del_locked(&qmem->rq->napi);
706 		page_pool_destroy(qmem->rq->page_pool);
707 		nsim_queue_free(qmem->rq);
708 	}
709 }
710 
711 static int
712 nsim_queue_start(struct net_device *dev, void *per_queue_mem, int idx)
713 {
714 	struct nsim_queue_mem *qmem = per_queue_mem;
715 	struct netdevsim *ns = netdev_priv(dev);
716 
717 	netdev_assert_locked(dev);
718 
719 	if (ns->rq_reset_mode == 1) {
720 		ns->rq[idx]->page_pool = qmem->pp;
721 		napi_enable_locked(&ns->rq[idx]->napi);
722 		return 0;
723 	}
724 
725 	/* netif_napi_add()/_del() should normally be called from alloc/free,
726 	 * here we want to test various call orders.
727 	 */
728 	if (ns->rq_reset_mode == 2) {
729 		netif_napi_del_locked(&ns->rq[idx]->napi);
730 		netif_napi_add_config_locked(dev, &qmem->rq->napi, nsim_poll,
731 					     idx);
732 	} else if (ns->rq_reset_mode == 3) {
733 		netif_napi_add_config_locked(dev, &qmem->rq->napi, nsim_poll,
734 					     idx);
735 		netif_napi_del_locked(&ns->rq[idx]->napi);
736 	}
737 
738 	ns->rq[idx] = qmem->rq;
739 	napi_enable_locked(&ns->rq[idx]->napi);
740 
741 	return 0;
742 }
743 
744 static int nsim_queue_stop(struct net_device *dev, void *per_queue_mem, int idx)
745 {
746 	struct nsim_queue_mem *qmem = per_queue_mem;
747 	struct netdevsim *ns = netdev_priv(dev);
748 
749 	netdev_assert_locked(dev);
750 
751 	napi_disable_locked(&ns->rq[idx]->napi);
752 
753 	if (ns->rq_reset_mode == 1) {
754 		qmem->pp = ns->rq[idx]->page_pool;
755 		page_pool_disable_direct_recycling(qmem->pp);
756 	} else {
757 		qmem->rq = ns->rq[idx];
758 	}
759 
760 	return 0;
761 }
762 
763 static const struct netdev_queue_mgmt_ops nsim_queue_mgmt_ops = {
764 	.ndo_queue_mem_size	= sizeof(struct nsim_queue_mem),
765 	.ndo_queue_mem_alloc	= nsim_queue_mem_alloc,
766 	.ndo_queue_mem_free	= nsim_queue_mem_free,
767 	.ndo_queue_start	= nsim_queue_start,
768 	.ndo_queue_stop		= nsim_queue_stop,
769 };
770 
771 static ssize_t
772 nsim_qreset_write(struct file *file, const char __user *data,
773 		  size_t count, loff_t *ppos)
774 {
775 	struct netdevsim *ns = file->private_data;
776 	unsigned int queue, mode;
777 	char buf[32];
778 	ssize_t ret;
779 
780 	if (count >= sizeof(buf))
781 		return -EINVAL;
782 	if (copy_from_user(buf, data, count))
783 		return -EFAULT;
784 	buf[count] = '\0';
785 
786 	ret = sscanf(buf, "%u %u", &queue, &mode);
787 	if (ret != 2)
788 		return -EINVAL;
789 
790 	rtnl_lock();
791 	if (queue >= ns->netdev->real_num_rx_queues) {
792 		ret = -EINVAL;
793 		goto exit_unlock;
794 	}
795 
796 	ns->rq_reset_mode = mode;
797 	ret = netdev_rx_queue_restart(ns->netdev, queue);
798 	ns->rq_reset_mode = 0;
799 	if (ret)
800 		goto exit_unlock;
801 
802 	ret = count;
803 exit_unlock:
804 	rtnl_unlock();
805 	return ret;
806 }
807 
808 static const struct file_operations nsim_qreset_fops = {
809 	.open = simple_open,
810 	.write = nsim_qreset_write,
811 	.owner = THIS_MODULE,
812 };
813 
814 static ssize_t
815 nsim_pp_hold_read(struct file *file, char __user *data,
816 		  size_t count, loff_t *ppos)
817 {
818 	struct netdevsim *ns = file->private_data;
819 	char buf[3] = "n\n";
820 
821 	if (ns->page)
822 		buf[0] = 'y';
823 
824 	return simple_read_from_buffer(data, count, ppos, buf, 2);
825 }
826 
827 static ssize_t
828 nsim_pp_hold_write(struct file *file, const char __user *data,
829 		   size_t count, loff_t *ppos)
830 {
831 	struct netdevsim *ns = file->private_data;
832 	ssize_t ret;
833 	bool val;
834 
835 	ret = kstrtobool_from_user(data, count, &val);
836 	if (ret)
837 		return ret;
838 
839 	rtnl_lock();
840 	ret = count;
841 	if (val == !!ns->page)
842 		goto exit;
843 
844 	if (!netif_running(ns->netdev) && val) {
845 		ret = -ENETDOWN;
846 	} else if (val) {
847 		ns->page = page_pool_dev_alloc_pages(ns->rq[0]->page_pool);
848 		if (!ns->page)
849 			ret = -ENOMEM;
850 	} else {
851 		page_pool_put_full_page(ns->page->pp, ns->page, false);
852 		ns->page = NULL;
853 	}
854 
855 exit:
856 	rtnl_unlock();
857 	return ret;
858 }
859 
860 static const struct file_operations nsim_pp_hold_fops = {
861 	.open = simple_open,
862 	.read = nsim_pp_hold_read,
863 	.write = nsim_pp_hold_write,
864 	.llseek = generic_file_llseek,
865 	.owner = THIS_MODULE,
866 };
867 
868 static void nsim_setup(struct net_device *dev)
869 {
870 	ether_setup(dev);
871 	eth_hw_addr_random(dev);
872 
873 	dev->tx_queue_len = 0;
874 	dev->flags &= ~IFF_MULTICAST;
875 	dev->priv_flags |= IFF_LIVE_ADDR_CHANGE |
876 			   IFF_NO_QUEUE;
877 	dev->features |= NETIF_F_HIGHDMA |
878 			 NETIF_F_SG |
879 			 NETIF_F_FRAGLIST |
880 			 NETIF_F_HW_CSUM |
881 			 NETIF_F_TSO;
882 	dev->hw_features |= NETIF_F_HW_TC |
883 			    NETIF_F_SG |
884 			    NETIF_F_FRAGLIST |
885 			    NETIF_F_HW_CSUM |
886 			    NETIF_F_TSO;
887 	dev->max_mtu = ETH_MAX_MTU;
888 	dev->xdp_features = NETDEV_XDP_ACT_HW_OFFLOAD;
889 }
890 
891 static int nsim_queue_init(struct netdevsim *ns)
892 {
893 	struct net_device *dev = ns->netdev;
894 	int i;
895 
896 	ns->rq = kcalloc(dev->num_rx_queues, sizeof(*ns->rq),
897 			 GFP_KERNEL_ACCOUNT);
898 	if (!ns->rq)
899 		return -ENOMEM;
900 
901 	for (i = 0; i < dev->num_rx_queues; i++) {
902 		ns->rq[i] = nsim_queue_alloc();
903 		if (!ns->rq[i])
904 			goto err_free_prev;
905 	}
906 
907 	return 0;
908 
909 err_free_prev:
910 	while (i--)
911 		kfree(ns->rq[i]);
912 	kfree(ns->rq);
913 	return -ENOMEM;
914 }
915 
916 static void nsim_queue_uninit(struct netdevsim *ns)
917 {
918 	struct net_device *dev = ns->netdev;
919 	int i;
920 
921 	for (i = 0; i < dev->num_rx_queues; i++)
922 		nsim_queue_free(ns->rq[i]);
923 
924 	kfree(ns->rq);
925 	ns->rq = NULL;
926 }
927 
928 static int nsim_init_netdevsim(struct netdevsim *ns)
929 {
930 	struct mock_phc *phc;
931 	int err;
932 
933 	phc = mock_phc_create(&ns->nsim_bus_dev->dev);
934 	if (IS_ERR(phc))
935 		return PTR_ERR(phc);
936 
937 	ns->phc = phc;
938 	ns->netdev->netdev_ops = &nsim_netdev_ops;
939 	ns->netdev->stat_ops = &nsim_stat_ops;
940 	ns->netdev->queue_mgmt_ops = &nsim_queue_mgmt_ops;
941 
942 	err = nsim_udp_tunnels_info_create(ns->nsim_dev, ns->netdev);
943 	if (err)
944 		goto err_phc_destroy;
945 
946 	rtnl_lock();
947 	err = nsim_queue_init(ns);
948 	if (err)
949 		goto err_utn_destroy;
950 
951 	err = nsim_bpf_init(ns);
952 	if (err)
953 		goto err_rq_destroy;
954 
955 	nsim_macsec_init(ns);
956 	nsim_ipsec_init(ns);
957 
958 	err = register_netdevice(ns->netdev);
959 	if (err)
960 		goto err_ipsec_teardown;
961 	rtnl_unlock();
962 	return 0;
963 
964 err_ipsec_teardown:
965 	nsim_ipsec_teardown(ns);
966 	nsim_macsec_teardown(ns);
967 	nsim_bpf_uninit(ns);
968 err_rq_destroy:
969 	nsim_queue_uninit(ns);
970 err_utn_destroy:
971 	rtnl_unlock();
972 	nsim_udp_tunnels_info_destroy(ns->netdev);
973 err_phc_destroy:
974 	mock_phc_destroy(ns->phc);
975 	return err;
976 }
977 
978 static int nsim_init_netdevsim_vf(struct netdevsim *ns)
979 {
980 	int err;
981 
982 	ns->netdev->netdev_ops = &nsim_vf_netdev_ops;
983 	rtnl_lock();
984 	err = register_netdevice(ns->netdev);
985 	rtnl_unlock();
986 	return err;
987 }
988 
989 static void nsim_exit_netdevsim(struct netdevsim *ns)
990 {
991 	nsim_udp_tunnels_info_destroy(ns->netdev);
992 	mock_phc_destroy(ns->phc);
993 }
994 
995 struct netdevsim *
996 nsim_create(struct nsim_dev *nsim_dev, struct nsim_dev_port *nsim_dev_port)
997 {
998 	struct net_device *dev;
999 	struct netdevsim *ns;
1000 	int err;
1001 
1002 	dev = alloc_netdev_mq(sizeof(*ns), "eth%d", NET_NAME_UNKNOWN, nsim_setup,
1003 			      nsim_dev->nsim_bus_dev->num_queues);
1004 	if (!dev)
1005 		return ERR_PTR(-ENOMEM);
1006 
1007 	dev_net_set(dev, nsim_dev_net(nsim_dev));
1008 	ns = netdev_priv(dev);
1009 	ns->netdev = dev;
1010 	u64_stats_init(&ns->syncp);
1011 	ns->nsim_dev = nsim_dev;
1012 	ns->nsim_dev_port = nsim_dev_port;
1013 	ns->nsim_bus_dev = nsim_dev->nsim_bus_dev;
1014 	SET_NETDEV_DEV(dev, &ns->nsim_bus_dev->dev);
1015 	SET_NETDEV_DEVLINK_PORT(dev, &nsim_dev_port->devlink_port);
1016 	nsim_ethtool_init(ns);
1017 	if (nsim_dev_port_is_pf(nsim_dev_port))
1018 		err = nsim_init_netdevsim(ns);
1019 	else
1020 		err = nsim_init_netdevsim_vf(ns);
1021 	if (err)
1022 		goto err_free_netdev;
1023 
1024 	ns->pp_dfs = debugfs_create_file("pp_hold", 0600, nsim_dev_port->ddir,
1025 					 ns, &nsim_pp_hold_fops);
1026 	ns->qr_dfs = debugfs_create_file("queue_reset", 0200,
1027 					 nsim_dev_port->ddir, ns,
1028 					 &nsim_qreset_fops);
1029 
1030 	return ns;
1031 
1032 err_free_netdev:
1033 	free_netdev(dev);
1034 	return ERR_PTR(err);
1035 }
1036 
1037 void nsim_destroy(struct netdevsim *ns)
1038 {
1039 	struct net_device *dev = ns->netdev;
1040 	struct netdevsim *peer;
1041 
1042 	debugfs_remove(ns->qr_dfs);
1043 	debugfs_remove(ns->pp_dfs);
1044 
1045 	rtnl_lock();
1046 	peer = rtnl_dereference(ns->peer);
1047 	if (peer)
1048 		RCU_INIT_POINTER(peer->peer, NULL);
1049 	RCU_INIT_POINTER(ns->peer, NULL);
1050 	unregister_netdevice(dev);
1051 	if (nsim_dev_port_is_pf(ns->nsim_dev_port)) {
1052 		nsim_macsec_teardown(ns);
1053 		nsim_ipsec_teardown(ns);
1054 		nsim_bpf_uninit(ns);
1055 		nsim_queue_uninit(ns);
1056 	}
1057 	rtnl_unlock();
1058 	if (nsim_dev_port_is_pf(ns->nsim_dev_port))
1059 		nsim_exit_netdevsim(ns);
1060 
1061 	/* Put this intentionally late to exercise the orphaning path */
1062 	if (ns->page) {
1063 		page_pool_put_full_page(ns->page->pp, ns->page, false);
1064 		ns->page = NULL;
1065 	}
1066 
1067 	free_netdev(dev);
1068 }
1069 
1070 bool netdev_is_nsim(struct net_device *dev)
1071 {
1072 	return dev->netdev_ops == &nsim_netdev_ops;
1073 }
1074 
1075 static int nsim_validate(struct nlattr *tb[], struct nlattr *data[],
1076 			 struct netlink_ext_ack *extack)
1077 {
1078 	NL_SET_ERR_MSG_MOD(extack,
1079 			   "Please use: echo \"[ID] [PORT_COUNT] [NUM_QUEUES]\" > /sys/bus/netdevsim/new_device");
1080 	return -EOPNOTSUPP;
1081 }
1082 
1083 static struct rtnl_link_ops nsim_link_ops __read_mostly = {
1084 	.kind		= DRV_NAME,
1085 	.validate	= nsim_validate,
1086 };
1087 
1088 static int __init nsim_module_init(void)
1089 {
1090 	int err;
1091 
1092 	err = nsim_dev_init();
1093 	if (err)
1094 		return err;
1095 
1096 	err = nsim_bus_init();
1097 	if (err)
1098 		goto err_dev_exit;
1099 
1100 	err = rtnl_link_register(&nsim_link_ops);
1101 	if (err)
1102 		goto err_bus_exit;
1103 
1104 	return 0;
1105 
1106 err_bus_exit:
1107 	nsim_bus_exit();
1108 err_dev_exit:
1109 	nsim_dev_exit();
1110 	return err;
1111 }
1112 
1113 static void __exit nsim_module_exit(void)
1114 {
1115 	rtnl_link_unregister(&nsim_link_ops);
1116 	nsim_bus_exit();
1117 	nsim_dev_exit();
1118 }
1119 
1120 module_init(nsim_module_init);
1121 module_exit(nsim_module_exit);
1122 MODULE_LICENSE("GPL");
1123 MODULE_DESCRIPTION("Simulated networking device for testing");
1124 MODULE_ALIAS_RTNL_LINK(DRV_NAME);
1125