1 /* 2 * Copyright (C) 2017 Netronome Systems, Inc. 3 * 4 * This software is licensed under the GNU General License Version 2, 5 * June 1991 as shown in the file COPYING in the top-level directory of this 6 * source tree. 7 * 8 * THE COPYRIGHT HOLDERS AND/OR OTHER PARTIES PROVIDE THE PROGRAM "AS IS" 9 * WITHOUT WARRANTY OF ANY KIND, EITHER EXPRESSED OR IMPLIED, INCLUDING, 10 * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS 11 * FOR A PARTICULAR PURPOSE. THE ENTIRE RISK AS TO THE QUALITY AND PERFORMANCE 12 * OF THE PROGRAM IS WITH YOU. SHOULD THE PROGRAM PROVE DEFECTIVE, YOU ASSUME 13 * THE COST OF ALL NECESSARY SERVICING, REPAIR OR CORRECTION. 14 */ 15 16 #include <linux/debugfs.h> 17 #include <linux/etherdevice.h> 18 #include <linux/ethtool_netlink.h> 19 #include <linux/kernel.h> 20 #include <linux/module.h> 21 #include <linux/netdevice.h> 22 #include <linux/slab.h> 23 #include <net/netdev_queues.h> 24 #include <net/netdev_rx_queue.h> 25 #include <net/page_pool/helpers.h> 26 #include <net/netlink.h> 27 #include <net/net_shaper.h> 28 #include <net/netdev_lock.h> 29 #include <net/pkt_cls.h> 30 #include <net/rtnetlink.h> 31 #include <net/udp_tunnel.h> 32 33 #include "netdevsim.h" 34 35 MODULE_IMPORT_NS("NETDEV_INTERNAL"); 36 37 #define NSIM_RING_SIZE 256 38 39 static int nsim_napi_rx(struct nsim_rq *rq, struct sk_buff *skb) 40 { 41 if (skb_queue_len(&rq->skb_queue) > NSIM_RING_SIZE) { 42 dev_kfree_skb_any(skb); 43 return NET_RX_DROP; 44 } 45 46 skb_queue_tail(&rq->skb_queue, skb); 47 return NET_RX_SUCCESS; 48 } 49 50 static int nsim_forward_skb(struct net_device *dev, struct sk_buff *skb, 51 struct nsim_rq *rq) 52 { 53 return __dev_forward_skb(dev, skb) ?: nsim_napi_rx(rq, skb); 54 } 55 56 static netdev_tx_t nsim_start_xmit(struct sk_buff *skb, struct net_device *dev) 57 { 58 struct netdevsim *ns = netdev_priv(dev); 59 struct net_device *peer_dev; 60 unsigned int len = skb->len; 61 struct netdevsim *peer_ns; 62 struct netdev_config *cfg; 63 struct nsim_rq *rq; 64 int rxq; 65 66 rcu_read_lock(); 67 if (!nsim_ipsec_tx(ns, skb)) 68 goto out_drop_free; 69 70 peer_ns = rcu_dereference(ns->peer); 71 if (!peer_ns) 72 goto out_drop_free; 73 74 peer_dev = peer_ns->netdev; 75 rxq = skb_get_queue_mapping(skb); 76 if (rxq >= peer_dev->num_rx_queues) 77 rxq = rxq % peer_dev->num_rx_queues; 78 rq = peer_ns->rq[rxq]; 79 80 cfg = peer_dev->cfg; 81 if (skb_is_nonlinear(skb) && 82 (cfg->hds_config != ETHTOOL_TCP_DATA_SPLIT_ENABLED || 83 (cfg->hds_config == ETHTOOL_TCP_DATA_SPLIT_ENABLED && 84 cfg->hds_thresh > len))) 85 skb_linearize(skb); 86 87 skb_tx_timestamp(skb); 88 if (unlikely(nsim_forward_skb(peer_dev, skb, rq) == NET_RX_DROP)) 89 goto out_drop_cnt; 90 91 if (!hrtimer_active(&rq->napi_timer)) 92 hrtimer_start(&rq->napi_timer, us_to_ktime(5), HRTIMER_MODE_REL); 93 94 rcu_read_unlock(); 95 u64_stats_update_begin(&ns->syncp); 96 ns->tx_packets++; 97 ns->tx_bytes += len; 98 u64_stats_update_end(&ns->syncp); 99 return NETDEV_TX_OK; 100 101 out_drop_free: 102 dev_kfree_skb(skb); 103 out_drop_cnt: 104 rcu_read_unlock(); 105 u64_stats_update_begin(&ns->syncp); 106 ns->tx_dropped++; 107 u64_stats_update_end(&ns->syncp); 108 return NETDEV_TX_OK; 109 } 110 111 static void nsim_set_rx_mode(struct net_device *dev) 112 { 113 } 114 115 static int nsim_change_mtu(struct net_device *dev, int new_mtu) 116 { 117 struct netdevsim *ns = netdev_priv(dev); 118 119 if (ns->xdp.prog && new_mtu > NSIM_XDP_MAX_MTU) 120 return -EBUSY; 121 122 WRITE_ONCE(dev->mtu, new_mtu); 123 124 return 0; 125 } 126 127 static void 128 nsim_get_stats64(struct net_device *dev, struct rtnl_link_stats64 *stats) 129 { 130 struct netdevsim *ns = netdev_priv(dev); 131 unsigned int start; 132 133 do { 134 start = u64_stats_fetch_begin(&ns->syncp); 135 stats->tx_bytes = ns->tx_bytes; 136 stats->tx_packets = ns->tx_packets; 137 stats->tx_dropped = ns->tx_dropped; 138 } while (u64_stats_fetch_retry(&ns->syncp, start)); 139 } 140 141 static int 142 nsim_setup_tc_block_cb(enum tc_setup_type type, void *type_data, void *cb_priv) 143 { 144 return nsim_bpf_setup_tc_block_cb(type, type_data, cb_priv); 145 } 146 147 static int nsim_set_vf_mac(struct net_device *dev, int vf, u8 *mac) 148 { 149 struct netdevsim *ns = netdev_priv(dev); 150 struct nsim_dev *nsim_dev = ns->nsim_dev; 151 152 /* Only refuse multicast addresses, zero address can mean unset/any. */ 153 if (vf >= nsim_dev_get_vfs(nsim_dev) || is_multicast_ether_addr(mac)) 154 return -EINVAL; 155 memcpy(nsim_dev->vfconfigs[vf].vf_mac, mac, ETH_ALEN); 156 157 return 0; 158 } 159 160 static int nsim_set_vf_vlan(struct net_device *dev, int vf, 161 u16 vlan, u8 qos, __be16 vlan_proto) 162 { 163 struct netdevsim *ns = netdev_priv(dev); 164 struct nsim_dev *nsim_dev = ns->nsim_dev; 165 166 if (vf >= nsim_dev_get_vfs(nsim_dev) || vlan > 4095 || qos > 7) 167 return -EINVAL; 168 169 nsim_dev->vfconfigs[vf].vlan = vlan; 170 nsim_dev->vfconfigs[vf].qos = qos; 171 nsim_dev->vfconfigs[vf].vlan_proto = vlan_proto; 172 173 return 0; 174 } 175 176 static int nsim_set_vf_rate(struct net_device *dev, int vf, int min, int max) 177 { 178 struct netdevsim *ns = netdev_priv(dev); 179 struct nsim_dev *nsim_dev = ns->nsim_dev; 180 181 if (nsim_esw_mode_is_switchdev(ns->nsim_dev)) { 182 pr_err("Not supported in switchdev mode. Please use devlink API.\n"); 183 return -EOPNOTSUPP; 184 } 185 186 if (vf >= nsim_dev_get_vfs(nsim_dev)) 187 return -EINVAL; 188 189 nsim_dev->vfconfigs[vf].min_tx_rate = min; 190 nsim_dev->vfconfigs[vf].max_tx_rate = max; 191 192 return 0; 193 } 194 195 static int nsim_set_vf_spoofchk(struct net_device *dev, int vf, bool val) 196 { 197 struct netdevsim *ns = netdev_priv(dev); 198 struct nsim_dev *nsim_dev = ns->nsim_dev; 199 200 if (vf >= nsim_dev_get_vfs(nsim_dev)) 201 return -EINVAL; 202 nsim_dev->vfconfigs[vf].spoofchk_enabled = val; 203 204 return 0; 205 } 206 207 static int nsim_set_vf_rss_query_en(struct net_device *dev, int vf, bool val) 208 { 209 struct netdevsim *ns = netdev_priv(dev); 210 struct nsim_dev *nsim_dev = ns->nsim_dev; 211 212 if (vf >= nsim_dev_get_vfs(nsim_dev)) 213 return -EINVAL; 214 nsim_dev->vfconfigs[vf].rss_query_enabled = val; 215 216 return 0; 217 } 218 219 static int nsim_set_vf_trust(struct net_device *dev, int vf, bool val) 220 { 221 struct netdevsim *ns = netdev_priv(dev); 222 struct nsim_dev *nsim_dev = ns->nsim_dev; 223 224 if (vf >= nsim_dev_get_vfs(nsim_dev)) 225 return -EINVAL; 226 nsim_dev->vfconfigs[vf].trusted = val; 227 228 return 0; 229 } 230 231 static int 232 nsim_get_vf_config(struct net_device *dev, int vf, struct ifla_vf_info *ivi) 233 { 234 struct netdevsim *ns = netdev_priv(dev); 235 struct nsim_dev *nsim_dev = ns->nsim_dev; 236 237 if (vf >= nsim_dev_get_vfs(nsim_dev)) 238 return -EINVAL; 239 240 ivi->vf = vf; 241 ivi->linkstate = nsim_dev->vfconfigs[vf].link_state; 242 ivi->min_tx_rate = nsim_dev->vfconfigs[vf].min_tx_rate; 243 ivi->max_tx_rate = nsim_dev->vfconfigs[vf].max_tx_rate; 244 ivi->vlan = nsim_dev->vfconfigs[vf].vlan; 245 ivi->vlan_proto = nsim_dev->vfconfigs[vf].vlan_proto; 246 ivi->qos = nsim_dev->vfconfigs[vf].qos; 247 memcpy(&ivi->mac, nsim_dev->vfconfigs[vf].vf_mac, ETH_ALEN); 248 ivi->spoofchk = nsim_dev->vfconfigs[vf].spoofchk_enabled; 249 ivi->trusted = nsim_dev->vfconfigs[vf].trusted; 250 ivi->rss_query_en = nsim_dev->vfconfigs[vf].rss_query_enabled; 251 252 return 0; 253 } 254 255 static int nsim_set_vf_link_state(struct net_device *dev, int vf, int state) 256 { 257 struct netdevsim *ns = netdev_priv(dev); 258 struct nsim_dev *nsim_dev = ns->nsim_dev; 259 260 if (vf >= nsim_dev_get_vfs(nsim_dev)) 261 return -EINVAL; 262 263 switch (state) { 264 case IFLA_VF_LINK_STATE_AUTO: 265 case IFLA_VF_LINK_STATE_ENABLE: 266 case IFLA_VF_LINK_STATE_DISABLE: 267 break; 268 default: 269 return -EINVAL; 270 } 271 272 nsim_dev->vfconfigs[vf].link_state = state; 273 274 return 0; 275 } 276 277 static void nsim_taprio_stats(struct tc_taprio_qopt_stats *stats) 278 { 279 stats->window_drops = 0; 280 stats->tx_overruns = 0; 281 } 282 283 static int nsim_setup_tc_taprio(struct net_device *dev, 284 struct tc_taprio_qopt_offload *offload) 285 { 286 int err = 0; 287 288 switch (offload->cmd) { 289 case TAPRIO_CMD_REPLACE: 290 case TAPRIO_CMD_DESTROY: 291 break; 292 case TAPRIO_CMD_STATS: 293 nsim_taprio_stats(&offload->stats); 294 break; 295 default: 296 err = -EOPNOTSUPP; 297 } 298 299 return err; 300 } 301 302 static LIST_HEAD(nsim_block_cb_list); 303 304 static int 305 nsim_setup_tc(struct net_device *dev, enum tc_setup_type type, void *type_data) 306 { 307 struct netdevsim *ns = netdev_priv(dev); 308 309 switch (type) { 310 case TC_SETUP_QDISC_TAPRIO: 311 return nsim_setup_tc_taprio(dev, type_data); 312 case TC_SETUP_BLOCK: 313 return flow_block_cb_setup_simple(type_data, 314 &nsim_block_cb_list, 315 nsim_setup_tc_block_cb, 316 ns, ns, true); 317 default: 318 return -EOPNOTSUPP; 319 } 320 } 321 322 static int 323 nsim_set_features(struct net_device *dev, netdev_features_t features) 324 { 325 struct netdevsim *ns = netdev_priv(dev); 326 327 if ((dev->features & NETIF_F_HW_TC) > (features & NETIF_F_HW_TC)) 328 return nsim_bpf_disable_tc(ns); 329 330 return 0; 331 } 332 333 static int nsim_get_iflink(const struct net_device *dev) 334 { 335 struct netdevsim *nsim, *peer; 336 int iflink; 337 338 nsim = netdev_priv(dev); 339 340 rcu_read_lock(); 341 peer = rcu_dereference(nsim->peer); 342 iflink = peer ? READ_ONCE(peer->netdev->ifindex) : 343 READ_ONCE(dev->ifindex); 344 rcu_read_unlock(); 345 346 return iflink; 347 } 348 349 static int nsim_rcv(struct nsim_rq *rq, int budget) 350 { 351 struct sk_buff *skb; 352 int i; 353 354 for (i = 0; i < budget; i++) { 355 if (skb_queue_empty(&rq->skb_queue)) 356 break; 357 358 skb = skb_dequeue(&rq->skb_queue); 359 netif_receive_skb(skb); 360 } 361 362 return i; 363 } 364 365 static int nsim_poll(struct napi_struct *napi, int budget) 366 { 367 struct nsim_rq *rq = container_of(napi, struct nsim_rq, napi); 368 int done; 369 370 done = nsim_rcv(rq, budget); 371 napi_complete(napi); 372 373 return done; 374 } 375 376 static int nsim_create_page_pool(struct page_pool **p, struct napi_struct *napi) 377 { 378 struct page_pool_params params = { 379 .order = 0, 380 .pool_size = NSIM_RING_SIZE, 381 .nid = NUMA_NO_NODE, 382 .dev = &napi->dev->dev, 383 .napi = napi, 384 .dma_dir = DMA_BIDIRECTIONAL, 385 .netdev = napi->dev, 386 }; 387 struct page_pool *pool; 388 389 pool = page_pool_create(¶ms); 390 if (IS_ERR(pool)) 391 return PTR_ERR(pool); 392 393 *p = pool; 394 return 0; 395 } 396 397 static int nsim_init_napi(struct netdevsim *ns) 398 { 399 struct net_device *dev = ns->netdev; 400 struct nsim_rq *rq; 401 int err, i; 402 403 for (i = 0; i < dev->num_rx_queues; i++) { 404 rq = ns->rq[i]; 405 406 netif_napi_add_config_locked(dev, &rq->napi, nsim_poll, i); 407 } 408 409 for (i = 0; i < dev->num_rx_queues; i++) { 410 rq = ns->rq[i]; 411 412 err = nsim_create_page_pool(&rq->page_pool, &rq->napi); 413 if (err) 414 goto err_pp_destroy; 415 } 416 417 return 0; 418 419 err_pp_destroy: 420 while (i--) { 421 page_pool_destroy(ns->rq[i]->page_pool); 422 ns->rq[i]->page_pool = NULL; 423 } 424 425 for (i = 0; i < dev->num_rx_queues; i++) 426 __netif_napi_del_locked(&ns->rq[i]->napi); 427 428 return err; 429 } 430 431 static enum hrtimer_restart nsim_napi_schedule(struct hrtimer *timer) 432 { 433 struct nsim_rq *rq; 434 435 rq = container_of(timer, struct nsim_rq, napi_timer); 436 napi_schedule(&rq->napi); 437 438 return HRTIMER_NORESTART; 439 } 440 441 static void nsim_rq_timer_init(struct nsim_rq *rq) 442 { 443 hrtimer_init(&rq->napi_timer, CLOCK_MONOTONIC, HRTIMER_MODE_REL); 444 rq->napi_timer.function = nsim_napi_schedule; 445 } 446 447 static void nsim_enable_napi(struct netdevsim *ns) 448 { 449 struct net_device *dev = ns->netdev; 450 int i; 451 452 for (i = 0; i < dev->num_rx_queues; i++) { 453 struct nsim_rq *rq = ns->rq[i]; 454 455 netif_queue_set_napi(dev, i, NETDEV_QUEUE_TYPE_RX, &rq->napi); 456 napi_enable_locked(&rq->napi); 457 } 458 } 459 460 static int nsim_open(struct net_device *dev) 461 { 462 struct netdevsim *ns = netdev_priv(dev); 463 int err; 464 465 netdev_assert_locked(dev); 466 467 err = nsim_init_napi(ns); 468 if (err) 469 return err; 470 471 nsim_enable_napi(ns); 472 473 return 0; 474 } 475 476 static void nsim_del_napi(struct netdevsim *ns) 477 { 478 struct net_device *dev = ns->netdev; 479 int i; 480 481 for (i = 0; i < dev->num_rx_queues; i++) { 482 struct nsim_rq *rq = ns->rq[i]; 483 484 napi_disable_locked(&rq->napi); 485 __netif_napi_del_locked(&rq->napi); 486 } 487 synchronize_net(); 488 489 for (i = 0; i < dev->num_rx_queues; i++) { 490 page_pool_destroy(ns->rq[i]->page_pool); 491 ns->rq[i]->page_pool = NULL; 492 } 493 } 494 495 static int nsim_stop(struct net_device *dev) 496 { 497 struct netdevsim *ns = netdev_priv(dev); 498 struct netdevsim *peer; 499 500 netdev_assert_locked(dev); 501 502 netif_carrier_off(dev); 503 peer = rtnl_dereference(ns->peer); 504 if (peer) 505 netif_carrier_off(peer->netdev); 506 507 nsim_del_napi(ns); 508 509 return 0; 510 } 511 512 static int nsim_shaper_set(struct net_shaper_binding *binding, 513 const struct net_shaper *shaper, 514 struct netlink_ext_ack *extack) 515 { 516 return 0; 517 } 518 519 static int nsim_shaper_del(struct net_shaper_binding *binding, 520 const struct net_shaper_handle *handle, 521 struct netlink_ext_ack *extack) 522 { 523 return 0; 524 } 525 526 static int nsim_shaper_group(struct net_shaper_binding *binding, 527 int leaves_count, 528 const struct net_shaper *leaves, 529 const struct net_shaper *root, 530 struct netlink_ext_ack *extack) 531 { 532 return 0; 533 } 534 535 static void nsim_shaper_cap(struct net_shaper_binding *binding, 536 enum net_shaper_scope scope, 537 unsigned long *flags) 538 { 539 *flags = ULONG_MAX; 540 } 541 542 static const struct net_shaper_ops nsim_shaper_ops = { 543 .set = nsim_shaper_set, 544 .delete = nsim_shaper_del, 545 .group = nsim_shaper_group, 546 .capabilities = nsim_shaper_cap, 547 }; 548 549 static const struct net_device_ops nsim_netdev_ops = { 550 .ndo_start_xmit = nsim_start_xmit, 551 .ndo_set_rx_mode = nsim_set_rx_mode, 552 .ndo_set_mac_address = eth_mac_addr, 553 .ndo_validate_addr = eth_validate_addr, 554 .ndo_change_mtu = nsim_change_mtu, 555 .ndo_get_stats64 = nsim_get_stats64, 556 .ndo_set_vf_mac = nsim_set_vf_mac, 557 .ndo_set_vf_vlan = nsim_set_vf_vlan, 558 .ndo_set_vf_rate = nsim_set_vf_rate, 559 .ndo_set_vf_spoofchk = nsim_set_vf_spoofchk, 560 .ndo_set_vf_trust = nsim_set_vf_trust, 561 .ndo_get_vf_config = nsim_get_vf_config, 562 .ndo_set_vf_link_state = nsim_set_vf_link_state, 563 .ndo_set_vf_rss_query_en = nsim_set_vf_rss_query_en, 564 .ndo_setup_tc = nsim_setup_tc, 565 .ndo_set_features = nsim_set_features, 566 .ndo_get_iflink = nsim_get_iflink, 567 .ndo_bpf = nsim_bpf, 568 .ndo_open = nsim_open, 569 .ndo_stop = nsim_stop, 570 .net_shaper_ops = &nsim_shaper_ops, 571 }; 572 573 static const struct net_device_ops nsim_vf_netdev_ops = { 574 .ndo_start_xmit = nsim_start_xmit, 575 .ndo_set_rx_mode = nsim_set_rx_mode, 576 .ndo_set_mac_address = eth_mac_addr, 577 .ndo_validate_addr = eth_validate_addr, 578 .ndo_change_mtu = nsim_change_mtu, 579 .ndo_get_stats64 = nsim_get_stats64, 580 .ndo_setup_tc = nsim_setup_tc, 581 .ndo_set_features = nsim_set_features, 582 }; 583 584 /* We don't have true per-queue stats, yet, so do some random fakery here. 585 * Only report stuff for queue 0. 586 */ 587 static void nsim_get_queue_stats_rx(struct net_device *dev, int idx, 588 struct netdev_queue_stats_rx *stats) 589 { 590 struct rtnl_link_stats64 rtstats = {}; 591 592 if (!idx) 593 nsim_get_stats64(dev, &rtstats); 594 595 stats->packets = rtstats.rx_packets - !!rtstats.rx_packets; 596 stats->bytes = rtstats.rx_bytes; 597 } 598 599 static void nsim_get_queue_stats_tx(struct net_device *dev, int idx, 600 struct netdev_queue_stats_tx *stats) 601 { 602 struct rtnl_link_stats64 rtstats = {}; 603 604 if (!idx) 605 nsim_get_stats64(dev, &rtstats); 606 607 stats->packets = rtstats.tx_packets - !!rtstats.tx_packets; 608 stats->bytes = rtstats.tx_bytes; 609 } 610 611 static void nsim_get_base_stats(struct net_device *dev, 612 struct netdev_queue_stats_rx *rx, 613 struct netdev_queue_stats_tx *tx) 614 { 615 struct rtnl_link_stats64 rtstats = {}; 616 617 nsim_get_stats64(dev, &rtstats); 618 619 rx->packets = !!rtstats.rx_packets; 620 rx->bytes = 0; 621 tx->packets = !!rtstats.tx_packets; 622 tx->bytes = 0; 623 } 624 625 static const struct netdev_stat_ops nsim_stat_ops = { 626 .get_queue_stats_tx = nsim_get_queue_stats_tx, 627 .get_queue_stats_rx = nsim_get_queue_stats_rx, 628 .get_base_stats = nsim_get_base_stats, 629 }; 630 631 static struct nsim_rq *nsim_queue_alloc(void) 632 { 633 struct nsim_rq *rq; 634 635 rq = kzalloc(sizeof(*rq), GFP_KERNEL_ACCOUNT); 636 if (!rq) 637 return NULL; 638 639 skb_queue_head_init(&rq->skb_queue); 640 nsim_rq_timer_init(rq); 641 return rq; 642 } 643 644 static void nsim_queue_free(struct nsim_rq *rq) 645 { 646 hrtimer_cancel(&rq->napi_timer); 647 skb_queue_purge_reason(&rq->skb_queue, SKB_DROP_REASON_QUEUE_PURGE); 648 kfree(rq); 649 } 650 651 /* Queue reset mode is controlled by ns->rq_reset_mode. 652 * - normal - new NAPI new pool (old NAPI enabled when new added) 653 * - mode 1 - allocate new pool (NAPI is only disabled / enabled) 654 * - mode 2 - new NAPI new pool (old NAPI removed before new added) 655 * - mode 3 - new NAPI new pool (old NAPI disabled when new added) 656 */ 657 struct nsim_queue_mem { 658 struct nsim_rq *rq; 659 struct page_pool *pp; 660 }; 661 662 static int 663 nsim_queue_mem_alloc(struct net_device *dev, void *per_queue_mem, int idx) 664 { 665 struct nsim_queue_mem *qmem = per_queue_mem; 666 struct netdevsim *ns = netdev_priv(dev); 667 int err; 668 669 if (ns->rq_reset_mode > 3) 670 return -EINVAL; 671 672 if (ns->rq_reset_mode == 1) { 673 if (!netif_running(ns->netdev)) 674 return -ENETDOWN; 675 return nsim_create_page_pool(&qmem->pp, &ns->rq[idx]->napi); 676 } 677 678 qmem->rq = nsim_queue_alloc(); 679 if (!qmem->rq) 680 return -ENOMEM; 681 682 err = nsim_create_page_pool(&qmem->rq->page_pool, &qmem->rq->napi); 683 if (err) 684 goto err_free; 685 686 if (!ns->rq_reset_mode) 687 netif_napi_add_config_locked(dev, &qmem->rq->napi, nsim_poll, 688 idx); 689 690 return 0; 691 692 err_free: 693 nsim_queue_free(qmem->rq); 694 return err; 695 } 696 697 static void nsim_queue_mem_free(struct net_device *dev, void *per_queue_mem) 698 { 699 struct nsim_queue_mem *qmem = per_queue_mem; 700 struct netdevsim *ns = netdev_priv(dev); 701 702 page_pool_destroy(qmem->pp); 703 if (qmem->rq) { 704 if (!ns->rq_reset_mode) 705 netif_napi_del_locked(&qmem->rq->napi); 706 page_pool_destroy(qmem->rq->page_pool); 707 nsim_queue_free(qmem->rq); 708 } 709 } 710 711 static int 712 nsim_queue_start(struct net_device *dev, void *per_queue_mem, int idx) 713 { 714 struct nsim_queue_mem *qmem = per_queue_mem; 715 struct netdevsim *ns = netdev_priv(dev); 716 717 netdev_assert_locked(dev); 718 719 if (ns->rq_reset_mode == 1) { 720 ns->rq[idx]->page_pool = qmem->pp; 721 napi_enable_locked(&ns->rq[idx]->napi); 722 return 0; 723 } 724 725 /* netif_napi_add()/_del() should normally be called from alloc/free, 726 * here we want to test various call orders. 727 */ 728 if (ns->rq_reset_mode == 2) { 729 netif_napi_del_locked(&ns->rq[idx]->napi); 730 netif_napi_add_config_locked(dev, &qmem->rq->napi, nsim_poll, 731 idx); 732 } else if (ns->rq_reset_mode == 3) { 733 netif_napi_add_config_locked(dev, &qmem->rq->napi, nsim_poll, 734 idx); 735 netif_napi_del_locked(&ns->rq[idx]->napi); 736 } 737 738 ns->rq[idx] = qmem->rq; 739 napi_enable_locked(&ns->rq[idx]->napi); 740 741 return 0; 742 } 743 744 static int nsim_queue_stop(struct net_device *dev, void *per_queue_mem, int idx) 745 { 746 struct nsim_queue_mem *qmem = per_queue_mem; 747 struct netdevsim *ns = netdev_priv(dev); 748 749 netdev_assert_locked(dev); 750 751 napi_disable_locked(&ns->rq[idx]->napi); 752 753 if (ns->rq_reset_mode == 1) { 754 qmem->pp = ns->rq[idx]->page_pool; 755 page_pool_disable_direct_recycling(qmem->pp); 756 } else { 757 qmem->rq = ns->rq[idx]; 758 } 759 760 return 0; 761 } 762 763 static const struct netdev_queue_mgmt_ops nsim_queue_mgmt_ops = { 764 .ndo_queue_mem_size = sizeof(struct nsim_queue_mem), 765 .ndo_queue_mem_alloc = nsim_queue_mem_alloc, 766 .ndo_queue_mem_free = nsim_queue_mem_free, 767 .ndo_queue_start = nsim_queue_start, 768 .ndo_queue_stop = nsim_queue_stop, 769 }; 770 771 static ssize_t 772 nsim_qreset_write(struct file *file, const char __user *data, 773 size_t count, loff_t *ppos) 774 { 775 struct netdevsim *ns = file->private_data; 776 unsigned int queue, mode; 777 char buf[32]; 778 ssize_t ret; 779 780 if (count >= sizeof(buf)) 781 return -EINVAL; 782 if (copy_from_user(buf, data, count)) 783 return -EFAULT; 784 buf[count] = '\0'; 785 786 ret = sscanf(buf, "%u %u", &queue, &mode); 787 if (ret != 2) 788 return -EINVAL; 789 790 rtnl_lock(); 791 if (queue >= ns->netdev->real_num_rx_queues) { 792 ret = -EINVAL; 793 goto exit_unlock; 794 } 795 796 ns->rq_reset_mode = mode; 797 ret = netdev_rx_queue_restart(ns->netdev, queue); 798 ns->rq_reset_mode = 0; 799 if (ret) 800 goto exit_unlock; 801 802 ret = count; 803 exit_unlock: 804 rtnl_unlock(); 805 return ret; 806 } 807 808 static const struct file_operations nsim_qreset_fops = { 809 .open = simple_open, 810 .write = nsim_qreset_write, 811 .owner = THIS_MODULE, 812 }; 813 814 static ssize_t 815 nsim_pp_hold_read(struct file *file, char __user *data, 816 size_t count, loff_t *ppos) 817 { 818 struct netdevsim *ns = file->private_data; 819 char buf[3] = "n\n"; 820 821 if (ns->page) 822 buf[0] = 'y'; 823 824 return simple_read_from_buffer(data, count, ppos, buf, 2); 825 } 826 827 static ssize_t 828 nsim_pp_hold_write(struct file *file, const char __user *data, 829 size_t count, loff_t *ppos) 830 { 831 struct netdevsim *ns = file->private_data; 832 ssize_t ret; 833 bool val; 834 835 ret = kstrtobool_from_user(data, count, &val); 836 if (ret) 837 return ret; 838 839 rtnl_lock(); 840 ret = count; 841 if (val == !!ns->page) 842 goto exit; 843 844 if (!netif_running(ns->netdev) && val) { 845 ret = -ENETDOWN; 846 } else if (val) { 847 ns->page = page_pool_dev_alloc_pages(ns->rq[0]->page_pool); 848 if (!ns->page) 849 ret = -ENOMEM; 850 } else { 851 page_pool_put_full_page(ns->page->pp, ns->page, false); 852 ns->page = NULL; 853 } 854 855 exit: 856 rtnl_unlock(); 857 return ret; 858 } 859 860 static const struct file_operations nsim_pp_hold_fops = { 861 .open = simple_open, 862 .read = nsim_pp_hold_read, 863 .write = nsim_pp_hold_write, 864 .llseek = generic_file_llseek, 865 .owner = THIS_MODULE, 866 }; 867 868 static void nsim_setup(struct net_device *dev) 869 { 870 ether_setup(dev); 871 eth_hw_addr_random(dev); 872 873 dev->tx_queue_len = 0; 874 dev->flags &= ~IFF_MULTICAST; 875 dev->priv_flags |= IFF_LIVE_ADDR_CHANGE | 876 IFF_NO_QUEUE; 877 dev->features |= NETIF_F_HIGHDMA | 878 NETIF_F_SG | 879 NETIF_F_FRAGLIST | 880 NETIF_F_HW_CSUM | 881 NETIF_F_TSO; 882 dev->hw_features |= NETIF_F_HW_TC | 883 NETIF_F_SG | 884 NETIF_F_FRAGLIST | 885 NETIF_F_HW_CSUM | 886 NETIF_F_TSO; 887 dev->max_mtu = ETH_MAX_MTU; 888 dev->xdp_features = NETDEV_XDP_ACT_HW_OFFLOAD; 889 } 890 891 static int nsim_queue_init(struct netdevsim *ns) 892 { 893 struct net_device *dev = ns->netdev; 894 int i; 895 896 ns->rq = kcalloc(dev->num_rx_queues, sizeof(*ns->rq), 897 GFP_KERNEL_ACCOUNT); 898 if (!ns->rq) 899 return -ENOMEM; 900 901 for (i = 0; i < dev->num_rx_queues; i++) { 902 ns->rq[i] = nsim_queue_alloc(); 903 if (!ns->rq[i]) 904 goto err_free_prev; 905 } 906 907 return 0; 908 909 err_free_prev: 910 while (i--) 911 kfree(ns->rq[i]); 912 kfree(ns->rq); 913 return -ENOMEM; 914 } 915 916 static void nsim_queue_uninit(struct netdevsim *ns) 917 { 918 struct net_device *dev = ns->netdev; 919 int i; 920 921 for (i = 0; i < dev->num_rx_queues; i++) 922 nsim_queue_free(ns->rq[i]); 923 924 kfree(ns->rq); 925 ns->rq = NULL; 926 } 927 928 static int nsim_init_netdevsim(struct netdevsim *ns) 929 { 930 struct mock_phc *phc; 931 int err; 932 933 phc = mock_phc_create(&ns->nsim_bus_dev->dev); 934 if (IS_ERR(phc)) 935 return PTR_ERR(phc); 936 937 ns->phc = phc; 938 ns->netdev->netdev_ops = &nsim_netdev_ops; 939 ns->netdev->stat_ops = &nsim_stat_ops; 940 ns->netdev->queue_mgmt_ops = &nsim_queue_mgmt_ops; 941 942 err = nsim_udp_tunnels_info_create(ns->nsim_dev, ns->netdev); 943 if (err) 944 goto err_phc_destroy; 945 946 rtnl_lock(); 947 err = nsim_queue_init(ns); 948 if (err) 949 goto err_utn_destroy; 950 951 err = nsim_bpf_init(ns); 952 if (err) 953 goto err_rq_destroy; 954 955 nsim_macsec_init(ns); 956 nsim_ipsec_init(ns); 957 958 err = register_netdevice(ns->netdev); 959 if (err) 960 goto err_ipsec_teardown; 961 rtnl_unlock(); 962 return 0; 963 964 err_ipsec_teardown: 965 nsim_ipsec_teardown(ns); 966 nsim_macsec_teardown(ns); 967 nsim_bpf_uninit(ns); 968 err_rq_destroy: 969 nsim_queue_uninit(ns); 970 err_utn_destroy: 971 rtnl_unlock(); 972 nsim_udp_tunnels_info_destroy(ns->netdev); 973 err_phc_destroy: 974 mock_phc_destroy(ns->phc); 975 return err; 976 } 977 978 static int nsim_init_netdevsim_vf(struct netdevsim *ns) 979 { 980 int err; 981 982 ns->netdev->netdev_ops = &nsim_vf_netdev_ops; 983 rtnl_lock(); 984 err = register_netdevice(ns->netdev); 985 rtnl_unlock(); 986 return err; 987 } 988 989 static void nsim_exit_netdevsim(struct netdevsim *ns) 990 { 991 nsim_udp_tunnels_info_destroy(ns->netdev); 992 mock_phc_destroy(ns->phc); 993 } 994 995 struct netdevsim * 996 nsim_create(struct nsim_dev *nsim_dev, struct nsim_dev_port *nsim_dev_port) 997 { 998 struct net_device *dev; 999 struct netdevsim *ns; 1000 int err; 1001 1002 dev = alloc_netdev_mq(sizeof(*ns), "eth%d", NET_NAME_UNKNOWN, nsim_setup, 1003 nsim_dev->nsim_bus_dev->num_queues); 1004 if (!dev) 1005 return ERR_PTR(-ENOMEM); 1006 1007 dev_net_set(dev, nsim_dev_net(nsim_dev)); 1008 ns = netdev_priv(dev); 1009 ns->netdev = dev; 1010 u64_stats_init(&ns->syncp); 1011 ns->nsim_dev = nsim_dev; 1012 ns->nsim_dev_port = nsim_dev_port; 1013 ns->nsim_bus_dev = nsim_dev->nsim_bus_dev; 1014 SET_NETDEV_DEV(dev, &ns->nsim_bus_dev->dev); 1015 SET_NETDEV_DEVLINK_PORT(dev, &nsim_dev_port->devlink_port); 1016 nsim_ethtool_init(ns); 1017 if (nsim_dev_port_is_pf(nsim_dev_port)) 1018 err = nsim_init_netdevsim(ns); 1019 else 1020 err = nsim_init_netdevsim_vf(ns); 1021 if (err) 1022 goto err_free_netdev; 1023 1024 ns->pp_dfs = debugfs_create_file("pp_hold", 0600, nsim_dev_port->ddir, 1025 ns, &nsim_pp_hold_fops); 1026 ns->qr_dfs = debugfs_create_file("queue_reset", 0200, 1027 nsim_dev_port->ddir, ns, 1028 &nsim_qreset_fops); 1029 1030 return ns; 1031 1032 err_free_netdev: 1033 free_netdev(dev); 1034 return ERR_PTR(err); 1035 } 1036 1037 void nsim_destroy(struct netdevsim *ns) 1038 { 1039 struct net_device *dev = ns->netdev; 1040 struct netdevsim *peer; 1041 1042 debugfs_remove(ns->qr_dfs); 1043 debugfs_remove(ns->pp_dfs); 1044 1045 rtnl_lock(); 1046 peer = rtnl_dereference(ns->peer); 1047 if (peer) 1048 RCU_INIT_POINTER(peer->peer, NULL); 1049 RCU_INIT_POINTER(ns->peer, NULL); 1050 unregister_netdevice(dev); 1051 if (nsim_dev_port_is_pf(ns->nsim_dev_port)) { 1052 nsim_macsec_teardown(ns); 1053 nsim_ipsec_teardown(ns); 1054 nsim_bpf_uninit(ns); 1055 nsim_queue_uninit(ns); 1056 } 1057 rtnl_unlock(); 1058 if (nsim_dev_port_is_pf(ns->nsim_dev_port)) 1059 nsim_exit_netdevsim(ns); 1060 1061 /* Put this intentionally late to exercise the orphaning path */ 1062 if (ns->page) { 1063 page_pool_put_full_page(ns->page->pp, ns->page, false); 1064 ns->page = NULL; 1065 } 1066 1067 free_netdev(dev); 1068 } 1069 1070 bool netdev_is_nsim(struct net_device *dev) 1071 { 1072 return dev->netdev_ops == &nsim_netdev_ops; 1073 } 1074 1075 static int nsim_validate(struct nlattr *tb[], struct nlattr *data[], 1076 struct netlink_ext_ack *extack) 1077 { 1078 NL_SET_ERR_MSG_MOD(extack, 1079 "Please use: echo \"[ID] [PORT_COUNT] [NUM_QUEUES]\" > /sys/bus/netdevsim/new_device"); 1080 return -EOPNOTSUPP; 1081 } 1082 1083 static struct rtnl_link_ops nsim_link_ops __read_mostly = { 1084 .kind = DRV_NAME, 1085 .validate = nsim_validate, 1086 }; 1087 1088 static int __init nsim_module_init(void) 1089 { 1090 int err; 1091 1092 err = nsim_dev_init(); 1093 if (err) 1094 return err; 1095 1096 err = nsim_bus_init(); 1097 if (err) 1098 goto err_dev_exit; 1099 1100 err = rtnl_link_register(&nsim_link_ops); 1101 if (err) 1102 goto err_bus_exit; 1103 1104 return 0; 1105 1106 err_bus_exit: 1107 nsim_bus_exit(); 1108 err_dev_exit: 1109 nsim_dev_exit(); 1110 return err; 1111 } 1112 1113 static void __exit nsim_module_exit(void) 1114 { 1115 rtnl_link_unregister(&nsim_link_ops); 1116 nsim_bus_exit(); 1117 nsim_dev_exit(); 1118 } 1119 1120 module_init(nsim_module_init); 1121 module_exit(nsim_module_exit); 1122 MODULE_LICENSE("GPL"); 1123 MODULE_DESCRIPTION("Simulated networking device for testing"); 1124 MODULE_ALIAS_RTNL_LINK(DRV_NAME); 1125