1 // SPDX-License-Identifier: GPL-2.0 2 /* 3 * Copyright(c) 2010-2014 Intel Corporation. 4 */ 5 6 #include <linux/version.h> 7 #include <linux/module.h> 8 #include <linux/miscdevice.h> 9 #include <linux/netdevice.h> 10 #include <linux/etherdevice.h> 11 #include <linux/pci.h> 12 #include <linux/kthread.h> 13 #include <linux/rwsem.h> 14 #include <linux/mutex.h> 15 #include <linux/nsproxy.h> 16 #include <net/net_namespace.h> 17 #include <net/netns/generic.h> 18 19 #include <rte_kni_common.h> 20 21 #include "compat.h" 22 #include "kni_dev.h" 23 24 MODULE_VERSION(KNI_VERSION); 25 MODULE_LICENSE("Dual BSD/GPL"); 26 MODULE_AUTHOR("Intel Corporation"); 27 MODULE_DESCRIPTION("Kernel Module for managing kni devices"); 28 29 #define KNI_RX_LOOP_NUM 1000 30 31 #define KNI_MAX_DEVICES 32 32 33 /* loopback mode */ 34 static char *lo_mode; 35 36 /* Kernel thread mode */ 37 static char *kthread_mode; 38 static uint32_t multiple_kthread_on; 39 40 /* Default carrier state for created KNI network interfaces */ 41 static char *carrier; 42 uint32_t kni_dflt_carrier; 43 44 #define KNI_DEV_IN_USE_BIT_NUM 0 /* Bit number for device in use */ 45 46 static int kni_net_id; 47 48 struct kni_net { 49 unsigned long device_in_use; /* device in use flag */ 50 struct mutex kni_kthread_lock; 51 struct task_struct *kni_kthread; 52 struct rw_semaphore kni_list_lock; 53 struct list_head kni_list_head; 54 }; 55 56 static int __net_init 57 kni_init_net(struct net *net) 58 { 59 #ifdef HAVE_SIMPLIFIED_PERNET_OPERATIONS 60 struct kni_net *knet = net_generic(net, kni_net_id); 61 62 memset(knet, 0, sizeof(*knet)); 63 #else 64 struct kni_net *knet; 65 int ret; 66 67 knet = kzalloc(sizeof(struct kni_net), GFP_KERNEL); 68 if (!knet) { 69 ret = -ENOMEM; 70 return ret; 71 } 72 #endif 73 74 /* Clear the bit of device in use */ 75 clear_bit(KNI_DEV_IN_USE_BIT_NUM, &knet->device_in_use); 76 77 mutex_init(&knet->kni_kthread_lock); 78 79 init_rwsem(&knet->kni_list_lock); 80 INIT_LIST_HEAD(&knet->kni_list_head); 81 82 #ifdef HAVE_SIMPLIFIED_PERNET_OPERATIONS 83 return 0; 84 #else 85 ret = net_assign_generic(net, kni_net_id, knet); 86 if (ret < 0) 87 kfree(knet); 88 89 return ret; 90 #endif 91 } 92 93 static void __net_exit 94 kni_exit_net(struct net *net) 95 { 96 struct kni_net *knet __maybe_unused; 97 98 knet = net_generic(net, kni_net_id); 99 mutex_destroy(&knet->kni_kthread_lock); 100 101 #ifndef HAVE_SIMPLIFIED_PERNET_OPERATIONS 102 kfree(knet); 103 #endif 104 } 105 106 static struct pernet_operations kni_net_ops = { 107 .init = kni_init_net, 108 .exit = kni_exit_net, 109 #ifdef HAVE_SIMPLIFIED_PERNET_OPERATIONS 110 .id = &kni_net_id, 111 .size = sizeof(struct kni_net), 112 #endif 113 }; 114 115 static int 116 kni_thread_single(void *data) 117 { 118 struct kni_net *knet = data; 119 int j; 120 struct kni_dev *dev; 121 122 while (!kthread_should_stop()) { 123 down_read(&knet->kni_list_lock); 124 for (j = 0; j < KNI_RX_LOOP_NUM; j++) { 125 list_for_each_entry(dev, &knet->kni_list_head, list) { 126 kni_net_rx(dev); 127 kni_net_poll_resp(dev); 128 } 129 } 130 up_read(&knet->kni_list_lock); 131 #ifdef RTE_KNI_PREEMPT_DEFAULT 132 /* reschedule out for a while */ 133 schedule_timeout_interruptible( 134 usecs_to_jiffies(KNI_KTHREAD_RESCHEDULE_INTERVAL)); 135 #endif 136 } 137 138 return 0; 139 } 140 141 static int 142 kni_thread_multiple(void *param) 143 { 144 int j; 145 struct kni_dev *dev = param; 146 147 while (!kthread_should_stop()) { 148 for (j = 0; j < KNI_RX_LOOP_NUM; j++) { 149 kni_net_rx(dev); 150 kni_net_poll_resp(dev); 151 } 152 #ifdef RTE_KNI_PREEMPT_DEFAULT 153 schedule_timeout_interruptible( 154 usecs_to_jiffies(KNI_KTHREAD_RESCHEDULE_INTERVAL)); 155 #endif 156 } 157 158 return 0; 159 } 160 161 static int 162 kni_open(struct inode *inode, struct file *file) 163 { 164 struct net *net = current->nsproxy->net_ns; 165 struct kni_net *knet = net_generic(net, kni_net_id); 166 167 /* kni device can be opened by one user only per netns */ 168 if (test_and_set_bit(KNI_DEV_IN_USE_BIT_NUM, &knet->device_in_use)) 169 return -EBUSY; 170 171 file->private_data = get_net(net); 172 pr_debug("/dev/kni opened\n"); 173 174 return 0; 175 } 176 177 static int 178 kni_dev_remove(struct kni_dev *dev) 179 { 180 if (!dev) 181 return -ENODEV; 182 183 if (dev->net_dev) { 184 unregister_netdev(dev->net_dev); 185 free_netdev(dev->net_dev); 186 } 187 188 kni_net_release_fifo_phy(dev); 189 190 return 0; 191 } 192 193 static int 194 kni_release(struct inode *inode, struct file *file) 195 { 196 struct net *net = file->private_data; 197 struct kni_net *knet = net_generic(net, kni_net_id); 198 struct kni_dev *dev, *n; 199 200 /* Stop kernel thread for single mode */ 201 if (multiple_kthread_on == 0) { 202 mutex_lock(&knet->kni_kthread_lock); 203 /* Stop kernel thread */ 204 if (knet->kni_kthread != NULL) { 205 kthread_stop(knet->kni_kthread); 206 knet->kni_kthread = NULL; 207 } 208 mutex_unlock(&knet->kni_kthread_lock); 209 } 210 211 down_write(&knet->kni_list_lock); 212 list_for_each_entry_safe(dev, n, &knet->kni_list_head, list) { 213 /* Stop kernel thread for multiple mode */ 214 if (multiple_kthread_on && dev->pthread != NULL) { 215 kthread_stop(dev->pthread); 216 dev->pthread = NULL; 217 } 218 219 kni_dev_remove(dev); 220 list_del(&dev->list); 221 } 222 up_write(&knet->kni_list_lock); 223 224 /* Clear the bit of device in use */ 225 clear_bit(KNI_DEV_IN_USE_BIT_NUM, &knet->device_in_use); 226 227 put_net(net); 228 pr_debug("/dev/kni closed\n"); 229 230 return 0; 231 } 232 233 static int 234 kni_check_param(struct kni_dev *kni, struct rte_kni_device_info *dev) 235 { 236 if (!kni || !dev) 237 return -1; 238 239 /* Check if network name has been used */ 240 if (!strncmp(kni->name, dev->name, RTE_KNI_NAMESIZE)) { 241 pr_err("KNI name %s duplicated\n", dev->name); 242 return -1; 243 } 244 245 return 0; 246 } 247 248 static int 249 kni_run_thread(struct kni_net *knet, struct kni_dev *kni, uint8_t force_bind) 250 { 251 /** 252 * Create a new kernel thread for multiple mode, set its core affinity, 253 * and finally wake it up. 254 */ 255 if (multiple_kthread_on) { 256 kni->pthread = kthread_create(kni_thread_multiple, 257 (void *)kni, "kni_%s", kni->name); 258 if (IS_ERR(kni->pthread)) { 259 kni_dev_remove(kni); 260 return -ECANCELED; 261 } 262 263 if (force_bind) 264 kthread_bind(kni->pthread, kni->core_id); 265 wake_up_process(kni->pthread); 266 } else { 267 mutex_lock(&knet->kni_kthread_lock); 268 269 if (knet->kni_kthread == NULL) { 270 knet->kni_kthread = kthread_create(kni_thread_single, 271 (void *)knet, "kni_single"); 272 if (IS_ERR(knet->kni_kthread)) { 273 mutex_unlock(&knet->kni_kthread_lock); 274 kni_dev_remove(kni); 275 return -ECANCELED; 276 } 277 278 if (force_bind) 279 kthread_bind(knet->kni_kthread, kni->core_id); 280 wake_up_process(knet->kni_kthread); 281 } 282 283 mutex_unlock(&knet->kni_kthread_lock); 284 } 285 286 return 0; 287 } 288 289 static int 290 kni_ioctl_create(struct net *net, uint32_t ioctl_num, 291 unsigned long ioctl_param) 292 { 293 struct kni_net *knet = net_generic(net, kni_net_id); 294 int ret; 295 struct rte_kni_device_info dev_info; 296 struct net_device *net_dev = NULL; 297 struct kni_dev *kni, *dev, *n; 298 299 pr_info("Creating kni...\n"); 300 /* Check the buffer size, to avoid warning */ 301 if (_IOC_SIZE(ioctl_num) > sizeof(dev_info)) 302 return -EINVAL; 303 304 /* Copy kni info from user space */ 305 if (copy_from_user(&dev_info, (void *)ioctl_param, sizeof(dev_info))) 306 return -EFAULT; 307 308 /* Check if name is zero-ended */ 309 if (strnlen(dev_info.name, sizeof(dev_info.name)) == sizeof(dev_info.name)) { 310 pr_err("kni.name not zero-terminated"); 311 return -EINVAL; 312 } 313 314 /** 315 * Check if the cpu core id is valid for binding. 316 */ 317 if (dev_info.force_bind && !cpu_online(dev_info.core_id)) { 318 pr_err("cpu %u is not online\n", dev_info.core_id); 319 return -EINVAL; 320 } 321 322 /* Check if it has been created */ 323 down_read(&knet->kni_list_lock); 324 list_for_each_entry_safe(dev, n, &knet->kni_list_head, list) { 325 if (kni_check_param(dev, &dev_info) < 0) { 326 up_read(&knet->kni_list_lock); 327 return -EINVAL; 328 } 329 } 330 up_read(&knet->kni_list_lock); 331 332 net_dev = alloc_netdev(sizeof(struct kni_dev), dev_info.name, 333 #ifdef NET_NAME_USER 334 NET_NAME_USER, 335 #endif 336 kni_net_init); 337 if (net_dev == NULL) { 338 pr_err("error allocating device \"%s\"\n", dev_info.name); 339 return -EBUSY; 340 } 341 342 dev_net_set(net_dev, net); 343 344 kni = netdev_priv(net_dev); 345 346 kni->net_dev = net_dev; 347 kni->core_id = dev_info.core_id; 348 strncpy(kni->name, dev_info.name, RTE_KNI_NAMESIZE); 349 350 /* Translate user space info into kernel space info */ 351 if (dev_info.iova_mode) { 352 #ifdef HAVE_IOVA_TO_KVA_MAPPING_SUPPORT 353 kni->tx_q = iova_to_kva(current, dev_info.tx_phys); 354 kni->rx_q = iova_to_kva(current, dev_info.rx_phys); 355 kni->alloc_q = iova_to_kva(current, dev_info.alloc_phys); 356 kni->free_q = iova_to_kva(current, dev_info.free_phys); 357 358 kni->req_q = iova_to_kva(current, dev_info.req_phys); 359 kni->resp_q = iova_to_kva(current, dev_info.resp_phys); 360 kni->sync_va = dev_info.sync_va; 361 kni->sync_kva = iova_to_kva(current, dev_info.sync_phys); 362 kni->usr_tsk = current; 363 kni->iova_mode = 1; 364 #else 365 pr_err("KNI module does not support IOVA to VA translation\n"); 366 return -EINVAL; 367 #endif 368 } else { 369 370 kni->tx_q = phys_to_virt(dev_info.tx_phys); 371 kni->rx_q = phys_to_virt(dev_info.rx_phys); 372 kni->alloc_q = phys_to_virt(dev_info.alloc_phys); 373 kni->free_q = phys_to_virt(dev_info.free_phys); 374 375 kni->req_q = phys_to_virt(dev_info.req_phys); 376 kni->resp_q = phys_to_virt(dev_info.resp_phys); 377 kni->sync_va = dev_info.sync_va; 378 kni->sync_kva = phys_to_virt(dev_info.sync_phys); 379 kni->iova_mode = 0; 380 } 381 382 kni->mbuf_size = dev_info.mbuf_size; 383 384 pr_debug("tx_phys: 0x%016llx, tx_q addr: 0x%p\n", 385 (unsigned long long) dev_info.tx_phys, kni->tx_q); 386 pr_debug("rx_phys: 0x%016llx, rx_q addr: 0x%p\n", 387 (unsigned long long) dev_info.rx_phys, kni->rx_q); 388 pr_debug("alloc_phys: 0x%016llx, alloc_q addr: 0x%p\n", 389 (unsigned long long) dev_info.alloc_phys, kni->alloc_q); 390 pr_debug("free_phys: 0x%016llx, free_q addr: 0x%p\n", 391 (unsigned long long) dev_info.free_phys, kni->free_q); 392 pr_debug("req_phys: 0x%016llx, req_q addr: 0x%p\n", 393 (unsigned long long) dev_info.req_phys, kni->req_q); 394 pr_debug("resp_phys: 0x%016llx, resp_q addr: 0x%p\n", 395 (unsigned long long) dev_info.resp_phys, kni->resp_q); 396 pr_debug("mbuf_size: %u\n", kni->mbuf_size); 397 398 /* if user has provided a valid mac address */ 399 if (is_valid_ether_addr(dev_info.mac_addr)) 400 memcpy(net_dev->dev_addr, dev_info.mac_addr, ETH_ALEN); 401 else 402 /* Generate random MAC address. */ 403 eth_random_addr(net_dev->dev_addr); 404 405 if (dev_info.mtu) 406 net_dev->mtu = dev_info.mtu; 407 #ifdef HAVE_MAX_MTU_PARAM 408 net_dev->max_mtu = net_dev->mtu; 409 410 if (dev_info.min_mtu) 411 net_dev->min_mtu = dev_info.min_mtu; 412 413 if (dev_info.max_mtu) 414 net_dev->max_mtu = dev_info.max_mtu; 415 #endif 416 417 ret = register_netdev(net_dev); 418 if (ret) { 419 pr_err("error %i registering device \"%s\"\n", 420 ret, dev_info.name); 421 kni->net_dev = NULL; 422 kni_dev_remove(kni); 423 free_netdev(net_dev); 424 return -ENODEV; 425 } 426 427 netif_carrier_off(net_dev); 428 429 ret = kni_run_thread(knet, kni, dev_info.force_bind); 430 if (ret != 0) 431 return ret; 432 433 down_write(&knet->kni_list_lock); 434 list_add(&kni->list, &knet->kni_list_head); 435 up_write(&knet->kni_list_lock); 436 437 return 0; 438 } 439 440 static int 441 kni_ioctl_release(struct net *net, uint32_t ioctl_num, 442 unsigned long ioctl_param) 443 { 444 struct kni_net *knet = net_generic(net, kni_net_id); 445 int ret = -EINVAL; 446 struct kni_dev *dev, *n; 447 struct rte_kni_device_info dev_info; 448 449 if (_IOC_SIZE(ioctl_num) > sizeof(dev_info)) 450 return -EINVAL; 451 452 if (copy_from_user(&dev_info, (void *)ioctl_param, sizeof(dev_info))) 453 return -EFAULT; 454 455 /* Release the network device according to its name */ 456 if (strlen(dev_info.name) == 0) 457 return -EINVAL; 458 459 down_write(&knet->kni_list_lock); 460 list_for_each_entry_safe(dev, n, &knet->kni_list_head, list) { 461 if (strncmp(dev->name, dev_info.name, RTE_KNI_NAMESIZE) != 0) 462 continue; 463 464 if (multiple_kthread_on && dev->pthread != NULL) { 465 kthread_stop(dev->pthread); 466 dev->pthread = NULL; 467 } 468 469 kni_dev_remove(dev); 470 list_del(&dev->list); 471 ret = 0; 472 break; 473 } 474 up_write(&knet->kni_list_lock); 475 pr_info("%s release kni named %s\n", 476 (ret == 0 ? "Successfully" : "Unsuccessfully"), dev_info.name); 477 478 return ret; 479 } 480 481 static int 482 kni_ioctl(struct inode *inode, uint32_t ioctl_num, unsigned long ioctl_param) 483 { 484 int ret = -EINVAL; 485 struct net *net = current->nsproxy->net_ns; 486 487 pr_debug("IOCTL num=0x%0x param=0x%0lx\n", ioctl_num, ioctl_param); 488 489 /* 490 * Switch according to the ioctl called 491 */ 492 switch (_IOC_NR(ioctl_num)) { 493 case _IOC_NR(RTE_KNI_IOCTL_TEST): 494 /* For test only, not used */ 495 break; 496 case _IOC_NR(RTE_KNI_IOCTL_CREATE): 497 ret = kni_ioctl_create(net, ioctl_num, ioctl_param); 498 break; 499 case _IOC_NR(RTE_KNI_IOCTL_RELEASE): 500 ret = kni_ioctl_release(net, ioctl_num, ioctl_param); 501 break; 502 default: 503 pr_debug("IOCTL default\n"); 504 break; 505 } 506 507 return ret; 508 } 509 510 static int 511 kni_compat_ioctl(struct inode *inode, uint32_t ioctl_num, 512 unsigned long ioctl_param) 513 { 514 /* 32 bits app on 64 bits OS to be supported later */ 515 pr_debug("Not implemented.\n"); 516 517 return -EINVAL; 518 } 519 520 static const struct file_operations kni_fops = { 521 .owner = THIS_MODULE, 522 .open = kni_open, 523 .release = kni_release, 524 .unlocked_ioctl = (void *)kni_ioctl, 525 .compat_ioctl = (void *)kni_compat_ioctl, 526 }; 527 528 static struct miscdevice kni_misc = { 529 .minor = MISC_DYNAMIC_MINOR, 530 .name = KNI_DEVICE, 531 .fops = &kni_fops, 532 }; 533 534 static int __init 535 kni_parse_kthread_mode(void) 536 { 537 if (!kthread_mode) 538 return 0; 539 540 if (strcmp(kthread_mode, "single") == 0) 541 return 0; 542 else if (strcmp(kthread_mode, "multiple") == 0) 543 multiple_kthread_on = 1; 544 else 545 return -1; 546 547 return 0; 548 } 549 550 static int __init 551 kni_parse_carrier_state(void) 552 { 553 if (!carrier) { 554 kni_dflt_carrier = 0; 555 return 0; 556 } 557 558 if (strcmp(carrier, "off") == 0) 559 kni_dflt_carrier = 0; 560 else if (strcmp(carrier, "on") == 0) 561 kni_dflt_carrier = 1; 562 else 563 return -1; 564 565 return 0; 566 } 567 568 static int __init 569 kni_init(void) 570 { 571 int rc; 572 573 if (kni_parse_kthread_mode() < 0) { 574 pr_err("Invalid parameter for kthread_mode\n"); 575 return -EINVAL; 576 } 577 578 if (multiple_kthread_on == 0) 579 pr_debug("Single kernel thread for all KNI devices\n"); 580 else 581 pr_debug("Multiple kernel thread mode enabled\n"); 582 583 if (kni_parse_carrier_state() < 0) { 584 pr_err("Invalid parameter for carrier\n"); 585 return -EINVAL; 586 } 587 588 if (kni_dflt_carrier == 0) 589 pr_debug("Default carrier state set to off.\n"); 590 else 591 pr_debug("Default carrier state set to on.\n"); 592 593 #ifdef HAVE_SIMPLIFIED_PERNET_OPERATIONS 594 rc = register_pernet_subsys(&kni_net_ops); 595 #else 596 rc = register_pernet_gen_subsys(&kni_net_id, &kni_net_ops); 597 #endif 598 if (rc) 599 return -EPERM; 600 601 rc = misc_register(&kni_misc); 602 if (rc != 0) { 603 pr_err("Misc registration failed\n"); 604 goto out; 605 } 606 607 /* Configure the lo mode according to the input parameter */ 608 kni_net_config_lo_mode(lo_mode); 609 610 return 0; 611 612 out: 613 #ifdef HAVE_SIMPLIFIED_PERNET_OPERATIONS 614 unregister_pernet_subsys(&kni_net_ops); 615 #else 616 unregister_pernet_gen_subsys(kni_net_id, &kni_net_ops); 617 #endif 618 return rc; 619 } 620 621 static void __exit 622 kni_exit(void) 623 { 624 misc_deregister(&kni_misc); 625 #ifdef HAVE_SIMPLIFIED_PERNET_OPERATIONS 626 unregister_pernet_subsys(&kni_net_ops); 627 #else 628 unregister_pernet_gen_subsys(kni_net_id, &kni_net_ops); 629 #endif 630 } 631 632 module_init(kni_init); 633 module_exit(kni_exit); 634 635 module_param(lo_mode, charp, 0644); 636 MODULE_PARM_DESC(lo_mode, 637 "KNI loopback mode (default=lo_mode_none):\n" 638 "\t\tlo_mode_none Kernel loopback disabled\n" 639 "\t\tlo_mode_fifo Enable kernel loopback with fifo\n" 640 "\t\tlo_mode_fifo_skb Enable kernel loopback with fifo and skb buffer\n" 641 "\t\t" 642 ); 643 644 module_param(kthread_mode, charp, 0644); 645 MODULE_PARM_DESC(kthread_mode, 646 "Kernel thread mode (default=single):\n" 647 "\t\tsingle Single kernel thread mode enabled.\n" 648 "\t\tmultiple Multiple kernel thread mode enabled.\n" 649 "\t\t" 650 ); 651 652 module_param(carrier, charp, 0644); 653 MODULE_PARM_DESC(carrier, 654 "Default carrier state for KNI interface (default=off):\n" 655 "\t\toff Interfaces will be created with carrier state set to off.\n" 656 "\t\ton Interfaces will be created with carrier state set to on.\n" 657 "\t\t" 658 ); 659