176404edcSAsim Jamshed /* for io_module_func def'ns */
276404edcSAsim Jamshed #include "io_module.h"
376404edcSAsim Jamshed /* for mtcp related def'ns */
476404edcSAsim Jamshed #include "mtcp.h"
576404edcSAsim Jamshed /* for errno */
676404edcSAsim Jamshed #include <errno.h>
7*dcdbbb98SAsim Jamshed /* for close/optind */
8*dcdbbb98SAsim Jamshed #include <unistd.h>
976404edcSAsim Jamshed /* for logging */
1076404edcSAsim Jamshed #include "debug.h"
1176404edcSAsim Jamshed /* for num_devices_* */
1276404edcSAsim Jamshed #include "config.h"
1376404edcSAsim Jamshed /* for rte_max_eth_ports */
1476404edcSAsim Jamshed #include <rte_common.h>
1576404edcSAsim Jamshed /* for rte_eth_rxconf */
1676404edcSAsim Jamshed #include <rte_ethdev.h>
1776404edcSAsim Jamshed /* for delay funcs */
1876404edcSAsim Jamshed #include <rte_cycles.h>
1976404edcSAsim Jamshed /* for ip pesudo-chksum */
2076404edcSAsim Jamshed #include <rte_ip.h>
2176404edcSAsim Jamshed #define ENABLE_STATS_IOCTL		1
2276404edcSAsim Jamshed #ifdef ENABLE_STATS_IOCTL
2376404edcSAsim Jamshed /* for open */
2476404edcSAsim Jamshed #include <fcntl.h>
2576404edcSAsim Jamshed /* for ioctl */
2676404edcSAsim Jamshed #include <sys/ioctl.h>
2776404edcSAsim Jamshed #endif /* !ENABLE_STATS_IOCTL */
2876404edcSAsim Jamshed /*----------------------------------------------------------------------------*/
2976404edcSAsim Jamshed /* Essential macros */
3076404edcSAsim Jamshed #define MAX_RX_QUEUE_PER_LCORE		MAX_CPUS
3176404edcSAsim Jamshed #define MAX_TX_QUEUE_PER_PORT		MAX_CPUS
3276404edcSAsim Jamshed 
3376404edcSAsim Jamshed #define MBUF_SIZE 			(2048 + sizeof(struct rte_mbuf) + RTE_PKTMBUF_HEADROOM)
3476404edcSAsim Jamshed #define NB_MBUF				8192
3576404edcSAsim Jamshed #define MEMPOOL_CACHE_SIZE		256
36a5e1a556SAsim Jamshed //#define RX_IDLE_ENABLE			1
37a5e1a556SAsim Jamshed #define RX_IDLE_TIMEOUT			1	/* in micro-seconds */
38a5e1a556SAsim Jamshed #define RX_IDLE_THRESH			64
3976404edcSAsim Jamshed 
4076404edcSAsim Jamshed /*
4176404edcSAsim Jamshed  * RX and TX Prefetch, Host, and Write-back threshold values should be
4276404edcSAsim Jamshed  * carefully set for optimal performance. Consult the network
4376404edcSAsim Jamshed  * controller's datasheet and supporting DPDK documentation for guidance
4476404edcSAsim Jamshed  * on how these parameters should be set.
4576404edcSAsim Jamshed  */
4676404edcSAsim Jamshed #define RX_PTHRESH 			8 /**< Default values of RX prefetch threshold reg. */
4776404edcSAsim Jamshed #define RX_HTHRESH 			8 /**< Default values of RX host threshold reg. */
4876404edcSAsim Jamshed #define RX_WTHRESH 			4 /**< Default values of RX write-back threshold reg. */
4976404edcSAsim Jamshed 
5076404edcSAsim Jamshed /*
5176404edcSAsim Jamshed  * These default values are optimized for use with the Intel(R) 82599 10 GbE
5276404edcSAsim Jamshed  * Controller and the DPDK ixgbe PMD. Consider using other values for other
5376404edcSAsim Jamshed  * network controllers and/or network drivers.
5476404edcSAsim Jamshed  */
5576404edcSAsim Jamshed #define TX_PTHRESH 			36 /**< Default values of TX prefetch threshold reg. */
5676404edcSAsim Jamshed #define TX_HTHRESH			0  /**< Default values of TX host threshold reg. */
5776404edcSAsim Jamshed #define TX_WTHRESH			0  /**< Default values of TX write-back threshold reg. */
5876404edcSAsim Jamshed 
5976404edcSAsim Jamshed #define MAX_PKT_BURST			/*32*/64/*128*//*32*/
6076404edcSAsim Jamshed 
6176404edcSAsim Jamshed /*
6276404edcSAsim Jamshed  * Configurable number of RX/TX ring descriptors
6376404edcSAsim Jamshed  */
6476404edcSAsim Jamshed #define RTE_TEST_RX_DESC_DEFAULT	128
6576404edcSAsim Jamshed #define RTE_TEST_TX_DESC_DEFAULT	512
6676404edcSAsim Jamshed 
6776404edcSAsim Jamshed static uint16_t nb_rxd = RTE_TEST_RX_DESC_DEFAULT;
6876404edcSAsim Jamshed static uint16_t nb_txd = RTE_TEST_TX_DESC_DEFAULT;
6976404edcSAsim Jamshed /*----------------------------------------------------------------------------*/
7076404edcSAsim Jamshed /* packet memory pools for storing packet bufs */
7176404edcSAsim Jamshed static struct rte_mempool *pktmbuf_pool[MAX_CPUS] = {NULL};
7276404edcSAsim Jamshed static uint8_t cpu_qid_map[RTE_MAX_ETHPORTS][MAX_CPUS] = {{0}};
7376404edcSAsim Jamshed 
7476404edcSAsim Jamshed //#define DEBUG				1
7576404edcSAsim Jamshed #ifdef DEBUG
7676404edcSAsim Jamshed /* ethernet addresses of ports */
7776404edcSAsim Jamshed static struct ether_addr ports_eth_addr[RTE_MAX_ETHPORTS];
7876404edcSAsim Jamshed #endif
7976404edcSAsim Jamshed 
8076404edcSAsim Jamshed static struct rte_eth_conf port_conf = {
8176404edcSAsim Jamshed 	.rxmode = {
8276404edcSAsim Jamshed 		.mq_mode	= 	ETH_MQ_RX_RSS,
8376404edcSAsim Jamshed 		.max_rx_pkt_len = 	ETHER_MAX_LEN,
8476404edcSAsim Jamshed 		.split_hdr_size = 	0,
8576404edcSAsim Jamshed 		.header_split   = 	0, /**< Header Split disabled */
8676404edcSAsim Jamshed 		.hw_ip_checksum = 	1, /**< IP checksum offload enabled */
8776404edcSAsim Jamshed 		.hw_vlan_filter = 	0, /**< VLAN filtering disabled */
8876404edcSAsim Jamshed 		.jumbo_frame    = 	0, /**< Jumbo Frame Support disabled */
8976404edcSAsim Jamshed 		.hw_strip_crc   = 	1, /**< CRC stripped by hardware */
9076404edcSAsim Jamshed 	},
9176404edcSAsim Jamshed 	.rx_adv_conf = {
9276404edcSAsim Jamshed 		.rss_conf = {
9376404edcSAsim Jamshed 			.rss_key = 	NULL,
9476404edcSAsim Jamshed 			.rss_hf = 	ETH_RSS_TCP
9576404edcSAsim Jamshed 		},
9676404edcSAsim Jamshed 	},
9776404edcSAsim Jamshed 	.txmode = {
9876404edcSAsim Jamshed 		.mq_mode = 		ETH_MQ_TX_NONE,
9976404edcSAsim Jamshed 	},
10076404edcSAsim Jamshed };
10176404edcSAsim Jamshed 
10276404edcSAsim Jamshed static const struct rte_eth_rxconf rx_conf = {
10376404edcSAsim Jamshed 	.rx_thresh = {
10476404edcSAsim Jamshed 		.pthresh = 		RX_PTHRESH, /* RX prefetch threshold reg */
10576404edcSAsim Jamshed 		.hthresh = 		RX_HTHRESH, /* RX host threshold reg */
10676404edcSAsim Jamshed 		.wthresh = 		RX_WTHRESH, /* RX write-back threshold reg */
10776404edcSAsim Jamshed 	},
10876404edcSAsim Jamshed 	.rx_free_thresh = 		32,
10976404edcSAsim Jamshed };
11076404edcSAsim Jamshed 
11176404edcSAsim Jamshed static const struct rte_eth_txconf tx_conf = {
11276404edcSAsim Jamshed 	.tx_thresh = {
11376404edcSAsim Jamshed 		.pthresh = 		TX_PTHRESH, /* TX prefetch threshold reg */
11476404edcSAsim Jamshed 		.hthresh = 		TX_HTHRESH, /* TX host threshold reg */
11576404edcSAsim Jamshed 		.wthresh = 		TX_WTHRESH, /* TX write-back threshold reg */
11676404edcSAsim Jamshed 	},
11776404edcSAsim Jamshed 	.tx_free_thresh = 		0, /* Use PMD default values */
11876404edcSAsim Jamshed 	.tx_rs_thresh = 		0, /* Use PMD default values */
11976404edcSAsim Jamshed 	/*
12076404edcSAsim Jamshed 	 * As the example won't handle mult-segments and offload cases,
12176404edcSAsim Jamshed 	 * set the flag by default.
12276404edcSAsim Jamshed 	 */
12376404edcSAsim Jamshed 	.txq_flags = 			0x0,
12476404edcSAsim Jamshed };
12576404edcSAsim Jamshed 
12676404edcSAsim Jamshed struct mbuf_table {
12776404edcSAsim Jamshed 	unsigned len; /* length of queued packets */
12876404edcSAsim Jamshed 	struct rte_mbuf *m_table[MAX_PKT_BURST];
12976404edcSAsim Jamshed };
13076404edcSAsim Jamshed 
13176404edcSAsim Jamshed struct dpdk_private_context {
13276404edcSAsim Jamshed 	struct mbuf_table rmbufs[RTE_MAX_ETHPORTS];
13376404edcSAsim Jamshed 	struct mbuf_table wmbufs[RTE_MAX_ETHPORTS];
13476404edcSAsim Jamshed 	struct rte_mempool *pktmbuf_pool;
13576404edcSAsim Jamshed 	struct rte_mbuf *pkts_burst[MAX_PKT_BURST];
136a5e1a556SAsim Jamshed #ifdef RX_IDLE_ENABLE
137a5e1a556SAsim Jamshed 	uint8_t rx_idle;
138a5e1a556SAsim Jamshed #endif
13976404edcSAsim Jamshed #ifdef ENABLE_STATS_IOCTL
14076404edcSAsim Jamshed 	int fd;
14176404edcSAsim Jamshed #endif /* !ENABLE_STATS_IOCTL */
14276404edcSAsim Jamshed } __rte_cache_aligned;
14376404edcSAsim Jamshed 
14476404edcSAsim Jamshed #ifdef ENABLE_STATS_IOCTL
14576404edcSAsim Jamshed /**
14676404edcSAsim Jamshed  * stats struct passed on from user space to the driver
14776404edcSAsim Jamshed  */
14876404edcSAsim Jamshed struct stats_struct {
14976404edcSAsim Jamshed 	uint64_t tx_bytes;
15076404edcSAsim Jamshed 	uint64_t tx_pkts;
15176404edcSAsim Jamshed 	uint64_t rx_bytes;
15276404edcSAsim Jamshed 	uint64_t rx_pkts;
15376404edcSAsim Jamshed 	uint8_t qid;
15476404edcSAsim Jamshed 	uint8_t dev;
15576404edcSAsim Jamshed };
15676404edcSAsim Jamshed #endif /* !ENABLE_STATS_IOCTL */
15776404edcSAsim Jamshed /*----------------------------------------------------------------------------*/
15876404edcSAsim Jamshed void
15976404edcSAsim Jamshed dpdk_init_handle(struct mtcp_thread_context *ctxt)
16076404edcSAsim Jamshed {
16176404edcSAsim Jamshed 	struct dpdk_private_context *dpc;
16276404edcSAsim Jamshed 	int i, j;
16376404edcSAsim Jamshed 	char mempool_name[20];
16476404edcSAsim Jamshed 
16576404edcSAsim Jamshed 	/* create and initialize private I/O module context */
16676404edcSAsim Jamshed 	ctxt->io_private_context = calloc(1, sizeof(struct dpdk_private_context));
16776404edcSAsim Jamshed 	if (ctxt->io_private_context == NULL) {
16876404edcSAsim Jamshed 		TRACE_ERROR("Failed to initialize ctxt->io_private_context: "
16976404edcSAsim Jamshed 			    "Can't allocate memory\n");
17076404edcSAsim Jamshed 		exit(EXIT_FAILURE);
17176404edcSAsim Jamshed 	}
17276404edcSAsim Jamshed 
17376404edcSAsim Jamshed 	sprintf(mempool_name, "mbuf_pool-%d", ctxt->cpu);
17476404edcSAsim Jamshed 	dpc = (struct dpdk_private_context *)ctxt->io_private_context;
17576404edcSAsim Jamshed 	dpc->pktmbuf_pool = pktmbuf_pool[ctxt->cpu];
17676404edcSAsim Jamshed 
17776404edcSAsim Jamshed 	/* set wmbufs correctly */
17876404edcSAsim Jamshed 	for (j = 0; j < g_config.mos->netdev_table->num; j++) {
17976404edcSAsim Jamshed 		/* Allocate wmbufs for each registered port */
18076404edcSAsim Jamshed 		for (i = 0; i < MAX_PKT_BURST; i++) {
18176404edcSAsim Jamshed 			dpc->wmbufs[j].m_table[i] = rte_pktmbuf_alloc(pktmbuf_pool[ctxt->cpu]);
18276404edcSAsim Jamshed 			if (dpc->wmbufs[j].m_table[i] == NULL) {
18376404edcSAsim Jamshed 				TRACE_ERROR("Failed to allocate %d:wmbuf[%d] on device %d!\n",
18476404edcSAsim Jamshed 					    ctxt->cpu, i, j);
18576404edcSAsim Jamshed 				exit(EXIT_FAILURE);
18676404edcSAsim Jamshed 			}
18776404edcSAsim Jamshed 		}
18876404edcSAsim Jamshed 		/* set mbufs queue length to 0 to begin with */
18976404edcSAsim Jamshed 		dpc->wmbufs[j].len = 0;
19076404edcSAsim Jamshed 	}
19176404edcSAsim Jamshed 
19276404edcSAsim Jamshed #ifdef ENABLE_STATS_IOCTL
19376404edcSAsim Jamshed 	dpc->fd = open("/dev/dpdk-iface", O_RDWR);
19476404edcSAsim Jamshed 	if (dpc->fd == -1) {
195c789f6daSAsim Jamshed 		TRACE_ERROR("Can't open /dev/dpdk-iface for context->cpu: %d! "
196c789f6daSAsim Jamshed 			    "Are you using mlx4/mlx5 driver?\n",
19776404edcSAsim Jamshed 			    ctxt->cpu);
19876404edcSAsim Jamshed 	}
19976404edcSAsim Jamshed #endif /* !ENABLE_STATS_IOCTL */
20076404edcSAsim Jamshed }
20176404edcSAsim Jamshed /*----------------------------------------------------------------------------*/
20276404edcSAsim Jamshed int
20376404edcSAsim Jamshed dpdk_send_pkts(struct mtcp_thread_context *ctxt, int nif)
20476404edcSAsim Jamshed {
20576404edcSAsim Jamshed 	struct dpdk_private_context *dpc;
20676404edcSAsim Jamshed 	mtcp_manager_t mtcp;
20776404edcSAsim Jamshed 	int ret;
20876404edcSAsim Jamshed 	int qid;
20976404edcSAsim Jamshed 
21076404edcSAsim Jamshed 	dpc = (struct dpdk_private_context *)ctxt->io_private_context;
21176404edcSAsim Jamshed 	mtcp = ctxt->mtcp_manager;
21276404edcSAsim Jamshed 	ret = 0;
21376404edcSAsim Jamshed 	qid = cpu_qid_map[nif][ctxt->cpu];
21476404edcSAsim Jamshed 
21576404edcSAsim Jamshed 	/* if queue is unassigned, skip it.. */
21676404edcSAsim Jamshed 	if (unlikely(qid == 0xFF))
21776404edcSAsim Jamshed 		return 0;
21876404edcSAsim Jamshed 
21976404edcSAsim Jamshed 	/* if there are packets in the queue... flush them out to the wire */
22076404edcSAsim Jamshed 	if (dpc->wmbufs[nif].len >/*= MAX_PKT_BURST*/ 0) {
22176404edcSAsim Jamshed 		struct rte_mbuf **pkts;
22276404edcSAsim Jamshed #ifdef ENABLE_STATS_IOCTL
22376404edcSAsim Jamshed 		struct stats_struct ss;
22476404edcSAsim Jamshed #endif /* !ENABLE_STATS_IOCTL */
22576404edcSAsim Jamshed 		int cnt = dpc->wmbufs[nif].len;
22676404edcSAsim Jamshed 		pkts = dpc->wmbufs[nif].m_table;
22776404edcSAsim Jamshed #ifdef NETSTAT
22876404edcSAsim Jamshed 		mtcp->nstat.tx_packets[nif] += cnt;
22976404edcSAsim Jamshed #ifdef ENABLE_STATS_IOCTL
230c789f6daSAsim Jamshed 		if (likely(dpc->fd) >= 0) {
23176404edcSAsim Jamshed 			ss.tx_pkts = mtcp->nstat.tx_packets[nif];
23276404edcSAsim Jamshed 			ss.tx_bytes = mtcp->nstat.tx_bytes[nif];
23376404edcSAsim Jamshed 			ss.rx_pkts = mtcp->nstat.rx_packets[nif];
23476404edcSAsim Jamshed 			ss.rx_bytes = mtcp->nstat.rx_bytes[nif];
23576404edcSAsim Jamshed 			ss.qid = ctxt->cpu;
23676404edcSAsim Jamshed 			ss.dev = nif;
23776404edcSAsim Jamshed 			ioctl(dpc->fd, 0, &ss);
238c789f6daSAsim Jamshed 		}
23976404edcSAsim Jamshed #endif /* !ENABLE_STATS_IOCTL */
24076404edcSAsim Jamshed #endif
24176404edcSAsim Jamshed 		do {
24276404edcSAsim Jamshed 			/* tx cnt # of packets */
24376404edcSAsim Jamshed 			ret = rte_eth_tx_burst(nif, qid,
24476404edcSAsim Jamshed 					       pkts, cnt);
24576404edcSAsim Jamshed 			pkts += ret;
24676404edcSAsim Jamshed 			cnt -= ret;
24776404edcSAsim Jamshed 			/* if not all pkts were sent... then repeat the cycle */
24876404edcSAsim Jamshed 		} while (cnt > 0);
24976404edcSAsim Jamshed 
25076404edcSAsim Jamshed #ifndef SHARE_IO_BUFFER
25176404edcSAsim Jamshed 		int i;
25276404edcSAsim Jamshed 		/* time to allocate fresh mbufs for the queue */
25376404edcSAsim Jamshed 		for (i = 0; i < dpc->wmbufs[nif].len; i++) {
25476404edcSAsim Jamshed 			dpc->wmbufs[nif].m_table[i] = rte_pktmbuf_alloc(pktmbuf_pool[ctxt->cpu]);
25576404edcSAsim Jamshed 			/* error checking */
25676404edcSAsim Jamshed 			if (unlikely(dpc->wmbufs[nif].m_table[i] == NULL)) {
25776404edcSAsim Jamshed 				TRACE_ERROR("Failed to allocate %d:wmbuf[%d] on device %d!\n",
25876404edcSAsim Jamshed 					    ctxt->cpu, i, nif);
25976404edcSAsim Jamshed 				exit(EXIT_FAILURE);
26076404edcSAsim Jamshed 			}
26176404edcSAsim Jamshed 		}
26276404edcSAsim Jamshed #endif
26376404edcSAsim Jamshed 		/* reset the len of mbufs var after flushing of packets */
26476404edcSAsim Jamshed 		dpc->wmbufs[nif].len = 0;
26576404edcSAsim Jamshed 	}
26676404edcSAsim Jamshed 
26776404edcSAsim Jamshed 	return ret;
26876404edcSAsim Jamshed }
26976404edcSAsim Jamshed /*----------------------------------------------------------------------------*/
27076404edcSAsim Jamshed uint8_t *
27176404edcSAsim Jamshed dpdk_get_wptr(struct mtcp_thread_context *ctxt, int nif, uint16_t pktsize)
27276404edcSAsim Jamshed {
27376404edcSAsim Jamshed 	struct dpdk_private_context *dpc;
27476404edcSAsim Jamshed 	mtcp_manager_t mtcp;
27576404edcSAsim Jamshed 	struct rte_mbuf *m;
27676404edcSAsim Jamshed 	uint8_t *ptr;
27776404edcSAsim Jamshed 	int len_of_mbuf;
27876404edcSAsim Jamshed 
27976404edcSAsim Jamshed 	dpc = (struct dpdk_private_context *) ctxt->io_private_context;
28076404edcSAsim Jamshed 	mtcp = ctxt->mtcp_manager;
28176404edcSAsim Jamshed 
28276404edcSAsim Jamshed 	/* sanity check */
28376404edcSAsim Jamshed 	if (unlikely(dpc->wmbufs[nif].len == MAX_PKT_BURST))
28476404edcSAsim Jamshed 		return NULL;
28576404edcSAsim Jamshed 
28676404edcSAsim Jamshed 	len_of_mbuf = dpc->wmbufs[nif].len;
28776404edcSAsim Jamshed 	m = dpc->wmbufs[nif].m_table[len_of_mbuf];
28876404edcSAsim Jamshed 
28976404edcSAsim Jamshed 	/* retrieve the right write offset */
29076404edcSAsim Jamshed 	ptr = (void *)rte_pktmbuf_mtod(m, struct ether_hdr *);
29176404edcSAsim Jamshed 	m->pkt_len = m->data_len = pktsize;
29276404edcSAsim Jamshed 	m->nb_segs = 1;
29376404edcSAsim Jamshed 	m->next = NULL;
29476404edcSAsim Jamshed 
29576404edcSAsim Jamshed #ifdef NETSTAT
296a834ea89SAsim Jamshed 	mtcp->nstat.tx_bytes[nif] += pktsize + ETHER_OVR;
29776404edcSAsim Jamshed #endif
29876404edcSAsim Jamshed 
29976404edcSAsim Jamshed 	/* increment the len_of_mbuf var */
30076404edcSAsim Jamshed 	dpc->wmbufs[nif].len = len_of_mbuf + 1;
30176404edcSAsim Jamshed 
30276404edcSAsim Jamshed 	return (uint8_t *)ptr;
30376404edcSAsim Jamshed }
30476404edcSAsim Jamshed /*----------------------------------------------------------------------------*/
30576404edcSAsim Jamshed void
30676404edcSAsim Jamshed dpdk_set_wptr(struct mtcp_thread_context *ctxt, int out_nif, int in_nif, int index)
30776404edcSAsim Jamshed {
30876404edcSAsim Jamshed 	struct dpdk_private_context *dpc;
30976404edcSAsim Jamshed 	mtcp_manager_t mtcp;
31076404edcSAsim Jamshed 	int len_of_mbuf;
31176404edcSAsim Jamshed 
31276404edcSAsim Jamshed 	dpc = (struct dpdk_private_context *) ctxt->io_private_context;
31376404edcSAsim Jamshed 	mtcp = ctxt->mtcp_manager;
31476404edcSAsim Jamshed 
31576404edcSAsim Jamshed 	/* sanity check */
31676404edcSAsim Jamshed 	if (unlikely(dpc->wmbufs[out_nif].len == MAX_PKT_BURST))
31776404edcSAsim Jamshed 		return;
31876404edcSAsim Jamshed 
31976404edcSAsim Jamshed 	len_of_mbuf = dpc->wmbufs[out_nif].len;
32076404edcSAsim Jamshed 	dpc->wmbufs[out_nif].m_table[len_of_mbuf] =
32176404edcSAsim Jamshed 		dpc->rmbufs[in_nif].m_table[index];
32276404edcSAsim Jamshed 
32376404edcSAsim Jamshed 	dpc->wmbufs[out_nif].m_table[len_of_mbuf]->udata64 = 0;
32476404edcSAsim Jamshed 
32576404edcSAsim Jamshed #ifdef NETSTAT
326a834ea89SAsim Jamshed 	mtcp->nstat.tx_bytes[out_nif] += dpc->rmbufs[in_nif].m_table[index]->pkt_len + ETHER_OVR;
32776404edcSAsim Jamshed #endif
32876404edcSAsim Jamshed 
32976404edcSAsim Jamshed 	/* increment the len_of_mbuf var */
33076404edcSAsim Jamshed 	dpc->wmbufs[out_nif].len = len_of_mbuf + 1;
33176404edcSAsim Jamshed 
33276404edcSAsim Jamshed 	return;
33376404edcSAsim Jamshed }
33476404edcSAsim Jamshed /*----------------------------------------------------------------------------*/
33576404edcSAsim Jamshed static inline void
33676404edcSAsim Jamshed free_pkts(struct rte_mbuf **mtable, unsigned len)
33776404edcSAsim Jamshed {
33876404edcSAsim Jamshed 	int i;
33976404edcSAsim Jamshed 
34076404edcSAsim Jamshed 	/* free the freaking packets */
34176404edcSAsim Jamshed 	for (i = 0; i < len; i++) {
34276404edcSAsim Jamshed 		if (mtable[i]->udata64 == 1) {
34376404edcSAsim Jamshed 			rte_pktmbuf_free_seg(mtable[i]);
34476404edcSAsim Jamshed 			RTE_MBUF_PREFETCH_TO_FREE(mtable[i+1]);
34576404edcSAsim Jamshed 		}
34676404edcSAsim Jamshed 	}
34776404edcSAsim Jamshed }
34876404edcSAsim Jamshed /*----------------------------------------------------------------------------*/
34976404edcSAsim Jamshed int32_t
35076404edcSAsim Jamshed dpdk_recv_pkts(struct mtcp_thread_context *ctxt, int ifidx)
35176404edcSAsim Jamshed {
35276404edcSAsim Jamshed 	struct dpdk_private_context *dpc;
35376404edcSAsim Jamshed 	int ret;
35476404edcSAsim Jamshed 	uint8_t qid;
35576404edcSAsim Jamshed 
35676404edcSAsim Jamshed 	dpc = (struct dpdk_private_context *) ctxt->io_private_context;
35776404edcSAsim Jamshed 	qid = cpu_qid_map[ifidx][ctxt->cpu];
35876404edcSAsim Jamshed 
35976404edcSAsim Jamshed 	/* if queue is unassigned, skip it.. */
36076404edcSAsim Jamshed 	if (qid == 0xFF)
36176404edcSAsim Jamshed 		return 0;
36276404edcSAsim Jamshed 
36376404edcSAsim Jamshed 	if (dpc->rmbufs[ifidx].len != 0) {
36476404edcSAsim Jamshed 		free_pkts(dpc->rmbufs[ifidx].m_table, dpc->rmbufs[ifidx].len);
36576404edcSAsim Jamshed 		dpc->rmbufs[ifidx].len = 0;
36676404edcSAsim Jamshed 	}
36776404edcSAsim Jamshed 
36876404edcSAsim Jamshed 	ret = rte_eth_rx_burst((uint8_t)ifidx, qid,
36976404edcSAsim Jamshed 			       dpc->pkts_burst, MAX_PKT_BURST);
370a5e1a556SAsim Jamshed #ifdef RX_IDLE_ENABLE
371a5e1a556SAsim Jamshed 	dpc->rx_idle = (likely(ret != 0)) ? 0 : dpc->rx_idle + 1;
372a5e1a556SAsim Jamshed #endif
37376404edcSAsim Jamshed 	dpc->rmbufs[ifidx].len = ret;
37476404edcSAsim Jamshed 
37576404edcSAsim Jamshed 	return ret;
37676404edcSAsim Jamshed }
37776404edcSAsim Jamshed /*----------------------------------------------------------------------------*/
37876404edcSAsim Jamshed uint8_t *
37976404edcSAsim Jamshed dpdk_get_rptr(struct mtcp_thread_context *ctxt, int ifidx, int index, uint16_t *len)
38076404edcSAsim Jamshed {
38176404edcSAsim Jamshed 	struct dpdk_private_context *dpc;
38276404edcSAsim Jamshed 	struct rte_mbuf *m;
38376404edcSAsim Jamshed 	uint8_t *pktbuf;
38476404edcSAsim Jamshed 
38576404edcSAsim Jamshed 	dpc = (struct dpdk_private_context *) ctxt->io_private_context;
38676404edcSAsim Jamshed 
38776404edcSAsim Jamshed 
38876404edcSAsim Jamshed 	m = dpc->pkts_burst[index];
38976404edcSAsim Jamshed 	/* tag to check if the packet is a local or a forwarded pkt */
39076404edcSAsim Jamshed 	m->udata64 = 1;
39176404edcSAsim Jamshed 	/* don't enable pre-fetching... performance goes down */
39276404edcSAsim Jamshed 	//rte_prefetch0(rte_pktmbuf_mtod(m, void *));
39376404edcSAsim Jamshed 	*len = m->pkt_len;
39476404edcSAsim Jamshed 	pktbuf = rte_pktmbuf_mtod(m, uint8_t *);
39576404edcSAsim Jamshed 
39676404edcSAsim Jamshed 	/* enqueue the pkt ptr in mbuf */
39776404edcSAsim Jamshed 	dpc->rmbufs[ifidx].m_table[index] = m;
39876404edcSAsim Jamshed 
39976404edcSAsim Jamshed 	return pktbuf;
40076404edcSAsim Jamshed }
40176404edcSAsim Jamshed /*----------------------------------------------------------------------------*/
40276404edcSAsim Jamshed int
40376404edcSAsim Jamshed dpdk_get_nif(struct ifreq *ifr)
40476404edcSAsim Jamshed {
40576404edcSAsim Jamshed 	int i;
40676404edcSAsim Jamshed 	static int num_dev = -1;
40776404edcSAsim Jamshed 	static struct ether_addr ports_eth_addr[RTE_MAX_ETHPORTS];
40876404edcSAsim Jamshed 	/* get mac addr entries of 'detected' dpdk ports */
40976404edcSAsim Jamshed 	if (num_dev < 0) {
41076404edcSAsim Jamshed 		num_dev = rte_eth_dev_count();
41176404edcSAsim Jamshed 		for (i = 0; i < num_dev; i++)
41276404edcSAsim Jamshed 			rte_eth_macaddr_get(i, &ports_eth_addr[i]);
41376404edcSAsim Jamshed 	}
41476404edcSAsim Jamshed 
41576404edcSAsim Jamshed 	for (i = 0; i < num_dev; i++)
41676404edcSAsim Jamshed 		if (!memcmp(&ifr->ifr_addr.sa_data[0], &ports_eth_addr[i], ETH_ALEN))
41776404edcSAsim Jamshed 			return i;
41876404edcSAsim Jamshed 
41976404edcSAsim Jamshed 	return -1;
42076404edcSAsim Jamshed }
42176404edcSAsim Jamshed /*----------------------------------------------------------------------------*/
422a5e1a556SAsim Jamshed int32_t
423a5e1a556SAsim Jamshed dpdk_select(struct mtcp_thread_context *ctxt)
424a5e1a556SAsim Jamshed {
425a5e1a556SAsim Jamshed #ifdef RX_IDLE_ENABLE
426a5e1a556SAsim Jamshed 	struct dpdk_private_context *dpc;
427a5e1a556SAsim Jamshed 
428a5e1a556SAsim Jamshed 	dpc = (struct dpdk_private_context *) ctxt->io_private_context;
429a5e1a556SAsim Jamshed 	if (dpc->rx_idle > RX_IDLE_THRESH) {
430a5e1a556SAsim Jamshed 		dpc->rx_idle = 0;
431a5e1a556SAsim Jamshed 		usleep(RX_IDLE_TIMEOUT);
432a5e1a556SAsim Jamshed 	}
433a5e1a556SAsim Jamshed #endif
434a5e1a556SAsim Jamshed 	return 0;
435a5e1a556SAsim Jamshed }
436a5e1a556SAsim Jamshed /*----------------------------------------------------------------------------*/
43776404edcSAsim Jamshed void
43876404edcSAsim Jamshed dpdk_destroy_handle(struct mtcp_thread_context *ctxt)
43976404edcSAsim Jamshed {
44076404edcSAsim Jamshed 	struct dpdk_private_context *dpc;
44176404edcSAsim Jamshed 	int i;
44276404edcSAsim Jamshed 
44376404edcSAsim Jamshed 	dpc = (struct dpdk_private_context *) ctxt->io_private_context;
44476404edcSAsim Jamshed 
44576404edcSAsim Jamshed 	/* free wmbufs */
44676404edcSAsim Jamshed 	for (i = 0; i < g_config.mos->netdev_table->num; i++)
44776404edcSAsim Jamshed 		free_pkts(dpc->wmbufs[i].m_table, MAX_PKT_BURST);
44876404edcSAsim Jamshed 
44976404edcSAsim Jamshed #ifdef ENABLE_STATS_IOCTL
45076404edcSAsim Jamshed 	/* free fd */
451c789f6daSAsim Jamshed 	if (dpc->fd >= 0)
45276404edcSAsim Jamshed 		close(dpc->fd);
45376404edcSAsim Jamshed #endif /* !ENABLE_STATS_IOCTL */
45476404edcSAsim Jamshed 
45576404edcSAsim Jamshed 	/* free it all up */
45676404edcSAsim Jamshed 	free(dpc);
45776404edcSAsim Jamshed }
45876404edcSAsim Jamshed /*----------------------------------------------------------------------------*/
45976404edcSAsim Jamshed static void
46076404edcSAsim Jamshed check_all_ports_link_status(uint8_t port_num, uint32_t port_mask)
46176404edcSAsim Jamshed {
46276404edcSAsim Jamshed #define CHECK_INTERVAL 			100 /* 100ms */
46376404edcSAsim Jamshed #define MAX_CHECK_TIME 			90 /* 9s (90 * 100ms) in total */
46476404edcSAsim Jamshed 
46576404edcSAsim Jamshed 	uint8_t portid, count, all_ports_up, print_flag = 0;
46676404edcSAsim Jamshed 	struct rte_eth_link link;
46776404edcSAsim Jamshed 
46876404edcSAsim Jamshed 	printf("\nChecking link status");
46976404edcSAsim Jamshed 	fflush(stdout);
47076404edcSAsim Jamshed 	for (count = 0; count <= MAX_CHECK_TIME; count++) {
47176404edcSAsim Jamshed 		all_ports_up = 1;
47276404edcSAsim Jamshed 		for (portid = 0; portid < port_num; portid++) {
47376404edcSAsim Jamshed 			if ((port_mask & (1 << portid)) == 0)
47476404edcSAsim Jamshed 				continue;
47576404edcSAsim Jamshed 			memset(&link, 0, sizeof(link));
47676404edcSAsim Jamshed 			rte_eth_link_get_nowait(portid, &link);
47776404edcSAsim Jamshed 			/* print link status if flag set */
47876404edcSAsim Jamshed 			if (print_flag == 1) {
47976404edcSAsim Jamshed 				if (link.link_status)
48076404edcSAsim Jamshed 					printf("Port %d Link Up - speed %u "
48176404edcSAsim Jamshed 						"Mbps - %s\n", (uint8_t)portid,
48276404edcSAsim Jamshed 						(unsigned)link.link_speed,
48376404edcSAsim Jamshed 				(link.link_duplex == ETH_LINK_FULL_DUPLEX) ?
48476404edcSAsim Jamshed 					("full-duplex") : ("half-duplex\n"));
48576404edcSAsim Jamshed 				else
48676404edcSAsim Jamshed 					printf("Port %d Link Down\n",
48776404edcSAsim Jamshed 						(uint8_t)portid);
48876404edcSAsim Jamshed 				continue;
48976404edcSAsim Jamshed 			}
49076404edcSAsim Jamshed 			/* clear all_ports_up flag if any link down */
49176404edcSAsim Jamshed 			if (link.link_status == 0) {
49276404edcSAsim Jamshed 				all_ports_up = 0;
49376404edcSAsim Jamshed 				break;
49476404edcSAsim Jamshed 			}
49576404edcSAsim Jamshed 		}
49676404edcSAsim Jamshed 		/* after finally printing all link status, get out */
49776404edcSAsim Jamshed 		if (print_flag == 1)
49876404edcSAsim Jamshed 			break;
49976404edcSAsim Jamshed 
50076404edcSAsim Jamshed 		if (all_ports_up == 0) {
50176404edcSAsim Jamshed 			printf(".");
50276404edcSAsim Jamshed 			fflush(stdout);
50376404edcSAsim Jamshed 			rte_delay_ms(CHECK_INTERVAL);
50476404edcSAsim Jamshed 		}
50576404edcSAsim Jamshed 
50676404edcSAsim Jamshed 		/* set the print_flag if all ports up or timeout */
50776404edcSAsim Jamshed 		if (all_ports_up == 1 || count == (MAX_CHECK_TIME - 1)) {
50876404edcSAsim Jamshed 			print_flag = 1;
50976404edcSAsim Jamshed 			printf("done\n");
51076404edcSAsim Jamshed 		}
51176404edcSAsim Jamshed 	}
51276404edcSAsim Jamshed }
51376404edcSAsim Jamshed /*----------------------------------------------------------------------------*/
51476404edcSAsim Jamshed int32_t
51576404edcSAsim Jamshed dpdk_dev_ioctl(struct mtcp_thread_context *ctx, int nif, int cmd, void *argp)
51676404edcSAsim Jamshed {
51776404edcSAsim Jamshed 	struct dpdk_private_context *dpc;
51876404edcSAsim Jamshed 	struct rte_mbuf *m;
51976404edcSAsim Jamshed 	int len_of_mbuf;
52076404edcSAsim Jamshed 	struct iphdr *iph;
52176404edcSAsim Jamshed 	struct tcphdr *tcph;
52276404edcSAsim Jamshed 	RssInfo *rss_i;
52376404edcSAsim Jamshed 
52476404edcSAsim Jamshed 	iph = (struct iphdr *)argp;
52576404edcSAsim Jamshed 	dpc = (struct dpdk_private_context *)ctx->io_private_context;
52676404edcSAsim Jamshed 	len_of_mbuf = dpc->wmbufs[nif].len;
52776404edcSAsim Jamshed 	rss_i = NULL;
52876404edcSAsim Jamshed 
52976404edcSAsim Jamshed 	switch (cmd) {
53076404edcSAsim Jamshed 	case PKT_TX_IP_CSUM:
53176404edcSAsim Jamshed 		m = dpc->wmbufs[nif].m_table[len_of_mbuf - 1];
532522d5c66SAsim Jamshed 		m->ol_flags = PKT_TX_IP_CKSUM | PKT_TX_IPV4;
53376404edcSAsim Jamshed 		m->l2_len = sizeof(struct ether_hdr);
53476404edcSAsim Jamshed 		m->l3_len = (iph->ihl<<2);
53576404edcSAsim Jamshed 		break;
53676404edcSAsim Jamshed 	case PKT_TX_TCP_CSUM:
53776404edcSAsim Jamshed 		m = dpc->wmbufs[nif].m_table[len_of_mbuf - 1];
53876404edcSAsim Jamshed 		tcph = (struct tcphdr *)((unsigned char *)iph + (iph->ihl<<2));
53976404edcSAsim Jamshed 		m->ol_flags |= PKT_TX_TCP_CKSUM;
54076404edcSAsim Jamshed 		tcph->check = rte_ipv4_phdr_cksum((struct ipv4_hdr *)iph, m->ol_flags);
54176404edcSAsim Jamshed 		break;
54276404edcSAsim Jamshed 	case PKT_RX_RSS:
54376404edcSAsim Jamshed 		rss_i = (RssInfo *)argp;
54476404edcSAsim Jamshed 		m = dpc->pkts_burst[rss_i->pktidx];
54576404edcSAsim Jamshed 		rss_i->hash_value = m->hash.rss;
54676404edcSAsim Jamshed 		break;
54776404edcSAsim Jamshed 	default:
54876404edcSAsim Jamshed 		goto dev_ioctl_err;
54976404edcSAsim Jamshed 	}
55076404edcSAsim Jamshed 
55176404edcSAsim Jamshed 	return 0;
55276404edcSAsim Jamshed  dev_ioctl_err:
55376404edcSAsim Jamshed 	return -1;
55476404edcSAsim Jamshed }
55576404edcSAsim Jamshed /*----------------------------------------------------------------------------*/
55676404edcSAsim Jamshed void
55776404edcSAsim Jamshed dpdk_load_module_upper_half(void)
55876404edcSAsim Jamshed {
55976404edcSAsim Jamshed 	int cpu = g_config.mos->num_cores, ret;
56076404edcSAsim Jamshed 	uint32_t cpumask = 0;
56176404edcSAsim Jamshed 	char cpumaskbuf[10];
56276404edcSAsim Jamshed 	char mem_channels[5];
56376404edcSAsim Jamshed 
56476404edcSAsim Jamshed 	/* set the log level */
56576404edcSAsim Jamshed 	rte_set_log_type(RTE_LOGTYPE_PMD, 0);
56676404edcSAsim Jamshed 	rte_set_log_type(RTE_LOGTYPE_MALLOC, 0);
56776404edcSAsim Jamshed 	rte_set_log_type(RTE_LOGTYPE_MEMPOOL, 0);
56876404edcSAsim Jamshed 	rte_set_log_type(RTE_LOGTYPE_RING, 0);
56976404edcSAsim Jamshed 	rte_set_log_level(RTE_LOG_WARNING);
57076404edcSAsim Jamshed 
57176404edcSAsim Jamshed 	/* get the cpu mask */
57276404edcSAsim Jamshed 	for (ret = 0; ret < cpu; ret++)
57376404edcSAsim Jamshed 		cpumask = (cpumask | (1 << ret));
57476404edcSAsim Jamshed 	sprintf(cpumaskbuf, "%X", cpumask);
57576404edcSAsim Jamshed 
57676404edcSAsim Jamshed 	/* get the mem channels per socket */
57776404edcSAsim Jamshed 	if (g_config.mos->nb_mem_channels == 0) {
57876404edcSAsim Jamshed 		TRACE_ERROR("DPDK module requires # of memory channels "
57976404edcSAsim Jamshed 				"per socket parameter!\n");
58076404edcSAsim Jamshed 		exit(EXIT_FAILURE);
58176404edcSAsim Jamshed 	}
58276404edcSAsim Jamshed 	sprintf(mem_channels, "%d", g_config.mos->nb_mem_channels);
58376404edcSAsim Jamshed 
58476404edcSAsim Jamshed 	/* initialize the rte env first, what a waste of implementation effort!  */
58576404edcSAsim Jamshed 	char *argv[] = {"",
58676404edcSAsim Jamshed 			"-c",
58776404edcSAsim Jamshed 			cpumaskbuf,
58876404edcSAsim Jamshed 			"-n",
58976404edcSAsim Jamshed 			mem_channels,
59076404edcSAsim Jamshed 			"--proc-type=auto",
59176404edcSAsim Jamshed 			""
59276404edcSAsim Jamshed 	};
59376404edcSAsim Jamshed 	const int argc = 6;
59476404edcSAsim Jamshed 
59576404edcSAsim Jamshed 	/*
59676404edcSAsim Jamshed 	 * re-set getopt extern variable optind.
59776404edcSAsim Jamshed 	 * this issue was a bitch to debug
59876404edcSAsim Jamshed 	 * rte_eal_init() internally uses getopt() syscall
59976404edcSAsim Jamshed 	 * mtcp applications that also use an `external' getopt
60076404edcSAsim Jamshed 	 * will cause a violent crash if optind is not reset to zero
60176404edcSAsim Jamshed 	 * prior to calling the func below...
60276404edcSAsim Jamshed 	 * see man getopt(3) for more details
60376404edcSAsim Jamshed 	 */
60476404edcSAsim Jamshed 	optind = 0;
60576404edcSAsim Jamshed 
60676404edcSAsim Jamshed 	/* initialize the dpdk eal env */
60776404edcSAsim Jamshed 	ret = rte_eal_init(argc, argv);
60876404edcSAsim Jamshed 	if (ret < 0)
60976404edcSAsim Jamshed 		rte_exit(EXIT_FAILURE, "Invalid EAL args!\n");
61076404edcSAsim Jamshed 
61176404edcSAsim Jamshed }
61276404edcSAsim Jamshed /*----------------------------------------------------------------------------*/
61376404edcSAsim Jamshed void
61476404edcSAsim Jamshed dpdk_load_module_lower_half(void)
61576404edcSAsim Jamshed {
61676404edcSAsim Jamshed 	int portid, rxlcore_id, ret;
61776404edcSAsim Jamshed 	struct rte_eth_fc_conf fc_conf;	/* for Ethernet flow control settings */
61876404edcSAsim Jamshed 	/* setting the rss key */
61976404edcSAsim Jamshed 	static const uint8_t key[] = {
62076404edcSAsim Jamshed 		0x05, 0x05, 0x05, 0x05, 0x05, 0x05, 0x05, 0x05, 0x05, 0x05,
62176404edcSAsim Jamshed 		0x05, 0x05, 0x05, 0x05, 0x05, 0x05, 0x05, 0x05, 0x05, 0x05,
62276404edcSAsim Jamshed 		0x05, 0x05, 0x05, 0x05, 0x05, 0x05, 0x05, 0x05, 0x05, 0x05,
62376404edcSAsim Jamshed 		0x05, 0x05, 0x05, 0x05, 0x05, 0x05, 0x05, 0x05, 0x05, 0x05
62476404edcSAsim Jamshed 	};
62576404edcSAsim Jamshed 
62676404edcSAsim Jamshed 	port_conf.rx_adv_conf.rss_conf.rss_key = (uint8_t *)&key;
62776404edcSAsim Jamshed 	port_conf.rx_adv_conf.rss_conf.rss_key_len = sizeof(key);
62876404edcSAsim Jamshed 
62976404edcSAsim Jamshed 	/* resetting cpu_qid mapping */
63076404edcSAsim Jamshed 	memset(cpu_qid_map, 0xFF, sizeof(cpu_qid_map));
63176404edcSAsim Jamshed 
63276404edcSAsim Jamshed 	if (!g_config.mos->multiprocess
63376404edcSAsim Jamshed 			|| (g_config.mos->multiprocess && g_config.mos->multiprocess_is_master)) {
63476404edcSAsim Jamshed 		for (rxlcore_id = 0; rxlcore_id < g_config.mos->num_cores; rxlcore_id++) {
63576404edcSAsim Jamshed 			char name[20];
63676404edcSAsim Jamshed 			sprintf(name, "mbuf_pool-%d", rxlcore_id);
63776404edcSAsim Jamshed 			/* create the mbuf pools */
63876404edcSAsim Jamshed 			pktmbuf_pool[rxlcore_id] =
63976404edcSAsim Jamshed 				rte_mempool_create(name, NB_MBUF,
64076404edcSAsim Jamshed 						   MBUF_SIZE, MEMPOOL_CACHE_SIZE,
64176404edcSAsim Jamshed 						   sizeof(struct rte_pktmbuf_pool_private),
64276404edcSAsim Jamshed 						   rte_pktmbuf_pool_init, NULL,
64376404edcSAsim Jamshed 						   rte_pktmbuf_init, NULL,
64476404edcSAsim Jamshed 						   rte_lcore_to_socket_id(rxlcore_id), 0);
64576404edcSAsim Jamshed 			if (pktmbuf_pool[rxlcore_id] == NULL)
64676404edcSAsim Jamshed 				rte_exit(EXIT_FAILURE, "Cannot init mbuf pool\n");
64776404edcSAsim Jamshed 		}
64876404edcSAsim Jamshed 
64976404edcSAsim Jamshed 		/* Initialise each port */
65076404edcSAsim Jamshed 		for (portid = 0; portid < g_config.mos->netdev_table->num; portid++) {
65176404edcSAsim Jamshed 			int num_queue = 0, eth_idx, i, queue_id;
65276404edcSAsim Jamshed 			for (eth_idx = 0; eth_idx < g_config.mos->netdev_table->num; eth_idx++)
65376404edcSAsim Jamshed 				if (portid == g_config.mos->netdev_table->ent[eth_idx]->ifindex)
65476404edcSAsim Jamshed 					break;
65576404edcSAsim Jamshed 			if (eth_idx == g_config.mos->netdev_table->num)
65676404edcSAsim Jamshed 				continue;
65776404edcSAsim Jamshed 			for (i = 0; i < sizeof(uint64_t) * 8; i++)
65876404edcSAsim Jamshed 				if (g_config.mos->netdev_table->ent[eth_idx]->cpu_mask & (1L << i))
65976404edcSAsim Jamshed 					num_queue++;
66076404edcSAsim Jamshed 
66176404edcSAsim Jamshed 			/* set 'num_queues' (used for GetRSSCPUCore() in util.c) */
66276404edcSAsim Jamshed 			num_queues = num_queue;
66376404edcSAsim Jamshed 
66476404edcSAsim Jamshed 			/* init port */
66576404edcSAsim Jamshed 			printf("Initializing port %u... ", (unsigned) portid);
66676404edcSAsim Jamshed 			fflush(stdout);
66776404edcSAsim Jamshed 			ret = rte_eth_dev_configure(portid, num_queue, num_queue,
66876404edcSAsim Jamshed 										&port_conf);
66976404edcSAsim Jamshed 			if (ret < 0)
67076404edcSAsim Jamshed 				rte_exit(EXIT_FAILURE, "Cannot configure device:"
67176404edcSAsim Jamshed 									   "err=%d, port=%u\n",
67276404edcSAsim Jamshed 									   ret, (unsigned) portid);
67376404edcSAsim Jamshed 
67476404edcSAsim Jamshed 			/* init one RX queue per CPU */
67576404edcSAsim Jamshed 			fflush(stdout);
67676404edcSAsim Jamshed #ifdef DEBUG
67776404edcSAsim Jamshed 			rte_eth_macaddr_get(portid, &ports_eth_addr[portid]);
67876404edcSAsim Jamshed #endif
67976404edcSAsim Jamshed 			queue_id = 0;
68076404edcSAsim Jamshed 			for (rxlcore_id = 0; rxlcore_id < g_config.mos->num_cores; rxlcore_id++) {
68176404edcSAsim Jamshed 				if (!(g_config.mos->netdev_table->ent[eth_idx]->cpu_mask & (1L << rxlcore_id)))
68276404edcSAsim Jamshed 					continue;
68376404edcSAsim Jamshed 				ret = rte_eth_rx_queue_setup(portid, queue_id, nb_rxd,
68476404edcSAsim Jamshed 						rte_eth_dev_socket_id(portid), &rx_conf,
68576404edcSAsim Jamshed 						pktmbuf_pool[rxlcore_id]);
68676404edcSAsim Jamshed 				if (ret < 0)
68776404edcSAsim Jamshed 					rte_exit(EXIT_FAILURE, "rte_eth_rx_queue_setup:"
68876404edcSAsim Jamshed 										   "err=%d, port=%u, queueid: %d\n",
68976404edcSAsim Jamshed 										   ret, (unsigned) portid, rxlcore_id);
69076404edcSAsim Jamshed 				cpu_qid_map[portid][rxlcore_id] = queue_id++;
69176404edcSAsim Jamshed 			}
69276404edcSAsim Jamshed 
69376404edcSAsim Jamshed 			/* init one TX queue on each port per CPU (this is redundant for
69476404edcSAsim Jamshed 			 * this app) */
69576404edcSAsim Jamshed 			fflush(stdout);
69676404edcSAsim Jamshed 			queue_id = 0;
69776404edcSAsim Jamshed 			for (rxlcore_id = 0; rxlcore_id < g_config.mos->num_cores; rxlcore_id++) {
69876404edcSAsim Jamshed 				if (!(g_config.mos->netdev_table->ent[eth_idx]->cpu_mask & (1L << rxlcore_id)))
69976404edcSAsim Jamshed 					continue;
70076404edcSAsim Jamshed 				ret = rte_eth_tx_queue_setup(portid, queue_id++, nb_txd,
70176404edcSAsim Jamshed 						rte_eth_dev_socket_id(portid), &tx_conf);
70276404edcSAsim Jamshed 				if (ret < 0)
70376404edcSAsim Jamshed 					rte_exit(EXIT_FAILURE, "rte_eth_tx_queue_setup:"
70476404edcSAsim Jamshed 										   "err=%d, port=%u, queueid: %d\n",
70576404edcSAsim Jamshed 										   ret, (unsigned) portid, rxlcore_id);
70676404edcSAsim Jamshed 			}
70776404edcSAsim Jamshed 
70876404edcSAsim Jamshed 			/* Start device */
70976404edcSAsim Jamshed 			ret = rte_eth_dev_start(portid);
71076404edcSAsim Jamshed 			if (ret < 0)
71176404edcSAsim Jamshed 				rte_exit(EXIT_FAILURE, "rte_eth_dev_start:err=%d, port=%u\n",
71276404edcSAsim Jamshed 									   ret, (unsigned) portid);
71376404edcSAsim Jamshed 
71476404edcSAsim Jamshed 			printf("done: \n");
71576404edcSAsim Jamshed 			rte_eth_promiscuous_enable(portid);
71676404edcSAsim Jamshed 
71776404edcSAsim Jamshed 			/* retrieve current flow control settings per port */
71876404edcSAsim Jamshed 			memset(&fc_conf, 0, sizeof(fc_conf));
71976404edcSAsim Jamshed 			ret = rte_eth_dev_flow_ctrl_get(portid, &fc_conf);
72076404edcSAsim Jamshed 			if (ret != 0) {
72176404edcSAsim Jamshed 				rte_exit(EXIT_FAILURE, "Failed to get flow control info!\n");
72276404edcSAsim Jamshed 			}
72376404edcSAsim Jamshed 
72476404edcSAsim Jamshed 			/* and just disable the rx/tx flow control */
72576404edcSAsim Jamshed 			fc_conf.mode = RTE_FC_NONE;
72676404edcSAsim Jamshed 			ret = rte_eth_dev_flow_ctrl_set(portid, &fc_conf);
72776404edcSAsim Jamshed 			if (ret != 0) {
72876404edcSAsim Jamshed 				rte_exit(EXIT_FAILURE, "Failed to set flow control info!: errno: %d\n",
72976404edcSAsim Jamshed 					 ret);
73076404edcSAsim Jamshed 			}
73176404edcSAsim Jamshed 
73276404edcSAsim Jamshed #ifdef DEBUG
73376404edcSAsim Jamshed 			printf("Port %u, MAC address: %02X:%02X:%02X:%02X:%02X:%02X\n\n",
73476404edcSAsim Jamshed 					(unsigned) portid,
73576404edcSAsim Jamshed 					ports_eth_addr[portid].addr_bytes[0],
73676404edcSAsim Jamshed 					ports_eth_addr[portid].addr_bytes[1],
73776404edcSAsim Jamshed 					ports_eth_addr[portid].addr_bytes[2],
73876404edcSAsim Jamshed 					ports_eth_addr[portid].addr_bytes[3],
73976404edcSAsim Jamshed 					ports_eth_addr[portid].addr_bytes[4],
74076404edcSAsim Jamshed 					ports_eth_addr[portid].addr_bytes[5]);
74176404edcSAsim Jamshed #endif
7423ae9e016SAsim Jamshed 			/* only check for link status if the thread is master */
7433ae9e016SAsim Jamshed 			check_all_ports_link_status(g_config.mos->netdev_table->num, 0xFFFFFFFF);
74476404edcSAsim Jamshed 		}
74576404edcSAsim Jamshed 	} else { /* g_config.mos->multiprocess && !g_config.mos->multiprocess_is_master */
74676404edcSAsim Jamshed 		for (rxlcore_id = 0; rxlcore_id < g_config.mos->num_cores; rxlcore_id++) {
74776404edcSAsim Jamshed 			char name[20];
74876404edcSAsim Jamshed 			sprintf(name, "mbuf_pool-%d", rxlcore_id);
74976404edcSAsim Jamshed 			/* initialize the mbuf pools */
75076404edcSAsim Jamshed 			pktmbuf_pool[rxlcore_id] =
75176404edcSAsim Jamshed 				rte_mempool_lookup(name);
75276404edcSAsim Jamshed 			if (pktmbuf_pool[rxlcore_id] == NULL)
75376404edcSAsim Jamshed 				rte_exit(EXIT_FAILURE, "Cannot init mbuf pool\n");
7543ae9e016SAsim Jamshed 			for (portid = 0; portid < g_config.mos->netdev_table->num; portid++)
7553ae9e016SAsim Jamshed 				cpu_qid_map[portid][rxlcore_id] = rxlcore_id;
75676404edcSAsim Jamshed 		}
7573ae9e016SAsim Jamshed 		/* set 'num_queues' (used for GetRSSCPUCore() in util.c) */
7583ae9e016SAsim Jamshed 		num_queues = g_config.mos->num_cores;
75976404edcSAsim Jamshed 	}
76076404edcSAsim Jamshed 
76176404edcSAsim Jamshed }
76276404edcSAsim Jamshed /*----------------------------------------------------------------------------*/
76376404edcSAsim Jamshed io_module_func dpdk_module_func = {
76476404edcSAsim Jamshed 	.load_module_upper_half		   = dpdk_load_module_upper_half,
76576404edcSAsim Jamshed 	.load_module_lower_half		   = dpdk_load_module_lower_half,
76676404edcSAsim Jamshed 	.init_handle		   = dpdk_init_handle,
76776404edcSAsim Jamshed 	.link_devices		   = NULL,
76876404edcSAsim Jamshed 	.release_pkt		   = NULL,
76976404edcSAsim Jamshed 	.send_pkts		   = dpdk_send_pkts,
77076404edcSAsim Jamshed 	.get_wptr   		   = dpdk_get_wptr,
77176404edcSAsim Jamshed 	.recv_pkts		   = dpdk_recv_pkts,
77276404edcSAsim Jamshed 	.get_rptr	   	   = dpdk_get_rptr,
77376404edcSAsim Jamshed 	.get_nif		   = dpdk_get_nif,
774a5e1a556SAsim Jamshed 	.select			   = dpdk_select,
77576404edcSAsim Jamshed 	.destroy_handle		   = dpdk_destroy_handle,
77676404edcSAsim Jamshed 	.dev_ioctl		   = dpdk_dev_ioctl,
77776404edcSAsim Jamshed 	.set_wptr		   = dpdk_set_wptr,
77876404edcSAsim Jamshed };
77976404edcSAsim Jamshed /*----------------------------------------------------------------------------*/
78076404edcSAsim Jamshed 
781