xref: /f-stack/dpdk/examples/vhost/ioat.c (revision 2d9fd380)
1*2d9fd380Sjfb8856606 /* SPDX-License-Identifier: BSD-3-Clause
2*2d9fd380Sjfb8856606  * Copyright(c) 2010-2020 Intel Corporation
3*2d9fd380Sjfb8856606  */
4*2d9fd380Sjfb8856606 
5*2d9fd380Sjfb8856606 #include <sys/uio.h>
6*2d9fd380Sjfb8856606 #ifdef RTE_RAW_IOAT
7*2d9fd380Sjfb8856606 #include <rte_rawdev.h>
8*2d9fd380Sjfb8856606 #include <rte_ioat_rawdev.h>
9*2d9fd380Sjfb8856606 
10*2d9fd380Sjfb8856606 #include "ioat.h"
11*2d9fd380Sjfb8856606 #include "main.h"
12*2d9fd380Sjfb8856606 
13*2d9fd380Sjfb8856606 struct dma_for_vhost dma_bind[MAX_VHOST_DEVICE];
14*2d9fd380Sjfb8856606 
15*2d9fd380Sjfb8856606 struct packet_tracker {
16*2d9fd380Sjfb8856606 	unsigned short size_track[MAX_ENQUEUED_SIZE];
17*2d9fd380Sjfb8856606 	unsigned short next_read;
18*2d9fd380Sjfb8856606 	unsigned short next_write;
19*2d9fd380Sjfb8856606 	unsigned short last_remain;
20*2d9fd380Sjfb8856606 };
21*2d9fd380Sjfb8856606 
22*2d9fd380Sjfb8856606 struct packet_tracker cb_tracker[MAX_VHOST_DEVICE];
23*2d9fd380Sjfb8856606 
24*2d9fd380Sjfb8856606 
25*2d9fd380Sjfb8856606 int
open_ioat(const char * value)26*2d9fd380Sjfb8856606 open_ioat(const char *value)
27*2d9fd380Sjfb8856606 {
28*2d9fd380Sjfb8856606 	struct dma_for_vhost *dma_info = dma_bind;
29*2d9fd380Sjfb8856606 	char *input = strndup(value, strlen(value) + 1);
30*2d9fd380Sjfb8856606 	char *addrs = input;
31*2d9fd380Sjfb8856606 	char *ptrs[2];
32*2d9fd380Sjfb8856606 	char *start, *end, *substr;
33*2d9fd380Sjfb8856606 	int64_t vid, vring_id;
34*2d9fd380Sjfb8856606 	struct rte_ioat_rawdev_config config;
35*2d9fd380Sjfb8856606 	struct rte_rawdev_info info = { .dev_private = &config };
36*2d9fd380Sjfb8856606 	char name[32];
37*2d9fd380Sjfb8856606 	int dev_id;
38*2d9fd380Sjfb8856606 	int ret = 0;
39*2d9fd380Sjfb8856606 	uint16_t i = 0;
40*2d9fd380Sjfb8856606 	char *dma_arg[MAX_VHOST_DEVICE];
41*2d9fd380Sjfb8856606 	int args_nr;
42*2d9fd380Sjfb8856606 
43*2d9fd380Sjfb8856606 	while (isblank(*addrs))
44*2d9fd380Sjfb8856606 		addrs++;
45*2d9fd380Sjfb8856606 	if (*addrs == '\0') {
46*2d9fd380Sjfb8856606 		ret = -1;
47*2d9fd380Sjfb8856606 		goto out;
48*2d9fd380Sjfb8856606 	}
49*2d9fd380Sjfb8856606 
50*2d9fd380Sjfb8856606 	/* process DMA devices within bracket. */
51*2d9fd380Sjfb8856606 	addrs++;
52*2d9fd380Sjfb8856606 	substr = strtok(addrs, ";]");
53*2d9fd380Sjfb8856606 	if (!substr) {
54*2d9fd380Sjfb8856606 		ret = -1;
55*2d9fd380Sjfb8856606 		goto out;
56*2d9fd380Sjfb8856606 	}
57*2d9fd380Sjfb8856606 	args_nr = rte_strsplit(substr, strlen(substr),
58*2d9fd380Sjfb8856606 			dma_arg, MAX_VHOST_DEVICE, ',');
59*2d9fd380Sjfb8856606 	if (args_nr <= 0) {
60*2d9fd380Sjfb8856606 		ret = -1;
61*2d9fd380Sjfb8856606 		goto out;
62*2d9fd380Sjfb8856606 	}
63*2d9fd380Sjfb8856606 	while (i < args_nr) {
64*2d9fd380Sjfb8856606 		char *arg_temp = dma_arg[i];
65*2d9fd380Sjfb8856606 		uint8_t sub_nr;
66*2d9fd380Sjfb8856606 		sub_nr = rte_strsplit(arg_temp, strlen(arg_temp), ptrs, 2, '@');
67*2d9fd380Sjfb8856606 		if (sub_nr != 2) {
68*2d9fd380Sjfb8856606 			ret = -1;
69*2d9fd380Sjfb8856606 			goto out;
70*2d9fd380Sjfb8856606 		}
71*2d9fd380Sjfb8856606 
72*2d9fd380Sjfb8856606 		start = strstr(ptrs[0], "txd");
73*2d9fd380Sjfb8856606 		if (start == NULL) {
74*2d9fd380Sjfb8856606 			ret = -1;
75*2d9fd380Sjfb8856606 			goto out;
76*2d9fd380Sjfb8856606 		}
77*2d9fd380Sjfb8856606 
78*2d9fd380Sjfb8856606 		start += 3;
79*2d9fd380Sjfb8856606 		vid = strtol(start, &end, 0);
80*2d9fd380Sjfb8856606 		if (end == start) {
81*2d9fd380Sjfb8856606 			ret = -1;
82*2d9fd380Sjfb8856606 			goto out;
83*2d9fd380Sjfb8856606 		}
84*2d9fd380Sjfb8856606 
85*2d9fd380Sjfb8856606 		vring_id = 0 + VIRTIO_RXQ;
86*2d9fd380Sjfb8856606 		if (rte_pci_addr_parse(ptrs[1],
87*2d9fd380Sjfb8856606 				&(dma_info + vid)->dmas[vring_id].addr) < 0) {
88*2d9fd380Sjfb8856606 			ret = -1;
89*2d9fd380Sjfb8856606 			goto out;
90*2d9fd380Sjfb8856606 		}
91*2d9fd380Sjfb8856606 
92*2d9fd380Sjfb8856606 		rte_pci_device_name(&(dma_info + vid)->dmas[vring_id].addr,
93*2d9fd380Sjfb8856606 				name, sizeof(name));
94*2d9fd380Sjfb8856606 		dev_id = rte_rawdev_get_dev_id(name);
95*2d9fd380Sjfb8856606 		if (dev_id == (uint16_t)(-ENODEV) ||
96*2d9fd380Sjfb8856606 		dev_id == (uint16_t)(-EINVAL)) {
97*2d9fd380Sjfb8856606 			ret = -1;
98*2d9fd380Sjfb8856606 			goto out;
99*2d9fd380Sjfb8856606 		}
100*2d9fd380Sjfb8856606 
101*2d9fd380Sjfb8856606 		if (rte_rawdev_info_get(dev_id, &info, sizeof(config)) < 0 ||
102*2d9fd380Sjfb8856606 		strstr(info.driver_name, "ioat") == NULL) {
103*2d9fd380Sjfb8856606 			ret = -1;
104*2d9fd380Sjfb8856606 			goto out;
105*2d9fd380Sjfb8856606 		}
106*2d9fd380Sjfb8856606 
107*2d9fd380Sjfb8856606 		(dma_info + vid)->dmas[vring_id].dev_id = dev_id;
108*2d9fd380Sjfb8856606 		(dma_info + vid)->dmas[vring_id].is_valid = true;
109*2d9fd380Sjfb8856606 		config.ring_size = IOAT_RING_SIZE;
110*2d9fd380Sjfb8856606 		config.hdls_disable = true;
111*2d9fd380Sjfb8856606 		if (rte_rawdev_configure(dev_id, &info, sizeof(config)) < 0) {
112*2d9fd380Sjfb8856606 			ret = -1;
113*2d9fd380Sjfb8856606 			goto out;
114*2d9fd380Sjfb8856606 		}
115*2d9fd380Sjfb8856606 		rte_rawdev_start(dev_id);
116*2d9fd380Sjfb8856606 
117*2d9fd380Sjfb8856606 		dma_info->nr++;
118*2d9fd380Sjfb8856606 		i++;
119*2d9fd380Sjfb8856606 	}
120*2d9fd380Sjfb8856606 out:
121*2d9fd380Sjfb8856606 	free(input);
122*2d9fd380Sjfb8856606 	return ret;
123*2d9fd380Sjfb8856606 }
124*2d9fd380Sjfb8856606 
125*2d9fd380Sjfb8856606 uint32_t
ioat_transfer_data_cb(int vid,uint16_t queue_id,struct rte_vhost_async_desc * descs,struct rte_vhost_async_status * opaque_data,uint16_t count)126*2d9fd380Sjfb8856606 ioat_transfer_data_cb(int vid, uint16_t queue_id,
127*2d9fd380Sjfb8856606 		struct rte_vhost_async_desc *descs,
128*2d9fd380Sjfb8856606 		struct rte_vhost_async_status *opaque_data, uint16_t count)
129*2d9fd380Sjfb8856606 {
130*2d9fd380Sjfb8856606 	uint32_t i_desc;
131*2d9fd380Sjfb8856606 	int dev_id = dma_bind[vid].dmas[queue_id * 2 + VIRTIO_RXQ].dev_id;
132*2d9fd380Sjfb8856606 	struct rte_vhost_iov_iter *src = NULL;
133*2d9fd380Sjfb8856606 	struct rte_vhost_iov_iter *dst = NULL;
134*2d9fd380Sjfb8856606 	unsigned long i_seg;
135*2d9fd380Sjfb8856606 	unsigned short mask = MAX_ENQUEUED_SIZE - 1;
136*2d9fd380Sjfb8856606 	unsigned short write = cb_tracker[dev_id].next_write;
137*2d9fd380Sjfb8856606 
138*2d9fd380Sjfb8856606 	if (!opaque_data) {
139*2d9fd380Sjfb8856606 		for (i_desc = 0; i_desc < count; i_desc++) {
140*2d9fd380Sjfb8856606 			src = descs[i_desc].src;
141*2d9fd380Sjfb8856606 			dst = descs[i_desc].dst;
142*2d9fd380Sjfb8856606 			i_seg = 0;
143*2d9fd380Sjfb8856606 			while (i_seg < src->nr_segs) {
144*2d9fd380Sjfb8856606 				/*
145*2d9fd380Sjfb8856606 				 * TODO: Assuming that the ring space of the
146*2d9fd380Sjfb8856606 				 * IOAT device is large enough, so there is no
147*2d9fd380Sjfb8856606 				 * error here, and the actual error handling
148*2d9fd380Sjfb8856606 				 * will be added later.
149*2d9fd380Sjfb8856606 				 */
150*2d9fd380Sjfb8856606 				rte_ioat_enqueue_copy(dev_id,
151*2d9fd380Sjfb8856606 					(uintptr_t)(src->iov[i_seg].iov_base)
152*2d9fd380Sjfb8856606 						+ src->offset,
153*2d9fd380Sjfb8856606 					(uintptr_t)(dst->iov[i_seg].iov_base)
154*2d9fd380Sjfb8856606 						+ dst->offset,
155*2d9fd380Sjfb8856606 					src->iov[i_seg].iov_len,
156*2d9fd380Sjfb8856606 					0,
157*2d9fd380Sjfb8856606 					0);
158*2d9fd380Sjfb8856606 				i_seg++;
159*2d9fd380Sjfb8856606 			}
160*2d9fd380Sjfb8856606 			write &= mask;
161*2d9fd380Sjfb8856606 			cb_tracker[dev_id].size_track[write] = i_seg;
162*2d9fd380Sjfb8856606 			write++;
163*2d9fd380Sjfb8856606 		}
164*2d9fd380Sjfb8856606 	} else {
165*2d9fd380Sjfb8856606 		/* Opaque data is not supported */
166*2d9fd380Sjfb8856606 		return -1;
167*2d9fd380Sjfb8856606 	}
168*2d9fd380Sjfb8856606 	/* ring the doorbell */
169*2d9fd380Sjfb8856606 	rte_ioat_perform_ops(dev_id);
170*2d9fd380Sjfb8856606 	cb_tracker[dev_id].next_write = write;
171*2d9fd380Sjfb8856606 	return i_desc;
172*2d9fd380Sjfb8856606 }
173*2d9fd380Sjfb8856606 
174*2d9fd380Sjfb8856606 uint32_t
ioat_check_completed_copies_cb(int vid,uint16_t queue_id,struct rte_vhost_async_status * opaque_data,uint16_t max_packets)175*2d9fd380Sjfb8856606 ioat_check_completed_copies_cb(int vid, uint16_t queue_id,
176*2d9fd380Sjfb8856606 		struct rte_vhost_async_status *opaque_data,
177*2d9fd380Sjfb8856606 		uint16_t max_packets)
178*2d9fd380Sjfb8856606 {
179*2d9fd380Sjfb8856606 	if (!opaque_data) {
180*2d9fd380Sjfb8856606 		uintptr_t dump[255];
181*2d9fd380Sjfb8856606 		unsigned short n_seg;
182*2d9fd380Sjfb8856606 		unsigned short read, write;
183*2d9fd380Sjfb8856606 		unsigned short nb_packet = 0;
184*2d9fd380Sjfb8856606 		unsigned short mask = MAX_ENQUEUED_SIZE - 1;
185*2d9fd380Sjfb8856606 		unsigned short i;
186*2d9fd380Sjfb8856606 		int dev_id = dma_bind[vid].dmas[queue_id * 2
187*2d9fd380Sjfb8856606 				+ VIRTIO_RXQ].dev_id;
188*2d9fd380Sjfb8856606 		n_seg = rte_ioat_completed_ops(dev_id, 255, dump, dump);
189*2d9fd380Sjfb8856606 		n_seg += cb_tracker[dev_id].last_remain;
190*2d9fd380Sjfb8856606 		if (!n_seg)
191*2d9fd380Sjfb8856606 			return 0;
192*2d9fd380Sjfb8856606 		read = cb_tracker[dev_id].next_read;
193*2d9fd380Sjfb8856606 		write = cb_tracker[dev_id].next_write;
194*2d9fd380Sjfb8856606 		for (i = 0; i < max_packets; i++) {
195*2d9fd380Sjfb8856606 			read &= mask;
196*2d9fd380Sjfb8856606 			if (read == write)
197*2d9fd380Sjfb8856606 				break;
198*2d9fd380Sjfb8856606 			if (n_seg >= cb_tracker[dev_id].size_track[read]) {
199*2d9fd380Sjfb8856606 				n_seg -= cb_tracker[dev_id].size_track[read];
200*2d9fd380Sjfb8856606 				read++;
201*2d9fd380Sjfb8856606 				nb_packet++;
202*2d9fd380Sjfb8856606 			} else {
203*2d9fd380Sjfb8856606 				break;
204*2d9fd380Sjfb8856606 			}
205*2d9fd380Sjfb8856606 		}
206*2d9fd380Sjfb8856606 		cb_tracker[dev_id].next_read = read;
207*2d9fd380Sjfb8856606 		cb_tracker[dev_id].last_remain = n_seg;
208*2d9fd380Sjfb8856606 		return nb_packet;
209*2d9fd380Sjfb8856606 	}
210*2d9fd380Sjfb8856606 	/* Opaque data is not supported */
211*2d9fd380Sjfb8856606 	return -1;
212*2d9fd380Sjfb8856606 }
213*2d9fd380Sjfb8856606 
214*2d9fd380Sjfb8856606 #endif /* RTE_RAW_IOAT */
215