xref: /freebsd-14.2/sys/dev/netmap/netmap_kloop.c (revision dde885de)
1b6e66be2SVincenzo Maffione /*
2b6e66be2SVincenzo Maffione  * Copyright (C) 2016-2018 Vincenzo Maffione
3b6e66be2SVincenzo Maffione  * Copyright (C) 2015 Stefano Garzarella
4b6e66be2SVincenzo Maffione  * All rights reserved.
5b6e66be2SVincenzo Maffione  *
6b6e66be2SVincenzo Maffione  * Redistribution and use in source and binary forms, with or without
7b6e66be2SVincenzo Maffione  * modification, are permitted provided that the following conditions
8b6e66be2SVincenzo Maffione  * are met:
9b6e66be2SVincenzo Maffione  *   1. Redistributions of source code must retain the above copyright
10b6e66be2SVincenzo Maffione  *      notice, this list of conditions and the following disclaimer.
11b6e66be2SVincenzo Maffione  *   2. Redistributions in binary form must reproduce the above copyright
12b6e66be2SVincenzo Maffione  *      notice, this list of conditions and the following disclaimer in the
13b6e66be2SVincenzo Maffione  *      documentation and/or other materials provided with the distribution.
14b6e66be2SVincenzo Maffione  *
15b6e66be2SVincenzo Maffione  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
16b6e66be2SVincenzo Maffione  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
17b6e66be2SVincenzo Maffione  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
18b6e66be2SVincenzo Maffione  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
19b6e66be2SVincenzo Maffione  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
20b6e66be2SVincenzo Maffione  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
21b6e66be2SVincenzo Maffione  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
22b6e66be2SVincenzo Maffione  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
23b6e66be2SVincenzo Maffione  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
24b6e66be2SVincenzo Maffione  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
25b6e66be2SVincenzo Maffione  * SUCH DAMAGE.
26b6e66be2SVincenzo Maffione  *
27b6e66be2SVincenzo Maffione  * $FreeBSD$
28b6e66be2SVincenzo Maffione  */
29b6e66be2SVincenzo Maffione 
30b6e66be2SVincenzo Maffione /*
31b6e66be2SVincenzo Maffione  * common headers
32b6e66be2SVincenzo Maffione  */
33b6e66be2SVincenzo Maffione #if defined(__FreeBSD__)
34b6e66be2SVincenzo Maffione #include <sys/cdefs.h>
35b6e66be2SVincenzo Maffione #include <sys/param.h>
36b6e66be2SVincenzo Maffione #include <sys/kernel.h>
37b6e66be2SVincenzo Maffione #include <sys/types.h>
38b6e66be2SVincenzo Maffione #include <sys/selinfo.h>
39b6e66be2SVincenzo Maffione #include <sys/socket.h>
40b6e66be2SVincenzo Maffione #include <net/if.h>
41b6e66be2SVincenzo Maffione #include <net/if_var.h>
42b6e66be2SVincenzo Maffione #include <machine/bus.h>
43b6e66be2SVincenzo Maffione 
/*
 * FreeBSD stand-in for usleep_range(), implemented on top of pause_sbt().
 * Only the lower bound (_1, in microseconds) is used as the sleep time; the
 * upper bound (_2) is ignored and a fixed precision of 1us is requested.
 * The argument is parenthesized so that expressions such as (a + b) expand
 * with the intended precedence.
 * NOTE(review): C_ABSOLUTE is passed although the value looks like a
 * relative duration -- confirm against the pause_sbt() flag semantics.
 */
#define usleep_range(_1, _2) \
        pause_sbt("sync-kloop-sleep", SBT_1US * (_1), SBT_1US * 1, C_ABSOLUTE)
46b6e66be2SVincenzo Maffione 
47b6e66be2SVincenzo Maffione #elif defined(linux)
48b6e66be2SVincenzo Maffione #include <bsd_glue.h>
49b6e66be2SVincenzo Maffione #include <linux/file.h>
50b6e66be2SVincenzo Maffione #include <linux/eventfd.h>
51b6e66be2SVincenzo Maffione #endif
52b6e66be2SVincenzo Maffione 
53b6e66be2SVincenzo Maffione #include <net/netmap.h>
54b6e66be2SVincenzo Maffione #include <dev/netmap/netmap_kern.h>
55b6e66be2SVincenzo Maffione #include <net/netmap_virt.h>
56b6e66be2SVincenzo Maffione #include <dev/netmap/netmap_mem2.h>
57b6e66be2SVincenzo Maffione 
58b6e66be2SVincenzo Maffione /* Support for eventfd-based notifications. */
59b6e66be2SVincenzo Maffione #if defined(linux)
60b6e66be2SVincenzo Maffione #define SYNC_KLOOP_POLL
61b6e66be2SVincenzo Maffione #endif
62b6e66be2SVincenzo Maffione 
/* Write kring pointers (hwcur, hwtail) to the CSB.
 * This routine is coupled with ptnetmap_guest_read_kring_csb().
 *
 * ptr:    kernel-to-application CSB entry to be updated
 * hwcur:  value stored into the hwcur field (written first)
 * hwtail: value stored into the hwtail field (written after the barrier) */
static inline void
sync_kloop_kernel_write(struct nm_csb_ktoa __user *ptr, uint32_t hwcur,
			   uint32_t hwtail)
{
	/*
	 * The same scheme used in ptnetmap_guest_write_kring_csb() applies here.
	 * We allow the application to read a value of hwcur more recent than the value
	 * of hwtail, since this would anyway result in a consistent view of the
	 * ring state (and hwcur can never wraparound hwtail, since hwcur must be
	 * behind head).
	 *
	 * The following memory barrier scheme is used to make this happen
	 * (the stores are the ones issued by this routine, the loads are
	 * expected on the reading side):
	 *
	 *          Kernel               Application
	 *
	 *          STORE(hwcur)         LOAD(hwtail)
	 *          mb() <-------------> mb()
	 *          STORE(hwtail)        LOAD(hwcur)
	 */
	CSB_WRITE(ptr, hwcur, hwcur);
	nm_stst_barrier();
	CSB_WRITE(ptr, hwtail, hwtail);
}
88b6e66be2SVincenzo Maffione 
/* Read kring pointers (head, cur, sync_flags) from the CSB.
 * This routine is coupled with ptnetmap_guest_write_kring_csb().
 *
 * ptr:         application-to-kernel CSB entry to read from
 * shadow_ring: destination; its head, cur and flags fields are overwritten
 * num_slots:   not referenced by the body of this routine */
static inline void
sync_kloop_kernel_read(struct nm_csb_atok __user *ptr,
			  struct netmap_ring *shadow_ring,
			  uint32_t num_slots)
{
	/*
	 * We place a memory barrier to make sure that the update of head never
	 * overtakes the update of cur.
	 * (see explanation in ptnetmap_guest_write_kring_csb).
	 *
	 * NOTE(review): both accesses around the barrier are loads, while
	 * the helper name suggests a store-store barrier -- confirm that it
	 * provides the load ordering this comment relies on.
	 */
	CSB_READ(ptr, head, shadow_ring->head);
	nm_stst_barrier();
	CSB_READ(ptr, cur, shadow_ring->cur);
	/* The CSB sync_flags field lands in the ring 'flags' field. */
	CSB_READ(ptr, sync_flags, shadow_ring->flags);
}
106b6e66be2SVincenzo Maffione 
/* Enable or disable application --> kernel kicks.
 * Stores 'val' into the kern_need_kick field of the kernel-to-application
 * CSB entry; the callers in this file pass 1 to enable and 0 to disable. */
static inline void
csb_ktoa_kick_enable(struct nm_csb_ktoa __user *csb_ktoa, uint32_t val)
{
	CSB_WRITE(csb_ktoa, kern_need_kick, val);
}
113b6e66be2SVincenzo Maffione 
#ifdef SYNC_KLOOP_POLL
/* Are application interrupts enabled or disabled?
 * Returns the current value of the appl_need_kick field read from the
 * application-to-kernel CSB entry; the callers treat non-zero as "enabled". */
static inline uint32_t
csb_atok_intr_enabled(struct nm_csb_atok __user *csb_atok)
{
	uint32_t v;

	CSB_READ(csb_atok, appl_need_kick, v);

	return v;
}
#endif  /* SYNC_KLOOP_POLL */
126b6e66be2SVincenzo Maffione 
127b6e66be2SVincenzo Maffione static inline void
128b6e66be2SVincenzo Maffione sync_kloop_kring_dump(const char *title, const struct netmap_kring *kring)
129b6e66be2SVincenzo Maffione {
130b6e66be2SVincenzo Maffione 	nm_prinf("%s - name: %s hwcur: %d hwtail: %d "
131b6e66be2SVincenzo Maffione 		"rhead: %d rcur: %d rtail: %d",
132b6e66be2SVincenzo Maffione 		title, kring->name, kring->nr_hwcur, kring->nr_hwtail,
133b6e66be2SVincenzo Maffione 		kring->rhead, kring->rcur, kring->rtail);
134b6e66be2SVincenzo Maffione }
135b6e66be2SVincenzo Maffione 
/* Per-ring arguments handed to the TX/RX ring processing routines. */
struct sync_kloop_ring_args {
	struct netmap_kring *kring;	/* kring to be synchronized */
	struct nm_csb_atok *csb_atok;	/* CSB entry read by the kernel */
	struct nm_csb_ktoa *csb_ktoa;	/* CSB entry written by the kernel */
#ifdef SYNC_KLOOP_POLL
	/* eventfd used to notify the application; the ring routines skip
	 * the notification when this is NULL. */
	struct eventfd_ctx *irq_ctx;
#endif /* SYNC_KLOOP_POLL */
};
144b6e66be2SVincenzo Maffione 
/*
 * Process one TX kring on behalf of the application.
 *
 * The routine disables application kicks, then repeatedly: reads the
 * application pointers from the CSB into a shadow ring, runs the txsync
 * prologue and the kring nm_sync() callback, publishes hwcur/hwtail back
 * to the CSB and (when SYNC_KLOOP_POLL is defined) signals the application
 * eventfd if new TX space showed up. The loop ends when the application has
 * nothing more to transmit (kicks are re-enabled first, with a double check
 * to close the race), when the ring has no free TX slots, or on a
 * prologue/sync failure.
 */
static void
netmap_sync_kloop_tx_ring(const struct sync_kloop_ring_args *a)
{
	struct netmap_kring *kring = a->kring;
	struct nm_csb_atok *csb_atok = a->csb_atok;
	struct nm_csb_ktoa *csb_ktoa = a->csb_ktoa;
	struct netmap_ring shadow_ring; /* shadow copy of the netmap_ring */
	bool more_txspace = false;	/* TX space gained, not yet notified */
	uint32_t num_slots;
	int batch;

	num_slots = kring->nkr_num_slots;

	/* Disable application --> kernel notifications. */
	csb_ktoa_kick_enable(csb_ktoa, 0);
	/* Copy the application kring pointers from the CSB */
	sync_kloop_kernel_read(csb_atok, &shadow_ring, num_slots);

	for (;;) {
		/* Slots between hwcur and the application head, modulo
		 * the ring size. */
		batch = shadow_ring.head - kring->nr_hwcur;
		if (batch < 0)
			batch += num_slots;

#ifdef PTN_TX_BATCH_LIM
		if (batch > PTN_TX_BATCH_LIM(num_slots)) {
			/* If application moves ahead too fast, let's cut the move so
			 * that we don't exceed our batch limit. */
			uint32_t head_lim = kring->nr_hwcur + PTN_TX_BATCH_LIM(num_slots);

			if (head_lim >= num_slots)
				head_lim -= num_slots;
			nm_prdis(1, "batch: %d head: %d head_lim: %d", batch, shadow_ring.head,
					head_lim);
			shadow_ring.head = head_lim;
			batch = PTN_TX_BATCH_LIM(num_slots);
		}
#endif /* PTN_TX_BATCH_LIM */

		/* Ask for a forced reclaim when at most half of the ring
		 * is available for transmission. */
		if (nm_kr_txspace(kring) <= (num_slots >> 1)) {
			shadow_ring.flags |= NAF_FORCE_RECLAIM;
		}

		/* Netmap prologue */
		shadow_ring.tail = kring->rtail;
		if (unlikely(nm_txsync_prologue(kring, &shadow_ring) >= num_slots)) {
			/* Reinit ring and enable notifications. */
			netmap_ring_reinit(kring);
			csb_ktoa_kick_enable(csb_ktoa, 1);
			break;
		}

		if (unlikely(netmap_debug & NM_DEBUG_TXSYNC)) {
			sync_kloop_kring_dump("pre txsync", kring);
		}

		if (unlikely(kring->nm_sync(kring, shadow_ring.flags))) {
			/* Reenable notifications. */
			csb_ktoa_kick_enable(csb_ktoa, 1);
			nm_prerr("txsync() failed");
			break;
		}

		/*
		 * Finalize
		 * Copy kernel hwcur and hwtail into the CSB for the application sync(), and
		 * do the nm_sync_finalize.
		 */
		sync_kloop_kernel_write(csb_ktoa, kring->nr_hwcur,
				kring->nr_hwtail);
		if (kring->rtail != kring->nr_hwtail) {
			/* Some more room available in the parent adapter. */
			kring->rtail = kring->nr_hwtail;
			more_txspace = true;
		}

		if (unlikely(netmap_debug & NM_DEBUG_TXSYNC)) {
			sync_kloop_kring_dump("post txsync", kring);
		}

		/* Interrupt the application if needed. */
#ifdef SYNC_KLOOP_POLL
		if (a->irq_ctx && more_txspace && csb_atok_intr_enabled(csb_atok)) {
			/* Kick the application through its eventfd, then clear
			 * the pending flag so that the same progress is not
			 * signalled twice. */
			eventfd_signal(a->irq_ctx, 1);
			more_txspace = false;
		}
#endif /* SYNC_KLOOP_POLL */

		/* Read CSB to see if there is more work to do. */
		sync_kloop_kernel_read(csb_atok, &shadow_ring, num_slots);
		if (shadow_ring.head == kring->rhead) {
			/*
			 * No more packets to transmit. We enable notifications and
			 * go to sleep, waiting for a kick from the application when
			 * new slots are ready for transmission.
			 */
			/* Reenable notifications. */
			csb_ktoa_kick_enable(csb_ktoa, 1);
			/* Doublecheck. */
			sync_kloop_kernel_read(csb_atok, &shadow_ring, num_slots);
			if (shadow_ring.head != kring->rhead) {
				/* We won the race condition, there are more packets to
				 * transmit. Disable notifications and do another cycle */
				csb_ktoa_kick_enable(csb_ktoa, 0);
				continue;
			}
			break;
		}

		if (nm_kr_txempty(kring)) {
			/* No more available TX slots. We stop here, waiting for a
			 * notification from the backend (netmap_tx_irq). */
			nm_prdis(1, "TX ring");
			break;
		}
	}

#ifdef SYNC_KLOOP_POLL
	/* Deliver a notification that is still pending after the loop. */
	if (a->irq_ctx && more_txspace && csb_atok_intr_enabled(csb_atok)) {
		eventfd_signal(a->irq_ctx, 1);
	}
#endif /* SYNC_KLOOP_POLL */
}
268b6e66be2SVincenzo Maffione 
/* Maximum number of consecutive RX cycles that receive no packets before
 * the RX ring processing loop gives up. */
#define SYNC_LOOP_RX_DRY_CYCLES_MAX	2
271b6e66be2SVincenzo Maffione 
272b6e66be2SVincenzo Maffione static inline int
273b6e66be2SVincenzo Maffione sync_kloop_norxslots(struct netmap_kring *kring, uint32_t g_head)
274b6e66be2SVincenzo Maffione {
275b6e66be2SVincenzo Maffione 	return (NM_ACCESS_ONCE(kring->nr_hwtail) == nm_prev(g_head,
276b6e66be2SVincenzo Maffione 				kring->nkr_num_slots - 1));
277b6e66be2SVincenzo Maffione }
278b6e66be2SVincenzo Maffione 
279b6e66be2SVincenzo Maffione static void
280b6e66be2SVincenzo Maffione netmap_sync_kloop_rx_ring(const struct sync_kloop_ring_args *a)
281b6e66be2SVincenzo Maffione {
282b6e66be2SVincenzo Maffione 
283b6e66be2SVincenzo Maffione 	struct netmap_kring *kring = a->kring;
284b6e66be2SVincenzo Maffione 	struct nm_csb_atok *csb_atok = a->csb_atok;
285b6e66be2SVincenzo Maffione 	struct nm_csb_ktoa *csb_ktoa = a->csb_ktoa;
286b6e66be2SVincenzo Maffione 	struct netmap_ring shadow_ring; /* shadow copy of the netmap_ring */
287b6e66be2SVincenzo Maffione 	int dry_cycles = 0;
288b6e66be2SVincenzo Maffione 	bool some_recvd = false;
289b6e66be2SVincenzo Maffione 	uint32_t num_slots;
290b6e66be2SVincenzo Maffione 
291b6e66be2SVincenzo Maffione 	num_slots = kring->nkr_num_slots;
292b6e66be2SVincenzo Maffione 
293b6e66be2SVincenzo Maffione 	/* Get RX csb_atok and csb_ktoa pointers from the CSB. */
294b6e66be2SVincenzo Maffione 	num_slots = kring->nkr_num_slots;
295b6e66be2SVincenzo Maffione 
296b6e66be2SVincenzo Maffione 	/* Disable notifications. */
297b6e66be2SVincenzo Maffione 	csb_ktoa_kick_enable(csb_ktoa, 0);
298b6e66be2SVincenzo Maffione 	/* Copy the application kring pointers from the CSB */
299b6e66be2SVincenzo Maffione 	sync_kloop_kernel_read(csb_atok, &shadow_ring, num_slots);
300b6e66be2SVincenzo Maffione 
301b6e66be2SVincenzo Maffione 	for (;;) {
302b6e66be2SVincenzo Maffione 		uint32_t hwtail;
303b6e66be2SVincenzo Maffione 
304b6e66be2SVincenzo Maffione 		/* Netmap prologue */
305b6e66be2SVincenzo Maffione 		shadow_ring.tail = kring->rtail;
306b6e66be2SVincenzo Maffione 		if (unlikely(nm_rxsync_prologue(kring, &shadow_ring) >= num_slots)) {
307b6e66be2SVincenzo Maffione 			/* Reinit ring and enable notifications. */
308b6e66be2SVincenzo Maffione 			netmap_ring_reinit(kring);
309b6e66be2SVincenzo Maffione 			csb_ktoa_kick_enable(csb_ktoa, 1);
310b6e66be2SVincenzo Maffione 			break;
311b6e66be2SVincenzo Maffione 		}
312b6e66be2SVincenzo Maffione 
313b6e66be2SVincenzo Maffione 		if (unlikely(netmap_debug & NM_DEBUG_RXSYNC)) {
314b6e66be2SVincenzo Maffione 			sync_kloop_kring_dump("pre rxsync", kring);
315b6e66be2SVincenzo Maffione 		}
316b6e66be2SVincenzo Maffione 
317b6e66be2SVincenzo Maffione 		if (unlikely(kring->nm_sync(kring, shadow_ring.flags))) {
318b6e66be2SVincenzo Maffione 			/* Reenable notifications. */
319b6e66be2SVincenzo Maffione 			csb_ktoa_kick_enable(csb_ktoa, 1);
320b6e66be2SVincenzo Maffione 			nm_prerr("rxsync() failed");
321b6e66be2SVincenzo Maffione 			break;
322b6e66be2SVincenzo Maffione 		}
323b6e66be2SVincenzo Maffione 
324b6e66be2SVincenzo Maffione 		/*
325b6e66be2SVincenzo Maffione 		 * Finalize
326b6e66be2SVincenzo Maffione 		 * Copy kernel hwcur and hwtail into the CSB for the application sync()
327b6e66be2SVincenzo Maffione 		 */
328b6e66be2SVincenzo Maffione 		hwtail = NM_ACCESS_ONCE(kring->nr_hwtail);
329b6e66be2SVincenzo Maffione 		sync_kloop_kernel_write(csb_ktoa, kring->nr_hwcur, hwtail);
330b6e66be2SVincenzo Maffione 		if (kring->rtail != hwtail) {
331b6e66be2SVincenzo Maffione 			kring->rtail = hwtail;
332b6e66be2SVincenzo Maffione 			some_recvd = true;
333b6e66be2SVincenzo Maffione 			dry_cycles = 0;
334b6e66be2SVincenzo Maffione 		} else {
335b6e66be2SVincenzo Maffione 			dry_cycles++;
336b6e66be2SVincenzo Maffione 		}
337b6e66be2SVincenzo Maffione 
338b6e66be2SVincenzo Maffione 		if (unlikely(netmap_debug & NM_DEBUG_RXSYNC)) {
339b6e66be2SVincenzo Maffione 			sync_kloop_kring_dump("post rxsync", kring);
340b6e66be2SVincenzo Maffione 		}
341b6e66be2SVincenzo Maffione 
342b6e66be2SVincenzo Maffione #ifdef SYNC_KLOOP_POLL
343b6e66be2SVincenzo Maffione 		/* Interrupt the application if needed. */
344b6e66be2SVincenzo Maffione 		if (a->irq_ctx && some_recvd && csb_atok_intr_enabled(csb_atok)) {
345b6e66be2SVincenzo Maffione 			/* Disable application kick to avoid sending unnecessary kicks */
346b6e66be2SVincenzo Maffione 			eventfd_signal(a->irq_ctx, 1);
347b6e66be2SVincenzo Maffione 			some_recvd = false;
348b6e66be2SVincenzo Maffione 		}
349b6e66be2SVincenzo Maffione #endif /* SYNC_KLOOP_POLL */
350b6e66be2SVincenzo Maffione 
351b6e66be2SVincenzo Maffione 		/* Read CSB to see if there is more work to do. */
352b6e66be2SVincenzo Maffione 		sync_kloop_kernel_read(csb_atok, &shadow_ring, num_slots);
353b6e66be2SVincenzo Maffione 		if (sync_kloop_norxslots(kring, shadow_ring.head)) {
354b6e66be2SVincenzo Maffione 			/*
355b6e66be2SVincenzo Maffione 			 * No more slots available for reception. We enable notification and
356b6e66be2SVincenzo Maffione 			 * go to sleep, waiting for a kick from the application when new receive
357b6e66be2SVincenzo Maffione 			 * slots are available.
358b6e66be2SVincenzo Maffione 			 */
359b6e66be2SVincenzo Maffione 			/* Reenable notifications. */
360b6e66be2SVincenzo Maffione 			csb_ktoa_kick_enable(csb_ktoa, 1);
361b6e66be2SVincenzo Maffione 			/* Doublecheck. */
362b6e66be2SVincenzo Maffione 			sync_kloop_kernel_read(csb_atok, &shadow_ring, num_slots);
363b6e66be2SVincenzo Maffione 			if (!sync_kloop_norxslots(kring, shadow_ring.head)) {
364b6e66be2SVincenzo Maffione 				/* We won the race condition, more slots are available. Disable
365b6e66be2SVincenzo Maffione 				 * notifications and do another cycle. */
366b6e66be2SVincenzo Maffione 				csb_ktoa_kick_enable(csb_ktoa, 0);
367b6e66be2SVincenzo Maffione 				continue;
368b6e66be2SVincenzo Maffione 			}
369b6e66be2SVincenzo Maffione 			break;
370b6e66be2SVincenzo Maffione 		}
371b6e66be2SVincenzo Maffione 
372b6e66be2SVincenzo Maffione 		hwtail = NM_ACCESS_ONCE(kring->nr_hwtail);
373b6e66be2SVincenzo Maffione 		if (unlikely(hwtail == kring->rhead ||
374b6e66be2SVincenzo Maffione 					dry_cycles >= SYNC_LOOP_RX_DRY_CYCLES_MAX)) {
375b6e66be2SVincenzo Maffione 			/* No more packets to be read from the backend. We stop and
376b6e66be2SVincenzo Maffione 			 * wait for a notification from the backend (netmap_rx_irq). */
377b6e66be2SVincenzo Maffione 			nm_prdis(1, "nr_hwtail: %d rhead: %d dry_cycles: %d",
378b6e66be2SVincenzo Maffione 					hwtail, kring->rhead, dry_cycles);
379b6e66be2SVincenzo Maffione 			break;
380b6e66be2SVincenzo Maffione 		}
381b6e66be2SVincenzo Maffione 	}
382b6e66be2SVincenzo Maffione 
383b6e66be2SVincenzo Maffione 	nm_kr_put(kring);
384b6e66be2SVincenzo Maffione 
385b6e66be2SVincenzo Maffione #ifdef SYNC_KLOOP_POLL
386b6e66be2SVincenzo Maffione 	/* Interrupt the application if needed. */
387b6e66be2SVincenzo Maffione 	if (a->irq_ctx && some_recvd && csb_atok_intr_enabled(csb_atok)) {
388b6e66be2SVincenzo Maffione 		eventfd_signal(a->irq_ctx, 1);
389b6e66be2SVincenzo Maffione 	}
390b6e66be2SVincenzo Maffione #endif /* SYNC_KLOOP_POLL */
391b6e66be2SVincenzo Maffione }
392b6e66be2SVincenzo Maffione 
393b6e66be2SVincenzo Maffione #ifdef SYNC_KLOOP_POLL
/* One slot of the poll context array. */
struct sync_kloop_poll_entry {
	/* Support for receiving notifications from
	 * a netmap ring or from the application.
	 * These three fields are filled in by the poll queue callback. */
	struct file *filp;		/* file being polled */
	wait_queue_t wait;		/* our entry in the wait queue */
	wait_queue_head_t *wqh;		/* wait queue 'wait' was added to */

	/* Support for sending notifications to the application. */
	struct eventfd_ctx *irq_ctx;	/* eventfd context to signal */
	struct file *irq_filp;		/* file the context was taken from */
};
405b6e66be2SVincenzo Maffione 
406b6e66be2SVincenzo Maffione struct sync_kloop_poll_ctx {
407b6e66be2SVincenzo Maffione 	poll_table wait_table;
408b6e66be2SVincenzo Maffione 	unsigned int next_entry;
409b6e66be2SVincenzo Maffione 	unsigned int num_entries;
410b6e66be2SVincenzo Maffione 	struct sync_kloop_poll_entry entries[0];
411b6e66be2SVincenzo Maffione };
412b6e66be2SVincenzo Maffione 
413b6e66be2SVincenzo Maffione static void
414b6e66be2SVincenzo Maffione sync_kloop_poll_table_queue_proc(struct file *file, wait_queue_head_t *wqh,
415b6e66be2SVincenzo Maffione 				poll_table *pt)
416b6e66be2SVincenzo Maffione {
417b6e66be2SVincenzo Maffione 	struct sync_kloop_poll_ctx *poll_ctx =
418b6e66be2SVincenzo Maffione 		container_of(pt, struct sync_kloop_poll_ctx, wait_table);
419b6e66be2SVincenzo Maffione 	struct sync_kloop_poll_entry *entry = poll_ctx->entries +
420b6e66be2SVincenzo Maffione 						poll_ctx->next_entry;
421b6e66be2SVincenzo Maffione 
422b6e66be2SVincenzo Maffione 	BUG_ON(poll_ctx->next_entry >= poll_ctx->num_entries);
423b6e66be2SVincenzo Maffione 	entry->wqh = wqh;
424b6e66be2SVincenzo Maffione 	entry->filp = file;
425b6e66be2SVincenzo Maffione 	/* Use the default wake up function. */
426b6e66be2SVincenzo Maffione 	init_waitqueue_entry(&entry->wait, current);
427b6e66be2SVincenzo Maffione 	add_wait_queue(wqh, &entry->wait);
428b6e66be2SVincenzo Maffione 	poll_ctx->next_entry++;
429b6e66be2SVincenzo Maffione }
430b6e66be2SVincenzo Maffione #endif  /* SYNC_KLOOP_POLL */
431b6e66be2SVincenzo Maffione 
432b6e66be2SVincenzo Maffione int
433b6e66be2SVincenzo Maffione netmap_sync_kloop(struct netmap_priv_d *priv, struct nmreq_header *hdr)
434b6e66be2SVincenzo Maffione {
435b6e66be2SVincenzo Maffione 	struct nmreq_sync_kloop_start *req =
436b6e66be2SVincenzo Maffione 		(struct nmreq_sync_kloop_start *)(uintptr_t)hdr->nr_body;
437b6e66be2SVincenzo Maffione 	struct nmreq_opt_sync_kloop_eventfds *eventfds_opt = NULL;
438b6e66be2SVincenzo Maffione #ifdef SYNC_KLOOP_POLL
439b6e66be2SVincenzo Maffione 	struct sync_kloop_poll_ctx *poll_ctx = NULL;
440b6e66be2SVincenzo Maffione #endif  /* SYNC_KLOOP_POLL */
441b6e66be2SVincenzo Maffione 	int num_rx_rings, num_tx_rings, num_rings;
442b6e66be2SVincenzo Maffione 	uint32_t sleep_us = req->sleep_us;
443b6e66be2SVincenzo Maffione 	struct nm_csb_atok* csb_atok_base;
444b6e66be2SVincenzo Maffione 	struct nm_csb_ktoa* csb_ktoa_base;
445b6e66be2SVincenzo Maffione 	struct netmap_adapter *na;
446b6e66be2SVincenzo Maffione 	struct nmreq_option *opt;
447b6e66be2SVincenzo Maffione 	int err = 0;
448b6e66be2SVincenzo Maffione 	int i;
449b6e66be2SVincenzo Maffione 
450b6e66be2SVincenzo Maffione 	if (sleep_us > 1000000) {
451b6e66be2SVincenzo Maffione 		/* We do not accept sleeping for more than a second. */
452b6e66be2SVincenzo Maffione 		return EINVAL;
453b6e66be2SVincenzo Maffione 	}
454b6e66be2SVincenzo Maffione 
455b6e66be2SVincenzo Maffione 	if (priv->np_nifp == NULL) {
456b6e66be2SVincenzo Maffione 		return ENXIO;
457b6e66be2SVincenzo Maffione 	}
458b6e66be2SVincenzo Maffione 	mb(); /* make sure following reads are not from cache */
459b6e66be2SVincenzo Maffione 
460b6e66be2SVincenzo Maffione 	na = priv->np_na;
461b6e66be2SVincenzo Maffione 	if (!nm_netmap_on(na)) {
462b6e66be2SVincenzo Maffione 		return ENXIO;
463b6e66be2SVincenzo Maffione 	}
464b6e66be2SVincenzo Maffione 
465b6e66be2SVincenzo Maffione 	NMG_LOCK();
466b6e66be2SVincenzo Maffione 	/* Make sure the application is working in CSB mode. */
467b6e66be2SVincenzo Maffione 	if (!priv->np_csb_atok_base || !priv->np_csb_ktoa_base) {
468b6e66be2SVincenzo Maffione 		NMG_UNLOCK();
469b6e66be2SVincenzo Maffione 		nm_prerr("sync-kloop on %s requires "
470b6e66be2SVincenzo Maffione 				"NETMAP_REQ_OPT_CSB option", na->name);
471b6e66be2SVincenzo Maffione 		return EINVAL;
472b6e66be2SVincenzo Maffione 	}
473b6e66be2SVincenzo Maffione 
474b6e66be2SVincenzo Maffione 	csb_atok_base = priv->np_csb_atok_base;
475b6e66be2SVincenzo Maffione 	csb_ktoa_base = priv->np_csb_ktoa_base;
476b6e66be2SVincenzo Maffione 
477b6e66be2SVincenzo Maffione 	/* Make sure that no kloop is currently running. */
478b6e66be2SVincenzo Maffione 	if (priv->np_kloop_state & NM_SYNC_KLOOP_RUNNING) {
479b6e66be2SVincenzo Maffione 		err = EBUSY;
480b6e66be2SVincenzo Maffione 	}
481b6e66be2SVincenzo Maffione 	priv->np_kloop_state |= NM_SYNC_KLOOP_RUNNING;
482b6e66be2SVincenzo Maffione 	NMG_UNLOCK();
483b6e66be2SVincenzo Maffione 	if (err) {
484b6e66be2SVincenzo Maffione 		return err;
485b6e66be2SVincenzo Maffione 	}
486b6e66be2SVincenzo Maffione 
487b6e66be2SVincenzo Maffione 	num_rx_rings = priv->np_qlast[NR_RX] - priv->np_qfirst[NR_RX];
488b6e66be2SVincenzo Maffione 	num_tx_rings = priv->np_qlast[NR_TX] - priv->np_qfirst[NR_TX];
489b6e66be2SVincenzo Maffione 	num_rings = num_tx_rings + num_rx_rings;
490b6e66be2SVincenzo Maffione 
491b6e66be2SVincenzo Maffione 	/* Validate notification options. */
492b6e66be2SVincenzo Maffione 	opt = nmreq_findoption((struct nmreq_option *)(uintptr_t)hdr->nr_options,
493b6e66be2SVincenzo Maffione 				NETMAP_REQ_OPT_SYNC_KLOOP_EVENTFDS);
494b6e66be2SVincenzo Maffione 	if (opt != NULL) {
495b6e66be2SVincenzo Maffione 		err = nmreq_checkduplicate(opt);
496b6e66be2SVincenzo Maffione 		if (err) {
497b6e66be2SVincenzo Maffione 			opt->nro_status = err;
498b6e66be2SVincenzo Maffione 			goto out;
499b6e66be2SVincenzo Maffione 		}
500b6e66be2SVincenzo Maffione 		if (opt->nro_size != sizeof(*eventfds_opt) +
501b6e66be2SVincenzo Maffione 			sizeof(eventfds_opt->eventfds[0]) * num_rings) {
502b6e66be2SVincenzo Maffione 			/* Option size not consistent with the number of
503b6e66be2SVincenzo Maffione 			 * entries. */
504b6e66be2SVincenzo Maffione 			opt->nro_status = err = EINVAL;
505b6e66be2SVincenzo Maffione 			goto out;
506b6e66be2SVincenzo Maffione 		}
507b6e66be2SVincenzo Maffione #ifdef SYNC_KLOOP_POLL
508b6e66be2SVincenzo Maffione 		eventfds_opt = (struct nmreq_opt_sync_kloop_eventfds *)opt;
509b6e66be2SVincenzo Maffione 		opt->nro_status = 0;
510b6e66be2SVincenzo Maffione 		/* We need 2 poll entries for TX and RX notifications coming
511b6e66be2SVincenzo Maffione 		 * from the netmap adapter, plus one entries per ring for the
512b6e66be2SVincenzo Maffione 		 * notifications coming from the application. */
513b6e66be2SVincenzo Maffione 		poll_ctx = nm_os_malloc(sizeof(*poll_ctx) +
514b6e66be2SVincenzo Maffione 				(2 + num_rings) * sizeof(poll_ctx->entries[0]));
515b6e66be2SVincenzo Maffione 		init_poll_funcptr(&poll_ctx->wait_table,
516b6e66be2SVincenzo Maffione 					sync_kloop_poll_table_queue_proc);
517b6e66be2SVincenzo Maffione 		poll_ctx->num_entries = 2 + num_rings;
518b6e66be2SVincenzo Maffione 		poll_ctx->next_entry = 0;
519b6e66be2SVincenzo Maffione 		/* Poll for notifications coming from the applications through
520b6e66be2SVincenzo Maffione 		 * eventfds . */
521b6e66be2SVincenzo Maffione 		for (i = 0; i < num_rings; i++) {
522b6e66be2SVincenzo Maffione 			struct eventfd_ctx *irq;
523b6e66be2SVincenzo Maffione 			struct file *filp;
524b6e66be2SVincenzo Maffione 			unsigned long mask;
525b6e66be2SVincenzo Maffione 
526b6e66be2SVincenzo Maffione 			filp = eventfd_fget(eventfds_opt->eventfds[i].ioeventfd);
527b6e66be2SVincenzo Maffione 			if (IS_ERR(filp)) {
528b6e66be2SVincenzo Maffione 				err = PTR_ERR(filp);
529b6e66be2SVincenzo Maffione 				goto out;
530b6e66be2SVincenzo Maffione 			}
531b6e66be2SVincenzo Maffione 			mask = filp->f_op->poll(filp, &poll_ctx->wait_table);
532b6e66be2SVincenzo Maffione 			if (mask & POLLERR) {
533b6e66be2SVincenzo Maffione 				err = EINVAL;
534b6e66be2SVincenzo Maffione 				goto out;
535b6e66be2SVincenzo Maffione 			}
536b6e66be2SVincenzo Maffione 
537b6e66be2SVincenzo Maffione 			filp = eventfd_fget(eventfds_opt->eventfds[i].irqfd);
538b6e66be2SVincenzo Maffione 			if (IS_ERR(filp)) {
539b6e66be2SVincenzo Maffione 				err = PTR_ERR(filp);
540b6e66be2SVincenzo Maffione 				goto out;
541b6e66be2SVincenzo Maffione 			}
542b6e66be2SVincenzo Maffione 			poll_ctx->entries[i].irq_filp = filp;
543b6e66be2SVincenzo Maffione 			irq = eventfd_ctx_fileget(filp);
544b6e66be2SVincenzo Maffione 			if (IS_ERR(irq)) {
545b6e66be2SVincenzo Maffione 				err = PTR_ERR(irq);
546b6e66be2SVincenzo Maffione 				goto out;
547b6e66be2SVincenzo Maffione 			}
548b6e66be2SVincenzo Maffione 			poll_ctx->entries[i].irq_ctx = irq;
549b6e66be2SVincenzo Maffione 		}
550b6e66be2SVincenzo Maffione 		/* Poll for notifications coming from the netmap rings bound to
551b6e66be2SVincenzo Maffione 		 * this file descriptor. */
552b6e66be2SVincenzo Maffione 		{
553b6e66be2SVincenzo Maffione 			NM_SELINFO_T *si[NR_TXRX];
554b6e66be2SVincenzo Maffione 
555b6e66be2SVincenzo Maffione 			NMG_LOCK();
556b6e66be2SVincenzo Maffione 			si[NR_RX] = nm_si_user(priv, NR_RX) ? &na->si[NR_RX] :
557b6e66be2SVincenzo Maffione 				&na->rx_rings[priv->np_qfirst[NR_RX]]->si;
558b6e66be2SVincenzo Maffione 			si[NR_TX] = nm_si_user(priv, NR_TX) ? &na->si[NR_TX] :
559b6e66be2SVincenzo Maffione 				&na->tx_rings[priv->np_qfirst[NR_TX]]->si;
560b6e66be2SVincenzo Maffione 			NMG_UNLOCK();
561b6e66be2SVincenzo Maffione 			poll_wait(priv->np_filp, si[NR_RX], &poll_ctx->wait_table);
562b6e66be2SVincenzo Maffione 			poll_wait(priv->np_filp, si[NR_TX], &poll_ctx->wait_table);
563b6e66be2SVincenzo Maffione 		}
564b6e66be2SVincenzo Maffione #else   /* SYNC_KLOOP_POLL */
565b6e66be2SVincenzo Maffione 		opt->nro_status = EOPNOTSUPP;
566b6e66be2SVincenzo Maffione 		goto out;
567b6e66be2SVincenzo Maffione #endif  /* SYNC_KLOOP_POLL */
568b6e66be2SVincenzo Maffione 	}
569b6e66be2SVincenzo Maffione 
570b6e66be2SVincenzo Maffione 	/* Main loop. */
571b6e66be2SVincenzo Maffione 	for (;;) {
572b6e66be2SVincenzo Maffione 		if (unlikely(NM_ACCESS_ONCE(priv->np_kloop_state) & NM_SYNC_KLOOP_STOPPING)) {
573b6e66be2SVincenzo Maffione 			break;
574b6e66be2SVincenzo Maffione 		}
575b6e66be2SVincenzo Maffione 
576b6e66be2SVincenzo Maffione #ifdef SYNC_KLOOP_POLL
577b6e66be2SVincenzo Maffione 		if (poll_ctx)
578b6e66be2SVincenzo Maffione 			__set_current_state(TASK_INTERRUPTIBLE);
579b6e66be2SVincenzo Maffione #endif  /* SYNC_KLOOP_POLL */
580b6e66be2SVincenzo Maffione 
581b6e66be2SVincenzo Maffione 		/* Process all the TX rings bound to this file descriptor. */
582b6e66be2SVincenzo Maffione 		for (i = 0; i < num_tx_rings; i++) {
583b6e66be2SVincenzo Maffione 			struct sync_kloop_ring_args a = {
584b6e66be2SVincenzo Maffione 				.kring = NMR(na, NR_TX)[i + priv->np_qfirst[NR_TX]],
585b6e66be2SVincenzo Maffione 				.csb_atok = csb_atok_base + i,
586b6e66be2SVincenzo Maffione 				.csb_ktoa = csb_ktoa_base + i,
587b6e66be2SVincenzo Maffione 			};
588b6e66be2SVincenzo Maffione 
589b6e66be2SVincenzo Maffione #ifdef SYNC_KLOOP_POLL
590b6e66be2SVincenzo Maffione 			if (poll_ctx)
591b6e66be2SVincenzo Maffione 				a.irq_ctx = poll_ctx->entries[i].irq_ctx;
592b6e66be2SVincenzo Maffione #endif /* SYNC_KLOOP_POLL */
593b6e66be2SVincenzo Maffione 			if (unlikely(nm_kr_tryget(a.kring, 1, NULL))) {
594b6e66be2SVincenzo Maffione 				continue;
595b6e66be2SVincenzo Maffione 			}
596b6e66be2SVincenzo Maffione 			netmap_sync_kloop_tx_ring(&a);
597b6e66be2SVincenzo Maffione 			nm_kr_put(a.kring);
598b6e66be2SVincenzo Maffione 		}
599b6e66be2SVincenzo Maffione 
600b6e66be2SVincenzo Maffione 		/* Process all the RX rings bound to this file descriptor. */
601b6e66be2SVincenzo Maffione 		for (i = 0; i < num_rx_rings; i++) {
602b6e66be2SVincenzo Maffione 			struct sync_kloop_ring_args a = {
603b6e66be2SVincenzo Maffione 				.kring = NMR(na, NR_RX)[i + priv->np_qfirst[NR_RX]],
604b6e66be2SVincenzo Maffione 				.csb_atok = csb_atok_base + num_tx_rings + i,
605b6e66be2SVincenzo Maffione 				.csb_ktoa = csb_ktoa_base + num_tx_rings + i,
606b6e66be2SVincenzo Maffione 			};
607b6e66be2SVincenzo Maffione 
608b6e66be2SVincenzo Maffione #ifdef SYNC_KLOOP_POLL
609b6e66be2SVincenzo Maffione 			if (poll_ctx)
610b6e66be2SVincenzo Maffione 				a.irq_ctx = poll_ctx->entries[num_tx_rings + i].irq_ctx;
611b6e66be2SVincenzo Maffione #endif /* SYNC_KLOOP_POLL */
612b6e66be2SVincenzo Maffione 
613b6e66be2SVincenzo Maffione 			if (unlikely(nm_kr_tryget(a.kring, 1, NULL))) {
614b6e66be2SVincenzo Maffione 				continue;
615b6e66be2SVincenzo Maffione 			}
616b6e66be2SVincenzo Maffione 			netmap_sync_kloop_rx_ring(&a);
617b6e66be2SVincenzo Maffione 			nm_kr_put(a.kring);
618b6e66be2SVincenzo Maffione 		}
619b6e66be2SVincenzo Maffione 
620b6e66be2SVincenzo Maffione #ifdef SYNC_KLOOP_POLL
621b6e66be2SVincenzo Maffione 		if (poll_ctx) {
622b6e66be2SVincenzo Maffione 			/* If a poll context is present, yield to the scheduler
623b6e66be2SVincenzo Maffione 			 * waiting for a notification to come either from
624b6e66be2SVincenzo Maffione 			 * netmap or the application. */
625b6e66be2SVincenzo Maffione 			schedule_timeout_interruptible(msecs_to_jiffies(1000));
626b6e66be2SVincenzo Maffione 		} else
627b6e66be2SVincenzo Maffione #endif /* SYNC_KLOOP_POLL */
628b6e66be2SVincenzo Maffione 		{
629b6e66be2SVincenzo Maffione 			/* Default synchronization method: sleep for a while. */
630b6e66be2SVincenzo Maffione 			usleep_range(sleep_us, sleep_us);
631b6e66be2SVincenzo Maffione 		}
632b6e66be2SVincenzo Maffione 	}
633b6e66be2SVincenzo Maffione out:
634b6e66be2SVincenzo Maffione #ifdef SYNC_KLOOP_POLL
635b6e66be2SVincenzo Maffione 	if (poll_ctx) {
636b6e66be2SVincenzo Maffione 		/* Stop polling from netmap and the eventfds, and deallocate
637b6e66be2SVincenzo Maffione 		 * the poll context. */
638b6e66be2SVincenzo Maffione 		__set_current_state(TASK_RUNNING);
639b6e66be2SVincenzo Maffione 		for (i = 0; i < poll_ctx->next_entry; i++) {
640b6e66be2SVincenzo Maffione 			struct sync_kloop_poll_entry *entry =
641b6e66be2SVincenzo Maffione 						poll_ctx->entries + i;
642b6e66be2SVincenzo Maffione 
643b6e66be2SVincenzo Maffione 			if (entry->wqh)
644b6e66be2SVincenzo Maffione 				remove_wait_queue(entry->wqh, &entry->wait);
			/* A reference was taken on the eventfd files, so
			 * drop it here; don't do that on the netmap file
			 * descriptor, since no reference was taken on it. */
648b6e66be2SVincenzo Maffione 			if (entry->filp && entry->filp != priv->np_filp)
649b6e66be2SVincenzo Maffione 				fput(entry->filp);
650b6e66be2SVincenzo Maffione 			if (entry->irq_ctx)
651b6e66be2SVincenzo Maffione 				eventfd_ctx_put(entry->irq_ctx);
652b6e66be2SVincenzo Maffione 			if (entry->irq_filp)
653b6e66be2SVincenzo Maffione 				fput(entry->irq_filp);
654b6e66be2SVincenzo Maffione 		}
655b6e66be2SVincenzo Maffione 		nm_os_free(poll_ctx);
656b6e66be2SVincenzo Maffione 		poll_ctx = NULL;
657b6e66be2SVincenzo Maffione 	}
658b6e66be2SVincenzo Maffione #endif /* SYNC_KLOOP_POLL */
659b6e66be2SVincenzo Maffione 
660b6e66be2SVincenzo Maffione 	/* Reset the kloop state. */
661b6e66be2SVincenzo Maffione 	NMG_LOCK();
662b6e66be2SVincenzo Maffione 	priv->np_kloop_state = 0;
663b6e66be2SVincenzo Maffione 	NMG_UNLOCK();
664b6e66be2SVincenzo Maffione 
665b6e66be2SVincenzo Maffione 	return err;
666b6e66be2SVincenzo Maffione }
667b6e66be2SVincenzo Maffione 
668b6e66be2SVincenzo Maffione int
669b6e66be2SVincenzo Maffione netmap_sync_kloop_stop(struct netmap_priv_d *priv)
670b6e66be2SVincenzo Maffione {
671b6e66be2SVincenzo Maffione 	bool running = true;
672b6e66be2SVincenzo Maffione 	int err = 0;
673b6e66be2SVincenzo Maffione 
674b6e66be2SVincenzo Maffione 	NMG_LOCK();
675b6e66be2SVincenzo Maffione 	priv->np_kloop_state |= NM_SYNC_KLOOP_STOPPING;
676b6e66be2SVincenzo Maffione 	NMG_UNLOCK();
677b6e66be2SVincenzo Maffione 	while (running) {
678b6e66be2SVincenzo Maffione 		usleep_range(1000, 1500);
679b6e66be2SVincenzo Maffione 		NMG_LOCK();
680b6e66be2SVincenzo Maffione 		running = (NM_ACCESS_ONCE(priv->np_kloop_state)
681b6e66be2SVincenzo Maffione 				& NM_SYNC_KLOOP_RUNNING);
682b6e66be2SVincenzo Maffione 		NMG_UNLOCK();
683b6e66be2SVincenzo Maffione 	}
684b6e66be2SVincenzo Maffione 
685b6e66be2SVincenzo Maffione 	return err;
686b6e66be2SVincenzo Maffione }
687b6e66be2SVincenzo Maffione 
688b6e66be2SVincenzo Maffione #ifdef WITH_PTNETMAP
689b6e66be2SVincenzo Maffione /*
690b6e66be2SVincenzo Maffione  * Guest ptnetmap txsync()/rxsync() routines, used in ptnet device drivers.
691b6e66be2SVincenzo Maffione  * These routines are reused across the different operating systems supported
692b6e66be2SVincenzo Maffione  * by netmap.
693b6e66be2SVincenzo Maffione  */
694b6e66be2SVincenzo Maffione 
695b6e66be2SVincenzo Maffione /*
696b6e66be2SVincenzo Maffione  * Reconcile host and guest views of the transmit ring.
697b6e66be2SVincenzo Maffione  *
698b6e66be2SVincenzo Maffione  * Guest user wants to transmit packets up to the one before ring->head,
699b6e66be2SVincenzo Maffione  * and guest kernel knows tx_ring->hwcur is the first packet unsent
700b6e66be2SVincenzo Maffione  * by the host kernel.
701b6e66be2SVincenzo Maffione  *
702b6e66be2SVincenzo Maffione  * We push out as many packets as possible, and possibly
703b6e66be2SVincenzo Maffione  * reclaim buffers from previously completed transmission.
704b6e66be2SVincenzo Maffione  *
705b6e66be2SVincenzo Maffione  * Notifications from the host are enabled only if the user guest would
706b6e66be2SVincenzo Maffione  * block (no space in the ring).
707b6e66be2SVincenzo Maffione  */
708b6e66be2SVincenzo Maffione bool
709b6e66be2SVincenzo Maffione netmap_pt_guest_txsync(struct nm_csb_atok *atok, struct nm_csb_ktoa *ktoa,
710b6e66be2SVincenzo Maffione 			struct netmap_kring *kring, int flags)
711b6e66be2SVincenzo Maffione {
712b6e66be2SVincenzo Maffione 	bool notify = false;
713b6e66be2SVincenzo Maffione 
714b6e66be2SVincenzo Maffione 	/* Disable notifications */
715b6e66be2SVincenzo Maffione 	atok->appl_need_kick = 0;
716b6e66be2SVincenzo Maffione 
717b6e66be2SVincenzo Maffione 	/*
718b6e66be2SVincenzo Maffione 	 * First part: tell the host (updating the CSB) to process the new
719b6e66be2SVincenzo Maffione 	 * packets.
720b6e66be2SVincenzo Maffione 	 */
721b6e66be2SVincenzo Maffione 	kring->nr_hwcur = ktoa->hwcur;
722b6e66be2SVincenzo Maffione 	ptnetmap_guest_write_kring_csb(atok, kring->rcur, kring->rhead);
723b6e66be2SVincenzo Maffione 
724b6e66be2SVincenzo Maffione         /* Ask for a kick from a guest to the host if needed. */
725b6e66be2SVincenzo Maffione 	if (((kring->rhead != kring->nr_hwcur || nm_kr_txempty(kring))
726b6e66be2SVincenzo Maffione 		&& NM_ACCESS_ONCE(ktoa->kern_need_kick)) ||
727b6e66be2SVincenzo Maffione 			(flags & NAF_FORCE_RECLAIM)) {
728b6e66be2SVincenzo Maffione 		atok->sync_flags = flags;
729b6e66be2SVincenzo Maffione 		notify = true;
730b6e66be2SVincenzo Maffione 	}
731b6e66be2SVincenzo Maffione 
732b6e66be2SVincenzo Maffione 	/*
733b6e66be2SVincenzo Maffione 	 * Second part: reclaim buffers for completed transmissions.
734b6e66be2SVincenzo Maffione 	 */
735b6e66be2SVincenzo Maffione 	if (nm_kr_txempty(kring) || (flags & NAF_FORCE_RECLAIM)) {
736b6e66be2SVincenzo Maffione                 ptnetmap_guest_read_kring_csb(ktoa, kring);
737b6e66be2SVincenzo Maffione 	}
738b6e66be2SVincenzo Maffione 
739b6e66be2SVincenzo Maffione         /*
740b6e66be2SVincenzo Maffione          * No more room in the ring for new transmissions. The user thread will
741b6e66be2SVincenzo Maffione 	 * go to sleep and we need to be notified by the host when more free
742b6e66be2SVincenzo Maffione 	 * space is available.
743b6e66be2SVincenzo Maffione          */
744b6e66be2SVincenzo Maffione 	if (nm_kr_txempty(kring) && !(kring->nr_kflags & NKR_NOINTR)) {
745b6e66be2SVincenzo Maffione 		/* Reenable notifications. */
746b6e66be2SVincenzo Maffione 		atok->appl_need_kick = 1;
747b6e66be2SVincenzo Maffione                 /* Double check */
748b6e66be2SVincenzo Maffione                 ptnetmap_guest_read_kring_csb(ktoa, kring);
749b6e66be2SVincenzo Maffione                 /* If there is new free space, disable notifications */
750b6e66be2SVincenzo Maffione 		if (unlikely(!nm_kr_txempty(kring))) {
751b6e66be2SVincenzo Maffione 			atok->appl_need_kick = 0;
752b6e66be2SVincenzo Maffione 		}
753b6e66be2SVincenzo Maffione 	}
754b6e66be2SVincenzo Maffione 
755b6e66be2SVincenzo Maffione 	nm_prdis(1, "%s CSB(head:%u cur:%u hwtail:%u) KRING(head:%u cur:%u tail:%u)",
756b6e66be2SVincenzo Maffione 		kring->name, atok->head, atok->cur, ktoa->hwtail,
757b6e66be2SVincenzo Maffione 		kring->rhead, kring->rcur, kring->nr_hwtail);
758b6e66be2SVincenzo Maffione 
759b6e66be2SVincenzo Maffione 	return notify;
760b6e66be2SVincenzo Maffione }
761b6e66be2SVincenzo Maffione 
762b6e66be2SVincenzo Maffione /*
763b6e66be2SVincenzo Maffione  * Reconcile host and guest view of the receive ring.
764b6e66be2SVincenzo Maffione  *
765b6e66be2SVincenzo Maffione  * Update hwcur/hwtail from host (reading from CSB).
766b6e66be2SVincenzo Maffione  *
767b6e66be2SVincenzo Maffione  * If guest user has released buffers up to the one before ring->head, we
768b6e66be2SVincenzo Maffione  * also give them to the host.
769b6e66be2SVincenzo Maffione  *
770b6e66be2SVincenzo Maffione  * Notifications from the host are enabled only if the user guest would
771b6e66be2SVincenzo Maffione  * block (no more completed slots in the ring).
772b6e66be2SVincenzo Maffione  */
773b6e66be2SVincenzo Maffione bool
774b6e66be2SVincenzo Maffione netmap_pt_guest_rxsync(struct nm_csb_atok *atok, struct nm_csb_ktoa *ktoa,
775b6e66be2SVincenzo Maffione 			struct netmap_kring *kring, int flags)
776b6e66be2SVincenzo Maffione {
777b6e66be2SVincenzo Maffione 	bool notify = false;
778b6e66be2SVincenzo Maffione 
779b6e66be2SVincenzo Maffione         /* Disable notifications */
780b6e66be2SVincenzo Maffione 	atok->appl_need_kick = 0;
781b6e66be2SVincenzo Maffione 
782b6e66be2SVincenzo Maffione 	/*
783b6e66be2SVincenzo Maffione 	 * First part: import newly received packets, by updating the kring
784b6e66be2SVincenzo Maffione 	 * hwtail to the hwtail known from the host (read from the CSB).
785b6e66be2SVincenzo Maffione 	 * This also updates the kring hwcur.
786b6e66be2SVincenzo Maffione 	 */
787b6e66be2SVincenzo Maffione         ptnetmap_guest_read_kring_csb(ktoa, kring);
788b6e66be2SVincenzo Maffione 	kring->nr_kflags &= ~NKR_PENDINTR;
789b6e66be2SVincenzo Maffione 
790b6e66be2SVincenzo Maffione 	/*
791b6e66be2SVincenzo Maffione 	 * Second part: tell the host about the slots that guest user has
792b6e66be2SVincenzo Maffione 	 * released, by updating cur and head in the CSB.
793b6e66be2SVincenzo Maffione 	 */
794b6e66be2SVincenzo Maffione 	if (kring->rhead != kring->nr_hwcur) {
795b6e66be2SVincenzo Maffione 		ptnetmap_guest_write_kring_csb(atok, kring->rcur,
796b6e66be2SVincenzo Maffione 					       kring->rhead);
797b6e66be2SVincenzo Maffione                 /* Ask for a kick from the guest to the host if needed. */
798b6e66be2SVincenzo Maffione 		if (NM_ACCESS_ONCE(ktoa->kern_need_kick)) {
799b6e66be2SVincenzo Maffione 			atok->sync_flags = flags;
800b6e66be2SVincenzo Maffione 			notify = true;
801b6e66be2SVincenzo Maffione 		}
802b6e66be2SVincenzo Maffione 	}
803b6e66be2SVincenzo Maffione 
804b6e66be2SVincenzo Maffione         /*
805b6e66be2SVincenzo Maffione          * No more completed RX slots. The user thread will go to sleep and
806b6e66be2SVincenzo Maffione 	 * we need to be notified by the host when more RX slots have been
807b6e66be2SVincenzo Maffione 	 * completed.
808b6e66be2SVincenzo Maffione          */
809b6e66be2SVincenzo Maffione 	if (nm_kr_rxempty(kring) && !(kring->nr_kflags & NKR_NOINTR)) {
810b6e66be2SVincenzo Maffione 		/* Reenable notifications. */
811b6e66be2SVincenzo Maffione                 atok->appl_need_kick = 1;
812b6e66be2SVincenzo Maffione                 /* Double check */
813b6e66be2SVincenzo Maffione                 ptnetmap_guest_read_kring_csb(ktoa, kring);
814b6e66be2SVincenzo Maffione                 /* If there are new slots, disable notifications. */
815b6e66be2SVincenzo Maffione 		if (!nm_kr_rxempty(kring)) {
816b6e66be2SVincenzo Maffione                         atok->appl_need_kick = 0;
817b6e66be2SVincenzo Maffione                 }
818b6e66be2SVincenzo Maffione         }
819b6e66be2SVincenzo Maffione 
820b6e66be2SVincenzo Maffione 	nm_prdis(1, "%s CSB(head:%u cur:%u hwtail:%u) KRING(head:%u cur:%u tail:%u)",
821b6e66be2SVincenzo Maffione 		kring->name, atok->head, atok->cur, ktoa->hwtail,
822b6e66be2SVincenzo Maffione 		kring->rhead, kring->rcur, kring->nr_hwtail);
823b6e66be2SVincenzo Maffione 
824b6e66be2SVincenzo Maffione 	return notify;
825b6e66be2SVincenzo Maffione }
826b6e66be2SVincenzo Maffione 
827b6e66be2SVincenzo Maffione /*
828b6e66be2SVincenzo Maffione  * Callbacks for ptnet drivers: nm_krings_create, nm_krings_delete, nm_dtor.
829b6e66be2SVincenzo Maffione  */
830b6e66be2SVincenzo Maffione int
831b6e66be2SVincenzo Maffione ptnet_nm_krings_create(struct netmap_adapter *na)
832b6e66be2SVincenzo Maffione {
833b6e66be2SVincenzo Maffione 	struct netmap_pt_guest_adapter *ptna =
834b6e66be2SVincenzo Maffione 			(struct netmap_pt_guest_adapter *)na; /* Upcast. */
835b6e66be2SVincenzo Maffione 	struct netmap_adapter *na_nm = &ptna->hwup.up;
836b6e66be2SVincenzo Maffione 	struct netmap_adapter *na_dr = &ptna->dr.up;
837b6e66be2SVincenzo Maffione 	int ret;
838b6e66be2SVincenzo Maffione 
839b6e66be2SVincenzo Maffione 	if (ptna->backend_users) {
840b6e66be2SVincenzo Maffione 		return 0;
841b6e66be2SVincenzo Maffione 	}
842b6e66be2SVincenzo Maffione 
843b6e66be2SVincenzo Maffione 	/* Create krings on the public netmap adapter. */
844b6e66be2SVincenzo Maffione 	ret = netmap_hw_krings_create(na_nm);
845b6e66be2SVincenzo Maffione 	if (ret) {
846b6e66be2SVincenzo Maffione 		return ret;
847b6e66be2SVincenzo Maffione 	}
848b6e66be2SVincenzo Maffione 
849b6e66be2SVincenzo Maffione 	/* Copy krings into the netmap adapter private to the driver. */
850b6e66be2SVincenzo Maffione 	na_dr->tx_rings = na_nm->tx_rings;
851b6e66be2SVincenzo Maffione 	na_dr->rx_rings = na_nm->rx_rings;
852b6e66be2SVincenzo Maffione 
853b6e66be2SVincenzo Maffione 	return 0;
854b6e66be2SVincenzo Maffione }
855b6e66be2SVincenzo Maffione 
856b6e66be2SVincenzo Maffione void
857b6e66be2SVincenzo Maffione ptnet_nm_krings_delete(struct netmap_adapter *na)
858b6e66be2SVincenzo Maffione {
859b6e66be2SVincenzo Maffione 	struct netmap_pt_guest_adapter *ptna =
860b6e66be2SVincenzo Maffione 			(struct netmap_pt_guest_adapter *)na; /* Upcast. */
861b6e66be2SVincenzo Maffione 	struct netmap_adapter *na_nm = &ptna->hwup.up;
862b6e66be2SVincenzo Maffione 	struct netmap_adapter *na_dr = &ptna->dr.up;
863b6e66be2SVincenzo Maffione 
864b6e66be2SVincenzo Maffione 	if (ptna->backend_users) {
865b6e66be2SVincenzo Maffione 		return;
866b6e66be2SVincenzo Maffione 	}
867b6e66be2SVincenzo Maffione 
868b6e66be2SVincenzo Maffione 	na_dr->tx_rings = NULL;
869b6e66be2SVincenzo Maffione 	na_dr->rx_rings = NULL;
870b6e66be2SVincenzo Maffione 
871b6e66be2SVincenzo Maffione 	netmap_hw_krings_delete(na_nm);
872b6e66be2SVincenzo Maffione }
873b6e66be2SVincenzo Maffione 
874b6e66be2SVincenzo Maffione void
875b6e66be2SVincenzo Maffione ptnet_nm_dtor(struct netmap_adapter *na)
876b6e66be2SVincenzo Maffione {
877b6e66be2SVincenzo Maffione 	struct netmap_pt_guest_adapter *ptna =
878b6e66be2SVincenzo Maffione 			(struct netmap_pt_guest_adapter *)na;
879b6e66be2SVincenzo Maffione 
880b6e66be2SVincenzo Maffione 	netmap_mem_put(ptna->dr.up.nm_mem);
881b6e66be2SVincenzo Maffione 	memset(&ptna->dr, 0, sizeof(ptna->dr));
882b6e66be2SVincenzo Maffione 	netmap_mem_pt_guest_ifp_del(na->nm_mem, na->ifp);
883b6e66be2SVincenzo Maffione }
884b6e66be2SVincenzo Maffione 
885b6e66be2SVincenzo Maffione int
886b6e66be2SVincenzo Maffione netmap_pt_guest_attach(struct netmap_adapter *arg,
887b6e66be2SVincenzo Maffione 		       unsigned int nifp_offset, unsigned int memid)
888b6e66be2SVincenzo Maffione {
889b6e66be2SVincenzo Maffione 	struct netmap_pt_guest_adapter *ptna;
890b6e66be2SVincenzo Maffione 	struct ifnet *ifp = arg ? arg->ifp : NULL;
891b6e66be2SVincenzo Maffione 	int error;
892b6e66be2SVincenzo Maffione 
893b6e66be2SVincenzo Maffione 	/* get allocator */
894b6e66be2SVincenzo Maffione 	arg->nm_mem = netmap_mem_pt_guest_new(ifp, nifp_offset, memid);
895b6e66be2SVincenzo Maffione 	if (arg->nm_mem == NULL)
896b6e66be2SVincenzo Maffione 		return ENOMEM;
897b6e66be2SVincenzo Maffione 	arg->na_flags |= NAF_MEM_OWNER;
898b6e66be2SVincenzo Maffione 	error = netmap_attach_ext(arg, sizeof(struct netmap_pt_guest_adapter), 1);
899b6e66be2SVincenzo Maffione 	if (error)
900b6e66be2SVincenzo Maffione 		return error;
901b6e66be2SVincenzo Maffione 
902b6e66be2SVincenzo Maffione 	/* get the netmap_pt_guest_adapter */
903b6e66be2SVincenzo Maffione 	ptna = (struct netmap_pt_guest_adapter *) NA(ifp);
904b6e66be2SVincenzo Maffione 
905b6e66be2SVincenzo Maffione 	/* Initialize a separate pass-through netmap adapter that is going to
906b6e66be2SVincenzo Maffione 	 * be used by the ptnet driver only, and so never exposed to netmap
907b6e66be2SVincenzo Maffione          * applications. We only need a subset of the available fields. */
908b6e66be2SVincenzo Maffione 	memset(&ptna->dr, 0, sizeof(ptna->dr));
909b6e66be2SVincenzo Maffione 	ptna->dr.up.ifp = ifp;
910b6e66be2SVincenzo Maffione 	ptna->dr.up.nm_mem = netmap_mem_get(ptna->hwup.up.nm_mem);
911b6e66be2SVincenzo Maffione         ptna->dr.up.nm_config = ptna->hwup.up.nm_config;
912b6e66be2SVincenzo Maffione 
913b6e66be2SVincenzo Maffione 	ptna->backend_users = 0;
914b6e66be2SVincenzo Maffione 
915b6e66be2SVincenzo Maffione 	return 0;
916b6e66be2SVincenzo Maffione }
917b6e66be2SVincenzo Maffione 
918b6e66be2SVincenzo Maffione #endif /* WITH_PTNETMAP */
919