xref: /freebsd/sys/dev/netmap/netmap_kloop.c (revision fdafd315ad0d0f28a11b9fb4476a9ab059c62b92)
1b6e66be2SVincenzo Maffione /*
2b6e66be2SVincenzo Maffione  * Copyright (C) 2016-2018 Vincenzo Maffione
3b6e66be2SVincenzo Maffione  * Copyright (C) 2015 Stefano Garzarella
4b6e66be2SVincenzo Maffione  * All rights reserved.
5b6e66be2SVincenzo Maffione  *
6b6e66be2SVincenzo Maffione  * Redistribution and use in source and binary forms, with or without
7b6e66be2SVincenzo Maffione  * modification, are permitted provided that the following conditions
8b6e66be2SVincenzo Maffione  * are met:
9b6e66be2SVincenzo Maffione  *   1. Redistributions of source code must retain the above copyright
10b6e66be2SVincenzo Maffione  *      notice, this list of conditions and the following disclaimer.
11b6e66be2SVincenzo Maffione  *   2. Redistributions in binary form must reproduce the above copyright
12b6e66be2SVincenzo Maffione  *      notice, this list of conditions and the following disclaimer in the
13b6e66be2SVincenzo Maffione  *      documentation and/or other materials provided with the distribution.
14b6e66be2SVincenzo Maffione  *
15b6e66be2SVincenzo Maffione  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
16b6e66be2SVincenzo Maffione  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
17b6e66be2SVincenzo Maffione  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
18b6e66be2SVincenzo Maffione  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
19b6e66be2SVincenzo Maffione  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
20b6e66be2SVincenzo Maffione  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
21b6e66be2SVincenzo Maffione  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
22b6e66be2SVincenzo Maffione  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
23b6e66be2SVincenzo Maffione  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
24b6e66be2SVincenzo Maffione  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
25b6e66be2SVincenzo Maffione  * SUCH DAMAGE.
26b6e66be2SVincenzo Maffione  */
27b6e66be2SVincenzo Maffione 
28b6e66be2SVincenzo Maffione /*
29b6e66be2SVincenzo Maffione  * common headers
30b6e66be2SVincenzo Maffione  */
31b6e66be2SVincenzo Maffione #if defined(__FreeBSD__)
32*fdafd315SWarner Losh 
33b6e66be2SVincenzo Maffione #include <sys/param.h>
34b6e66be2SVincenzo Maffione #include <sys/kernel.h>
35b6e66be2SVincenzo Maffione #include <sys/types.h>
36b6e66be2SVincenzo Maffione #include <sys/selinfo.h>
37b6e66be2SVincenzo Maffione #include <sys/socket.h>
38b6e66be2SVincenzo Maffione #include <net/if.h>
39b6e66be2SVincenzo Maffione #include <net/if_var.h>
40b6e66be2SVincenzo Maffione #include <machine/bus.h>
41b6e66be2SVincenzo Maffione 
/*
 * FreeBSD-side definition of usleep_range(), implemented with pause_sbt().
 * Only the first argument (_1, scaled by SBT_1US, i.e. microseconds) is
 * used; the second argument (_2) is accepted for call-site compatibility
 * and ignored. The argument is parenthesized so that expressions such as
 * "a + b" are scaled as a whole.
 * NOTE(review): C_ABSOLUTE is passed together with what looks like a
 * relative interval -- confirm this is the intended pause_sbt() usage.
 */
#define usleep_range(_1, _2) \
        pause_sbt("sync-kloop-sleep", SBT_1US * (_1), SBT_1US * 1, C_ABSOLUTE)
44b6e66be2SVincenzo Maffione 
45b6e66be2SVincenzo Maffione #elif defined(linux)
46b6e66be2SVincenzo Maffione #include <bsd_glue.h>
47b6e66be2SVincenzo Maffione #include <linux/file.h>
48b6e66be2SVincenzo Maffione #include <linux/eventfd.h>
49b6e66be2SVincenzo Maffione #endif
50b6e66be2SVincenzo Maffione 
51b6e66be2SVincenzo Maffione #include <net/netmap.h>
52b6e66be2SVincenzo Maffione #include <dev/netmap/netmap_kern.h>
53b6e66be2SVincenzo Maffione #include <net/netmap_virt.h>
54b6e66be2SVincenzo Maffione #include <dev/netmap/netmap_mem2.h>
55b6e66be2SVincenzo Maffione 
/*
 * Support for eventfd-based notifications.
 * SYNC_KLOOP_POLL is defined only when building for Linux; the code that
 * depends on eventfd and wait queues is guarded by it.
 */
#if defined(linux)
#define SYNC_KLOOP_POLL
#endif
60b6e66be2SVincenzo Maffione 
61b6e66be2SVincenzo Maffione /* Write kring pointers (hwcur, hwtail) to the CSB.
62b6e66be2SVincenzo Maffione  * This routine is coupled with ptnetmap_guest_read_kring_csb(). */
63b6e66be2SVincenzo Maffione static inline void
sync_kloop_kernel_write(struct nm_csb_ktoa __user * ptr,uint32_t hwcur,uint32_t hwtail)64b6e66be2SVincenzo Maffione sync_kloop_kernel_write(struct nm_csb_ktoa __user *ptr, uint32_t hwcur,
65b6e66be2SVincenzo Maffione 			   uint32_t hwtail)
66b6e66be2SVincenzo Maffione {
67f79ba6d7SVincenzo Maffione 	/* Issue a first store-store barrier to make sure writes to the
68f79ba6d7SVincenzo Maffione 	 * netmap ring do not overcome updates on ktoa->hwcur and ktoa->hwtail. */
69f79ba6d7SVincenzo Maffione 	nm_stst_barrier();
70f79ba6d7SVincenzo Maffione 
71b6e66be2SVincenzo Maffione 	/*
72f79ba6d7SVincenzo Maffione 	 * The same scheme used in nm_sync_kloop_appl_write() applies here.
73b6e66be2SVincenzo Maffione 	 * We allow the application to read a value of hwcur more recent than the value
74b6e66be2SVincenzo Maffione 	 * of hwtail, since this would anyway result in a consistent view of the
75b6e66be2SVincenzo Maffione 	 * ring state (and hwcur can never wraparound hwtail, since hwcur must be
76b6e66be2SVincenzo Maffione 	 * behind head).
77b6e66be2SVincenzo Maffione 	 *
78b6e66be2SVincenzo Maffione 	 * The following memory barrier scheme is used to make this happen:
79b6e66be2SVincenzo Maffione 	 *
80b6e66be2SVincenzo Maffione 	 *          Application            Kernel
81b6e66be2SVincenzo Maffione 	 *
82b6e66be2SVincenzo Maffione 	 *          STORE(hwcur)           LOAD(hwtail)
83f79ba6d7SVincenzo Maffione 	 *          wmb() <------------->  rmb()
84b6e66be2SVincenzo Maffione 	 *          STORE(hwtail)          LOAD(hwcur)
85b6e66be2SVincenzo Maffione 	 */
86b6e66be2SVincenzo Maffione 	CSB_WRITE(ptr, hwcur, hwcur);
87b6e66be2SVincenzo Maffione 	nm_stst_barrier();
88b6e66be2SVincenzo Maffione 	CSB_WRITE(ptr, hwtail, hwtail);
89b6e66be2SVincenzo Maffione }
90b6e66be2SVincenzo Maffione 
91b6e66be2SVincenzo Maffione /* Read kring pointers (head, cur, sync_flags) from the CSB.
92b6e66be2SVincenzo Maffione  * This routine is coupled with ptnetmap_guest_write_kring_csb(). */
93b6e66be2SVincenzo Maffione static inline void
sync_kloop_kernel_read(struct nm_csb_atok __user * ptr,struct netmap_ring * shadow_ring,uint32_t num_slots)94b6e66be2SVincenzo Maffione sync_kloop_kernel_read(struct nm_csb_atok __user *ptr,
95b6e66be2SVincenzo Maffione 			  struct netmap_ring *shadow_ring,
96b6e66be2SVincenzo Maffione 			  uint32_t num_slots)
97b6e66be2SVincenzo Maffione {
98b6e66be2SVincenzo Maffione 	/*
99b6e66be2SVincenzo Maffione 	 * We place a memory barrier to make sure that the update of head never
100b6e66be2SVincenzo Maffione 	 * overtakes the update of cur.
101f79ba6d7SVincenzo Maffione 	 * (see explanation in sync_kloop_kernel_write).
102b6e66be2SVincenzo Maffione 	 */
103b6e66be2SVincenzo Maffione 	CSB_READ(ptr, head, shadow_ring->head);
104f79ba6d7SVincenzo Maffione 	nm_ldld_barrier();
105b6e66be2SVincenzo Maffione 	CSB_READ(ptr, cur, shadow_ring->cur);
106b6e66be2SVincenzo Maffione 	CSB_READ(ptr, sync_flags, shadow_ring->flags);
107f79ba6d7SVincenzo Maffione 
108f79ba6d7SVincenzo Maffione 	/* Make sure that loads from atok->head and atok->cur are not delayed
109f79ba6d7SVincenzo Maffione 	 * after the loads from the netmap ring. */
110f79ba6d7SVincenzo Maffione 	nm_ldld_barrier();
111b6e66be2SVincenzo Maffione }
112b6e66be2SVincenzo Maffione 
113b6e66be2SVincenzo Maffione /* Enable or disable application --> kernel kicks. */
114b6e66be2SVincenzo Maffione static inline void
csb_ktoa_kick_enable(struct nm_csb_ktoa __user * csb_ktoa,uint32_t val)115b6e66be2SVincenzo Maffione csb_ktoa_kick_enable(struct nm_csb_ktoa __user *csb_ktoa, uint32_t val)
116b6e66be2SVincenzo Maffione {
117b6e66be2SVincenzo Maffione 	CSB_WRITE(csb_ktoa, kern_need_kick, val);
118b6e66be2SVincenzo Maffione }
119b6e66be2SVincenzo Maffione 
#ifdef SYNC_KLOOP_POLL
/*
 * Are application interrupts enabled or disabled?
 *
 * Returns the current value of the appl_need_kick field read from the
 * application-to-kernel CSB entry.
 */
static inline uint32_t
csb_atok_intr_enabled(struct nm_csb_atok __user *csb_atok)
{
	uint32_t v;

	CSB_READ(csb_atok, appl_need_kick, v);

	return v;
}
#endif  /* SYNC_KLOOP_POLL */
132b6e66be2SVincenzo Maffione 
133b6e66be2SVincenzo Maffione static inline void
sync_kloop_kring_dump(const char * title,const struct netmap_kring * kring)134b6e66be2SVincenzo Maffione sync_kloop_kring_dump(const char *title, const struct netmap_kring *kring)
135b6e66be2SVincenzo Maffione {
136f79ba6d7SVincenzo Maffione 	nm_prinf("%s, kring %s, hwcur %d, rhead %d, "
137f79ba6d7SVincenzo Maffione 		"rcur %d, rtail %d, hwtail %d",
138f79ba6d7SVincenzo Maffione 		title, kring->name, kring->nr_hwcur, kring->rhead,
139f79ba6d7SVincenzo Maffione 		kring->rcur, kring->rtail, kring->nr_hwtail);
140b6e66be2SVincenzo Maffione }
141b6e66be2SVincenzo Maffione 
/* Arguments for netmap_sync_kloop_tx_ring() and
 * netmap_sync_kloop_rx_ring().
 */
struct sync_kloop_ring_args {
	/* The kring to be processed. */
	struct netmap_kring *kring;
	/* CSB entry read by the kernel (head, cur, sync_flags). */
	struct nm_csb_atok *csb_atok;
	/* CSB entry written by the kernel (hwcur, hwtail, kern_need_kick). */
	struct nm_csb_ktoa *csb_ktoa;
#ifdef SYNC_KLOOP_POLL
	/* Eventfd used to notify the application; may be NULL, in which
	 * case no notification is sent. */
	struct eventfd_ctx *irq_ctx;
#endif /* SYNC_KLOOP_POLL */
	/* Are we busy waiting rather than using a schedule() loop ? */
	bool busy_wait;
	/* Are we processing in the context of VM exit ? */
	bool direct;
};
157b6e66be2SVincenzo Maffione 
158b6e66be2SVincenzo Maffione static void
netmap_sync_kloop_tx_ring(const struct sync_kloop_ring_args * a)159b6e66be2SVincenzo Maffione netmap_sync_kloop_tx_ring(const struct sync_kloop_ring_args *a)
160b6e66be2SVincenzo Maffione {
161b6e66be2SVincenzo Maffione 	struct netmap_kring *kring = a->kring;
162b6e66be2SVincenzo Maffione 	struct nm_csb_atok *csb_atok = a->csb_atok;
163b6e66be2SVincenzo Maffione 	struct nm_csb_ktoa *csb_ktoa = a->csb_ktoa;
164b6e66be2SVincenzo Maffione 	struct netmap_ring shadow_ring; /* shadow copy of the netmap_ring */
1656d2a46f0SJohn Baldwin #ifdef SYNC_KLOOP_POLL
166b6e66be2SVincenzo Maffione 	bool more_txspace = false;
1676d2a46f0SJohn Baldwin #endif /* SYNC_KLOOP_POLL */
168b6e66be2SVincenzo Maffione 	uint32_t num_slots;
169b6e66be2SVincenzo Maffione 	int batch;
170b6e66be2SVincenzo Maffione 
1715faab778SVincenzo Maffione 	if (unlikely(nm_kr_tryget(kring, 1, NULL))) {
1725faab778SVincenzo Maffione 		return;
1735faab778SVincenzo Maffione 	}
1745faab778SVincenzo Maffione 
175b6e66be2SVincenzo Maffione 	num_slots = kring->nkr_num_slots;
176b6e66be2SVincenzo Maffione 
177b6e66be2SVincenzo Maffione 	/* Disable application --> kernel notifications. */
1785faab778SVincenzo Maffione 	if (!a->direct) {
179b6e66be2SVincenzo Maffione 		csb_ktoa_kick_enable(csb_ktoa, 0);
1805faab778SVincenzo Maffione 	}
181b6e66be2SVincenzo Maffione 	/* Copy the application kring pointers from the CSB */
182b6e66be2SVincenzo Maffione 	sync_kloop_kernel_read(csb_atok, &shadow_ring, num_slots);
183b6e66be2SVincenzo Maffione 
184b6e66be2SVincenzo Maffione 	for (;;) {
185b6e66be2SVincenzo Maffione 		batch = shadow_ring.head - kring->nr_hwcur;
186b6e66be2SVincenzo Maffione 		if (batch < 0)
187b6e66be2SVincenzo Maffione 			batch += num_slots;
188b6e66be2SVincenzo Maffione 
189b6e66be2SVincenzo Maffione #ifdef PTN_TX_BATCH_LIM
190b6e66be2SVincenzo Maffione 		if (batch > PTN_TX_BATCH_LIM(num_slots)) {
191b6e66be2SVincenzo Maffione 			/* If application moves ahead too fast, let's cut the move so
192b6e66be2SVincenzo Maffione 			 * that we don't exceed our batch limit. */
193b6e66be2SVincenzo Maffione 			uint32_t head_lim = kring->nr_hwcur + PTN_TX_BATCH_LIM(num_slots);
194b6e66be2SVincenzo Maffione 
195b6e66be2SVincenzo Maffione 			if (head_lim >= num_slots)
196b6e66be2SVincenzo Maffione 				head_lim -= num_slots;
197b6e66be2SVincenzo Maffione 			nm_prdis(1, "batch: %d head: %d head_lim: %d", batch, shadow_ring.head,
198b6e66be2SVincenzo Maffione 					head_lim);
199b6e66be2SVincenzo Maffione 			shadow_ring.head = head_lim;
200b6e66be2SVincenzo Maffione 			batch = PTN_TX_BATCH_LIM(num_slots);
201b6e66be2SVincenzo Maffione 		}
202b6e66be2SVincenzo Maffione #endif /* PTN_TX_BATCH_LIM */
203b6e66be2SVincenzo Maffione 
204b6e66be2SVincenzo Maffione 		if (nm_kr_txspace(kring) <= (num_slots >> 1)) {
205b6e66be2SVincenzo Maffione 			shadow_ring.flags |= NAF_FORCE_RECLAIM;
206b6e66be2SVincenzo Maffione 		}
207b6e66be2SVincenzo Maffione 
208b6e66be2SVincenzo Maffione 		/* Netmap prologue */
209b6e66be2SVincenzo Maffione 		shadow_ring.tail = kring->rtail;
210b6e66be2SVincenzo Maffione 		if (unlikely(nm_txsync_prologue(kring, &shadow_ring) >= num_slots)) {
211b6e66be2SVincenzo Maffione 			/* Reinit ring and enable notifications. */
212b6e66be2SVincenzo Maffione 			netmap_ring_reinit(kring);
2135faab778SVincenzo Maffione 			if (!a->busy_wait) {
214b6e66be2SVincenzo Maffione 				csb_ktoa_kick_enable(csb_ktoa, 1);
2155faab778SVincenzo Maffione 			}
216b6e66be2SVincenzo Maffione 			break;
217b6e66be2SVincenzo Maffione 		}
218b6e66be2SVincenzo Maffione 
219b6e66be2SVincenzo Maffione 		if (unlikely(netmap_debug & NM_DEBUG_TXSYNC)) {
220b6e66be2SVincenzo Maffione 			sync_kloop_kring_dump("pre txsync", kring);
221b6e66be2SVincenzo Maffione 		}
222b6e66be2SVincenzo Maffione 
223b6e66be2SVincenzo Maffione 		if (unlikely(kring->nm_sync(kring, shadow_ring.flags))) {
2245faab778SVincenzo Maffione 			if (!a->busy_wait) {
22545c67e8fSVincenzo Maffione 				/* Re-enable notifications. */
226b6e66be2SVincenzo Maffione 				csb_ktoa_kick_enable(csb_ktoa, 1);
2275faab778SVincenzo Maffione 			}
228b6e66be2SVincenzo Maffione 			nm_prerr("txsync() failed");
229b6e66be2SVincenzo Maffione 			break;
230b6e66be2SVincenzo Maffione 		}
231b6e66be2SVincenzo Maffione 
232b6e66be2SVincenzo Maffione 		/*
233b6e66be2SVincenzo Maffione 		 * Finalize
234b6e66be2SVincenzo Maffione 		 * Copy kernel hwcur and hwtail into the CSB for the application sync(), and
235b6e66be2SVincenzo Maffione 		 * do the nm_sync_finalize.
236b6e66be2SVincenzo Maffione 		 */
237b6e66be2SVincenzo Maffione 		sync_kloop_kernel_write(csb_ktoa, kring->nr_hwcur,
238b6e66be2SVincenzo Maffione 				kring->nr_hwtail);
239b6e66be2SVincenzo Maffione 		if (kring->rtail != kring->nr_hwtail) {
240b6e66be2SVincenzo Maffione 			/* Some more room available in the parent adapter. */
241b6e66be2SVincenzo Maffione 			kring->rtail = kring->nr_hwtail;
2426d2a46f0SJohn Baldwin #ifdef SYNC_KLOOP_POLL
243b6e66be2SVincenzo Maffione 			more_txspace = true;
2446d2a46f0SJohn Baldwin #endif /* SYNC_KLOOP_POLL */
245b6e66be2SVincenzo Maffione 		}
246b6e66be2SVincenzo Maffione 
247b6e66be2SVincenzo Maffione 		if (unlikely(netmap_debug & NM_DEBUG_TXSYNC)) {
248b6e66be2SVincenzo Maffione 			sync_kloop_kring_dump("post txsync", kring);
249b6e66be2SVincenzo Maffione 		}
250b6e66be2SVincenzo Maffione 
251b6e66be2SVincenzo Maffione 		/* Interrupt the application if needed. */
252b6e66be2SVincenzo Maffione #ifdef SYNC_KLOOP_POLL
253b6e66be2SVincenzo Maffione 		if (a->irq_ctx && more_txspace && csb_atok_intr_enabled(csb_atok)) {
2545faab778SVincenzo Maffione 			/* We could disable kernel --> application kicks here,
2555faab778SVincenzo Maffione 			 * to avoid spurious interrupts. */
256b6e66be2SVincenzo Maffione 			eventfd_signal(a->irq_ctx, 1);
257b6e66be2SVincenzo Maffione 			more_txspace = false;
258b6e66be2SVincenzo Maffione 		}
259b6e66be2SVincenzo Maffione #endif /* SYNC_KLOOP_POLL */
260b6e66be2SVincenzo Maffione 
261b6e66be2SVincenzo Maffione 		/* Read CSB to see if there is more work to do. */
262b6e66be2SVincenzo Maffione 		sync_kloop_kernel_read(csb_atok, &shadow_ring, num_slots);
263b6e66be2SVincenzo Maffione 		if (shadow_ring.head == kring->rhead) {
2645faab778SVincenzo Maffione 			if (a->busy_wait) {
2655faab778SVincenzo Maffione 				break;
2665faab778SVincenzo Maffione 			}
267b6e66be2SVincenzo Maffione 			/*
268b6e66be2SVincenzo Maffione 			 * No more packets to transmit. We enable notifications and
269b6e66be2SVincenzo Maffione 			 * go to sleep, waiting for a kick from the application when new
270b6e66be2SVincenzo Maffione 			 * new slots are ready for transmission.
271b6e66be2SVincenzo Maffione 			 */
27245c67e8fSVincenzo Maffione 			/* Re-enable notifications. */
273b6e66be2SVincenzo Maffione 			csb_ktoa_kick_enable(csb_ktoa, 1);
274f79ba6d7SVincenzo Maffione 			/* Double check, with store-load memory barrier. */
275f79ba6d7SVincenzo Maffione 			nm_stld_barrier();
276b6e66be2SVincenzo Maffione 			sync_kloop_kernel_read(csb_atok, &shadow_ring, num_slots);
277b6e66be2SVincenzo Maffione 			if (shadow_ring.head != kring->rhead) {
278b6e66be2SVincenzo Maffione 				/* We won the race condition, there are more packets to
279b6e66be2SVincenzo Maffione 				 * transmit. Disable notifications and do another cycle */
280b6e66be2SVincenzo Maffione 				csb_ktoa_kick_enable(csb_ktoa, 0);
281b6e66be2SVincenzo Maffione 				continue;
282b6e66be2SVincenzo Maffione 			}
283b6e66be2SVincenzo Maffione 			break;
284b6e66be2SVincenzo Maffione 		}
285b6e66be2SVincenzo Maffione 
286b6e66be2SVincenzo Maffione 		if (nm_kr_txempty(kring)) {
287b6e66be2SVincenzo Maffione 			/* No more available TX slots. We stop waiting for a notification
288b6e66be2SVincenzo Maffione 			 * from the backend (netmap_tx_irq). */
289b6e66be2SVincenzo Maffione 			nm_prdis(1, "TX ring");
290b6e66be2SVincenzo Maffione 			break;
291b6e66be2SVincenzo Maffione 		}
292b6e66be2SVincenzo Maffione 	}
293b6e66be2SVincenzo Maffione 
2945faab778SVincenzo Maffione 	nm_kr_put(kring);
2955faab778SVincenzo Maffione 
296b6e66be2SVincenzo Maffione #ifdef SYNC_KLOOP_POLL
297b6e66be2SVincenzo Maffione 	if (a->irq_ctx && more_txspace && csb_atok_intr_enabled(csb_atok)) {
298b6e66be2SVincenzo Maffione 		eventfd_signal(a->irq_ctx, 1);
299b6e66be2SVincenzo Maffione 	}
300b6e66be2SVincenzo Maffione #endif /* SYNC_KLOOP_POLL */
301b6e66be2SVincenzo Maffione }
302b6e66be2SVincenzo Maffione 
/* Maximum number of consecutive RX cycles that do not receive any packet. */
#define SYNC_LOOP_RX_DRY_CYCLES_MAX	2
305b6e66be2SVincenzo Maffione 
306b6e66be2SVincenzo Maffione static inline int
sync_kloop_norxslots(struct netmap_kring * kring,uint32_t g_head)307b6e66be2SVincenzo Maffione sync_kloop_norxslots(struct netmap_kring *kring, uint32_t g_head)
308b6e66be2SVincenzo Maffione {
309b6e66be2SVincenzo Maffione 	return (NM_ACCESS_ONCE(kring->nr_hwtail) == nm_prev(g_head,
310b6e66be2SVincenzo Maffione 				kring->nkr_num_slots - 1));
311b6e66be2SVincenzo Maffione }
312b6e66be2SVincenzo Maffione 
313b6e66be2SVincenzo Maffione static void
netmap_sync_kloop_rx_ring(const struct sync_kloop_ring_args * a)314b6e66be2SVincenzo Maffione netmap_sync_kloop_rx_ring(const struct sync_kloop_ring_args *a)
315b6e66be2SVincenzo Maffione {
316b6e66be2SVincenzo Maffione 
317b6e66be2SVincenzo Maffione 	struct netmap_kring *kring = a->kring;
318b6e66be2SVincenzo Maffione 	struct nm_csb_atok *csb_atok = a->csb_atok;
319b6e66be2SVincenzo Maffione 	struct nm_csb_ktoa *csb_ktoa = a->csb_ktoa;
320b6e66be2SVincenzo Maffione 	struct netmap_ring shadow_ring; /* shadow copy of the netmap_ring */
321b6e66be2SVincenzo Maffione 	int dry_cycles = 0;
3226d2a46f0SJohn Baldwin #ifdef SYNC_KLOOP_POLL
323b6e66be2SVincenzo Maffione 	bool some_recvd = false;
3246d2a46f0SJohn Baldwin #endif /* SYNC_KLOOP_POLL */
325b6e66be2SVincenzo Maffione 	uint32_t num_slots;
326b6e66be2SVincenzo Maffione 
3275faab778SVincenzo Maffione 	if (unlikely(nm_kr_tryget(kring, 1, NULL))) {
3285faab778SVincenzo Maffione 		return;
3295faab778SVincenzo Maffione 	}
3305faab778SVincenzo Maffione 
331b6e66be2SVincenzo Maffione 	num_slots = kring->nkr_num_slots;
332b6e66be2SVincenzo Maffione 
333b6e66be2SVincenzo Maffione 	/* Get RX csb_atok and csb_ktoa pointers from the CSB. */
334b6e66be2SVincenzo Maffione 	num_slots = kring->nkr_num_slots;
335b6e66be2SVincenzo Maffione 
336b6e66be2SVincenzo Maffione 	/* Disable notifications. */
3375faab778SVincenzo Maffione 	if (!a->direct) {
338b6e66be2SVincenzo Maffione 		csb_ktoa_kick_enable(csb_ktoa, 0);
3395faab778SVincenzo Maffione 	}
340b6e66be2SVincenzo Maffione 	/* Copy the application kring pointers from the CSB */
341b6e66be2SVincenzo Maffione 	sync_kloop_kernel_read(csb_atok, &shadow_ring, num_slots);
342b6e66be2SVincenzo Maffione 
343b6e66be2SVincenzo Maffione 	for (;;) {
344b6e66be2SVincenzo Maffione 		uint32_t hwtail;
345b6e66be2SVincenzo Maffione 
346b6e66be2SVincenzo Maffione 		/* Netmap prologue */
347b6e66be2SVincenzo Maffione 		shadow_ring.tail = kring->rtail;
348b6e66be2SVincenzo Maffione 		if (unlikely(nm_rxsync_prologue(kring, &shadow_ring) >= num_slots)) {
349b6e66be2SVincenzo Maffione 			/* Reinit ring and enable notifications. */
350b6e66be2SVincenzo Maffione 			netmap_ring_reinit(kring);
3515faab778SVincenzo Maffione 			if (!a->busy_wait) {
352b6e66be2SVincenzo Maffione 				csb_ktoa_kick_enable(csb_ktoa, 1);
3535faab778SVincenzo Maffione 			}
354b6e66be2SVincenzo Maffione 			break;
355b6e66be2SVincenzo Maffione 		}
356b6e66be2SVincenzo Maffione 
357b6e66be2SVincenzo Maffione 		if (unlikely(netmap_debug & NM_DEBUG_RXSYNC)) {
358b6e66be2SVincenzo Maffione 			sync_kloop_kring_dump("pre rxsync", kring);
359b6e66be2SVincenzo Maffione 		}
360b6e66be2SVincenzo Maffione 
361b6e66be2SVincenzo Maffione 		if (unlikely(kring->nm_sync(kring, shadow_ring.flags))) {
3625faab778SVincenzo Maffione 			if (!a->busy_wait) {
36345c67e8fSVincenzo Maffione 				/* Re-enable notifications. */
364b6e66be2SVincenzo Maffione 				csb_ktoa_kick_enable(csb_ktoa, 1);
3655faab778SVincenzo Maffione 			}
366b6e66be2SVincenzo Maffione 			nm_prerr("rxsync() failed");
367b6e66be2SVincenzo Maffione 			break;
368b6e66be2SVincenzo Maffione 		}
369b6e66be2SVincenzo Maffione 
370b6e66be2SVincenzo Maffione 		/*
371b6e66be2SVincenzo Maffione 		 * Finalize
372b6e66be2SVincenzo Maffione 		 * Copy kernel hwcur and hwtail into the CSB for the application sync()
373b6e66be2SVincenzo Maffione 		 */
374b6e66be2SVincenzo Maffione 		hwtail = NM_ACCESS_ONCE(kring->nr_hwtail);
375b6e66be2SVincenzo Maffione 		sync_kloop_kernel_write(csb_ktoa, kring->nr_hwcur, hwtail);
376b6e66be2SVincenzo Maffione 		if (kring->rtail != hwtail) {
377b6e66be2SVincenzo Maffione 			kring->rtail = hwtail;
3786d2a46f0SJohn Baldwin #ifdef SYNC_KLOOP_POLL
379b6e66be2SVincenzo Maffione 			some_recvd = true;
3806d2a46f0SJohn Baldwin #endif /* SYNC_KLOOP_POLL */
381b6e66be2SVincenzo Maffione 			dry_cycles = 0;
382b6e66be2SVincenzo Maffione 		} else {
383b6e66be2SVincenzo Maffione 			dry_cycles++;
384b6e66be2SVincenzo Maffione 		}
385b6e66be2SVincenzo Maffione 
386b6e66be2SVincenzo Maffione 		if (unlikely(netmap_debug & NM_DEBUG_RXSYNC)) {
387b6e66be2SVincenzo Maffione 			sync_kloop_kring_dump("post rxsync", kring);
388b6e66be2SVincenzo Maffione 		}
389b6e66be2SVincenzo Maffione 
390b6e66be2SVincenzo Maffione #ifdef SYNC_KLOOP_POLL
391b6e66be2SVincenzo Maffione 		/* Interrupt the application if needed. */
392b6e66be2SVincenzo Maffione 		if (a->irq_ctx && some_recvd && csb_atok_intr_enabled(csb_atok)) {
3935faab778SVincenzo Maffione 			/* We could disable kernel --> application kicks here,
3945faab778SVincenzo Maffione 			 * to avoid spurious interrupts. */
395b6e66be2SVincenzo Maffione 			eventfd_signal(a->irq_ctx, 1);
396b6e66be2SVincenzo Maffione 			some_recvd = false;
397b6e66be2SVincenzo Maffione 		}
398b6e66be2SVincenzo Maffione #endif /* SYNC_KLOOP_POLL */
399b6e66be2SVincenzo Maffione 
400b6e66be2SVincenzo Maffione 		/* Read CSB to see if there is more work to do. */
401b6e66be2SVincenzo Maffione 		sync_kloop_kernel_read(csb_atok, &shadow_ring, num_slots);
402b6e66be2SVincenzo Maffione 		if (sync_kloop_norxslots(kring, shadow_ring.head)) {
4035faab778SVincenzo Maffione 			if (a->busy_wait) {
4045faab778SVincenzo Maffione 				break;
4055faab778SVincenzo Maffione 			}
406b6e66be2SVincenzo Maffione 			/*
407b6e66be2SVincenzo Maffione 			 * No more slots available for reception. We enable notification and
408b6e66be2SVincenzo Maffione 			 * go to sleep, waiting for a kick from the application when new receive
409b6e66be2SVincenzo Maffione 			 * slots are available.
410b6e66be2SVincenzo Maffione 			 */
41145c67e8fSVincenzo Maffione 			/* Re-enable notifications. */
412b6e66be2SVincenzo Maffione 			csb_ktoa_kick_enable(csb_ktoa, 1);
413f79ba6d7SVincenzo Maffione 			/* Double check, with store-load memory barrier. */
414f79ba6d7SVincenzo Maffione 			nm_stld_barrier();
415b6e66be2SVincenzo Maffione 			sync_kloop_kernel_read(csb_atok, &shadow_ring, num_slots);
416b6e66be2SVincenzo Maffione 			if (!sync_kloop_norxslots(kring, shadow_ring.head)) {
417b6e66be2SVincenzo Maffione 				/* We won the race condition, more slots are available. Disable
418b6e66be2SVincenzo Maffione 				 * notifications and do another cycle. */
419b6e66be2SVincenzo Maffione 				csb_ktoa_kick_enable(csb_ktoa, 0);
420b6e66be2SVincenzo Maffione 				continue;
421b6e66be2SVincenzo Maffione 			}
422b6e66be2SVincenzo Maffione 			break;
423b6e66be2SVincenzo Maffione 		}
424b6e66be2SVincenzo Maffione 
425b6e66be2SVincenzo Maffione 		hwtail = NM_ACCESS_ONCE(kring->nr_hwtail);
426b6e66be2SVincenzo Maffione 		if (unlikely(hwtail == kring->rhead ||
427b6e66be2SVincenzo Maffione 					dry_cycles >= SYNC_LOOP_RX_DRY_CYCLES_MAX)) {
428b6e66be2SVincenzo Maffione 			/* No more packets to be read from the backend. We stop and
429b6e66be2SVincenzo Maffione 			 * wait for a notification from the backend (netmap_rx_irq). */
430b6e66be2SVincenzo Maffione 			nm_prdis(1, "nr_hwtail: %d rhead: %d dry_cycles: %d",
431b6e66be2SVincenzo Maffione 					hwtail, kring->rhead, dry_cycles);
432b6e66be2SVincenzo Maffione 			break;
433b6e66be2SVincenzo Maffione 		}
434b6e66be2SVincenzo Maffione 	}
435b6e66be2SVincenzo Maffione 
436b6e66be2SVincenzo Maffione 	nm_kr_put(kring);
437b6e66be2SVincenzo Maffione 
438b6e66be2SVincenzo Maffione #ifdef SYNC_KLOOP_POLL
439b6e66be2SVincenzo Maffione 	/* Interrupt the application if needed. */
440b6e66be2SVincenzo Maffione 	if (a->irq_ctx && some_recvd && csb_atok_intr_enabled(csb_atok)) {
441b6e66be2SVincenzo Maffione 		eventfd_signal(a->irq_ctx, 1);
442b6e66be2SVincenzo Maffione 	}
443b6e66be2SVincenzo Maffione #endif /* SYNC_KLOOP_POLL */
444b6e66be2SVincenzo Maffione }
445b6e66be2SVincenzo Maffione 
446b6e66be2SVincenzo Maffione #ifdef SYNC_KLOOP_POLL
4475faab778SVincenzo Maffione struct sync_kloop_poll_ctx;
448b6e66be2SVincenzo Maffione struct sync_kloop_poll_entry {
449b6e66be2SVincenzo Maffione 	/* Support for receiving notifications from
450b6e66be2SVincenzo Maffione 	 * a netmap ring or from the application. */
451b6e66be2SVincenzo Maffione 	struct file *filp;
452b6e66be2SVincenzo Maffione 	wait_queue_t wait;
453b6e66be2SVincenzo Maffione 	wait_queue_head_t *wqh;
454b6e66be2SVincenzo Maffione 
455b6e66be2SVincenzo Maffione 	/* Support for sending notifications to the application. */
456b6e66be2SVincenzo Maffione 	struct eventfd_ctx *irq_ctx;
457b6e66be2SVincenzo Maffione 	struct file *irq_filp;
4585faab778SVincenzo Maffione 
4595faab778SVincenzo Maffione 	/* Arguments for the ring processing function. Useful
4605faab778SVincenzo Maffione 	 * in case of custom wake-up function. */
4615faab778SVincenzo Maffione 	struct sync_kloop_ring_args *args;
4625faab778SVincenzo Maffione 	struct sync_kloop_poll_ctx *parent;
4635faab778SVincenzo Maffione 
464b6e66be2SVincenzo Maffione };
465b6e66be2SVincenzo Maffione 
466b6e66be2SVincenzo Maffione struct sync_kloop_poll_ctx {
467b6e66be2SVincenzo Maffione 	poll_table wait_table;
468b6e66be2SVincenzo Maffione 	unsigned int next_entry;
4695faab778SVincenzo Maffione 	int (*next_wake_fun)(wait_queue_t *, unsigned, int, void *);
470b6e66be2SVincenzo Maffione 	unsigned int num_entries;
4715faab778SVincenzo Maffione 	unsigned int num_tx_rings;
4725faab778SVincenzo Maffione 	unsigned int num_rings;
4735faab778SVincenzo Maffione 	/* First num_tx_rings entries are for the TX kicks.
4745faab778SVincenzo Maffione 	 * Then the RX kicks entries follow. The last two
4755faab778SVincenzo Maffione 	 * entries are for TX irq, and RX irq. */
476b6e66be2SVincenzo Maffione 	struct sync_kloop_poll_entry entries[0];
477b6e66be2SVincenzo Maffione };
478b6e66be2SVincenzo Maffione 
479b6e66be2SVincenzo Maffione static void
sync_kloop_poll_table_queue_proc(struct file * file,wait_queue_head_t * wqh,poll_table * pt)480b6e66be2SVincenzo Maffione sync_kloop_poll_table_queue_proc(struct file *file, wait_queue_head_t *wqh,
481b6e66be2SVincenzo Maffione 				poll_table *pt)
482b6e66be2SVincenzo Maffione {
483b6e66be2SVincenzo Maffione 	struct sync_kloop_poll_ctx *poll_ctx =
484b6e66be2SVincenzo Maffione 		container_of(pt, struct sync_kloop_poll_ctx, wait_table);
485b6e66be2SVincenzo Maffione 	struct sync_kloop_poll_entry *entry = poll_ctx->entries +
486b6e66be2SVincenzo Maffione 						poll_ctx->next_entry;
487b6e66be2SVincenzo Maffione 
488b6e66be2SVincenzo Maffione 	BUG_ON(poll_ctx->next_entry >= poll_ctx->num_entries);
489b6e66be2SVincenzo Maffione 	entry->wqh = wqh;
490b6e66be2SVincenzo Maffione 	entry->filp = file;
491b6e66be2SVincenzo Maffione 	/* Use the default wake up function. */
4925faab778SVincenzo Maffione 	if (poll_ctx->next_wake_fun == NULL) {
493b6e66be2SVincenzo Maffione 		init_waitqueue_entry(&entry->wait, current);
4945faab778SVincenzo Maffione 	} else {
4955faab778SVincenzo Maffione 		init_waitqueue_func_entry(&entry->wait,
4965faab778SVincenzo Maffione 		    poll_ctx->next_wake_fun);
4975faab778SVincenzo Maffione 	}
498b6e66be2SVincenzo Maffione 	add_wait_queue(wqh, &entry->wait);
4995faab778SVincenzo Maffione }
5005faab778SVincenzo Maffione 
5015faab778SVincenzo Maffione static int
sync_kloop_tx_kick_wake_fun(wait_queue_t * wait,unsigned mode,int wake_flags,void * key)5025faab778SVincenzo Maffione sync_kloop_tx_kick_wake_fun(wait_queue_t *wait, unsigned mode,
5035faab778SVincenzo Maffione     int wake_flags, void *key)
5045faab778SVincenzo Maffione {
5055faab778SVincenzo Maffione 	struct sync_kloop_poll_entry *entry =
5065faab778SVincenzo Maffione 	    container_of(wait, struct sync_kloop_poll_entry, wait);
5075faab778SVincenzo Maffione 
5085faab778SVincenzo Maffione 	netmap_sync_kloop_tx_ring(entry->args);
5095faab778SVincenzo Maffione 
5105faab778SVincenzo Maffione 	return 0;
5115faab778SVincenzo Maffione }
5125faab778SVincenzo Maffione 
5135faab778SVincenzo Maffione static int
sync_kloop_tx_irq_wake_fun(wait_queue_t * wait,unsigned mode,int wake_flags,void * key)5145faab778SVincenzo Maffione sync_kloop_tx_irq_wake_fun(wait_queue_t *wait, unsigned mode,
5155faab778SVincenzo Maffione     int wake_flags, void *key)
5165faab778SVincenzo Maffione {
5175faab778SVincenzo Maffione 	struct sync_kloop_poll_entry *entry =
5185faab778SVincenzo Maffione 	    container_of(wait, struct sync_kloop_poll_entry, wait);
5195faab778SVincenzo Maffione 	struct sync_kloop_poll_ctx *poll_ctx = entry->parent;
5205faab778SVincenzo Maffione 	int i;
5215faab778SVincenzo Maffione 
5225faab778SVincenzo Maffione 	for (i = 0; i < poll_ctx->num_tx_rings; i++) {
5235faab778SVincenzo Maffione 		struct eventfd_ctx *irq_ctx = poll_ctx->entries[i].irq_ctx;
5245faab778SVincenzo Maffione 
5255faab778SVincenzo Maffione 		if (irq_ctx) {
5265faab778SVincenzo Maffione 			eventfd_signal(irq_ctx, 1);
5275faab778SVincenzo Maffione 		}
5285faab778SVincenzo Maffione 	}
5295faab778SVincenzo Maffione 
5305faab778SVincenzo Maffione 	return 0;
5315faab778SVincenzo Maffione }
5325faab778SVincenzo Maffione 
5335faab778SVincenzo Maffione static int
sync_kloop_rx_kick_wake_fun(wait_queue_t * wait,unsigned mode,int wake_flags,void * key)5345faab778SVincenzo Maffione sync_kloop_rx_kick_wake_fun(wait_queue_t *wait, unsigned mode,
5355faab778SVincenzo Maffione     int wake_flags, void *key)
5365faab778SVincenzo Maffione {
5375faab778SVincenzo Maffione 	struct sync_kloop_poll_entry *entry =
5385faab778SVincenzo Maffione 	    container_of(wait, struct sync_kloop_poll_entry, wait);
5395faab778SVincenzo Maffione 
5405faab778SVincenzo Maffione 	netmap_sync_kloop_rx_ring(entry->args);
5415faab778SVincenzo Maffione 
5425faab778SVincenzo Maffione 	return 0;
5435faab778SVincenzo Maffione }
5445faab778SVincenzo Maffione 
5455faab778SVincenzo Maffione static int
sync_kloop_rx_irq_wake_fun(wait_queue_t * wait,unsigned mode,int wake_flags,void * key)5465faab778SVincenzo Maffione sync_kloop_rx_irq_wake_fun(wait_queue_t *wait, unsigned mode,
5475faab778SVincenzo Maffione     int wake_flags, void *key)
5485faab778SVincenzo Maffione {
5495faab778SVincenzo Maffione 	struct sync_kloop_poll_entry *entry =
5505faab778SVincenzo Maffione 	    container_of(wait, struct sync_kloop_poll_entry, wait);
5515faab778SVincenzo Maffione 	struct sync_kloop_poll_ctx *poll_ctx = entry->parent;
5525faab778SVincenzo Maffione 	int i;
5535faab778SVincenzo Maffione 
5545faab778SVincenzo Maffione 	for (i = poll_ctx->num_tx_rings; i < poll_ctx->num_rings; i++) {
5555faab778SVincenzo Maffione 		struct eventfd_ctx *irq_ctx = poll_ctx->entries[i].irq_ctx;
5565faab778SVincenzo Maffione 
5575faab778SVincenzo Maffione 		if (irq_ctx) {
5585faab778SVincenzo Maffione 			eventfd_signal(irq_ctx, 1);
5595faab778SVincenzo Maffione 		}
5605faab778SVincenzo Maffione 	}
5615faab778SVincenzo Maffione 
5625faab778SVincenzo Maffione 	return 0;
563b6e66be2SVincenzo Maffione }
564b6e66be2SVincenzo Maffione #endif  /* SYNC_KLOOP_POLL */
565b6e66be2SVincenzo Maffione 
566b6e66be2SVincenzo Maffione int
netmap_sync_kloop(struct netmap_priv_d * priv,struct nmreq_header * hdr)567b6e66be2SVincenzo Maffione netmap_sync_kloop(struct netmap_priv_d *priv, struct nmreq_header *hdr)
568b6e66be2SVincenzo Maffione {
569b6e66be2SVincenzo Maffione 	struct nmreq_sync_kloop_start *req =
570b6e66be2SVincenzo Maffione 		(struct nmreq_sync_kloop_start *)(uintptr_t)hdr->nr_body;
571b6e66be2SVincenzo Maffione 	struct nmreq_opt_sync_kloop_eventfds *eventfds_opt = NULL;
572b6e66be2SVincenzo Maffione #ifdef SYNC_KLOOP_POLL
573b6e66be2SVincenzo Maffione 	struct sync_kloop_poll_ctx *poll_ctx = NULL;
574b6e66be2SVincenzo Maffione #endif  /* SYNC_KLOOP_POLL */
575b6e66be2SVincenzo Maffione 	int num_rx_rings, num_tx_rings, num_rings;
576f79ba6d7SVincenzo Maffione 	struct sync_kloop_ring_args *args = NULL;
577b6e66be2SVincenzo Maffione 	uint32_t sleep_us = req->sleep_us;
578b6e66be2SVincenzo Maffione 	struct nm_csb_atok* csb_atok_base;
579b6e66be2SVincenzo Maffione 	struct nm_csb_ktoa* csb_ktoa_base;
580b6e66be2SVincenzo Maffione 	struct netmap_adapter *na;
581b6e66be2SVincenzo Maffione 	struct nmreq_option *opt;
5825faab778SVincenzo Maffione 	bool na_could_sleep = false;
5835faab778SVincenzo Maffione 	bool busy_wait = true;
5845faab778SVincenzo Maffione 	bool direct_tx = false;
5855faab778SVincenzo Maffione 	bool direct_rx = false;
586b6e66be2SVincenzo Maffione 	int err = 0;
587b6e66be2SVincenzo Maffione 	int i;
588b6e66be2SVincenzo Maffione 
589b6e66be2SVincenzo Maffione 	if (sleep_us > 1000000) {
590b6e66be2SVincenzo Maffione 		/* We do not accept sleeping for more than a second. */
591b6e66be2SVincenzo Maffione 		return EINVAL;
592b6e66be2SVincenzo Maffione 	}
593b6e66be2SVincenzo Maffione 
594b6e66be2SVincenzo Maffione 	if (priv->np_nifp == NULL) {
595b6e66be2SVincenzo Maffione 		return ENXIO;
596b6e66be2SVincenzo Maffione 	}
597b6e66be2SVincenzo Maffione 	mb(); /* make sure following reads are not from cache */
598b6e66be2SVincenzo Maffione 
599b6e66be2SVincenzo Maffione 	na = priv->np_na;
600b6e66be2SVincenzo Maffione 	if (!nm_netmap_on(na)) {
601b6e66be2SVincenzo Maffione 		return ENXIO;
602b6e66be2SVincenzo Maffione 	}
603b6e66be2SVincenzo Maffione 
604b6e66be2SVincenzo Maffione 	NMG_LOCK();
605b6e66be2SVincenzo Maffione 	/* Make sure the application is working in CSB mode. */
606b6e66be2SVincenzo Maffione 	if (!priv->np_csb_atok_base || !priv->np_csb_ktoa_base) {
607b6e66be2SVincenzo Maffione 		NMG_UNLOCK();
608b6e66be2SVincenzo Maffione 		nm_prerr("sync-kloop on %s requires "
609b6e66be2SVincenzo Maffione 				"NETMAP_REQ_OPT_CSB option", na->name);
610b6e66be2SVincenzo Maffione 		return EINVAL;
611b6e66be2SVincenzo Maffione 	}
612b6e66be2SVincenzo Maffione 
613b6e66be2SVincenzo Maffione 	csb_atok_base = priv->np_csb_atok_base;
614b6e66be2SVincenzo Maffione 	csb_ktoa_base = priv->np_csb_ktoa_base;
615b6e66be2SVincenzo Maffione 
616b6e66be2SVincenzo Maffione 	/* Make sure that no kloop is currently running. */
617b6e66be2SVincenzo Maffione 	if (priv->np_kloop_state & NM_SYNC_KLOOP_RUNNING) {
618b6e66be2SVincenzo Maffione 		err = EBUSY;
619b6e66be2SVincenzo Maffione 	}
620b6e66be2SVincenzo Maffione 	priv->np_kloop_state |= NM_SYNC_KLOOP_RUNNING;
621b6e66be2SVincenzo Maffione 	NMG_UNLOCK();
622b6e66be2SVincenzo Maffione 	if (err) {
623b6e66be2SVincenzo Maffione 		return err;
624b6e66be2SVincenzo Maffione 	}
625b6e66be2SVincenzo Maffione 
626b6e66be2SVincenzo Maffione 	num_rx_rings = priv->np_qlast[NR_RX] - priv->np_qfirst[NR_RX];
627b6e66be2SVincenzo Maffione 	num_tx_rings = priv->np_qlast[NR_TX] - priv->np_qfirst[NR_TX];
628b6e66be2SVincenzo Maffione 	num_rings = num_tx_rings + num_rx_rings;
629b6e66be2SVincenzo Maffione 
630f79ba6d7SVincenzo Maffione 	args = nm_os_malloc(num_rings * sizeof(args[0]));
631f79ba6d7SVincenzo Maffione 	if (!args) {
632f79ba6d7SVincenzo Maffione 		err = ENOMEM;
633f79ba6d7SVincenzo Maffione 		goto out;
634f79ba6d7SVincenzo Maffione 	}
635f79ba6d7SVincenzo Maffione 
6365faab778SVincenzo Maffione 	/* Prepare the arguments for netmap_sync_kloop_tx_ring()
6375faab778SVincenzo Maffione 	 * and netmap_sync_kloop_rx_ring(). */
6385faab778SVincenzo Maffione 	for (i = 0; i < num_tx_rings; i++) {
6395faab778SVincenzo Maffione 		struct sync_kloop_ring_args *a = args + i;
6405faab778SVincenzo Maffione 
6415faab778SVincenzo Maffione 		a->kring = NMR(na, NR_TX)[i + priv->np_qfirst[NR_TX]];
6425faab778SVincenzo Maffione 		a->csb_atok = csb_atok_base + i;
6435faab778SVincenzo Maffione 		a->csb_ktoa = csb_ktoa_base + i;
6445faab778SVincenzo Maffione 		a->busy_wait = busy_wait;
6455faab778SVincenzo Maffione 		a->direct = direct_tx;
6465faab778SVincenzo Maffione 	}
6475faab778SVincenzo Maffione 	for (i = 0; i < num_rx_rings; i++) {
6485faab778SVincenzo Maffione 		struct sync_kloop_ring_args *a = args + num_tx_rings + i;
6495faab778SVincenzo Maffione 
6505faab778SVincenzo Maffione 		a->kring = NMR(na, NR_RX)[i + priv->np_qfirst[NR_RX]];
6515faab778SVincenzo Maffione 		a->csb_atok = csb_atok_base + num_tx_rings + i;
6525faab778SVincenzo Maffione 		a->csb_ktoa = csb_ktoa_base + num_tx_rings + i;
6535faab778SVincenzo Maffione 		a->busy_wait = busy_wait;
6545faab778SVincenzo Maffione 		a->direct = direct_rx;
6555faab778SVincenzo Maffione 	}
6565faab778SVincenzo Maffione 
657b6e66be2SVincenzo Maffione 	/* Validate notification options. */
658253b2ec1SVincenzo Maffione 	opt = nmreq_getoption(hdr, NETMAP_REQ_OPT_SYNC_KLOOP_MODE);
6595faab778SVincenzo Maffione 	if (opt != NULL) {
6605faab778SVincenzo Maffione 		struct nmreq_opt_sync_kloop_mode *mode_opt =
6615faab778SVincenzo Maffione 		    (struct nmreq_opt_sync_kloop_mode *)opt;
6625faab778SVincenzo Maffione 
6635faab778SVincenzo Maffione 		direct_tx = !!(mode_opt->mode & NM_OPT_SYNC_KLOOP_DIRECT_TX);
6645faab778SVincenzo Maffione 		direct_rx = !!(mode_opt->mode & NM_OPT_SYNC_KLOOP_DIRECT_RX);
6655faab778SVincenzo Maffione 		if (mode_opt->mode & ~(NM_OPT_SYNC_KLOOP_DIRECT_TX |
6665faab778SVincenzo Maffione 		    NM_OPT_SYNC_KLOOP_DIRECT_RX)) {
6675faab778SVincenzo Maffione 			opt->nro_status = err = EINVAL;
6685faab778SVincenzo Maffione 			goto out;
6695faab778SVincenzo Maffione 		}
6705faab778SVincenzo Maffione 		opt->nro_status = 0;
6715faab778SVincenzo Maffione 	}
672253b2ec1SVincenzo Maffione 	opt = nmreq_getoption(hdr, NETMAP_REQ_OPT_SYNC_KLOOP_EVENTFDS);
673b6e66be2SVincenzo Maffione 	if (opt != NULL) {
674b6e66be2SVincenzo Maffione 		if (opt->nro_size != sizeof(*eventfds_opt) +
675b6e66be2SVincenzo Maffione 			sizeof(eventfds_opt->eventfds[0]) * num_rings) {
676b6e66be2SVincenzo Maffione 			/* Option size not consistent with the number of
677b6e66be2SVincenzo Maffione 			 * entries. */
678b6e66be2SVincenzo Maffione 			opt->nro_status = err = EINVAL;
679b6e66be2SVincenzo Maffione 			goto out;
680b6e66be2SVincenzo Maffione 		}
681b6e66be2SVincenzo Maffione #ifdef SYNC_KLOOP_POLL
682b6e66be2SVincenzo Maffione 		eventfds_opt = (struct nmreq_opt_sync_kloop_eventfds *)opt;
683b6e66be2SVincenzo Maffione 		opt->nro_status = 0;
6845faab778SVincenzo Maffione 
6855faab778SVincenzo Maffione 		/* Check if some ioeventfd entry is not defined, and force sleep
6865faab778SVincenzo Maffione 		 * synchronization in that case. */
6875faab778SVincenzo Maffione 		busy_wait = false;
6885faab778SVincenzo Maffione 		for (i = 0; i < num_rings; i++) {
6895faab778SVincenzo Maffione 			if (eventfds_opt->eventfds[i].ioeventfd < 0) {
6905faab778SVincenzo Maffione 				busy_wait = true;
6915faab778SVincenzo Maffione 				break;
6925faab778SVincenzo Maffione 			}
6935faab778SVincenzo Maffione 		}
6945faab778SVincenzo Maffione 
6955faab778SVincenzo Maffione 		if (busy_wait && (direct_tx || direct_rx)) {
6965faab778SVincenzo Maffione 			/* For direct processing we need all the
6975faab778SVincenzo Maffione 			 * ioeventfds to be valid. */
6985faab778SVincenzo Maffione 			opt->nro_status = err = EINVAL;
6995faab778SVincenzo Maffione 			goto out;
7005faab778SVincenzo Maffione 		}
7015faab778SVincenzo Maffione 
702b6e66be2SVincenzo Maffione 		/* We need 2 poll entries for TX and RX notifications coming
703b6e66be2SVincenzo Maffione 		 * from the netmap adapter, plus one entries per ring for the
704b6e66be2SVincenzo Maffione 		 * notifications coming from the application. */
705b6e66be2SVincenzo Maffione 		poll_ctx = nm_os_malloc(sizeof(*poll_ctx) +
7065faab778SVincenzo Maffione 				(num_rings + 2) * sizeof(poll_ctx->entries[0]));
707b6e66be2SVincenzo Maffione 		init_poll_funcptr(&poll_ctx->wait_table,
708b6e66be2SVincenzo Maffione 					sync_kloop_poll_table_queue_proc);
709b6e66be2SVincenzo Maffione 		poll_ctx->num_entries = 2 + num_rings;
7105faab778SVincenzo Maffione 		poll_ctx->num_tx_rings = num_tx_rings;
7115faab778SVincenzo Maffione 		poll_ctx->num_rings = num_rings;
712b6e66be2SVincenzo Maffione 		poll_ctx->next_entry = 0;
7135faab778SVincenzo Maffione 		poll_ctx->next_wake_fun = NULL;
7145faab778SVincenzo Maffione 
7155faab778SVincenzo Maffione 		if (direct_tx && (na->na_flags & NAF_BDG_MAYSLEEP)) {
7165faab778SVincenzo Maffione 			/* In direct mode, VALE txsync is called from
7175faab778SVincenzo Maffione 			 * wake-up context, where it is not possible
7185faab778SVincenzo Maffione 			 * to sleep.
7195faab778SVincenzo Maffione 			 */
7205faab778SVincenzo Maffione 			na->na_flags &= ~NAF_BDG_MAYSLEEP;
7215faab778SVincenzo Maffione 			na_could_sleep = true;
7225faab778SVincenzo Maffione 		}
7235faab778SVincenzo Maffione 
7245faab778SVincenzo Maffione 		for (i = 0; i < num_rings + 2; i++) {
7255faab778SVincenzo Maffione 			poll_ctx->entries[i].args = args + i;
7265faab778SVincenzo Maffione 			poll_ctx->entries[i].parent = poll_ctx;
7275faab778SVincenzo Maffione 		}
7285faab778SVincenzo Maffione 
729b6e66be2SVincenzo Maffione 		/* Poll for notifications coming from the applications through
730b6e66be2SVincenzo Maffione 		 * eventfds. */
7315faab778SVincenzo Maffione 		for (i = 0; i < num_rings; i++, poll_ctx->next_entry++) {
7325faab778SVincenzo Maffione 			struct eventfd_ctx *irq = NULL;
7335faab778SVincenzo Maffione 			struct file *filp = NULL;
734b6e66be2SVincenzo Maffione 			unsigned long mask;
7355faab778SVincenzo Maffione 			bool tx_ring = (i < num_tx_rings);
736b6e66be2SVincenzo Maffione 
7375faab778SVincenzo Maffione 			if (eventfds_opt->eventfds[i].irqfd >= 0) {
7385faab778SVincenzo Maffione 				filp = eventfd_fget(
7395faab778SVincenzo Maffione 				    eventfds_opt->eventfds[i].irqfd);
740b6e66be2SVincenzo Maffione 				if (IS_ERR(filp)) {
741b6e66be2SVincenzo Maffione 					err = PTR_ERR(filp);
742b6e66be2SVincenzo Maffione 					goto out;
743b6e66be2SVincenzo Maffione 				}
744b6e66be2SVincenzo Maffione 				irq = eventfd_ctx_fileget(filp);
745b6e66be2SVincenzo Maffione 				if (IS_ERR(irq)) {
746b6e66be2SVincenzo Maffione 					err = PTR_ERR(irq);
747b6e66be2SVincenzo Maffione 					goto out;
748b6e66be2SVincenzo Maffione 				}
749b6e66be2SVincenzo Maffione 			}
7505faab778SVincenzo Maffione 			poll_ctx->entries[i].irq_filp = filp;
7515faab778SVincenzo Maffione 			poll_ctx->entries[i].irq_ctx = irq;
7525faab778SVincenzo Maffione 			poll_ctx->entries[i].args->busy_wait = busy_wait;
7535faab778SVincenzo Maffione 			/* Don't let netmap_sync_kloop_*x_ring() use
7545faab778SVincenzo Maffione 			 * IRQs in direct mode. */
7555faab778SVincenzo Maffione 			poll_ctx->entries[i].args->irq_ctx =
7565faab778SVincenzo Maffione 			    ((tx_ring && direct_tx) ||
7575faab778SVincenzo Maffione 			    (!tx_ring && direct_rx)) ? NULL :
7585faab778SVincenzo Maffione 			    poll_ctx->entries[i].irq_ctx;
7595faab778SVincenzo Maffione 			poll_ctx->entries[i].args->direct =
7605faab778SVincenzo Maffione 			    (tx_ring ? direct_tx : direct_rx);
7615faab778SVincenzo Maffione 
7625faab778SVincenzo Maffione 			if (!busy_wait) {
7635faab778SVincenzo Maffione 				filp = eventfd_fget(
7645faab778SVincenzo Maffione 				    eventfds_opt->eventfds[i].ioeventfd);
7655faab778SVincenzo Maffione 				if (IS_ERR(filp)) {
7665faab778SVincenzo Maffione 					err = PTR_ERR(filp);
7675faab778SVincenzo Maffione 					goto out;
7685faab778SVincenzo Maffione 				}
7695faab778SVincenzo Maffione 				if (tx_ring && direct_tx) {
7705faab778SVincenzo Maffione 					/* Override the wake up function
7715faab778SVincenzo Maffione 					 * so that it can directly call
7725faab778SVincenzo Maffione 					 * netmap_sync_kloop_tx_ring().
7735faab778SVincenzo Maffione 					 */
7745faab778SVincenzo Maffione 					poll_ctx->next_wake_fun =
7755faab778SVincenzo Maffione 					    sync_kloop_tx_kick_wake_fun;
7765faab778SVincenzo Maffione 				} else if (!tx_ring && direct_rx) {
7775faab778SVincenzo Maffione 					/* Same for direct RX. */
7785faab778SVincenzo Maffione 					poll_ctx->next_wake_fun =
7795faab778SVincenzo Maffione 					    sync_kloop_rx_kick_wake_fun;
7805faab778SVincenzo Maffione 				} else {
7815faab778SVincenzo Maffione 					poll_ctx->next_wake_fun = NULL;
7825faab778SVincenzo Maffione 				}
7835faab778SVincenzo Maffione 				mask = filp->f_op->poll(filp,
7845faab778SVincenzo Maffione 				    &poll_ctx->wait_table);
7855faab778SVincenzo Maffione 				if (mask & POLLERR) {
7865faab778SVincenzo Maffione 					err = EINVAL;
7875faab778SVincenzo Maffione 					goto out;
7885faab778SVincenzo Maffione 				}
7895faab778SVincenzo Maffione 			}
7905faab778SVincenzo Maffione 		}
7915faab778SVincenzo Maffione 
792b6e66be2SVincenzo Maffione 		/* Poll for notifications coming from the netmap rings bound to
793b6e66be2SVincenzo Maffione 		 * this file descriptor. */
7945faab778SVincenzo Maffione 		if (!busy_wait) {
795b6e66be2SVincenzo Maffione 			NMG_LOCK();
7965faab778SVincenzo Maffione 			/* In direct mode, override the wake up function so
7975faab778SVincenzo Maffione 			 * that it can forward the netmap_tx_irq() to the
7985faab778SVincenzo Maffione 			 * guest. */
7995faab778SVincenzo Maffione 			poll_ctx->next_wake_fun = direct_tx ?
8005faab778SVincenzo Maffione 			    sync_kloop_tx_irq_wake_fun : NULL;
801a56136a1SVincenzo Maffione 			poll_wait(priv->np_filp, priv->np_si[NR_TX],
802a56136a1SVincenzo Maffione 			    &poll_ctx->wait_table);
8035faab778SVincenzo Maffione 			poll_ctx->next_entry++;
8045faab778SVincenzo Maffione 
8055faab778SVincenzo Maffione 			poll_ctx->next_wake_fun = direct_rx ?
8065faab778SVincenzo Maffione 			    sync_kloop_rx_irq_wake_fun : NULL;
807a56136a1SVincenzo Maffione 			poll_wait(priv->np_filp, priv->np_si[NR_RX],
808a56136a1SVincenzo Maffione 			    &poll_ctx->wait_table);
8095faab778SVincenzo Maffione 			poll_ctx->next_entry++;
810b6e66be2SVincenzo Maffione 			NMG_UNLOCK();
811b6e66be2SVincenzo Maffione 		}
812b6e66be2SVincenzo Maffione #else   /* SYNC_KLOOP_POLL */
813b6e66be2SVincenzo Maffione 		opt->nro_status = EOPNOTSUPP;
814b6e66be2SVincenzo Maffione 		goto out;
815b6e66be2SVincenzo Maffione #endif  /* SYNC_KLOOP_POLL */
816b6e66be2SVincenzo Maffione 	}
817b6e66be2SVincenzo Maffione 
8185faab778SVincenzo Maffione 	nm_prinf("kloop busy_wait %u, direct_tx %u, direct_rx %u, "
8195faab778SVincenzo Maffione 	    "na_could_sleep %u", busy_wait, direct_tx, direct_rx,
8205faab778SVincenzo Maffione 	    na_could_sleep);
821f79ba6d7SVincenzo Maffione 
822b6e66be2SVincenzo Maffione 	/* Main loop. */
823b6e66be2SVincenzo Maffione 	for (;;) {
824b6e66be2SVincenzo Maffione 		if (unlikely(NM_ACCESS_ONCE(priv->np_kloop_state) & NM_SYNC_KLOOP_STOPPING)) {
825b6e66be2SVincenzo Maffione 			break;
826b6e66be2SVincenzo Maffione 		}
827b6e66be2SVincenzo Maffione 
828b6e66be2SVincenzo Maffione #ifdef SYNC_KLOOP_POLL
8295faab778SVincenzo Maffione 		if (!busy_wait) {
830f79ba6d7SVincenzo Maffione 			/* It is important to set the task state as
831f79ba6d7SVincenzo Maffione 			 * interruptible before processing any TX/RX ring,
832f79ba6d7SVincenzo Maffione 			 * so that if a notification on ring Y comes after
833f79ba6d7SVincenzo Maffione 			 * we have processed ring Y, but before we call
834f79ba6d7SVincenzo Maffione 			 * schedule(), we don't miss it. This is true because
835591a9b5eSGordon Bergling 			 * the wake up function will change the task state,
836f79ba6d7SVincenzo Maffione 			 * and therefore the schedule_timeout() call below
837f79ba6d7SVincenzo Maffione 			 * will observe the change).
838f79ba6d7SVincenzo Maffione 			 */
839f79ba6d7SVincenzo Maffione 			set_current_state(TASK_INTERRUPTIBLE);
840f79ba6d7SVincenzo Maffione 		}
841b6e66be2SVincenzo Maffione #endif  /* SYNC_KLOOP_POLL */
842b6e66be2SVincenzo Maffione 
843b6e66be2SVincenzo Maffione 		/* Process all the TX rings bound to this file descriptor. */
8445faab778SVincenzo Maffione 		for (i = 0; !direct_tx && i < num_tx_rings; i++) {
845f79ba6d7SVincenzo Maffione 			struct sync_kloop_ring_args *a = args + i;
846f79ba6d7SVincenzo Maffione 			netmap_sync_kloop_tx_ring(a);
847b6e66be2SVincenzo Maffione 		}
848b6e66be2SVincenzo Maffione 
849b6e66be2SVincenzo Maffione 		/* Process all the RX rings bound to this file descriptor. */
8505faab778SVincenzo Maffione 		for (i = 0; !direct_rx && i < num_rx_rings; i++) {
851f79ba6d7SVincenzo Maffione 			struct sync_kloop_ring_args *a = args + num_tx_rings + i;
852f79ba6d7SVincenzo Maffione 			netmap_sync_kloop_rx_ring(a);
853b6e66be2SVincenzo Maffione 		}
854b6e66be2SVincenzo Maffione 
8555faab778SVincenzo Maffione 		if (busy_wait) {
856b6e66be2SVincenzo Maffione 			/* Default synchronization method: sleep for a while. */
857b6e66be2SVincenzo Maffione 			usleep_range(sleep_us, sleep_us);
858b6e66be2SVincenzo Maffione 		}
8595faab778SVincenzo Maffione #ifdef SYNC_KLOOP_POLL
8605faab778SVincenzo Maffione 		else {
8615faab778SVincenzo Maffione 			/* Yield to the scheduler waiting for a notification
8625faab778SVincenzo Maffione 			 * to come either from netmap or the application. */
8635faab778SVincenzo Maffione 			schedule_timeout(msecs_to_jiffies(3000));
8645faab778SVincenzo Maffione 		}
8655faab778SVincenzo Maffione #endif /* SYNC_KLOOP_POLL */
866b6e66be2SVincenzo Maffione 	}
867b6e66be2SVincenzo Maffione out:
868b6e66be2SVincenzo Maffione #ifdef SYNC_KLOOP_POLL
869b6e66be2SVincenzo Maffione 	if (poll_ctx) {
870b6e66be2SVincenzo Maffione 		/* Stop polling from netmap and the eventfds, and deallocate
871b6e66be2SVincenzo Maffione 		 * the poll context. */
8725faab778SVincenzo Maffione 		if (!busy_wait) {
873b6e66be2SVincenzo Maffione 			__set_current_state(TASK_RUNNING);
8745faab778SVincenzo Maffione 		}
875b6e66be2SVincenzo Maffione 		for (i = 0; i < poll_ctx->next_entry; i++) {
876b6e66be2SVincenzo Maffione 			struct sync_kloop_poll_entry *entry =
877b6e66be2SVincenzo Maffione 						poll_ctx->entries + i;
878b6e66be2SVincenzo Maffione 
879b6e66be2SVincenzo Maffione 			if (entry->wqh)
880b6e66be2SVincenzo Maffione 				remove_wait_queue(entry->wqh, &entry->wait);
881b6e66be2SVincenzo Maffione 			/* We did not get a reference to the eventfds, but
882b6e66be2SVincenzo Maffione 			 * don't do that on netmap file descriptors (since
883b6e66be2SVincenzo Maffione 			 * a reference was not taken. */
884b6e66be2SVincenzo Maffione 			if (entry->filp && entry->filp != priv->np_filp)
885b6e66be2SVincenzo Maffione 				fput(entry->filp);
886b6e66be2SVincenzo Maffione 			if (entry->irq_ctx)
887b6e66be2SVincenzo Maffione 				eventfd_ctx_put(entry->irq_ctx);
888b6e66be2SVincenzo Maffione 			if (entry->irq_filp)
889b6e66be2SVincenzo Maffione 				fput(entry->irq_filp);
890b6e66be2SVincenzo Maffione 		}
891b6e66be2SVincenzo Maffione 		nm_os_free(poll_ctx);
892b6e66be2SVincenzo Maffione 		poll_ctx = NULL;
893b6e66be2SVincenzo Maffione 	}
894b6e66be2SVincenzo Maffione #endif /* SYNC_KLOOP_POLL */
895b6e66be2SVincenzo Maffione 
896f79ba6d7SVincenzo Maffione 	if (args) {
897f79ba6d7SVincenzo Maffione 		nm_os_free(args);
898f79ba6d7SVincenzo Maffione 		args = NULL;
899f79ba6d7SVincenzo Maffione 	}
900f79ba6d7SVincenzo Maffione 
901b6e66be2SVincenzo Maffione 	/* Reset the kloop state. */
902b6e66be2SVincenzo Maffione 	NMG_LOCK();
903b6e66be2SVincenzo Maffione 	priv->np_kloop_state = 0;
9045faab778SVincenzo Maffione 	if (na_could_sleep) {
9055faab778SVincenzo Maffione 		na->na_flags |= NAF_BDG_MAYSLEEP;
9065faab778SVincenzo Maffione 	}
907b6e66be2SVincenzo Maffione 	NMG_UNLOCK();
908b6e66be2SVincenzo Maffione 
909b6e66be2SVincenzo Maffione 	return err;
910b6e66be2SVincenzo Maffione }
911b6e66be2SVincenzo Maffione 
912b6e66be2SVincenzo Maffione int
netmap_sync_kloop_stop(struct netmap_priv_d * priv)913b6e66be2SVincenzo Maffione netmap_sync_kloop_stop(struct netmap_priv_d *priv)
914b6e66be2SVincenzo Maffione {
915a56136a1SVincenzo Maffione 	struct netmap_adapter *na;
916b6e66be2SVincenzo Maffione 	bool running = true;
917b6e66be2SVincenzo Maffione 	int err = 0;
918b6e66be2SVincenzo Maffione 
919a56136a1SVincenzo Maffione 	if (priv->np_nifp == NULL) {
920a56136a1SVincenzo Maffione 		return ENXIO;
921a56136a1SVincenzo Maffione 	}
922a56136a1SVincenzo Maffione 	mb(); /* make sure following reads are not from cache */
923a56136a1SVincenzo Maffione 
924a56136a1SVincenzo Maffione 	na = priv->np_na;
925a56136a1SVincenzo Maffione 	if (!nm_netmap_on(na)) {
926a56136a1SVincenzo Maffione 		return ENXIO;
927a56136a1SVincenzo Maffione 	}
928a56136a1SVincenzo Maffione 
929a56136a1SVincenzo Maffione 	/* Set the kloop stopping flag. */
930b6e66be2SVincenzo Maffione 	NMG_LOCK();
931b6e66be2SVincenzo Maffione 	priv->np_kloop_state |= NM_SYNC_KLOOP_STOPPING;
932b6e66be2SVincenzo Maffione 	NMG_UNLOCK();
933a56136a1SVincenzo Maffione 
934a56136a1SVincenzo Maffione 	/* Send a notification to the kloop, in case it is blocked in
935a56136a1SVincenzo Maffione 	 * schedule_timeout(). We can use either RX or TX, because the
936a56136a1SVincenzo Maffione 	 * kloop is waiting on both. */
937a56136a1SVincenzo Maffione 	nm_os_selwakeup(priv->np_si[NR_RX]);
938a56136a1SVincenzo Maffione 
939a56136a1SVincenzo Maffione 	/* Wait for the kloop to actually terminate. */
940b6e66be2SVincenzo Maffione 	while (running) {
941b6e66be2SVincenzo Maffione 		usleep_range(1000, 1500);
942b6e66be2SVincenzo Maffione 		NMG_LOCK();
943b6e66be2SVincenzo Maffione 		running = (NM_ACCESS_ONCE(priv->np_kloop_state)
944b6e66be2SVincenzo Maffione 				& NM_SYNC_KLOOP_RUNNING);
945b6e66be2SVincenzo Maffione 		NMG_UNLOCK();
946b6e66be2SVincenzo Maffione 	}
947b6e66be2SVincenzo Maffione 
948b6e66be2SVincenzo Maffione 	return err;
949b6e66be2SVincenzo Maffione }
950b6e66be2SVincenzo Maffione 
951b6e66be2SVincenzo Maffione #ifdef WITH_PTNETMAP
952b6e66be2SVincenzo Maffione /*
953b6e66be2SVincenzo Maffione  * Guest ptnetmap txsync()/rxsync() routines, used in ptnet device drivers.
954b6e66be2SVincenzo Maffione  * These routines are reused across the different operating systems supported
955b6e66be2SVincenzo Maffione  * by netmap.
956b6e66be2SVincenzo Maffione  */
957b6e66be2SVincenzo Maffione 
958b6e66be2SVincenzo Maffione /*
959b6e66be2SVincenzo Maffione  * Reconcile host and guest views of the transmit ring.
960b6e66be2SVincenzo Maffione  *
961b6e66be2SVincenzo Maffione  * Guest user wants to transmit packets up to the one before ring->head,
962b6e66be2SVincenzo Maffione  * and guest kernel knows tx_ring->hwcur is the first packet unsent
963b6e66be2SVincenzo Maffione  * by the host kernel.
964b6e66be2SVincenzo Maffione  *
965b6e66be2SVincenzo Maffione  * We push out as many packets as possible, and possibly
966b6e66be2SVincenzo Maffione  * reclaim buffers from previously completed transmission.
967b6e66be2SVincenzo Maffione  *
968b6e66be2SVincenzo Maffione  * Notifications from the host are enabled only if the user guest would
969b6e66be2SVincenzo Maffione  * block (no space in the ring).
970b6e66be2SVincenzo Maffione  */
971b6e66be2SVincenzo Maffione bool
netmap_pt_guest_txsync(struct nm_csb_atok * atok,struct nm_csb_ktoa * ktoa,struct netmap_kring * kring,int flags)972b6e66be2SVincenzo Maffione netmap_pt_guest_txsync(struct nm_csb_atok *atok, struct nm_csb_ktoa *ktoa,
973b6e66be2SVincenzo Maffione 			struct netmap_kring *kring, int flags)
974b6e66be2SVincenzo Maffione {
975b6e66be2SVincenzo Maffione 	bool notify = false;
976b6e66be2SVincenzo Maffione 
977b6e66be2SVincenzo Maffione 	/* Disable notifications */
978b6e66be2SVincenzo Maffione 	atok->appl_need_kick = 0;
979b6e66be2SVincenzo Maffione 
980b6e66be2SVincenzo Maffione 	/*
9815faab778SVincenzo Maffione 	 * First part: tell the host to process the new packets,
9825faab778SVincenzo Maffione 	 * updating the CSB.
983b6e66be2SVincenzo Maffione 	 */
984b6e66be2SVincenzo Maffione 	kring->nr_hwcur = ktoa->hwcur;
985f79ba6d7SVincenzo Maffione 	nm_sync_kloop_appl_write(atok, kring->rcur, kring->rhead);
986b6e66be2SVincenzo Maffione 
987b6e66be2SVincenzo Maffione         /* Ask for a kick from a guest to the host if needed. */
9885faab778SVincenzo Maffione 	if (((kring->rhead != kring->nr_hwcur || nm_kr_wouldblock(kring))
989b6e66be2SVincenzo Maffione 		&& NM_ACCESS_ONCE(ktoa->kern_need_kick)) ||
990b6e66be2SVincenzo Maffione 			(flags & NAF_FORCE_RECLAIM)) {
991b6e66be2SVincenzo Maffione 		atok->sync_flags = flags;
992b6e66be2SVincenzo Maffione 		notify = true;
993b6e66be2SVincenzo Maffione 	}
994b6e66be2SVincenzo Maffione 
995b6e66be2SVincenzo Maffione 	/*
996b6e66be2SVincenzo Maffione 	 * Second part: reclaim buffers for completed transmissions.
997b6e66be2SVincenzo Maffione 	 */
9985faab778SVincenzo Maffione 	if (nm_kr_wouldblock(kring) || (flags & NAF_FORCE_RECLAIM)) {
999f79ba6d7SVincenzo Maffione 		nm_sync_kloop_appl_read(ktoa, &kring->nr_hwtail,
1000f79ba6d7SVincenzo Maffione 					&kring->nr_hwcur);
1001b6e66be2SVincenzo Maffione 	}
1002b6e66be2SVincenzo Maffione 
1003b6e66be2SVincenzo Maffione         /*
1004b6e66be2SVincenzo Maffione          * No more room in the ring for new transmissions. The user thread will
1005b6e66be2SVincenzo Maffione 	 * go to sleep and we need to be notified by the host when more free
1006b6e66be2SVincenzo Maffione 	 * space is available.
1007b6e66be2SVincenzo Maffione          */
10085faab778SVincenzo Maffione 	if (nm_kr_wouldblock(kring) && !(kring->nr_kflags & NKR_NOINTR)) {
100945c67e8fSVincenzo Maffione 		/* Re-enable notifications. */
1010b6e66be2SVincenzo Maffione 		atok->appl_need_kick = 1;
1011f79ba6d7SVincenzo Maffione                 /* Double check, with store-load memory barrier. */
1012f79ba6d7SVincenzo Maffione 		nm_stld_barrier();
1013f79ba6d7SVincenzo Maffione 		nm_sync_kloop_appl_read(ktoa, &kring->nr_hwtail,
1014f79ba6d7SVincenzo Maffione 					&kring->nr_hwcur);
1015b6e66be2SVincenzo Maffione                 /* If there is new free space, disable notifications */
10165faab778SVincenzo Maffione 		if (unlikely(!nm_kr_wouldblock(kring))) {
1017b6e66be2SVincenzo Maffione 			atok->appl_need_kick = 0;
1018b6e66be2SVincenzo Maffione 		}
1019b6e66be2SVincenzo Maffione 	}
1020b6e66be2SVincenzo Maffione 
1021b6e66be2SVincenzo Maffione 	nm_prdis(1, "%s CSB(head:%u cur:%u hwtail:%u) KRING(head:%u cur:%u tail:%u)",
1022b6e66be2SVincenzo Maffione 		kring->name, atok->head, atok->cur, ktoa->hwtail,
1023b6e66be2SVincenzo Maffione 		kring->rhead, kring->rcur, kring->nr_hwtail);
1024b6e66be2SVincenzo Maffione 
1025b6e66be2SVincenzo Maffione 	return notify;
1026b6e66be2SVincenzo Maffione }
1027b6e66be2SVincenzo Maffione 
1028b6e66be2SVincenzo Maffione /*
1029b6e66be2SVincenzo Maffione  * Reconcile host and guest view of the receive ring.
1030b6e66be2SVincenzo Maffione  *
1031b6e66be2SVincenzo Maffione  * Update hwcur/hwtail from host (reading from CSB).
1032b6e66be2SVincenzo Maffione  *
1033b6e66be2SVincenzo Maffione  * If guest user has released buffers up to the one before ring->head, we
1034b6e66be2SVincenzo Maffione  * also give them to the host.
1035b6e66be2SVincenzo Maffione  *
1036b6e66be2SVincenzo Maffione  * Notifications from the host are enabled only if the user guest would
1037b6e66be2SVincenzo Maffione  * block (no more completed slots in the ring).
1038b6e66be2SVincenzo Maffione  */
1039b6e66be2SVincenzo Maffione bool
netmap_pt_guest_rxsync(struct nm_csb_atok * atok,struct nm_csb_ktoa * ktoa,struct netmap_kring * kring,int flags)1040b6e66be2SVincenzo Maffione netmap_pt_guest_rxsync(struct nm_csb_atok *atok, struct nm_csb_ktoa *ktoa,
1041b6e66be2SVincenzo Maffione 			struct netmap_kring *kring, int flags)
1042b6e66be2SVincenzo Maffione {
1043b6e66be2SVincenzo Maffione 	bool notify = false;
1044b6e66be2SVincenzo Maffione 
1045b6e66be2SVincenzo Maffione         /* Disable notifications */
1046b6e66be2SVincenzo Maffione 	atok->appl_need_kick = 0;
1047b6e66be2SVincenzo Maffione 
1048b6e66be2SVincenzo Maffione 	/*
1049b6e66be2SVincenzo Maffione 	 * First part: import newly received packets, by updating the kring
1050b6e66be2SVincenzo Maffione 	 * hwtail to the hwtail known from the host (read from the CSB).
1051b6e66be2SVincenzo Maffione 	 * This also updates the kring hwcur.
1052b6e66be2SVincenzo Maffione 	 */
1053f79ba6d7SVincenzo Maffione 	nm_sync_kloop_appl_read(ktoa, &kring->nr_hwtail, &kring->nr_hwcur);
1054b6e66be2SVincenzo Maffione 	kring->nr_kflags &= ~NKR_PENDINTR;
1055b6e66be2SVincenzo Maffione 
1056b6e66be2SVincenzo Maffione 	/*
1057b6e66be2SVincenzo Maffione 	 * Second part: tell the host about the slots that guest user has
1058b6e66be2SVincenzo Maffione 	 * released, by updating cur and head in the CSB.
1059b6e66be2SVincenzo Maffione 	 */
1060b6e66be2SVincenzo Maffione 	if (kring->rhead != kring->nr_hwcur) {
1061f79ba6d7SVincenzo Maffione 		nm_sync_kloop_appl_write(atok, kring->rcur, kring->rhead);
1062b6e66be2SVincenzo Maffione 	}
1063b6e66be2SVincenzo Maffione 
1064b6e66be2SVincenzo Maffione         /*
1065b6e66be2SVincenzo Maffione          * No more completed RX slots. The user thread will go to sleep and
1066b6e66be2SVincenzo Maffione 	 * we need to be notified by the host when more RX slots have been
1067b6e66be2SVincenzo Maffione 	 * completed.
1068b6e66be2SVincenzo Maffione          */
10695faab778SVincenzo Maffione 	if (nm_kr_wouldblock(kring) && !(kring->nr_kflags & NKR_NOINTR)) {
107045c67e8fSVincenzo Maffione 		/* Re-enable notifications. */
1071b6e66be2SVincenzo Maffione                 atok->appl_need_kick = 1;
1072f79ba6d7SVincenzo Maffione                 /* Double check, with store-load memory barrier. */
1073f79ba6d7SVincenzo Maffione 		nm_stld_barrier();
1074f79ba6d7SVincenzo Maffione 		nm_sync_kloop_appl_read(ktoa, &kring->nr_hwtail,
1075f79ba6d7SVincenzo Maffione 					&kring->nr_hwcur);
1076b6e66be2SVincenzo Maffione                 /* If there are new slots, disable notifications. */
10775faab778SVincenzo Maffione 		if (!nm_kr_wouldblock(kring)) {
1078b6e66be2SVincenzo Maffione                         atok->appl_need_kick = 0;
1079b6e66be2SVincenzo Maffione                 }
1080b6e66be2SVincenzo Maffione         }
1081b6e66be2SVincenzo Maffione 
10825faab778SVincenzo Maffione 	/* Ask for a kick from the guest to the host if needed. */
10835faab778SVincenzo Maffione 	if ((kring->rhead != kring->nr_hwcur || nm_kr_wouldblock(kring))
10845faab778SVincenzo Maffione 		&& NM_ACCESS_ONCE(ktoa->kern_need_kick)) {
10855faab778SVincenzo Maffione 		atok->sync_flags = flags;
10865faab778SVincenzo Maffione 		notify = true;
10875faab778SVincenzo Maffione 	}
10885faab778SVincenzo Maffione 
1089b6e66be2SVincenzo Maffione 	nm_prdis(1, "%s CSB(head:%u cur:%u hwtail:%u) KRING(head:%u cur:%u tail:%u)",
1090b6e66be2SVincenzo Maffione 		kring->name, atok->head, atok->cur, ktoa->hwtail,
1091b6e66be2SVincenzo Maffione 		kring->rhead, kring->rcur, kring->nr_hwtail);
1092b6e66be2SVincenzo Maffione 
1093b6e66be2SVincenzo Maffione 	return notify;
1094b6e66be2SVincenzo Maffione }
1095b6e66be2SVincenzo Maffione 
1096b6e66be2SVincenzo Maffione /*
1097b6e66be2SVincenzo Maffione  * Callbacks for ptnet drivers: nm_krings_create, nm_krings_delete, nm_dtor.
1098b6e66be2SVincenzo Maffione  */
1099b6e66be2SVincenzo Maffione int
ptnet_nm_krings_create(struct netmap_adapter * na)1100b6e66be2SVincenzo Maffione ptnet_nm_krings_create(struct netmap_adapter *na)
1101b6e66be2SVincenzo Maffione {
1102b6e66be2SVincenzo Maffione 	struct netmap_pt_guest_adapter *ptna =
1103b6e66be2SVincenzo Maffione 			(struct netmap_pt_guest_adapter *)na; /* Upcast. */
1104b6e66be2SVincenzo Maffione 	struct netmap_adapter *na_nm = &ptna->hwup.up;
1105b6e66be2SVincenzo Maffione 	struct netmap_adapter *na_dr = &ptna->dr.up;
1106b6e66be2SVincenzo Maffione 	int ret;
1107b6e66be2SVincenzo Maffione 
1108b6e66be2SVincenzo Maffione 	if (ptna->backend_users) {
1109b6e66be2SVincenzo Maffione 		return 0;
1110b6e66be2SVincenzo Maffione 	}
1111b6e66be2SVincenzo Maffione 
1112b6e66be2SVincenzo Maffione 	/* Create krings on the public netmap adapter. */
1113b6e66be2SVincenzo Maffione 	ret = netmap_hw_krings_create(na_nm);
1114b6e66be2SVincenzo Maffione 	if (ret) {
1115b6e66be2SVincenzo Maffione 		return ret;
1116b6e66be2SVincenzo Maffione 	}
1117b6e66be2SVincenzo Maffione 
1118b6e66be2SVincenzo Maffione 	/* Copy krings into the netmap adapter private to the driver. */
1119b6e66be2SVincenzo Maffione 	na_dr->tx_rings = na_nm->tx_rings;
1120b6e66be2SVincenzo Maffione 	na_dr->rx_rings = na_nm->rx_rings;
1121b6e66be2SVincenzo Maffione 
1122b6e66be2SVincenzo Maffione 	return 0;
1123b6e66be2SVincenzo Maffione }
1124b6e66be2SVincenzo Maffione 
1125b6e66be2SVincenzo Maffione void
ptnet_nm_krings_delete(struct netmap_adapter * na)1126b6e66be2SVincenzo Maffione ptnet_nm_krings_delete(struct netmap_adapter *na)
1127b6e66be2SVincenzo Maffione {
1128b6e66be2SVincenzo Maffione 	struct netmap_pt_guest_adapter *ptna =
1129b6e66be2SVincenzo Maffione 			(struct netmap_pt_guest_adapter *)na; /* Upcast. */
1130b6e66be2SVincenzo Maffione 	struct netmap_adapter *na_nm = &ptna->hwup.up;
1131b6e66be2SVincenzo Maffione 	struct netmap_adapter *na_dr = &ptna->dr.up;
1132b6e66be2SVincenzo Maffione 
1133b6e66be2SVincenzo Maffione 	if (ptna->backend_users) {
1134b6e66be2SVincenzo Maffione 		return;
1135b6e66be2SVincenzo Maffione 	}
1136b6e66be2SVincenzo Maffione 
1137b6e66be2SVincenzo Maffione 	na_dr->tx_rings = NULL;
1138b6e66be2SVincenzo Maffione 	na_dr->rx_rings = NULL;
1139b6e66be2SVincenzo Maffione 
1140b6e66be2SVincenzo Maffione 	netmap_hw_krings_delete(na_nm);
1141b6e66be2SVincenzo Maffione }
1142b6e66be2SVincenzo Maffione 
1143b6e66be2SVincenzo Maffione void
ptnet_nm_dtor(struct netmap_adapter * na)1144b6e66be2SVincenzo Maffione ptnet_nm_dtor(struct netmap_adapter *na)
1145b6e66be2SVincenzo Maffione {
1146b6e66be2SVincenzo Maffione 	struct netmap_pt_guest_adapter *ptna =
1147b6e66be2SVincenzo Maffione 			(struct netmap_pt_guest_adapter *)na;
1148b6e66be2SVincenzo Maffione 
1149b6e66be2SVincenzo Maffione 	netmap_mem_put(ptna->dr.up.nm_mem);
1150b6e66be2SVincenzo Maffione 	memset(&ptna->dr, 0, sizeof(ptna->dr));
1151b6e66be2SVincenzo Maffione 	netmap_mem_pt_guest_ifp_del(na->nm_mem, na->ifp);
1152b6e66be2SVincenzo Maffione }
1153b6e66be2SVincenzo Maffione 
1154b6e66be2SVincenzo Maffione int
netmap_pt_guest_attach(struct netmap_adapter * arg,unsigned int nifp_offset,unsigned int memid)1155b6e66be2SVincenzo Maffione netmap_pt_guest_attach(struct netmap_adapter *arg,
1156b6e66be2SVincenzo Maffione 		       unsigned int nifp_offset, unsigned int memid)
1157b6e66be2SVincenzo Maffione {
1158b6e66be2SVincenzo Maffione 	struct netmap_pt_guest_adapter *ptna;
1159e330262fSJustin Hibbits 	if_t ifp = arg ? arg->ifp : NULL;
1160b6e66be2SVincenzo Maffione 	int error;
1161b6e66be2SVincenzo Maffione 
1162b6e66be2SVincenzo Maffione 	/* get allocator */
1163b6e66be2SVincenzo Maffione 	arg->nm_mem = netmap_mem_pt_guest_new(ifp, nifp_offset, memid);
1164b6e66be2SVincenzo Maffione 	if (arg->nm_mem == NULL)
1165b6e66be2SVincenzo Maffione 		return ENOMEM;
1166b6e66be2SVincenzo Maffione 	arg->na_flags |= NAF_MEM_OWNER;
1167b6e66be2SVincenzo Maffione 	error = netmap_attach_ext(arg, sizeof(struct netmap_pt_guest_adapter), 1);
1168b6e66be2SVincenzo Maffione 	if (error)
1169b6e66be2SVincenzo Maffione 		return error;
1170b6e66be2SVincenzo Maffione 
1171b6e66be2SVincenzo Maffione 	/* get the netmap_pt_guest_adapter */
1172b6e66be2SVincenzo Maffione 	ptna = (struct netmap_pt_guest_adapter *) NA(ifp);
1173b6e66be2SVincenzo Maffione 
1174b6e66be2SVincenzo Maffione 	/* Initialize a separate pass-through netmap adapter that is going to
1175b6e66be2SVincenzo Maffione 	 * be used by the ptnet driver only, and so never exposed to netmap
1176b6e66be2SVincenzo Maffione          * applications. We only need a subset of the available fields. */
1177b6e66be2SVincenzo Maffione 	memset(&ptna->dr, 0, sizeof(ptna->dr));
1178b6e66be2SVincenzo Maffione 	ptna->dr.up.ifp = ifp;
1179b6e66be2SVincenzo Maffione 	ptna->dr.up.nm_mem = netmap_mem_get(ptna->hwup.up.nm_mem);
1180b6e66be2SVincenzo Maffione         ptna->dr.up.nm_config = ptna->hwup.up.nm_config;
1181b6e66be2SVincenzo Maffione 
1182b6e66be2SVincenzo Maffione 	ptna->backend_users = 0;
1183b6e66be2SVincenzo Maffione 
1184b6e66be2SVincenzo Maffione 	return 0;
1185b6e66be2SVincenzo Maffione }
1186b6e66be2SVincenzo Maffione 
1187b6e66be2SVincenzo Maffione #endif /* WITH_PTNETMAP */
1188