xref: /freebsd-13-stable/sys/dev/netmap/netmap_pipe.c (revision 4fbf14e22d7b83de7080a8e491ba14a5785a0ff4)
1 /*-
2  * SPDX-License-Identifier: BSD-2-Clause
3  *
4  * Copyright (C) 2014-2018 Giuseppe Lettieri
5  * All rights reserved.
6  *
7  * Redistribution and use in source and binary forms, with or without
8  * modification, are permitted provided that the following conditions
9  * are met:
10  *   1. Redistributions of source code must retain the above copyright
11  *      notice, this list of conditions and the following disclaimer.
12  *   2. Redistributions in binary form must reproduce the above copyright
13  *      notice, this list of conditions and the following disclaimer in the
14  *      documentation and/or other materials provided with the distribution.
15  *
16  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
17  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
18  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
19  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
20  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
21  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
22  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
23  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
24  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
25  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
26  * SUCH DAMAGE.
27  */
28 
29 
30 #if defined(__FreeBSD__)
31 #include <sys/cdefs.h> /* prerequisite */
32 
33 #include <sys/types.h>
34 #include <sys/errno.h>
35 #include <sys/param.h>	/* defines used in kernel.h */
36 #include <sys/kernel.h>	/* types used in module initialization */
37 #include <sys/malloc.h>
38 #include <sys/poll.h>
39 #include <sys/lock.h>
40 #include <sys/rwlock.h>
41 #include <sys/selinfo.h>
42 #include <sys/sysctl.h>
43 #include <sys/socket.h> /* sockaddrs */
44 #include <net/if.h>
45 #include <net/if_var.h>
46 #include <machine/bus.h>	/* bus_dmamap_* */
47 #include <sys/refcount.h>
48 
49 
50 #elif defined(linux)
51 
52 #include "bsd_glue.h"
53 
54 #elif defined(__APPLE__)
55 
56 #warning OSX support is only partial
57 #include "osx_glue.h"
58 
59 #elif defined(_WIN32)
60 #include "win_glue.h"
61 
62 #else
63 
64 #error	Unsupported platform
65 
66 #endif /* unsupported */
67 
68 /*
69  * common headers
70  */
71 
72 #include <net/netmap.h>
73 #include <dev/netmap/netmap_kern.h>
74 #include <dev/netmap/netmap_mem2.h>
75 
76 #ifdef WITH_PIPES
77 
78 #define NM_PIPE_MAXSLOTS	4096
79 #define NM_PIPE_MAXRINGS	256
80 
81 static int netmap_default_pipes = 0; /* ignored, kept for compatibility */
82 SYSBEGIN(vars_pipes);
83 SYSCTL_DECL(_dev_netmap);
84 SYSCTL_INT(_dev_netmap, OID_AUTO, default_pipes, CTLFLAG_RW,
85 		&netmap_default_pipes, 0, "For compatibility only");
86 SYSEND;
87 
88 /* allocate the pipe array in the parent adapter */
89 static int
nm_pipe_alloc(struct netmap_adapter * na,u_int npipes)90 nm_pipe_alloc(struct netmap_adapter *na, u_int npipes)
91 {
92 	size_t old_len, len;
93 	struct netmap_pipe_adapter **npa;
94 
95 	if (npipes <= na->na_max_pipes)
96 		/* we already have more entries that requested */
97 		return 0;
98 
99 	if (npipes < na->na_next_pipe || npipes > NM_MAXPIPES)
100 		return EINVAL;
101 
102 	old_len = sizeof(struct netmap_pipe_adapter *)*na->na_max_pipes;
103 	len = sizeof(struct netmap_pipe_adapter *) * npipes;
104 	npa = nm_os_realloc(na->na_pipes, len, old_len);
105 	if (npa == NULL)
106 		return ENOMEM;
107 
108 	na->na_pipes = npa;
109 	na->na_max_pipes = npipes;
110 
111 	return 0;
112 }
113 
114 /* deallocate the parent array in the parent adapter */
115 void
netmap_pipe_dealloc(struct netmap_adapter * na)116 netmap_pipe_dealloc(struct netmap_adapter *na)
117 {
118 	if (na->na_pipes) {
119 		if (na->na_next_pipe > 0) {
120 			nm_prerr("freeing not empty pipe array for %s (%d dangling pipes)!",
121 			    na->name, na->na_next_pipe);
122 		}
123 		nm_os_free(na->na_pipes);
124 		na->na_pipes = NULL;
125 		na->na_max_pipes = 0;
126 		na->na_next_pipe = 0;
127 	}
128 }
129 
130 /* find a pipe endpoint with the given id among the parent's pipes */
131 static struct netmap_pipe_adapter *
netmap_pipe_find(struct netmap_adapter * parent,const char * pipe_id)132 netmap_pipe_find(struct netmap_adapter *parent, const char *pipe_id)
133 {
134 	int i;
135 	struct netmap_pipe_adapter *na;
136 
137 	for (i = 0; i < parent->na_next_pipe; i++) {
138 		const char *na_pipe_id;
139 		na = parent->na_pipes[i];
140 		na_pipe_id = strrchr(na->up.name,
141 			na->role == NM_PIPE_ROLE_MASTER ? '{' : '}');
142 		KASSERT(na_pipe_id != NULL, ("Invalid pipe name"));
143 		++na_pipe_id;
144 		if (!strcmp(na_pipe_id, pipe_id)) {
145 			return na;
146 		}
147 	}
148 	return NULL;
149 }
150 
151 /* add a new pipe endpoint to the parent array */
152 static int
netmap_pipe_add(struct netmap_adapter * parent,struct netmap_pipe_adapter * na)153 netmap_pipe_add(struct netmap_adapter *parent, struct netmap_pipe_adapter *na)
154 {
155 	if (parent->na_next_pipe >= parent->na_max_pipes) {
156 		u_int npipes = parent->na_max_pipes ?  2*parent->na_max_pipes : 2;
157 		int error = nm_pipe_alloc(parent, npipes);
158 		if (error)
159 			return error;
160 	}
161 
162 	parent->na_pipes[parent->na_next_pipe] = na;
163 	na->parent_slot = parent->na_next_pipe;
164 	parent->na_next_pipe++;
165 	return 0;
166 }
167 
168 /* remove the given pipe endpoint from the parent array */
169 static void
netmap_pipe_remove(struct netmap_adapter * parent,struct netmap_pipe_adapter * na)170 netmap_pipe_remove(struct netmap_adapter *parent, struct netmap_pipe_adapter *na)
171 {
172 	u_int n;
173 	n = --parent->na_next_pipe;
174 	if (n != na->parent_slot) {
175 		struct netmap_pipe_adapter **p =
176 			&parent->na_pipes[na->parent_slot];
177 		*p = parent->na_pipes[n];
178 		(*p)->parent_slot = na->parent_slot;
179 	}
180 	parent->na_pipes[n] = NULL;
181 }
182 
183 int
netmap_pipe_txsync(struct netmap_kring * txkring,int flags)184 netmap_pipe_txsync(struct netmap_kring *txkring, int flags)
185 {
186 	struct netmap_kring *rxkring = txkring->pipe;
187 	u_int k, lim = txkring->nkr_num_slots - 1, nk;
188 	int m; /* slots to transfer */
189 	int complete; /* did we see a complete packet ? */
190 	struct netmap_ring *txring = txkring->ring, *rxring = rxkring->ring;
191 
192 	nm_prdis("%p: %s %x -> %s", txkring, txkring->name, flags, rxkring->name);
193 	nm_prdis(20, "TX before: hwcur %d hwtail %d cur %d head %d tail %d",
194 		txkring->nr_hwcur, txkring->nr_hwtail,
195 		txkring->rcur, txkring->rhead, txkring->rtail);
196 
197 	/* update the hwtail */
198 	txkring->nr_hwtail = txkring->pipe_tail;
199 
200 	m = txkring->rhead - txkring->nr_hwcur; /* new slots */
201 	if (m < 0)
202 		m += txkring->nkr_num_slots;
203 
204 	if (m == 0) {
205 		/* nothing to send */
206 		return 0;
207 	}
208 
209 	for (k = txkring->nr_hwcur, nk = lim + 1, complete = 0; m;
210 			m--, k = nm_next(k, lim), nk = (complete ? k : nk)) {
211 		struct netmap_slot *rs = &rxring->slot[k];
212 		struct netmap_slot *ts = &txring->slot[k];
213 
214 		*rs = *ts;
215 		if (ts->flags & NS_BUF_CHANGED) {
216 			ts->flags &= ~NS_BUF_CHANGED;
217 		}
218 		complete = !(ts->flags & NS_MOREFRAG);
219 	}
220 
221 	txkring->nr_hwcur = k;
222 
223 	nm_prdis(20, "TX after : hwcur %d hwtail %d cur %d head %d tail %d k %d",
224 		txkring->nr_hwcur, txkring->nr_hwtail,
225 		txkring->rcur, txkring->rhead, txkring->rtail, k);
226 
227 	if (likely(nk <= lim)) {
228 		mb(); /* make sure the slots are updated before publishing them */
229 		rxkring->pipe_tail = nk; /* only publish complete packets */
230 		rxkring->nm_notify(rxkring, 0);
231 	}
232 
233 	return 0;
234 }
235 
236 int
netmap_pipe_rxsync(struct netmap_kring * rxkring,int flags)237 netmap_pipe_rxsync(struct netmap_kring *rxkring, int flags)
238 {
239 	struct netmap_kring *txkring = rxkring->pipe;
240 	u_int k, lim = rxkring->nkr_num_slots - 1;
241 	int m; /* slots to release */
242 	struct netmap_ring *txring = txkring->ring, *rxring = rxkring->ring;
243 
244 	nm_prdis("%p: %s %x -> %s", txkring, txkring->name, flags, rxkring->name);
245 	nm_prdis(20, "RX before: hwcur %d hwtail %d cur %d head %d tail %d",
246 		rxkring->nr_hwcur, rxkring->nr_hwtail,
247 		rxkring->rcur, rxkring->rhead, rxkring->rtail);
248 
249 	/* update the hwtail */
250 	rxkring->nr_hwtail = rxkring->pipe_tail;
251 
252 	m = rxkring->rhead - rxkring->nr_hwcur; /* released slots */
253 	if (m < 0)
254 		m += rxkring->nkr_num_slots;
255 
256 	if (m == 0) {
257 		/* nothing to release */
258 		return 0;
259 	}
260 
261 	for (k = rxkring->nr_hwcur; m; m--, k = nm_next(k, lim)) {
262 		struct netmap_slot *rs = &rxring->slot[k];
263 		struct netmap_slot *ts = &txring->slot[k];
264 
265 		if (rs->flags & NS_BUF_CHANGED) {
266 			/* copy the slot and report the buffer change */
267 			*ts = *rs;
268 			rs->flags &= ~NS_BUF_CHANGED;
269 		}
270 	}
271 
272 	mb(); /* make sure the slots are updated before publishing them */
273 	txkring->pipe_tail = nm_prev(k, lim);
274 	rxkring->nr_hwcur = k;
275 
276 	nm_prdis(20, "RX after : hwcur %d hwtail %d cur %d head %d tail %d k %d",
277 		rxkring->nr_hwcur, rxkring->nr_hwtail,
278 		rxkring->rcur, rxkring->rhead, rxkring->rtail, k);
279 
280 	txkring->nm_notify(txkring, 0);
281 
282 	return 0;
283 }
284 
285 /* Pipe endpoints are created and destroyed together, so that endopoints do not
286  * have to check for the existence of their peer at each ?xsync.
287  *
288  * To play well with the existing netmap infrastructure (refcounts etc.), we
289  * adopt the following strategy:
290  *
291  * 1) The first endpoint that is created also creates the other endpoint and
292  * grabs a reference to it.
293  *
294  *    state A)  user1 --> endpoint1 --> endpoint2
295  *
296  * 2) If, starting from state A, endpoint2 is then registered, endpoint1 gives
297  * its reference to the user:
298  *
299  *    state B)  user1 --> endpoint1     endpoint2 <--- user2
300  *
301  * 3) Assume that, starting from state B endpoint2 is closed. In the unregister
302  * callback endpoint2 notes that endpoint1 is still active and adds a reference
303  * from endpoint1 to itself. When user2 then releases her own reference,
304  * endpoint2 is not destroyed and we are back to state A. A symmetrical state
305  * would be reached if endpoint1 were released instead.
306  *
307  * 4) If, starting from state A, endpoint1 is closed, the destructor notes that
308  * it owns a reference to endpoint2 and releases it.
309  *
310  * Something similar goes on for the creation and destruction of the krings.
311  */
312 
313 
netmap_pipe_krings_create_both(struct netmap_adapter * na,struct netmap_adapter * ona)314 int netmap_pipe_krings_create_both(struct netmap_adapter *na,
315 				  struct netmap_adapter *ona)
316 {
317 	enum txrx t;
318 	int error;
319 	int i;
320 
321 	/* case 1) below */
322 	nm_prdis("%p: case 1, create both ends", na);
323 	error = netmap_krings_create(na, 0);
324 	if (error)
325 		return error;
326 
327 	/* create the krings of the other end */
328 	error = netmap_krings_create(ona, 0);
329 	if (error)
330 		goto del_krings1;
331 
332 	/* cross link the krings and initialize the pipe_tails */
333 	for_rx_tx(t) {
334 		enum txrx r = nm_txrx_swap(t); /* swap NR_TX <-> NR_RX */
335 		for (i = 0; i < nma_get_nrings(na, t); i++) {
336 			struct netmap_kring *k1 = NMR(na, t)[i],
337 					    *k2 = NMR(ona, r)[i];
338 			k1->pipe = k2;
339 			k2->pipe = k1;
340 			/* mark all peer-adapter rings as fake */
341 			k2->nr_kflags |= NKR_FAKERING;
342 			/* init tails */
343 			k1->pipe_tail = k1->nr_hwtail;
344 			k2->pipe_tail = k2->nr_hwtail;
345 		}
346 	}
347 
348 	return 0;
349 
350 del_krings1:
351 	netmap_krings_delete(na);
352 	return error;
353 }
354 
355 /* netmap_pipe_krings_create.
356  *
357  * There are two cases:
358  *
359  * 1) state is
360  *
361  *        usr1 --> e1 --> e2
362  *
363  *    and we are e1. We have to create both sets
364  *    of krings.
365  *
366  * 2) state is
367  *
368  *        usr1 --> e1 --> e2
369  *
370  *    and we are e2. e1 is certainly registered and our
371  *    krings already exist. Nothing to do.
372  */
373 static int
netmap_pipe_krings_create(struct netmap_adapter * na)374 netmap_pipe_krings_create(struct netmap_adapter *na)
375 {
376 	struct netmap_pipe_adapter *pna =
377 		(struct netmap_pipe_adapter *)na;
378 	struct netmap_adapter *ona = &pna->peer->up;
379 
380 	if (pna->peer_ref)
381 		return netmap_pipe_krings_create_both(na, ona);
382 
383 	return 0;
384 }
385 
386 int
netmap_pipe_reg_both(struct netmap_adapter * na,struct netmap_adapter * ona)387 netmap_pipe_reg_both(struct netmap_adapter *na, struct netmap_adapter *ona)
388 {
389 	int i, error = 0;
390 	enum txrx t;
391 
392 	for_rx_tx(t) {
393 		for (i = 0; i < nma_get_nrings(na, t); i++) {
394 			struct netmap_kring *kring = NMR(na, t)[i];
395 
396 			if (nm_kring_pending_on(kring)) {
397 				/* mark the peer ring as needed */
398 				kring->pipe->nr_kflags |= NKR_NEEDRING;
399 			}
400 		}
401 	}
402 
403 	/* create all missing needed rings on the other end.
404 	 * Either our end, or the other, has been marked as
405 	 * fake, so the allocation will not be done twice.
406 	 */
407 	error = netmap_mem_rings_create(ona);
408 	if (error)
409 		return error;
410 
411 	/* In case of no error we put our rings in netmap mode */
412 	for_rx_tx(t) {
413 		for (i = 0; i < nma_get_nrings(na, t); i++) {
414 			struct netmap_kring *kring = NMR(na, t)[i];
415 			if (nm_kring_pending_on(kring)) {
416 				struct netmap_kring *sring, *dring;
417 
418 				kring->nr_mode = NKR_NETMAP_ON;
419 				if ((kring->nr_kflags & NKR_FAKERING) &&
420 				    (kring->pipe->nr_kflags & NKR_FAKERING)) {
421 					/* this is a re-open of a pipe
422 					 * end-point kept alive by the other end.
423 					 * We need to leave everything as it is
424 					 */
425 					continue;
426 				}
427 
428 				/* copy the buffers from the non-fake ring */
429 				if (kring->nr_kflags & NKR_FAKERING) {
430 					sring = kring->pipe;
431 					dring = kring;
432 				} else {
433 					sring = kring;
434 					dring = kring->pipe;
435 				}
436 				memcpy(dring->ring->slot,
437 				       sring->ring->slot,
438 				       sizeof(struct netmap_slot) *
439 						sring->nkr_num_slots);
440 				/* mark both rings as fake and needed,
441 				 * so that buffers will not be
442 				 * deleted by the standard machinery
443 				 * (we will delete them by ourselves in
444 				 * netmap_pipe_krings_delete)
445 				 */
446 				sring->nr_kflags |=
447 					(NKR_FAKERING | NKR_NEEDRING);
448 				dring->nr_kflags |=
449 					(NKR_FAKERING | NKR_NEEDRING);
450 				kring->nr_mode = NKR_NETMAP_ON;
451 			}
452 		}
453 	}
454 
455 	return 0;
456 }
457 
458 /* netmap_pipe_reg.
459  *
460  * There are two cases on registration (onoff==1)
461  *
462  * 1.a) state is
463  *
464  *        usr1 --> e1 --> e2
465  *
466  *      and we are e1. Create the needed rings of the
467  *      other end.
468  *
469  * 1.b) state is
470  *
471  *        usr1 --> e1 --> e2 <-- usr2
472  *
473  *      and we are e2. Drop the ref e1 is holding.
474  *
475  *  There are two additional cases on unregister (onoff==0)
476  *
477  *  2.a) state is
478  *
479  *         usr1 --> e1 --> e2
480  *
481  *       and we are e1. Nothing special to do, e2 will
482  *       be cleaned up by the destructor of e1.
483  *
484  *  2.b) state is
485  *
486  *         usr1 --> e1     e2 <-- usr2
487  *
488  *       and we are either e1 or e2. Add a ref from the
489  *       other end.
490  */
491 static int
netmap_pipe_reg(struct netmap_adapter * na,int onoff)492 netmap_pipe_reg(struct netmap_adapter *na, int onoff)
493 {
494 	struct netmap_pipe_adapter *pna =
495 		(struct netmap_pipe_adapter *)na;
496 	struct netmap_adapter *ona = &pna->peer->up;
497 	int error = 0;
498 
499 	nm_prdis("%p: onoff %d", na, onoff);
500 	if (onoff) {
501 		error = netmap_pipe_reg_both(na, ona);
502 		if (error) {
503 			return error;
504 		}
505 		if (na->active_fds == 0)
506 			na->na_flags |= NAF_NETMAP_ON;
507 	} else {
508 		if (na->active_fds == 0)
509 			na->na_flags &= ~NAF_NETMAP_ON;
510 		netmap_krings_mode_commit(na, onoff);
511 	}
512 
513 	if (na->active_fds) {
514 		nm_prdis("active_fds %d", na->active_fds);
515 		return 0;
516 	}
517 
518 	if (pna->peer_ref) {
519 		nm_prdis("%p: case 1.a or 2.a, nothing to do", na);
520 		return 0;
521 	}
522 	if (onoff) {
523 		nm_prdis("%p: case 1.b, drop peer", na);
524 		pna->peer->peer_ref = 0;
525 		netmap_adapter_put(na);
526 	} else {
527 		nm_prdis("%p: case 2.b, grab peer", na);
528 		netmap_adapter_get(na);
529 		pna->peer->peer_ref = 1;
530 	}
531 	return error;
532 }
533 
534 void
netmap_pipe_krings_delete_both(struct netmap_adapter * na,struct netmap_adapter * ona)535 netmap_pipe_krings_delete_both(struct netmap_adapter *na,
536 			       struct netmap_adapter *ona)
537 {
538 	struct netmap_adapter *sna;
539 	enum txrx t;
540 	int i;
541 
542 	/* case 1) below */
543 	nm_prdis("%p: case 1, deleting everything", na);
544 	/* To avoid double-frees we zero-out all the buffers in the kernel part
545 	 * of each ring. The reason is this: If the user is behaving correctly,
546 	 * all buffers are found in exactly one slot in the userspace part of
547 	 * some ring.  If the user is not behaving correctly, we cannot release
548 	 * buffers cleanly anyway. In the latter case, the allocator will
549 	 * return to a clean state only when all its users will close.
550 	 */
551 	sna = na;
552 cleanup:
553 	for_rx_tx(t) {
554 		for (i = 0; i < nma_get_nrings(sna, t); i++) {
555 			struct netmap_kring *kring = NMR(sna, t)[i];
556 			struct netmap_ring *ring = kring->ring;
557 			uint32_t j, lim = kring->nkr_num_slots - 1;
558 
559 			nm_prdis("%s ring %p hwtail %u hwcur %u",
560 				kring->name, ring, kring->nr_hwtail, kring->nr_hwcur);
561 
562 			if (ring == NULL)
563 				continue;
564 
565 			if (kring->tx == NR_RX)
566 				ring->slot[kring->pipe_tail].buf_idx = 0;
567 
568 			for (j = nm_next(kring->pipe_tail, lim);
569 			     j != kring->nr_hwcur;
570 			     j = nm_next(j, lim))
571 			{
572 				nm_prdis("%s[%d] %u", kring->name, j, ring->slot[j].buf_idx);
573 				ring->slot[j].buf_idx = 0;
574 			}
575 			kring->nr_kflags &= ~(NKR_FAKERING | NKR_NEEDRING);
576 		}
577 
578 	}
579 	if (sna != ona && ona->tx_rings) {
580 		sna = ona;
581 		goto cleanup;
582 	}
583 
584 	netmap_mem_rings_delete(na);
585 	netmap_krings_delete(na); /* also zeroes tx_rings etc. */
586 
587 	if (ona->tx_rings == NULL) {
588 		/* already deleted, we must be on an
589 		 * cleanup-after-error path */
590 		return;
591 	}
592 	netmap_mem_rings_delete(ona);
593 	netmap_krings_delete(ona);
594 }
595 
596 /* netmap_pipe_krings_delete.
597  *
598  * There are two cases:
599  *
600  * 1) state is
601  *
602  *                usr1 --> e1 --> e2
603  *
604  *    and we are e1 (e2 is not registered, so krings_delete cannot be
605  *    called on it);
606  *
607  * 2) state is
608  *
609  *                usr1 --> e1     e2 <-- usr2
610  *
611  *    and we are either e1 or e2.
612  *
613  * In the former case we have to also delete the krings of e2;
614  * in the latter case we do nothing.
615  */
616 static void
netmap_pipe_krings_delete(struct netmap_adapter * na)617 netmap_pipe_krings_delete(struct netmap_adapter *na)
618 {
619 	struct netmap_pipe_adapter *pna =
620 		(struct netmap_pipe_adapter *)na;
621 	struct netmap_adapter *ona; /* na of the other end */
622 
623 	if (!pna->peer_ref) {
624 		nm_prdis("%p: case 2, kept alive by peer",  na);
625 		return;
626 	}
627 	ona = &pna->peer->up;
628 	netmap_pipe_krings_delete_both(na, ona);
629 }
630 
631 
632 static void
netmap_pipe_dtor(struct netmap_adapter * na)633 netmap_pipe_dtor(struct netmap_adapter *na)
634 {
635 	struct netmap_pipe_adapter *pna =
636 		(struct netmap_pipe_adapter *)na;
637 	nm_prdis("%p %p", na, pna->parent_ifp);
638 	if (pna->peer_ref) {
639 		nm_prdis("%p: clean up peer", na);
640 		pna->peer_ref = 0;
641 		netmap_adapter_put(&pna->peer->up);
642 	}
643 	if (pna->role == NM_PIPE_ROLE_MASTER)
644 		netmap_pipe_remove(pna->parent, pna);
645 	if (pna->parent_ifp)
646 		if_rele(pna->parent_ifp);
647 	netmap_adapter_put(pna->parent);
648 	pna->parent = NULL;
649 }
650 
651 int
netmap_get_pipe_na(struct nmreq_header * hdr,struct netmap_adapter ** na,struct netmap_mem_d * nmd,int create)652 netmap_get_pipe_na(struct nmreq_header *hdr, struct netmap_adapter **na,
653 		struct netmap_mem_d *nmd, int create)
654 {
655 	struct nmreq_register *req = (struct nmreq_register *)(uintptr_t)hdr->nr_body;
656 	struct netmap_adapter *pna; /* parent adapter */
657 	struct netmap_pipe_adapter *mna, *sna, *reqna;
658 	struct ifnet *ifp = NULL;
659 	const char *pipe_id = NULL;
660 	int role = 0;
661 	int error, retries = 0;
662 	char *cbra;
663 
664 	/* Try to parse the pipe syntax 'xx{yy' or 'xx}yy'. */
665 	cbra = strrchr(hdr->nr_name, '{');
666 	if (cbra != NULL) {
667 		role = NM_PIPE_ROLE_MASTER;
668 	} else {
669 		cbra = strrchr(hdr->nr_name, '}');
670 		if (cbra != NULL) {
671 			role = NM_PIPE_ROLE_SLAVE;
672 		} else {
673 			nm_prdis("not a pipe");
674 			return 0;
675 		}
676 	}
677 	pipe_id = cbra + 1;
678 	if (*pipe_id == '\0' || cbra == hdr->nr_name) {
679 		/* Bracket is the last character, so pipe name is missing;
680 		 * or bracket is the first character, so base port name
681 		 * is missing. */
682 		return EINVAL;
683 	}
684 
685 	if (req->nr_mode != NR_REG_ALL_NIC && req->nr_mode != NR_REG_ONE_NIC) {
686 		/* We only accept modes involving hardware rings. */
687 		return EINVAL;
688 	}
689 
690 	/* first, try to find the parent adapter */
691 	for (;;) {
692 		char nr_name_orig[NETMAP_REQ_IFNAMSIZ];
693 		int create_error;
694 
695 		/* Temporarily remove the pipe suffix. */
696 		strlcpy(nr_name_orig, hdr->nr_name, sizeof(nr_name_orig));
697 		*cbra = '\0';
698 		error = netmap_get_na(hdr, &pna, &ifp, nmd, create);
699 		/* Restore the pipe suffix. */
700 		strlcpy(hdr->nr_name, nr_name_orig, sizeof(hdr->nr_name));
701 		if (!error)
702 			break;
703 		if (error != ENXIO || retries++) {
704 			nm_prdis("parent lookup failed: %d", error);
705 			return error;
706 		}
707 		nm_prdis("try to create a persistent vale port");
708 		/* create a persistent vale port and try again */
709 		*cbra = '\0';
710 		NMG_UNLOCK();
711 		create_error = netmap_vi_create(hdr, 1 /* autodelete */);
712 		NMG_LOCK();
713 		strlcpy(hdr->nr_name, nr_name_orig, sizeof(hdr->nr_name));
714 		if (create_error && create_error != EEXIST) {
715 			if (create_error != EOPNOTSUPP) {
716 				nm_prerr("failed to create a persistent vale port: %d",
717 				    create_error);
718 			}
719 			return error;
720 		}
721 	}
722 
723 	if (NETMAP_OWNED_BY_KERN(pna)) {
724 		nm_prdis("parent busy");
725 		error = EBUSY;
726 		goto put_out;
727 	}
728 
729 	/* next, lookup the pipe id in the parent list */
730 	reqna = NULL;
731 	mna = netmap_pipe_find(pna, pipe_id);
732 	if (mna) {
733 		if (mna->role == role) {
734 			nm_prdis("found %s directly at %d", pipe_id, mna->parent_slot);
735 			reqna = mna;
736 		} else {
737 			nm_prdis("found %s indirectly at %d", pipe_id, mna->parent_slot);
738 			reqna = mna->peer;
739 		}
740 		/* the pipe we have found already holds a ref to the parent,
741 		 * so we need to drop the one we got from netmap_get_na()
742 		 */
743 		netmap_unget_na(pna, ifp);
744 		goto found;
745 	}
746 	nm_prdis("pipe %s not found, create %d", pipe_id, create);
747 	if (!create) {
748 		error = ENODEV;
749 		goto put_out;
750 	}
751 	/* we create both master and slave.
752 	 * The endpoint we were asked for holds a reference to
753 	 * the other one.
754 	 */
755 	mna = nm_os_malloc(sizeof(*mna));
756 	if (mna == NULL) {
757 		error = ENOMEM;
758 		goto put_out;
759 	}
760 	snprintf(mna->up.name, sizeof(mna->up.name), "%s{%s", pna->name, pipe_id);
761 
762 	mna->role = NM_PIPE_ROLE_MASTER;
763 	mna->parent = pna;
764 	mna->parent_ifp = ifp;
765 
766 	mna->up.nm_txsync = netmap_pipe_txsync;
767 	mna->up.nm_rxsync = netmap_pipe_rxsync;
768 	mna->up.nm_register = netmap_pipe_reg;
769 	mna->up.nm_dtor = netmap_pipe_dtor;
770 	mna->up.nm_krings_create = netmap_pipe_krings_create;
771 	mna->up.nm_krings_delete = netmap_pipe_krings_delete;
772 	mna->up.nm_mem = netmap_mem_get(pna->nm_mem);
773 	mna->up.na_flags |= NAF_MEM_OWNER;
774 	mna->up.na_lut = pna->na_lut;
775 
776 	mna->up.num_tx_rings = req->nr_tx_rings;
777 	nm_bound_var(&mna->up.num_tx_rings, 1,
778 			1, NM_PIPE_MAXRINGS, NULL);
779 	mna->up.num_rx_rings = req->nr_rx_rings;
780 	nm_bound_var(&mna->up.num_rx_rings, 1,
781 			1, NM_PIPE_MAXRINGS, NULL);
782 	mna->up.num_tx_desc = req->nr_tx_slots;
783 	nm_bound_var(&mna->up.num_tx_desc, pna->num_tx_desc,
784 			1, NM_PIPE_MAXSLOTS, NULL);
785 	mna->up.num_rx_desc = req->nr_rx_slots;
786 	nm_bound_var(&mna->up.num_rx_desc, pna->num_rx_desc,
787 			1, NM_PIPE_MAXSLOTS, NULL);
788 	error = netmap_attach_common(&mna->up);
789 	if (error)
790 		goto free_mna;
791 	/* register the master with the parent */
792 	error = netmap_pipe_add(pna, mna);
793 	if (error)
794 		goto free_mna;
795 
796 	/* create the slave */
797 	sna = nm_os_malloc(sizeof(*mna));
798 	if (sna == NULL) {
799 		error = ENOMEM;
800 		goto unregister_mna;
801 	}
802 	/* most fields are the same, copy from master and then fix */
803 	*sna = *mna;
804 	sna->up.nm_mem = netmap_mem_get(mna->up.nm_mem);
805 	/* swap the number of tx/rx rings and slots */
806 	sna->up.num_tx_rings = mna->up.num_rx_rings;
807 	sna->up.num_tx_desc  = mna->up.num_rx_desc;
808 	sna->up.num_rx_rings = mna->up.num_tx_rings;
809 	sna->up.num_rx_desc  = mna->up.num_tx_desc;
810 	snprintf(sna->up.name, sizeof(sna->up.name), "%s}%s", pna->name, pipe_id);
811 	sna->role = NM_PIPE_ROLE_SLAVE;
812 	error = netmap_attach_common(&sna->up);
813 	if (error)
814 		goto free_sna;
815 
816 	/* join the two endpoints */
817 	mna->peer = sna;
818 	sna->peer = mna;
819 
820 	/* we already have a reference to the parent, but we
821 	 * need another one for the other endpoint we created
822 	 */
823 	netmap_adapter_get(pna);
824 	/* likewise for the ifp, if any */
825 	if (ifp)
826 		if_ref(ifp);
827 
828 	if (role == NM_PIPE_ROLE_MASTER) {
829 		reqna = mna;
830 		mna->peer_ref = 1;
831 		netmap_adapter_get(&sna->up);
832 	} else {
833 		reqna = sna;
834 		sna->peer_ref = 1;
835 		netmap_adapter_get(&mna->up);
836 	}
837 	nm_prdis("created master %p and slave %p", mna, sna);
838 found:
839 
840 	nm_prdis("pipe %s %s at %p", pipe_id,
841 		(reqna->role == NM_PIPE_ROLE_MASTER ? "master" : "slave"), reqna);
842 	*na = &reqna->up;
843 	netmap_adapter_get(*na);
844 
845 	/* keep the reference to the parent.
846 	 * It will be released by the req destructor
847 	 */
848 
849 	return 0;
850 
851 free_sna:
852 	nm_os_free(sna);
853 unregister_mna:
854 	netmap_pipe_remove(pna, mna);
855 free_mna:
856 	nm_os_free(mna);
857 put_out:
858 	netmap_unget_na(pna, ifp);
859 	return error;
860 }
861 
862 
863 #endif /* WITH_PIPES */
864