1 /*
2 * Copyright (C) 2014-2016 Giuseppe Lettieri
3 * All rights reserved.
4 *
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions
7 * are met:
8 * 1. Redistributions of source code must retain the above copyright
9 * notice, this list of conditions and the following disclaimer.
10 * 2. Redistributions in binary form must reproduce the above copyright
11 * notice, this list of conditions and the following disclaimer in the
12 * documentation and/or other materials provided with the distribution.
13 *
14 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
15 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
16 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
17 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
18 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
19 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
20 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
21 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
22 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
23 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
24 * SUCH DAMAGE.
25 */
26
27 /*
28 * $FreeBSD: stable/12/sys/dev/netmap/netmap_monitor.c 372834 2022-12-31 12:30:39Z vmaffione $
29 *
30 * Monitors
31 *
32 * netmap monitors can be used to do monitoring of network traffic
33 * on another adapter, when the latter adapter is working in netmap mode.
34 *
35 * Monitors offer to userspace the same interface as any other netmap port,
36 * with as many pairs of netmap rings as the monitored adapter.
37 * However, only the rx rings are actually used. Each monitor rx ring receives
38 * the traffic transiting on both the tx and rx corresponding rings in the
39 * monitored adapter. During registration, the user can choose if she wants
40 * to intercept tx only, rx only, or both tx and rx traffic.
41 * The slots containing traffic intercepted in the tx direction will have
42 * the NS_TXMON flag set.
43 *
44 * If the monitor is not able to cope with the stream of frames, excess traffic
45 * will be dropped.
46 *
47 * If the monitored adapter leaves netmap mode, the monitor has to be restarted.
48 *
49 * Monitors can be either zero-copy or copy-based.
50 *
51 * Copy monitors see the frames before they are consumed:
52 *
53 * - For tx traffic, this is when the application sends them, before they are
54 * passed down to the adapter.
55 *
56 * - For rx traffic, this is when they are received by the adapter, before
57 * they are sent up to the application, if any (note that, if no
58 * application is reading from a monitored ring, the ring will eventually
59 * fill up and traffic will stop).
60 *
61 * Zero-copy monitors only see the frames after they have been consumed:
62 *
63 * - For tx traffic, this is after the slots containing the frames have been
64 * marked as free. Note that this may happen at a considerably delay after
65 * frame transmission, since freeing of slots is often done lazily.
66 *
67 * - For rx traffic, this is after the consumer on the monitored adapter
68 * has released them. In most cases, the consumer is a userspace
69 * application which may have modified the frame contents.
70 *
71 * Several copy or zero-copy monitors may be active on any ring.
72 *
73 */
74
75
76 #if defined(__FreeBSD__)
77 #include <sys/cdefs.h> /* prerequisite */
78
79 #include <sys/types.h>
80 #include <sys/errno.h>
81 #include <sys/param.h> /* defines used in kernel.h */
82 #include <sys/kernel.h> /* types used in module initialization */
83 #include <sys/malloc.h>
84 #include <sys/poll.h>
85 #include <sys/lock.h>
86 #include <sys/rwlock.h>
87 #include <sys/selinfo.h>
88 #include <sys/sysctl.h>
89 #include <sys/socket.h> /* sockaddrs */
90 #include <net/if.h>
91 #include <net/if_var.h>
92 #include <machine/bus.h> /* bus_dmamap_* */
93 #include <sys/refcount.h>
94
95
96 #elif defined(linux)
97
98 #include "bsd_glue.h"
99
100 #elif defined(__APPLE__)
101
102 #warning OSX support is only partial
103 #include "osx_glue.h"
104
105 #elif defined(_WIN32)
106 #include "win_glue.h"
107 #else
108
109 #error Unsupported platform
110
111 #endif /* unsupported */
112
113 /*
114 * common headers
115 */
116
117 #include <net/netmap.h>
118 #include <dev/netmap/netmap_kern.h>
119 #include <dev/netmap/netmap_mem2.h>
120
121 #ifdef WITH_MONITOR
122
123 #define NM_MONITOR_MAXSLOTS 4096
124
125 /*
126 ********************************************************************
127 * functions common to both kind of monitors
128 ********************************************************************
129 */
130
131 static int netmap_zmon_reg(struct netmap_adapter *, int);
132 static int
nm_is_zmon(struct netmap_adapter * na)133 nm_is_zmon(struct netmap_adapter *na)
134 {
135 return na->nm_register == netmap_zmon_reg;
136 }
137
138 /* nm_sync callback for the monitor's own tx rings.
139 * This makes no sense and always returns error
140 */
141 static int
netmap_monitor_txsync(struct netmap_kring * kring,int flags)142 netmap_monitor_txsync(struct netmap_kring *kring, int flags)
143 {
144 nm_prlim(1, "%s %x", kring->name, flags);
145 return EIO;
146 }
147
148 /* nm_sync callback for the monitor's own rx rings.
149 * Note that the lock in netmap_zmon_parent_sync only protects
150 * writers among themselves. Synchronization between writers
151 * (i.e., netmap_zmon_parent_txsync and netmap_zmon_parent_rxsync)
152 * and readers (i.e., netmap_zmon_rxsync) relies on memory barriers.
153 */
154 static int
netmap_monitor_rxsync(struct netmap_kring * kring,int flags)155 netmap_monitor_rxsync(struct netmap_kring *kring, int flags)
156 {
157 struct netmap_monitor_adapter *mna =
158 (struct netmap_monitor_adapter *)kring->na;
159 if (unlikely(mna->priv.np_na == NULL)) {
160 /* parent left netmap mode */
161 return EIO;
162 }
163 nm_prdis("%s %x", kring->name, flags);
164 kring->nr_hwcur = kring->rhead;
165 mb();
166 return 0;
167 }
168
169 /* nm_krings_create callbacks for monitors.
170 */
171 static int
netmap_monitor_krings_create(struct netmap_adapter * na)172 netmap_monitor_krings_create(struct netmap_adapter *na)
173 {
174 int error = netmap_krings_create(na, 0);
175 enum txrx t;
176
177 if (error)
178 return error;
179 /* override the host rings callbacks */
180 for_rx_tx(t) {
181 int i;
182 u_int first = nma_get_nrings(na, t);
183 for (i = 0; i < nma_get_host_nrings(na, t); i++) {
184 struct netmap_kring *kring = NMR(na, t)[first + i];
185 kring->nm_sync = t == NR_TX ? netmap_monitor_txsync :
186 netmap_monitor_rxsync;
187 }
188 }
189 return 0;
190 }
191
192 /* nm_krings_delete callback for monitors */
193 static void
netmap_monitor_krings_delete(struct netmap_adapter * na)194 netmap_monitor_krings_delete(struct netmap_adapter *na)
195 {
196 netmap_krings_delete(na);
197 }
198
199
200 static u_int
nm_txrx2flag(enum txrx t)201 nm_txrx2flag(enum txrx t)
202 {
203 return (t == NR_RX ? NR_MONITOR_RX : NR_MONITOR_TX);
204 }
205
206 /* allocate the monitors array in the monitored kring */
207 static int
nm_monitor_alloc(struct netmap_kring * kring,u_int n)208 nm_monitor_alloc(struct netmap_kring *kring, u_int n)
209 {
210 size_t old_len, len;
211 struct netmap_kring **nm;
212
213 if (n <= kring->max_monitors)
214 /* we already have more entries that requested */
215 return 0;
216
217 old_len = sizeof(struct netmap_kring *)*kring->max_monitors;
218 len = sizeof(struct netmap_kring *) * n;
219 nm = nm_os_realloc(kring->monitors, len, old_len);
220 if (nm == NULL)
221 return ENOMEM;
222
223 kring->monitors = nm;
224 kring->max_monitors = n;
225
226 return 0;
227 }
228
229 /* deallocate the parent array in the parent adapter */
230 static void
nm_monitor_dealloc(struct netmap_kring * kring)231 nm_monitor_dealloc(struct netmap_kring *kring)
232 {
233 if (kring->monitors) {
234 if (kring->n_monitors > 0) {
235 nm_prerr("freeing not empty monitor array for %s (%d dangling monitors)!",
236 kring->name, kring->n_monitors);
237 }
238 nm_os_free(kring->monitors);
239 kring->monitors = NULL;
240 kring->max_monitors = 0;
241 kring->n_monitors = 0;
242 }
243 }
244
245 /* returns 1 iff kring has no monitors */
246 static inline int
nm_monitor_none(struct netmap_kring * kring)247 nm_monitor_none(struct netmap_kring *kring)
248 {
249 return kring->n_monitors == 0 &&
250 kring->zmon_list[NR_TX].next == NULL &&
251 kring->zmon_list[NR_RX].next == NULL;
252 }
253
254 /*
255 * monitors work by replacing the nm_sync() and possibly the
256 * nm_notify() callbacks in the monitored rings.
257 */
258 static int netmap_zmon_parent_txsync(struct netmap_kring *, int);
259 static int netmap_zmon_parent_rxsync(struct netmap_kring *, int);
260 static int netmap_monitor_parent_txsync(struct netmap_kring *, int);
261 static int netmap_monitor_parent_rxsync(struct netmap_kring *, int);
262 static int netmap_monitor_parent_notify(struct netmap_kring *, int);
263
264 static int
nm_monitor_dummycb(struct netmap_kring * kring,int flags)265 nm_monitor_dummycb(struct netmap_kring *kring, int flags)
266 {
267 (void)kring;
268 (void)flags;
269 return 0;
270 }
271
272 static void
nm_monitor_intercept_callbacks(struct netmap_kring * kring)273 nm_monitor_intercept_callbacks(struct netmap_kring *kring)
274 {
275 nm_prdis("intercept callbacks on %s", kring->name);
276 kring->mon_sync = kring->nm_sync != NULL ?
277 kring->nm_sync : nm_monitor_dummycb;
278 kring->mon_notify = kring->nm_notify;
279 if (kring->tx == NR_TX) {
280 kring->nm_sync = netmap_monitor_parent_txsync;
281 } else {
282 kring->nm_sync = netmap_monitor_parent_rxsync;
283 kring->nm_notify = netmap_monitor_parent_notify;
284 kring->mon_tail = kring->nr_hwtail;
285 }
286 }
287
288 static void
nm_monitor_restore_callbacks(struct netmap_kring * kring)289 nm_monitor_restore_callbacks(struct netmap_kring *kring)
290 {
291 nm_prdis("restoring callbacks on %s", kring->name);
292 kring->nm_sync = kring->mon_sync;
293 kring->mon_sync = NULL;
294 if (kring->tx == NR_RX) {
295 kring->nm_notify = kring->mon_notify;
296 }
297 kring->mon_notify = NULL;
298 }
299
300 static struct netmap_kring *
nm_zmon_list_head(struct netmap_kring * mkring,enum txrx t)301 nm_zmon_list_head(struct netmap_kring *mkring, enum txrx t)
302 {
303 struct netmap_adapter *na = mkring->na;
304 struct netmap_kring *kring = mkring;
305 struct netmap_zmon_list *z = &kring->zmon_list[t];
306 /* reach the head of the list */
307 while (nm_is_zmon(na) && z->prev != NULL) {
308 kring = z->prev;
309 na = kring->na;
310 z = &kring->zmon_list[t];
311 }
312 return nm_is_zmon(na) ? NULL : kring;
313 }
314
315 /* add the monitor mkring to the list of monitors of kring.
316 * If this is the first monitor, intercept the callbacks
317 */
318 static int
netmap_monitor_add(struct netmap_kring * mkring,struct netmap_kring * kring,int zmon)319 netmap_monitor_add(struct netmap_kring *mkring, struct netmap_kring *kring, int zmon)
320 {
321 int error = NM_IRQ_COMPLETED;
322 enum txrx t = kring->tx;
323 struct netmap_zmon_list *z = &kring->zmon_list[t];
324 struct netmap_zmon_list *mz = &mkring->zmon_list[t];
325 struct netmap_kring *ikring = kring;
326
327 /* a zero-copy monitor which is not the first in the list
328 * must monitor the previous monitor
329 */
330 if (zmon && z->prev != NULL)
331 ikring = z->prev; /* tail of the list */
332
333 /* synchronize with concurrently running nm_sync()s */
334 nm_kr_stop(kring, NM_KR_LOCKED);
335
336 if (nm_monitor_none(ikring)) {
337 /* this is the first monitor, intercept the callbacks */
338 nm_prdis("%s: intercept callbacks on %s", mkring->name, ikring->name);
339 nm_monitor_intercept_callbacks(ikring);
340 }
341
342 if (zmon) {
343 /* append the zmon to the list */
344 ikring->zmon_list[t].next = mkring;
345 z->prev = mkring; /* new tail */
346 mz->prev = ikring;
347 mz->next = NULL;
348 /* grab a reference to the previous netmap adapter
349 * in the chain (this may be the monitored port
350 * or another zero-copy monitor)
351 */
352 netmap_adapter_get(ikring->na);
353 } else {
354 /* make sure the monitor array exists and is big enough */
355 error = nm_monitor_alloc(kring, kring->n_monitors + 1);
356 if (error)
357 goto out;
358 kring->monitors[kring->n_monitors] = mkring;
359 mkring->mon_pos[kring->tx] = kring->n_monitors;
360 kring->n_monitors++;
361 }
362
363 out:
364 nm_kr_start(kring);
365 return error;
366 }
367
368 /* remove the monitor mkring from the list of monitors of kring.
369 * If this is the last monitor, restore the original callbacks
370 */
371 static void
netmap_monitor_del(struct netmap_kring * mkring,struct netmap_kring * kring,enum txrx t)372 netmap_monitor_del(struct netmap_kring *mkring, struct netmap_kring *kring, enum txrx t)
373 {
374 int zmon = nm_is_zmon(mkring->na);
375 struct netmap_zmon_list *mz = &mkring->zmon_list[t];
376 struct netmap_kring *ikring = kring;
377
378
379 if (zmon) {
380 /* get to the head of the list */
381 kring = nm_zmon_list_head(mkring, t);
382 ikring = mz->prev;
383 }
384
385 /* synchronize with concurrently running nm_sync()s
386 * if kring is NULL (orphaned list) the monitored port
387 * has exited netmap mode, so there is nothing to stop
388 */
389 if (kring != NULL)
390 nm_kr_stop(kring, NM_KR_LOCKED);
391
392 if (zmon) {
393 /* remove the monitor from the list */
394 if (mz->next != NULL) {
395 mz->next->zmon_list[t].prev = mz->prev;
396 /* we also need to let the next monitor drop the
397 * reference to us and grab the reference to the
398 * previous ring owner, instead
399 */
400 if (mz->prev != NULL)
401 netmap_adapter_get(mz->prev->na);
402 netmap_adapter_put(mkring->na);
403 } else if (kring != NULL) {
404 /* in the monitored kring, prev is actually the
405 * pointer to the tail of the list
406 */
407 kring->zmon_list[t].prev =
408 (mz->prev != kring ? mz->prev : NULL);
409 }
410 if (mz->prev != NULL) {
411 netmap_adapter_put(mz->prev->na);
412 mz->prev->zmon_list[t].next = mz->next;
413 }
414 mz->prev = NULL;
415 mz->next = NULL;
416 } else {
417 /* this is a copy monitor */
418 uint32_t mon_pos = mkring->mon_pos[kring->tx];
419 kring->n_monitors--;
420 if (mon_pos != kring->n_monitors) {
421 kring->monitors[mon_pos] =
422 kring->monitors[kring->n_monitors];
423 kring->monitors[mon_pos]->mon_pos[kring->tx] = mon_pos;
424 }
425 kring->monitors[kring->n_monitors] = NULL;
426 if (kring->n_monitors == 0) {
427 nm_monitor_dealloc(kring);
428 }
429 }
430
431 if (ikring != NULL && nm_monitor_none(ikring)) {
432 /* this was the last monitor, restore the callbacks */
433 nm_monitor_restore_callbacks(ikring);
434 }
435
436 if (kring != NULL)
437 nm_kr_start(kring);
438 }
439
440
441 /* This is called when the monitored adapter leaves netmap mode
442 * (see netmap_do_unregif).
443 * We need to notify the monitors that the monitored rings are gone.
444 * We do this by setting their mna->priv.np_na to NULL.
445 * Note that the rings are already stopped when this happens, so
446 * no monitor ring callback can be active.
447 */
448 void
netmap_monitor_stop(struct netmap_adapter * na)449 netmap_monitor_stop(struct netmap_adapter *na)
450 {
451 enum txrx t;
452
453 for_rx_tx(t) {
454 u_int i;
455
456 for (i = 0; i < netmap_all_rings(na, t); i++) {
457 struct netmap_kring *kring = NMR(na, t)[i];
458 struct netmap_zmon_list *z = &kring->zmon_list[t];
459 u_int j;
460
461 if (nm_monitor_none(kring))
462 continue;
463
464 for (j = 0; j < kring->n_monitors; j++) {
465 struct netmap_kring *mkring =
466 kring->monitors[j];
467 struct netmap_monitor_adapter *mna =
468 (struct netmap_monitor_adapter *)mkring->na;
469 /* forget about this adapter */
470 if (mna->priv.np_na != NULL) {
471 netmap_adapter_put(mna->priv.np_na);
472 mna->priv.np_na = NULL;
473 }
474 kring->monitors[j] = NULL;
475 }
476 kring->n_monitors = 0;
477 nm_monitor_dealloc(kring);
478
479 if (!nm_is_zmon(na)) {
480 /* we are the head of at most one list */
481 struct netmap_kring *zkring;
482 for (zkring = z->next; zkring != NULL;
483 zkring = zkring->zmon_list[t].next)
484 {
485 struct netmap_monitor_adapter *next =
486 (struct netmap_monitor_adapter *)zkring->na;
487 /* let the monitor forget about us */
488 netmap_adapter_put(next->priv.np_na); /* nop if null */
489 next->priv.np_na = NULL;
490 /* drop the additional ref taken in netmap_monitor_add() */
491 netmap_adapter_put(zkring->zmon_list[t].prev->na);
492 }
493 /* orhpan the zmon list */
494 if (z->next != NULL)
495 z->next->zmon_list[t].prev = NULL;
496 z->next = NULL;
497 z->prev = NULL;
498 }
499
500 nm_monitor_restore_callbacks(kring);
501 }
502 }
503 }
504
505
506 /* common functions for the nm_register() callbacks of both kind of
507 * monitors.
508 */
509 static int
netmap_monitor_reg_common(struct netmap_adapter * na,int onoff,int zmon)510 netmap_monitor_reg_common(struct netmap_adapter *na, int onoff, int zmon)
511 {
512 struct netmap_monitor_adapter *mna =
513 (struct netmap_monitor_adapter *)na;
514 struct netmap_priv_d *priv = &mna->priv;
515 struct netmap_adapter *pna = priv->np_na;
516 struct netmap_kring *kring, *mkring;
517 int i;
518 enum txrx t, s;
519
520 nm_prdis("%p: onoff %d", na, onoff);
521 if (onoff) {
522 if (pna == NULL) {
523 /* parent left netmap mode, fatal */
524 nm_prerr("%s: parent left netmap mode", na->name);
525 return ENXIO;
526 }
527 for_rx_tx(t) {
528 for (i = 0; i < netmap_all_rings(na, t); i++) {
529 mkring = NMR(na, t)[i];
530 if (!nm_kring_pending_on(mkring))
531 continue;
532 mkring->nr_mode = NKR_NETMAP_ON;
533 if (t == NR_TX)
534 continue;
535 for_rx_tx(s) {
536 if (i > nma_get_nrings(pna, s))
537 continue;
538 if (mna->flags & nm_txrx2flag(s)) {
539 kring = NMR(pna, s)[i];
540 netmap_monitor_add(mkring, kring, zmon);
541 }
542 }
543 }
544 }
545 na->na_flags |= NAF_NETMAP_ON;
546 } else {
547 if (na->active_fds == 0)
548 na->na_flags &= ~NAF_NETMAP_ON;
549 for_rx_tx(t) {
550 for (i = 0; i < netmap_all_rings(na, t); i++) {
551 mkring = NMR(na, t)[i];
552 if (!nm_kring_pending_off(mkring))
553 continue;
554 mkring->nr_mode = NKR_NETMAP_OFF;
555 if (t == NR_TX)
556 continue;
557 /* we cannot access the parent krings if the parent
558 * has left netmap mode. This is signaled by a NULL
559 * pna pointer
560 */
561 if (pna == NULL)
562 continue;
563 for_rx_tx(s) {
564 if (i > nma_get_nrings(pna, s))
565 continue;
566 if (mna->flags & nm_txrx2flag(s)) {
567 kring = NMR(pna, s)[i];
568 netmap_monitor_del(mkring, kring, s);
569 }
570 }
571 }
572 }
573 }
574 return 0;
575 }
576
577 /*
578 ****************************************************************
579 * functions specific for zero-copy monitors
580 ****************************************************************
581 */
582
583 /*
584 * Common function for both zero-copy tx and rx nm_sync()
585 * callbacks
586 */
587 static int
netmap_zmon_parent_sync(struct netmap_kring * kring,int flags,enum txrx tx)588 netmap_zmon_parent_sync(struct netmap_kring *kring, int flags, enum txrx tx)
589 {
590 struct netmap_kring *mkring = kring->zmon_list[tx].next;
591 struct netmap_ring *ring = kring->ring, *mring;
592 int error = 0;
593 int rel_slots, free_slots, busy, sent = 0;
594 u_int beg, end, i;
595 u_int lim = kring->nkr_num_slots - 1,
596 mlim; // = mkring->nkr_num_slots - 1;
597 uint16_t txmon = kring->tx == NR_TX ? NS_TXMON : 0;
598
599 if (mkring == NULL) {
600 nm_prlim(5, "NULL monitor on %s", kring->name);
601 return 0;
602 }
603 mring = mkring->ring;
604 mlim = mkring->nkr_num_slots - 1;
605
606 /* get the relased slots (rel_slots) */
607 if (tx == NR_TX) {
608 beg = kring->nr_hwtail + 1;
609 error = kring->mon_sync(kring, flags);
610 if (error)
611 return error;
612 end = kring->nr_hwtail + 1;
613 } else { /* NR_RX */
614 beg = kring->nr_hwcur;
615 end = kring->rhead;
616 }
617
618 rel_slots = end - beg;
619 if (rel_slots < 0)
620 rel_slots += kring->nkr_num_slots;
621
622 if (!rel_slots) {
623 /* no released slots, but we still need
624 * to call rxsync if this is a rx ring
625 */
626 goto out_rxsync;
627 }
628
629 /* we need to lock the monitor receive ring, since it
630 * is the target of bot tx and rx traffic from the monitored
631 * adapter
632 */
633 mtx_lock(&mkring->q_lock);
634 /* get the free slots available on the monitor ring */
635 i = mkring->nr_hwtail;
636 busy = i - mkring->nr_hwcur;
637 if (busy < 0)
638 busy += mkring->nkr_num_slots;
639 free_slots = mlim - busy;
640
641 if (!free_slots)
642 goto out;
643
644 /* swap min(free_slots, rel_slots) slots */
645 if (free_slots < rel_slots) {
646 beg += (rel_slots - free_slots);
647 rel_slots = free_slots;
648 }
649 if (unlikely(beg >= kring->nkr_num_slots))
650 beg -= kring->nkr_num_slots;
651
652 sent = rel_slots;
653 for ( ; rel_slots; rel_slots--) {
654 struct netmap_slot *s = &ring->slot[beg];
655 struct netmap_slot *ms = &mring->slot[i];
656 uint32_t tmp;
657
658 tmp = ms->buf_idx;
659 ms->buf_idx = s->buf_idx;
660 s->buf_idx = tmp;
661 nm_prdis(5, "beg %d buf_idx %d", beg, tmp);
662
663 tmp = ms->len;
664 ms->len = s->len;
665 s->len = tmp;
666
667 ms->flags = (s->flags & ~NS_TXMON) | txmon;
668 s->flags |= NS_BUF_CHANGED;
669
670 beg = nm_next(beg, lim);
671 i = nm_next(i, mlim);
672
673 }
674 mb();
675 mkring->nr_hwtail = i;
676
677 out:
678 mtx_unlock(&mkring->q_lock);
679
680 if (sent) {
681 /* notify the new frames to the monitor */
682 mkring->nm_notify(mkring, 0);
683 }
684
685 out_rxsync:
686 if (tx == NR_RX)
687 error = kring->mon_sync(kring, flags);
688
689 return error;
690 }
691
692 /* callback used to replace the nm_sync callback in the monitored tx rings */
693 static int
netmap_zmon_parent_txsync(struct netmap_kring * kring,int flags)694 netmap_zmon_parent_txsync(struct netmap_kring *kring, int flags)
695 {
696 return netmap_zmon_parent_sync(kring, flags, NR_TX);
697 }
698
699 /* callback used to replace the nm_sync callback in the monitored rx rings */
700 static int
netmap_zmon_parent_rxsync(struct netmap_kring * kring,int flags)701 netmap_zmon_parent_rxsync(struct netmap_kring *kring, int flags)
702 {
703 return netmap_zmon_parent_sync(kring, flags, NR_RX);
704 }
705
706 static int
netmap_zmon_reg(struct netmap_adapter * na,int onoff)707 netmap_zmon_reg(struct netmap_adapter *na, int onoff)
708 {
709 return netmap_monitor_reg_common(na, onoff, 1 /* zcopy */);
710 }
711
712 /* nm_dtor callback for monitors */
713 static void
netmap_zmon_dtor(struct netmap_adapter * na)714 netmap_zmon_dtor(struct netmap_adapter *na)
715 {
716 struct netmap_monitor_adapter *mna =
717 (struct netmap_monitor_adapter *)na;
718 struct netmap_priv_d *priv = &mna->priv;
719 struct netmap_adapter *pna = priv->np_na;
720
721 netmap_adapter_put(pna);
722 }
723
724 /*
725 ****************************************************************
726 * functions specific for copy monitors
727 ****************************************************************
728 */
729
730 static void
netmap_monitor_parent_sync(struct netmap_kring * kring,u_int first_new,int new_slots)731 netmap_monitor_parent_sync(struct netmap_kring *kring, u_int first_new, int new_slots)
732 {
733 u_int j;
734 uint16_t txmon = kring->tx == NR_TX ? NS_TXMON : 0;
735
736 for (j = 0; j < kring->n_monitors; j++) {
737 struct netmap_kring *mkring = kring->monitors[j];
738 u_int i, mlim, beg;
739 int free_slots, busy, sent = 0, m;
740 u_int lim = kring->nkr_num_slots - 1;
741 struct netmap_ring *ring = kring->ring, *mring = mkring->ring;
742 u_int max_len = NETMAP_BUF_SIZE(mkring->na);
743
744 mlim = mkring->nkr_num_slots - 1;
745
746 /* we need to lock the monitor receive ring, since it
747 * is the target of bot tx and rx traffic from the monitored
748 * adapter
749 */
750 mtx_lock(&mkring->q_lock);
751 /* get the free slots available on the monitor ring */
752 i = mkring->nr_hwtail;
753 busy = i - mkring->nr_hwcur;
754 if (busy < 0)
755 busy += mkring->nkr_num_slots;
756 free_slots = mlim - busy;
757
758 if (!free_slots)
759 goto out;
760
761 /* copy min(free_slots, new_slots) slots */
762 m = new_slots;
763 beg = first_new;
764 if (free_slots < m) {
765 beg += (m - free_slots);
766 if (beg >= kring->nkr_num_slots)
767 beg -= kring->nkr_num_slots;
768 m = free_slots;
769 }
770
771 for ( ; m; m--) {
772 struct netmap_slot *s = &ring->slot[beg];
773 struct netmap_slot *ms = &mring->slot[i];
774 u_int copy_len = s->len;
775 char *src = NMB(kring->na, s),
776 *dst = NMB(mkring->na, ms);
777
778 if (unlikely(copy_len > max_len)) {
779 nm_prlim(5, "%s->%s: truncating %d to %d", kring->name,
780 mkring->name, copy_len, max_len);
781 copy_len = max_len;
782 }
783
784 memcpy(dst, src, copy_len);
785 ms->len = copy_len;
786 ms->flags = (s->flags & ~NS_TXMON) | txmon;
787 sent++;
788
789 beg = nm_next(beg, lim);
790 i = nm_next(i, mlim);
791 }
792 mb();
793 mkring->nr_hwtail = i;
794 out:
795 mtx_unlock(&mkring->q_lock);
796
797 if (sent) {
798 /* notify the new frames to the monitor */
799 mkring->nm_notify(mkring, 0);
800 }
801 }
802 }
803
804 /* callback used to replace the nm_sync callback in the monitored tx rings */
805 static int
netmap_monitor_parent_txsync(struct netmap_kring * kring,int flags)806 netmap_monitor_parent_txsync(struct netmap_kring *kring, int flags)
807 {
808 u_int first_new;
809 int new_slots;
810
811 /* get the new slots */
812 if (kring->n_monitors > 0) {
813 first_new = kring->nr_hwcur;
814 new_slots = kring->rhead - first_new;
815 if (new_slots < 0)
816 new_slots += kring->nkr_num_slots;
817 if (new_slots)
818 netmap_monitor_parent_sync(kring, first_new, new_slots);
819 }
820 if (kring->zmon_list[NR_TX].next != NULL) {
821 return netmap_zmon_parent_txsync(kring, flags);
822 }
823 return kring->mon_sync(kring, flags);
824 }
825
826 /* callback used to replace the nm_sync callback in the monitored rx rings */
827 static int
netmap_monitor_parent_rxsync(struct netmap_kring * kring,int flags)828 netmap_monitor_parent_rxsync(struct netmap_kring *kring, int flags)
829 {
830 u_int first_new;
831 int new_slots, error;
832
833 /* get the new slots */
834 if (kring->zmon_list[NR_RX].next != NULL) {
835 error = netmap_zmon_parent_rxsync(kring, flags);
836 } else {
837 error = kring->mon_sync(kring, flags);
838 }
839 if (error)
840 return error;
841 if (kring->n_monitors > 0) {
842 first_new = kring->mon_tail;
843 new_slots = kring->nr_hwtail - first_new;
844 if (new_slots < 0)
845 new_slots += kring->nkr_num_slots;
846 if (new_slots)
847 netmap_monitor_parent_sync(kring, first_new, new_slots);
848 kring->mon_tail = kring->nr_hwtail;
849 }
850 return 0;
851 }
852
853 /* callback used to replace the nm_notify() callback in the monitored rx rings */
854 static int
netmap_monitor_parent_notify(struct netmap_kring * kring,int flags)855 netmap_monitor_parent_notify(struct netmap_kring *kring, int flags)
856 {
857 int (*notify)(struct netmap_kring*, int);
858 nm_prdis(5, "%s %x", kring->name, flags);
859 /* ?xsync callbacks have tryget called by their callers
860 * (NIOCREGIF and poll()), but here we have to call it
861 * by ourself
862 */
863 if (nm_kr_tryget(kring, 0, NULL)) {
864 /* in all cases, just skip the sync */
865 return NM_IRQ_COMPLETED;
866 }
867 if (kring->n_monitors > 0) {
868 netmap_monitor_parent_rxsync(kring, NAF_FORCE_READ);
869 }
870 if (nm_monitor_none(kring)) {
871 /* we are no longer monitoring this ring, so both
872 * mon_sync and mon_notify are NULL
873 */
874 notify = kring->nm_notify;
875 } else {
876 notify = kring->mon_notify;
877 }
878 nm_kr_put(kring);
879 return notify(kring, flags);
880 }
881
882
883 static int
netmap_monitor_reg(struct netmap_adapter * na,int onoff)884 netmap_monitor_reg(struct netmap_adapter *na, int onoff)
885 {
886 return netmap_monitor_reg_common(na, onoff, 0 /* no zcopy */);
887 }
888
889 static void
netmap_monitor_dtor(struct netmap_adapter * na)890 netmap_monitor_dtor(struct netmap_adapter *na)
891 {
892 struct netmap_monitor_adapter *mna =
893 (struct netmap_monitor_adapter *)na;
894 struct netmap_priv_d *priv = &mna->priv;
895 struct netmap_adapter *pna = priv->np_na;
896
897 netmap_adapter_put(pna);
898 }
899
900
901 /* check if req is a request for a monitor adapter that we can satisfy */
902 int
netmap_get_monitor_na(struct nmreq_header * hdr,struct netmap_adapter ** na,struct netmap_mem_d * nmd,int create)903 netmap_get_monitor_na(struct nmreq_header *hdr, struct netmap_adapter **na,
904 struct netmap_mem_d *nmd, int create)
905 {
906 struct nmreq_register *req = (struct nmreq_register *)(uintptr_t)hdr->nr_body;
907 struct nmreq_register preq;
908 struct netmap_adapter *pna; /* parent adapter */
909 struct netmap_monitor_adapter *mna;
910 struct ifnet *ifp = NULL;
911 int error;
912 int zcopy = (req->nr_flags & NR_ZCOPY_MON);
913
914 if (zcopy) {
915 req->nr_flags |= (NR_MONITOR_TX | NR_MONITOR_RX);
916 }
917 if ((req->nr_flags & (NR_MONITOR_TX | NR_MONITOR_RX)) == 0) {
918 nm_prdis("not a monitor");
919 return 0;
920 }
921 /* this is a request for a monitor adapter */
922
923 nm_prdis("flags %lx", req->nr_flags);
924
925 /* First, try to find the adapter that we want to monitor.
926 * We use the same req, after we have turned off the monitor flags.
927 * In this way we can potentially monitor everything netmap understands,
928 * except other monitors.
929 */
930 memcpy(&preq, req, sizeof(preq));
931 preq.nr_flags &= ~(NR_MONITOR_TX | NR_MONITOR_RX | NR_ZCOPY_MON);
932 hdr->nr_body = (uintptr_t)&preq;
933 error = netmap_get_na(hdr, &pna, &ifp, nmd, create);
934 hdr->nr_body = (uintptr_t)req;
935 if (error) {
936 nm_prerr("parent lookup failed: %d", error);
937 return error;
938 }
939 nm_prdis("found parent: %s", pna->name);
940
941 if (!nm_netmap_on(pna)) {
942 /* parent not in netmap mode */
943 /* XXX we can wait for the parent to enter netmap mode,
944 * by intercepting its nm_register callback (2014-03-16)
945 */
946 nm_prerr("%s not in netmap mode", pna->name);
947 error = EINVAL;
948 goto put_out;
949 }
950
951 mna = nm_os_malloc(sizeof(*mna));
952 if (mna == NULL) {
953 error = ENOMEM;
954 goto put_out;
955 }
956 mna->priv.np_na = pna;
957
958 /* grab all the rings we need in the parent */
959 error = netmap_interp_ringid(&mna->priv, hdr);
960 if (error) {
961 nm_prerr("ringid error");
962 goto free_out;
963 }
964 snprintf(mna->up.name, sizeof(mna->up.name), "%s/%s%s%s#%lu", pna->name,
965 zcopy ? "z" : "",
966 (req->nr_flags & NR_MONITOR_RX) ? "r" : "",
967 (req->nr_flags & NR_MONITOR_TX) ? "t" : "",
968 pna->monitor_id++);
969
970 /* the monitor supports the host rings iff the parent does */
971 mna->up.na_flags |= (pna->na_flags & NAF_HOST_RINGS);
972 /* a do-nothing txsync: monitors cannot be used to inject packets */
973 mna->up.nm_txsync = netmap_monitor_txsync;
974 mna->up.nm_rxsync = netmap_monitor_rxsync;
975 mna->up.nm_krings_create = netmap_monitor_krings_create;
976 mna->up.nm_krings_delete = netmap_monitor_krings_delete;
977 mna->up.num_tx_rings = 1; // XXX what should we do here with chained zmons?
978 /* we set the number of our rx_rings to be max(num_rx_rings, num_rx_rings)
979 * in the parent
980 */
981 mna->up.num_rx_rings = pna->num_rx_rings;
982 if (pna->num_tx_rings > pna->num_rx_rings)
983 mna->up.num_rx_rings = pna->num_tx_rings;
984 /* by default, the number of slots is the same as in
985 * the parent rings, but the user may ask for a different
986 * number
987 */
988 mna->up.num_tx_desc = req->nr_tx_slots;
989 nm_bound_var(&mna->up.num_tx_desc, pna->num_tx_desc,
990 1, NM_MONITOR_MAXSLOTS, NULL);
991 mna->up.num_rx_desc = req->nr_rx_slots;
992 nm_bound_var(&mna->up.num_rx_desc, pna->num_rx_desc,
993 1, NM_MONITOR_MAXSLOTS, NULL);
994 if (zcopy) {
995 mna->up.nm_register = netmap_zmon_reg;
996 mna->up.nm_dtor = netmap_zmon_dtor;
997 /* to have zero copy, we need to use the same memory allocator
998 * as the monitored port
999 */
1000 mna->up.nm_mem = netmap_mem_get(pna->nm_mem);
1001 /* and the allocator cannot be changed */
1002 mna->up.na_flags |= NAF_MEM_OWNER;
1003 } else {
1004 mna->up.nm_register = netmap_monitor_reg;
1005 mna->up.nm_dtor = netmap_monitor_dtor;
1006 mna->up.nm_mem = netmap_mem_private_new(
1007 mna->up.num_tx_rings,
1008 mna->up.num_tx_desc,
1009 mna->up.num_rx_rings,
1010 mna->up.num_rx_desc,
1011 0, /* extra bufs */
1012 0, /* pipes */
1013 &error);
1014 if (mna->up.nm_mem == NULL)
1015 goto put_out;
1016 }
1017
1018 error = netmap_attach_common(&mna->up);
1019 if (error) {
1020 nm_prerr("netmap_attach_common failed");
1021 goto mem_put_out;
1022 }
1023
1024 /* remember the traffic directions we have to monitor */
1025 mna->flags = (req->nr_flags & (NR_MONITOR_TX | NR_MONITOR_RX | NR_ZCOPY_MON));
1026
1027 *na = &mna->up;
1028 netmap_adapter_get(*na);
1029
1030 /* keep the reference to the parent */
1031 nm_prdis("monitor ok");
1032
1033 /* drop the reference to the ifp, if any */
1034 if (ifp)
1035 if_rele(ifp);
1036
1037 return 0;
1038
1039 mem_put_out:
1040 netmap_mem_put(mna->up.nm_mem);
1041 free_out:
1042 nm_os_free(mna);
1043 put_out:
1044 netmap_unget_na(pna, ifp);
1045 return error;
1046 }
1047
1048
1049 #endif /* WITH_MONITOR */
1050