if_vioif.c revision 1.92 1 /* $NetBSD: if_vioif.c,v 1.92 2023/03/23 01:58:04 yamaguchi Exp $ */
2
3 /*
4 * Copyright (c) 2020 The NetBSD Foundation, Inc.
5 * Copyright (c) 2010 Minoura Makoto.
6 * All rights reserved.
7 *
8 * Redistribution and use in source and binary forms, with or without
9 * modification, are permitted provided that the following conditions
10 * are met:
11 * 1. Redistributions of source code must retain the above copyright
12 * notice, this list of conditions and the following disclaimer.
13 * 2. Redistributions in binary form must reproduce the above copyright
14 * notice, this list of conditions and the following disclaimer in the
15 * documentation and/or other materials provided with the distribution.
16 *
17 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
18 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
19 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
20 * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
21 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
22 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
23 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
24 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
25 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
26 * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
27 */
28
29 #include <sys/cdefs.h>
30 __KERNEL_RCSID(0, "$NetBSD: if_vioif.c,v 1.92 2023/03/23 01:58:04 yamaguchi Exp $");
31
32 #ifdef _KERNEL_OPT
33 #include "opt_net_mpsafe.h"
34 #endif
35
36 #include <sys/param.h>
37 #include <sys/systm.h>
38 #include <sys/kernel.h>
39 #include <sys/atomic.h>
40 #include <sys/bus.h>
41 #include <sys/condvar.h>
42 #include <sys/device.h>
43 #include <sys/evcnt.h>
44 #include <sys/intr.h>
45 #include <sys/kmem.h>
46 #include <sys/mbuf.h>
47 #include <sys/mutex.h>
48 #include <sys/sockio.h>
49 #include <sys/syslog.h>
50 #include <sys/cpu.h>
51 #include <sys/module.h>
52 #include <sys/pcq.h>
53 #include <sys/workqueue.h>
54 #include <sys/xcall.h>
55
56 #include <dev/pci/virtioreg.h>
57 #include <dev/pci/virtiovar.h>
58
59 #include <net/if.h>
60 #include <net/if_dl.h>
61 #include <net/if_media.h>
62 #include <net/if_ether.h>
63
64 #include <net/bpf.h>
65
66 #include "ioconf.h"
67
68 #ifdef NET_MPSAFE
69 #define VIOIF_MPSAFE 1
70 #define VIOIF_MULTIQ 1
71 #endif
72
73 /*
74 * if_vioifreg.h:
75 */
76 /* Configuration registers */
77 #define VIRTIO_NET_CONFIG_MAC 0 /* 8bit x 6byte */
78 #define VIRTIO_NET_CONFIG_STATUS 6 /* 16bit */
79 #define VIRTIO_NET_CONFIG_MAX_VQ_PAIRS 8 /* 16bit */
80 #define VIRTIO_NET_CONFIG_MTU 10 /* 16bit */
81
82 /* Feature bits */
83 #define VIRTIO_NET_F_CSUM __BIT(0)
84 #define VIRTIO_NET_F_GUEST_CSUM __BIT(1)
85 #define VIRTIO_NET_F_MAC __BIT(5)
86 #define VIRTIO_NET_F_GSO __BIT(6)
87 #define VIRTIO_NET_F_GUEST_TSO4 __BIT(7)
88 #define VIRTIO_NET_F_GUEST_TSO6 __BIT(8)
89 #define VIRTIO_NET_F_GUEST_ECN __BIT(9)
90 #define VIRTIO_NET_F_GUEST_UFO __BIT(10)
91 #define VIRTIO_NET_F_HOST_TSO4 __BIT(11)
92 #define VIRTIO_NET_F_HOST_TSO6 __BIT(12)
93 #define VIRTIO_NET_F_HOST_ECN __BIT(13)
94 #define VIRTIO_NET_F_HOST_UFO __BIT(14)
95 #define VIRTIO_NET_F_MRG_RXBUF __BIT(15)
96 #define VIRTIO_NET_F_STATUS __BIT(16)
97 #define VIRTIO_NET_F_CTRL_VQ __BIT(17)
98 #define VIRTIO_NET_F_CTRL_RX __BIT(18)
99 #define VIRTIO_NET_F_CTRL_VLAN __BIT(19)
100 #define VIRTIO_NET_F_CTRL_RX_EXTRA __BIT(20)
101 #define VIRTIO_NET_F_GUEST_ANNOUNCE __BIT(21)
102 #define VIRTIO_NET_F_MQ __BIT(22)
103 #define VIRTIO_NET_F_CTRL_MAC_ADDR __BIT(23)
104
105 #define VIRTIO_NET_FLAG_BITS \
106 VIRTIO_COMMON_FLAG_BITS \
107 "b\x17" "CTRL_MAC\0" \
108 "b\x16" "MQ\0" \
109 "b\x15" "GUEST_ANNOUNCE\0" \
110 "b\x14" "CTRL_RX_EXTRA\0" \
111 "b\x13" "CTRL_VLAN\0" \
112 "b\x12" "CTRL_RX\0" \
113 "b\x11" "CTRL_VQ\0" \
114 "b\x10" "STATUS\0" \
115 "b\x0f" "MRG_RXBUF\0" \
116 "b\x0e" "HOST_UFO\0" \
117 "b\x0d" "HOST_ECN\0" \
118 "b\x0c" "HOST_TSO6\0" \
119 "b\x0b" "HOST_TSO4\0" \
120 "b\x0a" "GUEST_UFO\0" \
121 "b\x09" "GUEST_ECN\0" \
122 "b\x08" "GUEST_TSO6\0" \
123 "b\x07" "GUEST_TSO4\0" \
124 "b\x06" "GSO\0" \
125 "b\x05" "MAC\0" \
126 "b\x01" "GUEST_CSUM\0" \
127 "b\x00" "CSUM\0"
128
129 /* Status */
130 #define VIRTIO_NET_S_LINK_UP 1
131
132 /* Packet header structure */
/*
 * Header that accompanies every frame on the rx/tx virtqueues.
 *
 * The trailing num_buffers member is only counted as part of the header
 * when VIRTIO_NET_F_MRG_RXBUF or VIRTIO_F_VERSION_1 has been negotiated;
 * vioif_attach() sets sc_hdr_size to either sizeof(struct virtio_net_hdr)
 * or offsetof(struct virtio_net_hdr, num_buffers) accordingly.
 */
struct virtio_net_hdr {
	uint8_t		flags;		/* VIRTIO_NET_HDR_F_* */
	uint8_t		gso_type;	/* VIRTIO_NET_HDR_GSO_* */
	uint16_t	hdr_len;
	uint16_t	gso_size;
	uint16_t	csum_start;
	uint16_t	csum_offset;

	/* present when VIRTIO_NET_F_MRG_RXBUF is enabled, or on v1 devices */
	uint16_t	num_buffers;
} __packed;
143
144 #define VIRTIO_NET_HDR_F_NEEDS_CSUM 1 /* flags */
145 #define VIRTIO_NET_HDR_GSO_NONE 0 /* gso_type */
146 #define VIRTIO_NET_HDR_GSO_TCPV4 1 /* gso_type */
147 #define VIRTIO_NET_HDR_GSO_UDP 3 /* gso_type */
148 #define VIRTIO_NET_HDR_GSO_TCPV6 4 /* gso_type */
149 #define VIRTIO_NET_HDR_GSO_ECN 0x80 /* gso_type, |'ed */
150
151 #define VIRTIO_NET_MAX_GSO_LEN (65536+ETHER_HDR_LEN)
152
153 /* Control virtqueue */
/*
 * Leading descriptor of every control virtqueue request: a command class
 * (VIRTIO_NET_CTRL_RX, _MAC, _VLAN, _MQ) and a command within that class.
 */
struct virtio_net_ctrl_cmd {
	uint8_t		class;		/* VIRTIO_NET_CTRL_<class> */
	uint8_t		command;	/* VIRTIO_NET_CTRL_<class>_<command> */
} __packed;
158 #define VIRTIO_NET_CTRL_RX 0
159 # define VIRTIO_NET_CTRL_RX_PROMISC 0
160 # define VIRTIO_NET_CTRL_RX_ALLMULTI 1
161
162 #define VIRTIO_NET_CTRL_MAC 1
163 # define VIRTIO_NET_CTRL_MAC_TABLE_SET 0
164 # define VIRTIO_NET_CTRL_MAC_ADDR_SET 1
165
166 #define VIRTIO_NET_CTRL_VLAN 2
167 # define VIRTIO_NET_CTRL_VLAN_ADD 0
168 # define VIRTIO_NET_CTRL_VLAN_DEL 1
169
170 #define VIRTIO_NET_CTRL_MQ 4
171 # define VIRTIO_NET_CTRL_MQ_VQ_PAIRS_SET 0
172 # define VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MIN 1
173 # define VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MAX 0x8000
174
/* Return value for a command sent via the control virtqueue. */
struct virtio_net_ctrl_status {
	uint8_t		ack;		/* VIRTIO_NET_OK or VIRTIO_NET_ERR */
} __packed;
178 #define VIRTIO_NET_OK 0
179 #define VIRTIO_NET_ERR 1
180
/* Parameter for a VIRTIO_NET_CTRL_RX class command. */
struct virtio_net_ctrl_rx {
	uint8_t		onoff;		/* requested state of the rx mode */
} __packed;
184
185 struct virtio_net_ctrl_mac_tbl {
186 uint32_t nentries;
187 uint8_t macs[][ETHER_ADDR_LEN];
188 } __packed;
189
190 struct virtio_net_ctrl_mac_addr {
191 uint8_t mac[ETHER_ADDR_LEN];
192 } __packed;
193
/*
 * Payload carrying a VLAN id; presumably used with the
 * VIRTIO_NET_CTRL_VLAN class commands (no user is visible in this part of
 * the file).
 */
struct virtio_net_ctrl_vlan {
	uint16_t	id;
} __packed;
197
/* Payload of the control vq "multiqueue set" command. */
struct virtio_net_ctrl_mq {
	uint16_t	virtqueue_pairs;	/* number of rx/tx queue pairs */
} __packed;
201
202 /*
203 * if_vioifvar.h:
204 */
205
206 /*
207 * Locking notes:
208 * + a field in vioif_txqueue is protected by txq_lock (a spin mutex), and
209 * a field in vioif_rxqueue is protected by rxq_lock (a spin mutex).
210 * - more than one lock cannot be held at once
211 * + ctrlq_inuse is protected by ctrlq_wait_lock.
212 * - other fields in vioif_ctrlqueue are protected by ctrlq_inuse
213 * - txq_lock or rxq_lock cannot be held along with ctrlq_wait_lock
214 * + fields in vioif_softc except queues are protected by
215 * sc->sc_lock(an adaptive mutex)
216 * - the lock is held before acquisition of other locks
217 */
218
219 struct vioif_ctrl_cmdspec {
220 bus_dmamap_t dmamap;
221 void *buf;
222 bus_size_t bufsize;
223 };
224
225 struct vioif_work {
226 struct work cookie;
227 void (*func)(void *);
228 void *arg;
229 unsigned int added;
230 };
231
232 struct vioif_txqueue {
233 kmutex_t *txq_lock; /* lock for tx operations */
234
235 struct virtqueue *txq_vq;
236 bool txq_stopping;
237 bool txq_link_active;
238 pcq_t *txq_intrq;
239
240 struct virtio_net_hdr *txq_hdrs;
241 bus_dmamap_t *txq_hdr_dmamaps;
242
243 struct mbuf **txq_mbufs;
244 bus_dmamap_t *txq_dmamaps;
245
246 void *txq_deferred_transmit;
247 void *txq_handle_si;
248 struct vioif_work txq_work;
249 bool txq_workqueue;
250 bool txq_running_handle;
251
252 char txq_evgroup[16];
253 struct evcnt txq_defrag_failed;
254 struct evcnt txq_mbuf_load_failed;
255 struct evcnt txq_enqueue_reserve_failed;
256 };
257
258 struct vioif_rxqueue {
259 kmutex_t *rxq_lock; /* lock for rx operations */
260
261 struct virtqueue *rxq_vq;
262 bool rxq_stopping;
263
264 struct virtio_net_hdr *rxq_hdrs;
265 bus_dmamap_t *rxq_hdr_dmamaps;
266
267 struct mbuf **rxq_mbufs;
268 bus_dmamap_t *rxq_dmamaps;
269
270 void *rxq_handle_si;
271 struct vioif_work rxq_work;
272 bool rxq_workqueue;
273 bool rxq_running_handle;
274
275 char rxq_evgroup[16];
276 struct evcnt rxq_mbuf_enobufs;
277 struct evcnt rxq_mbuf_load_failed;
278 struct evcnt rxq_enqueue_reserve_failed;
279 };
280
281 struct vioif_ctrlqueue {
282 struct virtqueue *ctrlq_vq;
283 enum {
284 FREE, INUSE, DONE
285 } ctrlq_inuse;
286 kcondvar_t ctrlq_wait;
287 kmutex_t ctrlq_wait_lock;
288 struct lwp *ctrlq_owner;
289
290 struct virtio_net_ctrl_cmd *ctrlq_cmd;
291 struct virtio_net_ctrl_status *ctrlq_status;
292 struct virtio_net_ctrl_rx *ctrlq_rx;
293 struct virtio_net_ctrl_mac_tbl *ctrlq_mac_tbl_uc;
294 struct virtio_net_ctrl_mac_tbl *ctrlq_mac_tbl_mc;
295 struct virtio_net_ctrl_mac_addr *ctrlq_mac_addr;
296 struct virtio_net_ctrl_mq *ctrlq_mq;
297
298 bus_dmamap_t ctrlq_cmd_dmamap;
299 bus_dmamap_t ctrlq_status_dmamap;
300 bus_dmamap_t ctrlq_rx_dmamap;
301 bus_dmamap_t ctrlq_tbl_uc_dmamap;
302 bus_dmamap_t ctrlq_tbl_mc_dmamap;
303 bus_dmamap_t ctrlq_mac_addr_dmamap;
304 bus_dmamap_t ctrlq_mq_dmamap;
305
306 struct evcnt ctrlq_cmd_load_failed;
307 struct evcnt ctrlq_cmd_failed;
308 };
309
310 struct vioif_softc {
311 device_t sc_dev;
312 kmutex_t sc_lock;
313 struct sysctllog *sc_sysctllog;
314
315 struct virtio_softc *sc_virtio;
316 struct virtqueue *sc_vqs;
317 u_int sc_hdr_size;
318
319 int sc_max_nvq_pairs;
320 int sc_req_nvq_pairs;
321 int sc_act_nvq_pairs;
322
323 uint8_t sc_mac[ETHER_ADDR_LEN];
324 struct ethercom sc_ethercom;
325 int sc_link_state;
326
327 struct vioif_txqueue *sc_txq;
328 struct vioif_rxqueue *sc_rxq;
329
330 bool sc_has_ctrl;
331 struct vioif_ctrlqueue sc_ctrlq;
332
333 bus_dma_segment_t sc_hdr_segs[1];
334 void *sc_dmamem;
335 void *sc_kmem;
336
337 void *sc_ctl_softint;
338
339 struct workqueue *sc_txrx_workqueue;
340 bool sc_txrx_workqueue_sysctl;
341 u_int sc_tx_intr_process_limit;
342 u_int sc_tx_process_limit;
343 u_int sc_rx_intr_process_limit;
344 u_int sc_rx_process_limit;
345 };
346 #define VIRTIO_NET_TX_MAXNSEGS (16) /* XXX */
347 #define VIRTIO_NET_CTRL_MAC_MAXENTRIES (64) /* XXX */
348
349 #define VIOIF_TX_INTR_PROCESS_LIMIT 256
350 #define VIOIF_TX_PROCESS_LIMIT 256
351 #define VIOIF_RX_INTR_PROCESS_LIMIT 0U
352 #define VIOIF_RX_PROCESS_LIMIT 256
353
354 #define VIOIF_WORKQUEUE_PRI PRI_SOFTNET
/* Non-zero when the softc's recorded link state is LINK_STATE_UP. */
#define VIOIF_IS_LINK_ACTIVE(_sc)	((_sc)->sc_link_state == LINK_STATE_UP)
357
358 /* cfattach interface functions */
359 static int vioif_match(device_t, cfdata_t, void *);
360 static void vioif_attach(device_t, device_t, void *);
361 static int vioif_finalize_teardown(device_t);
362
363 /* ifnet interface functions */
364 static int vioif_init(struct ifnet *);
365 static void vioif_stop(struct ifnet *, int);
366 static void vioif_start(struct ifnet *);
367 static void vioif_start_locked(struct ifnet *, struct vioif_txqueue *);
368 static int vioif_transmit(struct ifnet *, struct mbuf *);
369 static void vioif_transmit_locked(struct ifnet *, struct vioif_txqueue *);
370 static int vioif_ioctl(struct ifnet *, u_long, void *);
371 static void vioif_watchdog(struct ifnet *);
372 static int vioif_ifflags_cb(struct ethercom *);
373
374 /* rx */
375 static void vioif_populate_rx_mbufs_locked(struct vioif_softc *,
376 struct vioif_rxqueue *);
377 static void vioif_rx_queue_clear(struct vioif_rxqueue *);
378 static bool vioif_rx_deq_locked(struct vioif_softc *, struct virtio_softc *,
379 struct vioif_rxqueue *, u_int, size_t *);
380 static int vioif_rx_intr(void *);
381 static void vioif_rx_handle(void *);
382 static void vioif_rx_sched_handle(struct vioif_softc *,
383 struct vioif_rxqueue *);
384 static void vioif_rx_drain(struct vioif_rxqueue *);
385
386 /* tx */
387 static int vioif_tx_intr(void *);
388 static void vioif_tx_handle(void *);
389 static void vioif_tx_sched_handle(struct vioif_softc *,
390 struct vioif_txqueue *);
391 static void vioif_tx_queue_clear(struct vioif_txqueue *);
392 static bool vioif_tx_deq_locked(struct vioif_softc *, struct virtio_softc *,
393 struct vioif_txqueue *, u_int);
394 static void vioif_tx_drain(struct vioif_txqueue *);
395 static void vioif_deferred_transmit(void *);
396
397 /* workqueue */
398 static struct workqueue*
399 vioif_workq_create(const char *, pri_t, int, int);
400 static void vioif_workq_destroy(struct workqueue *);
401 static void vioif_workq_work(struct work *, void *);
402 static void vioif_work_set(struct vioif_work *, void(*)(void *), void *);
403 static void vioif_work_add(struct workqueue *, struct vioif_work *);
404 static void vioif_work_wait(struct workqueue *, struct vioif_work *);
405
406 /* other control */
407 static int vioif_get_link_status(struct vioif_softc *);
408 static void vioif_update_link_status(struct vioif_softc *);
409 static int vioif_ctrl_rx(struct vioif_softc *, int, bool);
410 static int vioif_set_promisc(struct vioif_softc *, bool);
411 static int vioif_set_allmulti(struct vioif_softc *, bool);
412 static int vioif_set_rx_filter(struct vioif_softc *);
413 static int vioif_rx_filter(struct vioif_softc *);
414 static int vioif_set_mac_addr(struct vioif_softc *);
415 static int vioif_ctrl_intr(void *);
416 static int vioif_config_change(struct virtio_softc *);
417 static void vioif_ctl_softint(void *);
418 static int vioif_ctrl_mq_vq_pairs_set(struct vioif_softc *, int);
419 static void vioif_enable_interrupt_vqpairs(struct vioif_softc *);
420 static void vioif_disable_interrupt_vqpairs(struct vioif_softc *);
421 static int vioif_setup_sysctl(struct vioif_softc *);
422 static void vioif_setup_stats(struct vioif_softc *);
423 static int vioif_ifflags(struct vioif_softc *);
424 static void vioif_intr_barrier(void);
425
426 CFATTACH_DECL_NEW(vioif, sizeof(struct vioif_softc),
427 vioif_match, vioif_attach, NULL, NULL);
428
429 static int
430 vioif_match(device_t parent, cfdata_t match, void *aux)
431 {
432 struct virtio_attach_args *va = aux;
433
434 if (va->sc_childdevid == VIRTIO_DEVICE_ID_NETWORK)
435 return 1;
436
437 return 0;
438 }
439
440 static int
441 vioif_dmamap_create(struct vioif_softc *sc, bus_dmamap_t *map,
442 bus_size_t size, int nsegs, const char *usage)
443 {
444 int r;
445
446 r = bus_dmamap_create(virtio_dmat(sc->sc_virtio), size,
447 nsegs, size, 0, BUS_DMA_NOWAIT | BUS_DMA_ALLOCNOW, map);
448
449 if (r != 0) {
450 aprint_error_dev(sc->sc_dev, "%s dmamap creation failed, "
451 "error code %d\n", usage, r);
452 }
453
454 return r;
455 }
456
457 static void
458 vioif_dmamap_destroy(struct vioif_softc *sc, bus_dmamap_t *map)
459 {
460
461 if (*map) {
462 bus_dmamap_destroy(virtio_dmat(sc->sc_virtio), *map);
463 *map = NULL;
464 }
465 }
466
467 static int
468 vioif_dmamap_create_load(struct vioif_softc *sc, bus_dmamap_t *map,
469 void *buf, bus_size_t size, int nsegs, int rw, const char *usage)
470 {
471 int r;
472
473 r = vioif_dmamap_create(sc, map, size, nsegs, usage);
474 if (r != 0)
475 return 1;
476
477 r = bus_dmamap_load(virtio_dmat(sc->sc_virtio), *map, buf,
478 size, NULL, rw | BUS_DMA_NOWAIT);
479 if (r != 0) {
480 vioif_dmamap_destroy(sc, map);
481 aprint_error_dev(sc->sc_dev, "%s dmamap load failed. "
482 "error code %d\n", usage, r);
483 }
484
485 return r;
486 }
487
/*
 * Carve `size' bytes out of a pre-allocated region.
 *
 * *p is the current position in the region; the function returns that
 * position as a pointer and advances *p by `size'.  No bounds or
 * alignment checks are made.
 */
static void *
vioif_assign_mem(intptr_t *p, size_t size)
{
	void *chunk = (void *)*p;

	*p += size;

	return chunk;
}
498
499 static void
500 vioif_alloc_queues(struct vioif_softc *sc)
501 {
502 int nvq_pairs = sc->sc_max_nvq_pairs;
503 int nvqs = nvq_pairs * 2;
504 int i;
505
506 KASSERT(nvq_pairs <= VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MAX);
507
508 sc->sc_rxq = kmem_zalloc(sizeof(sc->sc_rxq[0]) * nvq_pairs,
509 KM_SLEEP);
510 sc->sc_txq = kmem_zalloc(sizeof(sc->sc_txq[0]) * nvq_pairs,
511 KM_SLEEP);
512
513 if (sc->sc_has_ctrl)
514 nvqs++;
515
516 sc->sc_vqs = kmem_zalloc(sizeof(sc->sc_vqs[0]) * nvqs, KM_SLEEP);
517 nvqs = 0;
518 for (i = 0; i < nvq_pairs; i++) {
519 sc->sc_rxq[i].rxq_vq = &sc->sc_vqs[nvqs++];
520 sc->sc_txq[i].txq_vq = &sc->sc_vqs[nvqs++];
521 }
522
523 if (sc->sc_has_ctrl)
524 sc->sc_ctrlq.ctrlq_vq = &sc->sc_vqs[nvqs++];
525 }
526
527 static void
528 vioif_free_queues(struct vioif_softc *sc)
529 {
530 int nvq_pairs = sc->sc_max_nvq_pairs;
531 int nvqs = nvq_pairs * 2;
532
533 if (sc->sc_ctrlq.ctrlq_vq)
534 nvqs++;
535
536 if (sc->sc_txq) {
537 kmem_free(sc->sc_txq, sizeof(sc->sc_txq[0]) * nvq_pairs);
538 sc->sc_txq = NULL;
539 }
540
541 if (sc->sc_rxq) {
542 kmem_free(sc->sc_rxq, sizeof(sc->sc_rxq[0]) * nvq_pairs);
543 sc->sc_rxq = NULL;
544 }
545
546 if (sc->sc_vqs) {
547 kmem_free(sc->sc_vqs, sizeof(sc->sc_vqs[0]) * nvqs);
548 sc->sc_vqs = NULL;
549 }
550 }
551
552 /* allocate memory */
553 /*
554 * dma memory is used for:
555 * rxq_hdrs[slot]: metadata array for received frames (READ)
556 * txq_hdrs[slot]: metadata array for frames to be sent (WRITE)
557 * ctrlq_cmd: command to be sent via ctrl vq (WRITE)
558 * ctrlq_status: return value for a command via ctrl vq (READ)
559 * ctrlq_rx: parameter for a VIRTIO_NET_CTRL_RX class command
560 * (WRITE)
561 * ctrlq_mac_tbl_uc: unicast MAC address filter for a VIRTIO_NET_CTRL_MAC
562 * class command (WRITE)
563 * ctrlq_mac_tbl_mc: multicast MAC address filter for a VIRTIO_NET_CTRL_MAC
564 * class command (WRITE)
565 * ctrlq_* structures are allocated only one each; they are protected by
566 * ctrlq_inuse variable and ctrlq_wait condvar.
567 */
568 /*
569 * dynamically allocated memory is used for:
570 * rxq_hdr_dmamaps[slot]: bus_dmamap_t array for rxq_hdrs[slot]
571 * txq_hdr_dmamaps[slot]: bus_dmamap_t array for txq_hdrs[slot]
572 * rxq_dmamaps[slot]: bus_dmamap_t array for received payload
573 * txq_dmamaps[slot]: bus_dmamap_t array for sent payload
574 * rxq_mbufs[slot]: mbuf pointer array for received frames
575 * txq_mbufs[slot]: mbuf pointer array for sent frames
576 */
577 static int
578 vioif_alloc_mems(struct vioif_softc *sc)
579 {
580 struct virtio_softc *vsc = sc->sc_virtio;
581 struct vioif_txqueue *txq;
582 struct vioif_rxqueue *rxq;
583 struct vioif_ctrlqueue *ctrlq = &sc->sc_ctrlq;
584 int allocsize, allocsize2, r, rsegs, i, qid;
585 void *vaddr;
586 intptr_t p;
587
588 allocsize = 0;
589 for (qid = 0; qid < sc->sc_max_nvq_pairs; qid++) {
590 rxq = &sc->sc_rxq[qid];
591 txq = &sc->sc_txq[qid];
592
593 allocsize += sizeof(struct virtio_net_hdr) *
594 (rxq->rxq_vq->vq_num + txq->txq_vq->vq_num);
595 }
596 if (sc->sc_has_ctrl) {
597 allocsize += sizeof(struct virtio_net_ctrl_cmd);
598 allocsize += sizeof(struct virtio_net_ctrl_status);
599 allocsize += sizeof(struct virtio_net_ctrl_rx);
600 allocsize += sizeof(struct virtio_net_ctrl_mac_tbl)
601 + ETHER_ADDR_LEN;
602 allocsize += sizeof(struct virtio_net_ctrl_mac_tbl)
603 + ETHER_ADDR_LEN * VIRTIO_NET_CTRL_MAC_MAXENTRIES;
604 allocsize += sizeof(struct virtio_net_ctrl_mac_addr);
605 allocsize += sizeof(struct virtio_net_ctrl_mq);
606 }
607 r = bus_dmamem_alloc(virtio_dmat(vsc), allocsize, 0, 0,
608 &sc->sc_hdr_segs[0], 1, &rsegs, BUS_DMA_NOWAIT);
609 if (r != 0) {
610 aprint_error_dev(sc->sc_dev,
611 "DMA memory allocation failed, size %d, "
612 "error code %d\n", allocsize, r);
613 goto err_none;
614 }
615 r = bus_dmamem_map(virtio_dmat(vsc),
616 &sc->sc_hdr_segs[0], 1, allocsize, &vaddr, BUS_DMA_NOWAIT);
617 if (r != 0) {
618 aprint_error_dev(sc->sc_dev,
619 "DMA memory map failed, error code %d\n", r);
620 goto err_dmamem_alloc;
621 }
622
623 memset(vaddr, 0, allocsize);
624 sc->sc_dmamem = vaddr;
625 p = (intptr_t) vaddr;
626
627 for (qid = 0; qid < sc->sc_max_nvq_pairs; qid++) {
628 rxq = &sc->sc_rxq[qid];
629 txq = &sc->sc_txq[qid];
630
631 rxq->rxq_hdrs = vioif_assign_mem(&p,
632 sizeof(struct virtio_net_hdr) * rxq->rxq_vq->vq_num);
633 txq->txq_hdrs = vioif_assign_mem(&p,
634 sizeof(struct virtio_net_hdr) * txq->txq_vq->vq_num);
635 }
636 if (sc->sc_has_ctrl) {
637 ctrlq->ctrlq_cmd = vioif_assign_mem(&p,
638 sizeof(*ctrlq->ctrlq_cmd));
639 ctrlq->ctrlq_status = vioif_assign_mem(&p,
640 sizeof(*ctrlq->ctrlq_status));
641 ctrlq->ctrlq_rx = vioif_assign_mem(&p,
642 sizeof(*ctrlq->ctrlq_rx));
643 ctrlq->ctrlq_mac_tbl_uc = vioif_assign_mem(&p,
644 sizeof(*ctrlq->ctrlq_mac_tbl_uc)
645 + ETHER_ADDR_LEN);
646 ctrlq->ctrlq_mac_tbl_mc = vioif_assign_mem(&p,
647 sizeof(*ctrlq->ctrlq_mac_tbl_mc)
648 + ETHER_ADDR_LEN * VIRTIO_NET_CTRL_MAC_MAXENTRIES);
649 ctrlq->ctrlq_mac_addr = vioif_assign_mem(&p,
650 sizeof(*ctrlq->ctrlq_mac_addr));
651 ctrlq->ctrlq_mq = vioif_assign_mem(&p, sizeof(*ctrlq->ctrlq_mq));
652 }
653
654 allocsize2 = 0;
655 for (qid = 0; qid < sc->sc_max_nvq_pairs; qid++) {
656 int rxqsize, txqsize;
657
658 rxq = &sc->sc_rxq[qid];
659 txq = &sc->sc_txq[qid];
660 rxqsize = rxq->rxq_vq->vq_num;
661 txqsize = txq->txq_vq->vq_num;
662
663 allocsize2 += sizeof(rxq->rxq_dmamaps[0]) * rxqsize;
664 allocsize2 += sizeof(rxq->rxq_hdr_dmamaps[0]) * rxqsize;
665 allocsize2 += sizeof(rxq->rxq_mbufs[0]) * rxqsize;
666
667 allocsize2 += sizeof(txq->txq_dmamaps[0]) * txqsize;
668 allocsize2 += sizeof(txq->txq_hdr_dmamaps[0]) * txqsize;
669 allocsize2 += sizeof(txq->txq_mbufs[0]) * txqsize;
670 }
671 vaddr = kmem_zalloc(allocsize2, KM_SLEEP);
672 sc->sc_kmem = vaddr;
673 p = (intptr_t) vaddr;
674
675 for (qid = 0; qid < sc->sc_max_nvq_pairs; qid++) {
676 int rxqsize, txqsize;
677 rxq = &sc->sc_rxq[qid];
678 txq = &sc->sc_txq[qid];
679 rxqsize = rxq->rxq_vq->vq_num;
680 txqsize = txq->txq_vq->vq_num;
681
682 rxq->rxq_hdr_dmamaps = vioif_assign_mem(&p,
683 sizeof(rxq->rxq_hdr_dmamaps[0]) * rxqsize);
684 txq->txq_hdr_dmamaps = vioif_assign_mem(&p,
685 sizeof(txq->txq_hdr_dmamaps[0]) * txqsize);
686 rxq->rxq_dmamaps = vioif_assign_mem(&p,
687 sizeof(rxq->rxq_dmamaps[0]) * rxqsize);
688 txq->txq_dmamaps = vioif_assign_mem(&p,
689 sizeof(txq->txq_dmamaps[0]) * txqsize);
690 rxq->rxq_mbufs = vioif_assign_mem(&p,
691 sizeof(rxq->rxq_mbufs[0]) * rxqsize);
692 txq->txq_mbufs = vioif_assign_mem(&p,
693 sizeof(txq->txq_mbufs[0]) * txqsize);
694 }
695
696 for (qid = 0; qid < sc->sc_max_nvq_pairs; qid++) {
697 rxq = &sc->sc_rxq[qid];
698 txq = &sc->sc_txq[qid];
699
700 for (i = 0; i < rxq->rxq_vq->vq_num; i++) {
701 r = vioif_dmamap_create_load(sc, &rxq->rxq_hdr_dmamaps[i],
702 &rxq->rxq_hdrs[i], sc->sc_hdr_size, 1,
703 BUS_DMA_READ, "rx header");
704 if (r != 0)
705 goto err_reqs;
706
707 r = vioif_dmamap_create(sc, &rxq->rxq_dmamaps[i],
708 MCLBYTES - ETHER_ALIGN, 1, "rx payload");
709 if (r != 0)
710 goto err_reqs;
711 }
712
713 for (i = 0; i < txq->txq_vq->vq_num; i++) {
714 r = vioif_dmamap_create_load(sc, &txq->txq_hdr_dmamaps[i],
715 &txq->txq_hdrs[i], sc->sc_hdr_size, 1,
716 BUS_DMA_READ, "tx header");
717 if (r != 0)
718 goto err_reqs;
719
720 r = vioif_dmamap_create(sc, &txq->txq_dmamaps[i], ETHER_MAX_LEN,
721 VIRTIO_NET_TX_MAXNSEGS, "tx payload");
722 if (r != 0)
723 goto err_reqs;
724 }
725 }
726
727 if (sc->sc_has_ctrl) {
728 /* control vq class & command */
729 r = vioif_dmamap_create_load(sc, &ctrlq->ctrlq_cmd_dmamap,
730 ctrlq->ctrlq_cmd, sizeof(*ctrlq->ctrlq_cmd), 1,
731 BUS_DMA_WRITE, "control command");
732 if (r != 0)
733 goto err_reqs;
734
735 r = vioif_dmamap_create_load(sc, &ctrlq->ctrlq_status_dmamap,
736 ctrlq->ctrlq_status, sizeof(*ctrlq->ctrlq_status), 1,
737 BUS_DMA_READ, "control status");
738 if (r != 0)
739 goto err_reqs;
740
741 /* control vq rx mode command parameter */
742 r = vioif_dmamap_create_load(sc, &ctrlq->ctrlq_rx_dmamap,
743 ctrlq->ctrlq_rx, sizeof(*ctrlq->ctrlq_rx), 1,
744 BUS_DMA_WRITE, "rx mode control command");
745 if (r != 0)
746 goto err_reqs;
747
748 /* multiqueue set command */
749 r = vioif_dmamap_create_load(sc, &ctrlq->ctrlq_mq_dmamap,
750 ctrlq->ctrlq_mq, sizeof(*ctrlq->ctrlq_mq), 1,
751 BUS_DMA_WRITE, "multiqueue set command");
752 if (r != 0)
753 goto err_reqs;
754
755 /* control vq MAC filter table for unicast */
756 /* do not load now since its length is variable */
757 r = vioif_dmamap_create(sc, &ctrlq->ctrlq_tbl_uc_dmamap,
758 sizeof(*ctrlq->ctrlq_mac_tbl_uc)
759 + ETHER_ADDR_LEN, 1,
760 "unicast MAC address filter command");
761 if (r != 0)
762 goto err_reqs;
763
764 /* control vq MAC filter table for multicast */
765 r = vioif_dmamap_create(sc, &ctrlq->ctrlq_tbl_mc_dmamap,
766 sizeof(*ctrlq->ctrlq_mac_tbl_mc)
767 + ETHER_ADDR_LEN * VIRTIO_NET_CTRL_MAC_MAXENTRIES, 1,
768 "multicast MAC address filter command");
769 if (r != 0)
770 goto err_reqs;
771
772 /* control vq MAC address set command */
773 r = vioif_dmamap_create_load(sc,
774 &ctrlq->ctrlq_mac_addr_dmamap,
775 ctrlq->ctrlq_mac_addr,
776 sizeof(*ctrlq->ctrlq_mac_addr), 1,
777 BUS_DMA_WRITE, "mac addr set command");
778 if (r != 0)
779 goto err_reqs;
780 }
781
782 return 0;
783
784 err_reqs:
785 vioif_dmamap_destroy(sc, &ctrlq->ctrlq_tbl_mc_dmamap);
786 vioif_dmamap_destroy(sc, &ctrlq->ctrlq_tbl_uc_dmamap);
787 vioif_dmamap_destroy(sc, &ctrlq->ctrlq_rx_dmamap);
788 vioif_dmamap_destroy(sc, &ctrlq->ctrlq_status_dmamap);
789 vioif_dmamap_destroy(sc, &ctrlq->ctrlq_cmd_dmamap);
790 vioif_dmamap_destroy(sc, &ctrlq->ctrlq_mac_addr_dmamap);
791 for (qid = 0; qid < sc->sc_max_nvq_pairs; qid++) {
792 rxq = &sc->sc_rxq[qid];
793 txq = &sc->sc_txq[qid];
794
795 for (i = 0; i < txq->txq_vq->vq_num; i++) {
796 vioif_dmamap_destroy(sc, &txq->txq_dmamaps[i]);
797 vioif_dmamap_destroy(sc, &txq->txq_hdr_dmamaps[i]);
798 }
799 for (i = 0; i < rxq->rxq_vq->vq_num; i++) {
800 vioif_dmamap_destroy(sc, &rxq->rxq_dmamaps[i]);
801 vioif_dmamap_destroy(sc, &rxq->rxq_hdr_dmamaps[i]);
802 }
803 }
804 if (sc->sc_kmem) {
805 kmem_free(sc->sc_kmem, allocsize2);
806 sc->sc_kmem = NULL;
807 }
808 bus_dmamem_unmap(virtio_dmat(vsc), sc->sc_dmamem, allocsize);
809 err_dmamem_alloc:
810 bus_dmamem_free(virtio_dmat(vsc), &sc->sc_hdr_segs[0], 1);
811 err_none:
812 return -1;
813 }
814
815 static void
816 vioif_attach(device_t parent, device_t self, void *aux)
817 {
818 struct vioif_softc *sc = device_private(self);
819 struct virtio_softc *vsc = device_private(parent);
820 struct vioif_ctrlqueue *ctrlq = &sc->sc_ctrlq;
821 struct vioif_txqueue *txq;
822 struct vioif_rxqueue *rxq;
823 uint64_t features, req_features;
824 struct ifnet *ifp = &sc->sc_ethercom.ec_if;
825 u_int softint_flags;
826 int r, i, nvqs = 0, req_flags;
827 char xnamebuf[MAXCOMLEN];
828
829 if (virtio_child(vsc) != NULL) {
830 aprint_normal(": child already attached for %s; "
831 "something wrong...\n", device_xname(parent));
832 return;
833 }
834
835 sc->sc_dev = self;
836 sc->sc_virtio = vsc;
837 sc->sc_link_state = LINK_STATE_UNKNOWN;
838
839 sc->sc_max_nvq_pairs = 1;
840 sc->sc_req_nvq_pairs = 1;
841 sc->sc_act_nvq_pairs = 1;
842 sc->sc_txrx_workqueue_sysctl = true;
843 sc->sc_tx_intr_process_limit = VIOIF_TX_INTR_PROCESS_LIMIT;
844 sc->sc_tx_process_limit = VIOIF_TX_PROCESS_LIMIT;
845 sc->sc_rx_intr_process_limit = VIOIF_RX_INTR_PROCESS_LIMIT;
846 sc->sc_rx_process_limit = VIOIF_RX_PROCESS_LIMIT;
847
848 mutex_init(&sc->sc_lock, MUTEX_DEFAULT, IPL_NONE);
849
850 snprintf(xnamebuf, sizeof(xnamebuf), "%s_txrx", device_xname(self));
851 sc->sc_txrx_workqueue = vioif_workq_create(xnamebuf, VIOIF_WORKQUEUE_PRI,
852 IPL_NET, WQ_PERCPU | WQ_MPSAFE);
853 if (sc->sc_txrx_workqueue == NULL)
854 goto err;
855
856 req_flags = 0;
857
858 #ifdef VIOIF_MPSAFE
859 req_flags |= VIRTIO_F_INTR_MPSAFE;
860 #endif
861 req_flags |= VIRTIO_F_INTR_MSIX;
862
863 req_features =
864 VIRTIO_NET_F_MAC | VIRTIO_NET_F_STATUS | VIRTIO_NET_F_CTRL_VQ |
865 VIRTIO_NET_F_CTRL_RX | VIRTIO_F_NOTIFY_ON_EMPTY;
866 req_features |= VIRTIO_F_RING_EVENT_IDX;
867 req_features |= VIRTIO_NET_F_CTRL_MAC_ADDR;
868 #ifdef VIOIF_MULTIQ
869 req_features |= VIRTIO_NET_F_MQ;
870 #endif
871 virtio_child_attach_start(vsc, self, IPL_NET, NULL,
872 vioif_config_change, virtio_vq_intrhand, req_flags,
873 req_features, VIRTIO_NET_FLAG_BITS);
874
875 features = virtio_features(vsc);
876 if (features == 0)
877 goto err;
878
879 if (features & VIRTIO_NET_F_MAC) {
880 for (i = 0; i < __arraycount(sc->sc_mac); i++) {
881 sc->sc_mac[i] = virtio_read_device_config_1(vsc,
882 VIRTIO_NET_CONFIG_MAC + i);
883 }
884 } else {
885 /* code stolen from sys/net/if_tap.c */
886 struct timeval tv;
887 uint32_t ui;
888 getmicrouptime(&tv);
889 ui = (tv.tv_sec ^ tv.tv_usec) & 0xffffff;
890 memcpy(sc->sc_mac+3, (uint8_t *)&ui, 3);
891 for (i = 0; i < __arraycount(sc->sc_mac); i++) {
892 virtio_write_device_config_1(vsc,
893 VIRTIO_NET_CONFIG_MAC + i, sc->sc_mac[i]);
894 }
895 }
896
897 /* 'Ethernet' with capital follows other ethernet driver attachment */
898 aprint_normal_dev(self, "Ethernet address %s\n",
899 ether_sprintf(sc->sc_mac));
900
901 if (features & (VIRTIO_NET_F_MRG_RXBUF | VIRTIO_F_VERSION_1)) {
902 sc->sc_hdr_size = sizeof(struct virtio_net_hdr);
903 } else {
904 sc->sc_hdr_size = offsetof(struct virtio_net_hdr, num_buffers);
905 }
906
907 if ((features & VIRTIO_NET_F_CTRL_VQ) &&
908 (features & VIRTIO_NET_F_CTRL_RX)) {
909 sc->sc_has_ctrl = true;
910
911 cv_init(&ctrlq->ctrlq_wait, "ctrl_vq");
912 mutex_init(&ctrlq->ctrlq_wait_lock, MUTEX_DEFAULT, IPL_NET);
913 ctrlq->ctrlq_inuse = FREE;
914 } else {
915 sc->sc_has_ctrl = false;
916 }
917
918 if (sc->sc_has_ctrl && (features & VIRTIO_NET_F_MQ)) {
919 sc->sc_max_nvq_pairs = virtio_read_device_config_2(vsc,
920 VIRTIO_NET_CONFIG_MAX_VQ_PAIRS);
921
922 if (sc->sc_max_nvq_pairs > VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MAX)
923 goto err;
924
925 /* Limit the number of queue pairs to use */
926 sc->sc_req_nvq_pairs = MIN(sc->sc_max_nvq_pairs, ncpu);
927 }
928
929 vioif_alloc_queues(sc);
930 virtio_child_attach_set_vqs(vsc, sc->sc_vqs, sc->sc_req_nvq_pairs);
931
932 #ifdef VIOIF_MPSAFE
933 softint_flags = SOFTINT_NET | SOFTINT_MPSAFE;
934 #else
935 softint_flags = SOFTINT_NET;
936 #endif
937
938 /*
939 * Allocating virtqueues
940 */
941 for (i = 0; i < sc->sc_max_nvq_pairs; i++) {
942 rxq = &sc->sc_rxq[i];
943 txq = &sc->sc_txq[i];
944 char qname[32];
945
946 rxq->rxq_lock = mutex_obj_alloc(MUTEX_DEFAULT, IPL_NET);
947
948 rxq->rxq_handle_si = softint_establish(softint_flags,
949 vioif_rx_handle, rxq);
950 if (rxq->rxq_handle_si == NULL) {
951 aprint_error_dev(self, "cannot establish rx softint\n");
952 goto err;
953 }
954
955 snprintf(qname, sizeof(qname), "rx%d", i);
956 r = virtio_alloc_vq(vsc, rxq->rxq_vq, nvqs,
957 MCLBYTES + sc->sc_hdr_size, 2, qname);
958 if (r != 0)
959 goto err;
960 nvqs++;
961 rxq->rxq_vq->vq_intrhand = vioif_rx_intr;
962 rxq->rxq_vq->vq_intrhand_arg = (void *)rxq;
963 rxq->rxq_stopping = false;
964 rxq->rxq_running_handle = false;
965 vioif_work_set(&rxq->rxq_work, vioif_rx_handle, rxq);
966
967 txq->txq_lock = mutex_obj_alloc(MUTEX_DEFAULT, IPL_NET);
968
969 txq->txq_deferred_transmit = softint_establish(softint_flags,
970 vioif_deferred_transmit, txq);
971 if (txq->txq_deferred_transmit == NULL) {
972 aprint_error_dev(self, "cannot establish tx softint\n");
973 goto err;
974 }
975 txq->txq_handle_si = softint_establish(softint_flags,
976 vioif_tx_handle, txq);
977 if (txq->txq_handle_si == NULL) {
978 aprint_error_dev(self, "cannot establish tx softint\n");
979 goto err;
980 }
981
982 snprintf(qname, sizeof(qname), "tx%d", i);
983 r = virtio_alloc_vq(vsc, txq->txq_vq, nvqs,
984 sc->sc_hdr_size + (ETHER_MAX_LEN - ETHER_HDR_LEN),
985 VIRTIO_NET_TX_MAXNSEGS + 1, qname);
986 if (r != 0)
987 goto err;
988 nvqs++;
989 txq->txq_vq->vq_intrhand = vioif_tx_intr;
990 txq->txq_vq->vq_intrhand_arg = (void *)txq;
991 txq->txq_link_active = VIOIF_IS_LINK_ACTIVE(sc);
992 txq->txq_stopping = false;
993 txq->txq_running_handle = false;
994 txq->txq_intrq = pcq_create(txq->txq_vq->vq_num, KM_SLEEP);
995 vioif_work_set(&txq->txq_work, vioif_tx_handle, txq);
996 }
997
998 if (sc->sc_has_ctrl) {
999 /*
1000 * Allocating a virtqueue for control channel
1001 */
1002 r = virtio_alloc_vq(vsc, ctrlq->ctrlq_vq, nvqs,
1003 NBPG, 1, "control");
1004 if (r != 0) {
1005 aprint_error_dev(self, "failed to allocate "
1006 "a virtqueue for control channel, error code %d\n",
1007 r);
1008
1009 sc->sc_has_ctrl = false;
1010 cv_destroy(&ctrlq->ctrlq_wait);
1011 mutex_destroy(&ctrlq->ctrlq_wait_lock);
1012 } else {
1013 nvqs++;
1014 ctrlq->ctrlq_vq->vq_intrhand = vioif_ctrl_intr;
1015 ctrlq->ctrlq_vq->vq_intrhand_arg = (void *) ctrlq;
1016 }
1017 }
1018
1019 sc->sc_ctl_softint = softint_establish(softint_flags,
1020 vioif_ctl_softint, sc);
1021 if (sc->sc_ctl_softint == NULL) {
1022 aprint_error_dev(self, "cannot establish ctl softint\n");
1023 goto err;
1024 }
1025
1026 if (vioif_alloc_mems(sc) < 0)
1027 goto err;
1028
1029 if (virtio_child_attach_finish(vsc) != 0)
1030 goto err;
1031
1032 if (vioif_setup_sysctl(sc) != 0) {
1033 aprint_error_dev(self, "unable to create sysctl node\n");
1034 /* continue */
1035 }
1036
1037 vioif_setup_stats(sc);
1038
1039 strlcpy(ifp->if_xname, device_xname(self), IFNAMSIZ);
1040 ifp->if_softc = sc;
1041 ifp->if_flags = IFF_BROADCAST | IFF_SIMPLEX | IFF_MULTICAST;
1042 #ifdef VIOIF_MPSAFE
1043 ifp->if_extflags = IFEF_MPSAFE;
1044 #endif
1045 ifp->if_start = vioif_start;
1046 if (sc->sc_req_nvq_pairs > 1)
1047 ifp->if_transmit = vioif_transmit;
1048 ifp->if_ioctl = vioif_ioctl;
1049 ifp->if_init = vioif_init;
1050 ifp->if_stop = vioif_stop;
1051 ifp->if_capabilities = 0;
1052 ifp->if_watchdog = vioif_watchdog;
1053 txq = &sc->sc_txq[0];
1054 IFQ_SET_MAXLEN(&ifp->if_snd, MAX(txq->txq_vq->vq_num, IFQ_MAXLEN));
1055 IFQ_SET_READY(&ifp->if_snd);
1056
1057 sc->sc_ethercom.ec_capabilities |= ETHERCAP_VLAN_MTU;
1058
1059 if_attach(ifp);
1060 if_deferred_start_init(ifp, NULL);
1061 ether_ifattach(ifp, sc->sc_mac);
1062 ether_set_ifflags_cb(&sc->sc_ethercom, vioif_ifflags_cb);
1063
1064 return;
1065
1066 err:
1067 for (i = 0; i < sc->sc_max_nvq_pairs; i++) {
1068 rxq = &sc->sc_rxq[i];
1069 txq = &sc->sc_txq[i];
1070
1071 if (rxq->rxq_lock) {
1072 mutex_obj_free(rxq->rxq_lock);
1073 rxq->rxq_lock = NULL;
1074 }
1075
1076 if (rxq->rxq_handle_si) {
1077 softint_disestablish(rxq->rxq_handle_si);
1078 rxq->rxq_handle_si = NULL;
1079 }
1080
1081 if (txq->txq_lock) {
1082 mutex_obj_free(txq->txq_lock);
1083 txq->txq_lock = NULL;
1084 }
1085
1086 if (txq->txq_handle_si) {
1087 softint_disestablish(txq->txq_handle_si);
1088 txq->txq_handle_si = NULL;
1089 }
1090
1091 if (txq->txq_deferred_transmit) {
1092 softint_disestablish(txq->txq_deferred_transmit);
1093 txq->txq_deferred_transmit = NULL;
1094 }
1095
1096 if (txq->txq_intrq) {
1097 pcq_destroy(txq->txq_intrq);
1098 txq->txq_intrq = NULL;
1099 }
1100 }
1101
1102 if (sc->sc_has_ctrl) {
1103 cv_destroy(&ctrlq->ctrlq_wait);
1104 mutex_destroy(&ctrlq->ctrlq_wait_lock);
1105 }
1106
1107 while (nvqs > 0)
1108 virtio_free_vq(vsc, &sc->sc_vqs[--nvqs]);
1109
1110 vioif_free_queues(sc);
1111 mutex_destroy(&sc->sc_lock);
1112 virtio_child_attach_failed(vsc);
1113 config_finalize_register(self, vioif_finalize_teardown);
1114
1115 return;
1116 }
1117
1118 static int
1119 vioif_finalize_teardown(device_t self)
1120 {
1121 struct vioif_softc *sc = device_private(self);
1122
1123 if (sc->sc_txrx_workqueue != NULL) {
1124 vioif_workq_destroy(sc->sc_txrx_workqueue);
1125 sc->sc_txrx_workqueue = NULL;
1126 }
1127
1128 return 0;
1129 }
1130
1131 static void
1132 vioif_enable_interrupt_vqpairs(struct vioif_softc *sc)
1133 {
1134 struct virtio_softc *vsc = sc->sc_virtio;
1135 struct vioif_txqueue *txq;
1136 struct vioif_rxqueue *rxq;
1137 int i;
1138
1139 for (i = 0; i < sc->sc_act_nvq_pairs; i++) {
1140 txq = &sc->sc_txq[i];
1141 rxq = &sc->sc_rxq[i];
1142
1143 virtio_start_vq_intr(vsc, txq->txq_vq);
1144 virtio_start_vq_intr(vsc, rxq->rxq_vq);
1145 }
1146 }
1147
1148 static void
1149 vioif_disable_interrupt_vqpairs(struct vioif_softc *sc)
1150 {
1151 struct virtio_softc *vsc = sc->sc_virtio;
1152 struct vioif_txqueue *txq;
1153 struct vioif_rxqueue *rxq;
1154 int i;
1155
1156 for (i = 0; i < sc->sc_act_nvq_pairs; i++) {
1157 rxq = &sc->sc_rxq[i];
1158 txq = &sc->sc_txq[i];
1159
1160 virtio_stop_vq_intr(vsc, rxq->rxq_vq);
1161 virtio_stop_vq_intr(vsc, txq->txq_vq);
1162 }
1163 }
1164
1165 /*
1166 * Interface functions for ifnet
1167 */
1168 static int
1169 vioif_init(struct ifnet *ifp)
1170 {
1171 struct vioif_softc *sc = ifp->if_softc;
1172 struct virtio_softc *vsc = sc->sc_virtio;
1173 struct vioif_rxqueue *rxq;
1174 struct vioif_ctrlqueue *ctrlq = &sc->sc_ctrlq;
1175 int r, i;
1176
1177 vioif_stop(ifp, 0);
1178
1179 r = virtio_reinit_start(vsc);
1180 if (r != 0) {
1181 log(LOG_ERR, "%s: reset failed\n", ifp->if_xname);
1182 return EIO;
1183 }
1184
1185 virtio_negotiate_features(vsc, virtio_features(vsc));
1186
1187 for (i = 0; i < sc->sc_req_nvq_pairs; i++) {
1188 rxq = &sc->sc_rxq[i];
1189
1190 mutex_enter(rxq->rxq_lock);
1191 vioif_populate_rx_mbufs_locked(sc, rxq);
1192 mutex_exit(rxq->rxq_lock);
1193
1194 }
1195
1196 virtio_reinit_end(vsc);
1197
1198 if (sc->sc_has_ctrl)
1199 virtio_start_vq_intr(vsc, ctrlq->ctrlq_vq);
1200
1201 r = vioif_ctrl_mq_vq_pairs_set(sc, sc->sc_req_nvq_pairs);
1202 if (r == 0)
1203 sc->sc_act_nvq_pairs = sc->sc_req_nvq_pairs;
1204 else
1205 sc->sc_act_nvq_pairs = 1;
1206
1207 vioif_enable_interrupt_vqpairs(sc);
1208
1209 vioif_update_link_status(sc);
1210 ifp->if_flags |= IFF_RUNNING;
1211 ifp->if_flags &= ~IFF_OACTIVE;
1212 r = vioif_rx_filter(sc);
1213
1214 return r;
1215 }
1216
1217 static void
1218 vioif_stop(struct ifnet *ifp, int disable)
1219 {
1220 struct vioif_softc *sc = ifp->if_softc;
1221 struct virtio_softc *vsc = sc->sc_virtio;
1222 struct vioif_txqueue *txq;
1223 struct vioif_rxqueue *rxq;
1224 struct vioif_ctrlqueue *ctrlq = &sc->sc_ctrlq;
1225 int i;
1226
1227
1228 for (i = 0; i < sc->sc_act_nvq_pairs; i++) {
1229 txq = &sc->sc_txq[i];
1230 rxq = &sc->sc_rxq[i];
1231
1232 mutex_enter(rxq->rxq_lock);
1233 rxq->rxq_stopping = true;
1234 mutex_exit(rxq->rxq_lock);
1235
1236 mutex_enter(txq->txq_lock);
1237 txq->txq_stopping = true;
1238 mutex_exit(txq->txq_lock);
1239 }
1240
1241 /* disable interrupts */
1242 vioif_disable_interrupt_vqpairs(sc);
1243 if (sc->sc_has_ctrl)
1244 virtio_stop_vq_intr(vsc, ctrlq->ctrlq_vq);
1245
1246 /*
1247 * only way to stop interrupt, I/O and DMA is resetting...
1248 *
1249 * NOTE: Devices based on VirtIO draft specification can not
1250 * stop interrupt completely even if virtio_stop_vq_intr() is called.
1251 */
1252 virtio_reset(vsc);
1253
1254 vioif_intr_barrier();
1255
1256 for (i = 0; i < sc->sc_act_nvq_pairs; i++) {
1257 txq = &sc->sc_txq[i];
1258 rxq = &sc->sc_rxq[i];
1259
1260 vioif_work_wait(sc->sc_txrx_workqueue, &rxq->rxq_work);
1261 vioif_work_wait(sc->sc_txrx_workqueue, &txq->txq_work);
1262 }
1263
1264 for (i = 0; i < sc->sc_act_nvq_pairs; i++) {
1265 vioif_rx_queue_clear(&sc->sc_rxq[i]);
1266 vioif_tx_queue_clear(&sc->sc_txq[i]);
1267 }
1268
1269 ifp->if_flags &= ~(IFF_RUNNING | IFF_OACTIVE);
1270
1271 /* all packet processing is stopped */
1272 for (i = 0; i < sc->sc_act_nvq_pairs; i++) {
1273 txq = &sc->sc_txq[i];
1274 rxq = &sc->sc_rxq[i];
1275
1276 mutex_enter(rxq->rxq_lock);
1277 rxq->rxq_stopping = false;
1278 KASSERT(!rxq->rxq_running_handle);
1279 mutex_exit(rxq->rxq_lock);
1280
1281 mutex_enter(txq->txq_lock);
1282 txq->txq_stopping = false;
1283 KASSERT(!txq->txq_running_handle);
1284 mutex_exit(txq->txq_lock);
1285 }
1286
1287 for (i = 0; i < sc->sc_act_nvq_pairs; i++) {
1288 txq = &sc->sc_txq[i];
1289 rxq = &sc->sc_rxq[i];
1290
1291 vioif_rx_drain(rxq);
1292 vioif_tx_drain(txq);
1293 }
1294 }
1295
1296 static void
1297 vioif_send_common_locked(struct ifnet *ifp, struct vioif_txqueue *txq,
1298 bool is_transmit)
1299 {
1300 struct vioif_softc *sc = ifp->if_softc;
1301 struct virtio_softc *vsc = sc->sc_virtio;
1302 struct virtqueue *vq = txq->txq_vq;
1303 struct virtio_net_hdr *hdr;
1304 struct mbuf *m;
1305 int queued = 0;
1306
1307 KASSERT(mutex_owned(txq->txq_lock));
1308
1309 if ((ifp->if_flags & IFF_RUNNING) == 0)
1310 return;
1311
1312 if (!txq->txq_link_active || txq->txq_stopping)
1313 return;
1314
1315 if ((ifp->if_flags & IFF_OACTIVE) != 0 && !is_transmit)
1316 return;
1317
1318 for (;;) {
1319 int slot, r;
1320
1321 if (is_transmit)
1322 m = pcq_get(txq->txq_intrq);
1323 else
1324 IFQ_DEQUEUE(&ifp->if_snd, m);
1325
1326 if (m == NULL)
1327 break;
1328
1329 r = virtio_enqueue_prep(vsc, vq, &slot);
1330 if (r == EAGAIN) {
1331 ifp->if_flags |= IFF_OACTIVE;
1332 m_freem(m);
1333 break;
1334 }
1335 if (r != 0)
1336 panic("enqueue_prep for a tx buffer");
1337
1338 r = bus_dmamap_load_mbuf(virtio_dmat(vsc),
1339 txq->txq_dmamaps[slot], m, BUS_DMA_WRITE | BUS_DMA_NOWAIT);
1340 if (r != 0) {
1341 /* maybe just too fragmented */
1342 struct mbuf *newm;
1343
1344 newm = m_defrag(m, M_NOWAIT);
1345 if (newm == NULL) {
1346 txq->txq_defrag_failed.ev_count++;
1347 goto skip;
1348 }
1349
1350 m = newm;
1351 r = bus_dmamap_load_mbuf(virtio_dmat(vsc),
1352 txq->txq_dmamaps[slot], m,
1353 BUS_DMA_WRITE | BUS_DMA_NOWAIT);
1354 if (r != 0) {
1355 txq->txq_mbuf_load_failed.ev_count++;
1356 skip:
1357 m_freem(m);
1358 virtio_enqueue_abort(vsc, vq, slot);
1359 continue;
1360 }
1361 }
1362
1363 /* This should actually never fail */
1364 r = virtio_enqueue_reserve(vsc, vq, slot,
1365 txq->txq_dmamaps[slot]->dm_nsegs + 1);
1366 if (r != 0) {
1367 txq->txq_enqueue_reserve_failed.ev_count++;
1368 bus_dmamap_unload(virtio_dmat(vsc),
1369 txq->txq_dmamaps[slot]);
1370 /* slot already freed by virtio_enqueue_reserve */
1371 m_freem(m);
1372 continue;
1373 }
1374
1375 txq->txq_mbufs[slot] = m;
1376
1377 hdr = &txq->txq_hdrs[slot];
1378 memset(hdr, 0, sc->sc_hdr_size);
1379 bus_dmamap_sync(virtio_dmat(vsc), txq->txq_dmamaps[slot],
1380 0, txq->txq_dmamaps[slot]->dm_mapsize,
1381 BUS_DMASYNC_PREWRITE);
1382 bus_dmamap_sync(virtio_dmat(vsc), txq->txq_hdr_dmamaps[slot],
1383 0, txq->txq_hdr_dmamaps[slot]->dm_mapsize,
1384 BUS_DMASYNC_PREWRITE);
1385 virtio_enqueue(vsc, vq, slot, txq->txq_hdr_dmamaps[slot], true);
1386 virtio_enqueue(vsc, vq, slot, txq->txq_dmamaps[slot], true);
1387 virtio_enqueue_commit(vsc, vq, slot, false);
1388
1389 queued++;
1390 bpf_mtap(ifp, m, BPF_D_OUT);
1391 }
1392
1393 if (queued > 0) {
1394 virtio_enqueue_commit(vsc, vq, -1, true);
1395 ifp->if_timer = 5;
1396 }
1397 }
1398
1399 static void
1400 vioif_start_locked(struct ifnet *ifp, struct vioif_txqueue *txq)
1401 {
1402
1403 /*
1404 * ifp->if_obytes and ifp->if_omcasts are added in if_transmit()@if.c.
1405 */
1406 vioif_send_common_locked(ifp, txq, false);
1407
1408 }
1409
1410 static void
1411 vioif_start(struct ifnet *ifp)
1412 {
1413 struct vioif_softc *sc = ifp->if_softc;
1414 struct vioif_txqueue *txq = &sc->sc_txq[0];
1415
1416 #ifdef VIOIF_MPSAFE
1417 KASSERT(if_is_mpsafe(ifp));
1418 #endif
1419
1420 mutex_enter(txq->txq_lock);
1421 vioif_start_locked(ifp, txq);
1422 mutex_exit(txq->txq_lock);
1423 }
1424
1425 static inline int
1426 vioif_select_txqueue(struct ifnet *ifp, struct mbuf *m)
1427 {
1428 struct vioif_softc *sc = ifp->if_softc;
1429 u_int cpuid = cpu_index(curcpu());
1430
1431 return cpuid % sc->sc_act_nvq_pairs;
1432 }
1433
1434 static void
1435 vioif_transmit_locked(struct ifnet *ifp, struct vioif_txqueue *txq)
1436 {
1437
1438 vioif_send_common_locked(ifp, txq, true);
1439 }
1440
1441 static int
1442 vioif_transmit(struct ifnet *ifp, struct mbuf *m)
1443 {
1444 struct vioif_softc *sc = ifp->if_softc;
1445 struct vioif_txqueue *txq;
1446 int qid;
1447
1448 qid = vioif_select_txqueue(ifp, m);
1449 txq = &sc->sc_txq[qid];
1450
1451 if (__predict_false(!pcq_put(txq->txq_intrq, m))) {
1452 m_freem(m);
1453 return ENOBUFS;
1454 }
1455
1456 net_stat_ref_t nsr = IF_STAT_GETREF(ifp);
1457 if_statadd_ref(nsr, if_obytes, m->m_pkthdr.len);
1458 if (m->m_flags & M_MCAST)
1459 if_statinc_ref(nsr, if_omcasts);
1460 IF_STAT_PUTREF(ifp);
1461
1462 if (mutex_tryenter(txq->txq_lock)) {
1463 vioif_transmit_locked(ifp, txq);
1464 mutex_exit(txq->txq_lock);
1465 }
1466
1467 return 0;
1468 }
1469
1470 static void
1471 vioif_deferred_transmit(void *arg)
1472 {
1473 struct vioif_txqueue *txq = arg;
1474 struct virtio_softc *vsc = txq->txq_vq->vq_owner;
1475 struct vioif_softc *sc = device_private(virtio_child(vsc));
1476 struct ifnet *ifp = &sc->sc_ethercom.ec_if;
1477
1478 mutex_enter(txq->txq_lock);
1479 vioif_send_common_locked(ifp, txq, true);
1480 mutex_exit(txq->txq_lock);
1481 }
1482
1483 static int
1484 vioif_ioctl(struct ifnet *ifp, u_long cmd, void *data)
1485 {
1486 int s, r;
1487
1488 s = splnet();
1489
1490 r = ether_ioctl(ifp, cmd, data);
1491 if (r == ENETRESET && (cmd == SIOCADDMULTI || cmd == SIOCDELMULTI)) {
1492 if (ifp->if_flags & IFF_RUNNING) {
1493 r = vioif_rx_filter(ifp->if_softc);
1494 } else {
1495 r = 0;
1496 }
1497 }
1498
1499 splx(s);
1500
1501 return r;
1502 }
1503
1504 void
1505 vioif_watchdog(struct ifnet *ifp)
1506 {
1507 struct vioif_softc *sc = ifp->if_softc;
1508 int i;
1509
1510 if (ifp->if_flags & IFF_RUNNING) {
1511 for (i = 0; i < sc->sc_act_nvq_pairs; i++) {
1512 vioif_tx_queue_clear(&sc->sc_txq[i]);
1513 }
1514 }
1515 }
1516
1517 /*
1518 * Receive implementation
1519 */
1520 /* add mbufs for all the empty receive slots */
1521 static void
1522 vioif_populate_rx_mbufs_locked(struct vioif_softc *sc, struct vioif_rxqueue *rxq)
1523 {
1524 struct virtqueue *vq = rxq->rxq_vq;
1525 struct virtio_softc *vsc = vq->vq_owner;
1526 struct mbuf *m;
1527 int i, r, ndone = 0;
1528
1529 KASSERT(mutex_owned(rxq->rxq_lock));
1530
1531 for (i = 0; i < vq->vq_num; i++) {
1532 int slot;
1533 r = virtio_enqueue_prep(vsc, vq, &slot);
1534 if (r == EAGAIN)
1535 break;
1536 if (r != 0)
1537 panic("enqueue_prep for rx buffers");
1538
1539 MGETHDR(m, M_DONTWAIT, MT_DATA);
1540 if (m == NULL) {
1541 virtio_enqueue_abort(vsc, vq, slot);
1542 rxq->rxq_mbuf_enobufs.ev_count++;
1543 break;
1544 }
1545 MCLGET(m, M_DONTWAIT);
1546 if ((m->m_flags & M_EXT) == 0) {
1547 virtio_enqueue_abort(vsc, vq, slot);
1548 m_freem(m);
1549 rxq->rxq_mbuf_enobufs.ev_count++;
1550 break;
1551 }
1552
1553 m->m_len = m->m_pkthdr.len = MCLBYTES;
1554 m_adj(m, ETHER_ALIGN);
1555
1556 r = bus_dmamap_load_mbuf(virtio_dmat(vsc),
1557 rxq->rxq_dmamaps[slot], m, BUS_DMA_READ | BUS_DMA_NOWAIT);
1558
1559 if (r != 0) {
1560 virtio_enqueue_abort(vsc, vq, slot);
1561 m_freem(m);
1562 rxq->rxq_mbuf_load_failed.ev_count++;
1563 break;
1564 }
1565
1566 r = virtio_enqueue_reserve(vsc, vq, slot,
1567 rxq->rxq_dmamaps[slot]->dm_nsegs + 1);
1568 if (r != 0) {
1569 rxq->rxq_enqueue_reserve_failed.ev_count++;
1570 bus_dmamap_unload(virtio_dmat(vsc), rxq->rxq_dmamaps[slot]);
1571 m_freem(m);
1572 /* slot already freed by virtio_enqueue_reserve */
1573 break;
1574 }
1575 KASSERT(rxq->rxq_mbufs[slot] == NULL);
1576 rxq->rxq_mbufs[slot] = m;
1577 bus_dmamap_sync(virtio_dmat(vsc), rxq->rxq_hdr_dmamaps[slot],
1578 0, sc->sc_hdr_size, BUS_DMASYNC_PREREAD);
1579 bus_dmamap_sync(virtio_dmat(vsc), rxq->rxq_dmamaps[slot],
1580 0, rxq->rxq_dmamaps[slot]->dm_mapsize, BUS_DMASYNC_PREREAD);
1581 virtio_enqueue(vsc, vq, slot, rxq->rxq_hdr_dmamaps[slot],
1582 false);
1583 virtio_enqueue(vsc, vq, slot, rxq->rxq_dmamaps[slot], false);
1584 virtio_enqueue_commit(vsc, vq, slot, false);
1585 ndone++;
1586 }
1587 if (ndone > 0)
1588 virtio_enqueue_commit(vsc, vq, -1, true);
1589 }
1590
1591 static void
1592 vioif_rx_queue_clear(struct vioif_rxqueue *rxq)
1593 {
1594 struct virtqueue *vq = rxq->rxq_vq;
1595 struct virtio_softc *vsc = vq->vq_owner;
1596 struct vioif_softc *sc = device_private(virtio_child(vsc));
1597 u_int limit = UINT_MAX;
1598 bool more;
1599
1600 mutex_enter(rxq->rxq_lock);
1601 for (;;) {
1602 more = vioif_rx_deq_locked(sc, vsc, rxq, limit, NULL);
1603 if (more == false)
1604 break;
1605 }
1606 mutex_exit(rxq->rxq_lock);
1607 }
1608
1609 /* dequeue received packets */
1610 static bool
1611 vioif_rx_deq_locked(struct vioif_softc *sc, struct virtio_softc *vsc,
1612 struct vioif_rxqueue *rxq, u_int limit, size_t *ndeqp)
1613 {
1614 struct virtqueue *vq = rxq->rxq_vq;
1615 struct ifnet *ifp = &sc->sc_ethercom.ec_if;
1616 struct mbuf *m;
1617 int slot, len;
1618 bool more;
1619 size_t ndeq;
1620
1621 KASSERT(mutex_owned(rxq->rxq_lock));
1622
1623 more = false;
1624 ndeq = 0;
1625
1626 if (virtio_vq_is_enqueued(vsc, vq) == false)
1627 goto done;
1628
1629 for (;;ndeq++) {
1630 if (ndeq >= limit) {
1631 more = true;
1632 break;
1633 }
1634
1635 if (virtio_dequeue(vsc, vq, &slot, &len) != 0)
1636 break;
1637
1638 len -= sc->sc_hdr_size;
1639 bus_dmamap_sync(virtio_dmat(vsc), rxq->rxq_hdr_dmamaps[slot],
1640 0, sc->sc_hdr_size, BUS_DMASYNC_POSTREAD);
1641 bus_dmamap_sync(virtio_dmat(vsc), rxq->rxq_dmamaps[slot],
1642 0, rxq->rxq_dmamaps[slot]->dm_mapsize, BUS_DMASYNC_POSTREAD);
1643 m = rxq->rxq_mbufs[slot];
1644 KASSERT(m != NULL);
1645 bus_dmamap_unload(virtio_dmat(vsc), rxq->rxq_dmamaps[slot]);
1646 rxq->rxq_mbufs[slot] = NULL;
1647 virtio_dequeue_commit(vsc, vq, slot);
1648 m_set_rcvif(m, ifp);
1649 m->m_len = m->m_pkthdr.len = len;
1650
1651 if_percpuq_enqueue(ifp->if_percpuq, m);
1652 }
1653
1654
1655 done:
1656 if (ndeqp != NULL)
1657 *ndeqp = ndeq;
1658
1659 return more;
1660 }
1661
1662 /* rx interrupt; call _dequeue above and schedule a softint */
1663
1664 static void
1665 vioif_rx_handle_locked(void *xrxq, u_int limit)
1666 {
1667 struct vioif_rxqueue *rxq = xrxq;
1668 struct virtqueue *vq = rxq->rxq_vq;
1669 struct virtio_softc *vsc = vq->vq_owner;
1670 struct vioif_softc *sc = device_private(virtio_child(vsc));
1671 bool more;
1672 int enqueued;
1673 size_t ndeq;
1674
1675 KASSERT(mutex_owned(rxq->rxq_lock));
1676 KASSERT(!rxq->rxq_stopping);
1677
1678 more = vioif_rx_deq_locked(sc, vsc, rxq, limit, &ndeq);
1679 if (ndeq > 0)
1680 vioif_populate_rx_mbufs_locked(sc, rxq);
1681
1682 if (more) {
1683 vioif_rx_sched_handle(sc, rxq);
1684 return;
1685 }
1686
1687 enqueued = virtio_start_vq_intr(vsc, rxq->rxq_vq);
1688 if (enqueued != 0) {
1689 virtio_stop_vq_intr(vsc, rxq->rxq_vq);
1690 vioif_rx_sched_handle(sc, rxq);
1691 return;
1692 }
1693
1694 rxq->rxq_running_handle = false;
1695 }
1696
1697 static int
1698 vioif_rx_intr(void *arg)
1699 {
1700 struct vioif_rxqueue *rxq = arg;
1701 struct virtqueue *vq = rxq->rxq_vq;
1702 struct virtio_softc *vsc = vq->vq_owner;
1703 struct vioif_softc *sc = device_private(virtio_child(vsc));
1704 u_int limit;
1705
1706
1707 mutex_enter(rxq->rxq_lock);
1708
1709 /* rx handler is already running in softint/workqueue */
1710 if (rxq->rxq_running_handle)
1711 goto done;
1712
1713 if (rxq->rxq_stopping)
1714 goto done;
1715
1716 rxq->rxq_running_handle = true;
1717
1718 limit = sc->sc_rx_intr_process_limit;
1719 virtio_stop_vq_intr(vsc, vq);
1720 vioif_rx_handle_locked(rxq, limit);
1721
1722 done:
1723 mutex_exit(rxq->rxq_lock);
1724 return 1;
1725 }
1726
1727 static void
1728 vioif_rx_handle(void *xrxq)
1729 {
1730 struct vioif_rxqueue *rxq = xrxq;
1731 struct virtqueue *vq = rxq->rxq_vq;
1732 struct virtio_softc *vsc = vq->vq_owner;
1733 struct vioif_softc *sc = device_private(virtio_child(vsc));
1734 u_int limit;
1735
1736 mutex_enter(rxq->rxq_lock);
1737
1738 KASSERT(rxq->rxq_running_handle);
1739
1740 if (rxq->rxq_stopping) {
1741 rxq->rxq_running_handle = false;
1742 goto done;
1743 }
1744
1745 limit = sc->sc_rx_process_limit;
1746 vioif_rx_handle_locked(rxq, limit);
1747
1748 done:
1749 mutex_exit(rxq->rxq_lock);
1750 }
1751
1752 static void
1753 vioif_rx_sched_handle(struct vioif_softc *sc, struct vioif_rxqueue *rxq)
1754 {
1755
1756 KASSERT(mutex_owned(rxq->rxq_lock));
1757
1758 if (rxq->rxq_stopping)
1759 return;
1760
1761 if (rxq->rxq_workqueue)
1762 vioif_work_add(sc->sc_txrx_workqueue, &rxq->rxq_work);
1763 else
1764 softint_schedule(rxq->rxq_handle_si);
1765 }
1766
1767 /* free all the mbufs; called from if_stop(disable) */
1768 static void
1769 vioif_rx_drain(struct vioif_rxqueue *rxq)
1770 {
1771 struct virtqueue *vq = rxq->rxq_vq;
1772 struct virtio_softc *vsc = vq->vq_owner;
1773 struct mbuf *m;
1774 int i;
1775
1776 for (i = 0; i < vq->vq_num; i++) {
1777 m = rxq->rxq_mbufs[i];
1778 if (m == NULL)
1779 continue;
1780 rxq->rxq_mbufs[i] = NULL;
1781 bus_dmamap_unload(virtio_dmat(vsc), rxq->rxq_dmamaps[i]);
1782 m_freem(m);
1783 }
1784 }
1785
/*
 * Transmission implementation
 */
1789 /* actual transmission is done in if_start */
1790 /* tx interrupt; dequeue and free mbufs */
1791 /*
1792 * tx interrupt is actually disabled; this should be called upon
1793 * tx vq full and watchdog
1794 */
1795
1796 static void
1797 vioif_tx_handle_locked(struct vioif_txqueue *txq, u_int limit)
1798 {
1799 struct virtqueue *vq = txq->txq_vq;
1800 struct virtio_softc *vsc = vq->vq_owner;
1801 struct vioif_softc *sc = device_private(virtio_child(vsc));
1802 struct ifnet *ifp = &sc->sc_ethercom.ec_if;
1803 bool more;
1804 int enqueued;
1805
1806 KASSERT(mutex_owned(txq->txq_lock));
1807 KASSERT(!txq->txq_stopping);
1808
1809 more = vioif_tx_deq_locked(sc, vsc, txq, limit);
1810 if (more) {
1811 vioif_tx_sched_handle(sc, txq);
1812 return;
1813 }
1814
1815 enqueued = (virtio_features(vsc) & VIRTIO_F_RING_EVENT_IDX) ?
1816 virtio_postpone_intr_smart(vsc, vq):
1817 virtio_start_vq_intr(vsc, vq);
1818 if (enqueued != 0) {
1819 virtio_stop_vq_intr(vsc, vq);
1820 vioif_tx_sched_handle(sc, txq);
1821 return;
1822 }
1823
1824 txq->txq_running_handle = false;
1825
1826 /* for ALTQ */
1827 if (txq == &sc->sc_txq[0]) {
1828 if_schedule_deferred_start(ifp);
1829 ifp->if_flags &= ~IFF_OACTIVE;
1830 }
1831 softint_schedule(txq->txq_deferred_transmit);
1832 }
1833
1834
1835 static int
1836 vioif_tx_intr(void *arg)
1837 {
1838 struct vioif_txqueue *txq = arg;
1839 struct virtqueue *vq = txq->txq_vq;
1840 struct virtio_softc *vsc = vq->vq_owner;
1841 struct vioif_softc *sc = device_private(virtio_child(vsc));
1842 u_int limit;
1843
1844 limit = sc->sc_tx_intr_process_limit;
1845
1846 mutex_enter(txq->txq_lock);
1847
1848 /* tx handler is already running in softint/workqueue */
1849 if (txq->txq_running_handle)
1850 goto done;
1851
1852 if (txq->txq_stopping)
1853 goto done;
1854
1855 txq->txq_running_handle = true;
1856
1857 virtio_stop_vq_intr(vsc, vq);
1858 txq->txq_workqueue = sc->sc_txrx_workqueue_sysctl;
1859 vioif_tx_handle_locked(txq, limit);
1860
1861 done:
1862 mutex_exit(txq->txq_lock);
1863 return 1;
1864 }
1865
1866 static void
1867 vioif_tx_handle(void *xtxq)
1868 {
1869 struct vioif_txqueue *txq = xtxq;
1870 struct virtqueue *vq = txq->txq_vq;
1871 struct virtio_softc *vsc = vq->vq_owner;
1872 struct vioif_softc *sc = device_private(virtio_child(vsc));
1873 u_int limit;
1874
1875 mutex_enter(txq->txq_lock);
1876
1877 KASSERT(txq->txq_running_handle);
1878
1879 if (txq->txq_stopping) {
1880 txq->txq_running_handle = false;
1881 goto done;
1882 }
1883
1884 limit = sc->sc_tx_process_limit;
1885 vioif_tx_handle_locked(txq, limit);
1886
1887 done:
1888 mutex_exit(txq->txq_lock);
1889 }
1890
1891 static void
1892 vioif_tx_sched_handle(struct vioif_softc *sc, struct vioif_txqueue *txq)
1893 {
1894
1895 KASSERT(mutex_owned(txq->txq_lock));
1896
1897 if (txq->txq_stopping)
1898 return;
1899
1900 if (txq->txq_workqueue)
1901 vioif_work_add(sc->sc_txrx_workqueue, &txq->txq_work);
1902 else
1903 softint_schedule(txq->txq_handle_si);
1904 }
1905
1906 static void
1907 vioif_tx_queue_clear(struct vioif_txqueue *txq)
1908 {
1909 struct virtqueue *vq = txq->txq_vq;
1910 struct virtio_softc *vsc = vq->vq_owner;
1911 struct vioif_softc *sc = device_private(virtio_child(vsc));
1912 u_int limit = UINT_MAX;
1913 bool more;
1914
1915 mutex_enter(txq->txq_lock);
1916 for (;;) {
1917 more = vioif_tx_deq_locked(sc, vsc, txq, limit);
1918 if (more == false)
1919 break;
1920 }
1921 mutex_exit(txq->txq_lock);
1922 }
1923
1924 static bool
1925 vioif_tx_deq_locked(struct vioif_softc *sc, struct virtio_softc *vsc,
1926 struct vioif_txqueue *txq, u_int limit)
1927 {
1928 struct virtqueue *vq = txq->txq_vq;
1929 struct ifnet *ifp = &sc->sc_ethercom.ec_if;
1930 struct mbuf *m;
1931 int slot, len;
1932 bool more = false;
1933
1934 KASSERT(mutex_owned(txq->txq_lock));
1935
1936 if (virtio_vq_is_enqueued(vsc, vq) == false)
1937 return false;
1938
1939 for (;;) {
1940 if (limit-- == 0) {
1941 more = true;
1942 break;
1943 }
1944
1945 if (virtio_dequeue(vsc, vq, &slot, &len) != 0)
1946 break;
1947
1948 bus_dmamap_sync(virtio_dmat(vsc), txq->txq_hdr_dmamaps[slot],
1949 0, sc->sc_hdr_size, BUS_DMASYNC_POSTWRITE);
1950 bus_dmamap_sync(virtio_dmat(vsc), txq->txq_dmamaps[slot],
1951 0, txq->txq_dmamaps[slot]->dm_mapsize,
1952 BUS_DMASYNC_POSTWRITE);
1953 m = txq->txq_mbufs[slot];
1954 bus_dmamap_unload(virtio_dmat(vsc), txq->txq_dmamaps[slot]);
1955 txq->txq_mbufs[slot] = NULL;
1956 virtio_dequeue_commit(vsc, vq, slot);
1957 if_statinc(ifp, if_opackets);
1958 m_freem(m);
1959 }
1960
1961 return more;
1962 }
1963
1964 /* free all the mbufs already put on vq; called from if_stop(disable) */
1965 static void
1966 vioif_tx_drain(struct vioif_txqueue *txq)
1967 {
1968 struct virtqueue *vq = txq->txq_vq;
1969 struct virtio_softc *vsc = vq->vq_owner;
1970 int i;
1971
1972 for (i = 0; i < vq->vq_num; i++) {
1973 if (txq->txq_mbufs[i] == NULL)
1974 continue;
1975 bus_dmamap_unload(virtio_dmat(vsc), txq->txq_dmamaps[i]);
1976 m_freem(txq->txq_mbufs[i]);
1977 txq->txq_mbufs[i] = NULL;
1978 }
1979 }
1980
1981 /*
1982 * Control vq
1983 */
1984 /* issue a VIRTIO_NET_CTRL_RX class command and wait for completion */
1985 static void
1986 vioif_ctrl_acquire(struct vioif_softc *sc)
1987 {
1988 struct vioif_ctrlqueue *ctrlq = &sc->sc_ctrlq;
1989
1990 mutex_enter(&ctrlq->ctrlq_wait_lock);
1991 while (ctrlq->ctrlq_inuse != FREE)
1992 cv_wait(&ctrlq->ctrlq_wait, &ctrlq->ctrlq_wait_lock);
1993 ctrlq->ctrlq_inuse = INUSE;
1994 ctrlq->ctrlq_owner = curlwp;
1995 mutex_exit(&ctrlq->ctrlq_wait_lock);
1996 }
1997
1998 static void
1999 vioif_ctrl_release(struct vioif_softc *sc)
2000 {
2001 struct vioif_ctrlqueue *ctrlq = &sc->sc_ctrlq;
2002
2003 KASSERT(ctrlq->ctrlq_inuse != FREE);
2004 KASSERT(ctrlq->ctrlq_owner == curlwp);
2005
2006 mutex_enter(&ctrlq->ctrlq_wait_lock);
2007 ctrlq->ctrlq_inuse = FREE;
2008 ctrlq->ctrlq_owner = NULL;
2009 cv_signal(&ctrlq->ctrlq_wait);
2010 mutex_exit(&ctrlq->ctrlq_wait_lock);
2011 }
2012
2013 static int
2014 vioif_ctrl_load_cmdspec(struct vioif_softc *sc,
2015 struct vioif_ctrl_cmdspec *specs, int nspecs)
2016 {
2017 struct virtio_softc *vsc = sc->sc_virtio;
2018 int i, r, loaded;
2019
2020 loaded = 0;
2021 for (i = 0; i < nspecs; i++) {
2022 r = bus_dmamap_load(virtio_dmat(vsc),
2023 specs[i].dmamap, specs[i].buf, specs[i].bufsize,
2024 NULL, BUS_DMA_WRITE | BUS_DMA_NOWAIT);
2025 if (r) {
2026 sc->sc_ctrlq.ctrlq_cmd_load_failed.ev_count++;
2027 goto err;
2028 }
2029 loaded++;
2030
2031 }
2032
2033 return r;
2034
2035 err:
2036 for (i = 0; i < loaded; i++) {
2037 bus_dmamap_unload(virtio_dmat(vsc), specs[i].dmamap);
2038 }
2039
2040 return r;
2041 }
2042
2043 static void
2044 vioif_ctrl_unload_cmdspec(struct vioif_softc *sc,
2045 struct vioif_ctrl_cmdspec *specs, int nspecs)
2046 {
2047 struct virtio_softc *vsc = sc->sc_virtio;
2048 int i;
2049
2050 for (i = 0; i < nspecs; i++) {
2051 bus_dmamap_unload(virtio_dmat(vsc), specs[i].dmamap);
2052 }
2053 }
2054
2055 static int
2056 vioif_ctrl_send_command(struct vioif_softc *sc, uint8_t class, uint8_t cmd,
2057 struct vioif_ctrl_cmdspec *specs, int nspecs)
2058 {
2059 struct vioif_ctrlqueue *ctrlq = &sc->sc_ctrlq;
2060 struct virtqueue *vq = ctrlq->ctrlq_vq;
2061 struct virtio_softc *vsc = sc->sc_virtio;
2062 int i, r, slot;
2063
2064 ctrlq->ctrlq_cmd->class = class;
2065 ctrlq->ctrlq_cmd->command = cmd;
2066
2067 bus_dmamap_sync(virtio_dmat(vsc), ctrlq->ctrlq_cmd_dmamap,
2068 0, sizeof(struct virtio_net_ctrl_cmd), BUS_DMASYNC_PREWRITE);
2069 for (i = 0; i < nspecs; i++) {
2070 bus_dmamap_sync(virtio_dmat(vsc), specs[i].dmamap,
2071 0, specs[i].bufsize, BUS_DMASYNC_PREWRITE);
2072 }
2073 bus_dmamap_sync(virtio_dmat(vsc), ctrlq->ctrlq_status_dmamap,
2074 0, sizeof(struct virtio_net_ctrl_status), BUS_DMASYNC_PREREAD);
2075
2076 /* we need to explicitly (re)start vq intr when using RING EVENT IDX */
2077 if (virtio_features(vsc) & VIRTIO_F_RING_EVENT_IDX)
2078 virtio_start_vq_intr(vsc, ctrlq->ctrlq_vq);
2079
2080 r = virtio_enqueue_prep(vsc, vq, &slot);
2081 if (r != 0)
2082 panic("%s: control vq busy!?", device_xname(sc->sc_dev));
2083 r = virtio_enqueue_reserve(vsc, vq, slot, nspecs + 2);
2084 if (r != 0)
2085 panic("%s: control vq busy!?", device_xname(sc->sc_dev));
2086 virtio_enqueue(vsc, vq, slot, ctrlq->ctrlq_cmd_dmamap, true);
2087 for (i = 0; i < nspecs; i++) {
2088 virtio_enqueue(vsc, vq, slot, specs[i].dmamap, true);
2089 }
2090 virtio_enqueue(vsc, vq, slot, ctrlq->ctrlq_status_dmamap, false);
2091 virtio_enqueue_commit(vsc, vq, slot, true);
2092
2093 /* wait for done */
2094 mutex_enter(&ctrlq->ctrlq_wait_lock);
2095 while (ctrlq->ctrlq_inuse != DONE)
2096 cv_wait(&ctrlq->ctrlq_wait, &ctrlq->ctrlq_wait_lock);
2097 mutex_exit(&ctrlq->ctrlq_wait_lock);
2098 /* already dequeueued */
2099
2100 bus_dmamap_sync(virtio_dmat(vsc), ctrlq->ctrlq_cmd_dmamap, 0,
2101 sizeof(struct virtio_net_ctrl_cmd), BUS_DMASYNC_POSTWRITE);
2102 for (i = 0; i < nspecs; i++) {
2103 bus_dmamap_sync(virtio_dmat(vsc), specs[i].dmamap, 0,
2104 specs[i].bufsize, BUS_DMASYNC_POSTWRITE);
2105 }
2106 bus_dmamap_sync(virtio_dmat(vsc), ctrlq->ctrlq_status_dmamap, 0,
2107 sizeof(struct virtio_net_ctrl_status), BUS_DMASYNC_POSTREAD);
2108
2109 if (ctrlq->ctrlq_status->ack == VIRTIO_NET_OK)
2110 r = 0;
2111 else {
2112 device_printf(sc->sc_dev, "failed setting rx mode\n");
2113 sc->sc_ctrlq.ctrlq_cmd_failed.ev_count++;
2114 r = EIO;
2115 }
2116
2117 return r;
2118 }
2119
2120 static int
2121 vioif_ctrl_rx(struct vioif_softc *sc, int cmd, bool onoff)
2122 {
2123 struct virtio_net_ctrl_rx *rx = sc->sc_ctrlq.ctrlq_rx;
2124 struct vioif_ctrl_cmdspec specs[1];
2125 int r;
2126
2127 if (!sc->sc_has_ctrl)
2128 return ENOTSUP;
2129
2130 vioif_ctrl_acquire(sc);
2131
2132 rx->onoff = onoff;
2133 specs[0].dmamap = sc->sc_ctrlq.ctrlq_rx_dmamap;
2134 specs[0].buf = rx;
2135 specs[0].bufsize = sizeof(*rx);
2136
2137 r = vioif_ctrl_send_command(sc, VIRTIO_NET_CTRL_RX, cmd,
2138 specs, __arraycount(specs));
2139
2140 vioif_ctrl_release(sc);
2141 return r;
2142 }
2143
2144 static int
2145 vioif_set_promisc(struct vioif_softc *sc, bool onoff)
2146 {
2147 return vioif_ctrl_rx(sc, VIRTIO_NET_CTRL_RX_PROMISC, onoff);
2148 }
2149
2150 static int
2151 vioif_set_allmulti(struct vioif_softc *sc, bool onoff)
2152 {
2153 return vioif_ctrl_rx(sc, VIRTIO_NET_CTRL_RX_ALLMULTI, onoff);
2154 }
2155
2156 /* issue VIRTIO_NET_CTRL_MAC_TABLE_SET command and wait for completion */
2157 static int
2158 vioif_set_rx_filter(struct vioif_softc *sc)
2159 {
2160 /* filter already set in ctrlq->ctrlq_mac_tbl */
2161 struct virtio_softc *vsc = sc->sc_virtio;
2162 struct virtio_net_ctrl_mac_tbl *mac_tbl_uc, *mac_tbl_mc;
2163 struct vioif_ctrl_cmdspec specs[2];
2164 int nspecs = __arraycount(specs);
2165 int r;
2166
2167 mac_tbl_uc = sc->sc_ctrlq.ctrlq_mac_tbl_uc;
2168 mac_tbl_mc = sc->sc_ctrlq.ctrlq_mac_tbl_mc;
2169
2170 if (!sc->sc_has_ctrl)
2171 return ENOTSUP;
2172
2173 vioif_ctrl_acquire(sc);
2174
2175 specs[0].dmamap = sc->sc_ctrlq.ctrlq_tbl_uc_dmamap;
2176 specs[0].buf = mac_tbl_uc;
2177 specs[0].bufsize = sizeof(*mac_tbl_uc)
2178 + (ETHER_ADDR_LEN * virtio_rw32(vsc, mac_tbl_uc->nentries));
2179
2180 specs[1].dmamap = sc->sc_ctrlq.ctrlq_tbl_mc_dmamap;
2181 specs[1].buf = mac_tbl_mc;
2182 specs[1].bufsize = sizeof(*mac_tbl_mc)
2183 + (ETHER_ADDR_LEN * virtio_rw32(vsc, mac_tbl_mc->nentries));
2184
2185 r = vioif_ctrl_load_cmdspec(sc, specs, nspecs);
2186 if (r != 0)
2187 goto out;
2188
2189 r = vioif_ctrl_send_command(sc,
2190 VIRTIO_NET_CTRL_MAC, VIRTIO_NET_CTRL_MAC_TABLE_SET,
2191 specs, nspecs);
2192
2193 vioif_ctrl_unload_cmdspec(sc, specs, nspecs);
2194
2195 out:
2196 vioif_ctrl_release(sc);
2197
2198 return r;
2199 }
2200
2201 static int
2202 vioif_set_mac_addr(struct vioif_softc *sc)
2203 {
2204 struct virtio_net_ctrl_mac_addr *ma =
2205 sc->sc_ctrlq.ctrlq_mac_addr;
2206 struct vioif_ctrl_cmdspec specs[1];
2207 struct ifnet *ifp = &sc->sc_ethercom.ec_if;
2208 int nspecs = __arraycount(specs);
2209 uint64_t features;
2210 int r;
2211 size_t i;
2212
2213 if (!sc->sc_has_ctrl)
2214 return ENOTSUP;
2215
2216 if (memcmp(CLLADDR(ifp->if_sadl), sc->sc_mac,
2217 ETHER_ADDR_LEN) == 0) {
2218 return 0;
2219 }
2220
2221 memcpy(sc->sc_mac, CLLADDR(ifp->if_sadl), ETHER_ADDR_LEN);
2222
2223 features = virtio_features(sc->sc_virtio);
2224 if (features & VIRTIO_NET_F_CTRL_MAC_ADDR) {
2225 vioif_ctrl_acquire(sc);
2226
2227 memcpy(ma->mac, sc->sc_mac, ETHER_ADDR_LEN);
2228 specs[0].dmamap = sc->sc_ctrlq.ctrlq_mac_addr_dmamap;
2229 specs[0].buf = ma;
2230 specs[0].bufsize = sizeof(*ma);
2231
2232 r = vioif_ctrl_send_command(sc,
2233 VIRTIO_NET_CTRL_MAC, VIRTIO_NET_CTRL_MAC_ADDR_SET,
2234 specs, nspecs);
2235
2236 vioif_ctrl_release(sc);
2237 } else {
2238 for (i = 0; i < __arraycount(sc->sc_mac); i++) {
2239 virtio_write_device_config_1(sc->sc_virtio,
2240 VIRTIO_NET_CONFIG_MAC + i, sc->sc_mac[i]);
2241 }
2242 r = 0;
2243 }
2244
2245 return r;
2246 }
2247
2248 static int
2249 vioif_ctrl_mq_vq_pairs_set(struct vioif_softc *sc, int nvq_pairs)
2250 {
2251 struct virtio_net_ctrl_mq *mq = sc->sc_ctrlq.ctrlq_mq;
2252 struct vioif_ctrl_cmdspec specs[1];
2253 int r;
2254
2255 if (!sc->sc_has_ctrl)
2256 return ENOTSUP;
2257
2258 if (nvq_pairs <= 1)
2259 return EINVAL;
2260
2261 vioif_ctrl_acquire(sc);
2262
2263 mq->virtqueue_pairs = virtio_rw16(sc->sc_virtio, nvq_pairs);
2264 specs[0].dmamap = sc->sc_ctrlq.ctrlq_mq_dmamap;
2265 specs[0].buf = mq;
2266 specs[0].bufsize = sizeof(*mq);
2267
2268 r = vioif_ctrl_send_command(sc,
2269 VIRTIO_NET_CTRL_MQ, VIRTIO_NET_CTRL_MQ_VQ_PAIRS_SET,
2270 specs, __arraycount(specs));
2271
2272 vioif_ctrl_release(sc);
2273
2274 return r;
2275 }
2276
2277 /* ctrl vq interrupt; wake up the command issuer */
2278 static int
2279 vioif_ctrl_intr(void *arg)
2280 {
2281 struct vioif_ctrlqueue *ctrlq = arg;
2282 struct virtqueue *vq = ctrlq->ctrlq_vq;
2283 struct virtio_softc *vsc = vq->vq_owner;
2284 int r, slot;
2285
2286 if (virtio_vq_is_enqueued(vsc, vq) == false)
2287 return 0;
2288
2289 r = virtio_dequeue(vsc, vq, &slot, NULL);
2290 if (r == ENOENT)
2291 return 0;
2292 virtio_dequeue_commit(vsc, vq, slot);
2293
2294 mutex_enter(&ctrlq->ctrlq_wait_lock);
2295 ctrlq->ctrlq_inuse = DONE;
2296 cv_signal(&ctrlq->ctrlq_wait);
2297 mutex_exit(&ctrlq->ctrlq_wait_lock);
2298
2299 return 1;
2300 }
2301
2302 static int
2303 vioif_ifflags(struct vioif_softc *sc)
2304 {
2305 struct ifnet *ifp = &sc->sc_ethercom.ec_if;
2306 bool onoff;
2307 int r;
2308
2309 if (!sc->sc_has_ctrl) {
2310 /* no ctrl vq; always promisc and allmulti */
2311 ifp->if_flags |= (IFF_PROMISC | IFF_ALLMULTI);
2312 return 0;
2313 }
2314
2315 onoff = ifp->if_flags & IFF_ALLMULTI ? true : false;
2316 r = vioif_set_allmulti(sc, onoff);
2317 if (r != 0) {
2318 log(LOG_WARNING,
2319 "%s: couldn't %sable ALLMULTI\n",
2320 ifp->if_xname, onoff ? "en" : "dis");
2321 if (onoff == false) {
2322 ifp->if_flags |= IFF_ALLMULTI;
2323 }
2324 }
2325
2326 onoff = ifp->if_flags & IFF_PROMISC ? true : false;
2327 r = vioif_set_promisc(sc, onoff);
2328 if (r != 0) {
2329 log(LOG_WARNING,
2330 "%s: couldn't %sable PROMISC\n",
2331 ifp->if_xname, onoff ? "en" : "dis");
2332 if (onoff == false) {
2333 ifp->if_flags |= IFF_PROMISC;
2334 }
2335 }
2336
2337 return 0;
2338 }
2339
2340 static int
2341 vioif_ifflags_cb(struct ethercom *ec)
2342 {
2343 struct ifnet *ifp = &ec->ec_if;
2344 struct vioif_softc *sc = ifp->if_softc;
2345
2346 return vioif_ifflags(sc);
2347 }
2348
2349 /*
2350 * If multicast filter small enough (<=MAXENTRIES) set rx filter
2351 * If large multicast filter exist use ALLMULTI
2352 * If setting rx filter fails fall back to ALLMULTI
2353 */
2354 static int
2355 vioif_rx_filter(struct vioif_softc *sc)
2356 {
2357 struct virtio_softc *vsc = sc->sc_virtio;
2358 struct ethercom *ec = &sc->sc_ethercom;
2359 struct ifnet *ifp = &ec->ec_if;
2360 struct ether_multi *enm;
2361 struct ether_multistep step;
2362 struct vioif_ctrlqueue *ctrlq = &sc->sc_ctrlq;
2363 int nentries;
2364 bool allmulti = 0;
2365 int r;
2366
2367 if (!sc->sc_has_ctrl) {
2368 goto set_ifflags;
2369 }
2370
2371 memcpy(ctrlq->ctrlq_mac_tbl_uc->macs[0],
2372 CLLADDR(ifp->if_sadl), ETHER_ADDR_LEN);
2373
2374 nentries = 0;
2375 allmulti = false;
2376
2377 ETHER_LOCK(ec);
2378 for (ETHER_FIRST_MULTI(step, ec, enm); enm != NULL;
2379 ETHER_NEXT_MULTI(step, enm)) {
2380 if (nentries >= VIRTIO_NET_CTRL_MAC_MAXENTRIES) {
2381 allmulti = true;
2382 break;
2383 }
2384 if (memcmp(enm->enm_addrlo, enm->enm_addrhi, ETHER_ADDR_LEN)) {
2385 allmulti = true;
2386 break;
2387 }
2388
2389 memcpy(ctrlq->ctrlq_mac_tbl_mc->macs[nentries],
2390 enm->enm_addrlo, ETHER_ADDR_LEN);
2391 nentries++;
2392 }
2393 ETHER_UNLOCK(ec);
2394
2395 r = vioif_set_mac_addr(sc);
2396 if (r != 0) {
2397 log(LOG_WARNING, "%s: couldn't set MAC address\n",
2398 ifp->if_xname);
2399 }
2400
2401 if (!allmulti) {
2402 ctrlq->ctrlq_mac_tbl_uc->nentries = virtio_rw32(vsc, 1);
2403 ctrlq->ctrlq_mac_tbl_mc->nentries = virtio_rw32(vsc, nentries);
2404 r = vioif_set_rx_filter(sc);
2405 if (r != 0) {
2406 allmulti = true; /* fallback */
2407 }
2408 }
2409
2410 if (allmulti) {
2411 ctrlq->ctrlq_mac_tbl_uc->nentries = virtio_rw32(vsc, 0);
2412 ctrlq->ctrlq_mac_tbl_mc->nentries = virtio_rw32(vsc, 0);
2413 r = vioif_set_rx_filter(sc);
2414 if (r != 0) {
2415 log(LOG_DEBUG, "%s: couldn't clear RX filter\n",
2416 ifp->if_xname);
2417 /* what to do on failure? */
2418 }
2419
2420 ifp->if_flags |= IFF_ALLMULTI;
2421 }
2422
2423 set_ifflags:
2424 r = vioif_ifflags(sc);
2425
2426 return r;
2427 }
2428
2429 static int
2430 vioif_get_link_status(struct vioif_softc *sc)
2431 {
2432 struct virtio_softc *vsc = sc->sc_virtio;
2433 uint16_t status;
2434
2435 if (virtio_features(vsc) & VIRTIO_NET_F_STATUS)
2436 status = virtio_read_device_config_2(vsc,
2437 VIRTIO_NET_CONFIG_STATUS);
2438 else
2439 status = VIRTIO_NET_S_LINK_UP;
2440
2441 if ((status & VIRTIO_NET_S_LINK_UP) != 0)
2442 return LINK_STATE_UP;
2443
2444 return LINK_STATE_DOWN;
2445 }
2446
2447 /* change link status */
2448 static void
2449 vioif_update_link_status(struct vioif_softc *sc)
2450 {
2451 struct ifnet *ifp = &sc->sc_ethercom.ec_if;
2452 struct vioif_txqueue *txq;
2453 bool active;
2454 int link, i;
2455
2456 mutex_enter(&sc->sc_lock);
2457
2458 link = vioif_get_link_status(sc);
2459
2460 if (link == sc->sc_link_state)
2461 goto done;
2462
2463 sc->sc_link_state = link;
2464
2465 active = VIOIF_IS_LINK_ACTIVE(sc);
2466 for (i = 0; i < sc->sc_act_nvq_pairs; i++) {
2467 txq = &sc->sc_txq[i];
2468
2469 mutex_enter(txq->txq_lock);
2470 txq->txq_link_active = active;
2471 mutex_exit(txq->txq_lock);
2472 }
2473
2474 if_link_state_change(ifp, sc->sc_link_state);
2475
2476 done:
2477 mutex_exit(&sc->sc_lock);
2478 }
2479
2480 static int
2481 vioif_config_change(struct virtio_softc *vsc)
2482 {
2483 struct vioif_softc *sc = device_private(virtio_child(vsc));
2484
2485 softint_schedule(sc->sc_ctl_softint);
2486 return 0;
2487 }
2488
2489 static void
2490 vioif_ctl_softint(void *arg)
2491 {
2492 struct vioif_softc *sc = arg;
2493 struct ifnet *ifp = &sc->sc_ethercom.ec_if;
2494
2495 vioif_update_link_status(sc);
2496 vioif_start(ifp);
2497 }
2498
2499 static struct workqueue *
2500 vioif_workq_create(const char *name, pri_t prio, int ipl, int flags)
2501 {
2502 struct workqueue *wq;
2503 int error;
2504
2505 error = workqueue_create(&wq, name, vioif_workq_work, NULL,
2506 prio, ipl, flags);
2507
2508 if (error)
2509 return NULL;
2510
2511 return wq;
2512 }
2513
/* Destroy a workqueue obtained from vioif_workq_create(). */
static void
vioif_workq_destroy(struct workqueue *wq)
{
	workqueue_destroy(wq);
}
2520
2521 static void
2522 vioif_workq_work(struct work *wk, void *context)
2523 {
2524 struct vioif_work *work;
2525
2526 work = container_of(wk, struct vioif_work, cookie);
2527
2528 atomic_store_relaxed(&work->added, 0);
2529 work->func(work->arg);
2530 }
2531
2532 static void
2533 vioif_work_set(struct vioif_work *work, void (*func)(void *), void *arg)
2534 {
2535
2536 memset(work, 0, sizeof(*work));
2537 work->func = func;
2538 work->arg = arg;
2539 }
2540
2541 static void
2542 vioif_work_add(struct workqueue *wq, struct vioif_work *work)
2543 {
2544
2545 if (atomic_load_relaxed(&work->added) != 0)
2546 return;
2547
2548 atomic_store_relaxed(&work->added, 1);
2549 kpreempt_disable();
2550 workqueue_enqueue(wq, &work->cookie, NULL);
2551 kpreempt_enable();
2552 }
2553
2554 static void
2555 vioif_work_wait(struct workqueue *wq, struct vioif_work *work)
2556 {
2557
2558 workqueue_wait(wq, &work->cookie);
2559 }
2560
2561 static int
2562 vioif_setup_sysctl(struct vioif_softc *sc)
2563 {
2564 const char *devname;
2565 struct sysctllog **log;
2566 const struct sysctlnode *rnode, *rxnode, *txnode;
2567 int error;
2568
2569 log = &sc->sc_sysctllog;
2570 devname = device_xname(sc->sc_dev);
2571
2572 error = sysctl_createv(log, 0, NULL, &rnode,
2573 0, CTLTYPE_NODE, devname,
2574 SYSCTL_DESCR("virtio-net information and settings"),
2575 NULL, 0, NULL, 0, CTL_HW, CTL_CREATE, CTL_EOL);
2576 if (error)
2577 goto out;
2578
2579 error = sysctl_createv(log, 0, &rnode, NULL,
2580 CTLFLAG_READWRITE, CTLTYPE_BOOL, "txrx_workqueue",
2581 SYSCTL_DESCR("Use workqueue for packet processing"),
2582 NULL, 0, &sc->sc_txrx_workqueue_sysctl, 0, CTL_CREATE, CTL_EOL);
2583 if (error)
2584 goto out;
2585
2586 error = sysctl_createv(log, 0, &rnode, &rxnode,
2587 0, CTLTYPE_NODE, "rx",
2588 SYSCTL_DESCR("virtio-net information and settings for Rx"),
2589 NULL, 0, NULL, 0, CTL_CREATE, CTL_EOL);
2590 if (error)
2591 goto out;
2592
2593 error = sysctl_createv(log, 0, &rxnode, NULL,
2594 CTLFLAG_READWRITE, CTLTYPE_INT, "intr_process_limit",
2595 SYSCTL_DESCR("max number of Rx packets to process for interrupt processing"),
2596 NULL, 0, &sc->sc_rx_intr_process_limit, 0, CTL_CREATE, CTL_EOL);
2597 if (error)
2598 goto out;
2599
2600 error = sysctl_createv(log, 0, &rxnode, NULL,
2601 CTLFLAG_READWRITE, CTLTYPE_INT, "process_limit",
2602 SYSCTL_DESCR("max number of Rx packets to process for deferred processing"),
2603 NULL, 0, &sc->sc_rx_process_limit, 0, CTL_CREATE, CTL_EOL);
2604 if (error)
2605 goto out;
2606
2607 error = sysctl_createv(log, 0, &rnode, &txnode,
2608 0, CTLTYPE_NODE, "tx",
2609 SYSCTL_DESCR("virtio-net information and settings for Tx"),
2610 NULL, 0, NULL, 0, CTL_CREATE, CTL_EOL);
2611 if (error)
2612 goto out;
2613
2614 error = sysctl_createv(log, 0, &txnode, NULL,
2615 CTLFLAG_READWRITE, CTLTYPE_INT, "intr_process_limit",
2616 SYSCTL_DESCR("max number of Tx packets to process for interrupt processing"),
2617 NULL, 0, &sc->sc_tx_intr_process_limit, 0, CTL_CREATE, CTL_EOL);
2618 if (error)
2619 goto out;
2620
2621 error = sysctl_createv(log, 0, &txnode, NULL,
2622 CTLFLAG_READWRITE, CTLTYPE_INT, "process_limit",
2623 SYSCTL_DESCR("max number of Tx packets to process for deferred processing"),
2624 NULL, 0, &sc->sc_tx_process_limit, 0, CTL_CREATE, CTL_EOL);
2625
2626 out:
2627 if (error)
2628 sysctl_teardown(log);
2629
2630 return error;
2631 }
2632
2633 static void
2634 vioif_setup_stats(struct vioif_softc *sc)
2635 {
2636 struct vioif_rxqueue *rxq;
2637 struct vioif_txqueue *txq;
2638 int i;
2639
2640 for (i = 0; i < sc->sc_max_nvq_pairs; i++) {
2641 rxq = &sc->sc_rxq[i];
2642 txq = &sc->sc_txq[i];
2643
2644 snprintf(txq->txq_evgroup, sizeof(txq->txq_evgroup), "%s-TX%d",
2645 device_xname(sc->sc_dev), i);
2646 evcnt_attach_dynamic(&txq->txq_defrag_failed, EVCNT_TYPE_MISC,
2647 NULL, txq->txq_evgroup, "tx m_defrag() failed");
2648 evcnt_attach_dynamic(&txq->txq_mbuf_load_failed, EVCNT_TYPE_MISC,
2649 NULL, txq->txq_evgroup, "tx dmamap load failed");
2650 evcnt_attach_dynamic(&txq->txq_enqueue_reserve_failed, EVCNT_TYPE_MISC,
2651 NULL, txq->txq_evgroup, "virtio_enqueue_reserve failed");
2652
2653 snprintf(rxq->rxq_evgroup, sizeof(rxq->rxq_evgroup), "%s-RX%d",
2654 device_xname(sc->sc_dev), i);
2655 evcnt_attach_dynamic(&rxq->rxq_mbuf_enobufs, EVCNT_TYPE_MISC,
2656 NULL, rxq->rxq_evgroup, "no receive buffer");
2657 evcnt_attach_dynamic(&rxq->rxq_mbuf_load_failed, EVCNT_TYPE_MISC,
2658 NULL, rxq->rxq_evgroup, "tx dmamap load failed");
2659 evcnt_attach_dynamic(&rxq->rxq_enqueue_reserve_failed, EVCNT_TYPE_MISC,
2660 NULL, rxq->rxq_evgroup, "virtio_enqueue_reserve failed");
2661 }
2662
2663 evcnt_attach_dynamic(&sc->sc_ctrlq.ctrlq_cmd_load_failed, EVCNT_TYPE_MISC,
2664 NULL, device_xname(sc->sc_dev), "control command dmamap load failed");
2665 evcnt_attach_dynamic(&sc->sc_ctrlq.ctrlq_cmd_failed, EVCNT_TYPE_MISC,
2666 NULL, device_xname(sc->sc_dev), "control command failed");
2667 }
2668
/*
 * Wait until all interrupt handlers have finished, by issuing a
 * cross-call barrier.
 */
static void
vioif_intr_barrier(void)
{
	xc_barrier(0);
}
2676
2677 MODULE(MODULE_CLASS_DRIVER, if_vioif, "virtio");
2678
2679 #ifdef _MODULE
2680 #include "ioconf.c"
2681 #endif
2682
2683 static int
2684 if_vioif_modcmd(modcmd_t cmd, void *opaque)
2685 {
2686 int error = 0;
2687
2688 #ifdef _MODULE
2689 switch (cmd) {
2690 case MODULE_CMD_INIT:
2691 error = config_init_component(cfdriver_ioconf_if_vioif,
2692 cfattach_ioconf_if_vioif, cfdata_ioconf_if_vioif);
2693 break;
2694 case MODULE_CMD_FINI:
2695 error = config_fini_component(cfdriver_ioconf_if_vioif,
2696 cfattach_ioconf_if_vioif, cfdata_ioconf_if_vioif);
2697 break;
2698 default:
2699 error = ENOTTY;
2700 break;
2701 }
2702 #endif
2703
2704 return error;
2705 }
2706