ix_txrx.c revision 1.102 1 1.102 msaitoh /* $NetBSD: ix_txrx.c,v 1.102 2023/10/06 14:37:04 msaitoh Exp $ */
2 1.28 msaitoh
3 1.1 msaitoh /******************************************************************************
4 1.1 msaitoh
5 1.28 msaitoh Copyright (c) 2001-2017, Intel Corporation
6 1.1 msaitoh All rights reserved.
7 1.28 msaitoh
8 1.28 msaitoh Redistribution and use in source and binary forms, with or without
9 1.1 msaitoh modification, are permitted provided that the following conditions are met:
10 1.28 msaitoh
11 1.28 msaitoh 1. Redistributions of source code must retain the above copyright notice,
12 1.1 msaitoh this list of conditions and the following disclaimer.
13 1.28 msaitoh
14 1.28 msaitoh 2. Redistributions in binary form must reproduce the above copyright
15 1.28 msaitoh notice, this list of conditions and the following disclaimer in the
16 1.1 msaitoh documentation and/or other materials provided with the distribution.
17 1.28 msaitoh
18 1.28 msaitoh 3. Neither the name of the Intel Corporation nor the names of its
19 1.28 msaitoh contributors may be used to endorse or promote products derived from
20 1.1 msaitoh this software without specific prior written permission.
21 1.28 msaitoh
22 1.1 msaitoh THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
23 1.28 msaitoh AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
24 1.28 msaitoh IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
25 1.28 msaitoh ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
26 1.28 msaitoh LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
27 1.28 msaitoh CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
28 1.28 msaitoh SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
29 1.28 msaitoh INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
30 1.28 msaitoh CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
31 1.1 msaitoh ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
32 1.1 msaitoh POSSIBILITY OF SUCH DAMAGE.
33 1.1 msaitoh
34 1.1 msaitoh ******************************************************************************/
35 1.39 msaitoh /*$FreeBSD: head/sys/dev/ixgbe/ix_txrx.c 327031 2017-12-20 18:15:06Z erj $*/
36 1.28 msaitoh
37 1.1 msaitoh /*
38 1.1 msaitoh * Copyright (c) 2011 The NetBSD Foundation, Inc.
39 1.1 msaitoh * All rights reserved.
40 1.1 msaitoh *
41 1.1 msaitoh * This code is derived from software contributed to The NetBSD Foundation
42 1.1 msaitoh * by Coyote Point Systems, Inc.
43 1.1 msaitoh *
44 1.1 msaitoh * Redistribution and use in source and binary forms, with or without
45 1.1 msaitoh * modification, are permitted provided that the following conditions
46 1.1 msaitoh * are met:
47 1.1 msaitoh * 1. Redistributions of source code must retain the above copyright
48 1.1 msaitoh * notice, this list of conditions and the following disclaimer.
49 1.1 msaitoh * 2. Redistributions in binary form must reproduce the above copyright
50 1.1 msaitoh * notice, this list of conditions and the following disclaimer in the
51 1.1 msaitoh * documentation and/or other materials provided with the distribution.
52 1.1 msaitoh *
53 1.1 msaitoh * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
54 1.1 msaitoh * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
55 1.1 msaitoh * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
56 1.1 msaitoh * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
57 1.1 msaitoh * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
58 1.1 msaitoh * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
59 1.1 msaitoh * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
60 1.1 msaitoh * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
61 1.1 msaitoh * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
62 1.1 msaitoh * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
63 1.1 msaitoh * POSSIBILITY OF SUCH DAMAGE.
64 1.1 msaitoh */
65 1.1 msaitoh
66 1.71 msaitoh #include <sys/cdefs.h>
67 1.102 msaitoh __KERNEL_RCSID(0, "$NetBSD: ix_txrx.c,v 1.102 2023/10/06 14:37:04 msaitoh Exp $");
68 1.71 msaitoh
69 1.8 msaitoh #include "opt_inet.h"
70 1.8 msaitoh #include "opt_inet6.h"
71 1.8 msaitoh
72 1.1 msaitoh #include "ixgbe.h"
73 1.1 msaitoh
74 1.1 msaitoh /*
75 1.28 msaitoh * HW RSC control:
76 1.28 msaitoh * this feature only works with
77 1.28 msaitoh * IPv4, and only on 82599 and later.
78 1.28 msaitoh * Also this will cause IP forwarding to
79 1.28 msaitoh * fail and that can't be controlled by
80 1.28 msaitoh * the stack as LRO can. For all these
81 1.28 msaitoh * reasons I've deemed it best to leave
82 1.28 msaitoh * this off and not bother with a tuneable
83 1.28 msaitoh * interface, this would need to be compiled
84 1.28 msaitoh * to enable.
85 1.28 msaitoh */
86 1.1 msaitoh static bool ixgbe_rsc_enable = FALSE;
87 1.1 msaitoh
88 1.3 msaitoh /*
89 1.28 msaitoh * For Flow Director: this is the
90 1.28 msaitoh * number of TX packets we sample
91 1.28 msaitoh * for the filter pool, this means
92 1.28 msaitoh * every 20th packet will be probed.
93 1.28 msaitoh *
94 1.28 msaitoh * This feature can be disabled by
95 1.28 msaitoh * setting this to 0.
96 1.28 msaitoh */
97 1.3 msaitoh static int atr_sample_rate = 20;
98 1.3 msaitoh
99 1.102 msaitoh #define IXGBE_M_ADJ(sc, rxr, mp) \
100 1.102 msaitoh if (sc->max_frame_size <= (rxr->mbuf_sz - ETHER_ALIGN)) \
101 1.86 msaitoh m_adj(mp, ETHER_ALIGN)
102 1.86 msaitoh
103 1.28 msaitoh /************************************************************************
104 1.3 msaitoh * Local Function prototypes
105 1.28 msaitoh ************************************************************************/
106 1.28 msaitoh static void ixgbe_setup_transmit_ring(struct tx_ring *);
107 1.28 msaitoh static void ixgbe_free_transmit_buffers(struct tx_ring *);
108 1.28 msaitoh static int ixgbe_setup_receive_ring(struct rx_ring *);
109 1.28 msaitoh static void ixgbe_free_receive_buffers(struct rx_ring *);
110 1.28 msaitoh static void ixgbe_rx_checksum(u32, struct mbuf *, u32,
111 1.28 msaitoh struct ixgbe_hw_stats *);
112 1.28 msaitoh static void ixgbe_refresh_mbufs(struct rx_ring *, int);
113 1.38 knakahar static void ixgbe_drain(struct ifnet *, struct tx_ring *);
114 1.28 msaitoh static int ixgbe_xmit(struct tx_ring *, struct mbuf *);
115 1.28 msaitoh static int ixgbe_tx_ctx_setup(struct tx_ring *,
116 1.28 msaitoh struct mbuf *, u32 *, u32 *);
117 1.28 msaitoh static int ixgbe_tso_setup(struct tx_ring *,
118 1.28 msaitoh struct mbuf *, u32 *, u32 *);
119 1.1 msaitoh static __inline void ixgbe_rx_discard(struct rx_ring *, int);
120 1.1 msaitoh static __inline void ixgbe_rx_input(struct rx_ring *, struct ifnet *,
121 1.28 msaitoh struct mbuf *, u32);
122 1.102 msaitoh static int ixgbe_dma_malloc(struct ixgbe_softc *, bus_size_t,
123 1.28 msaitoh struct ixgbe_dma_alloc *, int);
124 1.102 msaitoh static void ixgbe_dma_free(struct ixgbe_softc *, struct ixgbe_dma_alloc *);
125 1.1 msaitoh
126 1.1 msaitoh static void ixgbe_setup_hw_rsc(struct rx_ring *);
127 1.1 msaitoh
128 1.28 msaitoh /************************************************************************
129 1.28 msaitoh * ixgbe_legacy_start_locked - Transmit entry point
130 1.1 msaitoh *
131 1.28 msaitoh * Called by the stack to initiate a transmit.
132 1.28 msaitoh * The driver will remain in this routine as long as there are
133 1.28 msaitoh * packets to transmit and transmit resources are available.
134 1.28 msaitoh * In case resources are not available, the stack is notified
135 1.28 msaitoh * and the packet is requeued.
136 1.28 msaitoh ************************************************************************/
137 1.28 msaitoh int
138 1.28 msaitoh ixgbe_legacy_start_locked(struct ifnet *ifp, struct tx_ring *txr)
139 1.1 msaitoh {
140 1.45 msaitoh int rc;
141 1.1 msaitoh struct mbuf *m_head;
142 1.102 msaitoh struct ixgbe_softc *sc = txr->sc;
143 1.1 msaitoh
144 1.1 msaitoh IXGBE_TX_LOCK_ASSERT(txr);
145 1.1 msaitoh
146 1.102 msaitoh if (sc->link_active != LINK_STATE_UP) {
147 1.38 knakahar /*
148 1.38 knakahar * discard all packets buffered in IFQ to avoid
149 1.38 knakahar * sending old packets at next link up timing.
150 1.38 knakahar */
151 1.38 knakahar ixgbe_drain(ifp, txr);
152 1.38 knakahar return (ENETDOWN);
153 1.38 knakahar }
154 1.1 msaitoh if ((ifp->if_flags & IFF_RUNNING) == 0)
155 1.28 msaitoh return (ENETDOWN);
156 1.47 msaitoh if (txr->txr_no_space)
157 1.47 msaitoh return (ENETDOWN);
158 1.58 msaitoh
159 1.1 msaitoh while (!IFQ_IS_EMPTY(&ifp->if_snd)) {
160 1.1 msaitoh if (txr->tx_avail <= IXGBE_QUEUE_MIN_FREE)
161 1.1 msaitoh break;
162 1.1 msaitoh
163 1.1 msaitoh IFQ_POLL(&ifp->if_snd, m_head);
164 1.1 msaitoh if (m_head == NULL)
165 1.1 msaitoh break;
166 1.1 msaitoh
167 1.1 msaitoh if ((rc = ixgbe_xmit(txr, m_head)) == EAGAIN) {
168 1.1 msaitoh break;
169 1.1 msaitoh }
170 1.1 msaitoh IFQ_DEQUEUE(&ifp->if_snd, m_head);
171 1.1 msaitoh if (rc != 0) {
172 1.1 msaitoh m_freem(m_head);
173 1.1 msaitoh continue;
174 1.1 msaitoh }
175 1.1 msaitoh
176 1.1 msaitoh /* Send a copy of the frame to the BPF listener */
177 1.48 msaitoh bpf_mtap(ifp, m_head, BPF_D_OUT);
178 1.1 msaitoh }
179 1.44 msaitoh
180 1.28 msaitoh return IXGBE_SUCCESS;
181 1.28 msaitoh } /* ixgbe_legacy_start_locked */
182 1.28 msaitoh
183 1.28 msaitoh /************************************************************************
184 1.28 msaitoh * ixgbe_legacy_start
185 1.28 msaitoh *
186 1.28 msaitoh * Called by the stack, this always uses the first tx ring,
187 1.28 msaitoh * and should not be used with multiqueue tx enabled.
188 1.28 msaitoh ************************************************************************/
189 1.1 msaitoh void
190 1.28 msaitoh ixgbe_legacy_start(struct ifnet *ifp)
191 1.1 msaitoh {
192 1.102 msaitoh struct ixgbe_softc *sc = ifp->if_softc;
193 1.102 msaitoh struct tx_ring *txr = sc->tx_rings;
194 1.1 msaitoh
195 1.1 msaitoh if (ifp->if_flags & IFF_RUNNING) {
196 1.1 msaitoh IXGBE_TX_LOCK(txr);
197 1.28 msaitoh ixgbe_legacy_start_locked(ifp, txr);
198 1.1 msaitoh IXGBE_TX_UNLOCK(txr);
199 1.1 msaitoh }
200 1.28 msaitoh } /* ixgbe_legacy_start */
201 1.1 msaitoh
202 1.28 msaitoh /************************************************************************
203 1.28 msaitoh * ixgbe_mq_start - Multiqueue Transmit Entry Point
204 1.28 msaitoh *
205 1.28 msaitoh * (if_transmit function)
206 1.28 msaitoh ************************************************************************/
207 1.1 msaitoh int
208 1.1 msaitoh ixgbe_mq_start(struct ifnet *ifp, struct mbuf *m)
209 1.1 msaitoh {
210 1.102 msaitoh struct ixgbe_softc *sc = ifp->if_softc;
211 1.1 msaitoh struct tx_ring *txr;
212 1.70 msaitoh int i;
213 1.28 msaitoh #ifdef RSS
214 1.1 msaitoh uint32_t bucket_id;
215 1.1 msaitoh #endif
216 1.1 msaitoh
217 1.1 msaitoh /*
218 1.1 msaitoh * When doing RSS, map it to the same outbound queue
219 1.1 msaitoh * as the incoming flow would be mapped to.
220 1.1 msaitoh *
221 1.1 msaitoh * If everything is setup correctly, it should be the
222 1.1 msaitoh * same bucket that the current CPU we're on is.
223 1.1 msaitoh */
224 1.28 msaitoh #ifdef RSS
225 1.1 msaitoh if (M_HASHTYPE_GET(m) != M_HASHTYPE_NONE) {
226 1.102 msaitoh if ((sc->feat_en & IXGBE_FEATURE_RSS) &&
227 1.28 msaitoh (rss_hash2bucket(m->m_pkthdr.flowid, M_HASHTYPE_GET(m),
228 1.28 msaitoh &bucket_id) == 0)) {
229 1.102 msaitoh i = bucket_id % sc->num_queues;
230 1.8 msaitoh #ifdef IXGBE_DEBUG
231 1.102 msaitoh if (bucket_id > sc->num_queues)
232 1.28 msaitoh if_printf(ifp,
233 1.28 msaitoh "bucket_id (%d) > num_queues (%d)\n",
234 1.102 msaitoh bucket_id, sc->num_queues);
235 1.8 msaitoh #endif
236 1.8 msaitoh } else
237 1.102 msaitoh i = m->m_pkthdr.flowid % sc->num_queues;
238 1.3 msaitoh } else
239 1.28 msaitoh #endif /* 0 */
240 1.102 msaitoh i = (cpu_index(curcpu()) % ncpu) % sc->num_queues;
241 1.3 msaitoh
242 1.3 msaitoh /* Check for a hung queue and pick alternative */
243 1.102 msaitoh if (((1ULL << i) & sc->active_queues) == 0)
244 1.102 msaitoh i = ffs64(sc->active_queues);
245 1.1 msaitoh
246 1.102 msaitoh txr = &sc->tx_rings[i];
247 1.1 msaitoh
248 1.50 msaitoh if (__predict_false(!pcq_put(txr->txr_interq, m))) {
249 1.18 msaitoh m_freem(m);
250 1.95 msaitoh IXGBE_EVC_ADD(&txr->pcq_drops, 1);
251 1.50 msaitoh return ENOBUFS;
252 1.18 msaitoh }
253 1.100 knakahar #ifdef IXGBE_ALWAYS_TXDEFER
254 1.100 knakahar kpreempt_disable();
255 1.100 knakahar softint_schedule(txr->txr_si);
256 1.100 knakahar kpreempt_enable();
257 1.100 knakahar #else
258 1.1 msaitoh if (IXGBE_TX_TRYLOCK(txr)) {
259 1.1 msaitoh ixgbe_mq_start_locked(ifp, txr);
260 1.1 msaitoh IXGBE_TX_UNLOCK(txr);
261 1.34 knakahar } else {
262 1.102 msaitoh if (sc->txrx_use_workqueue) {
263 1.44 msaitoh u_int *enqueued;
264 1.44 msaitoh
265 1.34 knakahar /*
266 1.34 knakahar * This function itself is not called in interrupt
267 1.34 knakahar * context, however it can be called in fast softint
268 1.34 knakahar * context right after receiving forwarding packets.
269 1.34 knakahar * So, it is required to protect workqueue from twice
270 1.34 knakahar * enqueuing when the machine uses both spontaneous
271 1.34 knakahar * packets and forwarding packets.
272 1.34 knakahar */
273 1.102 msaitoh enqueued = percpu_getref(sc->txr_wq_enqueued);
274 1.34 knakahar if (*enqueued == 0) {
275 1.34 knakahar *enqueued = 1;
276 1.102 msaitoh percpu_putref(sc->txr_wq_enqueued);
277 1.102 msaitoh workqueue_enqueue(sc->txr_wq,
278 1.44 msaitoh &txr->wq_cookie, curcpu());
279 1.34 knakahar } else
280 1.102 msaitoh percpu_putref(sc->txr_wq_enqueued);
281 1.56 knakahar } else {
282 1.56 knakahar kpreempt_disable();
283 1.34 knakahar softint_schedule(txr->txr_si);
284 1.56 knakahar kpreempt_enable();
285 1.56 knakahar }
286 1.34 knakahar }
287 1.100 knakahar #endif
288 1.1 msaitoh
289 1.1 msaitoh return (0);
290 1.28 msaitoh } /* ixgbe_mq_start */
291 1.1 msaitoh
292 1.28 msaitoh /************************************************************************
293 1.28 msaitoh * ixgbe_mq_start_locked
294 1.28 msaitoh ************************************************************************/
295 1.1 msaitoh int
296 1.1 msaitoh ixgbe_mq_start_locked(struct ifnet *ifp, struct tx_ring *txr)
297 1.1 msaitoh {
298 1.28 msaitoh struct mbuf *next;
299 1.28 msaitoh int enqueued = 0, err = 0;
300 1.1 msaitoh
301 1.102 msaitoh if (txr->sc->link_active != LINK_STATE_UP) {
302 1.38 knakahar /*
303 1.38 knakahar * discard all packets buffered in txr_interq to avoid
304 1.38 knakahar * sending old packets at next link up timing.
305 1.38 knakahar */
306 1.38 knakahar ixgbe_drain(ifp, txr);
307 1.38 knakahar return (ENETDOWN);
308 1.38 knakahar }
309 1.28 msaitoh if ((ifp->if_flags & IFF_RUNNING) == 0)
310 1.28 msaitoh return (ENETDOWN);
311 1.47 msaitoh if (txr->txr_no_space)
312 1.47 msaitoh return (ENETDOWN);
313 1.1 msaitoh
314 1.1 msaitoh /* Process the queue */
315 1.18 msaitoh while ((next = pcq_get(txr->txr_interq)) != NULL) {
316 1.18 msaitoh if ((err = ixgbe_xmit(txr, next)) != 0) {
317 1.18 msaitoh m_freem(next);
318 1.18 msaitoh /* All errors are counted in ixgbe_xmit() */
319 1.1 msaitoh break;
320 1.1 msaitoh }
321 1.1 msaitoh enqueued++;
322 1.3 msaitoh #if __FreeBSD_version >= 1100036
323 1.4 msaitoh /*
324 1.4 msaitoh * Since we're looking at the tx ring, we can check
325 1.99 andvar * to see if we're a VF by examining our tail register
326 1.4 msaitoh * address.
327 1.4 msaitoh */
328 1.102 msaitoh if ((txr->sc->feat_en & IXGBE_FEATURE_VF) &&
329 1.28 msaitoh (next->m_flags & M_MCAST))
330 1.3 msaitoh if_inc_counter(ifp, IFCOUNTER_OMCASTS, 1);
331 1.3 msaitoh #endif
332 1.1 msaitoh /* Send a copy of the frame to the BPF listener */
333 1.48 msaitoh bpf_mtap(ifp, next, BPF_D_OUT);
334 1.1 msaitoh if ((ifp->if_flags & IFF_RUNNING) == 0)
335 1.1 msaitoh break;
336 1.1 msaitoh }
337 1.1 msaitoh
338 1.102 msaitoh if (txr->tx_avail < IXGBE_TX_CLEANUP_THRESHOLD(txr->sc))
339 1.1 msaitoh ixgbe_txeof(txr);
340 1.1 msaitoh
341 1.1 msaitoh return (err);
342 1.28 msaitoh } /* ixgbe_mq_start_locked */
343 1.1 msaitoh
344 1.28 msaitoh /************************************************************************
345 1.28 msaitoh * ixgbe_deferred_mq_start
346 1.28 msaitoh *
347 1.34 knakahar * Called from a softint and workqueue (indirectly) to drain queued
348 1.34 knakahar * transmit packets.
349 1.28 msaitoh ************************************************************************/
350 1.1 msaitoh void
351 1.18 msaitoh ixgbe_deferred_mq_start(void *arg)
352 1.1 msaitoh {
353 1.1 msaitoh struct tx_ring *txr = arg;
354 1.102 msaitoh struct ixgbe_softc *sc = txr->sc;
355 1.102 msaitoh struct ifnet *ifp = sc->ifp;
356 1.1 msaitoh
357 1.1 msaitoh IXGBE_TX_LOCK(txr);
358 1.18 msaitoh if (pcq_peek(txr->txr_interq) != NULL)
359 1.1 msaitoh ixgbe_mq_start_locked(ifp, txr);
360 1.1 msaitoh IXGBE_TX_UNLOCK(txr);
361 1.28 msaitoh } /* ixgbe_deferred_mq_start */
362 1.3 msaitoh
363 1.28 msaitoh /************************************************************************
364 1.34 knakahar * ixgbe_deferred_mq_start_work
365 1.34 knakahar *
366 1.34 knakahar * Called from a workqueue to drain queued transmit packets.
367 1.34 knakahar ************************************************************************/
368 1.34 knakahar void
369 1.34 knakahar ixgbe_deferred_mq_start_work(struct work *wk, void *arg)
370 1.34 knakahar {
371 1.34 knakahar struct tx_ring *txr = container_of(wk, struct tx_ring, wq_cookie);
372 1.102 msaitoh struct ixgbe_softc *sc = txr->sc;
373 1.102 msaitoh u_int *enqueued = percpu_getref(sc->txr_wq_enqueued);
374 1.34 knakahar *enqueued = 0;
375 1.102 msaitoh percpu_putref(sc->txr_wq_enqueued);
376 1.34 knakahar
377 1.34 knakahar ixgbe_deferred_mq_start(txr);
378 1.34 knakahar } /* ixgbe_deferred_mq_start */
379 1.34 knakahar
380 1.38 knakahar /************************************************************************
381 1.38 knakahar * ixgbe_drain_all
382 1.38 knakahar ************************************************************************/
383 1.38 knakahar void
384 1.102 msaitoh ixgbe_drain_all(struct ixgbe_softc *sc)
385 1.38 knakahar {
386 1.102 msaitoh struct ifnet *ifp = sc->ifp;
387 1.102 msaitoh struct ix_queue *que = sc->queues;
388 1.38 knakahar
389 1.102 msaitoh for (int i = 0; i < sc->num_queues; i++, que++) {
390 1.38 knakahar struct tx_ring *txr = que->txr;
391 1.38 knakahar
392 1.38 knakahar IXGBE_TX_LOCK(txr);
393 1.38 knakahar ixgbe_drain(ifp, txr);
394 1.38 knakahar IXGBE_TX_UNLOCK(txr);
395 1.38 knakahar }
396 1.38 knakahar }
397 1.34 knakahar
398 1.34 knakahar /************************************************************************
399 1.28 msaitoh * ixgbe_xmit
400 1.1 msaitoh *
401 1.28 msaitoh * Maps the mbufs to tx descriptors, allowing the
402 1.28 msaitoh * TX engine to transmit the packets.
403 1.1 msaitoh *
404 1.28 msaitoh * Return 0 on success, positive on failure
405 1.28 msaitoh ************************************************************************/
406 1.1 msaitoh static int
407 1.1 msaitoh ixgbe_xmit(struct tx_ring *txr, struct mbuf *m_head)
408 1.1 msaitoh {
409 1.102 msaitoh struct ixgbe_softc *sc = txr->sc;
410 1.28 msaitoh struct ixgbe_tx_buf *txbuf;
411 1.1 msaitoh union ixgbe_adv_tx_desc *txd = NULL;
412 1.102 msaitoh struct ifnet *ifp = sc->ifp;
413 1.28 msaitoh int i, j, error;
414 1.28 msaitoh int first;
415 1.28 msaitoh u32 olinfo_status = 0, cmd_type_len;
416 1.28 msaitoh bool remap = TRUE;
417 1.28 msaitoh bus_dmamap_t map;
418 1.1 msaitoh
419 1.1 msaitoh /* Basic descriptor defines */
420 1.28 msaitoh cmd_type_len = (IXGBE_ADVTXD_DTYP_DATA |
421 1.1 msaitoh IXGBE_ADVTXD_DCMD_IFCS | IXGBE_ADVTXD_DCMD_DEXT);
422 1.1 msaitoh
423 1.29 knakahar if (vlan_has_tag(m_head))
424 1.28 msaitoh cmd_type_len |= IXGBE_ADVTXD_DCMD_VLE;
425 1.1 msaitoh
426 1.28 msaitoh /*
427 1.28 msaitoh * Important to capture the first descriptor
428 1.28 msaitoh * used because it will contain the index of
429 1.28 msaitoh * the one we tell the hardware to report back
430 1.28 msaitoh */
431 1.28 msaitoh first = txr->next_avail_desc;
432 1.1 msaitoh txbuf = &txr->tx_buffers[first];
433 1.1 msaitoh map = txbuf->map;
434 1.1 msaitoh
435 1.1 msaitoh /*
436 1.1 msaitoh * Map the packet for DMA.
437 1.1 msaitoh */
438 1.22 msaitoh retry:
439 1.28 msaitoh error = bus_dmamap_load_mbuf(txr->txtag->dt_dmat, map, m_head,
440 1.28 msaitoh BUS_DMA_NOWAIT);
441 1.1 msaitoh
442 1.1 msaitoh if (__predict_false(error)) {
443 1.22 msaitoh struct mbuf *m;
444 1.1 msaitoh
445 1.1 msaitoh switch (error) {
446 1.1 msaitoh case EAGAIN:
447 1.35 msaitoh txr->q_eagain_tx_dma_setup++;
448 1.1 msaitoh return EAGAIN;
449 1.1 msaitoh case ENOMEM:
450 1.35 msaitoh txr->q_enomem_tx_dma_setup++;
451 1.1 msaitoh return EAGAIN;
452 1.1 msaitoh case EFBIG:
453 1.22 msaitoh /* Try it again? - one try */
454 1.22 msaitoh if (remap == TRUE) {
455 1.22 msaitoh remap = FALSE;
456 1.22 msaitoh /*
457 1.22 msaitoh * XXX: m_defrag will choke on
458 1.22 msaitoh * non-MCLBYTES-sized clusters
459 1.22 msaitoh */
460 1.35 msaitoh txr->q_efbig_tx_dma_setup++;
461 1.22 msaitoh m = m_defrag(m_head, M_NOWAIT);
462 1.22 msaitoh if (m == NULL) {
463 1.35 msaitoh txr->q_mbuf_defrag_failed++;
464 1.22 msaitoh return ENOBUFS;
465 1.22 msaitoh }
466 1.22 msaitoh m_head = m;
467 1.22 msaitoh goto retry;
468 1.22 msaitoh } else {
469 1.35 msaitoh txr->q_efbig2_tx_dma_setup++;
470 1.22 msaitoh return error;
471 1.22 msaitoh }
472 1.1 msaitoh case EINVAL:
473 1.35 msaitoh txr->q_einval_tx_dma_setup++;
474 1.1 msaitoh return error;
475 1.1 msaitoh default:
476 1.35 msaitoh txr->q_other_tx_dma_setup++;
477 1.1 msaitoh return error;
478 1.1 msaitoh }
479 1.1 msaitoh }
480 1.1 msaitoh
481 1.1 msaitoh /* Make certain there are enough descriptors */
482 1.10 msaitoh if (txr->tx_avail < (map->dm_nsegs + 2)) {
483 1.47 msaitoh txr->txr_no_space = true;
484 1.95 msaitoh IXGBE_EVC_ADD(&txr->no_desc_avail, 1);
485 1.1 msaitoh ixgbe_dmamap_unload(txr->txtag, txbuf->map);
486 1.1 msaitoh return EAGAIN;
487 1.1 msaitoh }
488 1.1 msaitoh
489 1.1 msaitoh /*
490 1.4 msaitoh * Set up the appropriate offload context
491 1.4 msaitoh * this will consume the first descriptor
492 1.4 msaitoh */
493 1.1 msaitoh error = ixgbe_tx_ctx_setup(txr, m_head, &cmd_type_len, &olinfo_status);
494 1.1 msaitoh if (__predict_false(error)) {
495 1.1 msaitoh return (error);
496 1.1 msaitoh }
497 1.1 msaitoh
498 1.73 knakahar #ifdef IXGBE_FDIR
499 1.1 msaitoh /* Do the flow director magic */
500 1.102 msaitoh if ((sc->feat_en & IXGBE_FEATURE_FDIR) &&
501 1.102 msaitoh (txr->atr_sample) && (!sc->fdir_reinit)) {
502 1.1 msaitoh ++txr->atr_count;
503 1.1 msaitoh if (txr->atr_count >= atr_sample_rate) {
504 1.1 msaitoh ixgbe_atr(txr, m_head);
505 1.1 msaitoh txr->atr_count = 0;
506 1.1 msaitoh }
507 1.1 msaitoh }
508 1.73 knakahar #endif
509 1.1 msaitoh
510 1.8 msaitoh olinfo_status |= IXGBE_ADVTXD_CC;
511 1.1 msaitoh i = txr->next_avail_desc;
512 1.1 msaitoh for (j = 0; j < map->dm_nsegs; j++) {
513 1.1 msaitoh bus_size_t seglen;
514 1.77 msaitoh uint64_t segaddr;
515 1.1 msaitoh
516 1.1 msaitoh txbuf = &txr->tx_buffers[i];
517 1.1 msaitoh txd = &txr->tx_base[i];
518 1.1 msaitoh seglen = map->dm_segs[j].ds_len;
519 1.1 msaitoh segaddr = htole64(map->dm_segs[j].ds_addr);
520 1.1 msaitoh
521 1.1 msaitoh txd->read.buffer_addr = segaddr;
522 1.40 msaitoh txd->read.cmd_type_len = htole32(cmd_type_len | seglen);
523 1.1 msaitoh txd->read.olinfo_status = htole32(olinfo_status);
524 1.1 msaitoh
525 1.1 msaitoh if (++i == txr->num_desc)
526 1.1 msaitoh i = 0;
527 1.1 msaitoh }
528 1.1 msaitoh
529 1.28 msaitoh txd->read.cmd_type_len |= htole32(IXGBE_TXD_CMD_EOP | IXGBE_TXD_CMD_RS);
530 1.1 msaitoh txr->tx_avail -= map->dm_nsegs;
531 1.1 msaitoh txr->next_avail_desc = i;
532 1.1 msaitoh
533 1.1 msaitoh txbuf->m_head = m_head;
534 1.1 msaitoh /*
535 1.4 msaitoh * Here we swap the map so the last descriptor,
536 1.4 msaitoh * which gets the completion interrupt has the
537 1.4 msaitoh * real map, and the first descriptor gets the
538 1.4 msaitoh * unused map from this descriptor.
539 1.4 msaitoh */
540 1.1 msaitoh txr->tx_buffers[first].map = txbuf->map;
541 1.1 msaitoh txbuf->map = map;
542 1.1 msaitoh bus_dmamap_sync(txr->txtag->dt_dmat, map, 0, m_head->m_pkthdr.len,
543 1.1 msaitoh BUS_DMASYNC_PREWRITE);
544 1.1 msaitoh
545 1.28 msaitoh /* Set the EOP descriptor that will be marked done */
546 1.28 msaitoh txbuf = &txr->tx_buffers[first];
547 1.1 msaitoh txbuf->eop = txd;
548 1.1 msaitoh
549 1.28 msaitoh ixgbe_dmamap_sync(txr->txdma.dma_tag, txr->txdma.dma_map,
550 1.1 msaitoh BUS_DMASYNC_PREREAD | BUS_DMASYNC_PREWRITE);
551 1.1 msaitoh /*
552 1.1 msaitoh * Advance the Transmit Descriptor Tail (Tdt), this tells the
553 1.1 msaitoh * hardware that this frame is available to transmit.
554 1.1 msaitoh */
555 1.95 msaitoh IXGBE_EVC_ADD(&txr->total_packets, 1);
556 1.102 msaitoh IXGBE_WRITE_REG(&sc->hw, txr->tail, i);
557 1.3 msaitoh
558 1.61 thorpej net_stat_ref_t nsr = IF_STAT_GETREF(ifp);
559 1.61 thorpej if_statadd_ref(nsr, if_obytes, m_head->m_pkthdr.len);
560 1.23 msaitoh if (m_head->m_flags & M_MCAST)
561 1.61 thorpej if_statinc_ref(nsr, if_omcasts);
562 1.61 thorpej IF_STAT_PUTREF(ifp);
563 1.23 msaitoh
564 1.45 msaitoh /* Mark queue as having work */
565 1.45 msaitoh if (txr->busy == 0)
566 1.45 msaitoh txr->busy = 1;
567 1.45 msaitoh
568 1.28 msaitoh return (0);
569 1.28 msaitoh } /* ixgbe_xmit */
570 1.1 msaitoh
571 1.38 knakahar /************************************************************************
572 1.38 knakahar * ixgbe_drain
573 1.38 knakahar ************************************************************************/
574 1.38 knakahar static void
575 1.38 knakahar ixgbe_drain(struct ifnet *ifp, struct tx_ring *txr)
576 1.38 knakahar {
577 1.38 knakahar struct mbuf *m;
578 1.38 knakahar
579 1.38 knakahar IXGBE_TX_LOCK_ASSERT(txr);
580 1.38 knakahar
581 1.38 knakahar if (txr->me == 0) {
582 1.38 knakahar while (!IFQ_IS_EMPTY(&ifp->if_snd)) {
583 1.38 knakahar IFQ_DEQUEUE(&ifp->if_snd, m);
584 1.38 knakahar m_freem(m);
585 1.38 knakahar IF_DROP(&ifp->if_snd);
586 1.38 knakahar }
587 1.38 knakahar }
588 1.38 knakahar
589 1.38 knakahar while ((m = pcq_get(txr->txr_interq)) != NULL) {
590 1.38 knakahar m_freem(m);
591 1.95 msaitoh IXGBE_EVC_ADD(&txr->pcq_drops, 1);
592 1.38 knakahar }
593 1.38 knakahar }
594 1.16 msaitoh
595 1.28 msaitoh /************************************************************************
596 1.28 msaitoh * ixgbe_allocate_transmit_buffers
597 1.1 msaitoh *
598 1.28 msaitoh * Allocate memory for tx_buffer structures. The tx_buffer stores all
599 1.28 msaitoh * the information needed to transmit a packet on the wire. This is
600 1.28 msaitoh * called only once at attach, setup is done every reset.
601 1.28 msaitoh ************************************************************************/
602 1.28 msaitoh static int
603 1.1 msaitoh ixgbe_allocate_transmit_buffers(struct tx_ring *txr)
604 1.1 msaitoh {
605 1.102 msaitoh struct ixgbe_softc *sc = txr->sc;
606 1.102 msaitoh device_t dev = sc->dev;
607 1.1 msaitoh struct ixgbe_tx_buf *txbuf;
608 1.28 msaitoh int error, i;
609 1.1 msaitoh
610 1.1 msaitoh /*
611 1.1 msaitoh * Setup DMA descriptor areas.
612 1.1 msaitoh */
613 1.28 msaitoh error = ixgbe_dma_tag_create(
614 1.102 msaitoh /* parent */ sc->osdep.dmat,
615 1.28 msaitoh /* alignment */ 1,
616 1.28 msaitoh /* bounds */ 0,
617 1.28 msaitoh /* maxsize */ IXGBE_TSO_SIZE,
618 1.102 msaitoh /* nsegments */ sc->num_segs,
619 1.28 msaitoh /* maxsegsize */ PAGE_SIZE,
620 1.28 msaitoh /* flags */ 0,
621 1.28 msaitoh &txr->txtag);
622 1.28 msaitoh if (error != 0) {
623 1.1 msaitoh aprint_error_dev(dev,"Unable to allocate TX DMA tag\n");
624 1.1 msaitoh goto fail;
625 1.1 msaitoh }
626 1.1 msaitoh
627 1.57 chs txr->tx_buffers = malloc(sizeof(struct ixgbe_tx_buf) *
628 1.102 msaitoh sc->num_tx_desc, M_DEVBUF, M_WAITOK | M_ZERO);
629 1.1 msaitoh
630 1.28 msaitoh /* Create the descriptor buffer dma maps */
631 1.1 msaitoh txbuf = txr->tx_buffers;
632 1.102 msaitoh for (i = 0; i < sc->num_tx_desc; i++, txbuf++) {
633 1.1 msaitoh error = ixgbe_dmamap_create(txr->txtag, 0, &txbuf->map);
634 1.1 msaitoh if (error != 0) {
635 1.1 msaitoh aprint_error_dev(dev,
636 1.1 msaitoh "Unable to create TX DMA map (%d)\n", error);
637 1.1 msaitoh goto fail;
638 1.1 msaitoh }
639 1.1 msaitoh }
640 1.1 msaitoh
641 1.1 msaitoh return 0;
642 1.1 msaitoh fail:
643 1.1 msaitoh /* We free all, it handles case where we are in the middle */
644 1.15 msaitoh #if 0 /* XXX was FreeBSD */
645 1.102 msaitoh ixgbe_free_transmit_structures(sc);
646 1.15 msaitoh #else
647 1.15 msaitoh ixgbe_free_transmit_buffers(txr);
648 1.15 msaitoh #endif
649 1.1 msaitoh return (error);
650 1.28 msaitoh } /* ixgbe_allocate_transmit_buffers */
651 1.1 msaitoh
652 1.28 msaitoh /************************************************************************
653 1.28 msaitoh * ixgbe_setup_transmit_ring - Initialize a transmit ring.
654 1.28 msaitoh ************************************************************************/
655 1.1 msaitoh static void
656 1.1 msaitoh ixgbe_setup_transmit_ring(struct tx_ring *txr)
657 1.1 msaitoh {
658 1.102 msaitoh struct ixgbe_softc *sc = txr->sc;
659 1.28 msaitoh struct ixgbe_tx_buf *txbuf;
660 1.1 msaitoh #ifdef DEV_NETMAP
661 1.102 msaitoh struct netmap_sc *na = NA(sc->ifp);
662 1.28 msaitoh struct netmap_slot *slot;
663 1.1 msaitoh #endif /* DEV_NETMAP */
664 1.1 msaitoh
665 1.1 msaitoh /* Clear the old ring contents */
666 1.1 msaitoh IXGBE_TX_LOCK(txr);
667 1.28 msaitoh
668 1.1 msaitoh #ifdef DEV_NETMAP
669 1.102 msaitoh if (sc->feat_en & IXGBE_FEATURE_NETMAP) {
670 1.28 msaitoh /*
671 1.28 msaitoh * (under lock): if in netmap mode, do some consistency
672 1.28 msaitoh * checks and set slot to entry 0 of the netmap ring.
673 1.28 msaitoh */
674 1.28 msaitoh slot = netmap_reset(na, NR_TX, txr->me, 0);
675 1.28 msaitoh }
676 1.1 msaitoh #endif /* DEV_NETMAP */
677 1.28 msaitoh
678 1.1 msaitoh bzero((void *)txr->tx_base,
679 1.102 msaitoh (sizeof(union ixgbe_adv_tx_desc)) * sc->num_tx_desc);
680 1.1 msaitoh /* Reset indices */
681 1.1 msaitoh txr->next_avail_desc = 0;
682 1.1 msaitoh txr->next_to_clean = 0;
683 1.1 msaitoh
684 1.1 msaitoh /* Free any existing tx buffers. */
685 1.28 msaitoh txbuf = txr->tx_buffers;
686 1.5 msaitoh for (int i = 0; i < txr->num_desc; i++, txbuf++) {
687 1.1 msaitoh if (txbuf->m_head != NULL) {
688 1.1 msaitoh bus_dmamap_sync(txr->txtag->dt_dmat, txbuf->map,
689 1.1 msaitoh 0, txbuf->m_head->m_pkthdr.len,
690 1.1 msaitoh BUS_DMASYNC_POSTWRITE);
691 1.1 msaitoh ixgbe_dmamap_unload(txr->txtag, txbuf->map);
692 1.1 msaitoh m_freem(txbuf->m_head);
693 1.1 msaitoh txbuf->m_head = NULL;
694 1.1 msaitoh }
695 1.28 msaitoh
696 1.1 msaitoh #ifdef DEV_NETMAP
697 1.1 msaitoh /*
698 1.1 msaitoh * In netmap mode, set the map for the packet buffer.
699 1.1 msaitoh * NOTE: Some drivers (not this one) also need to set
700 1.1 msaitoh * the physical buffer address in the NIC ring.
701 1.1 msaitoh * Slots in the netmap ring (indexed by "si") are
702 1.1 msaitoh * kring->nkr_hwofs positions "ahead" wrt the
703 1.1 msaitoh * corresponding slot in the NIC ring. In some drivers
704 1.1 msaitoh * (not here) nkr_hwofs can be negative. Function
705 1.1 msaitoh * netmap_idx_n2k() handles wraparounds properly.
706 1.1 msaitoh */
707 1.102 msaitoh if ((sc->feat_en & IXGBE_FEATURE_NETMAP) && slot) {
708 1.53 msaitoh int si = netmap_idx_n2k(na->tx_rings[txr->me], i);
709 1.5 msaitoh netmap_load_map(na, txr->txtag,
710 1.5 msaitoh txbuf->map, NMB(na, slot + si));
711 1.1 msaitoh }
712 1.1 msaitoh #endif /* DEV_NETMAP */
713 1.28 msaitoh
714 1.1 msaitoh /* Clear the EOP descriptor pointer */
715 1.1 msaitoh txbuf->eop = NULL;
716 1.28 msaitoh }
717 1.1 msaitoh
718 1.1 msaitoh /* Set the rate at which we sample packets */
719 1.102 msaitoh if (sc->feat_en & IXGBE_FEATURE_FDIR)
720 1.1 msaitoh txr->atr_sample = atr_sample_rate;
721 1.1 msaitoh
722 1.1 msaitoh /* Set number of descriptors available */
723 1.102 msaitoh txr->tx_avail = sc->num_tx_desc;
724 1.1 msaitoh
725 1.1 msaitoh ixgbe_dmamap_sync(txr->txdma.dma_tag, txr->txdma.dma_map,
726 1.1 msaitoh BUS_DMASYNC_PREREAD | BUS_DMASYNC_PREWRITE);
727 1.1 msaitoh IXGBE_TX_UNLOCK(txr);
728 1.28 msaitoh } /* ixgbe_setup_transmit_ring */
729 1.1 msaitoh
730 1.28 msaitoh /************************************************************************
731 1.28 msaitoh * ixgbe_setup_transmit_structures - Initialize all transmit rings.
732 1.28 msaitoh ************************************************************************/
733 1.1 msaitoh int
734 1.102 msaitoh ixgbe_setup_transmit_structures(struct ixgbe_softc *sc)
735 1.1 msaitoh {
736 1.102 msaitoh struct tx_ring *txr = sc->tx_rings;
737 1.1 msaitoh
738 1.102 msaitoh for (int i = 0; i < sc->num_queues; i++, txr++)
739 1.1 msaitoh ixgbe_setup_transmit_ring(txr);
740 1.1 msaitoh
741 1.1 msaitoh return (0);
742 1.28 msaitoh } /* ixgbe_setup_transmit_structures */
743 1.1 msaitoh
744 1.28 msaitoh /************************************************************************
745 1.28 msaitoh * ixgbe_free_transmit_structures - Free all transmit rings.
746 1.28 msaitoh ************************************************************************/
747 1.1 msaitoh void
748 1.102 msaitoh ixgbe_free_transmit_structures(struct ixgbe_softc *sc)
749 1.1 msaitoh {
750 1.102 msaitoh struct tx_ring *txr = sc->tx_rings;
751 1.1 msaitoh
752 1.102 msaitoh for (int i = 0; i < sc->num_queues; i++, txr++) {
753 1.1 msaitoh ixgbe_free_transmit_buffers(txr);
754 1.102 msaitoh ixgbe_dma_free(sc, &txr->txdma);
755 1.1 msaitoh IXGBE_TX_LOCK_DESTROY(txr);
756 1.1 msaitoh }
757 1.102 msaitoh free(sc->tx_rings, M_DEVBUF);
758 1.28 msaitoh } /* ixgbe_free_transmit_structures */
759 1.1 msaitoh
760 1.28 msaitoh /************************************************************************
761 1.28 msaitoh * ixgbe_free_transmit_buffers
762 1.1 msaitoh *
763 1.28 msaitoh * Free transmit ring related data structures.
764 1.28 msaitoh ************************************************************************/
765 1.1 msaitoh static void
766 1.1 msaitoh ixgbe_free_transmit_buffers(struct tx_ring *txr)
767 1.1 msaitoh {
768 1.102 msaitoh struct ixgbe_softc *sc = txr->sc;
769 1.1 msaitoh struct ixgbe_tx_buf *tx_buffer;
770 1.28 msaitoh int i;
771 1.1 msaitoh
772 1.14 msaitoh INIT_DEBUGOUT("ixgbe_free_transmit_buffers: begin");
773 1.1 msaitoh
774 1.1 msaitoh if (txr->tx_buffers == NULL)
775 1.1 msaitoh return;
776 1.1 msaitoh
777 1.1 msaitoh tx_buffer = txr->tx_buffers;
778 1.102 msaitoh for (i = 0; i < sc->num_tx_desc; i++, tx_buffer++) {
779 1.1 msaitoh if (tx_buffer->m_head != NULL) {
780 1.1 msaitoh bus_dmamap_sync(txr->txtag->dt_dmat, tx_buffer->map,
781 1.1 msaitoh 0, tx_buffer->m_head->m_pkthdr.len,
782 1.1 msaitoh BUS_DMASYNC_POSTWRITE);
783 1.1 msaitoh ixgbe_dmamap_unload(txr->txtag, tx_buffer->map);
784 1.1 msaitoh m_freem(tx_buffer->m_head);
785 1.1 msaitoh tx_buffer->m_head = NULL;
786 1.1 msaitoh if (tx_buffer->map != NULL) {
787 1.1 msaitoh ixgbe_dmamap_destroy(txr->txtag,
788 1.1 msaitoh tx_buffer->map);
789 1.1 msaitoh tx_buffer->map = NULL;
790 1.1 msaitoh }
791 1.1 msaitoh } else if (tx_buffer->map != NULL) {
792 1.1 msaitoh ixgbe_dmamap_unload(txr->txtag, tx_buffer->map);
793 1.1 msaitoh ixgbe_dmamap_destroy(txr->txtag, tx_buffer->map);
794 1.1 msaitoh tx_buffer->map = NULL;
795 1.1 msaitoh }
796 1.1 msaitoh }
797 1.18 msaitoh if (txr->txr_interq != NULL) {
798 1.18 msaitoh struct mbuf *m;
799 1.18 msaitoh
800 1.18 msaitoh while ((m = pcq_get(txr->txr_interq)) != NULL)
801 1.18 msaitoh m_freem(m);
802 1.18 msaitoh pcq_destroy(txr->txr_interq);
803 1.18 msaitoh }
804 1.1 msaitoh if (txr->tx_buffers != NULL) {
805 1.1 msaitoh free(txr->tx_buffers, M_DEVBUF);
806 1.1 msaitoh txr->tx_buffers = NULL;
807 1.1 msaitoh }
808 1.1 msaitoh if (txr->txtag != NULL) {
809 1.1 msaitoh ixgbe_dma_tag_destroy(txr->txtag);
810 1.1 msaitoh txr->txtag = NULL;
811 1.1 msaitoh }
812 1.28 msaitoh } /* ixgbe_free_transmit_buffers */
813 1.1 msaitoh
814 1.28 msaitoh /************************************************************************
815 1.28 msaitoh * ixgbe_tx_ctx_setup
816 1.1 msaitoh *
817 1.28 msaitoh * Advanced Context Descriptor setup for VLAN, CSUM or TSO
818 1.28 msaitoh ************************************************************************/
819 1.1 msaitoh static int
820 1.1 msaitoh ixgbe_tx_ctx_setup(struct tx_ring *txr, struct mbuf *mp,
821 1.1 msaitoh u32 *cmd_type_len, u32 *olinfo_status)
822 1.1 msaitoh {
823 1.102 msaitoh struct ixgbe_softc *sc = txr->sc;
824 1.1 msaitoh struct ixgbe_adv_tx_context_desc *TXD;
825 1.28 msaitoh struct ether_vlan_header *eh;
826 1.8 msaitoh #ifdef INET
827 1.28 msaitoh struct ip *ip;
828 1.8 msaitoh #endif
829 1.8 msaitoh #ifdef INET6
830 1.28 msaitoh struct ip6_hdr *ip6;
831 1.8 msaitoh #endif
832 1.28 msaitoh int ehdrlen, ip_hlen = 0;
833 1.28 msaitoh int offload = TRUE;
834 1.28 msaitoh int ctxd = txr->next_avail_desc;
835 1.28 msaitoh u32 vlan_macip_lens = 0;
836 1.28 msaitoh u32 type_tucmd_mlhl = 0;
837 1.28 msaitoh u16 vtag = 0;
838 1.28 msaitoh u16 etype;
839 1.28 msaitoh u8 ipproto = 0;
840 1.28 msaitoh char *l3d;
841 1.8 msaitoh
842 1.1 msaitoh
843 1.1 msaitoh /* First check if TSO is to be used */
844 1.28 msaitoh if (mp->m_pkthdr.csum_flags & (M_CSUM_TSOv4 | M_CSUM_TSOv6)) {
845 1.17 msaitoh int rv = ixgbe_tso_setup(txr, mp, cmd_type_len, olinfo_status);
846 1.17 msaitoh
847 1.21 msaitoh if (rv != 0)
848 1.102 msaitoh IXGBE_EVC_ADD(&sc->tso_err, 1);
849 1.21 msaitoh return rv;
850 1.17 msaitoh }
851 1.1 msaitoh
852 1.1 msaitoh if ((mp->m_pkthdr.csum_flags & M_CSUM_OFFLOAD) == 0)
853 1.1 msaitoh offload = FALSE;
854 1.1 msaitoh
855 1.1 msaitoh /* Indicate the whole packet as payload when not doing TSO */
856 1.28 msaitoh *olinfo_status |= mp->m_pkthdr.len << IXGBE_ADVTXD_PAYLEN_SHIFT;
857 1.1 msaitoh
858 1.1 msaitoh /* Now ready a context descriptor */
859 1.28 msaitoh TXD = (struct ixgbe_adv_tx_context_desc *)&txr->tx_base[ctxd];
860 1.1 msaitoh
861 1.1 msaitoh /*
862 1.28 msaitoh * In advanced descriptors the vlan tag must
863 1.28 msaitoh * be placed into the context descriptor. Hence
864 1.28 msaitoh * we need to make one even if not doing offloads.
865 1.28 msaitoh */
866 1.29 knakahar if (vlan_has_tag(mp)) {
867 1.29 knakahar vtag = htole16(vlan_get_tag(mp));
868 1.1 msaitoh vlan_macip_lens |= (vtag << IXGBE_ADVTXD_VLAN_SHIFT);
869 1.102 msaitoh } else if (!(txr->sc->feat_en & IXGBE_FEATURE_NEEDS_CTXD) &&
870 1.28 msaitoh (offload == FALSE))
871 1.4 msaitoh return (0);
872 1.1 msaitoh
873 1.1 msaitoh /*
874 1.1 msaitoh * Determine where frame payload starts.
875 1.1 msaitoh * Jump over vlan headers if already present,
876 1.1 msaitoh * helpful for QinQ too.
877 1.1 msaitoh */
878 1.1 msaitoh KASSERT(mp->m_len >= offsetof(struct ether_vlan_header, evl_tag));
879 1.1 msaitoh eh = mtod(mp, struct ether_vlan_header *);
880 1.1 msaitoh if (eh->evl_encap_proto == htons(ETHERTYPE_VLAN)) {
881 1.1 msaitoh KASSERT(mp->m_len >= sizeof(struct ether_vlan_header));
882 1.1 msaitoh etype = ntohs(eh->evl_proto);
883 1.1 msaitoh ehdrlen = ETHER_HDR_LEN + ETHER_VLAN_ENCAP_LEN;
884 1.1 msaitoh } else {
885 1.1 msaitoh etype = ntohs(eh->evl_encap_proto);
886 1.1 msaitoh ehdrlen = ETHER_HDR_LEN;
887 1.1 msaitoh }
888 1.1 msaitoh
889 1.1 msaitoh /* Set the ether header length */
890 1.1 msaitoh vlan_macip_lens |= ehdrlen << IXGBE_ADVTXD_MACLEN_SHIFT;
891 1.1 msaitoh
892 1.3 msaitoh if (offload == FALSE)
893 1.3 msaitoh goto no_offloads;
894 1.3 msaitoh
895 1.8 msaitoh /*
896 1.28 msaitoh * If the first mbuf only includes the ethernet header,
897 1.28 msaitoh * jump to the next one
898 1.28 msaitoh * XXX: This assumes the stack splits mbufs containing headers
899 1.28 msaitoh * on header boundaries
900 1.8 msaitoh * XXX: And assumes the entire IP header is contained in one mbuf
901 1.8 msaitoh */
902 1.8 msaitoh if (mp->m_len == ehdrlen && mp->m_next)
903 1.8 msaitoh l3d = mtod(mp->m_next, char *);
904 1.8 msaitoh else
905 1.8 msaitoh l3d = mtod(mp, char *) + ehdrlen;
906 1.8 msaitoh
907 1.1 msaitoh switch (etype) {
908 1.9 msaitoh #ifdef INET
909 1.1 msaitoh case ETHERTYPE_IP:
910 1.8 msaitoh ip = (struct ip *)(l3d);
911 1.8 msaitoh ip_hlen = ip->ip_hl << 2;
912 1.8 msaitoh ipproto = ip->ip_p;
913 1.8 msaitoh type_tucmd_mlhl |= IXGBE_ADVTXD_TUCMD_IPV4;
914 1.1 msaitoh KASSERT((mp->m_pkthdr.csum_flags & M_CSUM_IPv4) == 0 ||
915 1.8 msaitoh ip->ip_sum == 0);
916 1.1 msaitoh break;
917 1.9 msaitoh #endif
918 1.9 msaitoh #ifdef INET6
919 1.1 msaitoh case ETHERTYPE_IPV6:
920 1.8 msaitoh ip6 = (struct ip6_hdr *)(l3d);
921 1.8 msaitoh ip_hlen = sizeof(struct ip6_hdr);
922 1.8 msaitoh ipproto = ip6->ip6_nxt;
923 1.1 msaitoh type_tucmd_mlhl |= IXGBE_ADVTXD_TUCMD_IPV6;
924 1.1 msaitoh break;
925 1.9 msaitoh #endif
926 1.1 msaitoh default:
927 1.11 msaitoh offload = false;
928 1.1 msaitoh break;
929 1.1 msaitoh }
930 1.1 msaitoh
931 1.1 msaitoh if ((mp->m_pkthdr.csum_flags & M_CSUM_IPv4) != 0)
932 1.1 msaitoh *olinfo_status |= IXGBE_TXD_POPTS_IXSM << 8;
933 1.1 msaitoh
934 1.1 msaitoh vlan_macip_lens |= ip_hlen;
935 1.1 msaitoh
936 1.8 msaitoh /* No support for offloads for non-L4 next headers */
937 1.63 msaitoh switch (ipproto) {
938 1.36 msaitoh case IPPROTO_TCP:
939 1.36 msaitoh if (mp->m_pkthdr.csum_flags &
940 1.36 msaitoh (M_CSUM_TCPv4 | M_CSUM_TCPv6))
941 1.36 msaitoh type_tucmd_mlhl |= IXGBE_ADVTXD_TUCMD_L4T_TCP;
942 1.36 msaitoh else
943 1.36 msaitoh offload = false;
944 1.36 msaitoh break;
945 1.36 msaitoh case IPPROTO_UDP:
946 1.36 msaitoh if (mp->m_pkthdr.csum_flags &
947 1.36 msaitoh (M_CSUM_UDPv4 | M_CSUM_UDPv6))
948 1.36 msaitoh type_tucmd_mlhl |= IXGBE_ADVTXD_TUCMD_L4T_UDP;
949 1.36 msaitoh else
950 1.11 msaitoh offload = false;
951 1.36 msaitoh break;
952 1.36 msaitoh default:
953 1.36 msaitoh offload = false;
954 1.36 msaitoh break;
955 1.8 msaitoh }
956 1.8 msaitoh
957 1.8 msaitoh if (offload) /* Insert L4 checksum into data descriptors */
958 1.1 msaitoh *olinfo_status |= IXGBE_TXD_POPTS_TXSM << 8;
959 1.1 msaitoh
960 1.3 msaitoh no_offloads:
961 1.3 msaitoh type_tucmd_mlhl |= IXGBE_ADVTXD_DCMD_DEXT | IXGBE_ADVTXD_DTYP_CTXT;
962 1.3 msaitoh
963 1.1 msaitoh /* Now copy bits into descriptor */
964 1.1 msaitoh TXD->vlan_macip_lens = htole32(vlan_macip_lens);
965 1.1 msaitoh TXD->type_tucmd_mlhl = htole32(type_tucmd_mlhl);
966 1.1 msaitoh TXD->seqnum_seed = htole32(0);
967 1.1 msaitoh TXD->mss_l4len_idx = htole32(0);
968 1.1 msaitoh
969 1.1 msaitoh /* We've consumed the first desc, adjust counters */
970 1.1 msaitoh if (++ctxd == txr->num_desc)
971 1.1 msaitoh ctxd = 0;
972 1.1 msaitoh txr->next_avail_desc = ctxd;
973 1.1 msaitoh --txr->tx_avail;
974 1.1 msaitoh
975 1.28 msaitoh return (0);
976 1.28 msaitoh } /* ixgbe_tx_ctx_setup */
977 1.1 msaitoh
978 1.28 msaitoh /************************************************************************
979 1.28 msaitoh * ixgbe_tso_setup
980 1.1 msaitoh *
981 1.28 msaitoh * Setup work for hardware segmentation offload (TSO) on
982 1.28 msaitoh * adapters using advanced tx descriptors
983 1.28 msaitoh ************************************************************************/
984 1.1 msaitoh static int
985 1.28 msaitoh ixgbe_tso_setup(struct tx_ring *txr, struct mbuf *mp, u32 *cmd_type_len,
986 1.28 msaitoh u32 *olinfo_status)
987 1.1 msaitoh {
988 1.1 msaitoh struct ixgbe_adv_tx_context_desc *TXD;
989 1.28 msaitoh struct ether_vlan_header *eh;
990 1.1 msaitoh #ifdef INET6
991 1.28 msaitoh struct ip6_hdr *ip6;
992 1.1 msaitoh #endif
993 1.1 msaitoh #ifdef INET
994 1.28 msaitoh struct ip *ip;
995 1.1 msaitoh #endif
996 1.28 msaitoh struct tcphdr *th;
997 1.28 msaitoh int ctxd, ehdrlen, ip_hlen, tcp_hlen;
998 1.28 msaitoh u32 vlan_macip_lens = 0;
999 1.28 msaitoh u32 type_tucmd_mlhl = 0;
1000 1.28 msaitoh u32 mss_l4len_idx = 0, paylen;
1001 1.28 msaitoh u16 vtag = 0, eh_type;
1002 1.1 msaitoh
1003 1.1 msaitoh /*
1004 1.1 msaitoh * Determine where frame payload starts.
1005 1.1 msaitoh * Jump over vlan headers if already present
1006 1.1 msaitoh */
1007 1.1 msaitoh eh = mtod(mp, struct ether_vlan_header *);
1008 1.1 msaitoh if (eh->evl_encap_proto == htons(ETHERTYPE_VLAN)) {
1009 1.1 msaitoh ehdrlen = ETHER_HDR_LEN + ETHER_VLAN_ENCAP_LEN;
1010 1.1 msaitoh eh_type = eh->evl_proto;
1011 1.1 msaitoh } else {
1012 1.1 msaitoh ehdrlen = ETHER_HDR_LEN;
1013 1.1 msaitoh eh_type = eh->evl_encap_proto;
1014 1.1 msaitoh }
1015 1.1 msaitoh
1016 1.1 msaitoh switch (ntohs(eh_type)) {
1017 1.1 msaitoh #ifdef INET
1018 1.1 msaitoh case ETHERTYPE_IP:
1019 1.1 msaitoh ip = (struct ip *)(mp->m_data + ehdrlen);
1020 1.1 msaitoh if (ip->ip_p != IPPROTO_TCP)
1021 1.1 msaitoh return (ENXIO);
1022 1.1 msaitoh ip->ip_sum = 0;
1023 1.1 msaitoh ip_hlen = ip->ip_hl << 2;
1024 1.1 msaitoh th = (struct tcphdr *)((char *)ip + ip_hlen);
1025 1.1 msaitoh th->th_sum = in_cksum_phdr(ip->ip_src.s_addr,
1026 1.1 msaitoh ip->ip_dst.s_addr, htons(IPPROTO_TCP));
1027 1.1 msaitoh type_tucmd_mlhl |= IXGBE_ADVTXD_TUCMD_IPV4;
1028 1.1 msaitoh /* Tell transmit desc to also do IPv4 checksum. */
1029 1.1 msaitoh *olinfo_status |= IXGBE_TXD_POPTS_IXSM << 8;
1030 1.1 msaitoh break;
1031 1.1 msaitoh #endif
1032 1.28 msaitoh #ifdef INET6
1033 1.28 msaitoh case ETHERTYPE_IPV6:
1034 1.28 msaitoh ip6 = (struct ip6_hdr *)(mp->m_data + ehdrlen);
1035 1.28 msaitoh /* XXX-BZ For now we do not pretend to support ext. hdrs. */
1036 1.28 msaitoh if (ip6->ip6_nxt != IPPROTO_TCP)
1037 1.28 msaitoh return (ENXIO);
1038 1.28 msaitoh ip_hlen = sizeof(struct ip6_hdr);
1039 1.28 msaitoh ip6 = (struct ip6_hdr *)(mp->m_data + ehdrlen);
1040 1.28 msaitoh th = (struct tcphdr *)((char *)ip6 + ip_hlen);
1041 1.28 msaitoh th->th_sum = in6_cksum_phdr(&ip6->ip6_src,
1042 1.28 msaitoh &ip6->ip6_dst, 0, htonl(IPPROTO_TCP));
1043 1.28 msaitoh type_tucmd_mlhl |= IXGBE_ADVTXD_TUCMD_IPV6;
1044 1.28 msaitoh break;
1045 1.28 msaitoh #endif
1046 1.1 msaitoh default:
1047 1.1 msaitoh panic("%s: CSUM_TSO but no supported IP version (0x%04x)",
1048 1.1 msaitoh __func__, ntohs(eh_type));
1049 1.1 msaitoh break;
1050 1.1 msaitoh }
1051 1.1 msaitoh
1052 1.1 msaitoh ctxd = txr->next_avail_desc;
1053 1.28 msaitoh TXD = (struct ixgbe_adv_tx_context_desc *)&txr->tx_base[ctxd];
1054 1.1 msaitoh
1055 1.1 msaitoh tcp_hlen = th->th_off << 2;
1056 1.1 msaitoh
1057 1.1 msaitoh /* This is used in the transmit desc in encap */
1058 1.1 msaitoh paylen = mp->m_pkthdr.len - ehdrlen - ip_hlen - tcp_hlen;
1059 1.1 msaitoh
1060 1.1 msaitoh /* VLAN MACLEN IPLEN */
1061 1.29 knakahar if (vlan_has_tag(mp)) {
1062 1.29 knakahar vtag = htole16(vlan_get_tag(mp));
1063 1.28 msaitoh vlan_macip_lens |= (vtag << IXGBE_ADVTXD_VLAN_SHIFT);
1064 1.1 msaitoh }
1065 1.1 msaitoh
1066 1.1 msaitoh vlan_macip_lens |= ehdrlen << IXGBE_ADVTXD_MACLEN_SHIFT;
1067 1.1 msaitoh vlan_macip_lens |= ip_hlen;
1068 1.1 msaitoh TXD->vlan_macip_lens = htole32(vlan_macip_lens);
1069 1.1 msaitoh
1070 1.1 msaitoh /* ADV DTYPE TUCMD */
1071 1.1 msaitoh type_tucmd_mlhl |= IXGBE_ADVTXD_DCMD_DEXT | IXGBE_ADVTXD_DTYP_CTXT;
1072 1.1 msaitoh type_tucmd_mlhl |= IXGBE_ADVTXD_TUCMD_L4T_TCP;
1073 1.1 msaitoh TXD->type_tucmd_mlhl = htole32(type_tucmd_mlhl);
1074 1.1 msaitoh
1075 1.1 msaitoh /* MSS L4LEN IDX */
1076 1.1 msaitoh mss_l4len_idx |= (mp->m_pkthdr.segsz << IXGBE_ADVTXD_MSS_SHIFT);
1077 1.1 msaitoh mss_l4len_idx |= (tcp_hlen << IXGBE_ADVTXD_L4LEN_SHIFT);
1078 1.1 msaitoh TXD->mss_l4len_idx = htole32(mss_l4len_idx);
1079 1.1 msaitoh
1080 1.1 msaitoh TXD->seqnum_seed = htole32(0);
1081 1.1 msaitoh
1082 1.1 msaitoh if (++ctxd == txr->num_desc)
1083 1.1 msaitoh ctxd = 0;
1084 1.1 msaitoh
1085 1.1 msaitoh txr->tx_avail--;
1086 1.1 msaitoh txr->next_avail_desc = ctxd;
1087 1.1 msaitoh *cmd_type_len |= IXGBE_ADVTXD_DCMD_TSE;
1088 1.1 msaitoh *olinfo_status |= IXGBE_TXD_POPTS_TXSM << 8;
1089 1.1 msaitoh *olinfo_status |= paylen << IXGBE_ADVTXD_PAYLEN_SHIFT;
1090 1.95 msaitoh IXGBE_EVC_ADD(&txr->tso_tx, 1);
1091 1.28 msaitoh
1092 1.1 msaitoh return (0);
1093 1.28 msaitoh } /* ixgbe_tso_setup */
1094 1.1 msaitoh
1095 1.3 msaitoh
1096 1.28 msaitoh /************************************************************************
1097 1.28 msaitoh * ixgbe_txeof
1098 1.1 msaitoh *
1099 1.28 msaitoh * Examine each tx_buffer in the used queue. If the hardware is done
1100 1.28 msaitoh * processing the packet then free associated resources. The
1101 1.28 msaitoh * tx_buffer is put back on the free queue.
1102 1.28 msaitoh ************************************************************************/
1103 1.32 msaitoh bool
1104 1.1 msaitoh ixgbe_txeof(struct tx_ring *txr)
1105 1.1 msaitoh {
1106 1.102 msaitoh struct ixgbe_softc *sc = txr->sc;
1107 1.102 msaitoh struct ifnet *ifp = sc->ifp;
1108 1.28 msaitoh struct ixgbe_tx_buf *buf;
1109 1.28 msaitoh union ixgbe_adv_tx_desc *txd;
1110 1.1 msaitoh u32 work, processed = 0;
1111 1.102 msaitoh u32 limit = sc->tx_process_limit;
1112 1.1 msaitoh
1113 1.1 msaitoh KASSERT(mutex_owned(&txr->tx_mtx));
1114 1.1 msaitoh
1115 1.1 msaitoh #ifdef DEV_NETMAP
1116 1.102 msaitoh if ((sc->feat_en & IXGBE_FEATURE_NETMAP) &&
1117 1.102 msaitoh (sc->ifp->if_capenable & IFCAP_NETMAP)) {
1118 1.102 msaitoh struct netmap_sc *na = NA(sc->ifp);
1119 1.53 msaitoh struct netmap_kring *kring = na->tx_rings[txr->me];
1120 1.1 msaitoh txd = txr->tx_base;
1121 1.1 msaitoh bus_dmamap_sync(txr->txdma.dma_tag, txr->txdma.dma_map,
1122 1.1 msaitoh BUS_DMASYNC_POSTREAD);
1123 1.1 msaitoh /*
1124 1.1 msaitoh * In netmap mode, all the work is done in the context
1125 1.1 msaitoh * of the client thread. Interrupt handlers only wake up
1126 1.1 msaitoh * clients, which may be sleeping on individual rings
1127 1.1 msaitoh * or on a global resource for all rings.
1128 1.1 msaitoh * To implement tx interrupt mitigation, we wake up the client
1129 1.1 msaitoh * thread roughly every half ring, even if the NIC interrupts
1130 1.1 msaitoh * more frequently. This is implemented as follows:
1131 1.1 msaitoh * - ixgbe_txsync() sets kring->nr_kflags with the index of
1132 1.1 msaitoh * the slot that should wake up the thread (nkr_num_slots
1133 1.1 msaitoh * means the user thread should not be woken up);
1134 1.1 msaitoh * - the driver ignores tx interrupts unless netmap_mitigate=0
1135 1.1 msaitoh * or the slot has the DD bit set.
1136 1.1 msaitoh */
1137 1.53 msaitoh if (kring->nr_kflags < kring->nkr_num_slots &&
1138 1.78 ryo le32toh(txd[kring->nr_kflags].wb.status) & IXGBE_TXD_STAT_DD) {
1139 1.1 msaitoh netmap_tx_irq(ifp, txr->me);
1140 1.1 msaitoh }
1141 1.32 msaitoh return false;
1142 1.1 msaitoh }
1143 1.1 msaitoh #endif /* DEV_NETMAP */
1144 1.1 msaitoh
1145 1.1 msaitoh if (txr->tx_avail == txr->num_desc) {
1146 1.45 msaitoh txr->busy = 0;
1147 1.32 msaitoh return false;
1148 1.1 msaitoh }
1149 1.1 msaitoh
1150 1.1 msaitoh /* Get work starting point */
1151 1.1 msaitoh work = txr->next_to_clean;
1152 1.1 msaitoh buf = &txr->tx_buffers[work];
1153 1.1 msaitoh txd = &txr->tx_base[work];
1154 1.1 msaitoh work -= txr->num_desc; /* The distance to ring end */
1155 1.28 msaitoh ixgbe_dmamap_sync(txr->txdma.dma_tag, txr->txdma.dma_map,
1156 1.1 msaitoh BUS_DMASYNC_POSTREAD);
1157 1.8 msaitoh
1158 1.1 msaitoh do {
1159 1.8 msaitoh union ixgbe_adv_tx_desc *eop = buf->eop;
1160 1.1 msaitoh if (eop == NULL) /* No work */
1161 1.1 msaitoh break;
1162 1.1 msaitoh
1163 1.78 ryo if ((le32toh(eop->wb.status) & IXGBE_TXD_STAT_DD) == 0)
1164 1.1 msaitoh break; /* I/O not complete */
1165 1.1 msaitoh
1166 1.1 msaitoh if (buf->m_head) {
1167 1.28 msaitoh txr->bytes += buf->m_head->m_pkthdr.len;
1168 1.28 msaitoh bus_dmamap_sync(txr->txtag->dt_dmat, buf->map,
1169 1.1 msaitoh 0, buf->m_head->m_pkthdr.len,
1170 1.1 msaitoh BUS_DMASYNC_POSTWRITE);
1171 1.28 msaitoh ixgbe_dmamap_unload(txr->txtag, buf->map);
1172 1.1 msaitoh m_freem(buf->m_head);
1173 1.1 msaitoh buf->m_head = NULL;
1174 1.1 msaitoh }
1175 1.1 msaitoh buf->eop = NULL;
1176 1.47 msaitoh txr->txr_no_space = false;
1177 1.1 msaitoh ++txr->tx_avail;
1178 1.1 msaitoh
1179 1.1 msaitoh /* We clean the range if multi segment */
1180 1.1 msaitoh while (txd != eop) {
1181 1.1 msaitoh ++txd;
1182 1.1 msaitoh ++buf;
1183 1.1 msaitoh ++work;
1184 1.1 msaitoh /* wrap the ring? */
1185 1.1 msaitoh if (__predict_false(!work)) {
1186 1.1 msaitoh work -= txr->num_desc;
1187 1.1 msaitoh buf = txr->tx_buffers;
1188 1.1 msaitoh txd = txr->tx_base;
1189 1.1 msaitoh }
1190 1.1 msaitoh if (buf->m_head) {
1191 1.1 msaitoh txr->bytes +=
1192 1.1 msaitoh buf->m_head->m_pkthdr.len;
1193 1.1 msaitoh bus_dmamap_sync(txr->txtag->dt_dmat,
1194 1.1 msaitoh buf->map,
1195 1.1 msaitoh 0, buf->m_head->m_pkthdr.len,
1196 1.1 msaitoh BUS_DMASYNC_POSTWRITE);
1197 1.1 msaitoh ixgbe_dmamap_unload(txr->txtag,
1198 1.1 msaitoh buf->map);
1199 1.1 msaitoh m_freem(buf->m_head);
1200 1.1 msaitoh buf->m_head = NULL;
1201 1.1 msaitoh }
1202 1.1 msaitoh ++txr->tx_avail;
1203 1.1 msaitoh buf->eop = NULL;
1204 1.1 msaitoh
1205 1.1 msaitoh }
1206 1.1 msaitoh ++txr->packets;
1207 1.1 msaitoh ++processed;
1208 1.61 thorpej if_statinc(ifp, if_opackets);
1209 1.1 msaitoh
1210 1.1 msaitoh /* Try the next packet */
1211 1.1 msaitoh ++txd;
1212 1.1 msaitoh ++buf;
1213 1.1 msaitoh ++work;
1214 1.1 msaitoh /* reset with a wrap */
1215 1.1 msaitoh if (__predict_false(!work)) {
1216 1.1 msaitoh work -= txr->num_desc;
1217 1.1 msaitoh buf = txr->tx_buffers;
1218 1.1 msaitoh txd = txr->tx_base;
1219 1.1 msaitoh }
1220 1.1 msaitoh prefetch(txd);
1221 1.1 msaitoh } while (__predict_true(--limit));
1222 1.1 msaitoh
1223 1.1 msaitoh ixgbe_dmamap_sync(txr->txdma.dma_tag, txr->txdma.dma_map,
1224 1.1 msaitoh BUS_DMASYNC_PREREAD | BUS_DMASYNC_PREWRITE);
1225 1.1 msaitoh
1226 1.1 msaitoh work += txr->num_desc;
1227 1.1 msaitoh txr->next_to_clean = work;
1228 1.1 msaitoh
1229 1.45 msaitoh /*
1230 1.45 msaitoh * Queue Hang detection, we know there's
1231 1.45 msaitoh * work outstanding or the first return
1232 1.45 msaitoh * would have been taken, so increment busy
1233 1.45 msaitoh * if nothing managed to get cleaned, then
1234 1.45 msaitoh * in local_timer it will be checked and
1235 1.45 msaitoh * marked as HUNG if it exceeds a MAX attempt.
1236 1.45 msaitoh */
1237 1.45 msaitoh if ((processed == 0) && (txr->busy != IXGBE_QUEUE_HUNG))
1238 1.45 msaitoh ++txr->busy;
1239 1.45 msaitoh /*
1240 1.45 msaitoh * If anything gets cleaned we reset state to 1,
1241 1.45 msaitoh * note this will turn off HUNG if its set.
1242 1.45 msaitoh */
1243 1.45 msaitoh if (processed)
1244 1.45 msaitoh txr->busy = 1;
1245 1.45 msaitoh
1246 1.43 msaitoh if (txr->tx_avail == txr->num_desc)
1247 1.45 msaitoh txr->busy = 0;
1248 1.43 msaitoh
1249 1.32 msaitoh return ((limit > 0) ? false : true);
1250 1.28 msaitoh } /* ixgbe_txeof */
1251 1.1 msaitoh
1252 1.28 msaitoh /************************************************************************
1253 1.28 msaitoh * ixgbe_rsc_count
1254 1.28 msaitoh *
1255 1.28 msaitoh * Used to detect a descriptor that has been merged by Hardware RSC.
1256 1.28 msaitoh ************************************************************************/
1257 1.1 msaitoh static inline u32
1258 1.1 msaitoh ixgbe_rsc_count(union ixgbe_adv_rx_desc *rx)
1259 1.1 msaitoh {
1260 1.1 msaitoh return (le32toh(rx->wb.lower.lo_dword.data) &
1261 1.1 msaitoh IXGBE_RXDADV_RSCCNT_MASK) >> IXGBE_RXDADV_RSCCNT_SHIFT;
1262 1.28 msaitoh } /* ixgbe_rsc_count */
1263 1.1 msaitoh
1264 1.28 msaitoh /************************************************************************
1265 1.28 msaitoh * ixgbe_setup_hw_rsc
1266 1.1 msaitoh *
1267 1.28 msaitoh * Initialize Hardware RSC (LRO) feature on 82599
1268 1.28 msaitoh * for an RX ring, this is toggled by the LRO capability
1269 1.28 msaitoh * even though it is transparent to the stack.
1270 1.28 msaitoh *
1271 1.28 msaitoh * NOTE: Since this HW feature only works with IPv4 and
1272 1.28 msaitoh * testing has shown soft LRO to be as effective,
1273 1.28 msaitoh * this feature will be disabled by default.
1274 1.28 msaitoh ************************************************************************/
1275 1.1 msaitoh static void
1276 1.1 msaitoh ixgbe_setup_hw_rsc(struct rx_ring *rxr)
1277 1.1 msaitoh {
1278 1.102 msaitoh struct ixgbe_softc *sc = rxr->sc;
1279 1.102 msaitoh struct ixgbe_hw *hw = &sc->hw;
1280 1.28 msaitoh u32 rscctrl, rdrxctl;
1281 1.1 msaitoh
1282 1.1 msaitoh /* If turning LRO/RSC off we need to disable it */
1283 1.102 msaitoh if ((sc->ifp->if_capenable & IFCAP_LRO) == 0) {
1284 1.1 msaitoh rscctrl = IXGBE_READ_REG(hw, IXGBE_RSCCTL(rxr->me));
1285 1.1 msaitoh rscctrl &= ~IXGBE_RSCCTL_RSCEN;
1286 1.1 msaitoh return;
1287 1.1 msaitoh }
1288 1.1 msaitoh
1289 1.1 msaitoh rdrxctl = IXGBE_READ_REG(hw, IXGBE_RDRXCTL);
1290 1.1 msaitoh rdrxctl &= ~IXGBE_RDRXCTL_RSCFRSTSIZE;
1291 1.28 msaitoh #ifdef DEV_NETMAP
1292 1.28 msaitoh /* Always strip CRC unless Netmap disabled it */
1293 1.102 msaitoh if (!(sc->feat_en & IXGBE_FEATURE_NETMAP) ||
1294 1.102 msaitoh !(sc->ifp->if_capenable & IFCAP_NETMAP) ||
1295 1.28 msaitoh ix_crcstrip)
1296 1.1 msaitoh #endif /* DEV_NETMAP */
1297 1.28 msaitoh rdrxctl |= IXGBE_RDRXCTL_CRCSTRIP;
1298 1.1 msaitoh rdrxctl |= IXGBE_RDRXCTL_RSCACKC;
1299 1.1 msaitoh IXGBE_WRITE_REG(hw, IXGBE_RDRXCTL, rdrxctl);
1300 1.1 msaitoh
1301 1.1 msaitoh rscctrl = IXGBE_READ_REG(hw, IXGBE_RSCCTL(rxr->me));
1302 1.1 msaitoh rscctrl |= IXGBE_RSCCTL_RSCEN;
1303 1.1 msaitoh /*
1304 1.28 msaitoh * Limit the total number of descriptors that
1305 1.28 msaitoh * can be combined, so it does not exceed 64K
1306 1.28 msaitoh */
1307 1.1 msaitoh if (rxr->mbuf_sz == MCLBYTES)
1308 1.1 msaitoh rscctrl |= IXGBE_RSCCTL_MAXDESC_16;
1309 1.1 msaitoh else if (rxr->mbuf_sz == MJUMPAGESIZE)
1310 1.1 msaitoh rscctrl |= IXGBE_RSCCTL_MAXDESC_8;
1311 1.1 msaitoh else if (rxr->mbuf_sz == MJUM9BYTES)
1312 1.1 msaitoh rscctrl |= IXGBE_RSCCTL_MAXDESC_4;
1313 1.1 msaitoh else /* Using 16K cluster */
1314 1.1 msaitoh rscctrl |= IXGBE_RSCCTL_MAXDESC_1;
1315 1.1 msaitoh
1316 1.1 msaitoh IXGBE_WRITE_REG(hw, IXGBE_RSCCTL(rxr->me), rscctrl);
1317 1.1 msaitoh
1318 1.1 msaitoh /* Enable TCP header recognition */
1319 1.1 msaitoh IXGBE_WRITE_REG(hw, IXGBE_PSRTYPE(0),
1320 1.28 msaitoh (IXGBE_READ_REG(hw, IXGBE_PSRTYPE(0)) | IXGBE_PSRTYPE_TCPHDR));
1321 1.1 msaitoh
1322 1.1 msaitoh /* Disable RSC for ACK packets */
1323 1.1 msaitoh IXGBE_WRITE_REG(hw, IXGBE_RSCDBU,
1324 1.1 msaitoh (IXGBE_RSCDBU_RSCACKDIS | IXGBE_READ_REG(hw, IXGBE_RSCDBU)));
1325 1.1 msaitoh
1326 1.1 msaitoh rxr->hw_rsc = TRUE;
1327 1.28 msaitoh } /* ixgbe_setup_hw_rsc */
1328 1.8 msaitoh
1329 1.28 msaitoh /************************************************************************
1330 1.28 msaitoh * ixgbe_refresh_mbufs
1331 1.1 msaitoh *
1332 1.28 msaitoh * Refresh mbuf buffers for RX descriptor rings
1333 1.28 msaitoh * - now keeps its own state so discards due to resource
1334 1.28 msaitoh * exhaustion are unnecessary, if an mbuf cannot be obtained
1335 1.28 msaitoh * it just returns, keeping its placeholder, thus it can simply
1336 1.28 msaitoh * be recalled to try again.
1337 1.28 msaitoh ************************************************************************/
1338 1.1 msaitoh static void
1339 1.1 msaitoh ixgbe_refresh_mbufs(struct rx_ring *rxr, int limit)
1340 1.1 msaitoh {
1341 1.102 msaitoh struct ixgbe_softc *sc = rxr->sc;
1342 1.28 msaitoh struct ixgbe_rx_buf *rxbuf;
1343 1.28 msaitoh struct mbuf *mp;
1344 1.82 msaitoh int i, error;
1345 1.28 msaitoh bool refreshed = false;
1346 1.1 msaitoh
1347 1.82 msaitoh i = rxr->next_to_refresh;
1348 1.82 msaitoh /* next_to_refresh points to the previous one */
1349 1.82 msaitoh if (++i == rxr->num_desc)
1350 1.82 msaitoh i = 0;
1351 1.1 msaitoh
1352 1.82 msaitoh while (i != limit) {
1353 1.1 msaitoh rxbuf = &rxr->rx_buffers[i];
1354 1.91 msaitoh if (__predict_false(rxbuf->buf == NULL)) {
1355 1.87 msaitoh mp = ixgbe_getcl();
1356 1.1 msaitoh if (mp == NULL) {
1357 1.95 msaitoh IXGBE_EVC_ADD(&rxr->no_mbuf, 1);
1358 1.1 msaitoh goto update;
1359 1.1 msaitoh }
1360 1.86 msaitoh mp->m_pkthdr.len = mp->m_len = rxr->mbuf_sz;
1361 1.102 msaitoh IXGBE_M_ADJ(sc, rxr, mp);
1362 1.1 msaitoh } else
1363 1.1 msaitoh mp = rxbuf->buf;
1364 1.1 msaitoh
1365 1.1 msaitoh /* If we're dealing with an mbuf that was copied rather
1366 1.1 msaitoh * than replaced, there's no need to go through busdma.
1367 1.1 msaitoh */
1368 1.1 msaitoh if ((rxbuf->flags & IXGBE_RX_COPY) == 0) {
1369 1.1 msaitoh /* Get the memory mapping */
1370 1.4 msaitoh ixgbe_dmamap_unload(rxr->ptag, rxbuf->pmap);
1371 1.1 msaitoh error = bus_dmamap_load_mbuf(rxr->ptag->dt_dmat,
1372 1.1 msaitoh rxbuf->pmap, mp, BUS_DMA_NOWAIT);
1373 1.91 msaitoh if (__predict_false(error != 0)) {
1374 1.102 msaitoh device_printf(sc->dev, "Refresh mbufs: "
1375 1.55 msaitoh "payload dmamap load failure - %d\n",
1376 1.55 msaitoh error);
1377 1.1 msaitoh m_free(mp);
1378 1.1 msaitoh rxbuf->buf = NULL;
1379 1.1 msaitoh goto update;
1380 1.1 msaitoh }
1381 1.1 msaitoh rxbuf->buf = mp;
1382 1.1 msaitoh bus_dmamap_sync(rxr->ptag->dt_dmat, rxbuf->pmap,
1383 1.1 msaitoh 0, mp->m_pkthdr.len, BUS_DMASYNC_PREREAD);
1384 1.1 msaitoh rxbuf->addr = rxr->rx_base[i].read.pkt_addr =
1385 1.1 msaitoh htole64(rxbuf->pmap->dm_segs[0].ds_addr);
1386 1.1 msaitoh } else {
1387 1.1 msaitoh rxr->rx_base[i].read.pkt_addr = rxbuf->addr;
1388 1.1 msaitoh rxbuf->flags &= ~IXGBE_RX_COPY;
1389 1.1 msaitoh }
1390 1.1 msaitoh
1391 1.1 msaitoh refreshed = true;
1392 1.82 msaitoh /* next_to_refresh points to the previous one */
1393 1.1 msaitoh rxr->next_to_refresh = i;
1394 1.82 msaitoh if (++i == rxr->num_desc)
1395 1.82 msaitoh i = 0;
1396 1.1 msaitoh }
1397 1.28 msaitoh
1398 1.1 msaitoh update:
1399 1.1 msaitoh if (refreshed) /* Update hardware tail index */
1400 1.102 msaitoh IXGBE_WRITE_REG(&sc->hw, rxr->tail, rxr->next_to_refresh);
1401 1.28 msaitoh
1402 1.1 msaitoh return;
1403 1.28 msaitoh } /* ixgbe_refresh_mbufs */
1404 1.1 msaitoh
1405 1.28 msaitoh /************************************************************************
1406 1.28 msaitoh * ixgbe_allocate_receive_buffers
1407 1.1 msaitoh *
1408 1.28 msaitoh * Allocate memory for rx_buffer structures. Since we use one
1409 1.28 msaitoh * rx_buffer per received packet, the maximum number of rx_buffer's
1410 1.28 msaitoh * that we'll need is equal to the number of receive descriptors
1411 1.28 msaitoh * that we've allocated.
1412 1.28 msaitoh ************************************************************************/
1413 1.28 msaitoh static int
1414 1.1 msaitoh ixgbe_allocate_receive_buffers(struct rx_ring *rxr)
1415 1.1 msaitoh {
1416 1.102 msaitoh struct ixgbe_softc *sc = rxr->sc;
1417 1.102 msaitoh device_t dev = sc->dev;
1418 1.28 msaitoh struct ixgbe_rx_buf *rxbuf;
1419 1.28 msaitoh int bsize, error;
1420 1.1 msaitoh
1421 1.1 msaitoh bsize = sizeof(struct ixgbe_rx_buf) * rxr->num_desc;
1422 1.57 chs rxr->rx_buffers = malloc(bsize, M_DEVBUF, M_WAITOK | M_ZERO);
1423 1.1 msaitoh
1424 1.28 msaitoh error = ixgbe_dma_tag_create(
1425 1.102 msaitoh /* parent */ sc->osdep.dmat,
1426 1.28 msaitoh /* alignment */ 1,
1427 1.28 msaitoh /* bounds */ 0,
1428 1.28 msaitoh /* maxsize */ MJUM16BYTES,
1429 1.28 msaitoh /* nsegments */ 1,
1430 1.28 msaitoh /* maxsegsize */ MJUM16BYTES,
1431 1.28 msaitoh /* flags */ 0,
1432 1.28 msaitoh &rxr->ptag);
1433 1.28 msaitoh if (error != 0) {
1434 1.1 msaitoh aprint_error_dev(dev, "Unable to create RX DMA tag\n");
1435 1.1 msaitoh goto fail;
1436 1.1 msaitoh }
1437 1.1 msaitoh
1438 1.5 msaitoh for (int i = 0; i < rxr->num_desc; i++, rxbuf++) {
1439 1.1 msaitoh rxbuf = &rxr->rx_buffers[i];
1440 1.4 msaitoh error = ixgbe_dmamap_create(rxr->ptag, 0, &rxbuf->pmap);
1441 1.1 msaitoh if (error) {
1442 1.1 msaitoh aprint_error_dev(dev, "Unable to create RX dma map\n");
1443 1.1 msaitoh goto fail;
1444 1.1 msaitoh }
1445 1.1 msaitoh }
1446 1.1 msaitoh
1447 1.1 msaitoh return (0);
1448 1.1 msaitoh
1449 1.1 msaitoh fail:
1450 1.1 msaitoh /* Frees all, but can handle partial completion */
1451 1.102 msaitoh ixgbe_free_receive_structures(sc);
1452 1.28 msaitoh
1453 1.1 msaitoh return (error);
1454 1.28 msaitoh } /* ixgbe_allocate_receive_buffers */
1455 1.1 msaitoh
1456 1.28 msaitoh /************************************************************************
1457 1.30 msaitoh * ixgbe_free_receive_ring
1458 1.28 msaitoh ************************************************************************/
1459 1.28 msaitoh static void
1460 1.1 msaitoh ixgbe_free_receive_ring(struct rx_ring *rxr)
1461 1.27 msaitoh {
1462 1.5 msaitoh for (int i = 0; i < rxr->num_desc; i++) {
1463 1.27 msaitoh ixgbe_rx_discard(rxr, i);
1464 1.1 msaitoh }
1465 1.28 msaitoh } /* ixgbe_free_receive_ring */
1466 1.1 msaitoh
1467 1.28 msaitoh /************************************************************************
1468 1.28 msaitoh * ixgbe_setup_receive_ring
1469 1.1 msaitoh *
1470 1.28 msaitoh * Initialize a receive ring and its buffers.
1471 1.28 msaitoh ************************************************************************/
1472 1.1 msaitoh static int
1473 1.1 msaitoh ixgbe_setup_receive_ring(struct rx_ring *rxr)
1474 1.1 msaitoh {
1475 1.102 msaitoh struct ixgbe_softc *sc;
1476 1.28 msaitoh struct ixgbe_rx_buf *rxbuf;
1477 1.1 msaitoh #ifdef LRO
1478 1.28 msaitoh struct ifnet *ifp;
1479 1.28 msaitoh struct lro_ctrl *lro = &rxr->lro;
1480 1.1 msaitoh #endif /* LRO */
1481 1.1 msaitoh #ifdef DEV_NETMAP
1482 1.102 msaitoh struct netmap_sc *na = NA(rxr->sc->ifp);
1483 1.28 msaitoh struct netmap_slot *slot;
1484 1.1 msaitoh #endif /* DEV_NETMAP */
1485 1.28 msaitoh int rsize, error = 0;
1486 1.1 msaitoh
1487 1.102 msaitoh sc = rxr->sc;
1488 1.1 msaitoh #ifdef LRO
1489 1.102 msaitoh ifp = sc->ifp;
1490 1.1 msaitoh #endif /* LRO */
1491 1.1 msaitoh
1492 1.1 msaitoh /* Clear the ring contents */
1493 1.1 msaitoh IXGBE_RX_LOCK(rxr);
1494 1.28 msaitoh
1495 1.1 msaitoh #ifdef DEV_NETMAP
1496 1.102 msaitoh if (sc->feat_en & IXGBE_FEATURE_NETMAP)
1497 1.28 msaitoh slot = netmap_reset(na, NR_RX, rxr->me, 0);
1498 1.1 msaitoh #endif /* DEV_NETMAP */
1499 1.28 msaitoh
1500 1.102 msaitoh rsize = roundup2(sc->num_rx_desc *
1501 1.1 msaitoh sizeof(union ixgbe_adv_rx_desc), DBA_ALIGN);
1502 1.1 msaitoh bzero((void *)rxr->rx_base, rsize);
1503 1.1 msaitoh /* Cache the size */
1504 1.102 msaitoh rxr->mbuf_sz = sc->rx_mbuf_sz;
1505 1.1 msaitoh
1506 1.1 msaitoh /* Free current RX buffer structs and their mbufs */
1507 1.1 msaitoh ixgbe_free_receive_ring(rxr);
1508 1.1 msaitoh
1509 1.1 msaitoh /* Now replenish the mbufs */
1510 1.1 msaitoh for (int j = 0; j != rxr->num_desc; ++j) {
1511 1.28 msaitoh struct mbuf *mp;
1512 1.1 msaitoh
1513 1.1 msaitoh rxbuf = &rxr->rx_buffers[j];
1514 1.28 msaitoh
1515 1.1 msaitoh #ifdef DEV_NETMAP
1516 1.1 msaitoh /*
1517 1.1 msaitoh * In netmap mode, fill the map and set the buffer
1518 1.1 msaitoh * address in the NIC ring, considering the offset
1519 1.1 msaitoh * between the netmap and NIC rings (see comment in
1520 1.1 msaitoh * ixgbe_setup_transmit_ring() ). No need to allocate
1521 1.1 msaitoh * an mbuf, so end the block with a continue;
1522 1.1 msaitoh */
1523 1.102 msaitoh if ((sc->feat_en & IXGBE_FEATURE_NETMAP) && slot) {
1524 1.53 msaitoh int sj = netmap_idx_n2k(na->rx_rings[rxr->me], j);
1525 1.1 msaitoh uint64_t paddr;
1526 1.1 msaitoh void *addr;
1527 1.1 msaitoh
1528 1.1 msaitoh addr = PNMB(na, slot + sj, &paddr);
1529 1.1 msaitoh netmap_load_map(na, rxr->ptag, rxbuf->pmap, addr);
1530 1.1 msaitoh /* Update descriptor and the cached value */
1531 1.1 msaitoh rxr->rx_base[j].read.pkt_addr = htole64(paddr);
1532 1.1 msaitoh rxbuf->addr = htole64(paddr);
1533 1.1 msaitoh continue;
1534 1.1 msaitoh }
1535 1.1 msaitoh #endif /* DEV_NETMAP */
1536 1.28 msaitoh
1537 1.28 msaitoh rxbuf->flags = 0;
1538 1.87 msaitoh rxbuf->buf = ixgbe_getcl();
1539 1.1 msaitoh if (rxbuf->buf == NULL) {
1540 1.95 msaitoh IXGBE_EVC_ADD(&rxr->no_mbuf, 1);
1541 1.1 msaitoh error = ENOBUFS;
1542 1.28 msaitoh goto fail;
1543 1.1 msaitoh }
1544 1.1 msaitoh mp = rxbuf->buf;
1545 1.1 msaitoh mp->m_pkthdr.len = mp->m_len = rxr->mbuf_sz;
1546 1.102 msaitoh IXGBE_M_ADJ(sc, rxr, mp);
1547 1.1 msaitoh /* Get the memory mapping */
1548 1.28 msaitoh error = bus_dmamap_load_mbuf(rxr->ptag->dt_dmat, rxbuf->pmap,
1549 1.28 msaitoh mp, BUS_DMA_NOWAIT);
1550 1.75 msaitoh if (error != 0) {
1551 1.75 msaitoh /*
1552 1.75 msaitoh * Clear this entry for later cleanup in
1553 1.75 msaitoh * ixgbe_discard() which is called via
1554 1.75 msaitoh * ixgbe_free_receive_ring().
1555 1.75 msaitoh */
1556 1.75 msaitoh m_freem(mp);
1557 1.75 msaitoh rxbuf->buf = NULL;
1558 1.85 msaitoh goto fail;
1559 1.75 msaitoh }
1560 1.1 msaitoh bus_dmamap_sync(rxr->ptag->dt_dmat, rxbuf->pmap,
1561 1.83 msaitoh 0, mp->m_pkthdr.len, BUS_DMASYNC_PREREAD);
1562 1.1 msaitoh /* Update the descriptor and the cached value */
1563 1.1 msaitoh rxr->rx_base[j].read.pkt_addr =
1564 1.1 msaitoh htole64(rxbuf->pmap->dm_segs[0].ds_addr);
1565 1.1 msaitoh rxbuf->addr = htole64(rxbuf->pmap->dm_segs[0].ds_addr);
1566 1.1 msaitoh }
1567 1.1 msaitoh
1568 1.1 msaitoh /* Setup our descriptor indices */
1569 1.1 msaitoh rxr->next_to_check = 0;
1570 1.102 msaitoh rxr->next_to_refresh = sc->num_rx_desc - 1; /* Fully allocated */
1571 1.1 msaitoh rxr->lro_enabled = FALSE;
1572 1.90 msaitoh rxr->discard_multidesc = false;
1573 1.95 msaitoh IXGBE_EVC_STORE(&rxr->rx_copies, 0);
1574 1.13 msaitoh #if 0 /* NetBSD */
1575 1.95 msaitoh IXGBE_EVC_STORE(&rxr->rx_bytes, 0);
1576 1.13 msaitoh #if 1 /* Fix inconsistency */
1577 1.95 msaitoh IXGBE_EVC_STORE(&rxr->rx_packets, 0);
1578 1.13 msaitoh #endif
1579 1.13 msaitoh #endif
1580 1.1 msaitoh rxr->vtag_strip = FALSE;
1581 1.1 msaitoh
1582 1.1 msaitoh ixgbe_dmamap_sync(rxr->rxdma.dma_tag, rxr->rxdma.dma_map,
1583 1.1 msaitoh BUS_DMASYNC_PREREAD | BUS_DMASYNC_PREWRITE);
1584 1.1 msaitoh
1585 1.1 msaitoh /*
1586 1.28 msaitoh * Now set up the LRO interface
1587 1.28 msaitoh */
1588 1.1 msaitoh if (ixgbe_rsc_enable)
1589 1.1 msaitoh ixgbe_setup_hw_rsc(rxr);
1590 1.1 msaitoh #ifdef LRO
1591 1.1 msaitoh else if (ifp->if_capenable & IFCAP_LRO) {
1592 1.102 msaitoh device_t dev = sc->dev;
1593 1.1 msaitoh int err = tcp_lro_init(lro);
1594 1.1 msaitoh if (err) {
1595 1.1 msaitoh device_printf(dev, "LRO Initialization failed!\n");
1596 1.1 msaitoh goto fail;
1597 1.1 msaitoh }
1598 1.1 msaitoh INIT_DEBUGOUT("RX Soft LRO Initialized\n");
1599 1.1 msaitoh rxr->lro_enabled = TRUE;
1600 1.102 msaitoh lro->ifp = sc->ifp;
1601 1.1 msaitoh }
1602 1.1 msaitoh #endif /* LRO */
1603 1.1 msaitoh
1604 1.1 msaitoh IXGBE_RX_UNLOCK(rxr);
1605 1.28 msaitoh
1606 1.1 msaitoh return (0);
1607 1.1 msaitoh
1608 1.1 msaitoh fail:
1609 1.1 msaitoh ixgbe_free_receive_ring(rxr);
1610 1.1 msaitoh IXGBE_RX_UNLOCK(rxr);
1611 1.28 msaitoh
1612 1.1 msaitoh return (error);
1613 1.28 msaitoh } /* ixgbe_setup_receive_ring */
1614 1.1 msaitoh
1615 1.28 msaitoh /************************************************************************
1616 1.28 msaitoh * ixgbe_setup_receive_structures - Initialize all receive rings.
1617 1.28 msaitoh ************************************************************************/
1618 1.1 msaitoh int
1619 1.102 msaitoh ixgbe_setup_receive_structures(struct ixgbe_softc *sc)
1620 1.1 msaitoh {
1621 1.102 msaitoh struct rx_ring *rxr = sc->rx_rings;
1622 1.28 msaitoh int j;
1623 1.1 msaitoh
1624 1.62 msaitoh INIT_DEBUGOUT("ixgbe_setup_receive_structures");
1625 1.102 msaitoh for (j = 0; j < sc->num_queues; j++, rxr++)
1626 1.1 msaitoh if (ixgbe_setup_receive_ring(rxr))
1627 1.1 msaitoh goto fail;
1628 1.1 msaitoh
1629 1.1 msaitoh return (0);
1630 1.1 msaitoh fail:
1631 1.1 msaitoh /*
1632 1.1 msaitoh * Free RX buffers allocated so far, we will only handle
1633 1.1 msaitoh * the rings that completed, the failing case will have
1634 1.1 msaitoh * cleaned up for itself. 'j' failed, so its the terminus.
1635 1.1 msaitoh */
1636 1.1 msaitoh for (int i = 0; i < j; ++i) {
1637 1.102 msaitoh rxr = &sc->rx_rings[i];
1638 1.27 msaitoh IXGBE_RX_LOCK(rxr);
1639 1.1 msaitoh ixgbe_free_receive_ring(rxr);
1640 1.27 msaitoh IXGBE_RX_UNLOCK(rxr);
1641 1.1 msaitoh }
1642 1.1 msaitoh
1643 1.1 msaitoh return (ENOBUFS);
1644 1.28 msaitoh } /* ixgbe_setup_receive_structures */
1645 1.1 msaitoh
1646 1.3 msaitoh
1647 1.28 msaitoh /************************************************************************
1648 1.28 msaitoh * ixgbe_free_receive_structures - Free all receive rings.
1649 1.28 msaitoh ************************************************************************/
1650 1.1 msaitoh void
1651 1.102 msaitoh ixgbe_free_receive_structures(struct ixgbe_softc *sc)
1652 1.1 msaitoh {
1653 1.102 msaitoh struct rx_ring *rxr = sc->rx_rings;
1654 1.1 msaitoh
1655 1.1 msaitoh INIT_DEBUGOUT("ixgbe_free_receive_structures: begin");
1656 1.1 msaitoh
1657 1.102 msaitoh for (int i = 0; i < sc->num_queues; i++, rxr++) {
1658 1.1 msaitoh ixgbe_free_receive_buffers(rxr);
1659 1.1 msaitoh #ifdef LRO
1660 1.1 msaitoh /* Free LRO memory */
1661 1.28 msaitoh tcp_lro_free(&rxr->lro);
1662 1.1 msaitoh #endif /* LRO */
1663 1.1 msaitoh /* Free the ring memory as well */
1664 1.102 msaitoh ixgbe_dma_free(sc, &rxr->rxdma);
1665 1.1 msaitoh IXGBE_RX_LOCK_DESTROY(rxr);
1666 1.1 msaitoh }
1667 1.1 msaitoh
1668 1.102 msaitoh free(sc->rx_rings, M_DEVBUF);
1669 1.28 msaitoh } /* ixgbe_free_receive_structures */
1670 1.1 msaitoh
1671 1.1 msaitoh
1672 1.28 msaitoh /************************************************************************
1673 1.28 msaitoh * ixgbe_free_receive_buffers - Free receive ring data structures
1674 1.28 msaitoh ************************************************************************/
1675 1.1 msaitoh static void
1676 1.1 msaitoh ixgbe_free_receive_buffers(struct rx_ring *rxr)
1677 1.1 msaitoh {
1678 1.102 msaitoh struct ixgbe_softc *sc = rxr->sc;
1679 1.28 msaitoh struct ixgbe_rx_buf *rxbuf;
1680 1.1 msaitoh
1681 1.1 msaitoh INIT_DEBUGOUT("ixgbe_free_receive_buffers: begin");
1682 1.1 msaitoh
1683 1.1 msaitoh /* Cleanup any existing buffers */
1684 1.1 msaitoh if (rxr->rx_buffers != NULL) {
1685 1.102 msaitoh for (int i = 0; i < sc->num_rx_desc; i++) {
1686 1.1 msaitoh rxbuf = &rxr->rx_buffers[i];
1687 1.27 msaitoh ixgbe_rx_discard(rxr, i);
1688 1.1 msaitoh if (rxbuf->pmap != NULL) {
1689 1.1 msaitoh ixgbe_dmamap_destroy(rxr->ptag, rxbuf->pmap);
1690 1.1 msaitoh rxbuf->pmap = NULL;
1691 1.1 msaitoh }
1692 1.1 msaitoh }
1693 1.59 msaitoh
1694 1.1 msaitoh if (rxr->rx_buffers != NULL) {
1695 1.1 msaitoh free(rxr->rx_buffers, M_DEVBUF);
1696 1.1 msaitoh rxr->rx_buffers = NULL;
1697 1.1 msaitoh }
1698 1.1 msaitoh }
1699 1.1 msaitoh
1700 1.1 msaitoh if (rxr->ptag != NULL) {
1701 1.1 msaitoh ixgbe_dma_tag_destroy(rxr->ptag);
1702 1.1 msaitoh rxr->ptag = NULL;
1703 1.1 msaitoh }
1704 1.1 msaitoh
1705 1.1 msaitoh return;
1706 1.28 msaitoh } /* ixgbe_free_receive_buffers */
1707 1.1 msaitoh
1708 1.28 msaitoh /************************************************************************
1709 1.28 msaitoh * ixgbe_rx_input
1710 1.28 msaitoh ************************************************************************/
1711 1.1 msaitoh static __inline void
1712 1.28 msaitoh ixgbe_rx_input(struct rx_ring *rxr, struct ifnet *ifp, struct mbuf *m,
1713 1.28 msaitoh u32 ptype)
1714 1.1 msaitoh {
1715 1.102 msaitoh struct ixgbe_softc *sc = ifp->if_softc;
1716 1.1 msaitoh
1717 1.1 msaitoh #ifdef LRO
1718 1.102 msaitoh struct ethercom *ec = &sc->osdep.ec;
1719 1.1 msaitoh
1720 1.28 msaitoh /*
1721 1.28 msaitoh * ATM LRO is only for IP/TCP packets and TCP checksum of the packet
1722 1.28 msaitoh * should be computed by hardware. Also it should not have VLAN tag in
1723 1.28 msaitoh * ethernet header. In case of IPv6 we do not yet support ext. hdrs.
1724 1.28 msaitoh */
1725 1.1 msaitoh if (rxr->lro_enabled &&
1726 1.1 msaitoh (ec->ec_capenable & ETHERCAP_VLAN_HWTAGGING) != 0 &&
1727 1.1 msaitoh (ptype & IXGBE_RXDADV_PKTTYPE_ETQF) == 0 &&
1728 1.1 msaitoh ((ptype & (IXGBE_RXDADV_PKTTYPE_IPV4 | IXGBE_RXDADV_PKTTYPE_TCP)) ==
1729 1.1 msaitoh (IXGBE_RXDADV_PKTTYPE_IPV4 | IXGBE_RXDADV_PKTTYPE_TCP) ||
1730 1.1 msaitoh (ptype & (IXGBE_RXDADV_PKTTYPE_IPV6 | IXGBE_RXDADV_PKTTYPE_TCP)) ==
1731 1.1 msaitoh (IXGBE_RXDADV_PKTTYPE_IPV6 | IXGBE_RXDADV_PKTTYPE_TCP)) &&
1732 1.1 msaitoh (m->m_pkthdr.csum_flags & (CSUM_DATA_VALID | CSUM_PSEUDO_HDR)) ==
1733 1.1 msaitoh (CSUM_DATA_VALID | CSUM_PSEUDO_HDR)) {
1734 1.1 msaitoh /*
1735 1.1 msaitoh * Send to the stack if:
1736 1.1 msaitoh ** - LRO not enabled, or
1737 1.1 msaitoh ** - no LRO resources, or
1738 1.1 msaitoh ** - lro enqueue fails
1739 1.1 msaitoh */
1740 1.1 msaitoh if (rxr->lro.lro_cnt != 0)
1741 1.1 msaitoh if (tcp_lro_rx(&rxr->lro, m, 0) == 0)
1742 1.1 msaitoh return;
1743 1.1 msaitoh }
1744 1.1 msaitoh #endif /* LRO */
1745 1.1 msaitoh
1746 1.102 msaitoh if_percpuq_enqueue(sc->ipq, m);
1747 1.28 msaitoh } /* ixgbe_rx_input */
1748 1.1 msaitoh
1749 1.28 msaitoh /************************************************************************
1750 1.28 msaitoh * ixgbe_rx_discard
1751 1.28 msaitoh ************************************************************************/
1752 1.1 msaitoh static __inline void
1753 1.1 msaitoh ixgbe_rx_discard(struct rx_ring *rxr, int i)
1754 1.1 msaitoh {
1755 1.28 msaitoh struct ixgbe_rx_buf *rbuf;
1756 1.1 msaitoh
1757 1.1 msaitoh rbuf = &rxr->rx_buffers[i];
1758 1.1 msaitoh
1759 1.1 msaitoh /*
1760 1.70 msaitoh * With advanced descriptors the writeback clobbers the buffer addrs,
1761 1.70 msaitoh * so its easier to just free the existing mbufs and take the normal
1762 1.70 msaitoh * refresh path to get new buffers and mapping.
1763 1.28 msaitoh */
1764 1.1 msaitoh
1765 1.26 msaitoh if (rbuf->fmp != NULL) {/* Partial chain ? */
1766 1.27 msaitoh bus_dmamap_sync(rxr->ptag->dt_dmat, rbuf->pmap, 0,
1767 1.27 msaitoh rbuf->buf->m_pkthdr.len, BUS_DMASYNC_POSTREAD);
1768 1.72 rin ixgbe_dmamap_unload(rxr->ptag, rbuf->pmap);
1769 1.1 msaitoh m_freem(rbuf->fmp);
1770 1.1 msaitoh rbuf->fmp = NULL;
1771 1.1 msaitoh rbuf->buf = NULL; /* rbuf->buf is part of fmp's chain */
1772 1.1 msaitoh } else if (rbuf->buf) {
1773 1.27 msaitoh bus_dmamap_sync(rxr->ptag->dt_dmat, rbuf->pmap, 0,
1774 1.27 msaitoh rbuf->buf->m_pkthdr.len, BUS_DMASYNC_POSTREAD);
1775 1.72 rin ixgbe_dmamap_unload(rxr->ptag, rbuf->pmap);
1776 1.1 msaitoh m_free(rbuf->buf);
1777 1.1 msaitoh rbuf->buf = NULL;
1778 1.1 msaitoh }
1779 1.1 msaitoh
1780 1.1 msaitoh rbuf->flags = 0;
1781 1.1 msaitoh
1782 1.1 msaitoh return;
1783 1.28 msaitoh } /* ixgbe_rx_discard */
1784 1.1 msaitoh
1785 1.1 msaitoh
1786 1.28 msaitoh /************************************************************************
1787 1.28 msaitoh * ixgbe_rxeof
1788 1.1 msaitoh *
1789 1.28 msaitoh * Executes in interrupt context. It replenishes the
1790 1.28 msaitoh * mbufs in the descriptor and sends data which has
1791 1.28 msaitoh * been dma'ed into host memory to upper layer.
1792 1.1 msaitoh *
1793 1.28 msaitoh * Return TRUE for more work, FALSE for all clean.
1794 1.28 msaitoh ************************************************************************/
1795 1.1 msaitoh bool
1796 1.1 msaitoh ixgbe_rxeof(struct ix_queue *que)
1797 1.1 msaitoh {
1798 1.102 msaitoh struct ixgbe_softc *sc = que->sc;
1799 1.1 msaitoh struct rx_ring *rxr = que->rxr;
1800 1.102 msaitoh struct ifnet *ifp = sc->ifp;
1801 1.1 msaitoh #ifdef LRO
1802 1.1 msaitoh struct lro_ctrl *lro = &rxr->lro;
1803 1.1 msaitoh #endif /* LRO */
1804 1.28 msaitoh union ixgbe_adv_rx_desc *cur;
1805 1.28 msaitoh struct ixgbe_rx_buf *rbuf, *nbuf;
1806 1.1 msaitoh int i, nextp, processed = 0;
1807 1.1 msaitoh u32 staterr = 0;
1808 1.94 msaitoh u32 loopcount = 0, numdesc;
1809 1.102 msaitoh u32 limit = sc->rx_process_limit;
1810 1.102 msaitoh u32 rx_copy_len = sc->rx_copy_len;
1811 1.90 msaitoh bool discard_multidesc = rxr->discard_multidesc;
1812 1.94 msaitoh bool wraparound = false;
1813 1.94 msaitoh unsigned int syncremain;
1814 1.1 msaitoh #ifdef RSS
1815 1.1 msaitoh u16 pkt_info;
1816 1.1 msaitoh #endif
1817 1.1 msaitoh
1818 1.1 msaitoh IXGBE_RX_LOCK(rxr);
1819 1.1 msaitoh
1820 1.1 msaitoh #ifdef DEV_NETMAP
1821 1.102 msaitoh if (sc->feat_en & IXGBE_FEATURE_NETMAP) {
1822 1.28 msaitoh /* Same as the txeof routine: wakeup clients on intr. */
1823 1.28 msaitoh if (netmap_rx_irq(ifp, rxr->me, &processed)) {
1824 1.28 msaitoh IXGBE_RX_UNLOCK(rxr);
1825 1.28 msaitoh return (FALSE);
1826 1.28 msaitoh }
1827 1.1 msaitoh }
1828 1.1 msaitoh #endif /* DEV_NETMAP */
1829 1.1 msaitoh
1830 1.94 msaitoh /* Sync the ring. The size is rx_process_limit or the first half */
1831 1.94 msaitoh if ((rxr->next_to_check + limit) <= rxr->num_desc) {
1832 1.94 msaitoh /* Non-wraparound */
1833 1.94 msaitoh numdesc = limit;
1834 1.94 msaitoh syncremain = 0;
1835 1.94 msaitoh } else {
1836 1.94 msaitoh /* Wraparound. Sync the first half. */
1837 1.94 msaitoh numdesc = rxr->num_desc - rxr->next_to_check;
1838 1.94 msaitoh
1839 1.94 msaitoh /* Set the size of the last half */
1840 1.94 msaitoh syncremain = limit - numdesc;
1841 1.94 msaitoh }
1842 1.94 msaitoh bus_dmamap_sync(rxr->rxdma.dma_tag->dt_dmat,
1843 1.94 msaitoh rxr->rxdma.dma_map,
1844 1.94 msaitoh sizeof(union ixgbe_adv_rx_desc) * rxr->next_to_check,
1845 1.94 msaitoh sizeof(union ixgbe_adv_rx_desc) * numdesc,
1846 1.94 msaitoh BUS_DMASYNC_POSTREAD | BUS_DMASYNC_POSTWRITE);
1847 1.94 msaitoh
1848 1.65 msaitoh /*
1849 1.65 msaitoh * The max number of loop is rx_process_limit. If discard_multidesc is
1850 1.65 msaitoh * true, continue processing to not to send broken packet to the upper
1851 1.65 msaitoh * layer.
1852 1.65 msaitoh */
1853 1.65 msaitoh for (i = rxr->next_to_check;
1854 1.89 msaitoh (loopcount < limit) || (discard_multidesc == true);) {
1855 1.65 msaitoh
1856 1.28 msaitoh struct mbuf *sendmp, *mp;
1857 1.64 knakahar struct mbuf *newmp;
1858 1.28 msaitoh u32 rsc, ptype;
1859 1.28 msaitoh u16 len;
1860 1.28 msaitoh u16 vtag = 0;
1861 1.28 msaitoh bool eop;
1862 1.93 msaitoh bool discard = false;
1863 1.53 msaitoh
1864 1.94 msaitoh if (wraparound) {
1865 1.94 msaitoh /* Sync the last half. */
1866 1.94 msaitoh KASSERT(syncremain != 0);
1867 1.94 msaitoh numdesc = syncremain;
1868 1.94 msaitoh wraparound = false;
1869 1.94 msaitoh } else if (__predict_false(loopcount >= limit)) {
1870 1.94 msaitoh KASSERT(discard_multidesc == true);
1871 1.94 msaitoh numdesc = 1;
1872 1.94 msaitoh } else
1873 1.94 msaitoh numdesc = 0;
1874 1.94 msaitoh
1875 1.94 msaitoh if (numdesc != 0)
1876 1.94 msaitoh bus_dmamap_sync(rxr->rxdma.dma_tag->dt_dmat,
1877 1.94 msaitoh rxr->rxdma.dma_map, 0,
1878 1.94 msaitoh sizeof(union ixgbe_adv_rx_desc) * numdesc,
1879 1.94 msaitoh BUS_DMASYNC_POSTREAD | BUS_DMASYNC_POSTWRITE);
1880 1.1 msaitoh
1881 1.1 msaitoh cur = &rxr->rx_base[i];
1882 1.1 msaitoh staterr = le32toh(cur->wb.upper.status_error);
1883 1.1 msaitoh #ifdef RSS
1884 1.1 msaitoh pkt_info = le16toh(cur->wb.lower.lo_dword.hs_rss.pkt_info);
1885 1.1 msaitoh #endif
1886 1.1 msaitoh
1887 1.1 msaitoh if ((staterr & IXGBE_RXD_STAT_DD) == 0)
1888 1.1 msaitoh break;
1889 1.1 msaitoh
1890 1.89 msaitoh loopcount++;
1891 1.93 msaitoh sendmp = newmp = NULL;
1892 1.1 msaitoh nbuf = NULL;
1893 1.1 msaitoh rsc = 0;
1894 1.1 msaitoh cur->wb.upper.status_error = 0;
1895 1.1 msaitoh rbuf = &rxr->rx_buffers[i];
1896 1.1 msaitoh mp = rbuf->buf;
1897 1.1 msaitoh
1898 1.1 msaitoh len = le16toh(cur->wb.upper.length);
1899 1.1 msaitoh ptype = le32toh(cur->wb.lower.lo_dword.data) &
1900 1.1 msaitoh IXGBE_RXDADV_PKTTYPE_MASK;
1901 1.1 msaitoh eop = ((staterr & IXGBE_RXD_STAT_EOP) != 0);
1902 1.1 msaitoh
1903 1.1 msaitoh /* Make sure bad packets are discarded */
1904 1.1 msaitoh if (eop && (staterr & IXGBE_RXDADV_ERR_FRAME_ERR_MASK) != 0) {
1905 1.3 msaitoh #if __FreeBSD_version >= 1100036
1906 1.102 msaitoh if (sc->feat_en & IXGBE_FEATURE_VF)
1907 1.4 msaitoh if_inc_counter(ifp, IFCOUNTER_IERRORS, 1);
1908 1.3 msaitoh #endif
1909 1.95 msaitoh IXGBE_EVC_ADD(&rxr->rx_discarded, 1);
1910 1.1 msaitoh ixgbe_rx_discard(rxr, i);
1911 1.65 msaitoh discard_multidesc = false;
1912 1.1 msaitoh goto next_desc;
1913 1.1 msaitoh }
1914 1.1 msaitoh
1915 1.93 msaitoh if (__predict_false(discard_multidesc))
1916 1.93 msaitoh discard = true;
1917 1.93 msaitoh else {
1918 1.93 msaitoh /* Pre-alloc new mbuf. */
1919 1.93 msaitoh
1920 1.93 msaitoh if ((rbuf->fmp == NULL) &&
1921 1.97 msaitoh eop && (len <= rx_copy_len)) {
1922 1.93 msaitoh /* For short packet. See below. */
1923 1.93 msaitoh sendmp = m_gethdr(M_NOWAIT, MT_DATA);
1924 1.93 msaitoh if (__predict_false(sendmp == NULL)) {
1925 1.95 msaitoh IXGBE_EVC_ADD(&rxr->no_mbuf, 1);
1926 1.93 msaitoh discard = true;
1927 1.93 msaitoh }
1928 1.93 msaitoh } else {
1929 1.93 msaitoh /* For long packet. */
1930 1.93 msaitoh newmp = ixgbe_getcl();
1931 1.93 msaitoh if (__predict_false(newmp == NULL)) {
1932 1.95 msaitoh IXGBE_EVC_ADD(&rxr->no_mbuf, 1);
1933 1.93 msaitoh discard = true;
1934 1.93 msaitoh }
1935 1.93 msaitoh }
1936 1.93 msaitoh }
1937 1.92 msaitoh
1938 1.93 msaitoh if (__predict_false(discard)) {
1939 1.65 msaitoh /*
1940 1.65 msaitoh * Descriptor initialization is already done by the
1941 1.65 msaitoh * above code (cur->wb.upper.status_error = 0).
1942 1.65 msaitoh * So, we can reuse current rbuf->buf for new packet.
1943 1.65 msaitoh *
1944 1.65 msaitoh * Rewrite the buffer addr, see comment in
1945 1.65 msaitoh * ixgbe_rx_discard().
1946 1.65 msaitoh */
1947 1.65 msaitoh cur->read.pkt_addr = rbuf->addr;
1948 1.65 msaitoh m_freem(rbuf->fmp);
1949 1.65 msaitoh rbuf->fmp = NULL;
1950 1.65 msaitoh if (!eop) {
1951 1.65 msaitoh /* Discard the entire packet. */
1952 1.65 msaitoh discard_multidesc = true;
1953 1.65 msaitoh } else
1954 1.65 msaitoh discard_multidesc = false;
1955 1.64 knakahar goto next_desc;
1956 1.64 knakahar }
1957 1.65 msaitoh discard_multidesc = false;
1958 1.64 knakahar
1959 1.27 msaitoh bus_dmamap_sync(rxr->ptag->dt_dmat, rbuf->pmap, 0,
1960 1.27 msaitoh rbuf->buf->m_pkthdr.len, BUS_DMASYNC_POSTREAD);
1961 1.27 msaitoh
1962 1.1 msaitoh /*
1963 1.28 msaitoh * On 82599 which supports a hardware
1964 1.28 msaitoh * LRO (called HW RSC), packets need
1965 1.28 msaitoh * not be fragmented across sequential
1966 1.28 msaitoh * descriptors, rather the next descriptor
1967 1.28 msaitoh * is indicated in bits of the descriptor.
1968 1.99 andvar * This also means that we might process
1969 1.28 msaitoh * more than one packet at a time, something
1970 1.28 msaitoh * that has never been true before, it
1971 1.28 msaitoh * required eliminating global chain pointers
1972 1.28 msaitoh * in favor of what we are doing here. -jfv
1973 1.28 msaitoh */
1974 1.1 msaitoh if (!eop) {
1975 1.1 msaitoh /*
1976 1.28 msaitoh * Figure out the next descriptor
1977 1.28 msaitoh * of this frame.
1978 1.28 msaitoh */
1979 1.1 msaitoh if (rxr->hw_rsc == TRUE) {
1980 1.1 msaitoh rsc = ixgbe_rsc_count(cur);
1981 1.1 msaitoh rxr->rsc_num += (rsc - 1);
1982 1.1 msaitoh }
1983 1.1 msaitoh if (rsc) { /* Get hardware index */
1984 1.28 msaitoh nextp = ((staterr & IXGBE_RXDADV_NEXTP_MASK) >>
1985 1.1 msaitoh IXGBE_RXDADV_NEXTP_SHIFT);
1986 1.1 msaitoh } else { /* Just sequential */
1987 1.1 msaitoh nextp = i + 1;
1988 1.102 msaitoh if (nextp == sc->num_rx_desc)
1989 1.1 msaitoh nextp = 0;
1990 1.1 msaitoh }
1991 1.1 msaitoh nbuf = &rxr->rx_buffers[nextp];
1992 1.1 msaitoh prefetch(nbuf);
1993 1.1 msaitoh }
1994 1.1 msaitoh /*
1995 1.28 msaitoh * Rather than using the fmp/lmp global pointers
1996 1.28 msaitoh * we now keep the head of a packet chain in the
1997 1.28 msaitoh * buffer struct and pass this along from one
1998 1.28 msaitoh * descriptor to the next, until we get EOP.
1999 1.28 msaitoh */
2000 1.1 msaitoh /*
2001 1.28 msaitoh * See if there is a stored head
2002 1.28 msaitoh * that determines what we are
2003 1.28 msaitoh */
2004 1.93 msaitoh if (rbuf->fmp != NULL) {
2005 1.93 msaitoh /* Secondary frag */
2006 1.93 msaitoh sendmp = rbuf->fmp;
2007 1.93 msaitoh
2008 1.86 msaitoh /* Update new (used in future) mbuf */
2009 1.86 msaitoh newmp->m_pkthdr.len = newmp->m_len = rxr->mbuf_sz;
2010 1.102 msaitoh IXGBE_M_ADJ(sc, rxr, newmp);
2011 1.64 knakahar rbuf->buf = newmp;
2012 1.64 knakahar rbuf->fmp = NULL;
2013 1.86 msaitoh
2014 1.86 msaitoh /* For secondary frag */
2015 1.74 msaitoh mp->m_len = len;
2016 1.1 msaitoh mp->m_flags &= ~M_PKTHDR;
2017 1.86 msaitoh
2018 1.86 msaitoh /* For sendmp */
2019 1.1 msaitoh sendmp->m_pkthdr.len += mp->m_len;
2020 1.1 msaitoh } else {
2021 1.1 msaitoh /*
2022 1.86 msaitoh * It's the first segment of a multi descriptor
2023 1.86 msaitoh * packet or a single segment which contains a full
2024 1.86 msaitoh * packet.
2025 1.86 msaitoh */
2026 1.86 msaitoh
2027 1.97 msaitoh if (eop && (len <= rx_copy_len)) {
2028 1.93 msaitoh /*
2029 1.93 msaitoh * Optimize. This might be a small packet, may
2030 1.93 msaitoh * be just a TCP ACK. Copy into a new mbuf, and
2031 1.93 msaitoh * Leave the old mbuf+cluster for re-use.
2032 1.93 msaitoh */
2033 1.93 msaitoh sendmp->m_data += ETHER_ALIGN;
2034 1.93 msaitoh memcpy(mtod(sendmp, void *),
2035 1.93 msaitoh mtod(mp, void *), len);
2036 1.95 msaitoh IXGBE_EVC_ADD(&rxr->rx_copies, 1);
2037 1.93 msaitoh rbuf->flags |= IXGBE_RX_COPY;
2038 1.93 msaitoh } else {
2039 1.96 msaitoh /* For long packet */
2040 1.86 msaitoh
2041 1.86 msaitoh /* Update new (used in future) mbuf */
2042 1.86 msaitoh newmp->m_pkthdr.len = newmp->m_len
2043 1.86 msaitoh = rxr->mbuf_sz;
2044 1.102 msaitoh IXGBE_M_ADJ(sc, rxr, newmp);
2045 1.64 knakahar rbuf->buf = newmp;
2046 1.64 knakahar rbuf->fmp = NULL;
2047 1.86 msaitoh
2048 1.86 msaitoh /* For sendmp */
2049 1.1 msaitoh sendmp = mp;
2050 1.1 msaitoh }
2051 1.1 msaitoh
2052 1.1 msaitoh /* first desc of a non-ps chain */
2053 1.86 msaitoh sendmp->m_pkthdr.len = sendmp->m_len = len;
2054 1.1 msaitoh }
2055 1.1 msaitoh ++processed;
2056 1.1 msaitoh
2057 1.1 msaitoh /* Pass the head pointer on */
2058 1.1 msaitoh if (eop == 0) {
2059 1.1 msaitoh nbuf->fmp = sendmp;
2060 1.1 msaitoh sendmp = NULL;
2061 1.1 msaitoh mp->m_next = nbuf->buf;
2062 1.1 msaitoh } else { /* Sending this frame */
2063 1.1 msaitoh m_set_rcvif(sendmp, ifp);
2064 1.31 msaitoh ++rxr->packets;
2065 1.95 msaitoh IXGBE_EVC_ADD(&rxr->rx_packets, 1);
2066 1.1 msaitoh /* capture data for AIM */
2067 1.1 msaitoh rxr->bytes += sendmp->m_pkthdr.len;
2068 1.95 msaitoh IXGBE_EVC_ADD(&rxr->rx_bytes, sendmp->m_pkthdr.len);
2069 1.1 msaitoh /* Process vlan info */
2070 1.28 msaitoh if ((rxr->vtag_strip) && (staterr & IXGBE_RXD_STAT_VP))
2071 1.1 msaitoh vtag = le16toh(cur->wb.upper.vlan);
2072 1.1 msaitoh if (vtag) {
2073 1.29 knakahar vlan_set_tag(sendmp, vtag);
2074 1.1 msaitoh }
2075 1.1 msaitoh if ((ifp->if_capenable & IFCAP_RXCSUM) != 0) {
2076 1.1 msaitoh ixgbe_rx_checksum(staterr, sendmp, ptype,
2077 1.102 msaitoh &sc->stats.pf);
2078 1.1 msaitoh }
2079 1.8 msaitoh
2080 1.6 msaitoh #if 0 /* FreeBSD */
2081 1.28 msaitoh /*
2082 1.28 msaitoh * In case of multiqueue, we have RXCSUM.PCSD bit set
2083 1.28 msaitoh * and never cleared. This means we have RSS hash
2084 1.28 msaitoh * available to be used.
2085 1.28 msaitoh */
2086 1.102 msaitoh if (sc->num_queues > 1) {
2087 1.28 msaitoh sendmp->m_pkthdr.flowid =
2088 1.28 msaitoh le32toh(cur->wb.lower.hi_dword.rss);
2089 1.44 msaitoh switch (pkt_info & IXGBE_RXDADV_RSSTYPE_MASK) {
2090 1.44 msaitoh case IXGBE_RXDADV_RSSTYPE_IPV4:
2091 1.28 msaitoh M_HASHTYPE_SET(sendmp,
2092 1.28 msaitoh M_HASHTYPE_RSS_IPV4);
2093 1.28 msaitoh break;
2094 1.44 msaitoh case IXGBE_RXDADV_RSSTYPE_IPV4_TCP:
2095 1.28 msaitoh M_HASHTYPE_SET(sendmp,
2096 1.28 msaitoh M_HASHTYPE_RSS_TCP_IPV4);
2097 1.28 msaitoh break;
2098 1.44 msaitoh case IXGBE_RXDADV_RSSTYPE_IPV6:
2099 1.28 msaitoh M_HASHTYPE_SET(sendmp,
2100 1.28 msaitoh M_HASHTYPE_RSS_IPV6);
2101 1.28 msaitoh break;
2102 1.44 msaitoh case IXGBE_RXDADV_RSSTYPE_IPV6_TCP:
2103 1.28 msaitoh M_HASHTYPE_SET(sendmp,
2104 1.28 msaitoh M_HASHTYPE_RSS_TCP_IPV6);
2105 1.28 msaitoh break;
2106 1.44 msaitoh case IXGBE_RXDADV_RSSTYPE_IPV6_EX:
2107 1.28 msaitoh M_HASHTYPE_SET(sendmp,
2108 1.28 msaitoh M_HASHTYPE_RSS_IPV6_EX);
2109 1.28 msaitoh break;
2110 1.44 msaitoh case IXGBE_RXDADV_RSSTYPE_IPV6_TCP_EX:
2111 1.28 msaitoh M_HASHTYPE_SET(sendmp,
2112 1.28 msaitoh M_HASHTYPE_RSS_TCP_IPV6_EX);
2113 1.28 msaitoh break;
2114 1.6 msaitoh #if __FreeBSD_version > 1100000
2115 1.44 msaitoh case IXGBE_RXDADV_RSSTYPE_IPV4_UDP:
2116 1.28 msaitoh M_HASHTYPE_SET(sendmp,
2117 1.28 msaitoh M_HASHTYPE_RSS_UDP_IPV4);
2118 1.28 msaitoh break;
2119 1.44 msaitoh case IXGBE_RXDADV_RSSTYPE_IPV6_UDP:
2120 1.28 msaitoh M_HASHTYPE_SET(sendmp,
2121 1.28 msaitoh M_HASHTYPE_RSS_UDP_IPV6);
2122 1.28 msaitoh break;
2123 1.44 msaitoh case IXGBE_RXDADV_RSSTYPE_IPV6_UDP_EX:
2124 1.28 msaitoh M_HASHTYPE_SET(sendmp,
2125 1.28 msaitoh M_HASHTYPE_RSS_UDP_IPV6_EX);
2126 1.28 msaitoh break;
2127 1.28 msaitoh #endif
2128 1.44 msaitoh default:
2129 1.28 msaitoh M_HASHTYPE_SET(sendmp,
2130 1.28 msaitoh M_HASHTYPE_OPAQUE_HASH);
2131 1.28 msaitoh }
2132 1.28 msaitoh } else {
2133 1.28 msaitoh sendmp->m_pkthdr.flowid = que->msix;
2134 1.1 msaitoh M_HASHTYPE_SET(sendmp, M_HASHTYPE_OPAQUE);
2135 1.1 msaitoh }
2136 1.8 msaitoh #endif
2137 1.1 msaitoh }
2138 1.1 msaitoh next_desc:
2139 1.1 msaitoh ixgbe_dmamap_sync(rxr->rxdma.dma_tag, rxr->rxdma.dma_map,
2140 1.1 msaitoh BUS_DMASYNC_PREREAD | BUS_DMASYNC_PREWRITE);
2141 1.1 msaitoh
2142 1.1 msaitoh /* Advance our pointers to the next descriptor. */
2143 1.94 msaitoh if (++i == rxr->num_desc) {
2144 1.94 msaitoh wraparound = true;
2145 1.1 msaitoh i = 0;
2146 1.94 msaitoh }
2147 1.82 msaitoh rxr->next_to_check = i;
2148 1.1 msaitoh
2149 1.1 msaitoh /* Now send to the stack or do LRO */
2150 1.85 msaitoh if (sendmp != NULL)
2151 1.1 msaitoh ixgbe_rx_input(rxr, ifp, sendmp, ptype);
2152 1.1 msaitoh
2153 1.28 msaitoh /* Every 8 descriptors we go to refresh mbufs */
2154 1.1 msaitoh if (processed == 8) {
2155 1.1 msaitoh ixgbe_refresh_mbufs(rxr, i);
2156 1.1 msaitoh processed = 0;
2157 1.1 msaitoh }
2158 1.1 msaitoh }
2159 1.1 msaitoh
2160 1.90 msaitoh /* Save the current status */
2161 1.90 msaitoh rxr->discard_multidesc = discard_multidesc;
2162 1.90 msaitoh
2163 1.1 msaitoh /* Refresh any remaining buf structs */
2164 1.1 msaitoh if (ixgbe_rx_unrefreshed(rxr))
2165 1.1 msaitoh ixgbe_refresh_mbufs(rxr, i);
2166 1.1 msaitoh
2167 1.28 msaitoh IXGBE_RX_UNLOCK(rxr);
2168 1.28 msaitoh
2169 1.1 msaitoh #ifdef LRO
2170 1.1 msaitoh /*
2171 1.1 msaitoh * Flush any outstanding LRO work
2172 1.1 msaitoh */
2173 1.10 msaitoh tcp_lro_flush_all(lro);
2174 1.1 msaitoh #endif /* LRO */
2175 1.1 msaitoh
2176 1.1 msaitoh /*
2177 1.28 msaitoh * Still have cleaning to do?
2178 1.28 msaitoh */
2179 1.1 msaitoh if ((staterr & IXGBE_RXD_STAT_DD) != 0)
2180 1.28 msaitoh return (TRUE);
2181 1.28 msaitoh
2182 1.28 msaitoh return (FALSE);
2183 1.28 msaitoh } /* ixgbe_rxeof */
2184 1.1 msaitoh
2185 1.1 msaitoh
2186 1.28 msaitoh /************************************************************************
2187 1.28 msaitoh * ixgbe_rx_checksum
2188 1.1 msaitoh *
2189 1.28 msaitoh * Verify that the hardware indicated that the checksum is valid.
2190 1.28 msaitoh * Inform the stack about the status of checksum so that stack
2191 1.28 msaitoh * doesn't spend time verifying the checksum.
2192 1.28 msaitoh ************************************************************************/
2193 1.1 msaitoh static void
2194 1.1 msaitoh ixgbe_rx_checksum(u32 staterr, struct mbuf * mp, u32 ptype,
2195 1.1 msaitoh struct ixgbe_hw_stats *stats)
2196 1.1 msaitoh {
2197 1.28 msaitoh u16 status = (u16)staterr;
2198 1.28 msaitoh u8 errors = (u8)(staterr >> 24);
2199 1.1 msaitoh #if 0
2200 1.28 msaitoh bool sctp = false;
2201 1.1 msaitoh
2202 1.1 msaitoh if ((ptype & IXGBE_RXDADV_PKTTYPE_ETQF) == 0 &&
2203 1.1 msaitoh (ptype & IXGBE_RXDADV_PKTTYPE_SCTP) != 0)
2204 1.8 msaitoh sctp = true;
2205 1.1 msaitoh #endif
2206 1.1 msaitoh
2207 1.8 msaitoh /* IPv4 checksum */
2208 1.1 msaitoh if (status & IXGBE_RXD_STAT_IPCS) {
2209 1.95 msaitoh IXGBE_EVC_ADD(&stats->ipcs, 1);
2210 1.1 msaitoh if (!(errors & IXGBE_RXD_ERR_IPE)) {
2211 1.1 msaitoh /* IP Checksum Good */
2212 1.1 msaitoh mp->m_pkthdr.csum_flags = M_CSUM_IPv4;
2213 1.1 msaitoh } else {
2214 1.95 msaitoh IXGBE_EVC_ADD(&stats->ipcs_bad, 1);
2215 1.1 msaitoh mp->m_pkthdr.csum_flags = M_CSUM_IPv4|M_CSUM_IPv4_BAD;
2216 1.1 msaitoh }
2217 1.1 msaitoh }
2218 1.8 msaitoh /* TCP/UDP/SCTP checksum */
2219 1.1 msaitoh if (status & IXGBE_RXD_STAT_L4CS) {
2220 1.95 msaitoh IXGBE_EVC_ADD(&stats->l4cs, 1);
2221 1.1 msaitoh int type = M_CSUM_TCPv4|M_CSUM_TCPv6|M_CSUM_UDPv4|M_CSUM_UDPv6;
2222 1.1 msaitoh if (!(errors & IXGBE_RXD_ERR_TCPE)) {
2223 1.1 msaitoh mp->m_pkthdr.csum_flags |= type;
2224 1.1 msaitoh } else {
2225 1.95 msaitoh IXGBE_EVC_ADD(&stats->l4cs_bad, 1);
2226 1.1 msaitoh mp->m_pkthdr.csum_flags |= type | M_CSUM_TCP_UDP_BAD;
2227 1.1 msaitoh }
2228 1.1 msaitoh }
2229 1.28 msaitoh } /* ixgbe_rx_checksum */
2230 1.1 msaitoh
2231 1.28 msaitoh /************************************************************************
2232 1.28 msaitoh * ixgbe_dma_malloc
2233 1.28 msaitoh ************************************************************************/
2234 1.1 msaitoh int
2235 1.102 msaitoh ixgbe_dma_malloc(struct ixgbe_softc *sc, const bus_size_t size,
2236 1.1 msaitoh struct ixgbe_dma_alloc *dma, const int mapflags)
2237 1.1 msaitoh {
2238 1.102 msaitoh device_t dev = sc->dev;
2239 1.28 msaitoh int r, rsegs;
2240 1.1 msaitoh
2241 1.28 msaitoh r = ixgbe_dma_tag_create(
2242 1.102 msaitoh /* parent */ sc->osdep.dmat,
2243 1.28 msaitoh /* alignment */ DBA_ALIGN,
2244 1.28 msaitoh /* bounds */ 0,
2245 1.28 msaitoh /* maxsize */ size,
2246 1.28 msaitoh /* nsegments */ 1,
2247 1.28 msaitoh /* maxsegsize */ size,
2248 1.28 msaitoh /* flags */ BUS_DMA_ALLOCNOW,
2249 1.1 msaitoh &dma->dma_tag);
2250 1.1 msaitoh if (r != 0) {
2251 1.1 msaitoh aprint_error_dev(dev,
2252 1.44 msaitoh "%s: ixgbe_dma_tag_create failed; error %d\n", __func__,
2253 1.44 msaitoh r);
2254 1.1 msaitoh goto fail_0;
2255 1.1 msaitoh }
2256 1.1 msaitoh
2257 1.28 msaitoh r = bus_dmamem_alloc(dma->dma_tag->dt_dmat, size,
2258 1.28 msaitoh dma->dma_tag->dt_alignment, dma->dma_tag->dt_boundary,
2259 1.28 msaitoh &dma->dma_seg, 1, &rsegs, BUS_DMA_NOWAIT);
2260 1.1 msaitoh if (r != 0) {
2261 1.1 msaitoh aprint_error_dev(dev,
2262 1.1 msaitoh "%s: bus_dmamem_alloc failed; error %d\n", __func__, r);
2263 1.1 msaitoh goto fail_1;
2264 1.1 msaitoh }
2265 1.1 msaitoh
2266 1.1 msaitoh r = bus_dmamem_map(dma->dma_tag->dt_dmat, &dma->dma_seg, rsegs,
2267 1.76 ryo size, &dma->dma_vaddr, BUS_DMA_NOWAIT | BUS_DMA_COHERENT);
2268 1.1 msaitoh if (r != 0) {
2269 1.1 msaitoh aprint_error_dev(dev, "%s: bus_dmamem_map failed; error %d\n",
2270 1.1 msaitoh __func__, r);
2271 1.1 msaitoh goto fail_2;
2272 1.1 msaitoh }
2273 1.1 msaitoh
2274 1.1 msaitoh r = ixgbe_dmamap_create(dma->dma_tag, 0, &dma->dma_map);
2275 1.1 msaitoh if (r != 0) {
2276 1.1 msaitoh aprint_error_dev(dev, "%s: bus_dmamem_map failed; error %d\n",
2277 1.1 msaitoh __func__, r);
2278 1.1 msaitoh goto fail_3;
2279 1.1 msaitoh }
2280 1.1 msaitoh
2281 1.28 msaitoh r = bus_dmamap_load(dma->dma_tag->dt_dmat, dma->dma_map,
2282 1.28 msaitoh dma->dma_vaddr, size, NULL, mapflags | BUS_DMA_NOWAIT);
2283 1.1 msaitoh if (r != 0) {
2284 1.1 msaitoh aprint_error_dev(dev, "%s: bus_dmamap_load failed; error %d\n",
2285 1.1 msaitoh __func__, r);
2286 1.1 msaitoh goto fail_4;
2287 1.1 msaitoh }
2288 1.1 msaitoh dma->dma_paddr = dma->dma_map->dm_segs[0].ds_addr;
2289 1.1 msaitoh dma->dma_size = size;
2290 1.1 msaitoh return 0;
2291 1.1 msaitoh fail_4:
2292 1.1 msaitoh ixgbe_dmamap_destroy(dma->dma_tag, dma->dma_map);
2293 1.1 msaitoh fail_3:
2294 1.1 msaitoh bus_dmamem_unmap(dma->dma_tag->dt_dmat, dma->dma_vaddr, size);
2295 1.1 msaitoh fail_2:
2296 1.1 msaitoh bus_dmamem_free(dma->dma_tag->dt_dmat, &dma->dma_seg, rsegs);
2297 1.1 msaitoh fail_1:
2298 1.1 msaitoh ixgbe_dma_tag_destroy(dma->dma_tag);
2299 1.1 msaitoh fail_0:
2300 1.1 msaitoh
2301 1.28 msaitoh return (r);
2302 1.28 msaitoh } /* ixgbe_dma_malloc */
2303 1.28 msaitoh
2304 1.28 msaitoh /************************************************************************
2305 1.28 msaitoh * ixgbe_dma_free
2306 1.28 msaitoh ************************************************************************/
2307 1.3 msaitoh void
2308 1.102 msaitoh ixgbe_dma_free(struct ixgbe_softc *sc, struct ixgbe_dma_alloc *dma)
2309 1.1 msaitoh {
2310 1.1 msaitoh bus_dmamap_sync(dma->dma_tag->dt_dmat, dma->dma_map, 0, dma->dma_size,
2311 1.1 msaitoh BUS_DMASYNC_POSTREAD | BUS_DMASYNC_POSTWRITE);
2312 1.1 msaitoh ixgbe_dmamap_unload(dma->dma_tag, dma->dma_map);
2313 1.98 bouyer bus_dmamem_unmap(dma->dma_tag->dt_dmat, dma->dma_vaddr, dma->dma_size);
2314 1.1 msaitoh bus_dmamem_free(dma->dma_tag->dt_dmat, &dma->dma_seg, 1);
2315 1.1 msaitoh ixgbe_dma_tag_destroy(dma->dma_tag);
2316 1.28 msaitoh } /* ixgbe_dma_free */
2317 1.1 msaitoh
2318 1.1 msaitoh
2319 1.28 msaitoh /************************************************************************
2320 1.28 msaitoh * ixgbe_allocate_queues
2321 1.1 msaitoh *
2322 1.28 msaitoh * Allocate memory for the transmit and receive rings, and then
2323 1.28 msaitoh * the descriptors associated with each, called only once at attach.
2324 1.28 msaitoh ************************************************************************/
2325 1.1 msaitoh int
2326 1.102 msaitoh ixgbe_allocate_queues(struct ixgbe_softc *sc)
2327 1.1 msaitoh {
2328 1.102 msaitoh device_t dev = sc->dev;
2329 1.1 msaitoh struct ix_queue *que;
2330 1.1 msaitoh struct tx_ring *txr;
2331 1.1 msaitoh struct rx_ring *rxr;
2332 1.28 msaitoh int rsize, tsize, error = IXGBE_SUCCESS;
2333 1.28 msaitoh int txconf = 0, rxconf = 0;
2334 1.1 msaitoh
2335 1.28 msaitoh /* First, allocate the top level queue structs */
2336 1.102 msaitoh sc->queues = (struct ix_queue *)malloc(sizeof(struct ix_queue) *
2337 1.102 msaitoh sc->num_queues, M_DEVBUF, M_WAITOK | M_ZERO);
2338 1.1 msaitoh
2339 1.28 msaitoh /* Second, allocate the TX ring struct memory */
2340 1.102 msaitoh sc->tx_rings = malloc(sizeof(struct tx_ring) *
2341 1.102 msaitoh sc->num_queues, M_DEVBUF, M_WAITOK | M_ZERO);
2342 1.1 msaitoh
2343 1.28 msaitoh /* Third, allocate the RX ring */
2344 1.102 msaitoh sc->rx_rings = (struct rx_ring *)malloc(sizeof(struct rx_ring) *
2345 1.102 msaitoh sc->num_queues, M_DEVBUF, M_WAITOK | M_ZERO);
2346 1.1 msaitoh
2347 1.1 msaitoh /* For the ring itself */
2348 1.102 msaitoh tsize = roundup2(sc->num_tx_desc * sizeof(union ixgbe_adv_tx_desc),
2349 1.28 msaitoh DBA_ALIGN);
2350 1.1 msaitoh
2351 1.1 msaitoh /*
2352 1.1 msaitoh * Now set up the TX queues, txconf is needed to handle the
2353 1.1 msaitoh * possibility that things fail midcourse and we need to
2354 1.1 msaitoh * undo memory gracefully
2355 1.28 msaitoh */
2356 1.102 msaitoh for (int i = 0; i < sc->num_queues; i++, txconf++) {
2357 1.1 msaitoh /* Set up some basics */
2358 1.102 msaitoh txr = &sc->tx_rings[i];
2359 1.102 msaitoh txr->sc = sc;
2360 1.28 msaitoh txr->txr_interq = NULL;
2361 1.28 msaitoh /* In case SR-IOV is enabled, align the index properly */
2362 1.5 msaitoh #ifdef PCI_IOV
2363 1.102 msaitoh txr->me = ixgbe_vf_que_index(sc->iov_mode, sc->pool,
2364 1.28 msaitoh i);
2365 1.5 msaitoh #else
2366 1.1 msaitoh txr->me = i;
2367 1.5 msaitoh #endif
2368 1.102 msaitoh txr->num_desc = sc->num_tx_desc;
2369 1.1 msaitoh
2370 1.1 msaitoh /* Initialize the TX side lock */
2371 1.1 msaitoh mutex_init(&txr->tx_mtx, MUTEX_DEFAULT, IPL_NET);
2372 1.1 msaitoh
2373 1.102 msaitoh if (ixgbe_dma_malloc(sc, tsize, &txr->txdma,
2374 1.28 msaitoh BUS_DMA_NOWAIT)) {
2375 1.1 msaitoh aprint_error_dev(dev,
2376 1.1 msaitoh "Unable to allocate TX Descriptor memory\n");
2377 1.1 msaitoh error = ENOMEM;
2378 1.1 msaitoh goto err_tx_desc;
2379 1.1 msaitoh }
2380 1.1 msaitoh txr->tx_base = (union ixgbe_adv_tx_desc *)txr->txdma.dma_vaddr;
2381 1.1 msaitoh bzero((void *)txr->tx_base, tsize);
2382 1.1 msaitoh
2383 1.28 msaitoh /* Now allocate transmit buffers for the ring */
2384 1.28 msaitoh if (ixgbe_allocate_transmit_buffers(txr)) {
2385 1.1 msaitoh aprint_error_dev(dev,
2386 1.1 msaitoh "Critical Failure setting up transmit buffers\n");
2387 1.1 msaitoh error = ENOMEM;
2388 1.1 msaitoh goto err_tx_desc;
2389 1.63 msaitoh }
2390 1.102 msaitoh if (!(sc->feat_en & IXGBE_FEATURE_LEGACY_TX)) {
2391 1.28 msaitoh /* Allocate a buf ring */
2392 1.28 msaitoh txr->txr_interq = pcq_create(IXGBE_BR_SIZE, KM_SLEEP);
2393 1.28 msaitoh if (txr->txr_interq == NULL) {
2394 1.28 msaitoh aprint_error_dev(dev,
2395 1.28 msaitoh "Critical Failure setting up buf ring\n");
2396 1.28 msaitoh error = ENOMEM;
2397 1.28 msaitoh goto err_tx_desc;
2398 1.28 msaitoh }
2399 1.28 msaitoh }
2400 1.1 msaitoh }
2401 1.1 msaitoh
2402 1.1 msaitoh /*
2403 1.1 msaitoh * Next the RX queues...
2404 1.53 msaitoh */
2405 1.102 msaitoh rsize = roundup2(sc->num_rx_desc * sizeof(union ixgbe_adv_rx_desc),
2406 1.28 msaitoh DBA_ALIGN);
2407 1.102 msaitoh for (int i = 0; i < sc->num_queues; i++, rxconf++) {
2408 1.102 msaitoh rxr = &sc->rx_rings[i];
2409 1.1 msaitoh /* Set up some basics */
2410 1.102 msaitoh rxr->sc = sc;
2411 1.5 msaitoh #ifdef PCI_IOV
2412 1.28 msaitoh /* In case SR-IOV is enabled, align the index properly */
2413 1.102 msaitoh rxr->me = ixgbe_vf_que_index(sc->iov_mode, sc->pool,
2414 1.28 msaitoh i);
2415 1.5 msaitoh #else
2416 1.1 msaitoh rxr->me = i;
2417 1.5 msaitoh #endif
2418 1.102 msaitoh rxr->num_desc = sc->num_rx_desc;
2419 1.1 msaitoh
2420 1.1 msaitoh /* Initialize the RX side lock */
2421 1.1 msaitoh mutex_init(&rxr->rx_mtx, MUTEX_DEFAULT, IPL_NET);
2422 1.1 msaitoh
2423 1.102 msaitoh if (ixgbe_dma_malloc(sc, rsize, &rxr->rxdma,
2424 1.28 msaitoh BUS_DMA_NOWAIT)) {
2425 1.1 msaitoh aprint_error_dev(dev,
2426 1.1 msaitoh "Unable to allocate RxDescriptor memory\n");
2427 1.1 msaitoh error = ENOMEM;
2428 1.1 msaitoh goto err_rx_desc;
2429 1.1 msaitoh }
2430 1.1 msaitoh rxr->rx_base = (union ixgbe_adv_rx_desc *)rxr->rxdma.dma_vaddr;
2431 1.1 msaitoh bzero((void *)rxr->rx_base, rsize);
2432 1.1 msaitoh
2433 1.28 msaitoh /* Allocate receive buffers for the ring */
2434 1.1 msaitoh if (ixgbe_allocate_receive_buffers(rxr)) {
2435 1.1 msaitoh aprint_error_dev(dev,
2436 1.1 msaitoh "Critical Failure setting up receive buffers\n");
2437 1.1 msaitoh error = ENOMEM;
2438 1.1 msaitoh goto err_rx_desc;
2439 1.1 msaitoh }
2440 1.1 msaitoh }
2441 1.1 msaitoh
2442 1.1 msaitoh /*
2443 1.28 msaitoh * Finally set up the queue holding structs
2444 1.28 msaitoh */
2445 1.102 msaitoh for (int i = 0; i < sc->num_queues; i++) {
2446 1.102 msaitoh que = &sc->queues[i];
2447 1.102 msaitoh que->sc = sc;
2448 1.3 msaitoh que->me = i;
2449 1.102 msaitoh que->txr = &sc->tx_rings[i];
2450 1.102 msaitoh que->rxr = &sc->rx_rings[i];
2451 1.33 knakahar
2452 1.37 knakahar mutex_init(&que->dc_mtx, MUTEX_DEFAULT, IPL_NET);
2453 1.37 knakahar que->disabled_count = 0;
2454 1.1 msaitoh }
2455 1.1 msaitoh
2456 1.1 msaitoh return (0);
2457 1.1 msaitoh
2458 1.1 msaitoh err_rx_desc:
2459 1.102 msaitoh for (rxr = sc->rx_rings; rxconf > 0; rxr++, rxconf--)
2460 1.102 msaitoh ixgbe_dma_free(sc, &rxr->rxdma);
2461 1.1 msaitoh err_tx_desc:
2462 1.102 msaitoh for (txr = sc->tx_rings; txconf > 0; txr++, txconf--)
2463 1.102 msaitoh ixgbe_dma_free(sc, &txr->txdma);
2464 1.102 msaitoh free(sc->rx_rings, M_DEVBUF);
2465 1.102 msaitoh free(sc->tx_rings, M_DEVBUF);
2466 1.102 msaitoh free(sc->queues, M_DEVBUF);
2467 1.1 msaitoh return (error);
2468 1.28 msaitoh } /* ixgbe_allocate_queues */
2469 1.60 msaitoh
2470 1.60 msaitoh /************************************************************************
2471 1.60 msaitoh * ixgbe_free_queues
2472 1.60 msaitoh *
2473 1.60 msaitoh * Free descriptors for the transmit and receive rings, and then
2474 1.60 msaitoh * the memory associated with each.
2475 1.60 msaitoh ************************************************************************/
2476 1.60 msaitoh void
2477 1.102 msaitoh ixgbe_free_queues(struct ixgbe_softc *sc)
2478 1.60 msaitoh {
2479 1.60 msaitoh struct ix_queue *que;
2480 1.60 msaitoh int i;
2481 1.60 msaitoh
2482 1.102 msaitoh ixgbe_free_transmit_structures(sc);
2483 1.102 msaitoh ixgbe_free_receive_structures(sc);
2484 1.102 msaitoh for (i = 0; i < sc->num_queues; i++) {
2485 1.102 msaitoh que = &sc->queues[i];
2486 1.60 msaitoh mutex_destroy(&que->dc_mtx);
2487 1.60 msaitoh }
2488 1.102 msaitoh free(sc->queues, M_DEVBUF);
2489 1.60 msaitoh } /* ixgbe_free_queues */
2490