ixgbe.c revision 1.14.2.5 1 1.1 dyoung /******************************************************************************
2 1.1 dyoung
3 1.14.2.5 riz Copyright (c) 2001-2013, Intel Corporation
4 1.1 dyoung All rights reserved.
5 1.1 dyoung
6 1.1 dyoung Redistribution and use in source and binary forms, with or without
7 1.1 dyoung modification, are permitted provided that the following conditions are met:
8 1.1 dyoung
9 1.1 dyoung 1. Redistributions of source code must retain the above copyright notice,
10 1.1 dyoung this list of conditions and the following disclaimer.
11 1.1 dyoung
12 1.1 dyoung 2. Redistributions in binary form must reproduce the above copyright
13 1.1 dyoung notice, this list of conditions and the following disclaimer in the
14 1.1 dyoung documentation and/or other materials provided with the distribution.
15 1.1 dyoung
16 1.1 dyoung 3. Neither the name of the Intel Corporation nor the names of its
17 1.1 dyoung contributors may be used to endorse or promote products derived from
18 1.1 dyoung this software without specific prior written permission.
19 1.1 dyoung
20 1.1 dyoung THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
21 1.1 dyoung AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
22 1.1 dyoung IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
23 1.1 dyoung ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
24 1.1 dyoung LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
25 1.1 dyoung CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
26 1.1 dyoung SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
27 1.1 dyoung INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
28 1.1 dyoung CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
29 1.1 dyoung ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
30 1.1 dyoung POSSIBILITY OF SUCH DAMAGE.
31 1.1 dyoung
32 1.1 dyoung ******************************************************************************/
33 1.1 dyoung /*
34 1.1 dyoung * Copyright (c) 2011 The NetBSD Foundation, Inc.
35 1.1 dyoung * All rights reserved.
36 1.1 dyoung *
37 1.1 dyoung * This code is derived from software contributed to The NetBSD Foundation
38 1.1 dyoung * by Coyote Point Systems, Inc.
39 1.1 dyoung *
40 1.1 dyoung * Redistribution and use in source and binary forms, with or without
41 1.1 dyoung * modification, are permitted provided that the following conditions
42 1.1 dyoung * are met:
43 1.1 dyoung * 1. Redistributions of source code must retain the above copyright
44 1.1 dyoung * notice, this list of conditions and the following disclaimer.
45 1.1 dyoung * 2. Redistributions in binary form must reproduce the above copyright
46 1.1 dyoung * notice, this list of conditions and the following disclaimer in the
47 1.1 dyoung * documentation and/or other materials provided with the distribution.
48 1.1 dyoung *
49 1.1 dyoung * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
50 1.1 dyoung * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
51 1.1 dyoung * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
52 1.1 dyoung * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
53 1.1 dyoung * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
54 1.1 dyoung * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
55 1.1 dyoung * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
56 1.1 dyoung * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
57 1.1 dyoung * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
58 1.1 dyoung * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
59 1.1 dyoung * POSSIBILITY OF SUCH DAMAGE.
60 1.1 dyoung */
61 1.14.2.5 riz /*$FreeBSD: head/sys/dev/ixgbe/ixgbe.c 250108 2013-04-30 16:18:29Z luigi $*/
62 1.14.2.5 riz /*$NetBSD: ixgbe.c,v 1.14.2.5 2015/05/06 23:29:21 riz Exp $*/
63 1.1 dyoung
64 1.1 dyoung #include "opt_inet.h"
65 1.14.2.3 martin #include "opt_inet6.h"
66 1.1 dyoung
67 1.1 dyoung #include "ixgbe.h"
68 1.14.2.5 riz #include "vlan.h"
69 1.1 dyoung
70 1.1 dyoung /*********************************************************************
71 1.1 dyoung * Set this to one to display debug statistics
72 1.1 dyoung *********************************************************************/
73 1.1 dyoung int ixgbe_display_debug_stats = 0;
74 1.1 dyoung
75 1.1 dyoung /*********************************************************************
76 1.1 dyoung * Driver version
77 1.1 dyoung *********************************************************************/
78 1.14.2.5 riz char ixgbe_driver_version[] = "2.5.8 - HEAD";
79 1.1 dyoung
80 1.1 dyoung /*********************************************************************
81 1.1 dyoung * PCI Device ID Table
82 1.1 dyoung *
83 1.1 dyoung * Used by probe to select devices to load on
84 1.1 dyoung * Last field stores an index into ixgbe_strings
85 1.1 dyoung * Last entry must be all 0s
86 1.1 dyoung *
87 1.1 dyoung * { Vendor ID, Device ID, SubVendor ID, SubDevice ID, String Index }
88 1.1 dyoung *********************************************************************/
89 1.1 dyoung
90 1.1 dyoung static ixgbe_vendor_info_t ixgbe_vendor_info_array[] =
91 1.1 dyoung {
92 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82598AF_DUAL_PORT, 0, 0, 0},
93 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82598AF_SINGLE_PORT, 0, 0, 0},
94 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82598EB_CX4, 0, 0, 0},
95 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82598AT, 0, 0, 0},
96 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82598AT2, 0, 0, 0},
97 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82598, 0, 0, 0},
98 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82598_DA_DUAL_PORT, 0, 0, 0},
99 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82598_CX4_DUAL_PORT, 0, 0, 0},
100 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82598EB_XF_LR, 0, 0, 0},
101 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82598_SR_DUAL_PORT_EM, 0, 0, 0},
102 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82598EB_SFP_LOM, 0, 0, 0},
103 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82599_KX4, 0, 0, 0},
104 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82599_KX4_MEZZ, 0, 0, 0},
105 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82599_SFP, 0, 0, 0},
106 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82599_XAUI_LOM, 0, 0, 0},
107 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82599_CX4, 0, 0, 0},
108 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82599_T3_LOM, 0, 0, 0},
109 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82599_COMBO_BACKPLANE, 0, 0, 0},
110 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82599_BACKPLANE_FCOE, 0, 0, 0},
111 1.14.2.3 martin {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82599_SFP_SF2, 0, 0, 0},
112 1.1 dyoung {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82599_SFP_FCOE, 0, 0, 0},
113 1.14.2.3 martin {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82599EN_SFP, 0, 0, 0},
114 1.14.2.3 martin {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_82599_SFP_SF_QP, 0, 0, 0},
115 1.14.2.4 riz {IXGBE_INTEL_VENDOR_ID, IXGBE_DEV_ID_X540T, 0, 0, 0},
116 1.1 dyoung /* required last entry */
117 1.1 dyoung {0, 0, 0, 0, 0}
118 1.1 dyoung };
119 1.1 dyoung
120 1.1 dyoung /*********************************************************************
121 1.1 dyoung * Table of branding strings
122 1.1 dyoung *********************************************************************/
123 1.1 dyoung
124 1.1 dyoung static const char *ixgbe_strings[] = {
125 1.1 dyoung "Intel(R) PRO/10GbE PCI-Express Network Driver"
126 1.1 dyoung };
127 1.1 dyoung
128 1.1 dyoung /*********************************************************************
129 1.1 dyoung * Function prototypes
130 1.1 dyoung *********************************************************************/
131 1.1 dyoung static int ixgbe_probe(device_t, cfdata_t, void *);
132 1.1 dyoung static void ixgbe_attach(device_t, device_t, void *);
133 1.1 dyoung static int ixgbe_detach(device_t, int);
134 1.1 dyoung #if 0
135 1.1 dyoung static int ixgbe_shutdown(device_t);
136 1.1 dyoung #endif
137 1.14.2.5 riz #if IXGBE_LEGACY_TX
138 1.14.2.5 riz static void ixgbe_start(struct ifnet *);
139 1.14.2.5 riz static void ixgbe_start_locked(struct tx_ring *, struct ifnet *);
140 1.14.2.5 riz #else
141 1.1 dyoung static int ixgbe_mq_start(struct ifnet *, struct mbuf *);
142 1.1 dyoung static int ixgbe_mq_start_locked(struct ifnet *,
143 1.1 dyoung struct tx_ring *, struct mbuf *);
144 1.1 dyoung static void ixgbe_qflush(struct ifnet *);
145 1.14.2.5 riz static void ixgbe_deferred_mq_start(void *);
146 1.1 dyoung #endif
147 1.1 dyoung static int ixgbe_ioctl(struct ifnet *, u_long, void *);
148 1.1 dyoung static void ixgbe_ifstop(struct ifnet *, int);
149 1.1 dyoung static int ixgbe_init(struct ifnet *);
150 1.1 dyoung static void ixgbe_init_locked(struct adapter *);
151 1.1 dyoung static void ixgbe_stop(void *);
152 1.1 dyoung static void ixgbe_media_status(struct ifnet *, struct ifmediareq *);
153 1.1 dyoung static int ixgbe_media_change(struct ifnet *);
154 1.1 dyoung static void ixgbe_identify_hardware(struct adapter *);
155 1.1 dyoung static int ixgbe_allocate_pci_resources(struct adapter *,
156 1.1 dyoung const struct pci_attach_args *);
157 1.1 dyoung static int ixgbe_allocate_msix(struct adapter *,
158 1.1 dyoung const struct pci_attach_args *);
159 1.1 dyoung static int ixgbe_allocate_legacy(struct adapter *,
160 1.1 dyoung const struct pci_attach_args *);
161 1.1 dyoung static int ixgbe_allocate_queues(struct adapter *);
162 1.1 dyoung static int ixgbe_setup_msix(struct adapter *);
163 1.1 dyoung static void ixgbe_free_pci_resources(struct adapter *);
164 1.1 dyoung static void ixgbe_local_timer(void *);
165 1.1 dyoung static int ixgbe_setup_interface(device_t, struct adapter *);
166 1.1 dyoung static void ixgbe_config_link(struct adapter *);
167 1.1 dyoung
168 1.1 dyoung static int ixgbe_allocate_transmit_buffers(struct tx_ring *);
169 1.1 dyoung static int ixgbe_setup_transmit_structures(struct adapter *);
170 1.1 dyoung static void ixgbe_setup_transmit_ring(struct tx_ring *);
171 1.1 dyoung static void ixgbe_initialize_transmit_units(struct adapter *);
172 1.1 dyoung static void ixgbe_free_transmit_structures(struct adapter *);
173 1.1 dyoung static void ixgbe_free_transmit_buffers(struct tx_ring *);
174 1.1 dyoung
175 1.1 dyoung static int ixgbe_allocate_receive_buffers(struct rx_ring *);
176 1.1 dyoung static int ixgbe_setup_receive_structures(struct adapter *);
177 1.1 dyoung static int ixgbe_setup_receive_ring(struct rx_ring *);
178 1.1 dyoung static void ixgbe_initialize_receive_units(struct adapter *);
179 1.1 dyoung static void ixgbe_free_receive_structures(struct adapter *);
180 1.1 dyoung static void ixgbe_free_receive_buffers(struct rx_ring *);
181 1.1 dyoung static void ixgbe_setup_hw_rsc(struct rx_ring *);
182 1.1 dyoung
183 1.1 dyoung static void ixgbe_enable_intr(struct adapter *);
184 1.1 dyoung static void ixgbe_disable_intr(struct adapter *);
185 1.1 dyoung static void ixgbe_update_stats_counters(struct adapter *);
186 1.1 dyoung static bool ixgbe_txeof(struct tx_ring *);
187 1.14.2.5 riz static bool ixgbe_rxeof(struct ix_queue *);
188 1.1 dyoung static void ixgbe_rx_checksum(u32, struct mbuf *, u32,
189 1.1 dyoung struct ixgbe_hw_stats *);
190 1.1 dyoung static void ixgbe_set_promisc(struct adapter *);
191 1.1 dyoung static void ixgbe_set_multi(struct adapter *);
192 1.1 dyoung static void ixgbe_update_link_status(struct adapter *);
193 1.1 dyoung static void ixgbe_refresh_mbufs(struct rx_ring *, int);
194 1.1 dyoung static int ixgbe_xmit(struct tx_ring *, struct mbuf *);
195 1.1 dyoung static int ixgbe_set_flowcntl(SYSCTLFN_PROTO);
196 1.1 dyoung static int ixgbe_set_advertise(SYSCTLFN_PROTO);
197 1.14.2.4 riz static int ixgbe_set_thermal_test(SYSCTLFN_PROTO);
198 1.1 dyoung static int ixgbe_dma_malloc(struct adapter *, bus_size_t,
199 1.1 dyoung struct ixgbe_dma_alloc *, int);
200 1.1 dyoung static void ixgbe_dma_free(struct adapter *, struct ixgbe_dma_alloc *);
201 1.14.2.5 riz static int ixgbe_tx_ctx_setup(struct tx_ring *,
202 1.14.2.5 riz struct mbuf *, u32 *, u32 *);
203 1.14.2.5 riz static int ixgbe_tso_setup(struct tx_ring *,
204 1.14.2.5 riz struct mbuf *, u32 *, u32 *);
205 1.1 dyoung static void ixgbe_set_ivar(struct adapter *, u8, u8, s8);
206 1.1 dyoung static void ixgbe_configure_ivars(struct adapter *);
207 1.1 dyoung static u8 * ixgbe_mc_array_itr(struct ixgbe_hw *, u8 **, u32 *);
208 1.1 dyoung
209 1.1 dyoung static void ixgbe_setup_vlan_hw_support(struct adapter *);
210 1.1 dyoung #if 0
211 1.1 dyoung static void ixgbe_register_vlan(void *, struct ifnet *, u16);
212 1.1 dyoung static void ixgbe_unregister_vlan(void *, struct ifnet *, u16);
213 1.1 dyoung #endif
214 1.1 dyoung
215 1.1 dyoung static void ixgbe_add_hw_stats(struct adapter *adapter);
216 1.1 dyoung
217 1.1 dyoung static __inline void ixgbe_rx_discard(struct rx_ring *, int);
218 1.1 dyoung static __inline void ixgbe_rx_input(struct rx_ring *, struct ifnet *,
219 1.1 dyoung struct mbuf *, u32);
220 1.1 dyoung
221 1.14.2.4 riz static void ixgbe_enable_rx_drop(struct adapter *);
222 1.14.2.4 riz static void ixgbe_disable_rx_drop(struct adapter *);
223 1.14.2.4 riz
224 1.1 dyoung /* Support for pluggable optic modules */
225 1.1 dyoung static bool ixgbe_sfp_probe(struct adapter *);
226 1.1 dyoung static void ixgbe_setup_optics(struct adapter *);
227 1.1 dyoung
228 1.1 dyoung /* Legacy (single vector interrupt handler */
229 1.1 dyoung static int ixgbe_legacy_irq(void *);
230 1.1 dyoung
231 1.1 dyoung #if defined(NETBSD_MSI_OR_MSIX)
232 1.1 dyoung /* The MSI/X Interrupt handlers */
233 1.1 dyoung static void ixgbe_msix_que(void *);
234 1.1 dyoung static void ixgbe_msix_link(void *);
235 1.1 dyoung #endif
236 1.1 dyoung
237 1.1 dyoung /* Software interrupts for deferred work */
238 1.1 dyoung static void ixgbe_handle_que(void *);
239 1.1 dyoung static void ixgbe_handle_link(void *);
240 1.1 dyoung static void ixgbe_handle_msf(void *);
241 1.1 dyoung static void ixgbe_handle_mod(void *);
242 1.1 dyoung
243 1.1 dyoung const struct sysctlnode *ixgbe_sysctl_instance(struct adapter *);
244 1.1 dyoung static ixgbe_vendor_info_t *ixgbe_lookup(const struct pci_attach_args *);
245 1.1 dyoung
246 1.1 dyoung #ifdef IXGBE_FDIR
247 1.1 dyoung static void ixgbe_atr(struct tx_ring *, struct mbuf *);
248 1.1 dyoung static void ixgbe_reinit_fdir(void *, int);
249 1.1 dyoung #endif
250 1.1 dyoung
251 1.1 dyoung /*********************************************************************
252 1.1 dyoung * FreeBSD Device Interface Entry Points
253 1.1 dyoung *********************************************************************/
254 1.1 dyoung
255 1.1 dyoung CFATTACH_DECL3_NEW(ixg, sizeof(struct adapter),
256 1.1 dyoung ixgbe_probe, ixgbe_attach, ixgbe_detach, NULL, NULL, NULL,
257 1.1 dyoung DVF_DETACH_SHUTDOWN);
258 1.1 dyoung
259 1.1 dyoung #if 0
260 1.1 dyoung devclass_t ixgbe_devclass;
261 1.1 dyoung DRIVER_MODULE(ixgbe, pci, ixgbe_driver, ixgbe_devclass, 0, 0);
262 1.1 dyoung
263 1.1 dyoung MODULE_DEPEND(ixgbe, pci, 1, 1, 1);
264 1.1 dyoung MODULE_DEPEND(ixgbe, ether, 1, 1, 1);
265 1.1 dyoung #endif
266 1.1 dyoung
267 1.1 dyoung /*
268 1.1 dyoung ** TUNEABLE PARAMETERS:
269 1.1 dyoung */
270 1.1 dyoung
271 1.1 dyoung /*
272 1.1 dyoung ** AIM: Adaptive Interrupt Moderation
273 1.1 dyoung ** which means that the interrupt rate
274 1.1 dyoung ** is varied over time based on the
275 1.1 dyoung ** traffic for that interrupt vector
276 1.1 dyoung */
277 1.1 dyoung static int ixgbe_enable_aim = TRUE;
278 1.1 dyoung #define TUNABLE_INT(__x, __y)
279 1.1 dyoung TUNABLE_INT("hw.ixgbe.enable_aim", &ixgbe_enable_aim);
280 1.1 dyoung
281 1.14.2.3 martin static int ixgbe_max_interrupt_rate = (4000000 / IXGBE_LOW_LATENCY);
282 1.1 dyoung TUNABLE_INT("hw.ixgbe.max_interrupt_rate", &ixgbe_max_interrupt_rate);
283 1.1 dyoung
284 1.1 dyoung /* How many packets rxeof tries to clean at a time */
285 1.1 dyoung static int ixgbe_rx_process_limit = 256;
286 1.1 dyoung TUNABLE_INT("hw.ixgbe.rx_process_limit", &ixgbe_rx_process_limit);
287 1.1 dyoung
288 1.14.2.5 riz /* How many packets txeof tries to clean at a time */
289 1.14.2.5 riz static int ixgbe_tx_process_limit = 256;
290 1.14.2.5 riz TUNABLE_INT("hw.ixgbe.tx_process_limit", &ixgbe_tx_process_limit);
291 1.14.2.5 riz
292 1.1 dyoung /*
293 1.1 dyoung ** Smart speed setting, default to on
294 1.1 dyoung ** this only works as a compile option
295 1.1 dyoung ** right now as its during attach, set
296 1.1 dyoung ** this to 'ixgbe_smart_speed_off' to
297 1.1 dyoung ** disable.
298 1.1 dyoung */
299 1.1 dyoung static int ixgbe_smart_speed = ixgbe_smart_speed_on;
300 1.1 dyoung
301 1.1 dyoung /*
302 1.1 dyoung * MSIX should be the default for best performance,
303 1.1 dyoung * but this allows it to be forced off for testing.
304 1.1 dyoung */
305 1.1 dyoung static int ixgbe_enable_msix = 1;
306 1.1 dyoung TUNABLE_INT("hw.ixgbe.enable_msix", &ixgbe_enable_msix);
307 1.1 dyoung
308 1.1 dyoung #if defined(NETBSD_MSI_OR_MSIX)
309 1.1 dyoung /*
310 1.1 dyoung * Number of Queues, can be set to 0,
311 1.1 dyoung * it then autoconfigures based on the
312 1.1 dyoung * number of cpus with a max of 8. This
313 1.1 dyoung * can be overriden manually here.
314 1.1 dyoung */
315 1.1 dyoung static int ixgbe_num_queues = 0;
316 1.1 dyoung TUNABLE_INT("hw.ixgbe.num_queues", &ixgbe_num_queues);
317 1.1 dyoung #endif
318 1.1 dyoung
319 1.1 dyoung /*
320 1.1 dyoung ** Number of TX descriptors per ring,
321 1.1 dyoung ** setting higher than RX as this seems
322 1.1 dyoung ** the better performing choice.
323 1.1 dyoung */
324 1.1 dyoung static int ixgbe_txd = PERFORM_TXD;
325 1.1 dyoung TUNABLE_INT("hw.ixgbe.txd", &ixgbe_txd);
326 1.1 dyoung
327 1.1 dyoung /* Number of RX descriptors per ring */
328 1.1 dyoung static int ixgbe_rxd = PERFORM_RXD;
329 1.1 dyoung TUNABLE_INT("hw.ixgbe.rxd", &ixgbe_rxd);
330 1.1 dyoung
331 1.14.2.4 riz /*
332 1.14.2.4 riz ** HW RSC control:
333 1.14.2.4 riz ** this feature only works with
334 1.14.2.4 riz ** IPv4, and only on 82599 and later.
335 1.14.2.4 riz ** Also this will cause IP forwarding to
336 1.14.2.4 riz ** fail and that can't be controlled by
337 1.14.2.4 riz ** the stack as LRO can. For all these
338 1.14.2.4 riz ** reasons I've deemed it best to leave
339 1.14.2.4 riz ** this off and not bother with a tuneable
340 1.14.2.4 riz ** interface, this would need to be compiled
341 1.14.2.4 riz ** to enable.
342 1.14.2.4 riz */
343 1.14.2.4 riz static bool ixgbe_rsc_enable = FALSE;
344 1.14.2.4 riz
345 1.1 dyoung /* Keep running tab on them for sanity check */
346 1.1 dyoung static int ixgbe_total_ports;
347 1.1 dyoung
348 1.1 dyoung #ifdef IXGBE_FDIR
349 1.1 dyoung /*
350 1.1 dyoung ** For Flow Director: this is the
351 1.1 dyoung ** number of TX packets we sample
352 1.1 dyoung ** for the filter pool, this means
353 1.1 dyoung ** every 20th packet will be probed.
354 1.1 dyoung **
355 1.1 dyoung ** This feature can be disabled by
356 1.1 dyoung ** setting this to 0.
357 1.1 dyoung */
358 1.1 dyoung static int atr_sample_rate = 20;
359 1.1 dyoung /*
360 1.1 dyoung ** Flow Director actually 'steals'
361 1.1 dyoung ** part of the packet buffer as its
362 1.1 dyoung ** filter pool, this variable controls
363 1.1 dyoung ** how much it uses:
364 1.1 dyoung ** 0 = 64K, 1 = 128K, 2 = 256K
365 1.1 dyoung */
366 1.1 dyoung static int fdir_pballoc = 1;
367 1.1 dyoung #endif
368 1.1 dyoung
369 1.14.2.3 martin #ifdef DEV_NETMAP
370 1.14.2.3 martin /*
371 1.14.2.3 martin * The #ifdef DEV_NETMAP / #endif blocks in this file are meant to
372 1.14.2.3 martin * be a reference on how to implement netmap support in a driver.
373 1.14.2.3 martin * Additional comments are in ixgbe_netmap.h .
374 1.14.2.3 martin *
375 1.14.2.4 riz * <dev/netmap/ixgbe_netmap.h> contains functions for netmap support
376 1.14.2.3 martin * that extend the standard driver.
377 1.14.2.3 martin */
378 1.14.2.3 martin #include <dev/netmap/ixgbe_netmap.h>
379 1.14.2.3 martin #endif /* DEV_NETMAP */
380 1.14.2.3 martin
381 1.1 dyoung /*********************************************************************
382 1.1 dyoung * Device identification routine
383 1.1 dyoung *
384 1.1 dyoung * ixgbe_probe determines if the driver should be loaded on
385 1.1 dyoung * adapter based on PCI vendor/device id of the adapter.
386 1.1 dyoung *
387 1.1 dyoung * return 1 on success, 0 on failure
388 1.1 dyoung *********************************************************************/
389 1.1 dyoung
390 1.1 dyoung static int
391 1.1 dyoung ixgbe_probe(device_t dev, cfdata_t cf, void *aux)
392 1.1 dyoung {
393 1.1 dyoung const struct pci_attach_args *pa = aux;
394 1.1 dyoung
395 1.1 dyoung return (ixgbe_lookup(pa) != NULL) ? 1 : 0;
396 1.1 dyoung }
397 1.1 dyoung
398 1.1 dyoung static ixgbe_vendor_info_t *
399 1.1 dyoung ixgbe_lookup(const struct pci_attach_args *pa)
400 1.1 dyoung {
401 1.1 dyoung pcireg_t subid;
402 1.1 dyoung ixgbe_vendor_info_t *ent;
403 1.1 dyoung
404 1.1 dyoung INIT_DEBUGOUT("ixgbe_probe: begin");
405 1.1 dyoung
406 1.1 dyoung if (PCI_VENDOR(pa->pa_id) != IXGBE_INTEL_VENDOR_ID)
407 1.1 dyoung return NULL;
408 1.1 dyoung
409 1.1 dyoung subid = pci_conf_read(pa->pa_pc, pa->pa_tag, PCI_SUBSYS_ID_REG);
410 1.1 dyoung
411 1.1 dyoung for (ent = ixgbe_vendor_info_array; ent->vendor_id != 0; ent++) {
412 1.1 dyoung if (PCI_VENDOR(pa->pa_id) == ent->vendor_id &&
413 1.1 dyoung PCI_PRODUCT(pa->pa_id) == ent->device_id &&
414 1.1 dyoung
415 1.1 dyoung (PCI_SUBSYS_VENDOR(subid) == ent->subvendor_id ||
416 1.1 dyoung ent->subvendor_id == 0) &&
417 1.1 dyoung
418 1.1 dyoung (PCI_SUBSYS_ID(subid) == ent->subdevice_id ||
419 1.1 dyoung ent->subdevice_id == 0)) {
420 1.1 dyoung ++ixgbe_total_ports;
421 1.1 dyoung return ent;
422 1.1 dyoung }
423 1.1 dyoung }
424 1.1 dyoung return NULL;
425 1.1 dyoung }
426 1.1 dyoung
427 1.1 dyoung
428 1.1 dyoung static void
429 1.1 dyoung ixgbe_sysctl_attach(struct adapter *adapter)
430 1.1 dyoung {
431 1.1 dyoung struct sysctllog **log;
432 1.1 dyoung const struct sysctlnode *rnode, *cnode;
433 1.1 dyoung device_t dev;
434 1.1 dyoung
435 1.1 dyoung dev = adapter->dev;
436 1.1 dyoung log = &adapter->sysctllog;
437 1.1 dyoung
438 1.1 dyoung if ((rnode = ixgbe_sysctl_instance(adapter)) == NULL) {
439 1.1 dyoung aprint_error_dev(dev, "could not create sysctl root\n");
440 1.1 dyoung return;
441 1.1 dyoung }
442 1.1 dyoung
443 1.1 dyoung if (sysctl_createv(log, 0, &rnode, &cnode,
444 1.1 dyoung CTLFLAG_READONLY, CTLTYPE_INT,
445 1.1 dyoung "num_rx_desc", SYSCTL_DESCR("Number of rx descriptors"),
446 1.1 dyoung NULL, 0, &adapter->num_rx_desc, 0, CTL_CREATE, CTL_EOL) != 0)
447 1.1 dyoung aprint_error_dev(dev, "could not create sysctl\n");
448 1.1 dyoung
449 1.1 dyoung if (sysctl_createv(log, 0, &rnode, &cnode,
450 1.1 dyoung CTLFLAG_READONLY, CTLTYPE_INT,
451 1.1 dyoung "num_queues", SYSCTL_DESCR("Number of queues"),
452 1.1 dyoung NULL, 0, &adapter->num_queues, 0, CTL_CREATE, CTL_EOL) != 0)
453 1.1 dyoung aprint_error_dev(dev, "could not create sysctl\n");
454 1.1 dyoung
455 1.1 dyoung if (sysctl_createv(log, 0, &rnode, &cnode,
456 1.1 dyoung CTLFLAG_READWRITE, CTLTYPE_INT,
457 1.14.2.4 riz "fc", SYSCTL_DESCR("Flow Control"),
458 1.3 dsl ixgbe_set_flowcntl, 0, (void *)adapter, 0, CTL_CREATE, CTL_EOL) != 0)
459 1.1 dyoung aprint_error_dev(dev, "could not create sysctl\n");
460 1.1 dyoung
461 1.1 dyoung /* XXX This is an *instance* sysctl controlling a *global* variable.
462 1.1 dyoung * XXX It's that way in the FreeBSD driver that this derives from.
463 1.1 dyoung */
464 1.1 dyoung if (sysctl_createv(log, 0, &rnode, &cnode,
465 1.1 dyoung CTLFLAG_READWRITE, CTLTYPE_INT,
466 1.1 dyoung "enable_aim", SYSCTL_DESCR("Interrupt Moderation"),
467 1.1 dyoung NULL, 0, &ixgbe_enable_aim, 0, CTL_CREATE, CTL_EOL) != 0)
468 1.1 dyoung aprint_error_dev(dev, "could not create sysctl\n");
469 1.14.2.4 riz
470 1.14.2.4 riz if (sysctl_createv(log, 0, &rnode, &cnode,
471 1.14.2.4 riz CTLFLAG_READWRITE, CTLTYPE_INT,
472 1.14.2.4 riz "advertise_speed", SYSCTL_DESCR("Link Speed"),
473 1.14.2.4 riz ixgbe_set_advertise, 0, (void *)adapter, 0, CTL_CREATE, CTL_EOL) != 0)
474 1.14.2.4 riz aprint_error_dev(dev, "could not create sysctl\n");
475 1.14.2.4 riz
476 1.14.2.4 riz if (sysctl_createv(log, 0, &rnode, &cnode,
477 1.14.2.4 riz CTLFLAG_READWRITE, CTLTYPE_INT,
478 1.14.2.4 riz "ts", SYSCTL_DESCR("Thermal Test"),
479 1.14.2.4 riz ixgbe_set_thermal_test, 0, (void *)adapter, 0, CTL_CREATE, CTL_EOL) != 0)
480 1.14.2.4 riz aprint_error_dev(dev, "could not create sysctl\n");
481 1.1 dyoung }
482 1.1 dyoung
483 1.1 dyoung /*********************************************************************
484 1.1 dyoung * Device initialization routine
485 1.1 dyoung *
486 1.1 dyoung * The attach entry point is called when the driver is being loaded.
487 1.1 dyoung * This routine identifies the type of hardware, allocates all resources
488 1.1 dyoung * and initializes the hardware.
489 1.1 dyoung *
490 1.1 dyoung * return 0 on success, positive on failure
491 1.1 dyoung *********************************************************************/
492 1.1 dyoung
493 1.1 dyoung static void
494 1.1 dyoung ixgbe_attach(device_t parent, device_t dev, void *aux)
495 1.1 dyoung {
496 1.1 dyoung struct adapter *adapter;
497 1.1 dyoung struct ixgbe_hw *hw;
498 1.1 dyoung int error = 0;
499 1.1 dyoung u16 csum;
500 1.1 dyoung u32 ctrl_ext;
501 1.1 dyoung ixgbe_vendor_info_t *ent;
502 1.1 dyoung const struct pci_attach_args *pa = aux;
503 1.1 dyoung
504 1.1 dyoung INIT_DEBUGOUT("ixgbe_attach: begin");
505 1.1 dyoung
506 1.1 dyoung /* Allocate, clear, and link in our adapter structure */
507 1.1 dyoung adapter = device_private(dev);
508 1.1 dyoung adapter->dev = adapter->osdep.dev = dev;
509 1.1 dyoung hw = &adapter->hw;
510 1.1 dyoung adapter->osdep.pc = pa->pa_pc;
511 1.1 dyoung adapter->osdep.tag = pa->pa_tag;
512 1.1 dyoung adapter->osdep.dmat = pa->pa_dmat;
513 1.1 dyoung
514 1.1 dyoung ent = ixgbe_lookup(pa);
515 1.1 dyoung
516 1.1 dyoung KASSERT(ent != NULL);
517 1.1 dyoung
518 1.1 dyoung aprint_normal(": %s, Version - %s\n",
519 1.1 dyoung ixgbe_strings[ent->index], ixgbe_driver_version);
520 1.1 dyoung
521 1.1 dyoung /* Core Lock Init*/
522 1.1 dyoung IXGBE_CORE_LOCK_INIT(adapter, device_xname(dev));
523 1.1 dyoung
524 1.1 dyoung /* SYSCTL APIs */
525 1.1 dyoung
526 1.1 dyoung ixgbe_sysctl_attach(adapter);
527 1.1 dyoung
528 1.1 dyoung /* Set up the timer callout */
529 1.1 dyoung callout_init(&adapter->timer, 0);
530 1.1 dyoung
531 1.1 dyoung /* Determine hardware revision */
532 1.1 dyoung ixgbe_identify_hardware(adapter);
533 1.1 dyoung
534 1.1 dyoung /* Do base PCI setup - map BAR0 */
535 1.1 dyoung if (ixgbe_allocate_pci_resources(adapter, pa)) {
536 1.1 dyoung aprint_error_dev(dev, "Allocation of PCI resources failed\n");
537 1.1 dyoung error = ENXIO;
538 1.1 dyoung goto err_out;
539 1.1 dyoung }
540 1.1 dyoung
541 1.1 dyoung /* Do descriptor calc and sanity checks */
542 1.1 dyoung if (((ixgbe_txd * sizeof(union ixgbe_adv_tx_desc)) % DBA_ALIGN) != 0 ||
543 1.1 dyoung ixgbe_txd < MIN_TXD || ixgbe_txd > MAX_TXD) {
544 1.1 dyoung aprint_error_dev(dev, "TXD config issue, using default!\n");
545 1.1 dyoung adapter->num_tx_desc = DEFAULT_TXD;
546 1.1 dyoung } else
547 1.1 dyoung adapter->num_tx_desc = ixgbe_txd;
548 1.1 dyoung
549 1.1 dyoung /*
550 1.1 dyoung ** With many RX rings it is easy to exceed the
551 1.1 dyoung ** system mbuf allocation. Tuning nmbclusters
552 1.1 dyoung ** can alleviate this.
553 1.1 dyoung */
554 1.1 dyoung if (nmbclusters > 0 ) {
555 1.1 dyoung int s;
556 1.1 dyoung s = (ixgbe_rxd * adapter->num_queues) * ixgbe_total_ports;
557 1.1 dyoung if (s > nmbclusters) {
558 1.1 dyoung aprint_error_dev(dev, "RX Descriptors exceed "
559 1.1 dyoung "system mbuf max, using default instead!\n");
560 1.1 dyoung ixgbe_rxd = DEFAULT_RXD;
561 1.1 dyoung }
562 1.1 dyoung }
563 1.1 dyoung
564 1.1 dyoung if (((ixgbe_rxd * sizeof(union ixgbe_adv_rx_desc)) % DBA_ALIGN) != 0 ||
565 1.1 dyoung ixgbe_rxd < MIN_TXD || ixgbe_rxd > MAX_TXD) {
566 1.1 dyoung aprint_error_dev(dev, "RXD config issue, using default!\n");
567 1.1 dyoung adapter->num_rx_desc = DEFAULT_RXD;
568 1.1 dyoung } else
569 1.1 dyoung adapter->num_rx_desc = ixgbe_rxd;
570 1.1 dyoung
571 1.1 dyoung /* Allocate our TX/RX Queues */
572 1.1 dyoung if (ixgbe_allocate_queues(adapter)) {
573 1.1 dyoung error = ENOMEM;
574 1.1 dyoung goto err_out;
575 1.1 dyoung }
576 1.1 dyoung
577 1.1 dyoung /* Allocate multicast array memory. */
578 1.1 dyoung adapter->mta = malloc(sizeof(u8) * IXGBE_ETH_LENGTH_OF_ADDRESS *
579 1.1 dyoung MAX_NUM_MULTICAST_ADDRESSES, M_DEVBUF, M_NOWAIT);
580 1.1 dyoung if (adapter->mta == NULL) {
581 1.1 dyoung aprint_error_dev(dev, "Cannot allocate multicast setup array\n");
582 1.1 dyoung error = ENOMEM;
583 1.1 dyoung goto err_late;
584 1.1 dyoung }
585 1.1 dyoung
586 1.1 dyoung /* Initialize the shared code */
587 1.1 dyoung error = ixgbe_init_shared_code(hw);
588 1.1 dyoung if (error == IXGBE_ERR_SFP_NOT_PRESENT) {
589 1.1 dyoung /*
590 1.1 dyoung ** No optics in this port, set up
591 1.1 dyoung ** so the timer routine will probe
592 1.1 dyoung ** for later insertion.
593 1.1 dyoung */
594 1.1 dyoung adapter->sfp_probe = TRUE;
595 1.1 dyoung error = 0;
596 1.1 dyoung } else if (error == IXGBE_ERR_SFP_NOT_SUPPORTED) {
597 1.1 dyoung aprint_error_dev(dev,"Unsupported SFP+ module detected!\n");
598 1.1 dyoung error = EIO;
599 1.1 dyoung goto err_late;
600 1.1 dyoung } else if (error) {
601 1.1 dyoung aprint_error_dev(dev,"Unable to initialize the shared code\n");
602 1.1 dyoung error = EIO;
603 1.1 dyoung goto err_late;
604 1.1 dyoung }
605 1.1 dyoung
606 1.1 dyoung /* Make sure we have a good EEPROM before we read from it */
607 1.1 dyoung if (ixgbe_validate_eeprom_checksum(&adapter->hw, &csum) < 0) {
608 1.1 dyoung aprint_error_dev(dev,"The EEPROM Checksum Is Not Valid\n");
609 1.1 dyoung error = EIO;
610 1.1 dyoung goto err_late;
611 1.1 dyoung }
612 1.1 dyoung
613 1.1 dyoung error = ixgbe_init_hw(hw);
614 1.14.2.4 riz switch (error) {
615 1.14.2.4 riz case IXGBE_ERR_EEPROM_VERSION:
616 1.1 dyoung aprint_error_dev(dev, "This device is a pre-production adapter/"
617 1.1 dyoung "LOM. Please be aware there may be issues associated "
618 1.1 dyoung "with your hardware.\n If you are experiencing problems "
619 1.1 dyoung "please contact your Intel or hardware representative "
620 1.1 dyoung "who provided you with this hardware.\n");
621 1.14.2.4 riz break;
622 1.14.2.4 riz case IXGBE_ERR_SFP_NOT_SUPPORTED:
623 1.1 dyoung aprint_error_dev(dev,"Unsupported SFP+ Module\n");
624 1.1 dyoung error = EIO;
625 1.1 dyoung aprint_error_dev(dev,"Hardware Initialization Failure\n");
626 1.1 dyoung goto err_late;
627 1.14.2.4 riz case IXGBE_ERR_SFP_NOT_PRESENT:
628 1.14.2.4 riz device_printf(dev,"No SFP+ Module found\n");
629 1.14.2.4 riz /* falls thru */
630 1.14.2.4 riz default:
631 1.14.2.4 riz break;
632 1.1 dyoung }
633 1.1 dyoung
634 1.1 dyoung /* Detect and set physical type */
635 1.1 dyoung ixgbe_setup_optics(adapter);
636 1.1 dyoung
637 1.1 dyoung if ((adapter->msix > 1) && (ixgbe_enable_msix))
638 1.1 dyoung error = ixgbe_allocate_msix(adapter, pa);
639 1.1 dyoung else
640 1.1 dyoung error = ixgbe_allocate_legacy(adapter, pa);
641 1.1 dyoung if (error)
642 1.1 dyoung goto err_late;
643 1.1 dyoung
644 1.1 dyoung /* Setup OS specific network interface */
645 1.1 dyoung if (ixgbe_setup_interface(dev, adapter) != 0)
646 1.1 dyoung goto err_late;
647 1.1 dyoung
648 1.1 dyoung /* Initialize statistics */
649 1.1 dyoung ixgbe_update_stats_counters(adapter);
650 1.1 dyoung
651 1.1 dyoung /* Print PCIE bus type/speed/width info */
652 1.1 dyoung ixgbe_get_bus_info(hw);
653 1.1 dyoung aprint_normal_dev(dev,"PCI Express Bus: Speed %s %s\n",
654 1.1 dyoung ((hw->bus.speed == ixgbe_bus_speed_5000) ? "5.0Gb/s":
655 1.1 dyoung (hw->bus.speed == ixgbe_bus_speed_2500) ? "2.5Gb/s":"Unknown"),
656 1.1 dyoung (hw->bus.width == ixgbe_bus_width_pcie_x8) ? "Width x8" :
657 1.1 dyoung (hw->bus.width == ixgbe_bus_width_pcie_x4) ? "Width x4" :
658 1.1 dyoung (hw->bus.width == ixgbe_bus_width_pcie_x1) ? "Width x1" :
659 1.1 dyoung ("Unknown"));
660 1.1 dyoung
661 1.1 dyoung if ((hw->bus.width <= ixgbe_bus_width_pcie_x4) &&
662 1.1 dyoung (hw->bus.speed == ixgbe_bus_speed_2500)) {
663 1.1 dyoung aprint_error_dev(dev, "PCI-Express bandwidth available"
664 1.1 dyoung " for this card\n is not sufficient for"
665 1.1 dyoung " optimal performance.\n");
666 1.1 dyoung aprint_error_dev(dev, "For optimal performance a x8 "
667 1.1 dyoung "PCIE, or x4 PCIE 2 slot is required.\n");
668 1.1 dyoung }
669 1.1 dyoung
670 1.14.2.5 riz /* Set an initial default flow control value */
671 1.14.2.5 riz adapter->fc = ixgbe_fc_full;
672 1.14.2.5 riz
673 1.1 dyoung /* let hardware know driver is loaded */
674 1.1 dyoung ctrl_ext = IXGBE_READ_REG(hw, IXGBE_CTRL_EXT);
675 1.1 dyoung ctrl_ext |= IXGBE_CTRL_EXT_DRV_LOAD;
676 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_CTRL_EXT, ctrl_ext);
677 1.1 dyoung
678 1.1 dyoung ixgbe_add_hw_stats(adapter);
679 1.1 dyoung
680 1.14.2.3 martin #ifdef DEV_NETMAP
681 1.14.2.3 martin ixgbe_netmap_attach(adapter);
682 1.14.2.3 martin #endif /* DEV_NETMAP */
683 1.1 dyoung INIT_DEBUGOUT("ixgbe_attach: end");
684 1.1 dyoung return;
685 1.1 dyoung err_late:
686 1.1 dyoung ixgbe_free_transmit_structures(adapter);
687 1.1 dyoung ixgbe_free_receive_structures(adapter);
688 1.1 dyoung err_out:
689 1.1 dyoung if (adapter->ifp != NULL)
690 1.1 dyoung if_free(adapter->ifp);
691 1.1 dyoung ixgbe_free_pci_resources(adapter);
692 1.1 dyoung if (adapter->mta != NULL)
693 1.1 dyoung free(adapter->mta, M_DEVBUF);
694 1.1 dyoung return;
695 1.1 dyoung
696 1.1 dyoung }
697 1.1 dyoung
698 1.1 dyoung /*********************************************************************
699 1.1 dyoung * Device removal routine
700 1.1 dyoung *
701 1.1 dyoung * The detach entry point is called when the driver is being removed.
702 1.1 dyoung * This routine stops the adapter and deallocates all the resources
703 1.1 dyoung * that were allocated for driver operation.
704 1.1 dyoung *
705 1.1 dyoung * return 0 on success, positive on failure
706 1.1 dyoung *********************************************************************/
707 1.1 dyoung
708 1.1 dyoung static int
709 1.1 dyoung ixgbe_detach(device_t dev, int flags)
710 1.1 dyoung {
711 1.1 dyoung struct adapter *adapter = device_private(dev);
712 1.1 dyoung struct rx_ring *rxr = adapter->rx_rings;
713 1.1 dyoung struct ixgbe_hw_stats *stats = &adapter->stats;
714 1.1 dyoung struct ix_queue *que = adapter->queues;
715 1.14.2.4 riz struct tx_ring *txr = adapter->tx_rings;
716 1.1 dyoung u32 ctrl_ext;
717 1.1 dyoung
718 1.1 dyoung INIT_DEBUGOUT("ixgbe_detach: begin");
719 1.1 dyoung
720 1.14.2.5 riz #if NVLAN > 0
721 1.1 dyoung /* Make sure VLANs are not using driver */
722 1.1 dyoung if (!VLAN_ATTACHED(&adapter->osdep.ec))
723 1.1 dyoung ; /* nothing to do: no VLANs */
724 1.1 dyoung else if ((flags & (DETACH_SHUTDOWN|DETACH_FORCE)) != 0)
725 1.1 dyoung vlan_ifdetach(adapter->ifp);
726 1.1 dyoung else {
727 1.1 dyoung aprint_error_dev(dev, "VLANs in use\n");
728 1.1 dyoung return EBUSY;
729 1.1 dyoung }
730 1.14.2.5 riz #endif
731 1.1 dyoung
732 1.1 dyoung IXGBE_CORE_LOCK(adapter);
733 1.1 dyoung ixgbe_stop(adapter);
734 1.1 dyoung IXGBE_CORE_UNLOCK(adapter);
735 1.1 dyoung
736 1.14.2.4 riz for (int i = 0; i < adapter->num_queues; i++, que++, txr++) {
737 1.14.2.5 riz #ifndef IXGBE_LEGACY_TX
738 1.14.2.4 riz softint_disestablish(txr->txq_si);
739 1.14.2.4 riz #endif
740 1.1 dyoung softint_disestablish(que->que_si);
741 1.1 dyoung }
742 1.1 dyoung
743 1.1 dyoung /* Drain the Link queue */
744 1.1 dyoung softint_disestablish(adapter->link_si);
745 1.1 dyoung softint_disestablish(adapter->mod_si);
746 1.1 dyoung softint_disestablish(adapter->msf_si);
747 1.1 dyoung #ifdef IXGBE_FDIR
748 1.1 dyoung softint_disestablish(adapter->fdir_si);
749 1.1 dyoung #endif
750 1.1 dyoung
751 1.1 dyoung /* let hardware know driver is unloading */
752 1.1 dyoung ctrl_ext = IXGBE_READ_REG(&adapter->hw, IXGBE_CTRL_EXT);
753 1.1 dyoung ctrl_ext &= ~IXGBE_CTRL_EXT_DRV_LOAD;
754 1.1 dyoung IXGBE_WRITE_REG(&adapter->hw, IXGBE_CTRL_EXT, ctrl_ext);
755 1.1 dyoung
756 1.1 dyoung ether_ifdetach(adapter->ifp);
757 1.1 dyoung callout_halt(&adapter->timer, NULL);
758 1.14.2.3 martin #ifdef DEV_NETMAP
759 1.14.2.3 martin netmap_detach(adapter->ifp);
760 1.14.2.3 martin #endif /* DEV_NETMAP */
761 1.1 dyoung ixgbe_free_pci_resources(adapter);
762 1.1 dyoung #if 0 /* XXX the NetBSD port is probably missing something here */
763 1.1 dyoung bus_generic_detach(dev);
764 1.1 dyoung #endif
765 1.1 dyoung if_detach(adapter->ifp);
766 1.1 dyoung
767 1.1 dyoung sysctl_teardown(&adapter->sysctllog);
768 1.1 dyoung evcnt_detach(&adapter->handleq);
769 1.1 dyoung evcnt_detach(&adapter->req);
770 1.1 dyoung evcnt_detach(&adapter->morerx);
771 1.1 dyoung evcnt_detach(&adapter->moretx);
772 1.1 dyoung evcnt_detach(&adapter->txloops);
773 1.1 dyoung evcnt_detach(&adapter->efbig_tx_dma_setup);
774 1.1 dyoung evcnt_detach(&adapter->m_defrag_failed);
775 1.1 dyoung evcnt_detach(&adapter->efbig2_tx_dma_setup);
776 1.1 dyoung evcnt_detach(&adapter->einval_tx_dma_setup);
777 1.1 dyoung evcnt_detach(&adapter->other_tx_dma_setup);
778 1.1 dyoung evcnt_detach(&adapter->eagain_tx_dma_setup);
779 1.1 dyoung evcnt_detach(&adapter->enomem_tx_dma_setup);
780 1.1 dyoung evcnt_detach(&adapter->watchdog_events);
781 1.1 dyoung evcnt_detach(&adapter->tso_err);
782 1.1 dyoung evcnt_detach(&adapter->link_irq);
783 1.14.2.4 riz
784 1.14.2.4 riz txr = adapter->tx_rings;
785 1.1 dyoung for (int i = 0; i < adapter->num_queues; i++, rxr++, txr++) {
786 1.1 dyoung evcnt_detach(&txr->no_desc_avail);
787 1.1 dyoung evcnt_detach(&txr->total_packets);
788 1.14.2.5 riz evcnt_detach(&txr->tso_tx);
789 1.1 dyoung
790 1.1 dyoung if (i < __arraycount(adapter->stats.mpc)) {
791 1.1 dyoung evcnt_detach(&adapter->stats.mpc[i]);
792 1.1 dyoung }
793 1.1 dyoung if (i < __arraycount(adapter->stats.pxontxc)) {
794 1.1 dyoung evcnt_detach(&adapter->stats.pxontxc[i]);
795 1.1 dyoung evcnt_detach(&adapter->stats.pxonrxc[i]);
796 1.1 dyoung evcnt_detach(&adapter->stats.pxofftxc[i]);
797 1.1 dyoung evcnt_detach(&adapter->stats.pxoffrxc[i]);
798 1.1 dyoung evcnt_detach(&adapter->stats.pxon2offc[i]);
799 1.1 dyoung }
800 1.1 dyoung if (i < __arraycount(adapter->stats.qprc)) {
801 1.1 dyoung evcnt_detach(&adapter->stats.qprc[i]);
802 1.1 dyoung evcnt_detach(&adapter->stats.qptc[i]);
803 1.1 dyoung evcnt_detach(&adapter->stats.qbrc[i]);
804 1.1 dyoung evcnt_detach(&adapter->stats.qbtc[i]);
805 1.1 dyoung evcnt_detach(&adapter->stats.qprdc[i]);
806 1.1 dyoung }
807 1.1 dyoung
808 1.1 dyoung evcnt_detach(&rxr->rx_packets);
809 1.1 dyoung evcnt_detach(&rxr->rx_bytes);
810 1.1 dyoung evcnt_detach(&rxr->no_jmbuf);
811 1.1 dyoung evcnt_detach(&rxr->rx_discarded);
812 1.1 dyoung evcnt_detach(&rxr->rx_irq);
813 1.1 dyoung }
814 1.1 dyoung evcnt_detach(&stats->ipcs);
815 1.1 dyoung evcnt_detach(&stats->l4cs);
816 1.1 dyoung evcnt_detach(&stats->ipcs_bad);
817 1.1 dyoung evcnt_detach(&stats->l4cs_bad);
818 1.1 dyoung evcnt_detach(&stats->intzero);
819 1.1 dyoung evcnt_detach(&stats->legint);
820 1.1 dyoung evcnt_detach(&stats->crcerrs);
821 1.1 dyoung evcnt_detach(&stats->illerrc);
822 1.1 dyoung evcnt_detach(&stats->errbc);
823 1.1 dyoung evcnt_detach(&stats->mspdc);
824 1.1 dyoung evcnt_detach(&stats->mlfc);
825 1.1 dyoung evcnt_detach(&stats->mrfc);
826 1.1 dyoung evcnt_detach(&stats->rlec);
827 1.1 dyoung evcnt_detach(&stats->lxontxc);
828 1.1 dyoung evcnt_detach(&stats->lxonrxc);
829 1.1 dyoung evcnt_detach(&stats->lxofftxc);
830 1.1 dyoung evcnt_detach(&stats->lxoffrxc);
831 1.1 dyoung
832 1.1 dyoung /* Packet Reception Stats */
833 1.1 dyoung evcnt_detach(&stats->tor);
834 1.1 dyoung evcnt_detach(&stats->gorc);
835 1.1 dyoung evcnt_detach(&stats->tpr);
836 1.1 dyoung evcnt_detach(&stats->gprc);
837 1.1 dyoung evcnt_detach(&stats->mprc);
838 1.1 dyoung evcnt_detach(&stats->bprc);
839 1.1 dyoung evcnt_detach(&stats->prc64);
840 1.1 dyoung evcnt_detach(&stats->prc127);
841 1.1 dyoung evcnt_detach(&stats->prc255);
842 1.1 dyoung evcnt_detach(&stats->prc511);
843 1.1 dyoung evcnt_detach(&stats->prc1023);
844 1.1 dyoung evcnt_detach(&stats->prc1522);
845 1.1 dyoung evcnt_detach(&stats->ruc);
846 1.1 dyoung evcnt_detach(&stats->rfc);
847 1.1 dyoung evcnt_detach(&stats->roc);
848 1.1 dyoung evcnt_detach(&stats->rjc);
849 1.1 dyoung evcnt_detach(&stats->mngprc);
850 1.1 dyoung evcnt_detach(&stats->xec);
851 1.1 dyoung
852 1.1 dyoung /* Packet Transmission Stats */
853 1.1 dyoung evcnt_detach(&stats->gotc);
854 1.1 dyoung evcnt_detach(&stats->tpt);
855 1.1 dyoung evcnt_detach(&stats->gptc);
856 1.1 dyoung evcnt_detach(&stats->bptc);
857 1.1 dyoung evcnt_detach(&stats->mptc);
858 1.1 dyoung evcnt_detach(&stats->mngptc);
859 1.1 dyoung evcnt_detach(&stats->ptc64);
860 1.1 dyoung evcnt_detach(&stats->ptc127);
861 1.1 dyoung evcnt_detach(&stats->ptc255);
862 1.1 dyoung evcnt_detach(&stats->ptc511);
863 1.1 dyoung evcnt_detach(&stats->ptc1023);
864 1.1 dyoung evcnt_detach(&stats->ptc1522);
865 1.1 dyoung
866 1.1 dyoung ixgbe_free_transmit_structures(adapter);
867 1.1 dyoung ixgbe_free_receive_structures(adapter);
868 1.1 dyoung free(adapter->mta, M_DEVBUF);
869 1.1 dyoung
870 1.1 dyoung IXGBE_CORE_LOCK_DESTROY(adapter);
871 1.1 dyoung return (0);
872 1.1 dyoung }
873 1.1 dyoung
874 1.1 dyoung /*********************************************************************
875 1.1 dyoung *
876 1.1 dyoung * Shutdown entry point
877 1.1 dyoung *
878 1.1 dyoung **********************************************************************/
879 1.1 dyoung
880 1.1 dyoung #if 0 /* XXX NetBSD ought to register something like this through pmf(9) */
881 1.1 dyoung static int
882 1.1 dyoung ixgbe_shutdown(device_t dev)
883 1.1 dyoung {
884 1.1 dyoung struct adapter *adapter = device_private(dev);
885 1.1 dyoung IXGBE_CORE_LOCK(adapter);
886 1.1 dyoung ixgbe_stop(adapter);
887 1.1 dyoung IXGBE_CORE_UNLOCK(adapter);
888 1.1 dyoung return (0);
889 1.1 dyoung }
890 1.1 dyoung #endif
891 1.1 dyoung
892 1.1 dyoung
893 1.14.2.5 riz #ifdef IXGBE_LEGACY_TX
894 1.1 dyoung /*********************************************************************
895 1.1 dyoung * Transmit entry point
896 1.1 dyoung *
897 1.1 dyoung * ixgbe_start is called by the stack to initiate a transmit.
898 1.1 dyoung * The driver will remain in this routine as long as there are
899 1.1 dyoung * packets to transmit and transmit resources are available.
900 1.1 dyoung * In case resources are not available stack is notified and
901 1.1 dyoung * the packet is requeued.
902 1.1 dyoung **********************************************************************/
903 1.1 dyoung
904 1.1 dyoung static void
905 1.1 dyoung ixgbe_start_locked(struct tx_ring *txr, struct ifnet * ifp)
906 1.1 dyoung {
907 1.1 dyoung int rc;
908 1.1 dyoung struct mbuf *m_head;
909 1.1 dyoung struct adapter *adapter = txr->adapter;
910 1.1 dyoung
911 1.1 dyoung IXGBE_TX_LOCK_ASSERT(txr);
912 1.1 dyoung
913 1.14.2.4 riz if ((ifp->if_flags & IFF_RUNNING) == 0)
914 1.1 dyoung return;
915 1.1 dyoung if (!adapter->link_active)
916 1.1 dyoung return;
917 1.1 dyoung
918 1.1 dyoung while (!IFQ_IS_EMPTY(&ifp->if_snd)) {
919 1.14.2.4 riz if (txr->tx_avail <= IXGBE_QUEUE_MIN_FREE)
920 1.14.2.4 riz break;
921 1.1 dyoung
922 1.1 dyoung IFQ_POLL(&ifp->if_snd, m_head);
923 1.1 dyoung if (m_head == NULL)
924 1.1 dyoung break;
925 1.1 dyoung
926 1.1 dyoung if ((rc = ixgbe_xmit(txr, m_head)) == EAGAIN) {
927 1.1 dyoung break;
928 1.1 dyoung }
929 1.1 dyoung IFQ_DEQUEUE(&ifp->if_snd, m_head);
930 1.1 dyoung if (rc == EFBIG) {
931 1.1 dyoung struct mbuf *mtmp;
932 1.1 dyoung
933 1.14.2.5 riz if ((mtmp = m_defrag(m_head, M_NOWAIT)) != NULL) {
934 1.1 dyoung m_head = mtmp;
935 1.1 dyoung rc = ixgbe_xmit(txr, m_head);
936 1.1 dyoung if (rc != 0)
937 1.1 dyoung adapter->efbig2_tx_dma_setup.ev_count++;
938 1.1 dyoung } else
939 1.1 dyoung adapter->m_defrag_failed.ev_count++;
940 1.1 dyoung }
941 1.1 dyoung if (rc != 0) {
942 1.1 dyoung m_freem(m_head);
943 1.1 dyoung continue;
944 1.1 dyoung }
945 1.1 dyoung
946 1.1 dyoung /* Send a copy of the frame to the BPF listener */
947 1.1 dyoung bpf_mtap(ifp, m_head);
948 1.1 dyoung
949 1.1 dyoung /* Set watchdog on */
950 1.1 dyoung getmicrotime(&txr->watchdog_time);
951 1.1 dyoung txr->queue_status = IXGBE_QUEUE_WORKING;
952 1.1 dyoung
953 1.1 dyoung }
954 1.1 dyoung return;
955 1.1 dyoung }
956 1.1 dyoung
957 1.1 dyoung /*
958 1.1 dyoung * Legacy TX start - called by the stack, this
959 1.1 dyoung * always uses the first tx ring, and should
960 1.1 dyoung * not be used with multiqueue tx enabled.
961 1.1 dyoung */
962 1.1 dyoung static void
963 1.1 dyoung ixgbe_start(struct ifnet *ifp)
964 1.1 dyoung {
965 1.1 dyoung struct adapter *adapter = ifp->if_softc;
966 1.1 dyoung struct tx_ring *txr = adapter->tx_rings;
967 1.1 dyoung
968 1.1 dyoung if (ifp->if_flags & IFF_RUNNING) {
969 1.1 dyoung IXGBE_TX_LOCK(txr);
970 1.1 dyoung ixgbe_start_locked(txr, ifp);
971 1.1 dyoung IXGBE_TX_UNLOCK(txr);
972 1.1 dyoung }
973 1.1 dyoung return;
974 1.1 dyoung }
975 1.1 dyoung
976 1.14.2.5 riz #else /* ! IXGBE_LEGACY_TX */
977 1.14.2.5 riz
978 1.1 dyoung /*
979 1.1 dyoung ** Multiqueue Transmit driver
980 1.1 dyoung **
981 1.1 dyoung */
982 1.1 dyoung static int
983 1.1 dyoung ixgbe_mq_start(struct ifnet *ifp, struct mbuf *m)
984 1.1 dyoung {
985 1.1 dyoung struct adapter *adapter = ifp->if_softc;
986 1.1 dyoung struct ix_queue *que;
987 1.1 dyoung struct tx_ring *txr;
988 1.1 dyoung int i = 0, err = 0;
989 1.1 dyoung
990 1.1 dyoung /* Which queue to use */
991 1.1 dyoung if ((m->m_flags & M_FLOWID) != 0)
992 1.1 dyoung i = m->m_pkthdr.flowid % adapter->num_queues;
993 1.14.2.4 riz else
994 1.14.2.5 riz i = cpu_index(curcpu()) % adapter->num_queues;
995 1.1 dyoung
996 1.1 dyoung txr = &adapter->tx_rings[i];
997 1.1 dyoung que = &adapter->queues[i];
998 1.1 dyoung
999 1.1 dyoung if (IXGBE_TX_TRYLOCK(txr)) {
1000 1.1 dyoung err = ixgbe_mq_start_locked(ifp, txr, m);
1001 1.1 dyoung IXGBE_TX_UNLOCK(txr);
1002 1.1 dyoung } else {
1003 1.1 dyoung err = drbr_enqueue(ifp, txr->br, m);
1004 1.14.2.4 riz softint_schedule(txr->txq_si);
1005 1.1 dyoung }
1006 1.1 dyoung
1007 1.1 dyoung return (err);
1008 1.1 dyoung }
1009 1.1 dyoung
1010 1.1 dyoung static int
1011 1.1 dyoung ixgbe_mq_start_locked(struct ifnet *ifp, struct tx_ring *txr, struct mbuf *m)
1012 1.1 dyoung {
1013 1.1 dyoung struct adapter *adapter = txr->adapter;
1014 1.1 dyoung struct mbuf *next;
1015 1.1 dyoung int enqueued, err = 0;
1016 1.1 dyoung
1017 1.14.2.4 riz if (((ifp->if_flags & IFF_RUNNING) == 0) ||
1018 1.14.2.4 riz adapter->link_active == 0) {
1019 1.1 dyoung if (m != NULL)
1020 1.1 dyoung err = drbr_enqueue(ifp, txr->br, m);
1021 1.1 dyoung return (err);
1022 1.1 dyoung }
1023 1.1 dyoung
1024 1.1 dyoung enqueued = 0;
1025 1.14.2.5 riz if (m != NULL) {
1026 1.14.2.5 riz err = drbr_enqueue(ifp, txr->br, m);
1027 1.14.2.5 riz if (err) {
1028 1.1 dyoung return (err);
1029 1.14.2.5 riz }
1030 1.14.2.5 riz }
1031 1.1 dyoung
1032 1.1 dyoung /* Process the queue */
1033 1.14.2.5 riz while ((next = drbr_peek(ifp, txr->br)) != NULL) {
1034 1.1 dyoung if ((err = ixgbe_xmit(txr, &next)) != 0) {
1035 1.14.2.5 riz if (next == NULL) {
1036 1.14.2.5 riz drbr_advance(ifp, txr->br);
1037 1.14.2.5 riz } else {
1038 1.14.2.5 riz drbr_putback(ifp, txr->br, next);
1039 1.14.2.5 riz }
1040 1.1 dyoung break;
1041 1.1 dyoung }
1042 1.14.2.5 riz drbr_advance(ifp, txr->br);
1043 1.1 dyoung enqueued++;
1044 1.1 dyoung /* Send a copy of the frame to the BPF listener */
1045 1.1 dyoung bpf_mtap(ifp, next);
1046 1.1 dyoung if ((ifp->if_flags & IFF_RUNNING) == 0)
1047 1.1 dyoung break;
1048 1.1 dyoung if (txr->tx_avail < IXGBE_TX_OP_THRESHOLD)
1049 1.1 dyoung ixgbe_txeof(txr);
1050 1.1 dyoung }
1051 1.1 dyoung
1052 1.1 dyoung if (enqueued > 0) {
1053 1.1 dyoung /* Set watchdog on */
1054 1.1 dyoung txr->queue_status = IXGBE_QUEUE_WORKING;
1055 1.1 dyoung getmicrotime(&txr->watchdog_time);
1056 1.1 dyoung }
1057 1.1 dyoung
1058 1.14.2.4 riz if (txr->tx_avail < IXGBE_TX_CLEANUP_THRESHOLD)
1059 1.14.2.4 riz ixgbe_txeof(txr);
1060 1.14.2.4 riz
1061 1.1 dyoung return (err);
1062 1.1 dyoung }
1063 1.1 dyoung
1064 1.1 dyoung /*
1065 1.14.2.4 riz * Called from a taskqueue to drain queued transmit packets.
1066 1.14.2.4 riz */
1067 1.14.2.4 riz static void
1068 1.14.2.5 riz ixgbe_deferred_mq_start(void *arg)
1069 1.14.2.4 riz {
1070 1.14.2.4 riz struct tx_ring *txr = arg;
1071 1.14.2.4 riz struct adapter *adapter = txr->adapter;
1072 1.14.2.4 riz struct ifnet *ifp = adapter->ifp;
1073 1.14.2.4 riz
1074 1.14.2.4 riz IXGBE_TX_LOCK(txr);
1075 1.14.2.4 riz if (!drbr_empty(ifp, txr->br))
1076 1.14.2.4 riz ixgbe_mq_start_locked(ifp, txr, NULL);
1077 1.14.2.4 riz IXGBE_TX_UNLOCK(txr);
1078 1.14.2.4 riz }
1079 1.14.2.4 riz
1080 1.14.2.4 riz /*
1081 1.1 dyoung ** Flush all ring buffers
1082 1.1 dyoung */
1083 1.1 dyoung static void
1084 1.1 dyoung ixgbe_qflush(struct ifnet *ifp)
1085 1.1 dyoung {
1086 1.1 dyoung struct adapter *adapter = ifp->if_softc;
1087 1.1 dyoung struct tx_ring *txr = adapter->tx_rings;
1088 1.1 dyoung struct mbuf *m;
1089 1.1 dyoung
1090 1.1 dyoung for (int i = 0; i < adapter->num_queues; i++, txr++) {
1091 1.1 dyoung IXGBE_TX_LOCK(txr);
1092 1.1 dyoung while ((m = buf_ring_dequeue_sc(txr->br)) != NULL)
1093 1.1 dyoung m_freem(m);
1094 1.1 dyoung IXGBE_TX_UNLOCK(txr);
1095 1.1 dyoung }
1096 1.1 dyoung if_qflush(ifp);
1097 1.1 dyoung }
1098 1.14.2.5 riz #endif /* IXGBE_LEGACY_TX */
1099 1.1 dyoung
1100 1.1 dyoung static int
1101 1.1 dyoung ixgbe_ifflags_cb(struct ethercom *ec)
1102 1.1 dyoung {
1103 1.1 dyoung struct ifnet *ifp = &ec->ec_if;
1104 1.1 dyoung struct adapter *adapter = ifp->if_softc;
1105 1.1 dyoung int change = ifp->if_flags ^ adapter->if_flags, rc = 0;
1106 1.1 dyoung
1107 1.1 dyoung IXGBE_CORE_LOCK(adapter);
1108 1.1 dyoung
1109 1.1 dyoung if (change != 0)
1110 1.1 dyoung adapter->if_flags = ifp->if_flags;
1111 1.1 dyoung
1112 1.1 dyoung if ((change & ~(IFF_CANTCHANGE|IFF_DEBUG)) != 0)
1113 1.1 dyoung rc = ENETRESET;
1114 1.1 dyoung else if ((change & (IFF_PROMISC | IFF_ALLMULTI)) != 0)
1115 1.1 dyoung ixgbe_set_promisc(adapter);
1116 1.1 dyoung
1117 1.14.2.3 martin /* Set up VLAN support and filter */
1118 1.14.2.3 martin ixgbe_setup_vlan_hw_support(adapter);
1119 1.14.2.3 martin
1120 1.1 dyoung IXGBE_CORE_UNLOCK(adapter);
1121 1.1 dyoung
1122 1.1 dyoung return rc;
1123 1.1 dyoung }
1124 1.1 dyoung
1125 1.1 dyoung /*********************************************************************
1126 1.1 dyoung * Ioctl entry point
1127 1.1 dyoung *
1128 1.1 dyoung * ixgbe_ioctl is called when the user wants to configure the
1129 1.1 dyoung * interface.
1130 1.1 dyoung *
1131 1.1 dyoung * return 0 on success, positive on failure
1132 1.1 dyoung **********************************************************************/
1133 1.1 dyoung
1134 1.1 dyoung static int
1135 1.1 dyoung ixgbe_ioctl(struct ifnet * ifp, u_long command, void *data)
1136 1.1 dyoung {
1137 1.1 dyoung struct adapter *adapter = ifp->if_softc;
1138 1.14.2.5 riz struct ixgbe_hw *hw = &adapter->hw;
1139 1.1 dyoung struct ifcapreq *ifcr = data;
1140 1.1 dyoung struct ifreq *ifr = data;
1141 1.1 dyoung int error = 0;
1142 1.1 dyoung int l4csum_en;
1143 1.1 dyoung const int l4csum = IFCAP_CSUM_TCPv4_Rx|IFCAP_CSUM_UDPv4_Rx|
1144 1.1 dyoung IFCAP_CSUM_TCPv6_Rx|IFCAP_CSUM_UDPv6_Rx;
1145 1.1 dyoung
1146 1.1 dyoung switch (command) {
1147 1.1 dyoung case SIOCSIFFLAGS:
1148 1.1 dyoung IOCTL_DEBUGOUT("ioctl: SIOCSIFFLAGS (Set Interface Flags)");
1149 1.1 dyoung break;
1150 1.1 dyoung case SIOCADDMULTI:
1151 1.1 dyoung case SIOCDELMULTI:
1152 1.1 dyoung IOCTL_DEBUGOUT("ioctl: SIOC(ADD|DEL)MULTI");
1153 1.1 dyoung break;
1154 1.1 dyoung case SIOCSIFMEDIA:
1155 1.1 dyoung case SIOCGIFMEDIA:
1156 1.1 dyoung IOCTL_DEBUGOUT("ioctl: SIOCxIFMEDIA (Get/Set Interface Media)");
1157 1.1 dyoung break;
1158 1.1 dyoung case SIOCSIFCAP:
1159 1.1 dyoung IOCTL_DEBUGOUT("ioctl: SIOCSIFCAP (Set Capabilities)");
1160 1.1 dyoung break;
1161 1.1 dyoung case SIOCSIFMTU:
1162 1.1 dyoung IOCTL_DEBUGOUT("ioctl: SIOCSIFMTU (Set Interface MTU)");
1163 1.1 dyoung break;
1164 1.1 dyoung default:
1165 1.1 dyoung IOCTL_DEBUGOUT1("ioctl: UNKNOWN (0x%X)\n", (int)command);
1166 1.1 dyoung break;
1167 1.1 dyoung }
1168 1.1 dyoung
1169 1.1 dyoung switch (command) {
1170 1.1 dyoung case SIOCSIFMEDIA:
1171 1.1 dyoung case SIOCGIFMEDIA:
1172 1.1 dyoung return ifmedia_ioctl(ifp, ifr, &adapter->media, command);
1173 1.14.2.5 riz case SIOCGI2C:
1174 1.14.2.5 riz {
1175 1.14.2.5 riz struct ixgbe_i2c_req i2c;
1176 1.14.2.5 riz IOCTL_DEBUGOUT("ioctl: SIOCGI2C (Get I2C Data)");
1177 1.14.2.5 riz error = copyin(ifr->ifr_data, &i2c, sizeof(i2c));
1178 1.14.2.5 riz if (error)
1179 1.14.2.5 riz break;
1180 1.14.2.5 riz if ((i2c.dev_addr != 0xA0) || (i2c.dev_addr != 0xA2)){
1181 1.14.2.5 riz error = EINVAL;
1182 1.14.2.5 riz break;
1183 1.14.2.5 riz }
1184 1.14.2.5 riz hw->phy.ops.read_i2c_byte(hw, i2c.offset,
1185 1.14.2.5 riz i2c.dev_addr, i2c.data);
1186 1.14.2.5 riz error = copyout(&i2c, ifr->ifr_data, sizeof(i2c));
1187 1.14.2.5 riz break;
1188 1.14.2.5 riz }
1189 1.1 dyoung case SIOCSIFCAP:
1190 1.1 dyoung /* Layer-4 Rx checksum offload has to be turned on and
1191 1.1 dyoung * off as a unit.
1192 1.1 dyoung */
1193 1.1 dyoung l4csum_en = ifcr->ifcr_capenable & l4csum;
1194 1.1 dyoung if (l4csum_en != l4csum && l4csum_en != 0)
1195 1.1 dyoung return EINVAL;
1196 1.1 dyoung /*FALLTHROUGH*/
1197 1.1 dyoung case SIOCADDMULTI:
1198 1.1 dyoung case SIOCDELMULTI:
1199 1.1 dyoung case SIOCSIFFLAGS:
1200 1.1 dyoung case SIOCSIFMTU:
1201 1.1 dyoung default:
1202 1.1 dyoung if ((error = ether_ioctl(ifp, command, data)) != ENETRESET)
1203 1.1 dyoung return error;
1204 1.1 dyoung if ((ifp->if_flags & IFF_RUNNING) == 0)
1205 1.1 dyoung ;
1206 1.1 dyoung else if (command == SIOCSIFCAP || command == SIOCSIFMTU) {
1207 1.1 dyoung IXGBE_CORE_LOCK(adapter);
1208 1.1 dyoung ixgbe_init_locked(adapter);
1209 1.1 dyoung IXGBE_CORE_UNLOCK(adapter);
1210 1.1 dyoung } else if (command == SIOCADDMULTI || command == SIOCDELMULTI) {
1211 1.1 dyoung /*
1212 1.1 dyoung * Multicast list has changed; set the hardware filter
1213 1.1 dyoung * accordingly.
1214 1.1 dyoung */
1215 1.1 dyoung IXGBE_CORE_LOCK(adapter);
1216 1.1 dyoung ixgbe_disable_intr(adapter);
1217 1.1 dyoung ixgbe_set_multi(adapter);
1218 1.1 dyoung ixgbe_enable_intr(adapter);
1219 1.1 dyoung IXGBE_CORE_UNLOCK(adapter);
1220 1.1 dyoung }
1221 1.1 dyoung return 0;
1222 1.1 dyoung }
1223 1.14.2.5 riz
1224 1.14.2.5 riz return error;
1225 1.1 dyoung }
1226 1.1 dyoung
1227 1.1 dyoung /*********************************************************************
1228 1.1 dyoung * Init entry point
1229 1.1 dyoung *
1230 1.1 dyoung * This routine is used in two ways. It is used by the stack as
1231 1.1 dyoung * init entry point in network interface structure. It is also used
1232 1.1 dyoung * by the driver as a hw/sw initialization routine to get to a
1233 1.1 dyoung * consistent state.
1234 1.1 dyoung *
1235 1.1 dyoung * return 0 on success, positive on failure
1236 1.1 dyoung **********************************************************************/
1237 1.1 dyoung #define IXGBE_MHADD_MFS_SHIFT 16
1238 1.1 dyoung
1239 1.1 dyoung static void
1240 1.1 dyoung ixgbe_init_locked(struct adapter *adapter)
1241 1.1 dyoung {
1242 1.1 dyoung struct ifnet *ifp = adapter->ifp;
1243 1.1 dyoung device_t dev = adapter->dev;
1244 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
1245 1.1 dyoung u32 k, txdctl, mhadd, gpie;
1246 1.1 dyoung u32 rxdctl, rxctrl;
1247 1.1 dyoung
1248 1.1 dyoung /* XXX check IFF_UP and IFF_RUNNING, power-saving state! */
1249 1.1 dyoung
1250 1.1 dyoung KASSERT(mutex_owned(&adapter->core_mtx));
1251 1.1 dyoung INIT_DEBUGOUT("ixgbe_init: begin");
1252 1.1 dyoung hw->adapter_stopped = FALSE;
1253 1.1 dyoung ixgbe_stop_adapter(hw);
1254 1.1 dyoung callout_stop(&adapter->timer);
1255 1.1 dyoung
1256 1.1 dyoung /* XXX I moved this here from the SIOCSIFMTU case in ixgbe_ioctl(). */
1257 1.1 dyoung adapter->max_frame_size =
1258 1.1 dyoung ifp->if_mtu + ETHER_HDR_LEN + ETHER_CRC_LEN;
1259 1.1 dyoung
1260 1.1 dyoung /* reprogram the RAR[0] in case user changed it. */
1261 1.1 dyoung ixgbe_set_rar(hw, 0, adapter->hw.mac.addr, 0, IXGBE_RAH_AV);
1262 1.1 dyoung
1263 1.1 dyoung /* Get the latest mac address, User can use a LAA */
1264 1.1 dyoung memcpy(hw->mac.addr, CLLADDR(adapter->ifp->if_sadl),
1265 1.1 dyoung IXGBE_ETH_LENGTH_OF_ADDRESS);
1266 1.1 dyoung ixgbe_set_rar(hw, 0, hw->mac.addr, 0, 1);
1267 1.1 dyoung hw->addr_ctrl.rar_used_count = 1;
1268 1.1 dyoung
1269 1.1 dyoung /* Prepare transmit descriptors and buffers */
1270 1.1 dyoung if (ixgbe_setup_transmit_structures(adapter)) {
1271 1.1 dyoung device_printf(dev,"Could not setup transmit structures\n");
1272 1.1 dyoung ixgbe_stop(adapter);
1273 1.1 dyoung return;
1274 1.1 dyoung }
1275 1.1 dyoung
1276 1.1 dyoung ixgbe_init_hw(hw);
1277 1.1 dyoung ixgbe_initialize_transmit_units(adapter);
1278 1.1 dyoung
1279 1.1 dyoung /* Setup Multicast table */
1280 1.1 dyoung ixgbe_set_multi(adapter);
1281 1.1 dyoung
1282 1.1 dyoung /*
1283 1.1 dyoung ** Determine the correct mbuf pool
1284 1.14.2.4 riz ** for doing jumbo frames
1285 1.1 dyoung */
1286 1.1 dyoung if (adapter->max_frame_size <= 2048)
1287 1.1 dyoung adapter->rx_mbuf_sz = MCLBYTES;
1288 1.1 dyoung else if (adapter->max_frame_size <= 4096)
1289 1.1 dyoung adapter->rx_mbuf_sz = MJUMPAGESIZE;
1290 1.1 dyoung else if (adapter->max_frame_size <= 9216)
1291 1.1 dyoung adapter->rx_mbuf_sz = MJUM9BYTES;
1292 1.1 dyoung else
1293 1.1 dyoung adapter->rx_mbuf_sz = MJUM16BYTES;
1294 1.1 dyoung
1295 1.1 dyoung /* Prepare receive descriptors and buffers */
1296 1.1 dyoung if (ixgbe_setup_receive_structures(adapter)) {
1297 1.1 dyoung device_printf(dev,"Could not setup receive structures\n");
1298 1.1 dyoung ixgbe_stop(adapter);
1299 1.1 dyoung return;
1300 1.1 dyoung }
1301 1.1 dyoung
1302 1.1 dyoung /* Configure RX settings */
1303 1.1 dyoung ixgbe_initialize_receive_units(adapter);
1304 1.1 dyoung
1305 1.1 dyoung gpie = IXGBE_READ_REG(&adapter->hw, IXGBE_GPIE);
1306 1.1 dyoung
1307 1.1 dyoung /* Enable Fan Failure Interrupt */
1308 1.1 dyoung gpie |= IXGBE_SDP1_GPIEN;
1309 1.1 dyoung
1310 1.1 dyoung /* Add for Thermal detection */
1311 1.1 dyoung if (hw->mac.type == ixgbe_mac_82599EB)
1312 1.1 dyoung gpie |= IXGBE_SDP2_GPIEN;
1313 1.1 dyoung
1314 1.14.2.4 riz /* Thermal Failure Detection */
1315 1.14.2.4 riz if (hw->mac.type == ixgbe_mac_X540)
1316 1.14.2.4 riz gpie |= IXGBE_SDP0_GPIEN;
1317 1.14.2.4 riz
1318 1.1 dyoung if (adapter->msix > 1) {
1319 1.1 dyoung /* Enable Enhanced MSIX mode */
1320 1.1 dyoung gpie |= IXGBE_GPIE_MSIX_MODE;
1321 1.1 dyoung gpie |= IXGBE_GPIE_EIAME | IXGBE_GPIE_PBA_SUPPORT |
1322 1.1 dyoung IXGBE_GPIE_OCD;
1323 1.1 dyoung }
1324 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_GPIE, gpie);
1325 1.1 dyoung
1326 1.1 dyoung /* Set MTU size */
1327 1.1 dyoung if (ifp->if_mtu > ETHERMTU) {
1328 1.1 dyoung mhadd = IXGBE_READ_REG(hw, IXGBE_MHADD);
1329 1.1 dyoung mhadd &= ~IXGBE_MHADD_MFS_MASK;
1330 1.1 dyoung mhadd |= adapter->max_frame_size << IXGBE_MHADD_MFS_SHIFT;
1331 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_MHADD, mhadd);
1332 1.1 dyoung }
1333 1.1 dyoung
1334 1.1 dyoung /* Now enable all the queues */
1335 1.1 dyoung
1336 1.1 dyoung for (int i = 0; i < adapter->num_queues; i++) {
1337 1.1 dyoung txdctl = IXGBE_READ_REG(hw, IXGBE_TXDCTL(i));
1338 1.1 dyoung txdctl |= IXGBE_TXDCTL_ENABLE;
1339 1.1 dyoung /* Set WTHRESH to 8, burst writeback */
1340 1.1 dyoung txdctl |= (8 << 16);
1341 1.14.2.4 riz /*
1342 1.14.2.4 riz * When the internal queue falls below PTHRESH (32),
1343 1.14.2.4 riz * start prefetching as long as there are at least
1344 1.14.2.4 riz * HTHRESH (1) buffers ready. The values are taken
1345 1.14.2.4 riz * from the Intel linux driver 3.8.21.
1346 1.14.2.4 riz * Prefetching enables tx line rate even with 1 queue.
1347 1.14.2.4 riz */
1348 1.14.2.4 riz txdctl |= (32 << 0) | (1 << 8);
1349 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_TXDCTL(i), txdctl);
1350 1.1 dyoung }
1351 1.1 dyoung
1352 1.1 dyoung for (int i = 0; i < adapter->num_queues; i++) {
1353 1.1 dyoung rxdctl = IXGBE_READ_REG(hw, IXGBE_RXDCTL(i));
1354 1.1 dyoung if (hw->mac.type == ixgbe_mac_82598EB) {
1355 1.1 dyoung /*
1356 1.1 dyoung ** PTHRESH = 21
1357 1.1 dyoung ** HTHRESH = 4
1358 1.1 dyoung ** WTHRESH = 8
1359 1.1 dyoung */
1360 1.1 dyoung rxdctl &= ~0x3FFFFF;
1361 1.1 dyoung rxdctl |= 0x080420;
1362 1.1 dyoung }
1363 1.1 dyoung rxdctl |= IXGBE_RXDCTL_ENABLE;
1364 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_RXDCTL(i), rxdctl);
1365 1.1 dyoung /* XXX I don't trust this loop, and I don't trust the
1366 1.1 dyoung * XXX memory barrier. What is this meant to do? --dyoung
1367 1.1 dyoung */
1368 1.1 dyoung for (k = 0; k < 10; k++) {
1369 1.1 dyoung if (IXGBE_READ_REG(hw, IXGBE_RXDCTL(i)) &
1370 1.1 dyoung IXGBE_RXDCTL_ENABLE)
1371 1.1 dyoung break;
1372 1.1 dyoung else
1373 1.1 dyoung msec_delay(1);
1374 1.1 dyoung }
1375 1.1 dyoung wmb();
1376 1.14.2.3 martin #ifdef DEV_NETMAP
1377 1.14.2.3 martin /*
1378 1.14.2.3 martin * In netmap mode, we must preserve the buffers made
1379 1.14.2.3 martin * available to userspace before the if_init()
1380 1.14.2.3 martin * (this is true by default on the TX side, because
1381 1.14.2.3 martin * init makes all buffers available to userspace).
1382 1.14.2.3 martin *
1383 1.14.2.3 martin * netmap_reset() and the device specific routines
1384 1.14.2.3 martin * (e.g. ixgbe_setup_receive_rings()) map these
1385 1.14.2.3 martin * buffers at the end of the NIC ring, so here we
1386 1.14.2.3 martin * must set the RDT (tail) register to make sure
1387 1.14.2.3 martin * they are not overwritten.
1388 1.14.2.3 martin *
1389 1.14.2.3 martin * In this driver the NIC ring starts at RDH = 0,
1390 1.14.2.3 martin * RDT points to the last slot available for reception (?),
1391 1.14.2.3 martin * so RDT = num_rx_desc - 1 means the whole ring is available.
1392 1.14.2.3 martin */
1393 1.14.2.3 martin if (ifp->if_capenable & IFCAP_NETMAP) {
1394 1.14.2.3 martin struct netmap_adapter *na = NA(adapter->ifp);
1395 1.14.2.3 martin struct netmap_kring *kring = &na->rx_rings[i];
1396 1.14.2.3 martin int t = na->num_rx_desc - 1 - kring->nr_hwavail;
1397 1.14.2.3 martin
1398 1.14.2.3 martin IXGBE_WRITE_REG(hw, IXGBE_RDT(i), t);
1399 1.14.2.3 martin } else
1400 1.14.2.3 martin #endif /* DEV_NETMAP */
1401 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_RDT(i), adapter->num_rx_desc - 1);
1402 1.1 dyoung }
1403 1.1 dyoung
1404 1.1 dyoung /* Set up VLAN support and filter */
1405 1.1 dyoung ixgbe_setup_vlan_hw_support(adapter);
1406 1.1 dyoung
1407 1.1 dyoung /* Enable Receive engine */
1408 1.1 dyoung rxctrl = IXGBE_READ_REG(hw, IXGBE_RXCTRL);
1409 1.1 dyoung if (hw->mac.type == ixgbe_mac_82598EB)
1410 1.1 dyoung rxctrl |= IXGBE_RXCTRL_DMBYPS;
1411 1.1 dyoung rxctrl |= IXGBE_RXCTRL_RXEN;
1412 1.1 dyoung ixgbe_enable_rx_dma(hw, rxctrl);
1413 1.1 dyoung
1414 1.1 dyoung callout_reset(&adapter->timer, hz, ixgbe_local_timer, adapter);
1415 1.1 dyoung
1416 1.1 dyoung /* Set up MSI/X routing */
1417 1.1 dyoung if (ixgbe_enable_msix) {
1418 1.1 dyoung ixgbe_configure_ivars(adapter);
1419 1.1 dyoung /* Set up auto-mask */
1420 1.1 dyoung if (hw->mac.type == ixgbe_mac_82598EB)
1421 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EIAM, IXGBE_EICS_RTX_QUEUE);
1422 1.1 dyoung else {
1423 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EIAM_EX(0), 0xFFFFFFFF);
1424 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EIAM_EX(1), 0xFFFFFFFF);
1425 1.1 dyoung }
1426 1.1 dyoung } else { /* Simple settings for Legacy/MSI */
1427 1.1 dyoung ixgbe_set_ivar(adapter, 0, 0, 0);
1428 1.1 dyoung ixgbe_set_ivar(adapter, 0, 0, 1);
1429 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EIAM, IXGBE_EICS_RTX_QUEUE);
1430 1.1 dyoung }
1431 1.1 dyoung
1432 1.1 dyoung #ifdef IXGBE_FDIR
1433 1.1 dyoung /* Init Flow director */
1434 1.14.2.4 riz if (hw->mac.type != ixgbe_mac_82598EB) {
1435 1.14.2.4 riz u32 hdrm = 32 << fdir_pballoc;
1436 1.14.2.4 riz
1437 1.14.2.4 riz hw->mac.ops.setup_rxpba(hw, 0, hdrm, PBA_STRATEGY_EQUAL);
1438 1.1 dyoung ixgbe_init_fdir_signature_82599(&adapter->hw, fdir_pballoc);
1439 1.14.2.4 riz }
1440 1.1 dyoung #endif
1441 1.1 dyoung
1442 1.1 dyoung /*
1443 1.1 dyoung ** Check on any SFP devices that
1444 1.1 dyoung ** need to be kick-started
1445 1.1 dyoung */
1446 1.1 dyoung if (hw->phy.type == ixgbe_phy_none) {
1447 1.1 dyoung int err = hw->phy.ops.identify(hw);
1448 1.1 dyoung if (err == IXGBE_ERR_SFP_NOT_SUPPORTED) {
1449 1.1 dyoung device_printf(dev,
1450 1.1 dyoung "Unsupported SFP+ module type was detected.\n");
1451 1.1 dyoung return;
1452 1.1 dyoung }
1453 1.1 dyoung }
1454 1.1 dyoung
1455 1.1 dyoung /* Set moderation on the Link interrupt */
1456 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EITR(adapter->linkvec), IXGBE_LINK_ITR);
1457 1.1 dyoung
1458 1.1 dyoung /* Config/Enable Link */
1459 1.1 dyoung ixgbe_config_link(adapter);
1460 1.1 dyoung
1461 1.14.2.4 riz /* Hardware Packet Buffer & Flow Control setup */
1462 1.14.2.4 riz {
1463 1.14.2.4 riz u32 rxpb, frame, size, tmp;
1464 1.14.2.4 riz
1465 1.14.2.4 riz frame = adapter->max_frame_size;
1466 1.14.2.4 riz
1467 1.14.2.4 riz /* Calculate High Water */
1468 1.14.2.4 riz if (hw->mac.type == ixgbe_mac_X540)
1469 1.14.2.4 riz tmp = IXGBE_DV_X540(frame, frame);
1470 1.14.2.4 riz else
1471 1.14.2.4 riz tmp = IXGBE_DV(frame, frame);
1472 1.14.2.4 riz size = IXGBE_BT2KB(tmp);
1473 1.14.2.4 riz rxpb = IXGBE_READ_REG(hw, IXGBE_RXPBSIZE(0)) >> 10;
1474 1.14.2.4 riz hw->fc.high_water[0] = rxpb - size;
1475 1.14.2.4 riz
1476 1.14.2.4 riz /* Now calculate Low Water */
1477 1.14.2.4 riz if (hw->mac.type == ixgbe_mac_X540)
1478 1.14.2.4 riz tmp = IXGBE_LOW_DV_X540(frame);
1479 1.14.2.4 riz else
1480 1.14.2.4 riz tmp = IXGBE_LOW_DV(frame);
1481 1.14.2.4 riz hw->fc.low_water[0] = IXGBE_BT2KB(tmp);
1482 1.14.2.4 riz
1483 1.14.2.5 riz hw->fc.requested_mode = adapter->fc;
1484 1.14.2.4 riz hw->fc.pause_time = IXGBE_FC_PAUSE;
1485 1.14.2.4 riz hw->fc.send_xon = TRUE;
1486 1.14.2.4 riz }
1487 1.14.2.4 riz /* Initialize the FC settings */
1488 1.14.2.4 riz ixgbe_start_hw(hw);
1489 1.14.2.4 riz
1490 1.1 dyoung /* And now turn on interrupts */
1491 1.1 dyoung ixgbe_enable_intr(adapter);
1492 1.1 dyoung
1493 1.1 dyoung /* Now inform the stack we're ready */
1494 1.1 dyoung ifp->if_flags |= IFF_RUNNING;
1495 1.1 dyoung
1496 1.1 dyoung return;
1497 1.1 dyoung }
1498 1.1 dyoung
1499 1.1 dyoung static int
1500 1.1 dyoung ixgbe_init(struct ifnet *ifp)
1501 1.1 dyoung {
1502 1.1 dyoung struct adapter *adapter = ifp->if_softc;
1503 1.1 dyoung
1504 1.1 dyoung IXGBE_CORE_LOCK(adapter);
1505 1.1 dyoung ixgbe_init_locked(adapter);
1506 1.1 dyoung IXGBE_CORE_UNLOCK(adapter);
1507 1.1 dyoung return 0; /* XXX ixgbe_init_locked cannot fail? really? */
1508 1.1 dyoung }
1509 1.1 dyoung
1510 1.1 dyoung
1511 1.1 dyoung /*
1512 1.1 dyoung **
1513 1.1 dyoung ** MSIX Interrupt Handlers and Tasklets
1514 1.1 dyoung **
1515 1.1 dyoung */
1516 1.1 dyoung
1517 1.1 dyoung static inline void
1518 1.1 dyoung ixgbe_enable_queue(struct adapter *adapter, u32 vector)
1519 1.1 dyoung {
1520 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
1521 1.13 christos u64 queue = (u64)(1ULL << vector);
1522 1.1 dyoung u32 mask;
1523 1.1 dyoung
1524 1.1 dyoung if (hw->mac.type == ixgbe_mac_82598EB) {
1525 1.1 dyoung mask = (IXGBE_EIMS_RTX_QUEUE & queue);
1526 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EIMS, mask);
1527 1.1 dyoung } else {
1528 1.1 dyoung mask = (queue & 0xFFFFFFFF);
1529 1.1 dyoung if (mask)
1530 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EIMS_EX(0), mask);
1531 1.1 dyoung mask = (queue >> 32);
1532 1.1 dyoung if (mask)
1533 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EIMS_EX(1), mask);
1534 1.1 dyoung }
1535 1.1 dyoung }
1536 1.1 dyoung
1537 1.11 joerg __unused static inline void
1538 1.1 dyoung ixgbe_disable_queue(struct adapter *adapter, u32 vector)
1539 1.1 dyoung {
1540 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
1541 1.13 christos u64 queue = (u64)(1ULL << vector);
1542 1.1 dyoung u32 mask;
1543 1.1 dyoung
1544 1.1 dyoung if (hw->mac.type == ixgbe_mac_82598EB) {
1545 1.1 dyoung mask = (IXGBE_EIMS_RTX_QUEUE & queue);
1546 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EIMC, mask);
1547 1.1 dyoung } else {
1548 1.1 dyoung mask = (queue & 0xFFFFFFFF);
1549 1.1 dyoung if (mask)
1550 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EIMC_EX(0), mask);
1551 1.1 dyoung mask = (queue >> 32);
1552 1.1 dyoung if (mask)
1553 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EIMC_EX(1), mask);
1554 1.1 dyoung }
1555 1.1 dyoung }
1556 1.1 dyoung
1557 1.1 dyoung static inline void
1558 1.1 dyoung ixgbe_rearm_queues(struct adapter *adapter, u64 queues)
1559 1.1 dyoung {
1560 1.1 dyoung u32 mask;
1561 1.1 dyoung
1562 1.1 dyoung if (adapter->hw.mac.type == ixgbe_mac_82598EB) {
1563 1.1 dyoung mask = (IXGBE_EIMS_RTX_QUEUE & queues);
1564 1.1 dyoung IXGBE_WRITE_REG(&adapter->hw, IXGBE_EICS, mask);
1565 1.1 dyoung } else {
1566 1.1 dyoung mask = (queues & 0xFFFFFFFF);
1567 1.1 dyoung IXGBE_WRITE_REG(&adapter->hw, IXGBE_EICS_EX(0), mask);
1568 1.1 dyoung mask = (queues >> 32);
1569 1.1 dyoung IXGBE_WRITE_REG(&adapter->hw, IXGBE_EICS_EX(1), mask);
1570 1.1 dyoung }
1571 1.1 dyoung }
1572 1.1 dyoung
1573 1.1 dyoung
1574 1.1 dyoung static void
1575 1.1 dyoung ixgbe_handle_que(void *context)
1576 1.1 dyoung {
1577 1.1 dyoung struct ix_queue *que = context;
1578 1.1 dyoung struct adapter *adapter = que->adapter;
1579 1.1 dyoung struct tx_ring *txr = que->txr;
1580 1.1 dyoung struct ifnet *ifp = adapter->ifp;
1581 1.1 dyoung bool more;
1582 1.1 dyoung
1583 1.1 dyoung adapter->handleq.ev_count++;
1584 1.1 dyoung
1585 1.1 dyoung if (ifp->if_flags & IFF_RUNNING) {
1586 1.14.2.5 riz more = ixgbe_rxeof(que);
1587 1.1 dyoung IXGBE_TX_LOCK(txr);
1588 1.1 dyoung ixgbe_txeof(txr);
1589 1.14.2.5 riz #ifndef IXGBE_LEGACY_TX
1590 1.1 dyoung if (!drbr_empty(ifp, txr->br))
1591 1.1 dyoung ixgbe_mq_start_locked(ifp, txr, NULL);
1592 1.1 dyoung #else
1593 1.1 dyoung if (!IFQ_IS_EMPTY(&ifp->if_snd))
1594 1.1 dyoung ixgbe_start_locked(txr, ifp);
1595 1.1 dyoung #endif
1596 1.1 dyoung IXGBE_TX_UNLOCK(txr);
1597 1.1 dyoung if (more) {
1598 1.1 dyoung adapter->req.ev_count++;
1599 1.1 dyoung softint_schedule(que->que_si);
1600 1.1 dyoung return;
1601 1.1 dyoung }
1602 1.1 dyoung }
1603 1.1 dyoung
1604 1.1 dyoung /* Reenable this interrupt */
1605 1.1 dyoung ixgbe_enable_queue(adapter, que->msix);
1606 1.1 dyoung return;
1607 1.1 dyoung }
1608 1.1 dyoung
1609 1.1 dyoung
1610 1.1 dyoung /*********************************************************************
1611 1.1 dyoung *
1612 1.1 dyoung * Legacy Interrupt Service routine
1613 1.1 dyoung *
1614 1.1 dyoung **********************************************************************/
1615 1.1 dyoung
1616 1.1 dyoung static int
1617 1.1 dyoung ixgbe_legacy_irq(void *arg)
1618 1.1 dyoung {
1619 1.1 dyoung struct ix_queue *que = arg;
1620 1.1 dyoung struct adapter *adapter = que->adapter;
1621 1.14.2.1 martin struct ifnet *ifp = adapter->ifp;
1622 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
1623 1.1 dyoung struct tx_ring *txr = adapter->tx_rings;
1624 1.14.2.1 martin bool more_tx = false, more_rx = false;
1625 1.1 dyoung u32 reg_eicr, loop = MAX_LOOP;
1626 1.1 dyoung
1627 1.1 dyoung reg_eicr = IXGBE_READ_REG(hw, IXGBE_EICR);
1628 1.1 dyoung
1629 1.1 dyoung adapter->stats.legint.ev_count++;
1630 1.1 dyoung ++que->irqs;
1631 1.1 dyoung if (reg_eicr == 0) {
1632 1.1 dyoung adapter->stats.intzero.ev_count++;
1633 1.14.2.1 martin if ((ifp->if_flags & IFF_UP) != 0)
1634 1.14.2.1 martin ixgbe_enable_intr(adapter);
1635 1.1 dyoung return 0;
1636 1.1 dyoung }
1637 1.1 dyoung
1638 1.14.2.1 martin if ((ifp->if_flags & IFF_RUNNING) != 0) {
1639 1.14.2.5 riz more_rx = ixgbe_rxeof(que);
1640 1.1 dyoung
1641 1.14.2.1 martin IXGBE_TX_LOCK(txr);
1642 1.14.2.1 martin do {
1643 1.14.2.1 martin adapter->txloops.ev_count++;
1644 1.14.2.1 martin more_tx = ixgbe_txeof(txr);
1645 1.14.2.1 martin } while (loop-- && more_tx);
1646 1.14.2.1 martin IXGBE_TX_UNLOCK(txr);
1647 1.14.2.1 martin }
1648 1.1 dyoung
1649 1.1 dyoung if (more_rx || more_tx) {
1650 1.1 dyoung if (more_rx)
1651 1.1 dyoung adapter->morerx.ev_count++;
1652 1.1 dyoung if (more_tx)
1653 1.1 dyoung adapter->moretx.ev_count++;
1654 1.1 dyoung softint_schedule(que->que_si);
1655 1.1 dyoung }
1656 1.1 dyoung
1657 1.1 dyoung /* Check for fan failure */
1658 1.1 dyoung if ((hw->phy.media_type == ixgbe_media_type_copper) &&
1659 1.1 dyoung (reg_eicr & IXGBE_EICR_GPI_SDP1)) {
1660 1.1 dyoung device_printf(adapter->dev, "\nCRITICAL: FAN FAILURE!! "
1661 1.1 dyoung "REPLACE IMMEDIATELY!!\n");
1662 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EIMS, IXGBE_EICR_GPI_SDP1);
1663 1.1 dyoung }
1664 1.1 dyoung
1665 1.1 dyoung /* Link status change */
1666 1.1 dyoung if (reg_eicr & IXGBE_EICR_LSC)
1667 1.1 dyoung softint_schedule(adapter->link_si);
1668 1.1 dyoung
1669 1.1 dyoung ixgbe_enable_intr(adapter);
1670 1.1 dyoung return 1;
1671 1.1 dyoung }
1672 1.1 dyoung
1673 1.1 dyoung
1674 1.1 dyoung #if defined(NETBSD_MSI_OR_MSIX)
1675 1.1 dyoung /*********************************************************************
1676 1.1 dyoung *
1677 1.14.2.3 martin * MSIX Queue Interrupt Service routine
1678 1.1 dyoung *
1679 1.1 dyoung **********************************************************************/
1680 1.1 dyoung void
1681 1.1 dyoung ixgbe_msix_que(void *arg)
1682 1.1 dyoung {
1683 1.1 dyoung struct ix_queue *que = arg;
1684 1.1 dyoung struct adapter *adapter = que->adapter;
1685 1.1 dyoung struct tx_ring *txr = que->txr;
1686 1.1 dyoung struct rx_ring *rxr = que->rxr;
1687 1.1 dyoung bool more_tx, more_rx;
1688 1.1 dyoung u32 newitr = 0;
1689 1.1 dyoung
1690 1.14.2.4 riz ixgbe_disable_queue(adapter, que->msix);
1691 1.1 dyoung ++que->irqs;
1692 1.1 dyoung
1693 1.14.2.5 riz more_rx = ixgbe_rxeof(que);
1694 1.1 dyoung
1695 1.1 dyoung IXGBE_TX_LOCK(txr);
1696 1.1 dyoung more_tx = ixgbe_txeof(txr);
1697 1.14.2.3 martin /*
1698 1.14.2.3 martin ** Make certain that if the stack
1699 1.14.2.3 martin ** has anything queued the task gets
1700 1.14.2.3 martin ** scheduled to handle it.
1701 1.14.2.3 martin */
1702 1.14.2.5 riz #ifdef IXGBE_LEGACY_TX
1703 1.14.2.4 riz if (!IFQ_IS_EMPTY(&adapter->ifp->if_snd))
1704 1.14.2.3 martin #else
1705 1.14.2.3 martin if (!drbr_empty(adapter->ifp, txr->br))
1706 1.14.2.3 martin #endif
1707 1.14.2.3 martin more_tx = 1;
1708 1.1 dyoung IXGBE_TX_UNLOCK(txr);
1709 1.1 dyoung
1710 1.1 dyoung /* Do AIM now? */
1711 1.1 dyoung
1712 1.1 dyoung if (ixgbe_enable_aim == FALSE)
1713 1.1 dyoung goto no_calc;
1714 1.1 dyoung /*
1715 1.1 dyoung ** Do Adaptive Interrupt Moderation:
1716 1.1 dyoung ** - Write out last calculated setting
1717 1.1 dyoung ** - Calculate based on average size over
1718 1.1 dyoung ** the last interval.
1719 1.1 dyoung */
1720 1.1 dyoung if (que->eitr_setting)
1721 1.1 dyoung IXGBE_WRITE_REG(&adapter->hw,
1722 1.1 dyoung IXGBE_EITR(que->msix), que->eitr_setting);
1723 1.1 dyoung
1724 1.1 dyoung que->eitr_setting = 0;
1725 1.1 dyoung
1726 1.1 dyoung /* Idle, do nothing */
1727 1.1 dyoung if ((txr->bytes == 0) && (rxr->bytes == 0))
1728 1.1 dyoung goto no_calc;
1729 1.1 dyoung
1730 1.1 dyoung if ((txr->bytes) && (txr->packets))
1731 1.1 dyoung newitr = txr->bytes/txr->packets;
1732 1.1 dyoung if ((rxr->bytes) && (rxr->packets))
1733 1.1 dyoung newitr = max(newitr,
1734 1.1 dyoung (rxr->bytes / rxr->packets));
1735 1.1 dyoung newitr += 24; /* account for hardware frame, crc */
1736 1.1 dyoung
1737 1.1 dyoung /* set an upper boundary */
1738 1.1 dyoung newitr = min(newitr, 3000);
1739 1.1 dyoung
1740 1.1 dyoung /* Be nice to the mid range */
1741 1.1 dyoung if ((newitr > 300) && (newitr < 1200))
1742 1.1 dyoung newitr = (newitr / 3);
1743 1.1 dyoung else
1744 1.1 dyoung newitr = (newitr / 2);
1745 1.1 dyoung
1746 1.1 dyoung if (adapter->hw.mac.type == ixgbe_mac_82598EB)
1747 1.1 dyoung newitr |= newitr << 16;
1748 1.1 dyoung else
1749 1.1 dyoung newitr |= IXGBE_EITR_CNT_WDIS;
1750 1.1 dyoung
1751 1.1 dyoung /* save for next interrupt */
1752 1.1 dyoung que->eitr_setting = newitr;
1753 1.1 dyoung
1754 1.1 dyoung /* Reset state */
1755 1.1 dyoung txr->bytes = 0;
1756 1.1 dyoung txr->packets = 0;
1757 1.1 dyoung rxr->bytes = 0;
1758 1.1 dyoung rxr->packets = 0;
1759 1.1 dyoung
1760 1.1 dyoung no_calc:
1761 1.1 dyoung if (more_tx || more_rx)
1762 1.1 dyoung softint_schedule(que->que_si);
1763 1.1 dyoung else /* Reenable this interrupt */
1764 1.1 dyoung ixgbe_enable_queue(adapter, que->msix);
1765 1.1 dyoung return;
1766 1.1 dyoung }
1767 1.1 dyoung
1768 1.1 dyoung
1769 1.1 dyoung static void
1770 1.1 dyoung ixgbe_msix_link(void *arg)
1771 1.1 dyoung {
1772 1.1 dyoung struct adapter *adapter = arg;
1773 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
1774 1.1 dyoung u32 reg_eicr;
1775 1.1 dyoung
1776 1.1 dyoung ++adapter->link_irq.ev_count;
1777 1.1 dyoung
1778 1.1 dyoung /* First get the cause */
1779 1.1 dyoung reg_eicr = IXGBE_READ_REG(hw, IXGBE_EICS);
1780 1.1 dyoung /* Clear interrupt with write */
1781 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EICR, reg_eicr);
1782 1.1 dyoung
1783 1.1 dyoung /* Link status change */
1784 1.1 dyoung if (reg_eicr & IXGBE_EICR_LSC)
1785 1.1 dyoung softint_schedule(adapter->link_si);
1786 1.1 dyoung
1787 1.1 dyoung if (adapter->hw.mac.type != ixgbe_mac_82598EB) {
1788 1.1 dyoung #ifdef IXGBE_FDIR
1789 1.1 dyoung if (reg_eicr & IXGBE_EICR_FLOW_DIR) {
1790 1.1 dyoung /* This is probably overkill :) */
1791 1.1 dyoung if (!atomic_cmpset_int(&adapter->fdir_reinit, 0, 1))
1792 1.1 dyoung return;
1793 1.14.2.4 riz /* Disable the interrupt */
1794 1.14.2.4 riz IXGBE_WRITE_REG(hw, IXGBE_EIMC, IXGBE_EICR_FLOW_DIR);
1795 1.1 dyoung softint_schedule(adapter->fdir_si);
1796 1.1 dyoung } else
1797 1.1 dyoung #endif
1798 1.1 dyoung if (reg_eicr & IXGBE_EICR_ECC) {
1799 1.1 dyoung device_printf(adapter->dev, "\nCRITICAL: ECC ERROR!! "
1800 1.1 dyoung "Please Reboot!!\n");
1801 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EICR, IXGBE_EICR_ECC);
1802 1.1 dyoung } else
1803 1.1 dyoung
1804 1.1 dyoung if (reg_eicr & IXGBE_EICR_GPI_SDP1) {
1805 1.1 dyoung /* Clear the interrupt */
1806 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EICR, IXGBE_EICR_GPI_SDP1);
1807 1.1 dyoung softint_schedule(adapter->msf_si);
1808 1.1 dyoung } else if (reg_eicr & IXGBE_EICR_GPI_SDP2) {
1809 1.1 dyoung /* Clear the interrupt */
1810 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EICR, IXGBE_EICR_GPI_SDP2);
1811 1.1 dyoung softint_schedule(adapter->mod_si);
1812 1.1 dyoung }
1813 1.1 dyoung }
1814 1.1 dyoung
1815 1.1 dyoung /* Check for fan failure */
1816 1.1 dyoung if ((hw->device_id == IXGBE_DEV_ID_82598AT) &&
1817 1.1 dyoung (reg_eicr & IXGBE_EICR_GPI_SDP1)) {
1818 1.1 dyoung device_printf(adapter->dev, "\nCRITICAL: FAN FAILURE!! "
1819 1.1 dyoung "REPLACE IMMEDIATELY!!\n");
1820 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EICR, IXGBE_EICR_GPI_SDP1);
1821 1.1 dyoung }
1822 1.1 dyoung
1823 1.14.2.4 riz /* Check for over temp condition */
1824 1.14.2.4 riz if ((hw->mac.type == ixgbe_mac_X540) &&
1825 1.14.2.5 riz (reg_eicr & IXGBE_EICR_TS)) {
1826 1.14.2.4 riz device_printf(adapter->dev, "\nCRITICAL: OVER TEMP!! "
1827 1.14.2.4 riz "PHY IS SHUT DOWN!!\n");
1828 1.14.2.4 riz device_printf(adapter->dev, "System shutdown required\n");
1829 1.14.2.5 riz IXGBE_WRITE_REG(hw, IXGBE_EICR, IXGBE_EICR_TS);
1830 1.14.2.4 riz }
1831 1.14.2.4 riz
1832 1.1 dyoung IXGBE_WRITE_REG(&adapter->hw, IXGBE_EIMS, IXGBE_EIMS_OTHER);
1833 1.1 dyoung return;
1834 1.1 dyoung }
1835 1.1 dyoung #endif
1836 1.1 dyoung
1837 1.1 dyoung /*********************************************************************
1838 1.1 dyoung *
1839 1.1 dyoung * Media Ioctl callback
1840 1.1 dyoung *
1841 1.1 dyoung * This routine is called whenever the user queries the status of
1842 1.1 dyoung * the interface using ifconfig.
1843 1.1 dyoung *
1844 1.1 dyoung **********************************************************************/
1845 1.1 dyoung static void
1846 1.1 dyoung ixgbe_media_status(struct ifnet * ifp, struct ifmediareq * ifmr)
1847 1.1 dyoung {
1848 1.1 dyoung struct adapter *adapter = ifp->if_softc;
1849 1.1 dyoung
1850 1.1 dyoung INIT_DEBUGOUT("ixgbe_media_status: begin");
1851 1.1 dyoung IXGBE_CORE_LOCK(adapter);
1852 1.1 dyoung ixgbe_update_link_status(adapter);
1853 1.1 dyoung
1854 1.1 dyoung ifmr->ifm_status = IFM_AVALID;
1855 1.1 dyoung ifmr->ifm_active = IFM_ETHER;
1856 1.1 dyoung
1857 1.1 dyoung if (!adapter->link_active) {
1858 1.1 dyoung IXGBE_CORE_UNLOCK(adapter);
1859 1.1 dyoung return;
1860 1.1 dyoung }
1861 1.1 dyoung
1862 1.1 dyoung ifmr->ifm_status |= IFM_ACTIVE;
1863 1.1 dyoung
1864 1.1 dyoung switch (adapter->link_speed) {
1865 1.14.2.4 riz case IXGBE_LINK_SPEED_100_FULL:
1866 1.14.2.4 riz ifmr->ifm_active |= IFM_100_TX | IFM_FDX;
1867 1.14.2.4 riz break;
1868 1.1 dyoung case IXGBE_LINK_SPEED_1GB_FULL:
1869 1.14.2.5 riz ifmr->ifm_active |= IFM_1000_SX | IFM_FDX;
1870 1.1 dyoung break;
1871 1.1 dyoung case IXGBE_LINK_SPEED_10GB_FULL:
1872 1.1 dyoung ifmr->ifm_active |= adapter->optics | IFM_FDX;
1873 1.1 dyoung break;
1874 1.1 dyoung }
1875 1.1 dyoung
1876 1.1 dyoung IXGBE_CORE_UNLOCK(adapter);
1877 1.1 dyoung
1878 1.1 dyoung return;
1879 1.1 dyoung }
1880 1.1 dyoung
1881 1.1 dyoung /*********************************************************************
1882 1.1 dyoung *
1883 1.1 dyoung * Media Ioctl callback
1884 1.1 dyoung *
1885 1.1 dyoung * This routine is called when the user changes speed/duplex using
1886 1.1 dyoung * media/mediopt option with ifconfig.
1887 1.1 dyoung *
1888 1.1 dyoung **********************************************************************/
1889 1.1 dyoung static int
1890 1.1 dyoung ixgbe_media_change(struct ifnet * ifp)
1891 1.1 dyoung {
1892 1.1 dyoung struct adapter *adapter = ifp->if_softc;
1893 1.1 dyoung struct ifmedia *ifm = &adapter->media;
1894 1.1 dyoung
1895 1.1 dyoung INIT_DEBUGOUT("ixgbe_media_change: begin");
1896 1.1 dyoung
1897 1.1 dyoung if (IFM_TYPE(ifm->ifm_media) != IFM_ETHER)
1898 1.1 dyoung return (EINVAL);
1899 1.1 dyoung
1900 1.1 dyoung switch (IFM_SUBTYPE(ifm->ifm_media)) {
1901 1.1 dyoung case IFM_AUTO:
1902 1.1 dyoung adapter->hw.phy.autoneg_advertised =
1903 1.14.2.4 riz IXGBE_LINK_SPEED_100_FULL |
1904 1.14.2.4 riz IXGBE_LINK_SPEED_1GB_FULL |
1905 1.14.2.4 riz IXGBE_LINK_SPEED_10GB_FULL;
1906 1.1 dyoung break;
1907 1.1 dyoung default:
1908 1.1 dyoung device_printf(adapter->dev, "Only auto media type\n");
1909 1.1 dyoung return (EINVAL);
1910 1.1 dyoung }
1911 1.1 dyoung
1912 1.1 dyoung return (0);
1913 1.1 dyoung }
1914 1.1 dyoung
1915 1.1 dyoung /*********************************************************************
1916 1.1 dyoung *
1917 1.1 dyoung * This routine maps the mbufs to tx descriptors, allowing the
1918 1.1 dyoung * TX engine to transmit the packets.
1919 1.1 dyoung * - return 0 on success, positive on failure
1920 1.1 dyoung *
1921 1.1 dyoung **********************************************************************/
1922 1.1 dyoung
1923 1.1 dyoung static int
1924 1.1 dyoung ixgbe_xmit(struct tx_ring *txr, struct mbuf *m_head)
1925 1.1 dyoung {
1926 1.1 dyoung struct m_tag *mtag;
1927 1.1 dyoung struct adapter *adapter = txr->adapter;
1928 1.1 dyoung struct ethercom *ec = &adapter->osdep.ec;
1929 1.1 dyoung u32 olinfo_status = 0, cmd_type_len;
1930 1.1 dyoung int i, j, error;
1931 1.14.2.5 riz int first;
1932 1.1 dyoung bus_dmamap_t map;
1933 1.9 skrll struct ixgbe_tx_buf *txbuf;
1934 1.1 dyoung union ixgbe_adv_tx_desc *txd = NULL;
1935 1.1 dyoung
1936 1.1 dyoung /* Basic descriptor defines */
1937 1.1 dyoung cmd_type_len = (IXGBE_ADVTXD_DTYP_DATA |
1938 1.1 dyoung IXGBE_ADVTXD_DCMD_IFCS | IXGBE_ADVTXD_DCMD_DEXT);
1939 1.1 dyoung
1940 1.1 dyoung if ((mtag = VLAN_OUTPUT_TAG(ec, m_head)) != NULL)
1941 1.1 dyoung cmd_type_len |= IXGBE_ADVTXD_DCMD_VLE;
1942 1.1 dyoung
1943 1.1 dyoung /*
1944 1.1 dyoung * Important to capture the first descriptor
1945 1.1 dyoung * used because it will contain the index of
1946 1.1 dyoung * the one we tell the hardware to report back
1947 1.1 dyoung */
1948 1.1 dyoung first = txr->next_avail_desc;
1949 1.1 dyoung txbuf = &txr->tx_buffers[first];
1950 1.1 dyoung map = txbuf->map;
1951 1.1 dyoung
1952 1.1 dyoung /*
1953 1.1 dyoung * Map the packet for DMA.
1954 1.1 dyoung */
1955 1.1 dyoung error = bus_dmamap_load_mbuf(txr->txtag->dt_dmat, map,
1956 1.1 dyoung m_head, BUS_DMA_NOWAIT);
1957 1.1 dyoung
1958 1.14.2.5 riz if (__predict_false(error)) {
1959 1.14.2.5 riz
1960 1.14.2.5 riz switch (error) {
1961 1.14.2.5 riz case EAGAIN:
1962 1.14.2.5 riz adapter->eagain_tx_dma_setup.ev_count++;
1963 1.14.2.5 riz return EAGAIN;
1964 1.14.2.5 riz case ENOMEM:
1965 1.14.2.5 riz adapter->enomem_tx_dma_setup.ev_count++;
1966 1.14.2.5 riz return EAGAIN;
1967 1.14.2.5 riz case EFBIG:
1968 1.14.2.5 riz /*
1969 1.14.2.5 riz * XXX Try it again?
1970 1.14.2.5 riz * do m_defrag() and retry bus_dmamap_load_mbuf().
1971 1.14.2.5 riz */
1972 1.14.2.5 riz adapter->efbig_tx_dma_setup.ev_count++;
1973 1.14.2.5 riz return error;
1974 1.14.2.5 riz case EINVAL:
1975 1.14.2.5 riz adapter->einval_tx_dma_setup.ev_count++;
1976 1.14.2.5 riz return error;
1977 1.14.2.5 riz default:
1978 1.14.2.5 riz adapter->other_tx_dma_setup.ev_count++;
1979 1.14.2.5 riz return error;
1980 1.14.2.5 riz case 0:
1981 1.14.2.5 riz break;
1982 1.14.2.5 riz }
1983 1.1 dyoung }
1984 1.1 dyoung
1985 1.1 dyoung /* Make certain there are enough descriptors */
1986 1.1 dyoung if (map->dm_nsegs > txr->tx_avail - 2) {
1987 1.1 dyoung txr->no_desc_avail.ev_count++;
1988 1.1 dyoung ixgbe_dmamap_unload(txr->txtag, txbuf->map);
1989 1.1 dyoung return EAGAIN;
1990 1.1 dyoung }
1991 1.1 dyoung
1992 1.1 dyoung /*
1993 1.1 dyoung ** Set up the appropriate offload context
1994 1.14.2.5 riz ** this will consume the first descriptor
1995 1.1 dyoung */
1996 1.14.2.5 riz error = ixgbe_tx_ctx_setup(txr, m_head, &cmd_type_len, &olinfo_status);
1997 1.14.2.5 riz if (__predict_false(error)) {
1998 1.14.2.5 riz return (error);
1999 1.14.2.5 riz }
2000 1.1 dyoung
2001 1.1 dyoung #ifdef IXGBE_FDIR
2002 1.1 dyoung /* Do the flow director magic */
2003 1.1 dyoung if ((txr->atr_sample) && (!adapter->fdir_reinit)) {
2004 1.1 dyoung ++txr->atr_count;
2005 1.1 dyoung if (txr->atr_count >= atr_sample_rate) {
2006 1.1 dyoung ixgbe_atr(txr, m_head);
2007 1.1 dyoung txr->atr_count = 0;
2008 1.1 dyoung }
2009 1.1 dyoung }
2010 1.1 dyoung #endif
2011 1.1 dyoung
2012 1.1 dyoung i = txr->next_avail_desc;
2013 1.1 dyoung for (j = 0; j < map->dm_nsegs; j++) {
2014 1.1 dyoung bus_size_t seglen;
2015 1.1 dyoung bus_addr_t segaddr;
2016 1.1 dyoung
2017 1.1 dyoung txbuf = &txr->tx_buffers[i];
2018 1.1 dyoung txd = &txr->tx_base[i];
2019 1.1 dyoung seglen = map->dm_segs[j].ds_len;
2020 1.1 dyoung segaddr = htole64(map->dm_segs[j].ds_addr);
2021 1.1 dyoung
2022 1.1 dyoung txd->read.buffer_addr = segaddr;
2023 1.1 dyoung txd->read.cmd_type_len = htole32(txr->txd_cmd |
2024 1.1 dyoung cmd_type_len |seglen);
2025 1.1 dyoung txd->read.olinfo_status = htole32(olinfo_status);
2026 1.1 dyoung
2027 1.14.2.5 riz if (++i == txr->num_desc)
2028 1.1 dyoung i = 0;
2029 1.1 dyoung }
2030 1.1 dyoung
2031 1.1 dyoung txd->read.cmd_type_len |=
2032 1.1 dyoung htole32(IXGBE_TXD_CMD_EOP | IXGBE_TXD_CMD_RS);
2033 1.1 dyoung txr->tx_avail -= map->dm_nsegs;
2034 1.1 dyoung txr->next_avail_desc = i;
2035 1.1 dyoung
2036 1.1 dyoung txbuf->m_head = m_head;
2037 1.14.2.5 riz /*
2038 1.14.2.5 riz ** Here we swap the map so the last descriptor,
2039 1.14.2.5 riz ** which gets the completion interrupt has the
2040 1.14.2.5 riz ** real map, and the first descriptor gets the
2041 1.14.2.5 riz ** unused map from this descriptor.
2042 1.14.2.5 riz */
2043 1.1 dyoung txr->tx_buffers[first].map = txbuf->map;
2044 1.1 dyoung txbuf->map = map;
2045 1.1 dyoung bus_dmamap_sync(txr->txtag->dt_dmat, map, 0, m_head->m_pkthdr.len,
2046 1.1 dyoung BUS_DMASYNC_PREWRITE);
2047 1.1 dyoung
2048 1.14.2.5 riz /* Set the EOP descriptor that will be marked done */
2049 1.1 dyoung txbuf = &txr->tx_buffers[first];
2050 1.14.2.5 riz txbuf->eop = txd;
2051 1.1 dyoung
2052 1.1 dyoung ixgbe_dmamap_sync(txr->txdma.dma_tag, txr->txdma.dma_map,
2053 1.1 dyoung BUS_DMASYNC_PREREAD | BUS_DMASYNC_PREWRITE);
2054 1.1 dyoung /*
2055 1.1 dyoung * Advance the Transmit Descriptor Tail (Tdt), this tells the
2056 1.1 dyoung * hardware that this frame is available to transmit.
2057 1.1 dyoung */
2058 1.1 dyoung ++txr->total_packets.ev_count;
2059 1.1 dyoung IXGBE_WRITE_REG(&adapter->hw, IXGBE_TDT(txr->me), i);
2060 1.1 dyoung
2061 1.1 dyoung return 0;
2062 1.1 dyoung }
2063 1.1 dyoung
2064 1.1 dyoung static void
2065 1.1 dyoung ixgbe_set_promisc(struct adapter *adapter)
2066 1.1 dyoung {
2067 1.14.2.5 riz struct ether_multi *enm;
2068 1.14.2.5 riz struct ether_multistep step;
2069 1.1 dyoung u_int32_t reg_rctl;
2070 1.14.2.5 riz struct ethercom *ec = &adapter->osdep.ec;
2071 1.1 dyoung struct ifnet *ifp = adapter->ifp;
2072 1.14.2.5 riz int mcnt = 0;
2073 1.1 dyoung
2074 1.1 dyoung reg_rctl = IXGBE_READ_REG(&adapter->hw, IXGBE_FCTRL);
2075 1.1 dyoung reg_rctl &= (~IXGBE_FCTRL_UPE);
2076 1.14.2.5 riz if (ifp->if_flags & IFF_ALLMULTI)
2077 1.14.2.5 riz mcnt = MAX_NUM_MULTICAST_ADDRESSES;
2078 1.14.2.5 riz else {
2079 1.14.2.5 riz ETHER_FIRST_MULTI(step, ec, enm);
2080 1.14.2.5 riz while (enm != NULL) {
2081 1.14.2.5 riz if (mcnt == MAX_NUM_MULTICAST_ADDRESSES)
2082 1.14.2.5 riz break;
2083 1.14.2.5 riz mcnt++;
2084 1.14.2.5 riz ETHER_NEXT_MULTI(step, enm);
2085 1.14.2.5 riz }
2086 1.14.2.5 riz }
2087 1.14.2.5 riz if (mcnt < MAX_NUM_MULTICAST_ADDRESSES)
2088 1.14.2.5 riz reg_rctl &= (~IXGBE_FCTRL_MPE);
2089 1.1 dyoung IXGBE_WRITE_REG(&adapter->hw, IXGBE_FCTRL, reg_rctl);
2090 1.1 dyoung
2091 1.1 dyoung if (ifp->if_flags & IFF_PROMISC) {
2092 1.1 dyoung reg_rctl |= (IXGBE_FCTRL_UPE | IXGBE_FCTRL_MPE);
2093 1.1 dyoung IXGBE_WRITE_REG(&adapter->hw, IXGBE_FCTRL, reg_rctl);
2094 1.1 dyoung } else if (ifp->if_flags & IFF_ALLMULTI) {
2095 1.1 dyoung reg_rctl |= IXGBE_FCTRL_MPE;
2096 1.1 dyoung reg_rctl &= ~IXGBE_FCTRL_UPE;
2097 1.1 dyoung IXGBE_WRITE_REG(&adapter->hw, IXGBE_FCTRL, reg_rctl);
2098 1.1 dyoung }
2099 1.1 dyoung return;
2100 1.1 dyoung }
2101 1.1 dyoung
2102 1.1 dyoung
2103 1.1 dyoung /*********************************************************************
2104 1.1 dyoung * Multicast Update
2105 1.1 dyoung *
2106 1.1 dyoung * This routine is called whenever multicast address list is updated.
2107 1.1 dyoung *
2108 1.1 dyoung **********************************************************************/
2109 1.1 dyoung #define IXGBE_RAR_ENTRIES 16
2110 1.1 dyoung
2111 1.1 dyoung static void
2112 1.1 dyoung ixgbe_set_multi(struct adapter *adapter)
2113 1.1 dyoung {
2114 1.1 dyoung struct ether_multi *enm;
2115 1.1 dyoung struct ether_multistep step;
2116 1.1 dyoung u32 fctrl;
2117 1.1 dyoung u8 *mta;
2118 1.1 dyoung u8 *update_ptr;
2119 1.1 dyoung int mcnt = 0;
2120 1.1 dyoung struct ethercom *ec = &adapter->osdep.ec;
2121 1.1 dyoung struct ifnet *ifp = adapter->ifp;
2122 1.1 dyoung
2123 1.1 dyoung IOCTL_DEBUGOUT("ixgbe_set_multi: begin");
2124 1.1 dyoung
2125 1.1 dyoung mta = adapter->mta;
2126 1.1 dyoung bzero(mta, sizeof(u8) * IXGBE_ETH_LENGTH_OF_ADDRESS *
2127 1.1 dyoung MAX_NUM_MULTICAST_ADDRESSES);
2128 1.1 dyoung
2129 1.14.2.5 riz ifp->if_flags &= ~IFF_ALLMULTI;
2130 1.1 dyoung ETHER_FIRST_MULTI(step, ec, enm);
2131 1.1 dyoung while (enm != NULL) {
2132 1.14.2.5 riz if ((mcnt == MAX_NUM_MULTICAST_ADDRESSES) ||
2133 1.14.2.5 riz (memcmp(enm->enm_addrlo, enm->enm_addrhi,
2134 1.14.2.5 riz ETHER_ADDR_LEN) != 0)) {
2135 1.14.2.5 riz ifp->if_flags |= IFF_ALLMULTI;
2136 1.1 dyoung break;
2137 1.1 dyoung }
2138 1.1 dyoung bcopy(enm->enm_addrlo,
2139 1.1 dyoung &mta[mcnt * IXGBE_ETH_LENGTH_OF_ADDRESS],
2140 1.1 dyoung IXGBE_ETH_LENGTH_OF_ADDRESS);
2141 1.1 dyoung mcnt++;
2142 1.1 dyoung ETHER_NEXT_MULTI(step, enm);
2143 1.1 dyoung }
2144 1.1 dyoung
2145 1.14.2.5 riz fctrl = IXGBE_READ_REG(&adapter->hw, IXGBE_FCTRL);
2146 1.14.2.5 riz fctrl &= ~(IXGBE_FCTRL_UPE | IXGBE_FCTRL_MPE);
2147 1.14.2.5 riz if (ifp->if_flags & IFF_PROMISC)
2148 1.14.2.5 riz fctrl |= (IXGBE_FCTRL_UPE | IXGBE_FCTRL_MPE);
2149 1.14.2.5 riz else if (ifp->if_flags & IFF_ALLMULTI) {
2150 1.14.2.5 riz fctrl |= IXGBE_FCTRL_MPE;
2151 1.14.2.5 riz }
2152 1.14.2.5 riz
2153 1.14.2.5 riz IXGBE_WRITE_REG(&adapter->hw, IXGBE_FCTRL, fctrl);
2154 1.14.2.5 riz
2155 1.14.2.5 riz if (mcnt < MAX_NUM_MULTICAST_ADDRESSES) {
2156 1.14.2.5 riz update_ptr = mta;
2157 1.14.2.5 riz ixgbe_update_mc_addr_list(&adapter->hw,
2158 1.14.2.5 riz update_ptr, mcnt, ixgbe_mc_array_itr, TRUE);
2159 1.14.2.5 riz }
2160 1.1 dyoung
2161 1.1 dyoung return;
2162 1.1 dyoung }
2163 1.1 dyoung
2164 1.1 dyoung /*
2165 1.1 dyoung * This is an iterator function now needed by the multicast
2166 1.1 dyoung * shared code. It simply feeds the shared code routine the
2167 1.1 dyoung * addresses in the array of ixgbe_set_multi() one by one.
2168 1.1 dyoung */
2169 1.1 dyoung static u8 *
2170 1.1 dyoung ixgbe_mc_array_itr(struct ixgbe_hw *hw, u8 **update_ptr, u32 *vmdq)
2171 1.1 dyoung {
2172 1.1 dyoung u8 *addr = *update_ptr;
2173 1.1 dyoung u8 *newptr;
2174 1.1 dyoung *vmdq = 0;
2175 1.1 dyoung
2176 1.1 dyoung newptr = addr + IXGBE_ETH_LENGTH_OF_ADDRESS;
2177 1.1 dyoung *update_ptr = newptr;
2178 1.1 dyoung return addr;
2179 1.1 dyoung }
2180 1.1 dyoung
2181 1.1 dyoung
2182 1.1 dyoung /*********************************************************************
2183 1.1 dyoung * Timer routine
2184 1.1 dyoung *
2185 1.1 dyoung * This routine checks for link status,updates statistics,
2186 1.1 dyoung * and runs the watchdog check.
2187 1.1 dyoung *
2188 1.1 dyoung **********************************************************************/
2189 1.1 dyoung
2190 1.1 dyoung static void
2191 1.1 dyoung ixgbe_local_timer1(void *arg)
2192 1.1 dyoung {
2193 1.14.2.4 riz struct adapter *adapter = arg;
2194 1.1 dyoung device_t dev = adapter->dev;
2195 1.14.2.4 riz struct ix_queue *que = adapter->queues;
2196 1.14.2.4 riz struct tx_ring *txr = adapter->tx_rings;
2197 1.14.2.4 riz int hung = 0, paused = 0;
2198 1.1 dyoung
2199 1.1 dyoung KASSERT(mutex_owned(&adapter->core_mtx));
2200 1.1 dyoung
2201 1.1 dyoung /* Check for pluggable optics */
2202 1.1 dyoung if (adapter->sfp_probe)
2203 1.1 dyoung if (!ixgbe_sfp_probe(adapter))
2204 1.1 dyoung goto out; /* Nothing to do */
2205 1.1 dyoung
2206 1.1 dyoung ixgbe_update_link_status(adapter);
2207 1.1 dyoung ixgbe_update_stats_counters(adapter);
2208 1.1 dyoung
2209 1.1 dyoung /*
2210 1.1 dyoung * If the interface has been paused
2211 1.1 dyoung * then don't do the watchdog check
2212 1.1 dyoung */
2213 1.1 dyoung if (IXGBE_READ_REG(&adapter->hw, IXGBE_TFCS) & IXGBE_TFCS_TXOFF)
2214 1.14.2.4 riz paused = 1;
2215 1.1 dyoung
2216 1.1 dyoung /*
2217 1.14.2.4 riz ** Check the TX queues status
2218 1.14.2.4 riz ** - watchdog only if all queues show hung
2219 1.14.2.4 riz */
2220 1.14.2.4 riz for (int i = 0; i < adapter->num_queues; i++, que++, txr++) {
2221 1.14.2.4 riz if ((txr->queue_status == IXGBE_QUEUE_HUNG) &&
2222 1.14.2.4 riz (paused == 0))
2223 1.14.2.4 riz ++hung;
2224 1.14.2.4 riz else if (txr->queue_status == IXGBE_QUEUE_WORKING)
2225 1.14.2.4 riz softint_schedule(que->que_si);
2226 1.14.2.4 riz }
2227 1.14.2.4 riz /* Only truely watchdog if all queues show hung */
2228 1.14.2.4 riz if (hung == adapter->num_queues)
2229 1.14.2.4 riz goto watchdog;
2230 1.1 dyoung
2231 1.1 dyoung out:
2232 1.1 dyoung ixgbe_rearm_queues(adapter, adapter->que_mask);
2233 1.1 dyoung callout_reset(&adapter->timer, hz, ixgbe_local_timer, adapter);
2234 1.1 dyoung return;
2235 1.1 dyoung
2236 1.14.2.4 riz watchdog:
2237 1.1 dyoung device_printf(adapter->dev, "Watchdog timeout -- resetting\n");
2238 1.1 dyoung device_printf(dev,"Queue(%d) tdh = %d, hw tdt = %d\n", txr->me,
2239 1.1 dyoung IXGBE_READ_REG(&adapter->hw, IXGBE_TDH(txr->me)),
2240 1.1 dyoung IXGBE_READ_REG(&adapter->hw, IXGBE_TDT(txr->me)));
2241 1.1 dyoung device_printf(dev,"TX(%d) desc avail = %d,"
2242 1.1 dyoung "Next TX to Clean = %d\n",
2243 1.1 dyoung txr->me, txr->tx_avail, txr->next_to_clean);
2244 1.1 dyoung adapter->ifp->if_flags &= ~IFF_RUNNING;
2245 1.1 dyoung adapter->watchdog_events.ev_count++;
2246 1.1 dyoung ixgbe_init_locked(adapter);
2247 1.1 dyoung }
2248 1.1 dyoung
2249 1.1 dyoung static void
2250 1.1 dyoung ixgbe_local_timer(void *arg)
2251 1.1 dyoung {
2252 1.1 dyoung struct adapter *adapter = arg;
2253 1.1 dyoung
2254 1.1 dyoung IXGBE_CORE_LOCK(adapter);
2255 1.1 dyoung ixgbe_local_timer1(adapter);
2256 1.1 dyoung IXGBE_CORE_UNLOCK(adapter);
2257 1.1 dyoung }
2258 1.1 dyoung
2259 1.1 dyoung /*
2260 1.1 dyoung ** Note: this routine updates the OS on the link state
2261 1.1 dyoung ** the real check of the hardware only happens with
2262 1.1 dyoung ** a link interrupt.
2263 1.1 dyoung */
2264 1.1 dyoung static void
2265 1.1 dyoung ixgbe_update_link_status(struct adapter *adapter)
2266 1.1 dyoung {
2267 1.1 dyoung struct ifnet *ifp = adapter->ifp;
2268 1.1 dyoung device_t dev = adapter->dev;
2269 1.1 dyoung
2270 1.1 dyoung
2271 1.1 dyoung if (adapter->link_up){
2272 1.1 dyoung if (adapter->link_active == FALSE) {
2273 1.1 dyoung if (bootverbose)
2274 1.1 dyoung device_printf(dev,"Link is up %d Gbps %s \n",
2275 1.1 dyoung ((adapter->link_speed == 128)? 10:1),
2276 1.1 dyoung "Full Duplex");
2277 1.1 dyoung adapter->link_active = TRUE;
2278 1.14.2.4 riz /* Update any Flow Control changes */
2279 1.14.2.4 riz ixgbe_fc_enable(&adapter->hw);
2280 1.1 dyoung if_link_state_change(ifp, LINK_STATE_UP);
2281 1.1 dyoung }
2282 1.1 dyoung } else { /* Link down */
2283 1.1 dyoung if (adapter->link_active == TRUE) {
2284 1.1 dyoung if (bootverbose)
2285 1.1 dyoung device_printf(dev,"Link is Down\n");
2286 1.1 dyoung if_link_state_change(ifp, LINK_STATE_DOWN);
2287 1.1 dyoung adapter->link_active = FALSE;
2288 1.1 dyoung }
2289 1.1 dyoung }
2290 1.1 dyoung
2291 1.1 dyoung return;
2292 1.1 dyoung }
2293 1.1 dyoung
2294 1.1 dyoung
2295 1.1 dyoung static void
2296 1.1 dyoung ixgbe_ifstop(struct ifnet *ifp, int disable)
2297 1.1 dyoung {
2298 1.1 dyoung struct adapter *adapter = ifp->if_softc;
2299 1.1 dyoung
2300 1.1 dyoung IXGBE_CORE_LOCK(adapter);
2301 1.1 dyoung ixgbe_stop(adapter);
2302 1.1 dyoung IXGBE_CORE_UNLOCK(adapter);
2303 1.1 dyoung }
2304 1.1 dyoung
2305 1.1 dyoung /*********************************************************************
2306 1.1 dyoung *
2307 1.1 dyoung * This routine disables all traffic on the adapter by issuing a
2308 1.1 dyoung * global reset on the MAC and deallocates TX/RX buffers.
2309 1.1 dyoung *
2310 1.1 dyoung **********************************************************************/
2311 1.1 dyoung
2312 1.1 dyoung static void
2313 1.1 dyoung ixgbe_stop(void *arg)
2314 1.1 dyoung {
2315 1.1 dyoung struct ifnet *ifp;
2316 1.1 dyoung struct adapter *adapter = arg;
2317 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
2318 1.1 dyoung ifp = adapter->ifp;
2319 1.1 dyoung
2320 1.1 dyoung KASSERT(mutex_owned(&adapter->core_mtx));
2321 1.1 dyoung
2322 1.1 dyoung INIT_DEBUGOUT("ixgbe_stop: begin\n");
2323 1.1 dyoung ixgbe_disable_intr(adapter);
2324 1.14.2.4 riz callout_stop(&adapter->timer);
2325 1.1 dyoung
2326 1.14.2.4 riz /* Let the stack know...*/
2327 1.14.2.4 riz ifp->if_flags &= ~IFF_RUNNING;
2328 1.1 dyoung
2329 1.1 dyoung ixgbe_reset_hw(hw);
2330 1.1 dyoung hw->adapter_stopped = FALSE;
2331 1.1 dyoung ixgbe_stop_adapter(hw);
2332 1.1 dyoung /* Turn off the laser */
2333 1.1 dyoung if (hw->phy.multispeed_fiber)
2334 1.1 dyoung ixgbe_disable_tx_laser(hw);
2335 1.1 dyoung
2336 1.1 dyoung /* reprogram the RAR[0] in case user changed it. */
2337 1.1 dyoung ixgbe_set_rar(&adapter->hw, 0, adapter->hw.mac.addr, 0, IXGBE_RAH_AV);
2338 1.1 dyoung
2339 1.1 dyoung return;
2340 1.1 dyoung }
2341 1.1 dyoung
2342 1.1 dyoung
2343 1.1 dyoung /*********************************************************************
2344 1.1 dyoung *
2345 1.1 dyoung * Determine hardware revision.
2346 1.1 dyoung *
2347 1.1 dyoung **********************************************************************/
2348 1.1 dyoung static void
2349 1.1 dyoung ixgbe_identify_hardware(struct adapter *adapter)
2350 1.1 dyoung {
2351 1.1 dyoung pcitag_t tag;
2352 1.1 dyoung pci_chipset_tag_t pc;
2353 1.1 dyoung pcireg_t subid, id;
2354 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
2355 1.1 dyoung
2356 1.1 dyoung pc = adapter->osdep.pc;
2357 1.1 dyoung tag = adapter->osdep.tag;
2358 1.1 dyoung
2359 1.1 dyoung id = pci_conf_read(pc, tag, PCI_ID_REG);
2360 1.1 dyoung subid = pci_conf_read(pc, tag, PCI_SUBSYS_ID_REG);
2361 1.1 dyoung
2362 1.1 dyoung /* Save off the information about this board */
2363 1.1 dyoung hw->vendor_id = PCI_VENDOR(id);
2364 1.1 dyoung hw->device_id = PCI_PRODUCT(id);
2365 1.1 dyoung hw->revision_id =
2366 1.1 dyoung PCI_REVISION(pci_conf_read(pc, tag, PCI_CLASS_REG));
2367 1.1 dyoung hw->subsystem_vendor_id = PCI_SUBSYS_VENDOR(subid);
2368 1.1 dyoung hw->subsystem_device_id = PCI_SUBSYS_ID(subid);
2369 1.1 dyoung
2370 1.1 dyoung /* We need this here to set the num_segs below */
2371 1.1 dyoung ixgbe_set_mac_type(hw);
2372 1.1 dyoung
2373 1.1 dyoung /* Pick up the 82599 and VF settings */
2374 1.1 dyoung if (hw->mac.type != ixgbe_mac_82598EB) {
2375 1.1 dyoung hw->phy.smart_speed = ixgbe_smart_speed;
2376 1.1 dyoung adapter->num_segs = IXGBE_82599_SCATTER;
2377 1.1 dyoung } else
2378 1.1 dyoung adapter->num_segs = IXGBE_82598_SCATTER;
2379 1.1 dyoung
2380 1.1 dyoung return;
2381 1.1 dyoung }
2382 1.1 dyoung
2383 1.1 dyoung /*********************************************************************
2384 1.1 dyoung *
2385 1.1 dyoung * Determine optic type
2386 1.1 dyoung *
2387 1.1 dyoung **********************************************************************/
2388 1.1 dyoung static void
2389 1.1 dyoung ixgbe_setup_optics(struct adapter *adapter)
2390 1.1 dyoung {
2391 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
2392 1.1 dyoung int layer;
2393 1.14.2.5 riz
2394 1.1 dyoung layer = ixgbe_get_supported_physical_layer(hw);
2395 1.14.2.4 riz
2396 1.14.2.4 riz if (layer & IXGBE_PHYSICAL_LAYER_10GBASE_T) {
2397 1.14.2.4 riz adapter->optics = IFM_10G_T;
2398 1.14.2.4 riz return;
2399 1.14.2.4 riz }
2400 1.14.2.4 riz
2401 1.14.2.4 riz if (layer & IXGBE_PHYSICAL_LAYER_1000BASE_T) {
2402 1.14.2.4 riz adapter->optics = IFM_1000_T;
2403 1.14.2.4 riz return;
2404 1.14.2.4 riz }
2405 1.14.2.4 riz
2406 1.14.2.4 riz if (layer & IXGBE_PHYSICAL_LAYER_1000BASE_SX) {
2407 1.14.2.4 riz adapter->optics = IFM_1000_SX;
2408 1.14.2.4 riz return;
2409 1.14.2.4 riz }
2410 1.14.2.4 riz
2411 1.14.2.4 riz if (layer & (IXGBE_PHYSICAL_LAYER_10GBASE_LR |
2412 1.14.2.4 riz IXGBE_PHYSICAL_LAYER_10GBASE_LRM)) {
2413 1.14.2.4 riz adapter->optics = IFM_10G_LR;
2414 1.14.2.4 riz return;
2415 1.1 dyoung }
2416 1.14.2.4 riz
2417 1.14.2.4 riz if (layer & IXGBE_PHYSICAL_LAYER_10GBASE_SR) {
2418 1.14.2.4 riz adapter->optics = IFM_10G_SR;
2419 1.14.2.4 riz return;
2420 1.14.2.4 riz }
2421 1.14.2.4 riz
2422 1.14.2.4 riz if (layer & IXGBE_PHYSICAL_LAYER_SFP_PLUS_CU) {
2423 1.14.2.4 riz adapter->optics = IFM_10G_TWINAX;
2424 1.14.2.4 riz return;
2425 1.14.2.4 riz }
2426 1.14.2.4 riz
2427 1.14.2.4 riz if (layer & (IXGBE_PHYSICAL_LAYER_10GBASE_KX4 |
2428 1.14.2.4 riz IXGBE_PHYSICAL_LAYER_10GBASE_CX4)) {
2429 1.14.2.4 riz adapter->optics = IFM_10G_CX4;
2430 1.14.2.4 riz return;
2431 1.14.2.4 riz }
2432 1.14.2.4 riz
2433 1.14.2.4 riz /* If we get here just set the default */
2434 1.14.2.4 riz adapter->optics = IFM_ETHER | IFM_AUTO;
2435 1.1 dyoung return;
2436 1.1 dyoung }
2437 1.1 dyoung
2438 1.1 dyoung /*********************************************************************
2439 1.1 dyoung *
2440 1.1 dyoung * Setup the Legacy or MSI Interrupt handler
2441 1.1 dyoung *
2442 1.1 dyoung **********************************************************************/
2443 1.1 dyoung static int
2444 1.1 dyoung ixgbe_allocate_legacy(struct adapter *adapter, const struct pci_attach_args *pa)
2445 1.1 dyoung {
2446 1.14.2.5 riz device_t dev = adapter->dev;
2447 1.1 dyoung struct ix_queue *que = adapter->queues;
2448 1.14.2.5 riz #ifndef IXGBE_LEGACY_TX
2449 1.14.2.4 riz struct tx_ring *txr = adapter->tx_rings;
2450 1.14.2.4 riz #endif
2451 1.9 skrll char intrbuf[PCI_INTRSTR_LEN];
2452 1.9 skrll #if 0
2453 1.14.2.5 riz int rid = 0;
2454 1.1 dyoung
2455 1.1 dyoung /* MSI RID at 1 */
2456 1.1 dyoung if (adapter->msix == 1)
2457 1.1 dyoung rid = 1;
2458 1.9 skrll #endif
2459 1.1 dyoung
2460 1.1 dyoung /* We allocate a single interrupt resource */
2461 1.1 dyoung if (pci_intr_map(pa, &adapter->osdep.ih) != 0) {
2462 1.1 dyoung aprint_error_dev(dev, "unable to map interrupt\n");
2463 1.1 dyoung return ENXIO;
2464 1.1 dyoung } else {
2465 1.1 dyoung aprint_normal_dev(dev, "interrupting at %s\n",
2466 1.14 chs pci_intr_string(adapter->osdep.pc, adapter->osdep.ih,
2467 1.14 chs intrbuf, sizeof(intrbuf)));
2468 1.1 dyoung }
2469 1.1 dyoung
2470 1.1 dyoung /*
2471 1.1 dyoung * Try allocating a fast interrupt and the associated deferred
2472 1.1 dyoung * processing contexts.
2473 1.1 dyoung */
2474 1.14.2.5 riz #ifndef IXGBE_LEGACY_TX
2475 1.14.2.4 riz txr->txq_si = softint_establish(SOFTINT_NET, ixgbe_deferred_mq_start,
2476 1.14.2.4 riz txr);
2477 1.14.2.4 riz #endif
2478 1.1 dyoung que->que_si = softint_establish(SOFTINT_NET, ixgbe_handle_que, que);
2479 1.1 dyoung
2480 1.1 dyoung /* Tasklets for Link, SFP and Multispeed Fiber */
2481 1.1 dyoung adapter->link_si =
2482 1.1 dyoung softint_establish(SOFTINT_NET, ixgbe_handle_link, adapter);
2483 1.1 dyoung adapter->mod_si =
2484 1.1 dyoung softint_establish(SOFTINT_NET, ixgbe_handle_mod, adapter);
2485 1.1 dyoung adapter->msf_si =
2486 1.1 dyoung softint_establish(SOFTINT_NET, ixgbe_handle_msf, adapter);
2487 1.1 dyoung
2488 1.1 dyoung #ifdef IXGBE_FDIR
2489 1.1 dyoung adapter->fdir_si =
2490 1.1 dyoung softint_establish(SOFTINT_NET, ixgbe_reinit_fdir, adapter);
2491 1.1 dyoung #endif
2492 1.1 dyoung if (que->que_si == NULL ||
2493 1.1 dyoung adapter->link_si == NULL ||
2494 1.1 dyoung adapter->mod_si == NULL ||
2495 1.1 dyoung #ifdef IXGBE_FDIR
2496 1.1 dyoung adapter->fdir_si == NULL ||
2497 1.1 dyoung #endif
2498 1.1 dyoung adapter->msf_si == NULL) {
2499 1.1 dyoung aprint_error_dev(dev,
2500 1.1 dyoung "could not establish software interrupts\n");
2501 1.1 dyoung return ENXIO;
2502 1.1 dyoung }
2503 1.1 dyoung
2504 1.1 dyoung adapter->osdep.intr = pci_intr_establish(adapter->osdep.pc,
2505 1.1 dyoung adapter->osdep.ih, IPL_NET, ixgbe_legacy_irq, que);
2506 1.1 dyoung if (adapter->osdep.intr == NULL) {
2507 1.1 dyoung aprint_error_dev(dev, "failed to register interrupt handler\n");
2508 1.1 dyoung softint_disestablish(que->que_si);
2509 1.1 dyoung softint_disestablish(adapter->link_si);
2510 1.1 dyoung softint_disestablish(adapter->mod_si);
2511 1.1 dyoung softint_disestablish(adapter->msf_si);
2512 1.1 dyoung #ifdef IXGBE_FDIR
2513 1.1 dyoung softint_disestablish(adapter->fdir_si);
2514 1.1 dyoung #endif
2515 1.1 dyoung return ENXIO;
2516 1.1 dyoung }
2517 1.1 dyoung /* For simplicity in the handlers */
2518 1.1 dyoung adapter->que_mask = IXGBE_EIMS_ENABLE_MASK;
2519 1.1 dyoung
2520 1.1 dyoung return (0);
2521 1.1 dyoung }
2522 1.1 dyoung
2523 1.1 dyoung
2524 1.1 dyoung /*********************************************************************
2525 1.1 dyoung *
2526 1.1 dyoung * Setup MSIX Interrupt resources and handlers
2527 1.1 dyoung *
2528 1.1 dyoung **********************************************************************/
2529 1.1 dyoung static int
2530 1.1 dyoung ixgbe_allocate_msix(struct adapter *adapter, const struct pci_attach_args *pa)
2531 1.1 dyoung {
2532 1.1 dyoung #if !defined(NETBSD_MSI_OR_MSIX)
2533 1.1 dyoung return 0;
2534 1.1 dyoung #else
2535 1.1 dyoung device_t dev = adapter->dev;
2536 1.1 dyoung struct ix_queue *que = adapter->queues;
2537 1.14.2.4 riz struct tx_ring *txr = adapter->tx_rings;
2538 1.1 dyoung int error, rid, vector = 0;
2539 1.1 dyoung
2540 1.14.2.4 riz for (int i = 0; i < adapter->num_queues; i++, vector++, que++, txr++) {
2541 1.1 dyoung rid = vector + 1;
2542 1.1 dyoung que->res = bus_alloc_resource_any(dev, SYS_RES_IRQ, &rid,
2543 1.1 dyoung RF_SHAREABLE | RF_ACTIVE);
2544 1.1 dyoung if (que->res == NULL) {
2545 1.1 dyoung aprint_error_dev(dev,"Unable to allocate"
2546 1.1 dyoung " bus resource: que interrupt [%d]\n", vector);
2547 1.1 dyoung return (ENXIO);
2548 1.1 dyoung }
2549 1.1 dyoung /* Set the handler function */
2550 1.1 dyoung error = bus_setup_intr(dev, que->res,
2551 1.1 dyoung INTR_TYPE_NET | INTR_MPSAFE, NULL,
2552 1.1 dyoung ixgbe_msix_que, que, &que->tag);
2553 1.1 dyoung if (error) {
2554 1.1 dyoung que->res = NULL;
2555 1.1 dyoung aprint_error_dev(dev,
2556 1.1 dyoung "Failed to register QUE handler\n");
2557 1.1 dyoung return error;
2558 1.1 dyoung }
2559 1.1 dyoung #if __FreeBSD_version >= 800504
2560 1.1 dyoung bus_describe_intr(dev, que->res, que->tag, "que %d", i);
2561 1.1 dyoung #endif
2562 1.1 dyoung que->msix = vector;
2563 1.1 dyoung adapter->que_mask |= (u64)(1 << que->msix);
2564 1.1 dyoung /*
2565 1.1 dyoung ** Bind the msix vector, and thus the
2566 1.1 dyoung ** ring to the corresponding cpu.
2567 1.1 dyoung */
2568 1.1 dyoung if (adapter->num_queues > 1)
2569 1.1 dyoung bus_bind_intr(dev, que->res, i);
2570 1.1 dyoung
2571 1.14.2.5 riz #ifndef IXGBE_LEGACY_TX
2572 1.14.2.4 riz txr->txq_si = softint_establish(SOFTINT_NET,
2573 1.14.2.4 riz ixgbe_deferred_mq_start, txr);
2574 1.14.2.4 riz #endif
2575 1.14.2.4 riz que->que_si = softint_establish(SOFTINT_NET, ixgbe_handle_que,
2576 1.14.2.4 riz que);
2577 1.1 dyoung if (que->que_si == NULL) {
2578 1.1 dyoung aprint_error_dev(dev,
2579 1.1 dyoung "could not establish software interrupt\n");
2580 1.1 dyoung }
2581 1.1 dyoung }
2582 1.1 dyoung
2583 1.1 dyoung /* and Link */
2584 1.1 dyoung rid = vector + 1;
2585 1.1 dyoung adapter->res = bus_alloc_resource_any(dev,
2586 1.1 dyoung SYS_RES_IRQ, &rid, RF_SHAREABLE | RF_ACTIVE);
2587 1.1 dyoung if (!adapter->res) {
2588 1.1 dyoung aprint_error_dev(dev,"Unable to allocate bus resource: "
2589 1.1 dyoung "Link interrupt [%d]\n", rid);
2590 1.1 dyoung return (ENXIO);
2591 1.1 dyoung }
2592 1.1 dyoung /* Set the link handler function */
2593 1.1 dyoung error = bus_setup_intr(dev, adapter->res,
2594 1.1 dyoung INTR_TYPE_NET | INTR_MPSAFE, NULL,
2595 1.1 dyoung ixgbe_msix_link, adapter, &adapter->tag);
2596 1.1 dyoung if (error) {
2597 1.1 dyoung adapter->res = NULL;
2598 1.1 dyoung aprint_error_dev(dev, "Failed to register LINK handler\n");
2599 1.1 dyoung return (error);
2600 1.1 dyoung }
2601 1.1 dyoung #if __FreeBSD_version >= 800504
2602 1.1 dyoung bus_describe_intr(dev, adapter->res, adapter->tag, "link");
2603 1.1 dyoung #endif
2604 1.1 dyoung adapter->linkvec = vector;
2605 1.1 dyoung /* Tasklets for Link, SFP and Multispeed Fiber */
2606 1.1 dyoung adapter->link_si =
2607 1.1 dyoung softint_establish(SOFTINT_NET, ixgbe_handle_link, adapter);
2608 1.1 dyoung adapter->mod_si =
2609 1.1 dyoung softint_establish(SOFTINT_NET, ixgbe_handle_mod, adapter);
2610 1.1 dyoung adapter->msf_si =
2611 1.1 dyoung softint_establish(SOFTINT_NET, ixgbe_handle_msf, adapter);
2612 1.1 dyoung #ifdef IXGBE_FDIR
2613 1.1 dyoung adapter->fdir_si =
2614 1.1 dyoung softint_establish(SOFTINT_NET, ixgbe_reinit_fdir, adapter);
2615 1.1 dyoung #endif
2616 1.1 dyoung
2617 1.1 dyoung return (0);
2618 1.1 dyoung #endif
2619 1.1 dyoung }
2620 1.1 dyoung
2621 1.1 dyoung /*
2622 1.1 dyoung * Setup Either MSI/X or MSI
2623 1.1 dyoung */
2624 1.1 dyoung static int
2625 1.1 dyoung ixgbe_setup_msix(struct adapter *adapter)
2626 1.1 dyoung {
2627 1.1 dyoung #if !defined(NETBSD_MSI_OR_MSIX)
2628 1.1 dyoung return 0;
2629 1.1 dyoung #else
2630 1.1 dyoung device_t dev = adapter->dev;
2631 1.1 dyoung int rid, want, queues, msgs;
2632 1.1 dyoung
2633 1.1 dyoung /* Override by tuneable */
2634 1.1 dyoung if (ixgbe_enable_msix == 0)
2635 1.1 dyoung goto msi;
2636 1.1 dyoung
2637 1.1 dyoung /* First try MSI/X */
2638 1.1 dyoung rid = PCI_BAR(MSIX_82598_BAR);
2639 1.1 dyoung adapter->msix_mem = bus_alloc_resource_any(dev,
2640 1.1 dyoung SYS_RES_MEMORY, &rid, RF_ACTIVE);
2641 1.1 dyoung if (!adapter->msix_mem) {
2642 1.1 dyoung rid += 4; /* 82599 maps in higher BAR */
2643 1.1 dyoung adapter->msix_mem = bus_alloc_resource_any(dev,
2644 1.1 dyoung SYS_RES_MEMORY, &rid, RF_ACTIVE);
2645 1.1 dyoung }
2646 1.1 dyoung if (!adapter->msix_mem) {
2647 1.1 dyoung /* May not be enabled */
2648 1.1 dyoung device_printf(adapter->dev,
2649 1.1 dyoung "Unable to map MSIX table \n");
2650 1.1 dyoung goto msi;
2651 1.1 dyoung }
2652 1.1 dyoung
2653 1.1 dyoung msgs = pci_msix_count(dev);
2654 1.1 dyoung if (msgs == 0) { /* system has msix disabled */
2655 1.1 dyoung bus_release_resource(dev, SYS_RES_MEMORY,
2656 1.1 dyoung rid, adapter->msix_mem);
2657 1.1 dyoung adapter->msix_mem = NULL;
2658 1.1 dyoung goto msi;
2659 1.1 dyoung }
2660 1.1 dyoung
2661 1.1 dyoung /* Figure out a reasonable auto config value */
2662 1.1 dyoung queues = (mp_ncpus > (msgs-1)) ? (msgs-1) : mp_ncpus;
2663 1.1 dyoung
2664 1.1 dyoung if (ixgbe_num_queues != 0)
2665 1.1 dyoung queues = ixgbe_num_queues;
2666 1.1 dyoung /* Set max queues to 8 when autoconfiguring */
2667 1.1 dyoung else if ((ixgbe_num_queues == 0) && (queues > 8))
2668 1.1 dyoung queues = 8;
2669 1.1 dyoung
2670 1.1 dyoung /*
2671 1.1 dyoung ** Want one vector (RX/TX pair) per queue
2672 1.1 dyoung ** plus an additional for Link.
2673 1.1 dyoung */
2674 1.1 dyoung want = queues + 1;
2675 1.1 dyoung if (msgs >= want)
2676 1.1 dyoung msgs = want;
2677 1.1 dyoung else {
2678 1.1 dyoung device_printf(adapter->dev,
2679 1.1 dyoung "MSIX Configuration Problem, "
2680 1.1 dyoung "%d vectors but %d queues wanted!\n",
2681 1.1 dyoung msgs, want);
2682 1.1 dyoung return (0); /* Will go to Legacy setup */
2683 1.1 dyoung }
2684 1.1 dyoung if ((msgs) && pci_alloc_msix(dev, &msgs) == 0) {
2685 1.1 dyoung device_printf(adapter->dev,
2686 1.1 dyoung "Using MSIX interrupts with %d vectors\n", msgs);
2687 1.1 dyoung adapter->num_queues = queues;
2688 1.1 dyoung return (msgs);
2689 1.1 dyoung }
2690 1.1 dyoung msi:
2691 1.1 dyoung msgs = pci_msi_count(dev);
2692 1.1 dyoung if (msgs == 1 && pci_alloc_msi(dev, &msgs) == 0)
2693 1.14.2.3 martin device_printf(adapter->dev,"Using an MSI interrupt\n");
2694 1.14.2.3 martin else
2695 1.14.2.3 martin device_printf(adapter->dev,"Using a Legacy interrupt\n");
2696 1.1 dyoung return (msgs);
2697 1.1 dyoung #endif
2698 1.1 dyoung }
2699 1.1 dyoung
2700 1.1 dyoung
2701 1.1 dyoung static int
2702 1.1 dyoung ixgbe_allocate_pci_resources(struct adapter *adapter, const struct pci_attach_args *pa)
2703 1.1 dyoung {
2704 1.1 dyoung pcireg_t memtype;
2705 1.1 dyoung device_t dev = adapter->dev;
2706 1.1 dyoung bus_addr_t addr;
2707 1.1 dyoung int flags;
2708 1.1 dyoung
2709 1.1 dyoung memtype = pci_mapreg_type(pa->pa_pc, pa->pa_tag, PCI_BAR(0));
2710 1.1 dyoung switch (memtype) {
2711 1.1 dyoung case PCI_MAPREG_TYPE_MEM | PCI_MAPREG_MEM_TYPE_32BIT:
2712 1.1 dyoung case PCI_MAPREG_TYPE_MEM | PCI_MAPREG_MEM_TYPE_64BIT:
2713 1.1 dyoung adapter->osdep.mem_bus_space_tag = pa->pa_memt;
2714 1.1 dyoung if (pci_mapreg_info(pa->pa_pc, pa->pa_tag, PCI_BAR(0),
2715 1.1 dyoung memtype, &addr, &adapter->osdep.mem_size, &flags) != 0)
2716 1.1 dyoung goto map_err;
2717 1.1 dyoung if ((flags & BUS_SPACE_MAP_PREFETCHABLE) != 0) {
2718 1.1 dyoung aprint_normal_dev(dev, "clearing prefetchable bit\n");
2719 1.1 dyoung flags &= ~BUS_SPACE_MAP_PREFETCHABLE;
2720 1.1 dyoung }
2721 1.1 dyoung if (bus_space_map(adapter->osdep.mem_bus_space_tag, addr,
2722 1.1 dyoung adapter->osdep.mem_size, flags,
2723 1.1 dyoung &adapter->osdep.mem_bus_space_handle) != 0) {
2724 1.1 dyoung map_err:
2725 1.1 dyoung adapter->osdep.mem_size = 0;
2726 1.1 dyoung aprint_error_dev(dev, "unable to map BAR0\n");
2727 1.1 dyoung return ENXIO;
2728 1.1 dyoung }
2729 1.1 dyoung break;
2730 1.1 dyoung default:
2731 1.1 dyoung aprint_error_dev(dev, "unexpected type on BAR0\n");
2732 1.1 dyoung return ENXIO;
2733 1.1 dyoung }
2734 1.1 dyoung
2735 1.1 dyoung /* Legacy defaults */
2736 1.1 dyoung adapter->num_queues = 1;
2737 1.1 dyoung adapter->hw.back = &adapter->osdep;
2738 1.1 dyoung
2739 1.1 dyoung /*
2740 1.1 dyoung ** Now setup MSI or MSI/X, should
2741 1.1 dyoung ** return us the number of supported
2742 1.1 dyoung ** vectors. (Will be 1 for MSI)
2743 1.1 dyoung */
2744 1.1 dyoung adapter->msix = ixgbe_setup_msix(adapter);
2745 1.1 dyoung return (0);
2746 1.1 dyoung }
2747 1.1 dyoung
2748 1.1 dyoung static void
2749 1.1 dyoung ixgbe_free_pci_resources(struct adapter * adapter)
2750 1.1 dyoung {
2751 1.1 dyoung #if defined(NETBSD_MSI_OR_MSIX)
2752 1.1 dyoung struct ix_queue *que = adapter->queues;
2753 1.14 chs device_t dev = adapter->dev;
2754 1.1 dyoung #endif
2755 1.9 skrll int rid;
2756 1.1 dyoung
2757 1.9 skrll #if defined(NETBSD_MSI_OR_MSIX)
2758 1.9 skrll int memrid;
2759 1.1 dyoung if (adapter->hw.mac.type == ixgbe_mac_82598EB)
2760 1.1 dyoung memrid = PCI_BAR(MSIX_82598_BAR);
2761 1.1 dyoung else
2762 1.1 dyoung memrid = PCI_BAR(MSIX_82599_BAR);
2763 1.1 dyoung
2764 1.1 dyoung /*
2765 1.1 dyoung ** There is a slight possibility of a failure mode
2766 1.1 dyoung ** in attach that will result in entering this function
2767 1.1 dyoung ** before interrupt resources have been initialized, and
2768 1.1 dyoung ** in that case we do not want to execute the loops below
2769 1.1 dyoung ** We can detect this reliably by the state of the adapter
2770 1.1 dyoung ** res pointer.
2771 1.1 dyoung */
2772 1.1 dyoung if (adapter->res == NULL)
2773 1.1 dyoung goto mem;
2774 1.1 dyoung
2775 1.1 dyoung /*
2776 1.1 dyoung ** Release all msix queue resources:
2777 1.1 dyoung */
2778 1.1 dyoung for (int i = 0; i < adapter->num_queues; i++, que++) {
2779 1.1 dyoung rid = que->msix + 1;
2780 1.1 dyoung if (que->tag != NULL) {
2781 1.1 dyoung bus_teardown_intr(dev, que->res, que->tag);
2782 1.1 dyoung que->tag = NULL;
2783 1.1 dyoung }
2784 1.1 dyoung if (que->res != NULL)
2785 1.1 dyoung bus_release_resource(dev, SYS_RES_IRQ, rid, que->res);
2786 1.1 dyoung }
2787 1.1 dyoung #endif
2788 1.1 dyoung
2789 1.1 dyoung /* Clean the Legacy or Link interrupt last */
2790 1.1 dyoung if (adapter->linkvec) /* we are doing MSIX */
2791 1.1 dyoung rid = adapter->linkvec + 1;
2792 1.1 dyoung else
2793 1.1 dyoung (adapter->msix != 0) ? (rid = 1):(rid = 0);
2794 1.1 dyoung
2795 1.1 dyoung pci_intr_disestablish(adapter->osdep.pc, adapter->osdep.intr);
2796 1.1 dyoung adapter->osdep.intr = NULL;
2797 1.1 dyoung
2798 1.1 dyoung #if defined(NETBSD_MSI_OR_MSIX)
2799 1.1 dyoung mem:
2800 1.1 dyoung if (adapter->msix)
2801 1.1 dyoung pci_release_msi(dev);
2802 1.1 dyoung
2803 1.1 dyoung if (adapter->msix_mem != NULL)
2804 1.1 dyoung bus_release_resource(dev, SYS_RES_MEMORY,
2805 1.1 dyoung memrid, adapter->msix_mem);
2806 1.1 dyoung #endif
2807 1.1 dyoung
2808 1.1 dyoung if (adapter->osdep.mem_size != 0) {
2809 1.1 dyoung bus_space_unmap(adapter->osdep.mem_bus_space_tag,
2810 1.1 dyoung adapter->osdep.mem_bus_space_handle,
2811 1.1 dyoung adapter->osdep.mem_size);
2812 1.1 dyoung }
2813 1.1 dyoung
2814 1.1 dyoung return;
2815 1.1 dyoung }
2816 1.1 dyoung
2817 1.1 dyoung /*********************************************************************
2818 1.1 dyoung *
2819 1.1 dyoung * Setup networking device structure and register an interface.
2820 1.1 dyoung *
2821 1.1 dyoung **********************************************************************/
2822 1.1 dyoung static int
2823 1.1 dyoung ixgbe_setup_interface(device_t dev, struct adapter *adapter)
2824 1.1 dyoung {
2825 1.1 dyoung struct ethercom *ec = &adapter->osdep.ec;
2826 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
2827 1.1 dyoung struct ifnet *ifp;
2828 1.1 dyoung
2829 1.1 dyoung INIT_DEBUGOUT("ixgbe_setup_interface: begin");
2830 1.1 dyoung
2831 1.1 dyoung ifp = adapter->ifp = &ec->ec_if;
2832 1.1 dyoung strlcpy(ifp->if_xname, device_xname(dev), IFNAMSIZ);
2833 1.14.2.4 riz ifp->if_baudrate = IF_Gbps(10);
2834 1.1 dyoung ifp->if_init = ixgbe_init;
2835 1.1 dyoung ifp->if_stop = ixgbe_ifstop;
2836 1.1 dyoung ifp->if_softc = adapter;
2837 1.1 dyoung ifp->if_flags = IFF_BROADCAST | IFF_SIMPLEX | IFF_MULTICAST;
2838 1.1 dyoung ifp->if_ioctl = ixgbe_ioctl;
2839 1.14.2.5 riz #ifndef IXGBE_LEGACY_TX
2840 1.1 dyoung ifp->if_transmit = ixgbe_mq_start;
2841 1.1 dyoung ifp->if_qflush = ixgbe_qflush;
2842 1.14.2.4 riz #else
2843 1.14.2.4 riz ifp->if_start = ixgbe_start;
2844 1.14.2.4 riz IFQ_SET_MAXLEN(&ifp->if_snd, adapter->num_tx_desc - 2);
2845 1.1 dyoung #endif
2846 1.1 dyoung
2847 1.1 dyoung if_attach(ifp);
2848 1.1 dyoung ether_ifattach(ifp, adapter->hw.mac.addr);
2849 1.1 dyoung ether_set_ifflags_cb(ec, ixgbe_ifflags_cb);
2850 1.1 dyoung
2851 1.1 dyoung adapter->max_frame_size =
2852 1.1 dyoung ifp->if_mtu + ETHER_HDR_LEN + ETHER_CRC_LEN;
2853 1.1 dyoung
2854 1.1 dyoung /*
2855 1.1 dyoung * Tell the upper layer(s) we support long frames.
2856 1.1 dyoung */
2857 1.1 dyoung ifp->if_hdrlen = sizeof(struct ether_vlan_header);
2858 1.1 dyoung
2859 1.14.2.4 riz ifp->if_capabilities |= IFCAP_HWCSUM | IFCAP_TSOv4 | IFCAP_TSOv6;
2860 1.1 dyoung ifp->if_capenable = 0;
2861 1.1 dyoung
2862 1.1 dyoung ec->ec_capabilities |= ETHERCAP_VLAN_HWCSUM;
2863 1.1 dyoung ec->ec_capabilities |= ETHERCAP_JUMBO_MTU;
2864 1.14.2.4 riz ifp->if_capabilities |= IFCAP_LRO;
2865 1.14.2.3 martin ec->ec_capabilities |= ETHERCAP_VLAN_HWTAGGING
2866 1.14.2.3 martin | ETHERCAP_VLAN_MTU;
2867 1.1 dyoung ec->ec_capenable = ec->ec_capabilities;
2868 1.1 dyoung
2869 1.1 dyoung /*
2870 1.14.2.3 martin ** Don't turn this on by default, if vlans are
2871 1.1 dyoung ** created on another pseudo device (eg. lagg)
2872 1.1 dyoung ** then vlan events are not passed thru, breaking
2873 1.1 dyoung ** operation, but with HW FILTER off it works. If
2874 1.14.2.3 martin ** using vlans directly on the ixgbe driver you can
2875 1.1 dyoung ** enable this and get full hardware tag filtering.
2876 1.1 dyoung */
2877 1.1 dyoung ec->ec_capabilities |= ETHERCAP_VLAN_HWFILTER;
2878 1.1 dyoung
2879 1.1 dyoung /*
2880 1.1 dyoung * Specify the media types supported by this adapter and register
2881 1.1 dyoung * callbacks to update media and link information
2882 1.1 dyoung */
2883 1.1 dyoung ifmedia_init(&adapter->media, IFM_IMASK, ixgbe_media_change,
2884 1.1 dyoung ixgbe_media_status);
2885 1.1 dyoung ifmedia_add(&adapter->media, IFM_ETHER | adapter->optics, 0, NULL);
2886 1.1 dyoung ifmedia_set(&adapter->media, IFM_ETHER | adapter->optics);
2887 1.1 dyoung if (hw->device_id == IXGBE_DEV_ID_82598AT) {
2888 1.1 dyoung ifmedia_add(&adapter->media,
2889 1.1 dyoung IFM_ETHER | IFM_1000_T | IFM_FDX, 0, NULL);
2890 1.1 dyoung ifmedia_add(&adapter->media,
2891 1.1 dyoung IFM_ETHER | IFM_1000_T, 0, NULL);
2892 1.1 dyoung }
2893 1.1 dyoung ifmedia_add(&adapter->media, IFM_ETHER | IFM_AUTO, 0, NULL);
2894 1.1 dyoung ifmedia_set(&adapter->media, IFM_ETHER | IFM_AUTO);
2895 1.1 dyoung
2896 1.1 dyoung return (0);
2897 1.1 dyoung }
2898 1.1 dyoung
2899 1.1 dyoung static void
2900 1.1 dyoung ixgbe_config_link(struct adapter *adapter)
2901 1.1 dyoung {
2902 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
2903 1.1 dyoung u32 autoneg, err = 0;
2904 1.1 dyoung bool sfp, negotiate;
2905 1.1 dyoung
2906 1.1 dyoung sfp = ixgbe_is_sfp(hw);
2907 1.1 dyoung
2908 1.1 dyoung if (sfp) {
2909 1.14.2.2 martin void *ip;
2910 1.14.2.2 martin
2911 1.1 dyoung if (hw->phy.multispeed_fiber) {
2912 1.1 dyoung hw->mac.ops.setup_sfp(hw);
2913 1.1 dyoung ixgbe_enable_tx_laser(hw);
2914 1.14.2.2 martin ip = adapter->msf_si;
2915 1.1 dyoung } else {
2916 1.14.2.2 martin ip = adapter->mod_si;
2917 1.1 dyoung }
2918 1.14.2.2 martin
2919 1.14.2.2 martin kpreempt_disable();
2920 1.14.2.2 martin softint_schedule(ip);
2921 1.14.2.2 martin kpreempt_enable();
2922 1.1 dyoung } else {
2923 1.1 dyoung if (hw->mac.ops.check_link)
2924 1.14.2.5 riz err = ixgbe_check_link(hw, &adapter->link_speed,
2925 1.1 dyoung &adapter->link_up, FALSE);
2926 1.1 dyoung if (err)
2927 1.1 dyoung goto out;
2928 1.1 dyoung autoneg = hw->phy.autoneg_advertised;
2929 1.1 dyoung if ((!autoneg) && (hw->mac.ops.get_link_capabilities))
2930 1.1 dyoung err = hw->mac.ops.get_link_capabilities(hw,
2931 1.1 dyoung &autoneg, &negotiate);
2932 1.13 christos else
2933 1.13 christos negotiate = 0;
2934 1.1 dyoung if (err)
2935 1.1 dyoung goto out;
2936 1.1 dyoung if (hw->mac.ops.setup_link)
2937 1.14.2.5 riz err = hw->mac.ops.setup_link(hw,
2938 1.14.2.5 riz autoneg, adapter->link_up);
2939 1.1 dyoung }
2940 1.1 dyoung out:
2941 1.1 dyoung return;
2942 1.1 dyoung }
2943 1.1 dyoung
2944 1.1 dyoung /********************************************************************
2945 1.1 dyoung * Manage DMA'able memory.
2946 1.1 dyoung *******************************************************************/
2947 1.1 dyoung
2948 1.1 dyoung static int
2949 1.1 dyoung ixgbe_dma_malloc(struct adapter *adapter, const bus_size_t size,
2950 1.1 dyoung struct ixgbe_dma_alloc *dma, const int mapflags)
2951 1.1 dyoung {
2952 1.1 dyoung device_t dev = adapter->dev;
2953 1.1 dyoung int r, rsegs;
2954 1.1 dyoung
2955 1.1 dyoung r = ixgbe_dma_tag_create(adapter->osdep.dmat, /* parent */
2956 1.1 dyoung DBA_ALIGN, 0, /* alignment, bounds */
2957 1.1 dyoung size, /* maxsize */
2958 1.1 dyoung 1, /* nsegments */
2959 1.1 dyoung size, /* maxsegsize */
2960 1.1 dyoung BUS_DMA_ALLOCNOW, /* flags */
2961 1.1 dyoung &dma->dma_tag);
2962 1.1 dyoung if (r != 0) {
2963 1.1 dyoung aprint_error_dev(dev,
2964 1.1 dyoung "%s: ixgbe_dma_tag_create failed; error %d\n", __func__, r);
2965 1.1 dyoung goto fail_0;
2966 1.1 dyoung }
2967 1.1 dyoung
2968 1.1 dyoung r = bus_dmamem_alloc(dma->dma_tag->dt_dmat,
2969 1.1 dyoung size,
2970 1.1 dyoung dma->dma_tag->dt_alignment,
2971 1.1 dyoung dma->dma_tag->dt_boundary,
2972 1.1 dyoung &dma->dma_seg, 1, &rsegs, BUS_DMA_NOWAIT);
2973 1.1 dyoung if (r != 0) {
2974 1.1 dyoung aprint_error_dev(dev,
2975 1.1 dyoung "%s: bus_dmamem_alloc failed; error %d\n", __func__, r);
2976 1.1 dyoung goto fail_1;
2977 1.1 dyoung }
2978 1.1 dyoung
2979 1.1 dyoung r = bus_dmamem_map(dma->dma_tag->dt_dmat, &dma->dma_seg, rsegs,
2980 1.1 dyoung size, &dma->dma_vaddr, BUS_DMA_NOWAIT);
2981 1.1 dyoung if (r != 0) {
2982 1.1 dyoung aprint_error_dev(dev, "%s: bus_dmamem_map failed; error %d\n",
2983 1.1 dyoung __func__, r);
2984 1.1 dyoung goto fail_2;
2985 1.1 dyoung }
2986 1.1 dyoung
2987 1.1 dyoung r = ixgbe_dmamap_create(dma->dma_tag, 0, &dma->dma_map);
2988 1.1 dyoung if (r != 0) {
2989 1.1 dyoung aprint_error_dev(dev, "%s: bus_dmamem_map failed; error %d\n",
2990 1.1 dyoung __func__, r);
2991 1.1 dyoung goto fail_3;
2992 1.1 dyoung }
2993 1.1 dyoung
2994 1.1 dyoung r = bus_dmamap_load(dma->dma_tag->dt_dmat, dma->dma_map, dma->dma_vaddr,
2995 1.1 dyoung size,
2996 1.1 dyoung NULL,
2997 1.1 dyoung mapflags | BUS_DMA_NOWAIT);
2998 1.1 dyoung if (r != 0) {
2999 1.1 dyoung aprint_error_dev(dev, "%s: bus_dmamap_load failed; error %d\n",
3000 1.1 dyoung __func__, r);
3001 1.1 dyoung goto fail_4;
3002 1.1 dyoung }
3003 1.1 dyoung dma->dma_paddr = dma->dma_map->dm_segs[0].ds_addr;
3004 1.1 dyoung dma->dma_size = size;
3005 1.1 dyoung return 0;
3006 1.1 dyoung fail_4:
3007 1.1 dyoung ixgbe_dmamap_destroy(dma->dma_tag, dma->dma_map);
3008 1.1 dyoung fail_3:
3009 1.1 dyoung bus_dmamem_unmap(dma->dma_tag->dt_dmat, dma->dma_vaddr, size);
3010 1.1 dyoung fail_2:
3011 1.1 dyoung bus_dmamem_free(dma->dma_tag->dt_dmat, &dma->dma_seg, rsegs);
3012 1.1 dyoung fail_1:
3013 1.1 dyoung ixgbe_dma_tag_destroy(dma->dma_tag);
3014 1.1 dyoung fail_0:
3015 1.1 dyoung return r;
3016 1.1 dyoung }
3017 1.1 dyoung
3018 1.1 dyoung static void
3019 1.1 dyoung ixgbe_dma_free(struct adapter *adapter, struct ixgbe_dma_alloc *dma)
3020 1.1 dyoung {
3021 1.1 dyoung bus_dmamap_sync(dma->dma_tag->dt_dmat, dma->dma_map, 0, dma->dma_size,
3022 1.1 dyoung BUS_DMASYNC_POSTREAD | BUS_DMASYNC_POSTWRITE);
3023 1.1 dyoung ixgbe_dmamap_unload(dma->dma_tag, dma->dma_map);
3024 1.1 dyoung bus_dmamem_free(dma->dma_tag->dt_dmat, &dma->dma_seg, 1);
3025 1.1 dyoung ixgbe_dma_tag_destroy(dma->dma_tag);
3026 1.1 dyoung }
3027 1.1 dyoung
3028 1.1 dyoung
3029 1.1 dyoung /*********************************************************************
3030 1.1 dyoung *
3031 1.1 dyoung * Allocate memory for the transmit and receive rings, and then
3032 1.1 dyoung * the descriptors associated with each, called only once at attach.
3033 1.1 dyoung *
3034 1.1 dyoung **********************************************************************/
3035 1.1 dyoung static int
3036 1.1 dyoung ixgbe_allocate_queues(struct adapter *adapter)
3037 1.1 dyoung {
3038 1.1 dyoung device_t dev = adapter->dev;
3039 1.1 dyoung struct ix_queue *que;
3040 1.1 dyoung struct tx_ring *txr;
3041 1.1 dyoung struct rx_ring *rxr;
3042 1.1 dyoung int rsize, tsize, error = IXGBE_SUCCESS;
3043 1.1 dyoung int txconf = 0, rxconf = 0;
3044 1.1 dyoung
3045 1.1 dyoung /* First allocate the top level queue structs */
3046 1.1 dyoung if (!(adapter->queues =
3047 1.1 dyoung (struct ix_queue *) malloc(sizeof(struct ix_queue) *
3048 1.1 dyoung adapter->num_queues, M_DEVBUF, M_NOWAIT | M_ZERO))) {
3049 1.1 dyoung aprint_error_dev(dev, "Unable to allocate queue memory\n");
3050 1.1 dyoung error = ENOMEM;
3051 1.1 dyoung goto fail;
3052 1.1 dyoung }
3053 1.1 dyoung
3054 1.1 dyoung /* First allocate the TX ring struct memory */
3055 1.1 dyoung if (!(adapter->tx_rings =
3056 1.1 dyoung (struct tx_ring *) malloc(sizeof(struct tx_ring) *
3057 1.1 dyoung adapter->num_queues, M_DEVBUF, M_NOWAIT | M_ZERO))) {
3058 1.1 dyoung aprint_error_dev(dev, "Unable to allocate TX ring memory\n");
3059 1.1 dyoung error = ENOMEM;
3060 1.1 dyoung goto tx_fail;
3061 1.1 dyoung }
3062 1.1 dyoung
3063 1.1 dyoung /* Next allocate the RX */
3064 1.1 dyoung if (!(adapter->rx_rings =
3065 1.1 dyoung (struct rx_ring *) malloc(sizeof(struct rx_ring) *
3066 1.1 dyoung adapter->num_queues, M_DEVBUF, M_NOWAIT | M_ZERO))) {
3067 1.1 dyoung aprint_error_dev(dev, "Unable to allocate RX ring memory\n");
3068 1.1 dyoung error = ENOMEM;
3069 1.1 dyoung goto rx_fail;
3070 1.1 dyoung }
3071 1.1 dyoung
3072 1.1 dyoung /* For the ring itself */
3073 1.1 dyoung tsize = roundup2(adapter->num_tx_desc *
3074 1.1 dyoung sizeof(union ixgbe_adv_tx_desc), DBA_ALIGN);
3075 1.1 dyoung
3076 1.1 dyoung /*
3077 1.1 dyoung * Now set up the TX queues, txconf is needed to handle the
3078 1.1 dyoung * possibility that things fail midcourse and we need to
3079 1.1 dyoung * undo memory gracefully
3080 1.1 dyoung */
3081 1.1 dyoung for (int i = 0; i < adapter->num_queues; i++, txconf++) {
3082 1.1 dyoung /* Set up some basics */
3083 1.1 dyoung txr = &adapter->tx_rings[i];
3084 1.1 dyoung txr->adapter = adapter;
3085 1.1 dyoung txr->me = i;
3086 1.14.2.5 riz txr->num_desc = adapter->num_tx_desc;
3087 1.1 dyoung
3088 1.1 dyoung /* Initialize the TX side lock */
3089 1.1 dyoung snprintf(txr->mtx_name, sizeof(txr->mtx_name), "%s:tx(%d)",
3090 1.1 dyoung device_xname(dev), txr->me);
3091 1.1 dyoung mutex_init(&txr->tx_mtx, MUTEX_DEFAULT, IPL_NET);
3092 1.1 dyoung
3093 1.1 dyoung if (ixgbe_dma_malloc(adapter, tsize,
3094 1.1 dyoung &txr->txdma, BUS_DMA_NOWAIT)) {
3095 1.1 dyoung aprint_error_dev(dev,
3096 1.1 dyoung "Unable to allocate TX Descriptor memory\n");
3097 1.1 dyoung error = ENOMEM;
3098 1.1 dyoung goto err_tx_desc;
3099 1.1 dyoung }
3100 1.1 dyoung txr->tx_base = (union ixgbe_adv_tx_desc *)txr->txdma.dma_vaddr;
3101 1.1 dyoung bzero((void *)txr->tx_base, tsize);
3102 1.1 dyoung
3103 1.1 dyoung /* Now allocate transmit buffers for the ring */
3104 1.1 dyoung if (ixgbe_allocate_transmit_buffers(txr)) {
3105 1.1 dyoung aprint_error_dev(dev,
3106 1.1 dyoung "Critical Failure setting up transmit buffers\n");
3107 1.1 dyoung error = ENOMEM;
3108 1.1 dyoung goto err_tx_desc;
3109 1.1 dyoung }
3110 1.14.2.5 riz #ifndef IXGBE_LEGACY_TX
3111 1.1 dyoung /* Allocate a buf ring */
3112 1.1 dyoung txr->br = buf_ring_alloc(IXGBE_BR_SIZE, M_DEVBUF,
3113 1.1 dyoung M_WAITOK, &txr->tx_mtx);
3114 1.1 dyoung if (txr->br == NULL) {
3115 1.1 dyoung aprint_error_dev(dev,
3116 1.1 dyoung "Critical Failure setting up buf ring\n");
3117 1.1 dyoung error = ENOMEM;
3118 1.1 dyoung goto err_tx_desc;
3119 1.1 dyoung }
3120 1.1 dyoung #endif
3121 1.1 dyoung }
3122 1.1 dyoung
3123 1.1 dyoung /*
3124 1.1 dyoung * Next the RX queues...
3125 1.1 dyoung */
3126 1.1 dyoung rsize = roundup2(adapter->num_rx_desc *
3127 1.1 dyoung sizeof(union ixgbe_adv_rx_desc), DBA_ALIGN);
3128 1.1 dyoung for (int i = 0; i < adapter->num_queues; i++, rxconf++) {
3129 1.1 dyoung rxr = &adapter->rx_rings[i];
3130 1.1 dyoung /* Set up some basics */
3131 1.1 dyoung rxr->adapter = adapter;
3132 1.1 dyoung rxr->me = i;
3133 1.14.2.5 riz rxr->num_desc = adapter->num_rx_desc;
3134 1.1 dyoung
3135 1.1 dyoung /* Initialize the RX side lock */
3136 1.1 dyoung snprintf(rxr->mtx_name, sizeof(rxr->mtx_name), "%s:rx(%d)",
3137 1.1 dyoung device_xname(dev), rxr->me);
3138 1.1 dyoung mutex_init(&rxr->rx_mtx, MUTEX_DEFAULT, IPL_NET);
3139 1.1 dyoung
3140 1.1 dyoung if (ixgbe_dma_malloc(adapter, rsize,
3141 1.1 dyoung &rxr->rxdma, BUS_DMA_NOWAIT)) {
3142 1.1 dyoung aprint_error_dev(dev,
3143 1.1 dyoung "Unable to allocate RxDescriptor memory\n");
3144 1.1 dyoung error = ENOMEM;
3145 1.1 dyoung goto err_rx_desc;
3146 1.1 dyoung }
3147 1.1 dyoung rxr->rx_base = (union ixgbe_adv_rx_desc *)rxr->rxdma.dma_vaddr;
3148 1.1 dyoung bzero((void *)rxr->rx_base, rsize);
3149 1.1 dyoung
3150 1.1 dyoung /* Allocate receive buffers for the ring*/
3151 1.1 dyoung if (ixgbe_allocate_receive_buffers(rxr)) {
3152 1.1 dyoung aprint_error_dev(dev,
3153 1.1 dyoung "Critical Failure setting up receive buffers\n");
3154 1.1 dyoung error = ENOMEM;
3155 1.1 dyoung goto err_rx_desc;
3156 1.1 dyoung }
3157 1.1 dyoung }
3158 1.1 dyoung
3159 1.1 dyoung /*
3160 1.1 dyoung ** Finally set up the queue holding structs
3161 1.1 dyoung */
3162 1.1 dyoung for (int i = 0; i < adapter->num_queues; i++) {
3163 1.1 dyoung que = &adapter->queues[i];
3164 1.1 dyoung que->adapter = adapter;
3165 1.1 dyoung que->txr = &adapter->tx_rings[i];
3166 1.1 dyoung que->rxr = &adapter->rx_rings[i];
3167 1.1 dyoung }
3168 1.1 dyoung
3169 1.1 dyoung return (0);
3170 1.1 dyoung
3171 1.1 dyoung err_rx_desc:
3172 1.1 dyoung for (rxr = adapter->rx_rings; rxconf > 0; rxr++, rxconf--)
3173 1.1 dyoung ixgbe_dma_free(adapter, &rxr->rxdma);
3174 1.1 dyoung err_tx_desc:
3175 1.1 dyoung for (txr = adapter->tx_rings; txconf > 0; txr++, txconf--)
3176 1.1 dyoung ixgbe_dma_free(adapter, &txr->txdma);
3177 1.1 dyoung free(adapter->rx_rings, M_DEVBUF);
3178 1.1 dyoung rx_fail:
3179 1.1 dyoung free(adapter->tx_rings, M_DEVBUF);
3180 1.1 dyoung tx_fail:
3181 1.1 dyoung free(adapter->queues, M_DEVBUF);
3182 1.1 dyoung fail:
3183 1.1 dyoung return (error);
3184 1.1 dyoung }
3185 1.1 dyoung
3186 1.1 dyoung /*********************************************************************
3187 1.1 dyoung *
3188 1.1 dyoung * Allocate memory for tx_buffer structures. The tx_buffer stores all
3189 1.1 dyoung * the information needed to transmit a packet on the wire. This is
3190 1.1 dyoung * called only once at attach, setup is done every reset.
3191 1.1 dyoung *
3192 1.1 dyoung **********************************************************************/
3193 1.1 dyoung static int
3194 1.1 dyoung ixgbe_allocate_transmit_buffers(struct tx_ring *txr)
3195 1.1 dyoung {
3196 1.1 dyoung struct adapter *adapter = txr->adapter;
3197 1.1 dyoung device_t dev = adapter->dev;
3198 1.1 dyoung struct ixgbe_tx_buf *txbuf;
3199 1.1 dyoung int error, i;
3200 1.1 dyoung
3201 1.1 dyoung /*
3202 1.1 dyoung * Setup DMA descriptor areas.
3203 1.1 dyoung */
3204 1.1 dyoung if ((error = ixgbe_dma_tag_create(adapter->osdep.dmat, /* parent */
3205 1.1 dyoung 1, 0, /* alignment, bounds */
3206 1.1 dyoung IXGBE_TSO_SIZE, /* maxsize */
3207 1.1 dyoung adapter->num_segs, /* nsegments */
3208 1.1 dyoung PAGE_SIZE, /* maxsegsize */
3209 1.1 dyoung 0, /* flags */
3210 1.1 dyoung &txr->txtag))) {
3211 1.1 dyoung aprint_error_dev(dev,"Unable to allocate TX DMA tag\n");
3212 1.1 dyoung goto fail;
3213 1.1 dyoung }
3214 1.1 dyoung
3215 1.1 dyoung if (!(txr->tx_buffers =
3216 1.1 dyoung (struct ixgbe_tx_buf *) malloc(sizeof(struct ixgbe_tx_buf) *
3217 1.1 dyoung adapter->num_tx_desc, M_DEVBUF, M_NOWAIT | M_ZERO))) {
3218 1.1 dyoung aprint_error_dev(dev, "Unable to allocate tx_buffer memory\n");
3219 1.1 dyoung error = ENOMEM;
3220 1.1 dyoung goto fail;
3221 1.1 dyoung }
3222 1.1 dyoung
3223 1.1 dyoung /* Create the descriptor buffer dma maps */
3224 1.1 dyoung txbuf = txr->tx_buffers;
3225 1.1 dyoung for (i = 0; i < adapter->num_tx_desc; i++, txbuf++) {
3226 1.1 dyoung error = ixgbe_dmamap_create(txr->txtag, 0, &txbuf->map);
3227 1.1 dyoung if (error != 0) {
3228 1.14.2.4 riz aprint_error_dev(dev,
3229 1.14.2.4 riz "Unable to create TX DMA map (%d)\n", error);
3230 1.1 dyoung goto fail;
3231 1.1 dyoung }
3232 1.1 dyoung }
3233 1.1 dyoung
3234 1.1 dyoung return 0;
3235 1.1 dyoung fail:
3236 1.1 dyoung /* We free all, it handles case where we are in the middle */
3237 1.1 dyoung ixgbe_free_transmit_structures(adapter);
3238 1.1 dyoung return (error);
3239 1.1 dyoung }
3240 1.1 dyoung
3241 1.1 dyoung /*********************************************************************
3242 1.1 dyoung *
3243 1.1 dyoung * Initialize a transmit ring.
3244 1.1 dyoung *
3245 1.1 dyoung **********************************************************************/
3246 1.1 dyoung static void
3247 1.1 dyoung ixgbe_setup_transmit_ring(struct tx_ring *txr)
3248 1.1 dyoung {
3249 1.1 dyoung struct adapter *adapter = txr->adapter;
3250 1.1 dyoung struct ixgbe_tx_buf *txbuf;
3251 1.1 dyoung int i;
3252 1.14.2.3 martin #ifdef DEV_NETMAP
3253 1.14.2.3 martin struct netmap_adapter *na = NA(adapter->ifp);
3254 1.14.2.3 martin struct netmap_slot *slot;
3255 1.14.2.3 martin #endif /* DEV_NETMAP */
3256 1.1 dyoung
3257 1.1 dyoung /* Clear the old ring contents */
3258 1.1 dyoung IXGBE_TX_LOCK(txr);
3259 1.14.2.3 martin #ifdef DEV_NETMAP
3260 1.14.2.3 martin /*
3261 1.14.2.3 martin * (under lock): if in netmap mode, do some consistency
3262 1.14.2.3 martin * checks and set slot to entry 0 of the netmap ring.
3263 1.14.2.3 martin */
3264 1.14.2.3 martin slot = netmap_reset(na, NR_TX, txr->me, 0);
3265 1.14.2.3 martin #endif /* DEV_NETMAP */
3266 1.1 dyoung bzero((void *)txr->tx_base,
3267 1.1 dyoung (sizeof(union ixgbe_adv_tx_desc)) * adapter->num_tx_desc);
3268 1.1 dyoung /* Reset indices */
3269 1.1 dyoung txr->next_avail_desc = 0;
3270 1.1 dyoung txr->next_to_clean = 0;
3271 1.1 dyoung
3272 1.1 dyoung /* Free any existing tx buffers. */
3273 1.1 dyoung txbuf = txr->tx_buffers;
3274 1.14.2.5 riz for (i = 0; i < txr->num_desc; i++, txbuf++) {
3275 1.1 dyoung if (txbuf->m_head != NULL) {
3276 1.1 dyoung bus_dmamap_sync(txr->txtag->dt_dmat, txbuf->map,
3277 1.1 dyoung 0, txbuf->m_head->m_pkthdr.len,
3278 1.1 dyoung BUS_DMASYNC_POSTWRITE);
3279 1.1 dyoung ixgbe_dmamap_unload(txr->txtag, txbuf->map);
3280 1.1 dyoung m_freem(txbuf->m_head);
3281 1.1 dyoung txbuf->m_head = NULL;
3282 1.1 dyoung }
3283 1.14.2.3 martin #ifdef DEV_NETMAP
3284 1.14.2.3 martin /*
3285 1.14.2.3 martin * In netmap mode, set the map for the packet buffer.
3286 1.14.2.3 martin * NOTE: Some drivers (not this one) also need to set
3287 1.14.2.3 martin * the physical buffer address in the NIC ring.
3288 1.14.2.3 martin * Slots in the netmap ring (indexed by "si") are
3289 1.14.2.3 martin * kring->nkr_hwofs positions "ahead" wrt the
3290 1.14.2.3 martin * corresponding slot in the NIC ring. In some drivers
3291 1.14.2.4 riz * (not here) nkr_hwofs can be negative. Function
3292 1.14.2.4 riz * netmap_idx_n2k() handles wraparounds properly.
3293 1.14.2.3 martin */
3294 1.14.2.3 martin if (slot) {
3295 1.14.2.4 riz int si = netmap_idx_n2k(&na->tx_rings[txr->me], i);
3296 1.14.2.3 martin netmap_load_map(txr->txtag, txbuf->map, NMB(slot + si));
3297 1.14.2.3 martin }
3298 1.14.2.3 martin #endif /* DEV_NETMAP */
3299 1.14.2.5 riz /* Clear the EOP descriptor pointer */
3300 1.14.2.5 riz txbuf->eop = NULL;
3301 1.1 dyoung }
3302 1.1 dyoung
3303 1.1 dyoung #ifdef IXGBE_FDIR
3304 1.1 dyoung /* Set the rate at which we sample packets */
3305 1.1 dyoung if (adapter->hw.mac.type != ixgbe_mac_82598EB)
3306 1.1 dyoung txr->atr_sample = atr_sample_rate;
3307 1.1 dyoung #endif
3308 1.1 dyoung
3309 1.1 dyoung /* Set number of descriptors available */
3310 1.1 dyoung txr->tx_avail = adapter->num_tx_desc;
3311 1.1 dyoung
3312 1.1 dyoung ixgbe_dmamap_sync(txr->txdma.dma_tag, txr->txdma.dma_map,
3313 1.1 dyoung BUS_DMASYNC_PREREAD | BUS_DMASYNC_PREWRITE);
3314 1.1 dyoung IXGBE_TX_UNLOCK(txr);
3315 1.1 dyoung }
3316 1.1 dyoung
3317 1.1 dyoung /*********************************************************************
3318 1.1 dyoung *
3319 1.1 dyoung * Initialize all transmit rings.
3320 1.1 dyoung *
3321 1.1 dyoung **********************************************************************/
3322 1.1 dyoung static int
3323 1.1 dyoung ixgbe_setup_transmit_structures(struct adapter *adapter)
3324 1.1 dyoung {
3325 1.1 dyoung struct tx_ring *txr = adapter->tx_rings;
3326 1.1 dyoung
3327 1.1 dyoung for (int i = 0; i < adapter->num_queues; i++, txr++)
3328 1.1 dyoung ixgbe_setup_transmit_ring(txr);
3329 1.1 dyoung
3330 1.1 dyoung return (0);
3331 1.1 dyoung }
3332 1.1 dyoung
3333 1.1 dyoung /*********************************************************************
3334 1.1 dyoung *
3335 1.1 dyoung * Enable transmit unit.
3336 1.1 dyoung *
3337 1.1 dyoung **********************************************************************/
3338 1.1 dyoung static void
3339 1.1 dyoung ixgbe_initialize_transmit_units(struct adapter *adapter)
3340 1.1 dyoung {
3341 1.1 dyoung struct tx_ring *txr = adapter->tx_rings;
3342 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
3343 1.1 dyoung
3344 1.1 dyoung /* Setup the Base and Length of the Tx Descriptor Ring */
3345 1.1 dyoung
3346 1.1 dyoung for (int i = 0; i < adapter->num_queues; i++, txr++) {
3347 1.1 dyoung u64 tdba = txr->txdma.dma_paddr;
3348 1.1 dyoung u32 txctrl;
3349 1.1 dyoung
3350 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_TDBAL(i),
3351 1.1 dyoung (tdba & 0x00000000ffffffffULL));
3352 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_TDBAH(i), (tdba >> 32));
3353 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_TDLEN(i),
3354 1.14.2.5 riz adapter->num_tx_desc * sizeof(union ixgbe_adv_tx_desc));
3355 1.1 dyoung
3356 1.1 dyoung /* Setup the HW Tx Head and Tail descriptor pointers */
3357 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_TDH(i), 0);
3358 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_TDT(i), 0);
3359 1.1 dyoung
3360 1.1 dyoung /* Setup Transmit Descriptor Cmd Settings */
3361 1.1 dyoung txr->txd_cmd = IXGBE_TXD_CMD_IFCS;
3362 1.1 dyoung txr->queue_status = IXGBE_QUEUE_IDLE;
3363 1.1 dyoung
3364 1.14.2.5 riz /* Set the processing limit */
3365 1.14.2.5 riz txr->process_limit = ixgbe_tx_process_limit;
3366 1.14.2.5 riz
3367 1.1 dyoung /* Disable Head Writeback */
3368 1.1 dyoung switch (hw->mac.type) {
3369 1.1 dyoung case ixgbe_mac_82598EB:
3370 1.1 dyoung txctrl = IXGBE_READ_REG(hw, IXGBE_DCA_TXCTRL(i));
3371 1.1 dyoung break;
3372 1.1 dyoung case ixgbe_mac_82599EB:
3373 1.14.2.4 riz case ixgbe_mac_X540:
3374 1.1 dyoung default:
3375 1.1 dyoung txctrl = IXGBE_READ_REG(hw, IXGBE_DCA_TXCTRL_82599(i));
3376 1.1 dyoung break;
3377 1.1 dyoung }
3378 1.14.2.4 riz txctrl &= ~IXGBE_DCA_TXCTRL_DESC_WRO_EN;
3379 1.1 dyoung switch (hw->mac.type) {
3380 1.1 dyoung case ixgbe_mac_82598EB:
3381 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_DCA_TXCTRL(i), txctrl);
3382 1.1 dyoung break;
3383 1.1 dyoung case ixgbe_mac_82599EB:
3384 1.14.2.4 riz case ixgbe_mac_X540:
3385 1.1 dyoung default:
3386 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_DCA_TXCTRL_82599(i), txctrl);
3387 1.1 dyoung break;
3388 1.1 dyoung }
3389 1.1 dyoung
3390 1.1 dyoung }
3391 1.1 dyoung
3392 1.1 dyoung if (hw->mac.type != ixgbe_mac_82598EB) {
3393 1.1 dyoung u32 dmatxctl, rttdcs;
3394 1.1 dyoung dmatxctl = IXGBE_READ_REG(hw, IXGBE_DMATXCTL);
3395 1.1 dyoung dmatxctl |= IXGBE_DMATXCTL_TE;
3396 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_DMATXCTL, dmatxctl);
3397 1.1 dyoung /* Disable arbiter to set MTQC */
3398 1.1 dyoung rttdcs = IXGBE_READ_REG(hw, IXGBE_RTTDCS);
3399 1.1 dyoung rttdcs |= IXGBE_RTTDCS_ARBDIS;
3400 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_RTTDCS, rttdcs);
3401 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_MTQC, IXGBE_MTQC_64Q_1PB);
3402 1.1 dyoung rttdcs &= ~IXGBE_RTTDCS_ARBDIS;
3403 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_RTTDCS, rttdcs);
3404 1.1 dyoung }
3405 1.1 dyoung
3406 1.1 dyoung return;
3407 1.1 dyoung }
3408 1.1 dyoung
3409 1.1 dyoung /*********************************************************************
3410 1.1 dyoung *
3411 1.1 dyoung * Free all transmit rings.
3412 1.1 dyoung *
3413 1.1 dyoung **********************************************************************/
3414 1.1 dyoung static void
3415 1.1 dyoung ixgbe_free_transmit_structures(struct adapter *adapter)
3416 1.1 dyoung {
3417 1.1 dyoung struct tx_ring *txr = adapter->tx_rings;
3418 1.1 dyoung
3419 1.1 dyoung for (int i = 0; i < adapter->num_queues; i++, txr++) {
3420 1.1 dyoung ixgbe_free_transmit_buffers(txr);
3421 1.1 dyoung ixgbe_dma_free(adapter, &txr->txdma);
3422 1.1 dyoung IXGBE_TX_LOCK_DESTROY(txr);
3423 1.1 dyoung }
3424 1.1 dyoung free(adapter->tx_rings, M_DEVBUF);
3425 1.1 dyoung }
3426 1.1 dyoung
3427 1.1 dyoung /*********************************************************************
3428 1.1 dyoung *
3429 1.1 dyoung * Free transmit ring related data structures.
3430 1.1 dyoung *
3431 1.1 dyoung **********************************************************************/
3432 1.1 dyoung static void
3433 1.1 dyoung ixgbe_free_transmit_buffers(struct tx_ring *txr)
3434 1.1 dyoung {
3435 1.1 dyoung struct adapter *adapter = txr->adapter;
3436 1.1 dyoung struct ixgbe_tx_buf *tx_buffer;
3437 1.1 dyoung int i;
3438 1.1 dyoung
3439 1.1 dyoung INIT_DEBUGOUT("free_transmit_ring: begin");
3440 1.1 dyoung
3441 1.1 dyoung if (txr->tx_buffers == NULL)
3442 1.1 dyoung return;
3443 1.1 dyoung
3444 1.1 dyoung tx_buffer = txr->tx_buffers;
3445 1.1 dyoung for (i = 0; i < adapter->num_tx_desc; i++, tx_buffer++) {
3446 1.1 dyoung if (tx_buffer->m_head != NULL) {
3447 1.1 dyoung bus_dmamap_sync(txr->txtag->dt_dmat, tx_buffer->map,
3448 1.1 dyoung 0, tx_buffer->m_head->m_pkthdr.len,
3449 1.1 dyoung BUS_DMASYNC_POSTWRITE);
3450 1.1 dyoung ixgbe_dmamap_unload(txr->txtag, tx_buffer->map);
3451 1.1 dyoung m_freem(tx_buffer->m_head);
3452 1.1 dyoung tx_buffer->m_head = NULL;
3453 1.1 dyoung if (tx_buffer->map != NULL) {
3454 1.1 dyoung ixgbe_dmamap_destroy(txr->txtag,
3455 1.1 dyoung tx_buffer->map);
3456 1.1 dyoung tx_buffer->map = NULL;
3457 1.1 dyoung }
3458 1.1 dyoung } else if (tx_buffer->map != NULL) {
3459 1.1 dyoung ixgbe_dmamap_unload(txr->txtag, tx_buffer->map);
3460 1.1 dyoung ixgbe_dmamap_destroy(txr->txtag, tx_buffer->map);
3461 1.1 dyoung tx_buffer->map = NULL;
3462 1.1 dyoung }
3463 1.1 dyoung }
3464 1.14.2.5 riz #ifndef IXGBE_LEGACY_TX
3465 1.1 dyoung if (txr->br != NULL)
3466 1.1 dyoung buf_ring_free(txr->br, M_DEVBUF);
3467 1.1 dyoung #endif
3468 1.1 dyoung if (txr->tx_buffers != NULL) {
3469 1.1 dyoung free(txr->tx_buffers, M_DEVBUF);
3470 1.1 dyoung txr->tx_buffers = NULL;
3471 1.1 dyoung }
3472 1.1 dyoung if (txr->txtag != NULL) {
3473 1.1 dyoung ixgbe_dma_tag_destroy(txr->txtag);
3474 1.1 dyoung txr->txtag = NULL;
3475 1.1 dyoung }
3476 1.1 dyoung return;
3477 1.1 dyoung }
3478 1.1 dyoung
3479 1.1 dyoung /*********************************************************************
3480 1.1 dyoung *
3481 1.14.2.5 riz * Advanced Context Descriptor setup for VLAN, CSUM or TSO
3482 1.1 dyoung *
3483 1.1 dyoung **********************************************************************/
3484 1.1 dyoung
3485 1.14.2.5 riz static int
3486 1.14.2.5 riz ixgbe_tx_ctx_setup(struct tx_ring *txr, struct mbuf *mp,
3487 1.14.2.5 riz u32 *cmd_type_len, u32 *olinfo_status)
3488 1.1 dyoung {
3489 1.1 dyoung struct m_tag *mtag;
3490 1.1 dyoung struct adapter *adapter = txr->adapter;
3491 1.1 dyoung struct ethercom *ec = &adapter->osdep.ec;
3492 1.1 dyoung struct ixgbe_adv_tx_context_desc *TXD;
3493 1.1 dyoung struct ether_vlan_header *eh;
3494 1.1 dyoung struct ip ip;
3495 1.1 dyoung struct ip6_hdr ip6;
3496 1.14.2.5 riz u32 vlan_macip_lens = 0, type_tucmd_mlhl = 0;
3497 1.14.2.5 riz int ehdrlen, ip_hlen = 0;
3498 1.1 dyoung u16 etype;
3499 1.12 hannken u8 ipproto __diagused = 0;
3500 1.14.2.5 riz int offload = TRUE;
3501 1.14.2.5 riz int ctxd = txr->next_avail_desc;
3502 1.14.2.5 riz u16 vtag = 0;
3503 1.14.2.5 riz
3504 1.14.2.5 riz /* First check if TSO is to be used */
3505 1.14.2.5 riz if (mp->m_pkthdr.csum_flags & (M_CSUM_TSOv4|M_CSUM_TSOv6))
3506 1.14.2.5 riz return (ixgbe_tso_setup(txr, mp, cmd_type_len, olinfo_status));
3507 1.1 dyoung
3508 1.14.2.5 riz if ((mp->m_pkthdr.csum_flags & M_CSUM_OFFLOAD) == 0)
3509 1.14.2.5 riz offload = FALSE;
3510 1.1 dyoung
3511 1.14.2.5 riz /* Indicate the whole packet as payload when not doing TSO */
3512 1.14.2.5 riz *olinfo_status |= mp->m_pkthdr.len << IXGBE_ADVTXD_PAYLEN_SHIFT;
3513 1.14.2.5 riz
3514 1.14.2.5 riz /* Now ready a context descriptor */
3515 1.1 dyoung TXD = (struct ixgbe_adv_tx_context_desc *) &txr->tx_base[ctxd];
3516 1.1 dyoung
3517 1.1 dyoung /*
3518 1.1 dyoung ** In advanced descriptors the vlan tag must
3519 1.14.2.5 riz ** be placed into the context descriptor. Hence
3520 1.14.2.5 riz ** we need to make one even if not doing offloads.
3521 1.1 dyoung */
3522 1.1 dyoung if ((mtag = VLAN_OUTPUT_TAG(ec, mp)) != NULL) {
3523 1.1 dyoung vtag = htole16(VLAN_TAG_VALUE(mtag) & 0xffff);
3524 1.1 dyoung vlan_macip_lens |= (vtag << IXGBE_ADVTXD_VLAN_SHIFT);
3525 1.14.2.5 riz } else if (offload == FALSE) /* ... no offload to do */
3526 1.1 dyoung return 0;
3527 1.1 dyoung
3528 1.1 dyoung /*
3529 1.1 dyoung * Determine where frame payload starts.
3530 1.1 dyoung * Jump over vlan headers if already present,
3531 1.1 dyoung * helpful for QinQ too.
3532 1.1 dyoung */
3533 1.1 dyoung KASSERT(mp->m_len >= offsetof(struct ether_vlan_header, evl_tag));
3534 1.1 dyoung eh = mtod(mp, struct ether_vlan_header *);
3535 1.1 dyoung if (eh->evl_encap_proto == htons(ETHERTYPE_VLAN)) {
3536 1.1 dyoung KASSERT(mp->m_len >= sizeof(struct ether_vlan_header));
3537 1.1 dyoung etype = ntohs(eh->evl_proto);
3538 1.1 dyoung ehdrlen = ETHER_HDR_LEN + ETHER_VLAN_ENCAP_LEN;
3539 1.1 dyoung } else {
3540 1.1 dyoung etype = ntohs(eh->evl_encap_proto);
3541 1.1 dyoung ehdrlen = ETHER_HDR_LEN;
3542 1.1 dyoung }
3543 1.1 dyoung
3544 1.1 dyoung /* Set the ether header length */
3545 1.1 dyoung vlan_macip_lens |= ehdrlen << IXGBE_ADVTXD_MACLEN_SHIFT;
3546 1.1 dyoung
3547 1.1 dyoung switch (etype) {
3548 1.1 dyoung case ETHERTYPE_IP:
3549 1.1 dyoung m_copydata(mp, ehdrlen, sizeof(ip), &ip);
3550 1.1 dyoung ip_hlen = ip.ip_hl << 2;
3551 1.1 dyoung ipproto = ip.ip_p;
3552 1.1 dyoung #if 0
3553 1.1 dyoung ip.ip_sum = 0;
3554 1.1 dyoung m_copyback(mp, ehdrlen, sizeof(ip), &ip);
3555 1.1 dyoung #else
3556 1.1 dyoung KASSERT((mp->m_pkthdr.csum_flags & M_CSUM_IPv4) == 0 ||
3557 1.1 dyoung ip.ip_sum == 0);
3558 1.1 dyoung #endif
3559 1.1 dyoung type_tucmd_mlhl |= IXGBE_ADVTXD_TUCMD_IPV4;
3560 1.1 dyoung break;
3561 1.1 dyoung case ETHERTYPE_IPV6:
3562 1.1 dyoung m_copydata(mp, ehdrlen, sizeof(ip6), &ip6);
3563 1.1 dyoung ip_hlen = sizeof(ip6);
3564 1.14.2.4 riz /* XXX-BZ this will go badly in case of ext hdrs. */
3565 1.1 dyoung ipproto = ip6.ip6_nxt;
3566 1.1 dyoung type_tucmd_mlhl |= IXGBE_ADVTXD_TUCMD_IPV6;
3567 1.1 dyoung break;
3568 1.1 dyoung default:
3569 1.1 dyoung break;
3570 1.1 dyoung }
3571 1.1 dyoung
3572 1.1 dyoung if ((mp->m_pkthdr.csum_flags & M_CSUM_IPv4) != 0)
3573 1.14.2.5 riz *olinfo_status |= IXGBE_TXD_POPTS_IXSM << 8;
3574 1.1 dyoung
3575 1.1 dyoung vlan_macip_lens |= ip_hlen;
3576 1.1 dyoung type_tucmd_mlhl |= IXGBE_ADVTXD_DCMD_DEXT | IXGBE_ADVTXD_DTYP_CTXT;
3577 1.1 dyoung
3578 1.1 dyoung if (mp->m_pkthdr.csum_flags & (M_CSUM_TCPv4|M_CSUM_TCPv6)) {
3579 1.1 dyoung type_tucmd_mlhl |= IXGBE_ADVTXD_TUCMD_L4T_TCP;
3580 1.14.2.5 riz *olinfo_status |= IXGBE_TXD_POPTS_TXSM << 8;
3581 1.1 dyoung KASSERT(ipproto == IPPROTO_TCP);
3582 1.1 dyoung } else if (mp->m_pkthdr.csum_flags & (M_CSUM_UDPv4|M_CSUM_UDPv6)) {
3583 1.1 dyoung type_tucmd_mlhl |= IXGBE_ADVTXD_TUCMD_L4T_UDP;
3584 1.14.2.5 riz *olinfo_status |= IXGBE_TXD_POPTS_TXSM << 8;
3585 1.1 dyoung KASSERT(ipproto == IPPROTO_UDP);
3586 1.1 dyoung }
3587 1.1 dyoung
3588 1.1 dyoung /* Now copy bits into descriptor */
3589 1.14.2.5 riz TXD->vlan_macip_lens = htole32(vlan_macip_lens);
3590 1.14.2.5 riz TXD->type_tucmd_mlhl = htole32(type_tucmd_mlhl);
3591 1.1 dyoung TXD->seqnum_seed = htole32(0);
3592 1.1 dyoung TXD->mss_l4len_idx = htole32(0);
3593 1.1 dyoung
3594 1.1 dyoung /* We've consumed the first desc, adjust counters */
3595 1.14.2.5 riz if (++ctxd == txr->num_desc)
3596 1.1 dyoung ctxd = 0;
3597 1.1 dyoung txr->next_avail_desc = ctxd;
3598 1.1 dyoung --txr->tx_avail;
3599 1.1 dyoung
3600 1.14.2.5 riz return 0;
3601 1.1 dyoung }
3602 1.1 dyoung
3603 1.1 dyoung /**********************************************************************
3604 1.1 dyoung *
3605 1.1 dyoung * Setup work for hardware segmentation offload (TSO) on
3606 1.1 dyoung * adapters using advanced tx descriptors
3607 1.1 dyoung *
3608 1.1 dyoung **********************************************************************/
3609 1.14.2.5 riz static int
3610 1.14.2.5 riz ixgbe_tso_setup(struct tx_ring *txr, struct mbuf *mp,
3611 1.14.2.5 riz u32 *cmd_type_len, u32 *olinfo_status)
3612 1.1 dyoung {
3613 1.1 dyoung struct m_tag *mtag;
3614 1.1 dyoung struct adapter *adapter = txr->adapter;
3615 1.1 dyoung struct ethercom *ec = &adapter->osdep.ec;
3616 1.1 dyoung struct ixgbe_adv_tx_context_desc *TXD;
3617 1.1 dyoung u32 vlan_macip_lens = 0, type_tucmd_mlhl = 0;
3618 1.14.2.5 riz u32 mss_l4len_idx = 0, paylen;
3619 1.14.2.4 riz u16 vtag = 0, eh_type;
3620 1.14.2.4 riz int ctxd, ehdrlen, ip_hlen, tcp_hlen;
3621 1.1 dyoung struct ether_vlan_header *eh;
3622 1.14.2.4 riz #ifdef INET6
3623 1.14.2.4 riz struct ip6_hdr *ip6;
3624 1.14.2.4 riz #endif
3625 1.14.2.4 riz #ifdef INET
3626 1.1 dyoung struct ip *ip;
3627 1.14.2.4 riz #endif
3628 1.1 dyoung struct tcphdr *th;
3629 1.1 dyoung
3630 1.1 dyoung
3631 1.1 dyoung /*
3632 1.1 dyoung * Determine where frame payload starts.
3633 1.1 dyoung * Jump over vlan headers if already present
3634 1.1 dyoung */
3635 1.1 dyoung eh = mtod(mp, struct ether_vlan_header *);
3636 1.14.2.4 riz if (eh->evl_encap_proto == htons(ETHERTYPE_VLAN)) {
3637 1.1 dyoung ehdrlen = ETHER_HDR_LEN + ETHER_VLAN_ENCAP_LEN;
3638 1.14.2.4 riz eh_type = eh->evl_proto;
3639 1.14.2.4 riz } else {
3640 1.1 dyoung ehdrlen = ETHER_HDR_LEN;
3641 1.14.2.4 riz eh_type = eh->evl_encap_proto;
3642 1.14.2.4 riz }
3643 1.1 dyoung
3644 1.14.2.4 riz switch (ntohs(eh_type)) {
3645 1.14.2.4 riz #ifdef INET6
3646 1.14.2.4 riz case ETHERTYPE_IPV6:
3647 1.14.2.4 riz ip6 = (struct ip6_hdr *)(mp->m_data + ehdrlen);
3648 1.14.2.4 riz /* XXX-BZ For now we do not pretend to support ext. hdrs. */
3649 1.14.2.4 riz if (ip6->ip6_nxt != IPPROTO_TCP)
3650 1.14.2.5 riz return (ENXIO);
3651 1.14.2.4 riz ip_hlen = sizeof(struct ip6_hdr);
3652 1.14.2.5 riz ip6 = (struct ip6_hdr *)(mp->m_data + ehdrlen);
3653 1.14.2.4 riz th = (struct tcphdr *)((char *)ip6 + ip_hlen);
3654 1.14.2.4 riz th->th_sum = in6_cksum_phdr(&ip6->ip6_src,
3655 1.14.2.4 riz &ip6->ip6_dst, 0, htonl(IPPROTO_TCP));
3656 1.14.2.4 riz type_tucmd_mlhl |= IXGBE_ADVTXD_TUCMD_IPV6;
3657 1.14.2.4 riz break;
3658 1.14.2.4 riz #endif
3659 1.14.2.4 riz #ifdef INET
3660 1.14.2.4 riz case ETHERTYPE_IP:
3661 1.14.2.4 riz ip = (struct ip *)(mp->m_data + ehdrlen);
3662 1.14.2.4 riz if (ip->ip_p != IPPROTO_TCP)
3663 1.14.2.5 riz return (ENXIO);
3664 1.14.2.4 riz ip->ip_sum = 0;
3665 1.14.2.4 riz ip_hlen = ip->ip_hl << 2;
3666 1.14.2.4 riz th = (struct tcphdr *)((char *)ip + ip_hlen);
3667 1.14.2.4 riz th->th_sum = in_cksum_phdr(ip->ip_src.s_addr,
3668 1.14.2.4 riz ip->ip_dst.s_addr, htons(IPPROTO_TCP));
3669 1.14.2.4 riz type_tucmd_mlhl |= IXGBE_ADVTXD_TUCMD_IPV4;
3670 1.14.2.4 riz /* Tell transmit desc to also do IPv4 checksum. */
3671 1.14.2.4 riz *olinfo_status |= IXGBE_TXD_POPTS_IXSM << 8;
3672 1.14.2.4 riz break;
3673 1.14.2.4 riz #endif
3674 1.14.2.4 riz default:
3675 1.14.2.4 riz panic("%s: CSUM_TSO but no supported IP version (0x%04x)",
3676 1.14.2.4 riz __func__, ntohs(eh_type));
3677 1.14.2.4 riz break;
3678 1.14.2.4 riz }
3679 1.1 dyoung
3680 1.1 dyoung ctxd = txr->next_avail_desc;
3681 1.1 dyoung TXD = (struct ixgbe_adv_tx_context_desc *) &txr->tx_base[ctxd];
3682 1.1 dyoung
3683 1.1 dyoung tcp_hlen = th->th_off << 2;
3684 1.1 dyoung
3685 1.1 dyoung /* This is used in the transmit desc in encap */
3686 1.14.2.5 riz paylen = mp->m_pkthdr.len - ehdrlen - ip_hlen - tcp_hlen;
3687 1.1 dyoung
3688 1.1 dyoung /* VLAN MACLEN IPLEN */
3689 1.1 dyoung if ((mtag = VLAN_OUTPUT_TAG(ec, mp)) != NULL) {
3690 1.1 dyoung vtag = htole16(VLAN_TAG_VALUE(mtag) & 0xffff);
3691 1.1 dyoung vlan_macip_lens |= (vtag << IXGBE_ADVTXD_VLAN_SHIFT);
3692 1.1 dyoung }
3693 1.1 dyoung
3694 1.1 dyoung vlan_macip_lens |= ehdrlen << IXGBE_ADVTXD_MACLEN_SHIFT;
3695 1.1 dyoung vlan_macip_lens |= ip_hlen;
3696 1.14.2.5 riz TXD->vlan_macip_lens = htole32(vlan_macip_lens);
3697 1.1 dyoung
3698 1.1 dyoung /* ADV DTYPE TUCMD */
3699 1.1 dyoung type_tucmd_mlhl |= IXGBE_ADVTXD_DCMD_DEXT | IXGBE_ADVTXD_DTYP_CTXT;
3700 1.1 dyoung type_tucmd_mlhl |= IXGBE_ADVTXD_TUCMD_L4T_TCP;
3701 1.14.2.5 riz TXD->type_tucmd_mlhl = htole32(type_tucmd_mlhl);
3702 1.1 dyoung
3703 1.1 dyoung /* MSS L4LEN IDX */
3704 1.1 dyoung mss_l4len_idx |= (mp->m_pkthdr.segsz << IXGBE_ADVTXD_MSS_SHIFT);
3705 1.1 dyoung mss_l4len_idx |= (tcp_hlen << IXGBE_ADVTXD_L4LEN_SHIFT);
3706 1.1 dyoung TXD->mss_l4len_idx = htole32(mss_l4len_idx);
3707 1.1 dyoung
3708 1.1 dyoung TXD->seqnum_seed = htole32(0);
3709 1.1 dyoung
3710 1.14.2.5 riz if (++ctxd == txr->num_desc)
3711 1.1 dyoung ctxd = 0;
3712 1.1 dyoung
3713 1.1 dyoung txr->tx_avail--;
3714 1.1 dyoung txr->next_avail_desc = ctxd;
3715 1.14.2.5 riz *cmd_type_len |= IXGBE_ADVTXD_DCMD_TSE;
3716 1.14.2.5 riz *olinfo_status |= IXGBE_TXD_POPTS_TXSM << 8;
3717 1.14.2.5 riz *olinfo_status |= paylen << IXGBE_ADVTXD_PAYLEN_SHIFT;
3718 1.14.2.5 riz ++txr->tso_tx.ev_count;
3719 1.14.2.5 riz return (0);
3720 1.1 dyoung }
3721 1.1 dyoung
3722 1.1 dyoung #ifdef IXGBE_FDIR
3723 1.1 dyoung /*
3724 1.1 dyoung ** This routine parses packet headers so that Flow
3725 1.1 dyoung ** Director can make a hashed filter table entry
3726 1.1 dyoung ** allowing traffic flows to be identified and kept
3727 1.1 dyoung ** on the same cpu. This would be a performance
3728 1.1 dyoung ** hit, but we only do it at IXGBE_FDIR_RATE of
3729 1.1 dyoung ** packets.
3730 1.1 dyoung */
3731 1.1 dyoung static void
3732 1.1 dyoung ixgbe_atr(struct tx_ring *txr, struct mbuf *mp)
3733 1.1 dyoung {
3734 1.1 dyoung struct adapter *adapter = txr->adapter;
3735 1.1 dyoung struct ix_queue *que;
3736 1.1 dyoung struct ip *ip;
3737 1.1 dyoung struct tcphdr *th;
3738 1.1 dyoung struct udphdr *uh;
3739 1.1 dyoung struct ether_vlan_header *eh;
3740 1.1 dyoung union ixgbe_atr_hash_dword input = {.dword = 0};
3741 1.1 dyoung union ixgbe_atr_hash_dword common = {.dword = 0};
3742 1.1 dyoung int ehdrlen, ip_hlen;
3743 1.1 dyoung u16 etype;
3744 1.1 dyoung
3745 1.1 dyoung eh = mtod(mp, struct ether_vlan_header *);
3746 1.1 dyoung if (eh->evl_encap_proto == htons(ETHERTYPE_VLAN)) {
3747 1.1 dyoung ehdrlen = ETHER_HDR_LEN + ETHER_VLAN_ENCAP_LEN;
3748 1.1 dyoung etype = eh->evl_proto;
3749 1.1 dyoung } else {
3750 1.1 dyoung ehdrlen = ETHER_HDR_LEN;
3751 1.1 dyoung etype = eh->evl_encap_proto;
3752 1.1 dyoung }
3753 1.1 dyoung
3754 1.1 dyoung /* Only handling IPv4 */
3755 1.1 dyoung if (etype != htons(ETHERTYPE_IP))
3756 1.1 dyoung return;
3757 1.1 dyoung
3758 1.1 dyoung ip = (struct ip *)(mp->m_data + ehdrlen);
3759 1.1 dyoung ip_hlen = ip->ip_hl << 2;
3760 1.1 dyoung
3761 1.1 dyoung /* check if we're UDP or TCP */
3762 1.1 dyoung switch (ip->ip_p) {
3763 1.1 dyoung case IPPROTO_TCP:
3764 1.1 dyoung th = (struct tcphdr *)((char *)ip + ip_hlen);
3765 1.1 dyoung /* src and dst are inverted */
3766 1.1 dyoung common.port.dst ^= th->th_sport;
3767 1.1 dyoung common.port.src ^= th->th_dport;
3768 1.1 dyoung input.formatted.flow_type ^= IXGBE_ATR_FLOW_TYPE_TCPV4;
3769 1.1 dyoung break;
3770 1.1 dyoung case IPPROTO_UDP:
3771 1.1 dyoung uh = (struct udphdr *)((char *)ip + ip_hlen);
3772 1.1 dyoung /* src and dst are inverted */
3773 1.1 dyoung common.port.dst ^= uh->uh_sport;
3774 1.1 dyoung common.port.src ^= uh->uh_dport;
3775 1.1 dyoung input.formatted.flow_type ^= IXGBE_ATR_FLOW_TYPE_UDPV4;
3776 1.1 dyoung break;
3777 1.1 dyoung default:
3778 1.1 dyoung return;
3779 1.1 dyoung }
3780 1.1 dyoung
3781 1.1 dyoung input.formatted.vlan_id = htobe16(mp->m_pkthdr.ether_vtag);
3782 1.1 dyoung if (mp->m_pkthdr.ether_vtag)
3783 1.1 dyoung common.flex_bytes ^= htons(ETHERTYPE_VLAN);
3784 1.1 dyoung else
3785 1.1 dyoung common.flex_bytes ^= etype;
3786 1.1 dyoung common.ip ^= ip->ip_src.s_addr ^ ip->ip_dst.s_addr;
3787 1.1 dyoung
3788 1.1 dyoung que = &adapter->queues[txr->me];
3789 1.1 dyoung /*
3790 1.1 dyoung ** This assumes the Rx queue and Tx
3791 1.1 dyoung ** queue are bound to the same CPU
3792 1.1 dyoung */
3793 1.1 dyoung ixgbe_fdir_add_signature_filter_82599(&adapter->hw,
3794 1.1 dyoung input, common, que->msix);
3795 1.1 dyoung }
3796 1.1 dyoung #endif /* IXGBE_FDIR */
3797 1.1 dyoung
3798 1.1 dyoung /**********************************************************************
3799 1.1 dyoung *
3800 1.1 dyoung * Examine each tx_buffer in the used queue. If the hardware is done
3801 1.1 dyoung * processing the packet then free associated resources. The
3802 1.1 dyoung * tx_buffer is put back on the free queue.
3803 1.1 dyoung *
3804 1.1 dyoung **********************************************************************/
3805 1.1 dyoung static bool
3806 1.1 dyoung ixgbe_txeof(struct tx_ring *txr)
3807 1.1 dyoung {
3808 1.14.2.5 riz struct adapter *adapter = txr->adapter;
3809 1.14.2.5 riz struct ifnet *ifp = adapter->ifp;
3810 1.14.2.5 riz u32 work, processed = 0;
3811 1.14.2.5 riz u16 limit = txr->process_limit;
3812 1.14.2.5 riz struct ixgbe_tx_buf *buf;
3813 1.14.2.5 riz union ixgbe_adv_tx_desc *txd;
3814 1.1 dyoung struct timeval now, elapsed;
3815 1.1 dyoung
3816 1.1 dyoung KASSERT(mutex_owned(&txr->tx_mtx));
3817 1.1 dyoung
3818 1.14.2.3 martin #ifdef DEV_NETMAP
3819 1.14.2.3 martin if (ifp->if_capenable & IFCAP_NETMAP) {
3820 1.14.2.3 martin struct netmap_adapter *na = NA(ifp);
3821 1.14.2.3 martin struct netmap_kring *kring = &na->tx_rings[txr->me];
3822 1.14.2.5 riz txd = txr->tx_base;
3823 1.14.2.3 martin bus_dmamap_sync(txr->txdma.dma_tag, txr->txdma.dma_map,
3824 1.14.2.3 martin BUS_DMASYNC_POSTREAD);
3825 1.14.2.3 martin /*
3826 1.14.2.3 martin * In netmap mode, all the work is done in the context
3827 1.14.2.3 martin * of the client thread. Interrupt handlers only wake up
3828 1.14.2.3 martin * clients, which may be sleeping on individual rings
3829 1.14.2.3 martin * or on a global resource for all rings.
3830 1.14.2.3 martin * To implement tx interrupt mitigation, we wake up the client
3831 1.14.2.3 martin * thread roughly every half ring, even if the NIC interrupts
3832 1.14.2.3 martin * more frequently. This is implemented as follows:
3833 1.14.2.3 martin * - ixgbe_txsync() sets kring->nr_kflags with the index of
3834 1.14.2.3 martin * the slot that should wake up the thread (nkr_num_slots
3835 1.14.2.3 martin * means the user thread should not be woken up);
3836 1.14.2.3 martin * - the driver ignores tx interrupts unless netmap_mitigate=0
3837 1.14.2.3 martin * or the slot has the DD bit set.
3838 1.14.2.3 martin *
3839 1.14.2.3 martin * When the driver has separate locks, we need to
3840 1.14.2.3 martin * release and re-acquire txlock to avoid deadlocks.
3841 1.14.2.3 martin * XXX see if we can find a better way.
3842 1.14.2.3 martin */
3843 1.14.2.3 martin if (!netmap_mitigate ||
3844 1.14.2.3 martin (kring->nr_kflags < kring->nkr_num_slots &&
3845 1.14.2.5 riz txd[kring->nr_kflags].wb.status & IXGBE_TXD_STAT_DD)) {
3846 1.14.2.5 riz netmap_tx_irq(ifp, txr->me |
3847 1.14.2.5 riz (NETMAP_LOCKED_ENTER|NETMAP_LOCKED_EXIT));
3848 1.14.2.3 martin }
3849 1.14.2.3 martin return FALSE;
3850 1.14.2.3 martin }
3851 1.14.2.3 martin #endif /* DEV_NETMAP */
3852 1.14.2.3 martin
3853 1.14.2.5 riz if (txr->tx_avail == txr->num_desc) {
3854 1.1 dyoung txr->queue_status = IXGBE_QUEUE_IDLE;
3855 1.1 dyoung return false;
3856 1.1 dyoung }
3857 1.1 dyoung
3858 1.14.2.5 riz /* Get work starting point */
3859 1.14.2.5 riz work = txr->next_to_clean;
3860 1.14.2.5 riz buf = &txr->tx_buffers[work];
3861 1.14.2.5 riz txd = &txr->tx_base[work];
3862 1.14.2.5 riz work -= txr->num_desc; /* The distance to ring end */
3863 1.1 dyoung ixgbe_dmamap_sync(txr->txdma.dma_tag, txr->txdma.dma_map,
3864 1.1 dyoung BUS_DMASYNC_POSTREAD);
3865 1.14.2.5 riz do {
3866 1.14.2.5 riz union ixgbe_adv_tx_desc *eop= buf->eop;
3867 1.14.2.5 riz if (eop == NULL) /* No work */
3868 1.14.2.5 riz break;
3869 1.1 dyoung
3870 1.14.2.5 riz if ((eop->wb.status & IXGBE_TXD_STAT_DD) == 0)
3871 1.14.2.5 riz break; /* I/O not complete */
3872 1.14.2.5 riz
3873 1.14.2.5 riz if (buf->m_head) {
3874 1.14.2.5 riz txr->bytes +=
3875 1.14.2.5 riz buf->m_head->m_pkthdr.len;
3876 1.14.2.5 riz bus_dmamap_sync(txr->txtag->dt_dmat,
3877 1.14.2.5 riz buf->map,
3878 1.14.2.5 riz 0, buf->m_head->m_pkthdr.len,
3879 1.14.2.5 riz BUS_DMASYNC_POSTWRITE);
3880 1.14.2.5 riz ixgbe_dmamap_unload(txr->txtag,
3881 1.14.2.5 riz buf->map);
3882 1.14.2.5 riz m_freem(buf->m_head);
3883 1.14.2.5 riz buf->m_head = NULL;
3884 1.14.2.5 riz /*
3885 1.14.2.5 riz * NetBSD: Don't override buf->map with NULL here.
3886 1.14.2.5 riz * It'll panic when a ring runs one lap around.
3887 1.14.2.5 riz */
3888 1.14.2.5 riz }
3889 1.14.2.5 riz buf->eop = NULL;
3890 1.14.2.5 riz ++txr->tx_avail;
3891 1.14.2.5 riz
3892 1.14.2.5 riz /* We clean the range if multi segment */
3893 1.14.2.5 riz while (txd != eop) {
3894 1.14.2.5 riz ++txd;
3895 1.14.2.5 riz ++buf;
3896 1.14.2.5 riz ++work;
3897 1.14.2.5 riz /* wrap the ring? */
3898 1.14.2.5 riz if (__predict_false(!work)) {
3899 1.14.2.5 riz work -= txr->num_desc;
3900 1.14.2.5 riz buf = txr->tx_buffers;
3901 1.14.2.5 riz txd = txr->tx_base;
3902 1.14.2.5 riz }
3903 1.14.2.5 riz if (buf->m_head) {
3904 1.1 dyoung txr->bytes +=
3905 1.14.2.5 riz buf->m_head->m_pkthdr.len;
3906 1.1 dyoung bus_dmamap_sync(txr->txtag->dt_dmat,
3907 1.14.2.5 riz buf->map,
3908 1.14.2.5 riz 0, buf->m_head->m_pkthdr.len,
3909 1.1 dyoung BUS_DMASYNC_POSTWRITE);
3910 1.14.2.5 riz ixgbe_dmamap_unload(txr->txtag,
3911 1.14.2.5 riz buf->map);
3912 1.14.2.5 riz m_freem(buf->m_head);
3913 1.14.2.5 riz buf->m_head = NULL;
3914 1.14.2.5 riz /*
3915 1.14.2.5 riz * NetBSD: Don't override buf->map with NULL
3916 1.14.2.5 riz * here. It'll panic when a ring runs one lap
3917 1.14.2.5 riz * around.
3918 1.14.2.5 riz */
3919 1.1 dyoung }
3920 1.14.2.5 riz ++txr->tx_avail;
3921 1.14.2.5 riz buf->eop = NULL;
3922 1.1 dyoung
3923 1.1 dyoung }
3924 1.1 dyoung ++txr->packets;
3925 1.14.2.5 riz ++processed;
3926 1.1 dyoung ++ifp->if_opackets;
3927 1.14.2.5 riz getmicrotime(&txr->watchdog_time);
3928 1.14.2.5 riz
3929 1.14.2.5 riz /* Try the next packet */
3930 1.14.2.5 riz ++txd;
3931 1.14.2.5 riz ++buf;
3932 1.14.2.5 riz ++work;
3933 1.14.2.5 riz /* reset with a wrap */
3934 1.14.2.5 riz if (__predict_false(!work)) {
3935 1.14.2.5 riz work -= txr->num_desc;
3936 1.14.2.5 riz buf = txr->tx_buffers;
3937 1.14.2.5 riz txd = txr->tx_base;
3938 1.14.2.5 riz }
3939 1.14.2.5 riz prefetch(txd);
3940 1.14.2.5 riz } while (__predict_true(--limit));
3941 1.14.2.5 riz
3942 1.1 dyoung ixgbe_dmamap_sync(txr->txdma.dma_tag, txr->txdma.dma_map,
3943 1.1 dyoung BUS_DMASYNC_PREREAD | BUS_DMASYNC_PREWRITE);
3944 1.1 dyoung
3945 1.14.2.5 riz work += txr->num_desc;
3946 1.14.2.5 riz txr->next_to_clean = work;
3947 1.1 dyoung
3948 1.1 dyoung /*
3949 1.1 dyoung ** Watchdog calculation, we know there's
3950 1.1 dyoung ** work outstanding or the first return
3951 1.1 dyoung ** would have been taken, so none processed
3952 1.1 dyoung ** for too long indicates a hang.
3953 1.1 dyoung */
3954 1.1 dyoung getmicrotime(&now);
3955 1.1 dyoung timersub(&now, &txr->watchdog_time, &elapsed);
3956 1.1 dyoung if (!processed && tvtohz(&elapsed) > IXGBE_WATCHDOG)
3957 1.1 dyoung txr->queue_status = IXGBE_QUEUE_HUNG;
3958 1.1 dyoung
3959 1.14.2.5 riz if (txr->tx_avail == txr->num_desc) {
3960 1.14.2.4 riz txr->queue_status = IXGBE_QUEUE_IDLE;
3961 1.14.2.4 riz return false;
3962 1.1 dyoung }
3963 1.1 dyoung
3964 1.1 dyoung return true;
3965 1.1 dyoung }
3966 1.1 dyoung
3967 1.1 dyoung /*********************************************************************
3968 1.1 dyoung *
3969 1.1 dyoung * Refresh mbuf buffers for RX descriptor rings
3970 1.1 dyoung * - now keeps its own state so discards due to resource
3971 1.1 dyoung * exhaustion are unnecessary, if an mbuf cannot be obtained
3972 1.1 dyoung * it just returns, keeping its placeholder, thus it can simply
3973 1.1 dyoung * be recalled to try again.
3974 1.1 dyoung *
3975 1.1 dyoung **********************************************************************/
3976 1.1 dyoung static void
3977 1.1 dyoung ixgbe_refresh_mbufs(struct rx_ring *rxr, int limit)
3978 1.1 dyoung {
3979 1.1 dyoung struct adapter *adapter = rxr->adapter;
3980 1.1 dyoung struct ixgbe_rx_buf *rxbuf;
3981 1.14.2.4 riz struct mbuf *mp;
3982 1.1 dyoung int i, j, error;
3983 1.1 dyoung bool refreshed = false;
3984 1.1 dyoung
3985 1.1 dyoung i = j = rxr->next_to_refresh;
3986 1.1 dyoung /* Control the loop with one beyond */
3987 1.14.2.5 riz if (++j == rxr->num_desc)
3988 1.1 dyoung j = 0;
3989 1.1 dyoung
3990 1.1 dyoung while (j != limit) {
3991 1.1 dyoung rxbuf = &rxr->rx_buffers[i];
3992 1.14.2.4 riz if (rxbuf->buf == NULL) {
3993 1.14.2.5 riz mp = ixgbe_getjcl(&adapter->jcl_head, M_NOWAIT,
3994 1.14.2.5 riz MT_DATA, M_PKTHDR, rxr->mbuf_sz);
3995 1.1 dyoung if (mp == NULL) {
3996 1.1 dyoung rxr->no_jmbuf.ev_count++;
3997 1.1 dyoung goto update;
3998 1.1 dyoung }
3999 1.14.2.5 riz if (adapter->max_frame_size <= (MCLBYTES - ETHER_ALIGN))
4000 1.14.2.5 riz m_adj(mp, ETHER_ALIGN);
4001 1.1 dyoung } else
4002 1.14.2.4 riz mp = rxbuf->buf;
4003 1.1 dyoung
4004 1.14.2.5 riz mp->m_pkthdr.len = mp->m_len = rxr->mbuf_sz;
4005 1.14.2.4 riz /* If we're dealing with an mbuf that was copied rather
4006 1.14.2.4 riz * than replaced, there's no need to go through busdma.
4007 1.14.2.4 riz */
4008 1.14.2.4 riz if ((rxbuf->flags & IXGBE_RX_COPY) == 0) {
4009 1.14.2.4 riz /* Get the memory mapping */
4010 1.14.2.5 riz error = bus_dmamap_load_mbuf(rxr->ptag->dt_dmat,
4011 1.14.2.5 riz rxbuf->pmap, mp, BUS_DMA_NOWAIT);
4012 1.14.2.4 riz if (error != 0) {
4013 1.14.2.4 riz printf("Refresh mbufs: payload dmamap load"
4014 1.14.2.4 riz " failure - %d\n", error);
4015 1.14.2.4 riz m_free(mp);
4016 1.14.2.4 riz rxbuf->buf = NULL;
4017 1.14.2.4 riz goto update;
4018 1.14.2.4 riz }
4019 1.14.2.4 riz rxbuf->buf = mp;
4020 1.14.2.5 riz bus_dmamap_sync(rxr->ptag->dt_dmat, rxbuf->pmap,
4021 1.14.2.4 riz 0, mp->m_pkthdr.len, BUS_DMASYNC_PREREAD);
4022 1.14.2.4 riz rxbuf->addr = rxr->rx_base[i].read.pkt_addr =
4023 1.14.2.5 riz htole64(rxbuf->pmap->dm_segs[0].ds_addr);
4024 1.14.2.4 riz } else {
4025 1.14.2.4 riz rxr->rx_base[i].read.pkt_addr = rxbuf->addr;
4026 1.14.2.4 riz rxbuf->flags &= ~IXGBE_RX_COPY;
4027 1.14.2.4 riz }
4028 1.1 dyoung
4029 1.1 dyoung refreshed = true;
4030 1.1 dyoung /* Next is precalculated */
4031 1.1 dyoung i = j;
4032 1.1 dyoung rxr->next_to_refresh = i;
4033 1.14.2.5 riz if (++j == rxr->num_desc)
4034 1.1 dyoung j = 0;
4035 1.1 dyoung }
4036 1.1 dyoung update:
4037 1.1 dyoung if (refreshed) /* Update hardware tail index */
4038 1.1 dyoung IXGBE_WRITE_REG(&adapter->hw,
4039 1.1 dyoung IXGBE_RDT(rxr->me), rxr->next_to_refresh);
4040 1.1 dyoung return;
4041 1.1 dyoung }
4042 1.1 dyoung
4043 1.1 dyoung /*********************************************************************
4044 1.1 dyoung *
4045 1.1 dyoung * Allocate memory for rx_buffer structures. Since we use one
4046 1.1 dyoung * rx_buffer per received packet, the maximum number of rx_buffer's
4047 1.1 dyoung * that we'll need is equal to the number of receive descriptors
4048 1.1 dyoung * that we've allocated.
4049 1.1 dyoung *
4050 1.1 dyoung **********************************************************************/
4051 1.1 dyoung static int
4052 1.1 dyoung ixgbe_allocate_receive_buffers(struct rx_ring *rxr)
4053 1.1 dyoung {
4054 1.1 dyoung struct adapter *adapter = rxr->adapter;
4055 1.1 dyoung device_t dev = adapter->dev;
4056 1.1 dyoung struct ixgbe_rx_buf *rxbuf;
4057 1.1 dyoung int i, bsize, error;
4058 1.1 dyoung
4059 1.14.2.5 riz bsize = sizeof(struct ixgbe_rx_buf) * rxr->num_desc;
4060 1.1 dyoung if (!(rxr->rx_buffers =
4061 1.1 dyoung (struct ixgbe_rx_buf *) malloc(bsize,
4062 1.1 dyoung M_DEVBUF, M_NOWAIT | M_ZERO))) {
4063 1.1 dyoung aprint_error_dev(dev, "Unable to allocate rx_buffer memory\n");
4064 1.1 dyoung error = ENOMEM;
4065 1.1 dyoung goto fail;
4066 1.1 dyoung }
4067 1.1 dyoung
4068 1.1 dyoung if ((error = ixgbe_dma_tag_create(adapter->osdep.dmat, /* parent */
4069 1.1 dyoung 1, 0, /* alignment, bounds */
4070 1.1 dyoung MJUM16BYTES, /* maxsize */
4071 1.1 dyoung 1, /* nsegments */
4072 1.1 dyoung MJUM16BYTES, /* maxsegsize */
4073 1.1 dyoung 0, /* flags */
4074 1.14.2.5 riz &rxr->ptag))) {
4075 1.1 dyoung aprint_error_dev(dev, "Unable to create RX DMA tag\n");
4076 1.1 dyoung goto fail;
4077 1.1 dyoung }
4078 1.1 dyoung
4079 1.14.2.5 riz for (i = 0; i < rxr->num_desc; i++, rxbuf++) {
4080 1.1 dyoung rxbuf = &rxr->rx_buffers[i];
4081 1.14.2.5 riz error = ixgbe_dmamap_create(rxr->ptag,
4082 1.14.2.5 riz BUS_DMA_NOWAIT, &rxbuf->pmap);
4083 1.1 dyoung if (error) {
4084 1.14.2.4 riz aprint_error_dev(dev, "Unable to create RX dma map\n");
4085 1.1 dyoung goto fail;
4086 1.1 dyoung }
4087 1.1 dyoung }
4088 1.1 dyoung
4089 1.1 dyoung return (0);
4090 1.1 dyoung
4091 1.1 dyoung fail:
4092 1.1 dyoung /* Frees all, but can handle partial completion */
4093 1.1 dyoung ixgbe_free_receive_structures(adapter);
4094 1.1 dyoung return (error);
4095 1.1 dyoung }
4096 1.1 dyoung
4097 1.1 dyoung /*
4098 1.1 dyoung ** Used to detect a descriptor that has
4099 1.1 dyoung ** been merged by Hardware RSC.
4100 1.1 dyoung */
4101 1.1 dyoung static inline u32
4102 1.1 dyoung ixgbe_rsc_count(union ixgbe_adv_rx_desc *rx)
4103 1.1 dyoung {
4104 1.1 dyoung return (le32toh(rx->wb.lower.lo_dword.data) &
4105 1.1 dyoung IXGBE_RXDADV_RSCCNT_MASK) >> IXGBE_RXDADV_RSCCNT_SHIFT;
4106 1.1 dyoung }
4107 1.1 dyoung
4108 1.1 dyoung /*********************************************************************
4109 1.1 dyoung *
4110 1.1 dyoung * Initialize Hardware RSC (LRO) feature on 82599
4111 1.1 dyoung * for an RX ring, this is toggled by the LRO capability
4112 1.1 dyoung * even though it is transparent to the stack.
4113 1.1 dyoung *
4114 1.14.2.4 riz * NOTE: since this HW feature only works with IPV4 and
4115 1.14.2.4 riz * our testing has shown soft LRO to be as effective
4116 1.14.2.4 riz * I have decided to disable this by default.
4117 1.14.2.4 riz *
4118 1.1 dyoung **********************************************************************/
4119 1.1 dyoung static void
4120 1.1 dyoung ixgbe_setup_hw_rsc(struct rx_ring *rxr)
4121 1.1 dyoung {
4122 1.1 dyoung struct adapter *adapter = rxr->adapter;
4123 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
4124 1.1 dyoung u32 rscctrl, rdrxctl;
4125 1.1 dyoung
4126 1.14.2.4 riz /* If turning LRO/RSC off we need to disable it */
4127 1.14.2.4 riz if ((adapter->ifp->if_capenable & IFCAP_LRO) == 0) {
4128 1.14.2.4 riz rscctrl = IXGBE_READ_REG(hw, IXGBE_RSCCTL(rxr->me));
4129 1.14.2.4 riz rscctrl &= ~IXGBE_RSCCTL_RSCEN;
4130 1.14.2.4 riz return;
4131 1.14.2.4 riz }
4132 1.14.2.4 riz
4133 1.1 dyoung rdrxctl = IXGBE_READ_REG(hw, IXGBE_RDRXCTL);
4134 1.1 dyoung rdrxctl &= ~IXGBE_RDRXCTL_RSCFRSTSIZE;
4135 1.14.2.4 riz #ifdef DEV_NETMAP /* crcstrip is optional in netmap */
4136 1.14.2.4 riz if (adapter->ifp->if_capenable & IFCAP_NETMAP && !ix_crcstrip)
4137 1.14.2.4 riz #endif /* DEV_NETMAP */
4138 1.1 dyoung rdrxctl |= IXGBE_RDRXCTL_CRCSTRIP;
4139 1.1 dyoung rdrxctl |= IXGBE_RDRXCTL_RSCACKC;
4140 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_RDRXCTL, rdrxctl);
4141 1.1 dyoung
4142 1.1 dyoung rscctrl = IXGBE_READ_REG(hw, IXGBE_RSCCTL(rxr->me));
4143 1.1 dyoung rscctrl |= IXGBE_RSCCTL_RSCEN;
4144 1.1 dyoung /*
4145 1.1 dyoung ** Limit the total number of descriptors that
4146 1.1 dyoung ** can be combined, so it does not exceed 64K
4147 1.1 dyoung */
4148 1.14.2.5 riz if (rxr->mbuf_sz == MCLBYTES)
4149 1.1 dyoung rscctrl |= IXGBE_RSCCTL_MAXDESC_16;
4150 1.14.2.5 riz else if (rxr->mbuf_sz == MJUMPAGESIZE)
4151 1.1 dyoung rscctrl |= IXGBE_RSCCTL_MAXDESC_8;
4152 1.14.2.5 riz else if (rxr->mbuf_sz == MJUM9BYTES)
4153 1.1 dyoung rscctrl |= IXGBE_RSCCTL_MAXDESC_4;
4154 1.1 dyoung else /* Using 16K cluster */
4155 1.1 dyoung rscctrl |= IXGBE_RSCCTL_MAXDESC_1;
4156 1.1 dyoung
4157 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_RSCCTL(rxr->me), rscctrl);
4158 1.1 dyoung
4159 1.1 dyoung /* Enable TCP header recognition */
4160 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_PSRTYPE(0),
4161 1.1 dyoung (IXGBE_READ_REG(hw, IXGBE_PSRTYPE(0)) |
4162 1.1 dyoung IXGBE_PSRTYPE_TCPHDR));
4163 1.1 dyoung
4164 1.1 dyoung /* Disable RSC for ACK packets */
4165 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_RSCDBU,
4166 1.1 dyoung (IXGBE_RSCDBU_RSCACKDIS | IXGBE_READ_REG(hw, IXGBE_RSCDBU)));
4167 1.1 dyoung
4168 1.1 dyoung rxr->hw_rsc = TRUE;
4169 1.1 dyoung }
4170 1.1 dyoung
4171 1.1 dyoung
4172 1.1 dyoung static void
4173 1.1 dyoung ixgbe_free_receive_ring(struct rx_ring *rxr)
4174 1.1 dyoung {
4175 1.1 dyoung struct ixgbe_rx_buf *rxbuf;
4176 1.1 dyoung int i;
4177 1.1 dyoung
4178 1.14.2.5 riz for (i = 0; i < rxr->num_desc; i++) {
4179 1.1 dyoung rxbuf = &rxr->rx_buffers[i];
4180 1.14.2.4 riz if (rxbuf->buf != NULL) {
4181 1.14.2.5 riz bus_dmamap_sync(rxr->ptag->dt_dmat, rxbuf->pmap,
4182 1.14.2.4 riz 0, rxbuf->buf->m_pkthdr.len,
4183 1.1 dyoung BUS_DMASYNC_POSTREAD);
4184 1.14.2.5 riz ixgbe_dmamap_unload(rxr->ptag, rxbuf->pmap);
4185 1.14.2.4 riz rxbuf->buf->m_flags |= M_PKTHDR;
4186 1.14.2.4 riz m_freem(rxbuf->buf);
4187 1.14.2.4 riz rxbuf->buf = NULL;
4188 1.1 dyoung }
4189 1.1 dyoung }
4190 1.1 dyoung }
4191 1.1 dyoung
4192 1.1 dyoung
4193 1.1 dyoung /*********************************************************************
4194 1.1 dyoung *
4195 1.1 dyoung * Initialize a receive ring and its buffers.
4196 1.1 dyoung *
4197 1.1 dyoung **********************************************************************/
4198 1.1 dyoung static int
4199 1.1 dyoung ixgbe_setup_receive_ring(struct rx_ring *rxr)
4200 1.1 dyoung {
4201 1.1 dyoung struct adapter *adapter;
4202 1.1 dyoung struct ixgbe_rx_buf *rxbuf;
4203 1.1 dyoung #ifdef LRO
4204 1.14.2.4 riz struct ifnet *ifp;
4205 1.1 dyoung struct lro_ctrl *lro = &rxr->lro;
4206 1.1 dyoung #endif /* LRO */
4207 1.1 dyoung int rsize, error = 0;
4208 1.14.2.3 martin #ifdef DEV_NETMAP
4209 1.14.2.3 martin struct netmap_adapter *na = NA(rxr->adapter->ifp);
4210 1.14.2.3 martin struct netmap_slot *slot;
4211 1.14.2.3 martin #endif /* DEV_NETMAP */
4212 1.1 dyoung
4213 1.1 dyoung adapter = rxr->adapter;
4214 1.14.2.4 riz #ifdef LRO
4215 1.1 dyoung ifp = adapter->ifp;
4216 1.14.2.4 riz #endif /* LRO */
4217 1.1 dyoung
4218 1.1 dyoung /* Clear the ring contents */
4219 1.1 dyoung IXGBE_RX_LOCK(rxr);
4220 1.14.2.3 martin #ifdef DEV_NETMAP
4221 1.14.2.3 martin /* same as in ixgbe_setup_transmit_ring() */
4222 1.14.2.3 martin slot = netmap_reset(na, NR_RX, rxr->me, 0);
4223 1.14.2.3 martin #endif /* DEV_NETMAP */
4224 1.1 dyoung rsize = roundup2(adapter->num_rx_desc *
4225 1.1 dyoung sizeof(union ixgbe_adv_rx_desc), DBA_ALIGN);
4226 1.1 dyoung bzero((void *)rxr->rx_base, rsize);
4227 1.14.2.5 riz /* Cache the size */
4228 1.14.2.5 riz rxr->mbuf_sz = adapter->rx_mbuf_sz;
4229 1.1 dyoung
4230 1.1 dyoung /* Free current RX buffer structs and their mbufs */
4231 1.1 dyoung ixgbe_free_receive_ring(rxr);
4232 1.1 dyoung
4233 1.14.2.2 martin IXGBE_RX_UNLOCK(rxr);
4234 1.14.2.2 martin
4235 1.1 dyoung /* Now reinitialize our supply of jumbo mbufs. The number
4236 1.1 dyoung * or size of jumbo mbufs may have changed.
4237 1.1 dyoung */
4238 1.14.2.5 riz ixgbe_jcl_reinit(&adapter->jcl_head, rxr->ptag->dt_dmat,
4239 1.1 dyoung 2 * adapter->num_rx_desc, adapter->rx_mbuf_sz);
4240 1.1 dyoung
4241 1.14.2.2 martin IXGBE_RX_LOCK(rxr);
4242 1.14.2.2 martin
4243 1.1 dyoung /* Now replenish the mbufs */
4244 1.14.2.5 riz for (int j = 0; j != rxr->num_desc; ++j) {
4245 1.14.2.4 riz struct mbuf *mp;
4246 1.1 dyoung
4247 1.1 dyoung rxbuf = &rxr->rx_buffers[j];
4248 1.14.2.3 martin #ifdef DEV_NETMAP
4249 1.14.2.3 martin /*
4250 1.14.2.3 martin * In netmap mode, fill the map and set the buffer
4251 1.14.2.3 martin * address in the NIC ring, considering the offset
4252 1.14.2.3 martin * between the netmap and NIC rings (see comment in
4253 1.14.2.3 martin * ixgbe_setup_transmit_ring() ). No need to allocate
4254 1.14.2.3 martin * an mbuf, so end the block with a continue;
4255 1.14.2.3 martin */
4256 1.14.2.3 martin if (slot) {
4257 1.14.2.4 riz int sj = netmap_idx_n2k(&na->rx_rings[rxr->me], j);
4258 1.14.2.3 martin uint64_t paddr;
4259 1.14.2.3 martin void *addr;
4260 1.14.2.3 martin
4261 1.14.2.3 martin addr = PNMB(slot + sj, &paddr);
4262 1.14.2.5 riz netmap_load_map(rxr->ptag, rxbuf->pmap, addr);
4263 1.14.2.3 martin /* Update descriptor */
4264 1.14.2.3 martin rxr->rx_base[j].read.pkt_addr = htole64(paddr);
4265 1.14.2.3 martin continue;
4266 1.14.2.3 martin }
4267 1.14.2.3 martin #endif /* DEV_NETMAP */
4268 1.14.2.5 riz rxbuf->buf = ixgbe_getjcl(&adapter->jcl_head, M_NOWAIT,
4269 1.1 dyoung MT_DATA, M_PKTHDR, adapter->rx_mbuf_sz);
4270 1.14.2.4 riz if (rxbuf->buf == NULL) {
4271 1.1 dyoung error = ENOBUFS;
4272 1.1 dyoung goto fail;
4273 1.1 dyoung }
4274 1.14.2.4 riz mp = rxbuf->buf;
4275 1.14.2.5 riz mp->m_pkthdr.len = mp->m_len = rxr->mbuf_sz;
4276 1.1 dyoung /* Get the memory mapping */
4277 1.14.2.5 riz error = bus_dmamap_load_mbuf(rxr->ptag->dt_dmat,
4278 1.14.2.5 riz rxbuf->pmap, mp, BUS_DMA_NOWAIT);
4279 1.1 dyoung if (error != 0)
4280 1.1 dyoung goto fail;
4281 1.14.2.5 riz bus_dmamap_sync(rxr->ptag->dt_dmat, rxbuf->pmap,
4282 1.1 dyoung 0, adapter->rx_mbuf_sz, BUS_DMASYNC_PREREAD);
4283 1.1 dyoung /* Update descriptor */
4284 1.1 dyoung rxr->rx_base[j].read.pkt_addr =
4285 1.14.2.5 riz htole64(rxbuf->pmap->dm_segs[0].ds_addr);
4286 1.1 dyoung }
4287 1.1 dyoung
4288 1.1 dyoung
4289 1.1 dyoung /* Setup our descriptor indices */
4290 1.1 dyoung rxr->next_to_check = 0;
4291 1.1 dyoung rxr->next_to_refresh = 0;
4292 1.1 dyoung rxr->lro_enabled = FALSE;
4293 1.14.2.4 riz rxr->rx_copies.ev_count = 0;
4294 1.1 dyoung rxr->rx_bytes.ev_count = 0;
4295 1.1 dyoung rxr->discard = FALSE;
4296 1.14.2.4 riz rxr->vtag_strip = FALSE;
4297 1.1 dyoung
4298 1.1 dyoung ixgbe_dmamap_sync(rxr->rxdma.dma_tag, rxr->rxdma.dma_map,
4299 1.1 dyoung BUS_DMASYNC_PREREAD | BUS_DMASYNC_PREWRITE);
4300 1.1 dyoung
4301 1.1 dyoung /*
4302 1.1 dyoung ** Now set up the LRO interface:
4303 1.1 dyoung */
4304 1.14.2.4 riz if (ixgbe_rsc_enable)
4305 1.1 dyoung ixgbe_setup_hw_rsc(rxr);
4306 1.1 dyoung #ifdef LRO
4307 1.1 dyoung else if (ifp->if_capenable & IFCAP_LRO) {
4308 1.9 skrll device_t dev = adapter->dev;
4309 1.1 dyoung int err = tcp_lro_init(lro);
4310 1.1 dyoung if (err) {
4311 1.1 dyoung device_printf(dev, "LRO Initialization failed!\n");
4312 1.1 dyoung goto fail;
4313 1.1 dyoung }
4314 1.1 dyoung INIT_DEBUGOUT("RX Soft LRO Initialized\n");
4315 1.1 dyoung rxr->lro_enabled = TRUE;
4316 1.1 dyoung lro->ifp = adapter->ifp;
4317 1.1 dyoung }
4318 1.1 dyoung #endif /* LRO */
4319 1.1 dyoung
4320 1.1 dyoung IXGBE_RX_UNLOCK(rxr);
4321 1.1 dyoung return (0);
4322 1.1 dyoung
4323 1.1 dyoung fail:
4324 1.1 dyoung ixgbe_free_receive_ring(rxr);
4325 1.1 dyoung IXGBE_RX_UNLOCK(rxr);
4326 1.1 dyoung return (error);
4327 1.1 dyoung }
4328 1.1 dyoung
4329 1.1 dyoung /*********************************************************************
4330 1.1 dyoung *
4331 1.1 dyoung * Initialize all receive rings.
4332 1.1 dyoung *
4333 1.1 dyoung **********************************************************************/
4334 1.1 dyoung static int
4335 1.1 dyoung ixgbe_setup_receive_structures(struct adapter *adapter)
4336 1.1 dyoung {
4337 1.1 dyoung struct rx_ring *rxr = adapter->rx_rings;
4338 1.1 dyoung int j;
4339 1.1 dyoung
4340 1.1 dyoung for (j = 0; j < adapter->num_queues; j++, rxr++)
4341 1.1 dyoung if (ixgbe_setup_receive_ring(rxr))
4342 1.1 dyoung goto fail;
4343 1.1 dyoung
4344 1.1 dyoung return (0);
4345 1.1 dyoung fail:
4346 1.1 dyoung /*
4347 1.1 dyoung * Free RX buffers allocated so far, we will only handle
4348 1.1 dyoung * the rings that completed, the failing case will have
4349 1.1 dyoung * cleaned up for itself. 'j' failed, so its the terminus.
4350 1.1 dyoung */
4351 1.1 dyoung for (int i = 0; i < j; ++i) {
4352 1.1 dyoung rxr = &adapter->rx_rings[i];
4353 1.1 dyoung ixgbe_free_receive_ring(rxr);
4354 1.1 dyoung }
4355 1.1 dyoung
4356 1.1 dyoung return (ENOBUFS);
4357 1.1 dyoung }
4358 1.1 dyoung
4359 1.1 dyoung /*********************************************************************
4360 1.1 dyoung *
4361 1.1 dyoung * Setup receive registers and features.
4362 1.1 dyoung *
4363 1.1 dyoung **********************************************************************/
4364 1.1 dyoung #define IXGBE_SRRCTL_BSIZEHDRSIZE_SHIFT 2
4365 1.1 dyoung
4366 1.14.2.3 martin #define BSIZEPKT_ROUNDUP ((1<<IXGBE_SRRCTL_BSIZEPKT_SHIFT)-1)
4367 1.14.2.3 martin
4368 1.1 dyoung static void
4369 1.1 dyoung ixgbe_initialize_receive_units(struct adapter *adapter)
4370 1.1 dyoung {
4371 1.1 dyoung int i;
4372 1.1 dyoung struct rx_ring *rxr = adapter->rx_rings;
4373 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
4374 1.1 dyoung struct ifnet *ifp = adapter->ifp;
4375 1.1 dyoung u32 bufsz, rxctrl, fctrl, srrctl, rxcsum;
4376 1.1 dyoung u32 reta, mrqc = 0, hlreg, r[10];
4377 1.1 dyoung
4378 1.1 dyoung
4379 1.1 dyoung /*
4380 1.1 dyoung * Make sure receives are disabled while
4381 1.1 dyoung * setting up the descriptor ring
4382 1.1 dyoung */
4383 1.1 dyoung rxctrl = IXGBE_READ_REG(hw, IXGBE_RXCTRL);
4384 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_RXCTRL,
4385 1.1 dyoung rxctrl & ~IXGBE_RXCTRL_RXEN);
4386 1.1 dyoung
4387 1.1 dyoung /* Enable broadcasts */
4388 1.1 dyoung fctrl = IXGBE_READ_REG(hw, IXGBE_FCTRL);
4389 1.1 dyoung fctrl |= IXGBE_FCTRL_BAM;
4390 1.1 dyoung fctrl |= IXGBE_FCTRL_DPF;
4391 1.1 dyoung fctrl |= IXGBE_FCTRL_PMCF;
4392 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_FCTRL, fctrl);
4393 1.1 dyoung
4394 1.1 dyoung /* Set for Jumbo Frames? */
4395 1.1 dyoung hlreg = IXGBE_READ_REG(hw, IXGBE_HLREG0);
4396 1.1 dyoung if (ifp->if_mtu > ETHERMTU)
4397 1.1 dyoung hlreg |= IXGBE_HLREG0_JUMBOEN;
4398 1.1 dyoung else
4399 1.1 dyoung hlreg &= ~IXGBE_HLREG0_JUMBOEN;
4400 1.14.2.4 riz #ifdef DEV_NETMAP
4401 1.14.2.4 riz /* crcstrip is conditional in netmap (in RDRXCTL too ?) */
4402 1.14.2.4 riz if (ifp->if_capenable & IFCAP_NETMAP && !ix_crcstrip)
4403 1.14.2.4 riz hlreg &= ~IXGBE_HLREG0_RXCRCSTRP;
4404 1.14.2.4 riz else
4405 1.14.2.4 riz hlreg |= IXGBE_HLREG0_RXCRCSTRP;
4406 1.14.2.4 riz #endif /* DEV_NETMAP */
4407 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_HLREG0, hlreg);
4408 1.1 dyoung
4409 1.14.2.4 riz bufsz = (adapter->rx_mbuf_sz +
4410 1.14.2.4 riz BSIZEPKT_ROUNDUP) >> IXGBE_SRRCTL_BSIZEPKT_SHIFT;
4411 1.1 dyoung
4412 1.1 dyoung for (i = 0; i < adapter->num_queues; i++, rxr++) {
4413 1.1 dyoung u64 rdba = rxr->rxdma.dma_paddr;
4414 1.1 dyoung
4415 1.1 dyoung /* Setup the Base and Length of the Rx Descriptor Ring */
4416 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_RDBAL(i),
4417 1.1 dyoung (rdba & 0x00000000ffffffffULL));
4418 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_RDBAH(i), (rdba >> 32));
4419 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_RDLEN(i),
4420 1.1 dyoung adapter->num_rx_desc * sizeof(union ixgbe_adv_rx_desc));
4421 1.1 dyoung
4422 1.1 dyoung /* Set up the SRRCTL register */
4423 1.1 dyoung srrctl = IXGBE_READ_REG(hw, IXGBE_SRRCTL(i));
4424 1.1 dyoung srrctl &= ~IXGBE_SRRCTL_BSIZEHDR_MASK;
4425 1.1 dyoung srrctl &= ~IXGBE_SRRCTL_BSIZEPKT_MASK;
4426 1.1 dyoung srrctl |= bufsz;
4427 1.14.2.4 riz srrctl |= IXGBE_SRRCTL_DESCTYPE_ADV_ONEBUF;
4428 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_SRRCTL(i), srrctl);
4429 1.1 dyoung
4430 1.1 dyoung /* Setup the HW Rx Head and Tail Descriptor Pointers */
4431 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_RDH(i), 0);
4432 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_RDT(i), 0);
4433 1.14.2.5 riz
4434 1.14.2.5 riz /* Set the processing limit */
4435 1.14.2.5 riz rxr->process_limit = ixgbe_rx_process_limit;
4436 1.1 dyoung }
4437 1.1 dyoung
4438 1.1 dyoung if (adapter->hw.mac.type != ixgbe_mac_82598EB) {
4439 1.1 dyoung u32 psrtype = IXGBE_PSRTYPE_TCPHDR |
4440 1.1 dyoung IXGBE_PSRTYPE_UDPHDR |
4441 1.1 dyoung IXGBE_PSRTYPE_IPV4HDR |
4442 1.1 dyoung IXGBE_PSRTYPE_IPV6HDR;
4443 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_PSRTYPE(0), psrtype);
4444 1.1 dyoung }
4445 1.1 dyoung
4446 1.1 dyoung rxcsum = IXGBE_READ_REG(hw, IXGBE_RXCSUM);
4447 1.1 dyoung
4448 1.1 dyoung /* Setup RSS */
4449 1.1 dyoung if (adapter->num_queues > 1) {
4450 1.1 dyoung int j;
4451 1.1 dyoung reta = 0;
4452 1.1 dyoung
4453 1.1 dyoung /* set up random bits */
4454 1.2 tls cprng_fast(&r, sizeof(r));
4455 1.1 dyoung
4456 1.1 dyoung /* Set up the redirection table */
4457 1.1 dyoung for (i = 0, j = 0; i < 128; i++, j++) {
4458 1.1 dyoung if (j == adapter->num_queues) j = 0;
4459 1.1 dyoung reta = (reta << 8) | (j * 0x11);
4460 1.1 dyoung if ((i & 3) == 3)
4461 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_RETA(i >> 2), reta);
4462 1.1 dyoung }
4463 1.1 dyoung
4464 1.1 dyoung /* Now fill our hash function seeds */
4465 1.1 dyoung for (i = 0; i < 10; i++)
4466 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_RSSRK(i), r[i]);
4467 1.1 dyoung
4468 1.1 dyoung /* Perform hash on these packet types */
4469 1.1 dyoung mrqc = IXGBE_MRQC_RSSEN
4470 1.1 dyoung | IXGBE_MRQC_RSS_FIELD_IPV4
4471 1.1 dyoung | IXGBE_MRQC_RSS_FIELD_IPV4_TCP
4472 1.1 dyoung | IXGBE_MRQC_RSS_FIELD_IPV4_UDP
4473 1.1 dyoung | IXGBE_MRQC_RSS_FIELD_IPV6_EX_TCP
4474 1.1 dyoung | IXGBE_MRQC_RSS_FIELD_IPV6_EX
4475 1.1 dyoung | IXGBE_MRQC_RSS_FIELD_IPV6
4476 1.1 dyoung | IXGBE_MRQC_RSS_FIELD_IPV6_TCP
4477 1.1 dyoung | IXGBE_MRQC_RSS_FIELD_IPV6_UDP
4478 1.1 dyoung | IXGBE_MRQC_RSS_FIELD_IPV6_EX_UDP;
4479 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_MRQC, mrqc);
4480 1.1 dyoung
4481 1.1 dyoung /* RSS and RX IPP Checksum are mutually exclusive */
4482 1.1 dyoung rxcsum |= IXGBE_RXCSUM_PCSD;
4483 1.1 dyoung }
4484 1.1 dyoung
4485 1.1 dyoung if (ifp->if_capenable & IFCAP_RXCSUM)
4486 1.1 dyoung rxcsum |= IXGBE_RXCSUM_PCSD;
4487 1.1 dyoung
4488 1.1 dyoung if (!(rxcsum & IXGBE_RXCSUM_PCSD))
4489 1.1 dyoung rxcsum |= IXGBE_RXCSUM_IPPCSE;
4490 1.1 dyoung
4491 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_RXCSUM, rxcsum);
4492 1.1 dyoung
4493 1.1 dyoung return;
4494 1.1 dyoung }
4495 1.1 dyoung
4496 1.1 dyoung /*********************************************************************
4497 1.1 dyoung *
4498 1.1 dyoung * Free all receive rings.
4499 1.1 dyoung *
4500 1.1 dyoung **********************************************************************/
4501 1.1 dyoung static void
4502 1.1 dyoung ixgbe_free_receive_structures(struct adapter *adapter)
4503 1.1 dyoung {
4504 1.1 dyoung struct rx_ring *rxr = adapter->rx_rings;
4505 1.1 dyoung
4506 1.1 dyoung for (int i = 0; i < adapter->num_queues; i++, rxr++) {
4507 1.1 dyoung #ifdef LRO
4508 1.1 dyoung struct lro_ctrl *lro = &rxr->lro;
4509 1.1 dyoung #endif /* LRO */
4510 1.1 dyoung ixgbe_free_receive_buffers(rxr);
4511 1.1 dyoung #ifdef LRO
4512 1.1 dyoung /* Free LRO memory */
4513 1.1 dyoung tcp_lro_free(lro);
4514 1.1 dyoung #endif /* LRO */
4515 1.1 dyoung /* Free the ring memory as well */
4516 1.1 dyoung ixgbe_dma_free(adapter, &rxr->rxdma);
4517 1.14.2.2 martin IXGBE_RX_LOCK_DESTROY(rxr);
4518 1.1 dyoung }
4519 1.1 dyoung
4520 1.1 dyoung free(adapter->rx_rings, M_DEVBUF);
4521 1.1 dyoung }
4522 1.1 dyoung
4523 1.1 dyoung
4524 1.1 dyoung /*********************************************************************
4525 1.1 dyoung *
4526 1.1 dyoung * Free receive ring data structures
4527 1.1 dyoung *
4528 1.1 dyoung **********************************************************************/
4529 1.1 dyoung static void
4530 1.1 dyoung ixgbe_free_receive_buffers(struct rx_ring *rxr)
4531 1.1 dyoung {
4532 1.1 dyoung struct adapter *adapter = rxr->adapter;
4533 1.1 dyoung struct ixgbe_rx_buf *rxbuf;
4534 1.1 dyoung
4535 1.1 dyoung INIT_DEBUGOUT("free_receive_structures: begin");
4536 1.1 dyoung
4537 1.1 dyoung /* Cleanup any existing buffers */
4538 1.1 dyoung if (rxr->rx_buffers != NULL) {
4539 1.1 dyoung for (int i = 0; i < adapter->num_rx_desc; i++) {
4540 1.1 dyoung rxbuf = &rxr->rx_buffers[i];
4541 1.14.2.4 riz if (rxbuf->buf != NULL) {
4542 1.14.2.5 riz bus_dmamap_sync(rxr->ptag->dt_dmat,
4543 1.14.2.5 riz rxbuf->pmap, 0, rxbuf->buf->m_pkthdr.len,
4544 1.1 dyoung BUS_DMASYNC_POSTREAD);
4545 1.14.2.5 riz ixgbe_dmamap_unload(rxr->ptag, rxbuf->pmap);
4546 1.14.2.4 riz rxbuf->buf->m_flags |= M_PKTHDR;
4547 1.14.2.4 riz m_freem(rxbuf->buf);
4548 1.1 dyoung }
4549 1.14.2.4 riz rxbuf->buf = NULL;
4550 1.14.2.5 riz if (rxbuf->pmap != NULL) {
4551 1.14.2.5 riz ixgbe_dmamap_destroy(rxr->ptag, rxbuf->pmap);
4552 1.14.2.5 riz rxbuf->pmap = NULL;
4553 1.1 dyoung }
4554 1.1 dyoung }
4555 1.1 dyoung if (rxr->rx_buffers != NULL) {
4556 1.1 dyoung free(rxr->rx_buffers, M_DEVBUF);
4557 1.1 dyoung rxr->rx_buffers = NULL;
4558 1.1 dyoung }
4559 1.1 dyoung }
4560 1.1 dyoung
4561 1.14.2.5 riz if (rxr->ptag != NULL) {
4562 1.14.2.5 riz ixgbe_dma_tag_destroy(rxr->ptag);
4563 1.14.2.5 riz rxr->ptag = NULL;
4564 1.1 dyoung }
4565 1.1 dyoung
4566 1.1 dyoung return;
4567 1.1 dyoung }
4568 1.1 dyoung
4569 1.1 dyoung static __inline void
4570 1.1 dyoung ixgbe_rx_input(struct rx_ring *rxr, struct ifnet *ifp, struct mbuf *m, u32 ptype)
4571 1.1 dyoung {
4572 1.1 dyoung int s;
4573 1.1 dyoung
4574 1.9 skrll #ifdef LRO
4575 1.9 skrll struct adapter *adapter = ifp->if_softc;
4576 1.9 skrll struct ethercom *ec = &adapter->osdep.ec;
4577 1.1 dyoung
4578 1.1 dyoung /*
4579 1.14.2.4 riz * ATM LRO is only for IP/TCP packets and TCP checksum of the packet
4580 1.1 dyoung * should be computed by hardware. Also it should not have VLAN tag in
4581 1.14.2.4 riz * ethernet header. In case of IPv6 we do not yet support ext. hdrs.
4582 1.1 dyoung */
4583 1.1 dyoung if (rxr->lro_enabled &&
4584 1.1 dyoung (ec->ec_capenable & ETHERCAP_VLAN_HWTAGGING) != 0 &&
4585 1.1 dyoung (ptype & IXGBE_RXDADV_PKTTYPE_ETQF) == 0 &&
4586 1.14.2.4 riz ((ptype & (IXGBE_RXDADV_PKTTYPE_IPV4 | IXGBE_RXDADV_PKTTYPE_TCP)) ==
4587 1.14.2.4 riz (IXGBE_RXDADV_PKTTYPE_IPV4 | IXGBE_RXDADV_PKTTYPE_TCP) ||
4588 1.14.2.4 riz (ptype & (IXGBE_RXDADV_PKTTYPE_IPV6 | IXGBE_RXDADV_PKTTYPE_TCP)) ==
4589 1.14.2.4 riz (IXGBE_RXDADV_PKTTYPE_IPV6 | IXGBE_RXDADV_PKTTYPE_TCP)) &&
4590 1.1 dyoung (m->m_pkthdr.csum_flags & (CSUM_DATA_VALID | CSUM_PSEUDO_HDR)) ==
4591 1.1 dyoung (CSUM_DATA_VALID | CSUM_PSEUDO_HDR)) {
4592 1.1 dyoung /*
4593 1.1 dyoung * Send to the stack if:
4594 1.1 dyoung ** - LRO not enabled, or
4595 1.1 dyoung ** - no LRO resources, or
4596 1.1 dyoung ** - lro enqueue fails
4597 1.1 dyoung */
4598 1.1 dyoung if (rxr->lro.lro_cnt != 0)
4599 1.1 dyoung if (tcp_lro_rx(&rxr->lro, m, 0) == 0)
4600 1.1 dyoung return;
4601 1.1 dyoung }
4602 1.1 dyoung #endif /* LRO */
4603 1.1 dyoung
4604 1.1 dyoung IXGBE_RX_UNLOCK(rxr);
4605 1.1 dyoung
4606 1.1 dyoung s = splnet();
4607 1.1 dyoung /* Pass this up to any BPF listeners. */
4608 1.1 dyoung bpf_mtap(ifp, m);
4609 1.1 dyoung (*ifp->if_input)(ifp, m);
4610 1.1 dyoung splx(s);
4611 1.1 dyoung
4612 1.1 dyoung IXGBE_RX_LOCK(rxr);
4613 1.1 dyoung }
4614 1.1 dyoung
4615 1.1 dyoung static __inline void
4616 1.1 dyoung ixgbe_rx_discard(struct rx_ring *rxr, int i)
4617 1.1 dyoung {
4618 1.1 dyoung struct ixgbe_rx_buf *rbuf;
4619 1.1 dyoung
4620 1.1 dyoung rbuf = &rxr->rx_buffers[i];
4621 1.1 dyoung
4622 1.1 dyoung if (rbuf->fmp != NULL) {/* Partial chain ? */
4623 1.1 dyoung rbuf->fmp->m_flags |= M_PKTHDR;
4624 1.1 dyoung m_freem(rbuf->fmp);
4625 1.1 dyoung rbuf->fmp = NULL;
4626 1.1 dyoung }
4627 1.1 dyoung
4628 1.1 dyoung /*
4629 1.1 dyoung ** With advanced descriptors the writeback
4630 1.1 dyoung ** clobbers the buffer addrs, so its easier
4631 1.1 dyoung ** to just free the existing mbufs and take
4632 1.1 dyoung ** the normal refresh path to get new buffers
4633 1.1 dyoung ** and mapping.
4634 1.1 dyoung */
4635 1.14.2.4 riz if (rbuf->buf) {
4636 1.14.2.4 riz m_free(rbuf->buf);
4637 1.14.2.4 riz rbuf->buf = NULL;
4638 1.1 dyoung }
4639 1.1 dyoung
4640 1.1 dyoung return;
4641 1.1 dyoung }
4642 1.1 dyoung
4643 1.1 dyoung
4644 1.1 dyoung /*********************************************************************
4645 1.1 dyoung *
4646 1.1 dyoung * This routine executes in interrupt context. It replenishes
4647 1.1 dyoung * the mbufs in the descriptor and sends data which has been
4648 1.1 dyoung * dma'ed into host memory to upper layer.
4649 1.1 dyoung *
4650 1.1 dyoung * We loop at most count times if count is > 0, or until done if
4651 1.1 dyoung * count < 0.
4652 1.1 dyoung *
4653 1.1 dyoung * Return TRUE for more work, FALSE for all clean.
4654 1.1 dyoung *********************************************************************/
4655 1.1 dyoung static bool
4656 1.14.2.5 riz ixgbe_rxeof(struct ix_queue *que)
4657 1.1 dyoung {
4658 1.1 dyoung struct adapter *adapter = que->adapter;
4659 1.1 dyoung struct rx_ring *rxr = que->rxr;
4660 1.1 dyoung struct ifnet *ifp = adapter->ifp;
4661 1.1 dyoung #ifdef LRO
4662 1.1 dyoung struct lro_ctrl *lro = &rxr->lro;
4663 1.1 dyoung struct lro_entry *queued;
4664 1.1 dyoung #endif /* LRO */
4665 1.1 dyoung int i, nextp, processed = 0;
4666 1.1 dyoung u32 staterr = 0;
4667 1.14.2.5 riz u16 count = rxr->process_limit;
4668 1.1 dyoung union ixgbe_adv_rx_desc *cur;
4669 1.1 dyoung struct ixgbe_rx_buf *rbuf, *nbuf;
4670 1.1 dyoung
4671 1.1 dyoung IXGBE_RX_LOCK(rxr);
4672 1.1 dyoung
4673 1.14.2.3 martin #ifdef DEV_NETMAP
4674 1.14.2.5 riz /* Same as the txeof routine: wakeup clients on intr. */
4675 1.14.2.5 riz if (netmap_rx_irq(ifp, rxr->me | NETMAP_LOCKED_ENTER, &processed))
4676 1.14.2.3 martin return (FALSE);
4677 1.14.2.3 martin #endif /* DEV_NETMAP */
4678 1.1 dyoung for (i = rxr->next_to_check; count != 0;) {
4679 1.14.2.4 riz struct mbuf *sendmp, *mp;
4680 1.1 dyoung u32 rsc, ptype;
4681 1.14.2.4 riz u16 len;
4682 1.14.2.4 riz u16 vtag = 0;
4683 1.1 dyoung bool eop;
4684 1.1 dyoung
4685 1.1 dyoung /* Sync the ring. */
4686 1.1 dyoung ixgbe_dmamap_sync(rxr->rxdma.dma_tag, rxr->rxdma.dma_map,
4687 1.1 dyoung BUS_DMASYNC_POSTREAD | BUS_DMASYNC_POSTWRITE);
4688 1.1 dyoung
4689 1.1 dyoung cur = &rxr->rx_base[i];
4690 1.1 dyoung staterr = le32toh(cur->wb.upper.status_error);
4691 1.1 dyoung
4692 1.1 dyoung if ((staterr & IXGBE_RXD_STAT_DD) == 0)
4693 1.1 dyoung break;
4694 1.1 dyoung if ((ifp->if_flags & IFF_RUNNING) == 0)
4695 1.1 dyoung break;
4696 1.1 dyoung
4697 1.1 dyoung count--;
4698 1.1 dyoung sendmp = NULL;
4699 1.1 dyoung nbuf = NULL;
4700 1.1 dyoung rsc = 0;
4701 1.1 dyoung cur->wb.upper.status_error = 0;
4702 1.1 dyoung rbuf = &rxr->rx_buffers[i];
4703 1.14.2.4 riz mp = rbuf->buf;
4704 1.1 dyoung
4705 1.14.2.4 riz len = le16toh(cur->wb.upper.length);
4706 1.1 dyoung ptype = le32toh(cur->wb.lower.lo_dword.data) &
4707 1.1 dyoung IXGBE_RXDADV_PKTTYPE_MASK;
4708 1.1 dyoung eop = ((staterr & IXGBE_RXD_STAT_EOP) != 0);
4709 1.1 dyoung
4710 1.1 dyoung /* Make sure bad packets are discarded */
4711 1.1 dyoung if (((staterr & IXGBE_RXDADV_ERR_FRAME_ERR_MASK) != 0) ||
4712 1.1 dyoung (rxr->discard)) {
4713 1.1 dyoung rxr->rx_discarded.ev_count++;
4714 1.1 dyoung if (eop)
4715 1.1 dyoung rxr->discard = FALSE;
4716 1.1 dyoung else
4717 1.1 dyoung rxr->discard = TRUE;
4718 1.1 dyoung ixgbe_rx_discard(rxr, i);
4719 1.1 dyoung goto next_desc;
4720 1.1 dyoung }
4721 1.1 dyoung
4722 1.1 dyoung /*
4723 1.1 dyoung ** On 82599 which supports a hardware
4724 1.1 dyoung ** LRO (called HW RSC), packets need
4725 1.1 dyoung ** not be fragmented across sequential
4726 1.1 dyoung ** descriptors, rather the next descriptor
4727 1.1 dyoung ** is indicated in bits of the descriptor.
4728 1.1 dyoung ** This also means that we might proceses
4729 1.1 dyoung ** more than one packet at a time, something
4730 1.1 dyoung ** that has never been true before, it
4731 1.1 dyoung ** required eliminating global chain pointers
4732 1.1 dyoung ** in favor of what we are doing here. -jfv
4733 1.1 dyoung */
4734 1.1 dyoung if (!eop) {
4735 1.1 dyoung /*
4736 1.1 dyoung ** Figure out the next descriptor
4737 1.1 dyoung ** of this frame.
4738 1.1 dyoung */
4739 1.1 dyoung if (rxr->hw_rsc == TRUE) {
4740 1.1 dyoung rsc = ixgbe_rsc_count(cur);
4741 1.1 dyoung rxr->rsc_num += (rsc - 1);
4742 1.1 dyoung }
4743 1.1 dyoung if (rsc) { /* Get hardware index */
4744 1.1 dyoung nextp = ((staterr &
4745 1.1 dyoung IXGBE_RXDADV_NEXTP_MASK) >>
4746 1.1 dyoung IXGBE_RXDADV_NEXTP_SHIFT);
4747 1.1 dyoung } else { /* Just sequential */
4748 1.1 dyoung nextp = i + 1;
4749 1.1 dyoung if (nextp == adapter->num_rx_desc)
4750 1.1 dyoung nextp = 0;
4751 1.1 dyoung }
4752 1.1 dyoung nbuf = &rxr->rx_buffers[nextp];
4753 1.1 dyoung prefetch(nbuf);
4754 1.1 dyoung }
4755 1.1 dyoung /*
4756 1.1 dyoung ** Rather than using the fmp/lmp global pointers
4757 1.1 dyoung ** we now keep the head of a packet chain in the
4758 1.1 dyoung ** buffer struct and pass this along from one
4759 1.1 dyoung ** descriptor to the next, until we get EOP.
4760 1.1 dyoung */
4761 1.14.2.4 riz mp->m_len = len;
4762 1.14.2.4 riz /*
4763 1.14.2.4 riz ** See if there is a stored head
4764 1.14.2.4 riz ** that determines what we are
4765 1.14.2.4 riz */
4766 1.14.2.4 riz sendmp = rbuf->fmp;
4767 1.14.2.4 riz
4768 1.14.2.4 riz if (sendmp != NULL) { /* secondary frag */
4769 1.14.2.4 riz rbuf->buf = rbuf->fmp = NULL;
4770 1.14.2.4 riz mp->m_flags &= ~M_PKTHDR;
4771 1.14.2.4 riz sendmp->m_pkthdr.len += mp->m_len;
4772 1.1 dyoung } else {
4773 1.1 dyoung /*
4774 1.14.2.4 riz * Optimize. This might be a small packet,
4775 1.14.2.4 riz * maybe just a TCP ACK. Do a fast copy that
4776 1.14.2.4 riz * is cache aligned into a new mbuf, and
4777 1.14.2.4 riz * leave the old mbuf+cluster for re-use.
4778 1.14.2.4 riz */
4779 1.14.2.4 riz if (eop && len <= IXGBE_RX_COPY_LEN) {
4780 1.14.2.5 riz sendmp = m_gethdr(M_NOWAIT, MT_DATA);
4781 1.14.2.4 riz if (sendmp != NULL) {
4782 1.14.2.4 riz sendmp->m_data +=
4783 1.14.2.4 riz IXGBE_RX_COPY_ALIGN;
4784 1.14.2.4 riz ixgbe_bcopy(mp->m_data,
4785 1.14.2.4 riz sendmp->m_data, len);
4786 1.14.2.4 riz sendmp->m_len = len;
4787 1.14.2.4 riz rxr->rx_copies.ev_count++;
4788 1.14.2.4 riz rbuf->flags |= IXGBE_RX_COPY;
4789 1.1 dyoung }
4790 1.1 dyoung }
4791 1.14.2.4 riz if (sendmp == NULL) {
4792 1.14.2.4 riz rbuf->buf = rbuf->fmp = NULL;
4793 1.14.2.4 riz sendmp = mp;
4794 1.14.2.4 riz }
4795 1.14.2.4 riz
4796 1.14.2.4 riz /* first desc of a non-ps chain */
4797 1.14.2.4 riz sendmp->m_flags |= M_PKTHDR;
4798 1.14.2.4 riz sendmp->m_pkthdr.len = mp->m_len;
4799 1.1 dyoung }
4800 1.1 dyoung ++processed;
4801 1.14.2.4 riz /* Pass the head pointer on */
4802 1.14.2.4 riz if (eop == 0) {
4803 1.14.2.4 riz nbuf->fmp = sendmp;
4804 1.14.2.4 riz sendmp = NULL;
4805 1.14.2.4 riz mp->m_next = nbuf->buf;
4806 1.14.2.4 riz } else { /* Sending this frame */
4807 1.1 dyoung sendmp->m_pkthdr.rcvif = ifp;
4808 1.1 dyoung ifp->if_ipackets++;
4809 1.1 dyoung rxr->rx_packets.ev_count++;
4810 1.1 dyoung /* capture data for AIM */
4811 1.1 dyoung rxr->bytes += sendmp->m_pkthdr.len;
4812 1.1 dyoung rxr->rx_bytes.ev_count += sendmp->m_pkthdr.len;
4813 1.14.2.4 riz /* Process vlan info */
4814 1.14.2.4 riz if ((rxr->vtag_strip) &&
4815 1.14.2.4 riz (staterr & IXGBE_RXD_STAT_VP))
4816 1.14.2.4 riz vtag = le16toh(cur->wb.upper.vlan);
4817 1.14.2.4 riz if (vtag) {
4818 1.14.2.4 riz VLAN_INPUT_TAG(ifp, sendmp, vtag,
4819 1.14.2.4 riz printf("%s: could not apply VLAN "
4820 1.14.2.4 riz "tag", __func__));
4821 1.14.2.4 riz }
4822 1.1 dyoung if ((ifp->if_capenable & IFCAP_RXCSUM) != 0) {
4823 1.1 dyoung ixgbe_rx_checksum(staterr, sendmp, ptype,
4824 1.1 dyoung &adapter->stats);
4825 1.1 dyoung }
4826 1.1 dyoung #if __FreeBSD_version >= 800000
4827 1.1 dyoung sendmp->m_pkthdr.flowid = que->msix;
4828 1.1 dyoung sendmp->m_flags |= M_FLOWID;
4829 1.1 dyoung #endif
4830 1.1 dyoung }
4831 1.1 dyoung next_desc:
4832 1.1 dyoung ixgbe_dmamap_sync(rxr->rxdma.dma_tag, rxr->rxdma.dma_map,
4833 1.1 dyoung BUS_DMASYNC_PREREAD | BUS_DMASYNC_PREWRITE);
4834 1.1 dyoung
4835 1.1 dyoung /* Advance our pointers to the next descriptor. */
4836 1.14.2.5 riz if (++i == rxr->num_desc)
4837 1.1 dyoung i = 0;
4838 1.1 dyoung
4839 1.1 dyoung /* Now send to the stack or do LRO */
4840 1.1 dyoung if (sendmp != NULL) {
4841 1.1 dyoung rxr->next_to_check = i;
4842 1.1 dyoung ixgbe_rx_input(rxr, ifp, sendmp, ptype);
4843 1.1 dyoung i = rxr->next_to_check;
4844 1.1 dyoung }
4845 1.1 dyoung
4846 1.1 dyoung /* Every 8 descriptors we go to refresh mbufs */
4847 1.1 dyoung if (processed == 8) {
4848 1.1 dyoung ixgbe_refresh_mbufs(rxr, i);
4849 1.1 dyoung processed = 0;
4850 1.1 dyoung }
4851 1.1 dyoung }
4852 1.1 dyoung
4853 1.1 dyoung /* Refresh any remaining buf structs */
4854 1.1 dyoung if (ixgbe_rx_unrefreshed(rxr))
4855 1.1 dyoung ixgbe_refresh_mbufs(rxr, i);
4856 1.1 dyoung
4857 1.1 dyoung rxr->next_to_check = i;
4858 1.1 dyoung
4859 1.1 dyoung #ifdef LRO
4860 1.1 dyoung /*
4861 1.1 dyoung * Flush any outstanding LRO work
4862 1.1 dyoung */
4863 1.1 dyoung while ((queued = SLIST_FIRST(&lro->lro_active)) != NULL) {
4864 1.1 dyoung SLIST_REMOVE_HEAD(&lro->lro_active, next);
4865 1.1 dyoung tcp_lro_flush(lro, queued);
4866 1.1 dyoung }
4867 1.1 dyoung #endif /* LRO */
4868 1.1 dyoung
4869 1.1 dyoung IXGBE_RX_UNLOCK(rxr);
4870 1.1 dyoung
4871 1.1 dyoung /*
4872 1.1 dyoung ** We still have cleaning to do?
4873 1.1 dyoung ** Schedule another interrupt if so.
4874 1.1 dyoung */
4875 1.1 dyoung if ((staterr & IXGBE_RXD_STAT_DD) != 0) {
4876 1.13 christos ixgbe_rearm_queues(adapter, (u64)(1ULL << que->msix));
4877 1.1 dyoung return true;
4878 1.1 dyoung }
4879 1.1 dyoung
4880 1.1 dyoung return false;
4881 1.1 dyoung }
4882 1.1 dyoung
4883 1.1 dyoung
4884 1.1 dyoung /*********************************************************************
4885 1.1 dyoung *
4886 1.1 dyoung * Verify that the hardware indicated that the checksum is valid.
4887 1.1 dyoung * Inform the stack about the status of checksum so that stack
4888 1.1 dyoung * doesn't spend time verifying the checksum.
4889 1.1 dyoung *
4890 1.1 dyoung *********************************************************************/
4891 1.1 dyoung static void
4892 1.1 dyoung ixgbe_rx_checksum(u32 staterr, struct mbuf * mp, u32 ptype,
4893 1.1 dyoung struct ixgbe_hw_stats *stats)
4894 1.1 dyoung {
4895 1.1 dyoung u16 status = (u16) staterr;
4896 1.1 dyoung u8 errors = (u8) (staterr >> 24);
4897 1.9 skrll #if 0
4898 1.1 dyoung bool sctp = FALSE;
4899 1.1 dyoung
4900 1.1 dyoung if ((ptype & IXGBE_RXDADV_PKTTYPE_ETQF) == 0 &&
4901 1.1 dyoung (ptype & IXGBE_RXDADV_PKTTYPE_SCTP) != 0)
4902 1.1 dyoung sctp = TRUE;
4903 1.9 skrll #endif
4904 1.1 dyoung
4905 1.1 dyoung if (status & IXGBE_RXD_STAT_IPCS) {
4906 1.1 dyoung stats->ipcs.ev_count++;
4907 1.1 dyoung if (!(errors & IXGBE_RXD_ERR_IPE)) {
4908 1.1 dyoung /* IP Checksum Good */
4909 1.1 dyoung mp->m_pkthdr.csum_flags = M_CSUM_IPv4;
4910 1.1 dyoung
4911 1.1 dyoung } else {
4912 1.1 dyoung stats->ipcs_bad.ev_count++;
4913 1.1 dyoung mp->m_pkthdr.csum_flags = M_CSUM_IPv4|M_CSUM_IPv4_BAD;
4914 1.1 dyoung }
4915 1.1 dyoung }
4916 1.1 dyoung if (status & IXGBE_RXD_STAT_L4CS) {
4917 1.1 dyoung stats->l4cs.ev_count++;
4918 1.1 dyoung u16 type = M_CSUM_TCPv4|M_CSUM_TCPv6|M_CSUM_UDPv4|M_CSUM_UDPv6;
4919 1.1 dyoung if (!(errors & IXGBE_RXD_ERR_TCPE)) {
4920 1.1 dyoung mp->m_pkthdr.csum_flags |= type;
4921 1.1 dyoung } else {
4922 1.1 dyoung stats->l4cs_bad.ev_count++;
4923 1.1 dyoung mp->m_pkthdr.csum_flags |= type | M_CSUM_TCP_UDP_BAD;
4924 1.1 dyoung }
4925 1.1 dyoung }
4926 1.1 dyoung return;
4927 1.1 dyoung }
4928 1.1 dyoung
4929 1.1 dyoung
4930 1.1 dyoung #if 0 /* XXX Badly need to overhaul vlan(4) on NetBSD. */
4931 1.1 dyoung /*
4932 1.1 dyoung ** This routine is run via an vlan config EVENT,
4933 1.1 dyoung ** it enables us to use the HW Filter table since
4934 1.1 dyoung ** we can get the vlan id. This just creates the
4935 1.1 dyoung ** entry in the soft version of the VFTA, init will
4936 1.1 dyoung ** repopulate the real table.
4937 1.1 dyoung */
4938 1.1 dyoung static void
4939 1.1 dyoung ixgbe_register_vlan(void *arg, struct ifnet *ifp, u16 vtag)
4940 1.1 dyoung {
4941 1.1 dyoung struct adapter *adapter = ifp->if_softc;
4942 1.1 dyoung u16 index, bit;
4943 1.1 dyoung
4944 1.1 dyoung if (ifp->if_softc != arg) /* Not our event */
4945 1.1 dyoung return;
4946 1.1 dyoung
4947 1.1 dyoung if ((vtag == 0) || (vtag > 4095)) /* Invalid */
4948 1.1 dyoung return;
4949 1.1 dyoung
4950 1.1 dyoung IXGBE_CORE_LOCK(adapter);
4951 1.1 dyoung index = (vtag >> 5) & 0x7F;
4952 1.1 dyoung bit = vtag & 0x1F;
4953 1.1 dyoung adapter->shadow_vfta[index] |= (1 << bit);
4954 1.1 dyoung ixgbe_init_locked(adapter);
4955 1.1 dyoung IXGBE_CORE_UNLOCK(adapter);
4956 1.1 dyoung }
4957 1.1 dyoung
4958 1.1 dyoung /*
4959 1.1 dyoung ** This routine is run via an vlan
4960 1.1 dyoung ** unconfig EVENT, remove our entry
4961 1.1 dyoung ** in the soft vfta.
4962 1.1 dyoung */
4963 1.1 dyoung static void
4964 1.1 dyoung ixgbe_unregister_vlan(void *arg, struct ifnet *ifp, u16 vtag)
4965 1.1 dyoung {
4966 1.1 dyoung struct adapter *adapter = ifp->if_softc;
4967 1.1 dyoung u16 index, bit;
4968 1.1 dyoung
4969 1.1 dyoung if (ifp->if_softc != arg)
4970 1.1 dyoung return;
4971 1.1 dyoung
4972 1.1 dyoung if ((vtag == 0) || (vtag > 4095)) /* Invalid */
4973 1.1 dyoung return;
4974 1.1 dyoung
4975 1.1 dyoung IXGBE_CORE_LOCK(adapter);
4976 1.1 dyoung index = (vtag >> 5) & 0x7F;
4977 1.1 dyoung bit = vtag & 0x1F;
4978 1.1 dyoung adapter->shadow_vfta[index] &= ~(1 << bit);
4979 1.1 dyoung /* Re-init to load the changes */
4980 1.1 dyoung ixgbe_init_locked(adapter);
4981 1.1 dyoung IXGBE_CORE_UNLOCK(adapter);
4982 1.1 dyoung }
4983 1.1 dyoung #endif
4984 1.1 dyoung
4985 1.1 dyoung static void
4986 1.1 dyoung ixgbe_setup_vlan_hw_support(struct adapter *adapter)
4987 1.1 dyoung {
4988 1.1 dyoung struct ethercom *ec = &adapter->osdep.ec;
4989 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
4990 1.14.2.4 riz struct rx_ring *rxr;
4991 1.1 dyoung u32 ctrl;
4992 1.1 dyoung
4993 1.1 dyoung /*
4994 1.1 dyoung ** We get here thru init_locked, meaning
4995 1.1 dyoung ** a soft reset, this has already cleared
4996 1.1 dyoung ** the VFTA and other state, so if there
4997 1.1 dyoung ** have been no vlan's registered do nothing.
4998 1.1 dyoung */
4999 1.1 dyoung if (!VLAN_ATTACHED(&adapter->osdep.ec)) {
5000 1.1 dyoung return;
5001 1.1 dyoung }
5002 1.1 dyoung
5003 1.1 dyoung /*
5004 1.1 dyoung ** A soft reset zero's out the VFTA, so
5005 1.1 dyoung ** we need to repopulate it now.
5006 1.1 dyoung */
5007 1.1 dyoung for (int i = 0; i < IXGBE_VFTA_SIZE; i++)
5008 1.1 dyoung if (adapter->shadow_vfta[i] != 0)
5009 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_VFTA(i),
5010 1.1 dyoung adapter->shadow_vfta[i]);
5011 1.1 dyoung
5012 1.1 dyoung ctrl = IXGBE_READ_REG(hw, IXGBE_VLNCTRL);
5013 1.1 dyoung /* Enable the Filter Table if enabled */
5014 1.1 dyoung if (ec->ec_capenable & ETHERCAP_VLAN_HWFILTER) {
5015 1.1 dyoung ctrl &= ~IXGBE_VLNCTRL_CFIEN;
5016 1.1 dyoung ctrl |= IXGBE_VLNCTRL_VFE;
5017 1.1 dyoung }
5018 1.1 dyoung if (hw->mac.type == ixgbe_mac_82598EB)
5019 1.1 dyoung ctrl |= IXGBE_VLNCTRL_VME;
5020 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_VLNCTRL, ctrl);
5021 1.1 dyoung
5022 1.14.2.4 riz /* Setup the queues for vlans */
5023 1.14.2.4 riz for (int i = 0; i < adapter->num_queues; i++) {
5024 1.14.2.4 riz rxr = &adapter->rx_rings[i];
5025 1.14.2.4 riz /* On 82599 the VLAN enable is per/queue in RXDCTL */
5026 1.14.2.4 riz if (hw->mac.type != ixgbe_mac_82598EB) {
5027 1.1 dyoung ctrl = IXGBE_READ_REG(hw, IXGBE_RXDCTL(i));
5028 1.14.2.4 riz ctrl |= IXGBE_RXDCTL_VME;
5029 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_RXDCTL(i), ctrl);
5030 1.1 dyoung }
5031 1.14.2.4 riz rxr->vtag_strip = TRUE;
5032 1.14.2.4 riz }
5033 1.1 dyoung }
5034 1.1 dyoung
5035 1.1 dyoung static void
5036 1.1 dyoung ixgbe_enable_intr(struct adapter *adapter)
5037 1.1 dyoung {
5038 1.14.2.5 riz struct ixgbe_hw *hw = &adapter->hw;
5039 1.14.2.5 riz struct ix_queue *que = adapter->queues;
5040 1.14.2.5 riz u32 mask, fwsm;
5041 1.1 dyoung
5042 1.14.2.5 riz mask = (IXGBE_EIMS_ENABLE_MASK & ~IXGBE_EIMS_RTX_QUEUE);
5043 1.1 dyoung /* Enable Fan Failure detection */
5044 1.1 dyoung if (hw->device_id == IXGBE_DEV_ID_82598AT)
5045 1.1 dyoung mask |= IXGBE_EIMS_GPI_SDP1;
5046 1.14.2.5 riz
5047 1.14.2.5 riz switch (adapter->hw.mac.type) {
5048 1.14.2.5 riz case ixgbe_mac_82599EB:
5049 1.14.2.5 riz mask |= IXGBE_EIMS_ECC;
5050 1.14.2.5 riz mask |= IXGBE_EIMS_GPI_SDP0;
5051 1.14.2.5 riz mask |= IXGBE_EIMS_GPI_SDP1;
5052 1.14.2.5 riz mask |= IXGBE_EIMS_GPI_SDP2;
5053 1.1 dyoung #ifdef IXGBE_FDIR
5054 1.14.2.5 riz mask |= IXGBE_EIMS_FLOW_DIR;
5055 1.1 dyoung #endif
5056 1.14.2.5 riz break;
5057 1.14.2.5 riz case ixgbe_mac_X540:
5058 1.14.2.5 riz mask |= IXGBE_EIMS_ECC;
5059 1.14.2.5 riz /* Detect if Thermal Sensor is enabled */
5060 1.14.2.5 riz fwsm = IXGBE_READ_REG(hw, IXGBE_FWSM);
5061 1.14.2.5 riz if (fwsm & IXGBE_FWSM_TS_ENABLED)
5062 1.14.2.5 riz mask |= IXGBE_EIMS_TS;
5063 1.14.2.5 riz #ifdef IXGBE_FDIR
5064 1.14.2.5 riz mask |= IXGBE_EIMS_FLOW_DIR;
5065 1.14.2.5 riz #endif
5066 1.14.2.5 riz /* falls through */
5067 1.14.2.5 riz default:
5068 1.14.2.5 riz break;
5069 1.1 dyoung }
5070 1.1 dyoung
5071 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EIMS, mask);
5072 1.1 dyoung
5073 1.1 dyoung /* With RSS we use auto clear */
5074 1.1 dyoung if (adapter->msix_mem) {
5075 1.1 dyoung mask = IXGBE_EIMS_ENABLE_MASK;
5076 1.1 dyoung /* Don't autoclear Link */
5077 1.1 dyoung mask &= ~IXGBE_EIMS_OTHER;
5078 1.1 dyoung mask &= ~IXGBE_EIMS_LSC;
5079 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_EIAC, mask);
5080 1.1 dyoung }
5081 1.1 dyoung
5082 1.1 dyoung /*
5083 1.1 dyoung ** Now enable all queues, this is done separately to
5084 1.1 dyoung ** allow for handling the extended (beyond 32) MSIX
5085 1.1 dyoung ** vectors that can be used by 82599
5086 1.1 dyoung */
5087 1.1 dyoung for (int i = 0; i < adapter->num_queues; i++, que++)
5088 1.1 dyoung ixgbe_enable_queue(adapter, que->msix);
5089 1.1 dyoung
5090 1.1 dyoung IXGBE_WRITE_FLUSH(hw);
5091 1.1 dyoung
5092 1.1 dyoung return;
5093 1.1 dyoung }
5094 1.1 dyoung
5095 1.1 dyoung static void
5096 1.1 dyoung ixgbe_disable_intr(struct adapter *adapter)
5097 1.1 dyoung {
5098 1.1 dyoung if (adapter->msix_mem)
5099 1.1 dyoung IXGBE_WRITE_REG(&adapter->hw, IXGBE_EIAC, 0);
5100 1.1 dyoung if (adapter->hw.mac.type == ixgbe_mac_82598EB) {
5101 1.1 dyoung IXGBE_WRITE_REG(&adapter->hw, IXGBE_EIMC, ~0);
5102 1.1 dyoung } else {
5103 1.1 dyoung IXGBE_WRITE_REG(&adapter->hw, IXGBE_EIMC, 0xFFFF0000);
5104 1.1 dyoung IXGBE_WRITE_REG(&adapter->hw, IXGBE_EIMC_EX(0), ~0);
5105 1.1 dyoung IXGBE_WRITE_REG(&adapter->hw, IXGBE_EIMC_EX(1), ~0);
5106 1.1 dyoung }
5107 1.1 dyoung IXGBE_WRITE_FLUSH(&adapter->hw);
5108 1.1 dyoung return;
5109 1.1 dyoung }
5110 1.1 dyoung
5111 1.1 dyoung u16
5112 1.1 dyoung ixgbe_read_pci_cfg(struct ixgbe_hw *hw, u32 reg)
5113 1.1 dyoung {
5114 1.1 dyoung switch (reg % 4) {
5115 1.1 dyoung case 0:
5116 1.1 dyoung return pci_conf_read(hw->back->pc, hw->back->tag, reg) &
5117 1.1 dyoung __BITS(15, 0);
5118 1.1 dyoung case 2:
5119 1.1 dyoung return __SHIFTOUT(pci_conf_read(hw->back->pc, hw->back->tag,
5120 1.1 dyoung reg - 2), __BITS(31, 16));
5121 1.1 dyoung default:
5122 1.1 dyoung panic("%s: invalid register (%" PRIx32, __func__, reg);
5123 1.1 dyoung break;
5124 1.1 dyoung }
5125 1.1 dyoung }
5126 1.1 dyoung
5127 1.1 dyoung void
5128 1.1 dyoung ixgbe_write_pci_cfg(struct ixgbe_hw *hw, u32 reg, u16 value)
5129 1.1 dyoung {
5130 1.1 dyoung pcireg_t old;
5131 1.1 dyoung
5132 1.1 dyoung switch (reg % 4) {
5133 1.1 dyoung case 0:
5134 1.1 dyoung old = pci_conf_read(hw->back->pc, hw->back->tag, reg) &
5135 1.1 dyoung __BITS(31, 16);
5136 1.1 dyoung pci_conf_write(hw->back->pc, hw->back->tag, reg, value | old);
5137 1.1 dyoung break;
5138 1.1 dyoung case 2:
5139 1.1 dyoung old = pci_conf_read(hw->back->pc, hw->back->tag, reg - 2) &
5140 1.1 dyoung __BITS(15, 0);
5141 1.1 dyoung pci_conf_write(hw->back->pc, hw->back->tag, reg - 2,
5142 1.1 dyoung __SHIFTIN(value, __BITS(31, 16)) | old);
5143 1.1 dyoung break;
5144 1.1 dyoung default:
5145 1.1 dyoung panic("%s: invalid register (%" PRIx32, __func__, reg);
5146 1.1 dyoung break;
5147 1.1 dyoung }
5148 1.1 dyoung
5149 1.1 dyoung return;
5150 1.1 dyoung }
5151 1.1 dyoung
5152 1.1 dyoung /*
5153 1.1 dyoung ** Setup the correct IVAR register for a particular MSIX interrupt
5154 1.1 dyoung ** (yes this is all very magic and confusing :)
5155 1.1 dyoung ** - entry is the register array entry
5156 1.1 dyoung ** - vector is the MSIX vector for this queue
5157 1.1 dyoung ** - type is RX/TX/MISC
5158 1.1 dyoung */
5159 1.1 dyoung static void
5160 1.1 dyoung ixgbe_set_ivar(struct adapter *adapter, u8 entry, u8 vector, s8 type)
5161 1.1 dyoung {
5162 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
5163 1.1 dyoung u32 ivar, index;
5164 1.1 dyoung
5165 1.1 dyoung vector |= IXGBE_IVAR_ALLOC_VAL;
5166 1.1 dyoung
5167 1.1 dyoung switch (hw->mac.type) {
5168 1.1 dyoung
5169 1.1 dyoung case ixgbe_mac_82598EB:
5170 1.1 dyoung if (type == -1)
5171 1.1 dyoung entry = IXGBE_IVAR_OTHER_CAUSES_INDEX;
5172 1.1 dyoung else
5173 1.1 dyoung entry += (type * 64);
5174 1.1 dyoung index = (entry >> 2) & 0x1F;
5175 1.1 dyoung ivar = IXGBE_READ_REG(hw, IXGBE_IVAR(index));
5176 1.1 dyoung ivar &= ~(0xFF << (8 * (entry & 0x3)));
5177 1.1 dyoung ivar |= (vector << (8 * (entry & 0x3)));
5178 1.1 dyoung IXGBE_WRITE_REG(&adapter->hw, IXGBE_IVAR(index), ivar);
5179 1.1 dyoung break;
5180 1.1 dyoung
5181 1.1 dyoung case ixgbe_mac_82599EB:
5182 1.14.2.4 riz case ixgbe_mac_X540:
5183 1.1 dyoung if (type == -1) { /* MISC IVAR */
5184 1.1 dyoung index = (entry & 1) * 8;
5185 1.1 dyoung ivar = IXGBE_READ_REG(hw, IXGBE_IVAR_MISC);
5186 1.1 dyoung ivar &= ~(0xFF << index);
5187 1.1 dyoung ivar |= (vector << index);
5188 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_IVAR_MISC, ivar);
5189 1.1 dyoung } else { /* RX/TX IVARS */
5190 1.1 dyoung index = (16 * (entry & 1)) + (8 * type);
5191 1.1 dyoung ivar = IXGBE_READ_REG(hw, IXGBE_IVAR(entry >> 1));
5192 1.1 dyoung ivar &= ~(0xFF << index);
5193 1.1 dyoung ivar |= (vector << index);
5194 1.1 dyoung IXGBE_WRITE_REG(hw, IXGBE_IVAR(entry >> 1), ivar);
5195 1.1 dyoung }
5196 1.1 dyoung
5197 1.1 dyoung default:
5198 1.1 dyoung break;
5199 1.1 dyoung }
5200 1.1 dyoung }
5201 1.1 dyoung
5202 1.1 dyoung static void
5203 1.1 dyoung ixgbe_configure_ivars(struct adapter *adapter)
5204 1.1 dyoung {
5205 1.1 dyoung struct ix_queue *que = adapter->queues;
5206 1.1 dyoung u32 newitr;
5207 1.1 dyoung
5208 1.1 dyoung if (ixgbe_max_interrupt_rate > 0)
5209 1.14.2.3 martin newitr = (4000000 / ixgbe_max_interrupt_rate) & 0x0FF8;
5210 1.1 dyoung else
5211 1.1 dyoung newitr = 0;
5212 1.1 dyoung
5213 1.1 dyoung for (int i = 0; i < adapter->num_queues; i++, que++) {
5214 1.1 dyoung /* First the RX queue entry */
5215 1.1 dyoung ixgbe_set_ivar(adapter, i, que->msix, 0);
5216 1.1 dyoung /* ... and the TX */
5217 1.1 dyoung ixgbe_set_ivar(adapter, i, que->msix, 1);
5218 1.1 dyoung /* Set an Initial EITR value */
5219 1.1 dyoung IXGBE_WRITE_REG(&adapter->hw,
5220 1.1 dyoung IXGBE_EITR(que->msix), newitr);
5221 1.1 dyoung }
5222 1.1 dyoung
5223 1.1 dyoung /* For the Link interrupt */
5224 1.1 dyoung ixgbe_set_ivar(adapter, 1, adapter->linkvec, -1);
5225 1.1 dyoung }
5226 1.1 dyoung
5227 1.1 dyoung /*
5228 1.1 dyoung ** ixgbe_sfp_probe - called in the local timer to
5229 1.1 dyoung ** determine if a port had optics inserted.
5230 1.1 dyoung */
5231 1.1 dyoung static bool ixgbe_sfp_probe(struct adapter *adapter)
5232 1.1 dyoung {
5233 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
5234 1.1 dyoung device_t dev = adapter->dev;
5235 1.1 dyoung bool result = FALSE;
5236 1.1 dyoung
5237 1.1 dyoung if ((hw->phy.type == ixgbe_phy_nl) &&
5238 1.1 dyoung (hw->phy.sfp_type == ixgbe_sfp_type_not_present)) {
5239 1.1 dyoung s32 ret = hw->phy.ops.identify_sfp(hw);
5240 1.1 dyoung if (ret)
5241 1.1 dyoung goto out;
5242 1.1 dyoung ret = hw->phy.ops.reset(hw);
5243 1.1 dyoung if (ret == IXGBE_ERR_SFP_NOT_SUPPORTED) {
5244 1.1 dyoung device_printf(dev,"Unsupported SFP+ module detected!");
5245 1.1 dyoung device_printf(dev, "Reload driver with supported module.\n");
5246 1.1 dyoung adapter->sfp_probe = FALSE;
5247 1.1 dyoung goto out;
5248 1.1 dyoung } else
5249 1.1 dyoung device_printf(dev,"SFP+ module detected!\n");
5250 1.1 dyoung /* We now have supported optics */
5251 1.1 dyoung adapter->sfp_probe = FALSE;
5252 1.1 dyoung /* Set the optics type so system reports correctly */
5253 1.1 dyoung ixgbe_setup_optics(adapter);
5254 1.1 dyoung result = TRUE;
5255 1.1 dyoung }
5256 1.1 dyoung out:
5257 1.1 dyoung return (result);
5258 1.1 dyoung }
5259 1.1 dyoung
5260 1.1 dyoung /*
5261 1.1 dyoung ** Tasklet handler for MSIX Link interrupts
5262 1.1 dyoung ** - do outside interrupt since it might sleep
5263 1.1 dyoung */
5264 1.1 dyoung static void
5265 1.1 dyoung ixgbe_handle_link(void *context)
5266 1.1 dyoung {
5267 1.1 dyoung struct adapter *adapter = context;
5268 1.1 dyoung
5269 1.13 christos if (ixgbe_check_link(&adapter->hw,
5270 1.13 christos &adapter->link_speed, &adapter->link_up, 0) == 0)
5271 1.13 christos ixgbe_update_link_status(adapter);
5272 1.1 dyoung }
5273 1.1 dyoung
5274 1.1 dyoung /*
5275 1.1 dyoung ** Tasklet for handling SFP module interrupts
5276 1.1 dyoung */
5277 1.1 dyoung static void
5278 1.1 dyoung ixgbe_handle_mod(void *context)
5279 1.1 dyoung {
5280 1.1 dyoung struct adapter *adapter = context;
5281 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
5282 1.1 dyoung device_t dev = adapter->dev;
5283 1.1 dyoung u32 err;
5284 1.1 dyoung
5285 1.1 dyoung err = hw->phy.ops.identify_sfp(hw);
5286 1.1 dyoung if (err == IXGBE_ERR_SFP_NOT_SUPPORTED) {
5287 1.1 dyoung device_printf(dev,
5288 1.1 dyoung "Unsupported SFP+ module type was detected.\n");
5289 1.1 dyoung return;
5290 1.1 dyoung }
5291 1.1 dyoung err = hw->mac.ops.setup_sfp(hw);
5292 1.1 dyoung if (err == IXGBE_ERR_SFP_NOT_SUPPORTED) {
5293 1.1 dyoung device_printf(dev,
5294 1.1 dyoung "Setup failure - unsupported SFP+ module type.\n");
5295 1.1 dyoung return;
5296 1.1 dyoung }
5297 1.1 dyoung softint_schedule(adapter->msf_si);
5298 1.1 dyoung return;
5299 1.1 dyoung }
5300 1.1 dyoung
5301 1.1 dyoung
5302 1.1 dyoung /*
5303 1.1 dyoung ** Tasklet for handling MSF (multispeed fiber) interrupts
5304 1.1 dyoung */
5305 1.1 dyoung static void
5306 1.1 dyoung ixgbe_handle_msf(void *context)
5307 1.1 dyoung {
5308 1.1 dyoung struct adapter *adapter = context;
5309 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
5310 1.1 dyoung u32 autoneg;
5311 1.1 dyoung bool negotiate;
5312 1.1 dyoung
5313 1.1 dyoung autoneg = hw->phy.autoneg_advertised;
5314 1.1 dyoung if ((!autoneg) && (hw->mac.ops.get_link_capabilities))
5315 1.1 dyoung hw->mac.ops.get_link_capabilities(hw, &autoneg, &negotiate);
5316 1.13 christos else
5317 1.13 christos negotiate = 0;
5318 1.1 dyoung if (hw->mac.ops.setup_link)
5319 1.14.2.5 riz hw->mac.ops.setup_link(hw, autoneg, TRUE);
5320 1.1 dyoung return;
5321 1.1 dyoung }
5322 1.1 dyoung
5323 1.1 dyoung #ifdef IXGBE_FDIR
5324 1.1 dyoung /*
5325 1.1 dyoung ** Tasklet for reinitializing the Flow Director filter table
5326 1.1 dyoung */
5327 1.1 dyoung static void
5328 1.1 dyoung ixgbe_reinit_fdir(void *context)
5329 1.1 dyoung {
5330 1.1 dyoung struct adapter *adapter = context;
5331 1.1 dyoung struct ifnet *ifp = adapter->ifp;
5332 1.1 dyoung
5333 1.1 dyoung if (adapter->fdir_reinit != 1) /* Shouldn't happen */
5334 1.1 dyoung return;
5335 1.1 dyoung ixgbe_reinit_fdir_tables_82599(&adapter->hw);
5336 1.1 dyoung adapter->fdir_reinit = 0;
5337 1.14.2.4 riz /* re-enable flow director interrupts */
5338 1.14.2.4 riz IXGBE_WRITE_REG(&adapter->hw, IXGBE_EIMS, IXGBE_EIMS_FLOW_DIR);
5339 1.1 dyoung /* Restart the interface */
5340 1.1 dyoung ifp->if_flags |= IFF_RUNNING;
5341 1.1 dyoung return;
5342 1.1 dyoung }
5343 1.1 dyoung #endif
5344 1.1 dyoung
5345 1.1 dyoung /**********************************************************************
5346 1.1 dyoung *
5347 1.1 dyoung * Update the board statistics counters.
5348 1.1 dyoung *
5349 1.1 dyoung **********************************************************************/
5350 1.1 dyoung static void
5351 1.1 dyoung ixgbe_update_stats_counters(struct adapter *adapter)
5352 1.1 dyoung {
5353 1.1 dyoung struct ifnet *ifp = adapter->ifp;
5354 1.1 dyoung struct ixgbe_hw *hw = &adapter->hw;
5355 1.1 dyoung u32 missed_rx = 0, bprc, lxon, lxoff, total;
5356 1.1 dyoung u64 total_missed_rx = 0;
5357 1.14.2.4 riz uint64_t crcerrs, rlec;
5358 1.1 dyoung
5359 1.14.2.4 riz crcerrs = IXGBE_READ_REG(hw, IXGBE_CRCERRS);
5360 1.14.2.4 riz adapter->stats.crcerrs.ev_count += crcerrs;
5361 1.1 dyoung adapter->stats.illerrc.ev_count += IXGBE_READ_REG(hw, IXGBE_ILLERRC);
5362 1.1 dyoung adapter->stats.errbc.ev_count += IXGBE_READ_REG(hw, IXGBE_ERRBC);
5363 1.1 dyoung adapter->stats.mspdc.ev_count += IXGBE_READ_REG(hw, IXGBE_MSPDC);
5364 1.1 dyoung
5365 1.14.2.5 riz /*
5366 1.14.2.5 riz ** Note: these are for the 8 possible traffic classes,
5367 1.14.2.5 riz ** which in current implementation is unused,
5368 1.14.2.5 riz ** therefore only 0 should read real data.
5369 1.14.2.5 riz */
5370 1.1 dyoung for (int i = 0; i < __arraycount(adapter->stats.mpc); i++) {
5371 1.1 dyoung int j = i % adapter->num_queues;
5372 1.1 dyoung u32 mp;
5373 1.1 dyoung mp = IXGBE_READ_REG(hw, IXGBE_MPC(i));
5374 1.1 dyoung /* missed_rx tallies misses for the gprc workaround */
5375 1.1 dyoung missed_rx += mp;
5376 1.1 dyoung /* global total per queue */
5377 1.1 dyoung adapter->stats.mpc[j].ev_count += mp;
5378 1.1 dyoung /* Running comprehensive total for stats display */
5379 1.14.2.4 riz total_missed_rx += mp;
5380 1.14.2.5 riz if (hw->mac.type == ixgbe_mac_82598EB) {
5381 1.1 dyoung adapter->stats.rnbc[j] +=
5382 1.1 dyoung IXGBE_READ_REG(hw, IXGBE_RNBC(i));
5383 1.14.2.5 riz adapter->stats.qbtc[j].ev_count +=
5384 1.14.2.5 riz IXGBE_READ_REG(hw, IXGBE_QBTC(i));
5385 1.14.2.5 riz adapter->stats.qbrc[j].ev_count +=
5386 1.14.2.5 riz IXGBE_READ_REG(hw, IXGBE_QBRC(i));
5387 1.14.2.5 riz adapter->stats.pxonrxc[j].ev_count +=
5388 1.14.2.5 riz IXGBE_READ_REG(hw, IXGBE_PXONRXC(i));
5389 1.14.2.5 riz } else {
5390 1.14.2.5 riz adapter->stats.pxonrxc[j].ev_count +=
5391 1.14.2.5 riz IXGBE_READ_REG(hw, IXGBE_PXONRXCNT(i));
5392 1.14.2.5 riz }
5393 1.1 dyoung adapter->stats.pxontxc[j].ev_count +=
5394 1.1 dyoung IXGBE_READ_REG(hw, IXGBE_PXONTXC(i));
5395 1.1 dyoung adapter->stats.pxofftxc[j].ev_count +=
5396 1.1 dyoung IXGBE_READ_REG(hw, IXGBE_PXOFFTXC(i));
5397 1.1 dyoung adapter->stats.pxoffrxc[j].ev_count +=
5398 1.1 dyoung IXGBE_READ_REG(hw, IXGBE_PXOFFRXC(i));
5399 1.1 dyoung adapter->stats.pxon2offc[j].ev_count +=
5400 1.1 dyoung IXGBE_READ_REG(hw, IXGBE_PXON2OFFCNT(i));
5401 1.1 dyoung }
5402 1.1 dyoung for (int i = 0; i < __arraycount(adapter->stats.qprc); i++) {
5403 1.1 dyoung int j = i % adapter->num_queues;
5404 1.1 dyoung adapter->stats.qprc[j].ev_count += IXGBE_READ_REG(hw, IXGBE_QPRC(i));
5405 1.1 dyoung adapter->stats.qptc[j].ev_count += IXGBE_READ_REG(hw, IXGBE_QPTC(i));
5406 1.1 dyoung adapter->stats.qprdc[j].ev_count += IXGBE_READ_REG(hw, IXGBE_QPRDC(i));
5407 1.1 dyoung }
5408 1.1 dyoung adapter->stats.mlfc.ev_count += IXGBE_READ_REG(hw, IXGBE_MLFC);
5409 1.1 dyoung adapter->stats.mrfc.ev_count += IXGBE_READ_REG(hw, IXGBE_MRFC);
5410 1.14.2.4 riz rlec = IXGBE_READ_REG(hw, IXGBE_RLEC);
5411 1.14.2.4 riz adapter->stats.rlec.ev_count += rlec;
5412 1.1 dyoung
5413 1.1 dyoung /* Hardware workaround, gprc counts missed packets */
5414 1.1 dyoung adapter->stats.gprc.ev_count += IXGBE_READ_REG(hw, IXGBE_GPRC) - missed_rx;
5415 1.1 dyoung
5416 1.1 dyoung lxon = IXGBE_READ_REG(hw, IXGBE_LXONTXC);
5417 1.1 dyoung adapter->stats.lxontxc.ev_count += lxon;
5418 1.1 dyoung lxoff = IXGBE_READ_REG(hw, IXGBE_LXOFFTXC);
5419 1.1 dyoung adapter->stats.lxofftxc.ev_count += lxoff;
5420 1.1 dyoung total = lxon + lxoff;
5421 1.1 dyoung
5422 1.1 dyoung if (hw->mac.type != ixgbe_mac_82598EB) {
5423 1.1 dyoung adapter->stats.gorc.ev_count += IXGBE_READ_REG(hw, IXGBE_GORCL) +
5424 1.1 dyoung ((u64)IXGBE_READ_REG(hw, IXGBE_GORCH) << 32);
5425 1.1 dyoung adapter->stats.gotc.ev_count += IXGBE_READ_REG(hw, IXGBE_GOTCL) +
5426 1.1 dyoung ((u64)IXGBE_READ_REG(hw, IXGBE_GOTCH) << 32) - total * ETHER_MIN_LEN;
5427 1.1 dyoung adapter->stats.tor.ev_count += IXGBE_READ_REG(hw, IXGBE_TORL) +
5428 1.1 dyoung ((u64)IXGBE_READ_REG(hw, IXGBE_TORH) << 32);
5429 1.1 dyoung adapter->stats.lxonrxc.ev_count += IXGBE_READ_REG(hw, IXGBE_LXONRXCNT);
5430 1.1 dyoung adapter->stats.lxoffrxc.ev_count += IXGBE_READ_REG(hw, IXGBE_LXOFFRXCNT);
5431 1.1 dyoung } else {
5432 1.1 dyoung adapter->stats.lxonrxc.ev_count += IXGBE_READ_REG(hw, IXGBE_LXONRXC);
5433 1.1 dyoung adapter->stats.lxoffrxc.ev_count += IXGBE_READ_REG(hw, IXGBE_LXOFFRXC);
5434 1.1 dyoung /* 82598 only has a counter in the high register */
5435 1.1 dyoung adapter->stats.gorc.ev_count += IXGBE_READ_REG(hw, IXGBE_GORCH);
5436 1.1 dyoung adapter->stats.gotc.ev_count += IXGBE_READ_REG(hw, IXGBE_GOTCH) - total * ETHER_MIN_LEN;
5437 1.1 dyoung adapter->stats.tor.ev_count += IXGBE_READ_REG(hw, IXGBE_TORH);
5438 1.1 dyoung }
5439 1.1 dyoung
5440 1.1 dyoung /*
5441 1.1 dyoung * Workaround: mprc hardware is incorrectly counting
5442 1.1 dyoung * broadcasts, so for now we subtract those.
5443 1.1 dyoung */
5444 1.1 dyoung bprc = IXGBE_READ_REG(hw, IXGBE_BPRC);
5445 1.1 dyoung adapter->stats.bprc.ev_count += bprc;
5446 1.1 dyoung adapter->stats.mprc.ev_count += IXGBE_READ_REG(hw, IXGBE_MPRC) - ((hw->mac.type == ixgbe_mac_82598EB) ? bprc : 0);
5447 1.1 dyoung
5448 1.1 dyoung adapter->stats.prc64.ev_count += IXGBE_READ_REG(hw, IXGBE_PRC64);
5449 1.1 dyoung adapter->stats.prc127.ev_count += IXGBE_READ_REG(hw, IXGBE_PRC127);
5450 1.1 dyoung adapter->stats.prc255.ev_count += IXGBE_READ_REG(hw, IXGBE_PRC255);
5451 1.1 dyoung adapter->stats.prc511.ev_count += IXGBE_READ_REG(hw, IXGBE_PRC511);
5452 1.1 dyoung adapter->stats.prc1023.ev_count += IXGBE_READ_REG(hw, IXGBE_PRC1023);
5453 1.1 dyoung adapter->stats.prc1522.ev_count += IXGBE_READ_REG(hw, IXGBE_PRC1522);
5454 1.1 dyoung
5455 1.1 dyoung adapter->stats.gptc.ev_count += IXGBE_READ_REG(hw, IXGBE_GPTC) - total;
5456 1.1 dyoung adapter->stats.mptc.ev_count += IXGBE_READ_REG(hw, IXGBE_MPTC) - total;
5457 1.1 dyoung adapter->stats.ptc64.ev_count += IXGBE_READ_REG(hw, IXGBE_PTC64) - total;
5458 1.1 dyoung
5459 1.1 dyoung adapter->stats.ruc.ev_count += IXGBE_READ_REG(hw, IXGBE_RUC);
5460 1.1 dyoung adapter->stats.rfc.ev_count += IXGBE_READ_REG(hw, IXGBE_RFC);
5461 1.1 dyoung adapter->stats.roc.ev_count += IXGBE_READ_REG(hw, IXGBE_ROC);
5462 1.1 dyoung adapter->stats.rjc.ev_count += IXGBE_READ_REG(hw, IXGBE_RJC);
5463 1.1 dyoung adapter->stats.mngprc.ev_count += IXGBE_READ_REG(hw, IXGBE_MNGPRC);
5464 1.1 dyoung adapter->stats.mngpdc.ev_count += IXGBE_READ_REG(hw, IXGBE_MNGPDC);
5465 1.1 dyoung adapter->stats.mngptc.ev_count += IXGBE_READ_REG(hw, IXGBE_MNGPTC);
5466 1.1 dyoung adapter->stats.tpr.ev_count += IXGBE_READ_REG(hw, IXGBE_TPR);
5467 1.1 dyoung adapter->stats.tpt.ev_count += IXGBE_READ_REG(hw, IXGBE_TPT);
5468 1.1 dyoung adapter->stats.ptc127.ev_count += IXGBE_READ_REG(hw, IXGBE_PTC127);
5469 1.1 dyoung adapter->stats.ptc255.ev_count += IXGBE_READ_REG(hw, IXGBE_PTC255);
5470 1.1 dyoung adapter->stats.ptc511.ev_count += IXGBE_READ_REG(hw, IXGBE_PTC511);
5471 1.1 dyoung adapter->stats.ptc1023.ev_count += IXGBE_READ_REG(hw, IXGBE_PTC1023);
5472 1.1 dyoung adapter->stats.ptc1522.ev_count += IXGBE_READ_REG(hw, IXGBE_PTC1522);
5473 1.1 dyoung adapter->stats.bptc.ev_count += IXGBE_READ_REG(hw, IXGBE_BPTC);
5474 1.1 dyoung adapter->stats.xec.ev_count += IXGBE_READ_REG(hw, IXGBE_XEC);
5475 1.1 dyoung adapter->stats.fccrc.ev_count += IXGBE_READ_REG(hw, IXGBE_FCCRC);
5476 1.1 dyoung adapter->stats.fclast.ev_count += IXGBE_READ_REG(hw, IXGBE_FCLAST);
5477 1.1 dyoung
5478 1.1 dyoung /* Only read FCOE on 82599 */
5479 1.1 dyoung if (hw->mac.type != ixgbe_mac_82598EB) {
5480 1.1 dyoung adapter->stats.fcoerpdc.ev_count +=
5481 1.1 dyoung IXGBE_READ_REG(hw, IXGBE_FCOERPDC);
5482 1.1 dyoung adapter->stats.fcoeprc.ev_count +=
5483 1.1 dyoung IXGBE_READ_REG(hw, IXGBE_FCOEPRC);
5484 1.1 dyoung adapter->stats.fcoeptc.ev_count +=
5485 1.1 dyoung IXGBE_READ_REG(hw, IXGBE_FCOEPTC);
5486 1.1 dyoung adapter->stats.fcoedwrc.ev_count +=
5487 1.1 dyoung IXGBE_READ_REG(hw, IXGBE_FCOEDWRC);
5488 1.1 dyoung adapter->stats.fcoedwtc.ev_count +=
5489 1.1 dyoung IXGBE_READ_REG(hw, IXGBE_FCOEDWTC);
5490 1.1 dyoung }
5491 1.1 dyoung
5492 1.1 dyoung /* Fill out the OS statistics structure */
5493 1.14.2.4 riz /*
5494 1.14.2.4 riz * NetBSD: Don't override if_{i|o}{packets|bytes|mcasts} with
5495 1.14.2.4 riz * adapter->stats counters. It's required to make ifconfig -z
5496 1.14.2.4 riz * (SOICZIFDATA) work.
5497 1.14.2.4 riz */
5498 1.1 dyoung ifp->if_collisions = 0;
5499 1.14.2.5 riz
5500 1.1 dyoung /* Rx Errors */
5501 1.14.2.5 riz ifp->if_iqdrops += total_missed_rx;
5502 1.14.2.5 riz ifp->if_ierrors += crcerrs + rlec;
5503 1.1 dyoung }
5504 1.1 dyoung
5505 1.1 dyoung /** ixgbe_sysctl_tdh_handler - Handler function
5506 1.1 dyoung * Retrieves the TDH value from the hardware
5507 1.1 dyoung */
5508 1.1 dyoung static int
5509 1.1 dyoung ixgbe_sysctl_tdh_handler(SYSCTLFN_ARGS)
5510 1.1 dyoung {
5511 1.1 dyoung struct sysctlnode node;
5512 1.1 dyoung uint32_t val;
5513 1.1 dyoung struct tx_ring *txr;
5514 1.1 dyoung
5515 1.1 dyoung node = *rnode;
5516 1.1 dyoung txr = (struct tx_ring *)node.sysctl_data;
5517 1.1 dyoung if (txr == NULL)
5518 1.1 dyoung return 0;
5519 1.1 dyoung val = IXGBE_READ_REG(&txr->adapter->hw, IXGBE_TDH(txr->me));
5520 1.1 dyoung node.sysctl_data = &val;
5521 1.1 dyoung return sysctl_lookup(SYSCTLFN_CALL(&node));
5522 1.1 dyoung }
5523 1.1 dyoung
5524 1.1 dyoung /** ixgbe_sysctl_tdt_handler - Handler function
5525 1.1 dyoung * Retrieves the TDT value from the hardware
5526 1.1 dyoung */
5527 1.1 dyoung static int
5528 1.1 dyoung ixgbe_sysctl_tdt_handler(SYSCTLFN_ARGS)
5529 1.1 dyoung {
5530 1.1 dyoung struct sysctlnode node;
5531 1.1 dyoung uint32_t val;
5532 1.1 dyoung struct tx_ring *txr;
5533 1.1 dyoung
5534 1.1 dyoung node = *rnode;
5535 1.1 dyoung txr = (struct tx_ring *)node.sysctl_data;
5536 1.1 dyoung if (txr == NULL)
5537 1.1 dyoung return 0;
5538 1.1 dyoung val = IXGBE_READ_REG(&txr->adapter->hw, IXGBE_TDT(txr->me));
5539 1.1 dyoung node.sysctl_data = &val;
5540 1.1 dyoung return sysctl_lookup(SYSCTLFN_CALL(&node));
5541 1.1 dyoung }
5542 1.1 dyoung
5543 1.1 dyoung /** ixgbe_sysctl_rdh_handler - Handler function
5544 1.1 dyoung * Retrieves the RDH value from the hardware
5545 1.1 dyoung */
5546 1.1 dyoung static int
5547 1.1 dyoung ixgbe_sysctl_rdh_handler(SYSCTLFN_ARGS)
5548 1.1 dyoung {
5549 1.1 dyoung struct sysctlnode node;
5550 1.1 dyoung uint32_t val;
5551 1.1 dyoung struct rx_ring *rxr;
5552 1.1 dyoung
5553 1.1 dyoung node = *rnode;
5554 1.1 dyoung rxr = (struct rx_ring *)node.sysctl_data;
5555 1.1 dyoung if (rxr == NULL)
5556 1.1 dyoung return 0;
5557 1.1 dyoung val = IXGBE_READ_REG(&rxr->adapter->hw, IXGBE_RDH(rxr->me));
5558 1.1 dyoung node.sysctl_data = &val;
5559 1.1 dyoung return sysctl_lookup(SYSCTLFN_CALL(&node));
5560 1.1 dyoung }
5561 1.1 dyoung
5562 1.1 dyoung /** ixgbe_sysctl_rdt_handler - Handler function
5563 1.1 dyoung * Retrieves the RDT value from the hardware
5564 1.1 dyoung */
5565 1.1 dyoung static int
5566 1.1 dyoung ixgbe_sysctl_rdt_handler(SYSCTLFN_ARGS)
5567 1.1 dyoung {
5568 1.1 dyoung struct sysctlnode node;
5569 1.1 dyoung uint32_t val;
5570 1.1 dyoung struct rx_ring *rxr;
5571 1.1 dyoung
5572 1.1 dyoung node = *rnode;
5573 1.1 dyoung rxr = (struct rx_ring *)node.sysctl_data;
5574 1.1 dyoung if (rxr == NULL)
5575 1.1 dyoung return 0;
5576 1.1 dyoung val = IXGBE_READ_REG(&rxr->adapter->hw, IXGBE_RDT(rxr->me));
5577 1.1 dyoung node.sysctl_data = &val;
5578 1.1 dyoung return sysctl_lookup(SYSCTLFN_CALL(&node));
5579 1.1 dyoung }
5580 1.1 dyoung
5581 1.1 dyoung static int
5582 1.1 dyoung ixgbe_sysctl_interrupt_rate_handler(SYSCTLFN_ARGS)
5583 1.1 dyoung {
5584 1.14.2.3 martin int error;
5585 1.1 dyoung struct sysctlnode node;
5586 1.1 dyoung struct ix_queue *que;
5587 1.1 dyoung uint32_t reg, usec, rate;
5588 1.1 dyoung
5589 1.1 dyoung node = *rnode;
5590 1.1 dyoung que = (struct ix_queue *)node.sysctl_data;
5591 1.1 dyoung if (que == NULL)
5592 1.1 dyoung return 0;
5593 1.1 dyoung reg = IXGBE_READ_REG(&que->adapter->hw, IXGBE_EITR(que->msix));
5594 1.1 dyoung usec = ((reg & 0x0FF8) >> 3);
5595 1.1 dyoung if (usec > 0)
5596 1.14.2.3 martin rate = 500000 / usec;
5597 1.1 dyoung else
5598 1.1 dyoung rate = 0;
5599 1.1 dyoung node.sysctl_data = &rate;
5600 1.14.2.3 martin error = sysctl_lookup(SYSCTLFN_CALL(&node));
5601 1.14.2.3 martin if (error)
5602 1.14.2.3 martin return error;
5603 1.14.2.3 martin reg &= ~0xfff; /* default, no limitation */
5604 1.14.2.3 martin ixgbe_max_interrupt_rate = 0;
5605 1.14.2.3 martin if (rate > 0 && rate < 500000) {
5606 1.14.2.3 martin if (rate < 1000)
5607 1.14.2.3 martin rate = 1000;
5608 1.14.2.3 martin ixgbe_max_interrupt_rate = rate;
5609 1.14.2.3 martin reg |= ((4000000/rate) & 0xff8 );
5610 1.14.2.3 martin }
5611 1.14.2.3 martin IXGBE_WRITE_REG(&que->adapter->hw, IXGBE_EITR(que->msix), reg);
5612 1.14.2.3 martin return 0;
5613 1.1 dyoung }
5614 1.1 dyoung
5615 1.1 dyoung const struct sysctlnode *
5616 1.1 dyoung ixgbe_sysctl_instance(struct adapter *adapter)
5617 1.1 dyoung {
5618 1.1 dyoung const char *dvname;
5619 1.1 dyoung struct sysctllog **log;
5620 1.1 dyoung int rc;
5621 1.1 dyoung const struct sysctlnode *rnode;
5622 1.1 dyoung
5623 1.1 dyoung log = &adapter->sysctllog;
5624 1.1 dyoung dvname = device_xname(adapter->dev);
5625 1.1 dyoung
5626 1.1 dyoung if ((rc = sysctl_createv(log, 0, NULL, &rnode,
5627 1.1 dyoung 0, CTLTYPE_NODE, dvname,
5628 1.1 dyoung SYSCTL_DESCR("ixgbe information and settings"),
5629 1.7 pooka NULL, 0, NULL, 0, CTL_HW, CTL_CREATE, CTL_EOL)) != 0)
5630 1.1 dyoung goto err;
5631 1.1 dyoung
5632 1.1 dyoung return rnode;
5633 1.1 dyoung err:
5634 1.1 dyoung printf("%s: sysctl_createv failed, rc = %d\n", __func__, rc);
5635 1.1 dyoung return NULL;
5636 1.1 dyoung }
5637 1.1 dyoung
5638 1.1 dyoung /*
5639 1.1 dyoung * Add sysctl variables, one per statistic, to the system.
5640 1.1 dyoung */
5641 1.1 dyoung static void
5642 1.1 dyoung ixgbe_add_hw_stats(struct adapter *adapter)
5643 1.1 dyoung {
5644 1.1 dyoung device_t dev = adapter->dev;
5645 1.1 dyoung const struct sysctlnode *rnode, *cnode;
5646 1.1 dyoung struct sysctllog **log = &adapter->sysctllog;
5647 1.1 dyoung struct tx_ring *txr = adapter->tx_rings;
5648 1.1 dyoung struct rx_ring *rxr = adapter->rx_rings;
5649 1.1 dyoung struct ixgbe_hw_stats *stats = &adapter->stats;
5650 1.1 dyoung
5651 1.1 dyoung /* Driver Statistics */
5652 1.1 dyoung #if 0
5653 1.1 dyoung /* These counters are not updated by the software */
5654 1.1 dyoung SYSCTL_ADD_ULONG(ctx, child, OID_AUTO, "dropped",
5655 1.1 dyoung CTLFLAG_RD, &adapter->dropped_pkts,
5656 1.1 dyoung "Driver dropped packets");
5657 1.1 dyoung SYSCTL_ADD_ULONG(ctx, child, OID_AUTO, "mbuf_header_failed",
5658 1.1 dyoung CTLFLAG_RD, &adapter->mbuf_header_failed,
5659 1.1 dyoung "???");
5660 1.1 dyoung SYSCTL_ADD_ULONG(ctx, child, OID_AUTO, "mbuf_packet_failed",
5661 1.1 dyoung CTLFLAG_RD, &adapter->mbuf_packet_failed,
5662 1.1 dyoung "???");
5663 1.1 dyoung SYSCTL_ADD_ULONG(ctx, child, OID_AUTO, "no_tx_map_avail",
5664 1.1 dyoung CTLFLAG_RD, &adapter->no_tx_map_avail,
5665 1.1 dyoung "???");
5666 1.1 dyoung #endif
5667 1.1 dyoung evcnt_attach_dynamic(&adapter->handleq, EVCNT_TYPE_MISC,
5668 1.1 dyoung NULL, device_xname(dev), "Handled queue in softint");
5669 1.1 dyoung evcnt_attach_dynamic(&adapter->req, EVCNT_TYPE_MISC,
5670 1.1 dyoung NULL, device_xname(dev), "Requeued in softint");
5671 1.1 dyoung evcnt_attach_dynamic(&adapter->morerx, EVCNT_TYPE_MISC,
5672 1.1 dyoung NULL, device_xname(dev), "Interrupt handler more rx");
5673 1.1 dyoung evcnt_attach_dynamic(&adapter->moretx, EVCNT_TYPE_MISC,
5674 1.1 dyoung NULL, device_xname(dev), "Interrupt handler more tx");
5675 1.1 dyoung evcnt_attach_dynamic(&adapter->txloops, EVCNT_TYPE_MISC,
5676 1.1 dyoung NULL, device_xname(dev), "Interrupt handler tx loops");
5677 1.1 dyoung evcnt_attach_dynamic(&adapter->efbig_tx_dma_setup, EVCNT_TYPE_MISC,
5678 1.1 dyoung NULL, device_xname(dev), "Driver tx dma soft fail EFBIG");
5679 1.1 dyoung evcnt_attach_dynamic(&adapter->m_defrag_failed, EVCNT_TYPE_MISC,
5680 1.1 dyoung NULL, device_xname(dev), "m_defrag() failed");
5681 1.1 dyoung evcnt_attach_dynamic(&adapter->efbig2_tx_dma_setup, EVCNT_TYPE_MISC,
5682 1.1 dyoung NULL, device_xname(dev), "Driver tx dma hard fail EFBIG");
5683 1.1 dyoung evcnt_attach_dynamic(&adapter->einval_tx_dma_setup, EVCNT_TYPE_MISC,
5684 1.1 dyoung NULL, device_xname(dev), "Driver tx dma hard fail EINVAL");
5685 1.1 dyoung evcnt_attach_dynamic(&adapter->other_tx_dma_setup, EVCNT_TYPE_MISC,
5686 1.1 dyoung NULL, device_xname(dev), "Driver tx dma hard fail other");
5687 1.1 dyoung evcnt_attach_dynamic(&adapter->eagain_tx_dma_setup, EVCNT_TYPE_MISC,
5688 1.1 dyoung NULL, device_xname(dev), "Driver tx dma soft fail EAGAIN");
5689 1.1 dyoung evcnt_attach_dynamic(&adapter->enomem_tx_dma_setup, EVCNT_TYPE_MISC,
5690 1.1 dyoung NULL, device_xname(dev), "Driver tx dma soft fail ENOMEM");
5691 1.1 dyoung evcnt_attach_dynamic(&adapter->watchdog_events, EVCNT_TYPE_MISC,
5692 1.1 dyoung NULL, device_xname(dev), "Watchdog timeouts");
5693 1.1 dyoung evcnt_attach_dynamic(&adapter->tso_err, EVCNT_TYPE_MISC,
5694 1.1 dyoung NULL, device_xname(dev), "TSO errors");
5695 1.1 dyoung evcnt_attach_dynamic(&adapter->link_irq, EVCNT_TYPE_MISC,
5696 1.1 dyoung NULL, device_xname(dev), "Link MSIX IRQ Handled");
5697 1.1 dyoung
5698 1.1 dyoung for (int i = 0; i < adapter->num_queues; i++, rxr++, txr++) {
5699 1.1 dyoung snprintf(adapter->queues[i].evnamebuf,
5700 1.1 dyoung sizeof(adapter->queues[i].evnamebuf), "%s queue%d",
5701 1.1 dyoung device_xname(dev), i);
5702 1.1 dyoung snprintf(adapter->queues[i].namebuf,
5703 1.1 dyoung sizeof(adapter->queues[i].namebuf), "queue%d", i);
5704 1.1 dyoung
5705 1.1 dyoung if ((rnode = ixgbe_sysctl_instance(adapter)) == NULL) {
5706 1.1 dyoung aprint_error_dev(dev, "could not create sysctl root\n");
5707 1.1 dyoung break;
5708 1.1 dyoung }
5709 1.1 dyoung
5710 1.1 dyoung if (sysctl_createv(log, 0, &rnode, &rnode,
5711 1.1 dyoung 0, CTLTYPE_NODE,
5712 1.1 dyoung adapter->queues[i].namebuf, SYSCTL_DESCR("Queue Name"),
5713 1.1 dyoung NULL, 0, NULL, 0, CTL_CREATE, CTL_EOL) != 0)
5714 1.1 dyoung break;
5715 1.1 dyoung
5716 1.1 dyoung if (sysctl_createv(log, 0, &rnode, &cnode,
5717 1.14.2.3 martin CTLFLAG_READWRITE, CTLTYPE_INT,
5718 1.1 dyoung "interrupt_rate", SYSCTL_DESCR("Interrupt Rate"),
5719 1.5 dsl ixgbe_sysctl_interrupt_rate_handler, 0,
5720 1.5 dsl (void *)&adapter->queues[i], 0, CTL_CREATE, CTL_EOL) != 0)
5721 1.1 dyoung break;
5722 1.1 dyoung
5723 1.1 dyoung if (sysctl_createv(log, 0, &rnode, &cnode,
5724 1.14.2.3 martin CTLFLAG_READONLY, CTLTYPE_QUAD,
5725 1.14.2.3 martin "irqs", SYSCTL_DESCR("irqs on this queue"),
5726 1.14.2.3 martin NULL, 0, &(adapter->queues[i].irqs),
5727 1.14.2.3 martin 0, CTL_CREATE, CTL_EOL) != 0)
5728 1.14.2.3 martin break;
5729 1.14.2.3 martin
5730 1.14.2.3 martin if (sysctl_createv(log, 0, &rnode, &cnode,
5731 1.1 dyoung CTLFLAG_READONLY, CTLTYPE_INT,
5732 1.1 dyoung "txd_head", SYSCTL_DESCR("Transmit Descriptor Head"),
5733 1.4 dsl ixgbe_sysctl_tdh_handler, 0, (void *)txr,
5734 1.1 dyoung 0, CTL_CREATE, CTL_EOL) != 0)
5735 1.1 dyoung break;
5736 1.1 dyoung
5737 1.1 dyoung if (sysctl_createv(log, 0, &rnode, &cnode,
5738 1.1 dyoung CTLFLAG_READONLY, CTLTYPE_INT,
5739 1.1 dyoung "txd_tail", SYSCTL_DESCR("Transmit Descriptor Tail"),
5740 1.4 dsl ixgbe_sysctl_tdt_handler, 0, (void *)txr,
5741 1.1 dyoung 0, CTL_CREATE, CTL_EOL) != 0)
5742 1.1 dyoung break;
5743 1.1 dyoung
5744 1.14.2.5 riz evcnt_attach_dynamic(&txr->tso_tx, EVCNT_TYPE_MISC,
5745 1.14.2.5 riz NULL, device_xname(dev), "TSO");
5746 1.1 dyoung evcnt_attach_dynamic(&txr->no_desc_avail, EVCNT_TYPE_MISC,
5747 1.1 dyoung NULL, adapter->queues[i].evnamebuf,
5748 1.1 dyoung "Queue No Descriptor Available");
5749 1.1 dyoung evcnt_attach_dynamic(&txr->total_packets, EVCNT_TYPE_MISC,
5750 1.1 dyoung NULL, adapter->queues[i].evnamebuf,
5751 1.1 dyoung "Queue Packets Transmitted");
5752 1.1 dyoung
5753 1.1 dyoung #ifdef LRO
5754 1.1 dyoung struct lro_ctrl *lro = &rxr->lro;
5755 1.1 dyoung #endif /* LRO */
5756 1.1 dyoung
5757 1.1 dyoung if (sysctl_createv(log, 0, &rnode, &cnode,
5758 1.1 dyoung CTLFLAG_READONLY,
5759 1.1 dyoung CTLTYPE_INT,
5760 1.1 dyoung "rxd_head", SYSCTL_DESCR("Receive Descriptor Head"),
5761 1.4 dsl ixgbe_sysctl_rdh_handler, 0, (void *)rxr, 0,
5762 1.1 dyoung CTL_CREATE, CTL_EOL) != 0)
5763 1.1 dyoung break;
5764 1.1 dyoung
5765 1.1 dyoung if (sysctl_createv(log, 0, &rnode, &cnode,
5766 1.1 dyoung CTLFLAG_READONLY,
5767 1.1 dyoung CTLTYPE_INT,
5768 1.1 dyoung "rxd_tail", SYSCTL_DESCR("Receive Descriptor Tail"),
5769 1.4 dsl ixgbe_sysctl_rdt_handler, 0, (void *)rxr, 0,
5770 1.1 dyoung CTL_CREATE, CTL_EOL) != 0)
5771 1.1 dyoung break;
5772 1.1 dyoung
5773 1.1 dyoung if (i < __arraycount(adapter->stats.mpc)) {
5774 1.1 dyoung evcnt_attach_dynamic(&adapter->stats.mpc[i],
5775 1.1 dyoung EVCNT_TYPE_MISC, NULL, adapter->queues[i].evnamebuf,
5776 1.1 dyoung "Missed Packet Count");
5777 1.1 dyoung }
5778 1.1 dyoung if (i < __arraycount(adapter->stats.pxontxc)) {
5779 1.1 dyoung evcnt_attach_dynamic(&adapter->stats.pxontxc[i],
5780 1.1 dyoung EVCNT_TYPE_MISC, NULL, adapter->queues[i].evnamebuf,
5781 1.1 dyoung "pxontxc");
5782 1.1 dyoung evcnt_attach_dynamic(&adapter->stats.pxonrxc[i],
5783 1.1 dyoung EVCNT_TYPE_MISC, NULL, adapter->queues[i].evnamebuf,
5784 1.1 dyoung "pxonrxc");
5785 1.1 dyoung evcnt_attach_dynamic(&adapter->stats.pxofftxc[i],
5786 1.1 dyoung EVCNT_TYPE_MISC, NULL, adapter->queues[i].evnamebuf,
5787 1.1 dyoung "pxofftxc");
5788 1.1 dyoung evcnt_attach_dynamic(&adapter->stats.pxoffrxc[i],
5789 1.1 dyoung EVCNT_TYPE_MISC, NULL, adapter->queues[i].evnamebuf,
5790 1.1 dyoung "pxoffrxc");
5791 1.1 dyoung evcnt_attach_dynamic(&adapter->stats.pxon2offc[i],
5792 1.1 dyoung EVCNT_TYPE_MISC, NULL, adapter->queues[i].evnamebuf,
5793 1.1 dyoung "pxon2offc");
5794 1.1 dyoung }
5795 1.1 dyoung if (i < __arraycount(adapter->stats.qprc)) {
5796 1.1 dyoung evcnt_attach_dynamic(&adapter->stats.qprc[i],
5797 1.1 dyoung EVCNT_TYPE_MISC, NULL, adapter->queues[i].evnamebuf,
5798 1.1 dyoung "qprc");
5799 1.1 dyoung evcnt_attach_dynamic(&adapter->stats.qptc[i],
5800 1.1 dyoung EVCNT_TYPE_MISC, NULL, adapter->queues[i].evnamebuf,
5801 1.1 dyoung "qptc");
5802 1.1 dyoung evcnt_attach_dynamic(&adapter->stats.qbrc[i],
5803 1.1 dyoung EVCNT_TYPE_MISC, NULL, adapter->queues[i].evnamebuf,
5804 1.1 dyoung "qbrc");
5805 1.1 dyoung evcnt_attach_dynamic(&adapter->stats.qbtc[i],
5806 1.1 dyoung EVCNT_TYPE_MISC, NULL, adapter->queues[i].evnamebuf,
5807 1.1 dyoung "qbtc");
5808 1.1 dyoung evcnt_attach_dynamic(&adapter->stats.qprdc[i],
5809 1.1 dyoung EVCNT_TYPE_MISC, NULL, adapter->queues[i].evnamebuf,
5810 1.1 dyoung "qprdc");
5811 1.1 dyoung }
5812 1.1 dyoung
5813 1.1 dyoung evcnt_attach_dynamic(&rxr->rx_packets, EVCNT_TYPE_MISC,
5814 1.1 dyoung NULL, adapter->queues[i].evnamebuf, "Queue Packets Received");
5815 1.1 dyoung evcnt_attach_dynamic(&rxr->rx_bytes, EVCNT_TYPE_MISC,
5816 1.1 dyoung NULL, adapter->queues[i].evnamebuf, "Queue Bytes Received");
5817 1.14.2.4 riz evcnt_attach_dynamic(&rxr->rx_copies, EVCNT_TYPE_MISC,
5818 1.14.2.4 riz NULL, adapter->queues[i].evnamebuf, "Copied RX Frames");
5819 1.1 dyoung evcnt_attach_dynamic(&rxr->no_jmbuf, EVCNT_TYPE_MISC,
5820 1.1 dyoung NULL, adapter->queues[i].evnamebuf, "Rx no jumbo mbuf");
5821 1.1 dyoung evcnt_attach_dynamic(&rxr->rx_discarded, EVCNT_TYPE_MISC,
5822 1.1 dyoung NULL, adapter->queues[i].evnamebuf, "Rx discarded");
5823 1.1 dyoung evcnt_attach_dynamic(&rxr->rx_irq, EVCNT_TYPE_MISC,
5824 1.1 dyoung NULL, adapter->queues[i].evnamebuf, "Rx interrupts");
5825 1.1 dyoung #ifdef LRO
5826 1.1 dyoung SYSCTL_ADD_INT(ctx, queue_list, OID_AUTO, "lro_queued",
5827 1.1 dyoung CTLFLAG_RD, &lro->lro_queued, 0,
5828 1.1 dyoung "LRO Queued");
5829 1.1 dyoung SYSCTL_ADD_INT(ctx, queue_list, OID_AUTO, "lro_flushed",
5830 1.1 dyoung CTLFLAG_RD, &lro->lro_flushed, 0,
5831 1.1 dyoung "LRO Flushed");
5832 1.1 dyoung #endif /* LRO */
5833 1.1 dyoung }
5834 1.1 dyoung
5835 1.1 dyoung /* MAC stats get the own sub node */
5836 1.1 dyoung
5837 1.1 dyoung
5838 1.1 dyoung snprintf(stats->namebuf,
5839 1.1 dyoung sizeof(stats->namebuf), "%s MAC Statistics", device_xname(dev));
5840 1.1 dyoung
5841 1.1 dyoung evcnt_attach_dynamic(&stats->ipcs, EVCNT_TYPE_MISC, NULL,
5842 1.1 dyoung stats->namebuf, "rx csum offload - IP");
5843 1.1 dyoung evcnt_attach_dynamic(&stats->l4cs, EVCNT_TYPE_MISC, NULL,
5844 1.1 dyoung stats->namebuf, "rx csum offload - L4");
5845 1.1 dyoung evcnt_attach_dynamic(&stats->ipcs_bad, EVCNT_TYPE_MISC, NULL,
5846 1.1 dyoung stats->namebuf, "rx csum offload - IP bad");
5847 1.1 dyoung evcnt_attach_dynamic(&stats->l4cs_bad, EVCNT_TYPE_MISC, NULL,
5848 1.1 dyoung stats->namebuf, "rx csum offload - L4 bad");
5849 1.1 dyoung evcnt_attach_dynamic(&stats->intzero, EVCNT_TYPE_MISC, NULL,
5850 1.1 dyoung stats->namebuf, "Interrupt conditions zero");
5851 1.1 dyoung evcnt_attach_dynamic(&stats->legint, EVCNT_TYPE_MISC, NULL,
5852 1.1 dyoung stats->namebuf, "Legacy interrupts");
5853 1.1 dyoung evcnt_attach_dynamic(&stats->crcerrs, EVCNT_TYPE_MISC, NULL,
5854 1.1 dyoung stats->namebuf, "CRC Errors");
5855 1.1 dyoung evcnt_attach_dynamic(&stats->illerrc, EVCNT_TYPE_MISC, NULL,
5856 1.1 dyoung stats->namebuf, "Illegal Byte Errors");
5857 1.1 dyoung evcnt_attach_dynamic(&stats->errbc, EVCNT_TYPE_MISC, NULL,
5858 1.1 dyoung stats->namebuf, "Byte Errors");
5859 1.1 dyoung evcnt_attach_dynamic(&stats->mspdc, EVCNT_TYPE_MISC, NULL,
5860 1.1 dyoung stats->namebuf, "MAC Short Packets Discarded");
5861 1.1 dyoung evcnt_attach_dynamic(&stats->mlfc, EVCNT_TYPE_MISC, NULL,
5862 1.1 dyoung stats->namebuf, "MAC Local Faults");
5863 1.1 dyoung evcnt_attach_dynamic(&stats->mrfc, EVCNT_TYPE_MISC, NULL,
5864 1.1 dyoung stats->namebuf, "MAC Remote Faults");
5865 1.1 dyoung evcnt_attach_dynamic(&stats->rlec, EVCNT_TYPE_MISC, NULL,
5866 1.1 dyoung stats->namebuf, "Receive Length Errors");
5867 1.1 dyoung evcnt_attach_dynamic(&stats->lxontxc, EVCNT_TYPE_MISC, NULL,
5868 1.1 dyoung stats->namebuf, "Link XON Transmitted");
5869 1.1 dyoung evcnt_attach_dynamic(&stats->lxonrxc, EVCNT_TYPE_MISC, NULL,
5870 1.1 dyoung stats->namebuf, "Link XON Received");
5871 1.1 dyoung evcnt_attach_dynamic(&stats->lxofftxc, EVCNT_TYPE_MISC, NULL,
5872 1.1 dyoung stats->namebuf, "Link XOFF Transmitted");
5873 1.1 dyoung evcnt_attach_dynamic(&stats->lxoffrxc, EVCNT_TYPE_MISC, NULL,
5874 1.1 dyoung stats->namebuf, "Link XOFF Received");
5875 1.1 dyoung
5876 1.1 dyoung /* Packet Reception Stats */
5877 1.1 dyoung evcnt_attach_dynamic(&stats->tor, EVCNT_TYPE_MISC, NULL,
5878 1.1 dyoung stats->namebuf, "Total Octets Received");
5879 1.1 dyoung evcnt_attach_dynamic(&stats->gorc, EVCNT_TYPE_MISC, NULL,
5880 1.1 dyoung stats->namebuf, "Good Octets Received");
5881 1.1 dyoung evcnt_attach_dynamic(&stats->tpr, EVCNT_TYPE_MISC, NULL,
5882 1.1 dyoung stats->namebuf, "Total Packets Received");
5883 1.1 dyoung evcnt_attach_dynamic(&stats->gprc, EVCNT_TYPE_MISC, NULL,
5884 1.1 dyoung stats->namebuf, "Good Packets Received");
5885 1.1 dyoung evcnt_attach_dynamic(&stats->mprc, EVCNT_TYPE_MISC, NULL,
5886 1.1 dyoung stats->namebuf, "Multicast Packets Received");
5887 1.1 dyoung evcnt_attach_dynamic(&stats->bprc, EVCNT_TYPE_MISC, NULL,
5888 1.1 dyoung stats->namebuf, "Broadcast Packets Received");
5889 1.1 dyoung evcnt_attach_dynamic(&stats->prc64, EVCNT_TYPE_MISC, NULL,
5890 1.1 dyoung stats->namebuf, "64 byte frames received ");
5891 1.1 dyoung evcnt_attach_dynamic(&stats->prc127, EVCNT_TYPE_MISC, NULL,
5892 1.1 dyoung stats->namebuf, "65-127 byte frames received");
5893 1.1 dyoung evcnt_attach_dynamic(&stats->prc255, EVCNT_TYPE_MISC, NULL,
5894 1.1 dyoung stats->namebuf, "128-255 byte frames received");
5895 1.1 dyoung evcnt_attach_dynamic(&stats->prc511, EVCNT_TYPE_MISC, NULL,
5896 1.1 dyoung stats->namebuf, "256-511 byte frames received");
5897 1.1 dyoung evcnt_attach_dynamic(&stats->prc1023, EVCNT_TYPE_MISC, NULL,
5898 1.1 dyoung stats->namebuf, "512-1023 byte frames received");
5899 1.1 dyoung evcnt_attach_dynamic(&stats->prc1522, EVCNT_TYPE_MISC, NULL,
5900 1.1 dyoung stats->namebuf, "1023-1522 byte frames received");
5901 1.1 dyoung evcnt_attach_dynamic(&stats->ruc, EVCNT_TYPE_MISC, NULL,
5902 1.1 dyoung stats->namebuf, "Receive Undersized");
5903 1.1 dyoung evcnt_attach_dynamic(&stats->rfc, EVCNT_TYPE_MISC, NULL,
5904 1.1 dyoung stats->namebuf, "Fragmented Packets Received ");
5905 1.1 dyoung evcnt_attach_dynamic(&stats->roc, EVCNT_TYPE_MISC, NULL,
5906 1.1 dyoung stats->namebuf, "Oversized Packets Received");
5907 1.1 dyoung evcnt_attach_dynamic(&stats->rjc, EVCNT_TYPE_MISC, NULL,
5908 1.1 dyoung stats->namebuf, "Received Jabber");
5909 1.1 dyoung evcnt_attach_dynamic(&stats->mngprc, EVCNT_TYPE_MISC, NULL,
5910 1.1 dyoung stats->namebuf, "Management Packets Received");
5911 1.1 dyoung evcnt_attach_dynamic(&stats->xec, EVCNT_TYPE_MISC, NULL,
5912 1.1 dyoung stats->namebuf, "Checksum Errors");
5913 1.1 dyoung
5914 1.1 dyoung /* Packet Transmission Stats */
5915 1.1 dyoung evcnt_attach_dynamic(&stats->gotc, EVCNT_TYPE_MISC, NULL,
5916 1.1 dyoung stats->namebuf, "Good Octets Transmitted");
5917 1.1 dyoung evcnt_attach_dynamic(&stats->tpt, EVCNT_TYPE_MISC, NULL,
5918 1.1 dyoung stats->namebuf, "Total Packets Transmitted");
5919 1.1 dyoung evcnt_attach_dynamic(&stats->gptc, EVCNT_TYPE_MISC, NULL,
5920 1.1 dyoung stats->namebuf, "Good Packets Transmitted");
5921 1.1 dyoung evcnt_attach_dynamic(&stats->bptc, EVCNT_TYPE_MISC, NULL,
5922 1.1 dyoung stats->namebuf, "Broadcast Packets Transmitted");
5923 1.1 dyoung evcnt_attach_dynamic(&stats->mptc, EVCNT_TYPE_MISC, NULL,
5924 1.1 dyoung stats->namebuf, "Multicast Packets Transmitted");
5925 1.1 dyoung evcnt_attach_dynamic(&stats->mngptc, EVCNT_TYPE_MISC, NULL,
5926 1.1 dyoung stats->namebuf, "Management Packets Transmitted");
5927 1.1 dyoung evcnt_attach_dynamic(&stats->ptc64, EVCNT_TYPE_MISC, NULL,
5928 1.1 dyoung stats->namebuf, "64 byte frames transmitted ");
5929 1.1 dyoung evcnt_attach_dynamic(&stats->ptc127, EVCNT_TYPE_MISC, NULL,
5930 1.1 dyoung stats->namebuf, "65-127 byte frames transmitted");
5931 1.1 dyoung evcnt_attach_dynamic(&stats->ptc255, EVCNT_TYPE_MISC, NULL,
5932 1.1 dyoung stats->namebuf, "128-255 byte frames transmitted");
5933 1.1 dyoung evcnt_attach_dynamic(&stats->ptc511, EVCNT_TYPE_MISC, NULL,
5934 1.1 dyoung stats->namebuf, "256-511 byte frames transmitted");
5935 1.1 dyoung evcnt_attach_dynamic(&stats->ptc1023, EVCNT_TYPE_MISC, NULL,
5936 1.1 dyoung stats->namebuf, "512-1023 byte frames transmitted");
5937 1.1 dyoung evcnt_attach_dynamic(&stats->ptc1522, EVCNT_TYPE_MISC, NULL,
5938 1.1 dyoung stats->namebuf, "1024-1522 byte frames transmitted");
5939 1.1 dyoung }
5940 1.1 dyoung
5941 1.1 dyoung /*
5942 1.1 dyoung ** Set flow control using sysctl:
5943 1.1 dyoung ** Flow control values:
5944 1.1 dyoung ** 0 - off
5945 1.1 dyoung ** 1 - rx pause
5946 1.1 dyoung ** 2 - tx pause
5947 1.1 dyoung ** 3 - full
5948 1.1 dyoung */
5949 1.1 dyoung static int
5950 1.1 dyoung ixgbe_set_flowcntl(SYSCTLFN_ARGS)
5951 1.1 dyoung {
5952 1.1 dyoung struct sysctlnode node;
5953 1.14.2.4 riz int error, last;
5954 1.1 dyoung struct adapter *adapter;
5955 1.1 dyoung
5956 1.1 dyoung node = *rnode;
5957 1.1 dyoung adapter = (struct adapter *)node.sysctl_data;
5958 1.14.2.4 riz node.sysctl_data = &adapter->fc;
5959 1.14.2.4 riz last = adapter->fc;
5960 1.1 dyoung error = sysctl_lookup(SYSCTLFN_CALL(&node));
5961 1.1 dyoung if (error != 0 || newp == NULL)
5962 1.1 dyoung return error;
5963 1.1 dyoung
5964 1.1 dyoung /* Don't bother if it's not changed */
5965 1.14.2.4 riz if (adapter->fc == last)
5966 1.1 dyoung return (0);
5967 1.1 dyoung
5968 1.14.2.4 riz switch (adapter->fc) {
5969 1.1 dyoung case ixgbe_fc_rx_pause:
5970 1.1 dyoung case ixgbe_fc_tx_pause:
5971 1.1 dyoung case ixgbe_fc_full:
5972 1.14.2.4 riz adapter->hw.fc.requested_mode = adapter->fc;
5973 1.14.2.4 riz if (adapter->num_queues > 1)
5974 1.14.2.4 riz ixgbe_disable_rx_drop(adapter);
5975 1.1 dyoung break;
5976 1.1 dyoung case ixgbe_fc_none:
5977 1.1 dyoung adapter->hw.fc.requested_mode = ixgbe_fc_none;
5978 1.14.2.4 riz if (adapter->num_queues > 1)
5979 1.14.2.4 riz ixgbe_enable_rx_drop(adapter);
5980 1.14.2.5 riz break;
5981 1.14.2.5 riz default:
5982 1.14.2.5 riz adapter->fc = last;
5983 1.14.2.5 riz return (EINVAL);
5984 1.1 dyoung }
5985 1.14.2.4 riz /* Don't autoneg if forcing a value */
5986 1.14.2.4 riz adapter->hw.fc.disable_fc_autoneg = TRUE;
5987 1.14.2.4 riz ixgbe_fc_enable(&adapter->hw);
5988 1.1 dyoung return 0;
5989 1.1 dyoung }
5990 1.1 dyoung
5991 1.1 dyoung /*
5992 1.1 dyoung ** Control link advertise speed:
5993 1.1 dyoung ** 1 - advertise only 1G
5994 1.14.2.4 riz ** 2 - advertise 100Mb
5995 1.14.2.4 riz ** 3 - advertise normal
5996 1.1 dyoung */
5997 1.1 dyoung static int
5998 1.1 dyoung ixgbe_set_advertise(SYSCTLFN_ARGS)
5999 1.1 dyoung {
6000 1.1 dyoung struct sysctlnode node;
6001 1.14.2.3 martin int t, error = 0;
6002 1.1 dyoung struct adapter *adapter;
6003 1.14.2.4 riz device_t dev;
6004 1.1 dyoung struct ixgbe_hw *hw;
6005 1.1 dyoung ixgbe_link_speed speed, last;
6006 1.1 dyoung
6007 1.1 dyoung node = *rnode;
6008 1.1 dyoung adapter = (struct adapter *)node.sysctl_data;
6009 1.14.2.4 riz dev = adapter->dev;
6010 1.14.2.4 riz hw = &adapter->hw;
6011 1.14.2.4 riz last = adapter->advertise;
6012 1.1 dyoung t = adapter->advertise;
6013 1.1 dyoung node.sysctl_data = &t;
6014 1.1 dyoung error = sysctl_lookup(SYSCTLFN_CALL(&node));
6015 1.1 dyoung if (error != 0 || newp == NULL)
6016 1.1 dyoung return error;
6017 1.1 dyoung
6018 1.14.2.4 riz if (adapter->advertise == last) /* no change */
6019 1.14.2.4 riz return (0);
6020 1.14.2.4 riz
6021 1.1 dyoung if (t == -1)
6022 1.1 dyoung return 0;
6023 1.1 dyoung
6024 1.1 dyoung adapter->advertise = t;
6025 1.1 dyoung
6026 1.1 dyoung if (!((hw->phy.media_type == ixgbe_media_type_copper) ||
6027 1.1 dyoung (hw->phy.multispeed_fiber)))
6028 1.14.2.5 riz return (EINVAL);
6029 1.1 dyoung
6030 1.14.2.4 riz if ((adapter->advertise == 2) && (hw->mac.type != ixgbe_mac_X540)) {
6031 1.14.2.4 riz device_printf(dev, "Set Advertise: 100Mb on X540 only\n");
6032 1.14.2.5 riz return (EINVAL);
6033 1.14.2.4 riz }
6034 1.14.2.4 riz
6035 1.1 dyoung if (adapter->advertise == 1)
6036 1.1 dyoung speed = IXGBE_LINK_SPEED_1GB_FULL;
6037 1.14.2.4 riz else if (adapter->advertise == 2)
6038 1.14.2.4 riz speed = IXGBE_LINK_SPEED_100_FULL;
6039 1.14.2.4 riz else if (adapter->advertise == 3)
6040 1.1 dyoung speed = IXGBE_LINK_SPEED_1GB_FULL |
6041 1.1 dyoung IXGBE_LINK_SPEED_10GB_FULL;
6042 1.14.2.5 riz else {/* bogus value */
6043 1.14.2.5 riz adapter->advertise = last;
6044 1.14.2.5 riz return (EINVAL);
6045 1.14.2.5 riz }
6046 1.1 dyoung
6047 1.1 dyoung hw->mac.autotry_restart = TRUE;
6048 1.14.2.5 riz hw->mac.ops.setup_link(hw, speed, TRUE);
6049 1.1 dyoung
6050 1.1 dyoung return 0;
6051 1.1 dyoung }
6052 1.14.2.4 riz
6053 1.14.2.4 riz /*
6054 1.14.2.4 riz ** Thermal Shutdown Trigger
6055 1.14.2.4 riz ** - cause a Thermal Overtemp IRQ
6056 1.14.2.4 riz */
6057 1.14.2.4 riz static int
6058 1.14.2.4 riz ixgbe_set_thermal_test(SYSCTLFN_ARGS)
6059 1.14.2.4 riz {
6060 1.14.2.4 riz struct sysctlnode node;
6061 1.14.2.4 riz int error, fire = 0;
6062 1.14.2.4 riz struct adapter *adapter;
6063 1.14.2.4 riz struct ixgbe_hw *hw;
6064 1.14.2.4 riz
6065 1.14.2.4 riz node = *rnode;
6066 1.14.2.4 riz adapter = (struct adapter *)node.sysctl_data;
6067 1.14.2.4 riz hw = &adapter->hw;
6068 1.14.2.4 riz
6069 1.14.2.4 riz if (hw->mac.type != ixgbe_mac_X540)
6070 1.14.2.4 riz return (0);
6071 1.14.2.4 riz
6072 1.14.2.4 riz node.sysctl_data = &fire;
6073 1.14.2.4 riz error = sysctl_lookup(SYSCTLFN_CALL(&node));
6074 1.14.2.4 riz if ((error) || (newp == NULL))
6075 1.14.2.4 riz return (error);
6076 1.14.2.4 riz
6077 1.14.2.4 riz if (fire) {
6078 1.14.2.4 riz u32 reg = IXGBE_READ_REG(hw, IXGBE_EICS);
6079 1.14.2.4 riz reg |= IXGBE_EICR_TS;
6080 1.14.2.4 riz IXGBE_WRITE_REG(hw, IXGBE_EICS, reg);
6081 1.14.2.4 riz }
6082 1.14.2.4 riz
6083 1.14.2.4 riz return (0);
6084 1.14.2.4 riz }
6085 1.14.2.4 riz
6086 1.14.2.4 riz /*
6087 1.14.2.4 riz ** Enable the hardware to drop packets when the buffer is
6088 1.14.2.4 riz ** full. This is useful when multiqueue,so that no single
6089 1.14.2.4 riz ** queue being full stalls the entire RX engine. We only
6090 1.14.2.4 riz ** enable this when Multiqueue AND when Flow Control is
6091 1.14.2.4 riz ** disabled.
6092 1.14.2.4 riz */
6093 1.14.2.4 riz static void
6094 1.14.2.4 riz ixgbe_enable_rx_drop(struct adapter *adapter)
6095 1.14.2.4 riz {
6096 1.14.2.4 riz struct ixgbe_hw *hw = &adapter->hw;
6097 1.14.2.4 riz
6098 1.14.2.4 riz for (int i = 0; i < adapter->num_queues; i++) {
6099 1.14.2.4 riz u32 srrctl = IXGBE_READ_REG(hw, IXGBE_SRRCTL(i));
6100 1.14.2.4 riz srrctl |= IXGBE_SRRCTL_DROP_EN;
6101 1.14.2.4 riz IXGBE_WRITE_REG(hw, IXGBE_SRRCTL(i), srrctl);
6102 1.14.2.4 riz }
6103 1.14.2.4 riz }
6104 1.14.2.4 riz
6105 1.14.2.4 riz static void
6106 1.14.2.4 riz ixgbe_disable_rx_drop(struct adapter *adapter)
6107 1.14.2.4 riz {
6108 1.14.2.4 riz struct ixgbe_hw *hw = &adapter->hw;
6109 1.14.2.4 riz
6110 1.14.2.4 riz for (int i = 0; i < adapter->num_queues; i++) {
6111 1.14.2.4 riz u32 srrctl = IXGBE_READ_REG(hw, IXGBE_SRRCTL(i));
6112 1.14.2.4 riz srrctl &= ~IXGBE_SRRCTL_DROP_EN;
6113 1.14.2.4 riz IXGBE_WRITE_REG(hw, IXGBE_SRRCTL(i), srrctl);
6114 1.14.2.4 riz }
6115 1.14.2.4 riz }
6116